# HG changeset patch
# User ufz
# Date 1749058600 0
# Node ID 315c2ed31af1d35b3a6af913eac8d1bff4b3b1ca
planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/phi-toolkit commit 45c746567f48e6c9bcc19ba4e94e87348df3ac7a
diff -r 000000000000 -r 315c2ed31af1 phitk.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/phitk.xml Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,247 @@
+
+
+
+ 0.1.0
+ 0
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ bioconductor-biostrings
+ bioconductor-genomicranges
+ bioconductor-gmoviz
+ r-formattable
+ r-here
+ r-janitor
+ r-kableextra
+ r-patchwork
+ r-tidyverse
+ r-base64
+ r-pdftools
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff -r 000000000000 -r 315c2ed31af1 report.Rmd
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/report.Rmd Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1081 @@
+---
+title: "PHI Prophage-Host Interaction Toolkit report"
+subtitle: "Toolkit for the Detection, Comparison, and Annotation of Prophages in Bacterial Genomes."
+date: "`r format(Sys.Date(), '%B %d, %Y')`"
+output:
+ html_document:
+ theme: flatly
+ toc: yes
+ toc_float: false
+ number_sections: yes
+ code_folding: none
+ fig_width: 12
+ fig_height: 8
+ fig_caption: true
+ df_print: paged
+editor_options:
+ markdown:
+ wrap: 72
+params:
+ outdir: "data"
+---
+
+
+------------------------------------------------------------------------
+
+```{r setup_env, include=FALSE}
+knitr::opts_chunk$set(echo = FALSE)
+
+cat("params$outdir:", params$outdir, "\n")
+```
+
+```{r setup_libraries, message=FALSE, warning=FALSE, echo=FALSE, results='asis'}
+# Define required packages
+required_packages <- c("tidyverse", "janitor", "here",
+ "kableExtra", "gmoviz", "circlize",
+ "GenomicRanges", "patchwork", "fs",
+ "tools", "scales", "formattable",
+ "pdftools", "base64")
+
+# Load required packages
+invisible(lapply(required_packages, library, character.only = TRUE))
+```
+
+```{r helper_functions, echo=FALSE}
+# File that receives the debug trace written by log_debug().
+log_file <- "debug.log"
+
+# Write one timestamped DEBUG line to `log_file`.
+# The first call (no TRUE `log_initialized` flag visible yet) truncates the
+# file and sets the flag in the global environment; later calls append.
+log_debug <- function(message) {
+  already_started <- exists("log_initialized") && log_initialized
+  cat(paste0(Sys.time(), " - DEBUG: ", message, "\n"),
+      file = log_file, append = already_started)
+  if (!already_started) {
+    assign("log_initialized", TRUE, envir = .GlobalEnv)
+  }
+}
+
+# Load one result file, choosing the reader from the file extension.
+#   tsv / csv -> tibble with janitor-cleaned column names
+#   fna       -> Biostrings DNAStringSet
+# Returns NULL (and logs why) when the file is missing or has any other
+# extension.
+load_file <- function(path) {
+  log_debug(paste("Attempting to load:", path))
+
+  if (!file.exists(path)) {
+    log_debug(paste("File does not exist:", path))
+    return(NULL)
+  }
+
+  ext <- tools::file_ext(path)
+
+  if (ext == "fna") {
+    sequences <- Biostrings::readDNAStringSet(path)
+    log_debug(paste("Loaded", length(sequences), "sequences from", path))
+    return(sequences)
+  }
+
+  if (!(ext %in% c("tsv", "csv"))) {
+    log_debug(paste("Skipping", path, "- unsupported file type"))
+    return(NULL)
+  }
+
+  separator <- if (ext == "csv") "," else "\t"
+  tbl <- read_delim(path, delim = separator, show_col_types = FALSE) %>% clean_names
+  log_debug(paste("Loaded", nrow(tbl), "rows from", path))
+  tbl
+}
+
+# Describe one expected result file as a one-row tibble with the columns
+# exists / rows / size / path.
+#   path        : location of the file on disk.
+#   loaded_data : list of already-loaded objects; the entry for this file is
+#                 looked up under basename(path), so the list must be keyed
+#                 by file basename for `rows` to reflect the loaded content.
+# `rows` is the sequence count for .fna files and the row count for tsv/csv.
+get_file_info <- function(path, loaded_data) {
+  log_debug(paste("Processing file info for:", path))
+
+  if (!file.exists(path)) {
+    return(tibble(exists = FALSE, rows = NA_integer_, size = NA_real_, path = NA_character_))
+  }
+
+  ext <- tools::file_ext(path)
+  if (!(ext %in% c("tsv", "csv", "fna"))) {
+    return(tibble(exists = TRUE, rows = NA_integer_, size = file.size(path), path = path))
+  }
+
+  entry <- loaded_data[[basename(path)]]
+  n_records <- if (ext == "fna") length(entry) else nrow(entry)
+  tibble(exists = TRUE, rows = n_records, size = file.size(path), path = path)
+}
+
+# Collect every per-genome result file for one geNomad output folder.
+#   folder             : path of the genome's geNomad folder; only its
+#                        basename (the genome name) is used.
+#   host_analyses_dir  : root of the host-level tool outputs.
+#   virus_analyses_dir : root of the virus-level tool outputs.
+# Returns a list with
+#   file_info   : one row per expected file (file_type, exists, rows, size, path)
+#   virus_count : number of geNomad entries with virus_score > 0.5 (0 if the
+#                 summary is missing)
+#   loaded_data : the loaded objects, keyed by tool name (NULL when absent)
+process_genome_folder <- function(folder, host_analyses_dir, virus_analyses_dir) {
+  log_debug(paste("Processing folder:", folder))
+  genome_name <- basename(folder)
+
+  genomad_summary_dir <- file.path(host_analyses_dir, "genomad", genome_name,
+                                   paste0(genome_name, "_summary"))
+
+  # The order matters: callers read the first entry as the geNomad summary.
+  paths <- list(
+    genomad = file.path(genomad_summary_dir, paste0(genome_name, "_virus_summary.tsv")),
+    genomad_phages = file.path(genomad_summary_dir, paste0(genome_name, "_virus.fna")),
+    genomad_annotations = file.path(genomad_summary_dir, paste0(genome_name, "_virus_genes.tsv")),
+    defense_finder = file.path(host_analyses_dir, "defense-finder", genome_name,
+                               paste0(genome_name, "_defense_finder_systems.tsv")),
+    checkv = file.path(virus_analyses_dir, "checkv", genome_name, "quality_summary.tsv"),
+    iphop = file.path(virus_analyses_dir, "iphop", genome_name, "Host_prediction_to_genome_m90.csv"),
+    drep = file.path(virus_analyses_dir, "drep_compare", genome_name, "data_tables", "Cdb.csv"),
+    phatyp = file.path(virus_analyses_dir, "phatyp", genome_name, "phatyp.csv"),
+    abricate = file.path(virus_analyses_dir, "abricate", genome_name,
+                         paste0(genome_name, "_virus_vfdb.tsv")),
+    vibrant = file.path(virus_analyses_dir, "vibrant", genome_name,
+                        paste0("VIBRANT_", genome_name, "_virus"),
+                        paste0("VIBRANT_results_", genome_name, "_virus"),
+                        paste0("VIBRANT_AMG_individuals_", genome_name, "_virus.tsv"))
+  )
+
+  loaded_data <- map(paths, load_file)
+
+  # get_file_info() looks its data up by file basename, whereas `loaded_data`
+  # is keyed by tool name. Hand it a basename-keyed view so the row and
+  # sequence counts are actually found instead of silently coming back empty.
+  loaded_by_basename <- setNames(loaded_data, basename(unlist(paths, use.names = FALSE)))
+  file_info <- map_dfr(paths, ~get_file_info(.x, loaded_by_basename), .id = "file_type")
+
+  virus_count <- if (!is.null(loaded_data$genomad)) {
+    count <- sum(loaded_data$genomad$virus_score > 0.5, na.rm = TRUE)
+    log_debug(paste("Virus count:", count))
+    count
+  } else {
+    log_debug("No genomad summary found, virus count set to 0")
+    0
+  }
+
+  log_debug("Returning results from process_genome_folder")
+  list(file_info = file_info, virus_count = virus_count, loaded_data = loaded_data)
+}
+```
+
+
+```{r compile_results, message=FALSE, warning=FALSE, echo=FALSE}
+# Gather everything the report needs from the pipeline output directory
+# (params$outdir).
+# Returns a list with
+#   summary            : one row per genome (file availability, paths, counts)
+#   genome_data        : per-genome output of process_genome_folder(), named
+#                        by genome folder
+#   host_genomes_paths : name / path of every .fna under <outdir>/genomes
+#   data_gtdbtk_host   : GTDB-Tk bac120 summary (cleaned column names)
+#   data_checkm_host   : CheckM2 quality report (cleaned column names)
+# The GTDB-Tk and CheckM2 tables are read unconditionally, so rendering
+# stops with an error if either file is missing.
+compile_results <- function() {
+  base_dir <- params$outdir
+  log_debug(paste("Base directory:", base_dir))
+
+  host_analyses_dir <- file.path(base_dir, "host_analyses")
+  virus_analyses_dir <- file.path(base_dir, "virus_analyses")
+
+  # One sub-folder per genome under the geNomad output drives the report.
+  genome_folders <- list.dirs(file.path(host_analyses_dir, "genomad"),
+                              full.names = TRUE, recursive = FALSE)
+
+  log_debug("Processing genome folders")
+  genome_data <- map(genome_folders, process_genome_folder,
+                     host_analyses_dir = host_analyses_dir,
+                     virus_analyses_dir = virus_analyses_dir) %>%
+    set_names(basename(genome_folders)) %>%
+    compact()
+
+  log_debug("Creating summary dataframe")
+  summary_df <- imap_dfr(genome_data, function(genome, genome_name) {
+    file_info <- genome$file_info
+    has_file <- function(type) file_info$exists[file_info$file_type == type]
+    path_of <- function(type) file_info$path[file_info$file_type == type]
+
+    # The first file_info row is the geNomad summary. Its path is NA when the
+    # file is absent, so fall back to the folder name to keep the sample
+    # identifiable instead of producing an NA sample.
+    genomad_path <- file_info$path[1]
+
+    tibble(
+      Sample = if (is.na(genomad_path)) genome_name else basename(genomad_path),
+      Virus_Count = genome$virus_count,
+      geNomad = has_file("genomad"),
+      CheckV = has_file("checkv"),
+      VIBRANT = has_file("vibrant"),
+      dRep = has_file("drep"),
+      iPHOP = has_file("iphop"),
+      PhaTYP = has_file("phatyp"),
+      Defense_Finder = has_file("defense_finder"),
+      geNomad_Path = path_of("genomad"),
+      CheckV_Path = path_of("checkv"),
+      VIBRANT_Path = path_of("vibrant"),
+      dRep_Path = path_of("drep"),
+      PhaTYP_Path = path_of("phatyp"),
+      Defense_Finder_Path = path_of("defense_finder"),
+      Virus_Contigs = ifelse(has_file("genomad_phages"),
+                             file_info$rows[file_info$file_type == "genomad_phages"],
+                             0)
+    )
+  }) %>%
+    mutate(across(ends_with("_Path"), ~ifelse(is.na(.), "Not available", as.character(.))))
+
+  host_genomes_fasta <- list.files(
+    path = file.path(base_dir, "genomes"),
+    pattern = "\\.fna$",
+    full.names = TRUE
+  )
+
+  host_genomes_paths <- tibble(
+    name = tools::file_path_sans_ext(basename(host_genomes_fasta)),
+    path = host_genomes_fasta
+  )
+
+  data_gtdbtk_host <- read_tsv(
+    file.path(host_analyses_dir, "gtdbtk", "gtdbtk.bac120.summary.tsv"),
+    show_col_types = FALSE
+  ) %>% clean_names()
+
+  data_checkm_host <- read_tsv(
+    file.path(host_analyses_dir, "checkm2", "quality_report.tsv"),
+    show_col_types = FALSE
+  ) %>% clean_names()
+
+  log_debug("Returning summary dataframe, genome data, and host data")
+
+  # Log the shape and column names of a table under the given label.
+  log_table_shape <- function(label, tbl) {
+    log_debug(paste(paste0(label, " dimensions:"), nrow(tbl), "rows,", ncol(tbl), "columns"))
+    log_debug(paste(paste0(label, " column names:"), paste(colnames(tbl), collapse = ", ")))
+  }
+
+  log_table_shape("summary_df", summary_df)
+  log_debug(paste("genome_data length:", length(genome_data)))
+  log_debug(paste("genome_data names:", paste(names(genome_data), collapse = ", ")))
+  log_table_shape("host_genomes_paths", host_genomes_paths)
+  log_table_shape("data_gtdbtk_host", data_gtdbtk_host)
+  log_table_shape("data_checkm_host", data_checkm_host)
+
+  list(
+    summary = summary_df,
+    genome_data = genome_data,
+    host_genomes_paths = host_genomes_paths,
+    data_gtdbtk_host = data_gtdbtk_host,
+    data_checkm_host = data_checkm_host
+  )
+}
+```
+
+```{r run_main_function, echo=FALSE, message=FALSE, warning=FALSE}
+# Run the collection step once and expose its pieces as top-level objects
+# used by the remaining chunks.
+log_debug("Starting execution of main function")
+result <- compile_results()
+
+if (is.null(result)) {
+  log_debug("Main function execution failed")
+  stop("Main function execution failed")
+}
+
+summary_df <- result$summary
+genome_data <- result$genome_data
+host_genomes_paths <- result$host_genomes_paths
+data_gtdbtk_host <- result$data_gtdbtk_host
+data_checkm_host <- result$data_checkm_host
+log_debug("Data extracted successfully")
+
+# Remove any file extension from the genome names reported by GTDB-Tk and
+# CheckM2. A name that already equals a known genome is left alone, so
+# identifiers that legitimately contain a dot (e.g. "GCF_000005845.2_x") are
+# not truncated at their last dot.
+strip_genome_extension <- function(x) {
+  x <- as.character(x)
+  ifelse(x %in% host_genomes_paths$name, x, str_remove(x, "\\.[^.]+$"))
+}
+
+data_gtdbtk_host <- data_gtdbtk_host %>%
+  mutate(user_genome = strip_genome_extension(user_genome))
+
+data_checkm_host <- data_checkm_host %>%
+  mutate(name = strip_genome_extension(name))
+
+# Sample names were derived from the geNomad summary file name; drop that
+# suffix (literal dot, end of string only).
+result$summary <- result$summary %>%
+  mutate(Sample = str_remove(Sample, "_virus_summary\\.tsv$"))
+```
+
+# Summary {.tabset .tabset-fade}
+
+## Overview Table
+
+This table provides sample-by-sample information on detected viruses and key host genome statistics. It includes taxonomy, virus count, genome quality classification, CheckM2 metrics (completeness and contamination), and genome assembly statistics such as size and N50.
+
+```{r render_table, message=FALSE, warning=FALSE, echo=FALSE, results='asis'}
+# Per-sample summary with cleaned sample names.
+data <- result$summary
+
+log_debug("Assigning checkm2 host data")
+# CheckM2 columns shown in the overview table.
+checkm_host_data <- select(
+  clean_names(data_checkm_host),
+  name, completeness, contamination, contig_n50, genome_size
+)
+
+log_debug("Assigning GTDB-Tk host data")
+# GTDB-Tk classification string per genome.
+gtdbtk_data <- select(data_gtdbtk_host, user_genome, classification)
+
+log_debug("Defining color-blind friendly palette")
+# Named colours reused by the table-formatting helpers below.
+cb_friendly_colors <- list(
+  green  = "#009E73",
+  blue   = "#0072B2",
+  orange = "#E69F00",
+  red    = "#D55E00",
+  grey   = "#999999"
+)
+
+log_debug("Defining function to color cells")
+# Turn a logical vector into white-on-colour "Yes" / "No" table cells.
+#   values      : logical vector.
+#   color_true  : background for TRUE ("Yes") cells.
+#   color_false : background for FALSE ("No") cells.
+color_cell <- function(values, color_true = cb_friendly_colors$green,
+                       color_false = cb_friendly_colors$red) {
+  yes_cell <- cell_spec("Yes", color = "white", bold = TRUE, background = color_true)
+  no_cell <- cell_spec("No", color = "white", bold = TRUE, background = color_false)
+  ifelse(values, yes_cell, no_cell)
+}
+
+log_debug("Defining function to create bar plot")
+# Render each value as an inline HTML bar labelled with the value as a
+# percentage.
+#   values    : numeric vector.
+#   max_value : value that corresponds to a full-width (100%) bar.
+#   color     : bar background colour.
+# Returns a character vector the same length as `values`; missing or
+# non-numeric entries become "N/A". The bar width is clamped to [0, 100]%.
+create_bar_plot <- function(values, max_value, color = cb_friendly_colors$grey) {
+  vapply(values, function(value) {
+    if (is.na(value) || !is.numeric(value)) {
+      return("N/A")
+    }
+    bar_width <- min(max(value, 0), max_value) / max_value * 100
+    # Three conversions, in argument order: colour, bar width, label value.
+    sprintf(
+      '<div style="background-color: %s; width: %.1f%%; min-width: 3em; color: white; text-align: center; white-space: nowrap;">%.1f%%</div>',
+      color, bar_width, value
+    )
+  }, character(1))
+}
+
+log_debug("Defining function to format large numbers")
+# Abbreviate numbers with K / M / G suffixes (one decimal place).
+#   x : numeric vector.
+# Returns a character vector the same length as `x`; values below 1000 are
+# printed as-is and missing or non-numeric entries become "N/A".
+# vapply() keeps the result a character vector even for empty input.
+format_large_number <- function(x) {
+  vapply(x, function(value) {
+    if (is.na(value) || !is.numeric(value)) {
+      return("N/A")
+    }
+    if (value < 1000) {
+      return(as.character(value))
+    }
+    if (value < 1e6) {
+      return(paste0(round(value / 1e3, 1), "K"))
+    }
+    if (value < 1e9) {
+      return(paste0(round(value / 1e6, 1), "M"))
+    }
+    paste0(round(value / 1e9, 1), "G")
+  }, character(1))
+}
+
+log_debug("Defining function to extract last known taxonomy level")
+# Find the deepest rank of a ";"-separated classification string that has a
+# non-empty name after its "<letter>__" prefix.
+#   classification : a single classification string (may be NA or "").
+# Returns list(level = <text before "__">, name = <text after the prefix>),
+# or level = name = "Unknown" when nothing usable is present.
+extract_last_known_taxonomy <- function(classification) {
+  unknown <- list(level = "Unknown", name = "Unknown")
+  if (is.na(classification) || classification == "") {
+    return(unknown)
+  }
+
+  ranks <- strsplit(classification, ";")[[1]]
+  taxon_names <- sub("^[a-z]__", "", ranks)
+  filled <- which(taxon_names != "")
+  if (length(filled) == 0) {
+    return(unknown)
+  }
+
+  deepest <- filled[length(filled)]
+  list(level = sub("__.*$", "", ranks[deepest]), name = taxon_names[deepest])
+}
+
+log_debug("Defining function to format taxonomy")
+# Produce the display label for a classification string:
+#   "Unknown"        when no rank could be extracted,
+#   the species name when the deepest rank is "s",
+#   "<name> sp."     otherwise (underscores replaced by spaces).
+# NOTE(review): the empty-string wrappers below look like markup that was
+# lost from the source - confirm against the original file.
+format_taxonomy <- function(classification) {
+  taxon <- extract_last_known_taxonomy(classification)
+  rank <- taxon$level
+
+  if (rank == "Unknown") {
+    return("Unknown")
+  }
+  if (rank == "s") {
+    return(paste0("", taxon$name, ""))
+  }
+
+  genus <- str_replace_all(taxon$name, "_", " ")
+  paste0("", genus, " sp.")
+}
+
+log_debug("Defining function to calculate quality score and determine genome quality class")
+# Score one genome and assign it a draft-quality class.
+#   completeness, contamination : single numeric values (may be NA).
+# Score = completeness - 5 * contamination. Classes:
+#   High-quality draft   : completeness > 90  and contamination < 5
+#   Medium-quality draft : completeness >= 50 and contamination < 10
+#   Low-quality draft    : everything else
+# Returns list(score, class, numeric_score); score and class are coloured
+# cell_spec() strings, numeric_score is the raw score (NA if either input
+# is NA).
+calculate_quality_score_and_class <- function(completeness, contamination) {
+  badge <- function(text, background) {
+    cell_spec(text, color = "white", bold = TRUE, background = background)
+  }
+
+  if (is.na(completeness) || is.na(contamination)) {
+    return(list(
+      score = badge("N/A", cb_friendly_colors$grey),
+      class = badge("Unknown", cb_friendly_colors$grey),
+      numeric_score = NA
+    ))
+  }
+
+  quality_score <- completeness - (5 * contamination)
+
+  if (completeness > 90 && contamination < 5) {
+    quality_class <- "High-quality draft"
+    badge_colour <- cb_friendly_colors$green
+  } else if (completeness >= 50 && contamination < 10) {
+    quality_class <- "Medium-quality draft"
+    badge_colour <- cb_friendly_colors$blue
+  } else {
+    quality_class <- "Low-quality draft"
+    badge_colour <- cb_friendly_colors$red
+  }
+
+  list(
+    score = badge(sprintf("%.1f", quality_score), badge_colour),
+    class = badge(quality_class, badge_colour),
+    numeric_score = quality_score
+  )
+}
+
+log_debug("Preparing the data")
+
+# Assemble the overview table: attach CheckM2 metrics and GTDB-Tk
+# classification to each sample, derive the formatted display columns, and
+# keep only the ten columns shown in the report.
+table_data <- data %>%
+ #mutate(Sample = basename(Sample) %>% trim_sample_name()) %>%
+ mutate(Sample = basename(Sample)) %>%
+ # Both joins match on the sample name.
+ left_join(checkm_host_data, by = c("Sample" = "name")) %>%
+ left_join(gtdbtk_data, by = c("Sample" = "user_genome")) %>%
+ mutate(
+ # One list(score, class, numeric_score) per row.
+ quality_data = pmap(list(as.numeric(completeness),
+ as.numeric(contamination)),
+ calculate_quality_score_and_class),
+ Quality_Score = map_chr(quality_data, ~.$score),
+ Genome_Quality = map_chr(quality_data, ~.$class),
+ Quality_Score_Numeric = map_dbl(quality_data, ~.$numeric_score),
+ Virus_Count_Numeric = as.numeric(Virus_Count),
+ # Badge colour: red for 0 viruses, blue for exactly 1, green for more.
+ Virus_Count = cell_spec(
+ Virus_Count,
+ color = "white",
+ bold = TRUE,
+ background = case_when(
+ Virus_Count == 0 ~ cb_friendly_colors$red,
+ Virus_Count == 1 ~ cb_friendly_colors$blue,
+ Virus_Count > 1 ~ cb_friendly_colors$green
+ )
+ ),
+ Completeness_Numeric = as.numeric(completeness),
+ # Both metrics are drawn as bars on a 0-100 scale.
+ Completeness = create_bar_plot(as.numeric(completeness), 100),
+ Contamination = create_bar_plot(as.numeric(contamination), 100),
+ `N50 (contigs)` = format_large_number(as.numeric(contig_n50)),
+ `Genome size (bp)` = format_large_number(as.numeric(genome_size)),
+ `GTDB Taxonomy` = sapply(classification, format_taxonomy)
+ ) %>%
+ mutate(`#` = row_number()) %>%
+ select(`#`, Sample, `GTDB Taxonomy`, Virus_Count,
+ Quality_Score, Genome_Quality, Completeness, Contamination,
+ `Genome size (bp)`, `N50 (contigs)`)
+
+log_debug("Creating the table")
+# escape = FALSE so the markup produced by cell_spec() and the formatting
+# helpers is emitted as-is rather than escaped.
+kbl(table_data, escape = FALSE,
+ align = c("c", "l", "l", "c", rep("c", 2), rep("r", 2), rep("r", 2))) %>%
+ kable_paper(full_width = TRUE) %>%
+ column_spec(1, bold = TRUE, width = "2em") %>%
+ column_spec(2:3, bold = TRUE) %>%
+ column_spec(4:5, width = "5em") %>%
+ column_spec(6:7, width = "60px") %>%
+ column_spec(8:9, width = "4em") %>%
+ # Group header widths (4 + 2 + 2 + 2) cover the ten selected columns.
+ add_header_above(c(" " = 4, "Host Genome Quality" = 2, "CheckM Metrics" = 2,
+ "Statistics" = 2)) %>%
+ kable_styling(bootstrap_options = c("striped", "hover", "condensed", "responsive"),
+ font_size = 9,
+ html_font = "Arial",
+ position = "left") %>%
+ row_spec(0, bold = TRUE, color = "white", background = "#333333") %>%
+ row_spec(0, extra_css = "border-bottom: 2px solid #000000;") %>%
+ column_spec(9, extra_css = "border-right: 2px solid #000000;") %>%
+ scroll_box(width = "100%", height = "100%",
+ extra_css = "overflow-x: auto; border: 1px solid #ccc; border-radius: 4px;")
+```
+
+## Tools Documentation
+
+The following tools are utilized in this workflow. Each tool name below is a link to its respective documentation.
+
+**Host-analyses**
+
+- [**CheckM2 v1.1.0**](https://github.com/chklovski/CheckM2): Assesses the quality of the host. Most useful when working with assembled genomes.
+
+- [**GTDB-Tk v2.3.2**](https://ecogenomics.github.io/GTDBTk/index.html): Assigns a taxonomy to the host genome.
+
+- [**Defense-Finder v2.0.0, models 2.0.2**](https://github.com/mdmparis/defense-finder): Detects known anti-phage systems in the host.
+
+- [**geNomad v1.7.1**](https://portal.nersc.gov/genomad/): Predicts and annotates proviruses.
+
+**Virus-analyses**
+
+- [**CheckV v1.0.1**](https://pypi.org/project/checkv/): Evaluates the quality of viral genomes.
+
+- [**dRep v3.4.5**](https://drep.readthedocs.io/en/latest/): Compares viral genomes within the same host.
+
+- [**Abricate v1.0.1**](https://github.com/tseemann/abricate): Identifies virulence genes in the prophage genomes with the [VFDB database](https://www.mgc.ac.cn/VFs/).
+
+- [**iPHOP v1.3.3**](https://bitbucket.org/srouxjgi/iphop/src/main/): Predicts other potential hosts of viral genomes.
+
+- [**VIBRANT v1.2.1**](https://github.com/AnantharamanLab/VIBRANT): Used to identify Auxiliary Metabolic Genes in the prophages.
+
+## Workflow
+
+The workflow begins with the input of bacterial genomes by the user. These are processed by the **host-analyses** tools. Prophage prediction is
+performed by **geNomad** only. Afterward, prophages identified by **geNomad** are processed by the **virus-analyses** tools.
+
+If more than one prophage is recovered in the same sample, **dRep** is used to compare and determine if the viruses are identical or different within the same host.
+
+*PLACEHOLDER FOR PIPELINE*
+
+## R Session Info
+
+Information about the R session used to render this markdown document.
+
+```{r}
+sessionInfo()
+```
+
+
+# Results {.tabset .tabset-fade}
+
+```{r}
+# Sorted, de-duplicated list of every sample name that appears in either the
+# CheckM2 table or the per-sample summary.
+combined_unique <- bind_rows(
+  transmute(checkm_host_data, Sample = name),
+  select(data, Sample)
+) %>%
+  distinct(Sample) %>%
+  arrange(Sample)
+
+log_debug(paste("combined_unique samples:", paste(combined_unique$Sample, collapse = ", ")))
+```
+
+
+
+```{r main_workflow, fig.width=6, fig.height=6, out.height="100%", out.width='100%', dpi=300, fig.align='center', warning=FALSE, message=FALSE, results='asis'}
+# Convert the provirus rows of a geNomad summary into a GRanges object.
+#   data_genomad : geNomad virus summary (cleaned column names); rows whose
+#                  topology is "Provirus" are kept.
+# Sequence names are short contig labels "c1", "c2", ... numbered by the
+# factor order of the contig names that carry a provirus. Metadata columns:
+# length (range width), score (virus_score), n_hallmarks, n_hallmarks_pos
+# (half the start-to-end distance).
+# NOTE(review): the numbering here only sees provirus-carrying contigs -
+# confirm it lines up with the contig labels used by the plotting code.
+process_proviruses <- function(data_genomad) {
+  proviruses <- data_genomad %>%
+    dplyr::filter(topology == "Provirus") %>%
+    dplyr::mutate(
+      contig = sub("\\|provirus_.*", "", seq_name),          # text before "|provirus"
+      contig = paste0("c", as.numeric(factor(contig)))       # c1, c2, ...
+    ) %>%
+    dplyr::select(seq_name, coordinates, length, contig, virus_score, n_hallmarks) %>%
+    tidyr::separate(coordinates, into = c("start", "end"), sep = "-")
+
+  proviruses$start <- as.integer(proviruses$start)
+  proviruses$end <- as.integer(proviruses$end)
+
+  features <- GRanges(
+    seqnames = proviruses$contig,
+    ranges = IRanges(start = proviruses$start, end = proviruses$end)
+  )
+  features$length <- width(ranges(features))
+  features$score <- as.numeric(proviruses$virus_score)
+  features$n_hallmarks <- as.numeric(proviruses$n_hallmarks)
+  features$n_hallmarks_pos <- abs(start(features) - end(features)) / 2
+
+  features
+}
+
+# Draw the circular host-genome ideogram and mark each provirus on it.
+#   genome_current         : genome name; the FASTA is read from
+#                            <params$outdir>/genomes/<genome_current>.fna.
+#   proviruses_gr_features : GRanges of provirus regions whose seqnames use
+#                            the short contig labels ("c1", "c2", ...).
+# Sequences are relabelled c1, c2, ... in the order reported by seqlevels().
+# When there are no provirus features only the empty ideogram is drawn.
+# NOTE(review): the feature seqnames must refer to the same contigs as the
+# labels assigned here - confirm the caller numbers contigs the same way.
+plot_genome_ideogram <- function(genome_current, proviruses_gr_features) {
+  fasta_file_path <- file.path(params$outdir, "genomes", paste0(genome_current, ".fna"))
+  genome_ideogram <- getIdeogramData(fasta_file = fasta_file_path)
+
+  # Replace every seqlevel with c1, c2, c3, ...
+  new_seqlevels <- paste0("c", seq_along(seqlevels(genome_ideogram)))
+  names(new_seqlevels) <- seqlevels(genome_ideogram)
+  genome_ideogram <- GenomeInfoDb::renameSeqlevels(genome_ideogram, new_seqlevels)
+  colours <- rep("#a58bc5", length(seqlevels(genome_ideogram)))
+
+  par(mar = c(2, 2, 2, 2)) # minimal margins around the plot
+
+  gmovizInitialise(genome_ideogram,
+                   sector_colours = colours,
+                   sector_border_colours = colours,
+                   sector_labels = FALSE)
+
+  # Nothing to highlight or label: stop after drawing the bare ideogram
+  # rather than indexing into an empty GRanges.
+  if (length(proviruses_gr_features) == 0) {
+    return(invisible(NULL))
+  }
+
+  contig_ids <- as.character(seqnames(proviruses_gr_features))
+  region_starts <- as.numeric(start(proviruses_gr_features))
+  region_ends <- as.numeric(end(proviruses_gr_features))
+
+  for (i in seq_along(proviruses_gr_features)) {
+    region <- data.frame(start = region_starts[i], end = region_ends[i])
+    circos.genomicRect(seqnames = contig_ids[i],
+                       region,
+                       ytop = .5,
+                       ybottom = 0,
+                       track.index = 1,
+                       sector.index = contig_ids[i],
+                       border = "#e9d27d",
+                       col = "#e9d27d")
+  }
+
+  # Label each provirus with its contig and size (mb above one million bp,
+  # kb otherwise).
+  region_length <- as.numeric(proviruses_gr_features$length)
+  size_text <- ifelse(region_length > 1000000,
+                      paste0(round(region_length / 1000000, 2), "mb"),
+                      paste0(round(region_length / 1000, 2), "kb"))
+  labels <- paste0(contig_ids, " (", size_text, ")")
+  circos.labels(sectors = contig_ids,
+                x = region_starts,
+                labels,
+                facing = "clockwise")
+}
+
+# Emit the complete report section for one sample: host genome tables, the
+# ideogram with proviruses, one sub-section per prophage, and the optional
+# dRep / Abricate / iPHOP / VIBRANT sections.
+#   sample             : sample (genome) name.
+#   combined_unique    : table of all sample names (not used in this body).
+#   host_genomes_paths : tibble with `name` and `path` of the host FASTA files.
+#   genome_data        : per-genome list as built by compile_results(); the
+#                        `loaded_data` element of the sample's entry is used.
+# Also reads `data_gtdbtk_host` and `data_checkm_host` from the enclosing
+# environment. Output is written with cat(); any error is logged and printed
+# into the document instead of aborting the render. Optional result tables
+# that were not loaded (NULL) are skipped.
+process_sample <- function(sample, combined_unique, host_genomes_paths, genome_data) {
+  # Write a data frame into the document as a striped, scrollable HTML table.
+  print_table <- function(tbl) {
+    tbl %>%
+      kbl() %>%
+      kable_styling(bootstrap_options = c("striped", "hover", "condensed", "responsive")) %>%
+      kable_paper("striped", full_width = TRUE) %>%
+      scroll_box(width = "100%", height = "100%") %>%
+      cat()
+  }
+
+  # TRUE when an optional table was loaded and has at least one row.
+  has_rows <- function(tbl) !is.null(tbl) && nrow(tbl) > 0
+
+  tryCatch({
+    log_debug(paste("Starting to process sample:", sample))
+
+    # Check if sample exists in genome_data
+    if (!(sample %in% names(genome_data))) {
+      log_debug(paste("Sample", sample, "not found in genome_data"))
+      cat(paste("Error: Sample", sample, "not found in genome_data\n\n"))
+      return()
+    }
+
+    cat(paste("## ", sample, "{.tabset .tabset-fade} \n\n"))
+
+    host_genome_path <- host_genomes_paths$path[host_genomes_paths$name == sample]
+    if (length(host_genome_path) == 0) {
+      log_debug(paste("Host genome path not found for sample:", sample))
+      cat(paste("Error: Host genome path not found for sample", sample, "\n\n"))
+      return()
+    }
+
+    host_genome_ideogram <- tryCatch({
+      getIdeogramData(fasta_file = host_genome_path)
+    }, error = function(e) {
+      log_debug(paste("Error loading host genome ideogram for sample", sample, ":", conditionMessage(e)))
+      NULL
+    })
+
+    if (is.null(host_genome_ideogram)) {
+      cat(paste("Error: Unable to load host genome ideogram for sample", sample, "\n\n"))
+      return()
+    }
+
+    sample_data <- genome_data[[sample]]$loaded_data
+    genomad_summary <- sample_data$genomad
+    genomad_annotation <- sample_data$genomad_annotations
+    checkv_data <- sample_data$checkv
+    defense_finder_data <- sample_data$defense_finder
+    abricate_data <- sample_data$abricate
+    iphop_data <- sample_data$iphop
+    vibrant_data <- sample_data$vibrant
+
+    cat("### Host Genome\n\n")
+
+    cat("**GTDB-Tk taxonomy**: \n\n")
+    data_gtdbtk_host %>%
+      filter(user_genome == sample) %>%
+      select(classification) %>%
+      print_table()
+
+    # CheckM2 summary for this genome
+    cat("**CheckM2 Summary**:\n\n")
+    data_checkm_host %>%
+      filter(`name` == sample) %>%
+      clean_names %>%
+      select(total_contigs, contig_n50, completeness, contamination) %>%
+      print_table()
+
+    # Display defense-finder as a table
+    if (has_rows(defense_finder_data)) {
+      cat("**Defense-Finder Systems**:\n\n")
+
+      defense_finder_data %>%
+        select(sys_id, type, subtype, sys_beg, sys_end, protein_in_syst, genes_count, name_of_profiles_in_sys) %>%
+        print_table()
+    } else {
+      cat("No Defense-Finder systems detected.\n\n")
+    }
+
+    if (!has_rows(genomad_summary)) {
+      log_debug(paste("No geNomad summary data found for sample:", sample))
+      return()
+    }
+
+    # Host size used to scale the phage plots: the whole genome when it is a
+    # single sequence, otherwise only the contigs that carry a virus.
+    if (length(seqlevels(host_genome_ideogram)) == 1) {
+      host_genome_size <- sum(width(host_genome_ideogram))
+    } else {
+      virus_containing_contigs <- unique(sub("\\|.*", "", genomad_summary$seq_name))
+      virus_containing_contigs <- paste0("c_", as.numeric(factor(virus_containing_contigs)))
+      filtered_host_genome <- subset_and_update_ideogram(host_genome_ideogram, virus_containing_contigs)
+      host_genome_size <- sum(width(filtered_host_genome))
+    }
+
+    # Process proviruses
+    proviruses_gr_features <- process_proviruses(genomad_summary)
+
+    cat("**Genomad and CheckV Summary**:\n\n")
+    virus_overview <- genomad_summary %>%
+      select(seq_name, taxonomy, topology, coordinates, length)
+    # CheckV columns are added only when the CheckV table was loaded.
+    if (!is.null(checkv_data)) {
+      virus_overview <- virus_overview %>%
+        left_join(
+          checkv_data %>% select(contig_id, gene_count, viral_genes, checkv_quality, miuvig_quality),
+          by = c("seq_name" = "contig_id")) %>%
+        select(seq_name, length, gene_count, viral_genes, checkv_quality, miuvig_quality, taxonomy, topology, coordinates)
+    }
+    print_table(virus_overview)
+
+    cat("**Host Genome Ideogram with Phages**:\n\n")
+    plot_genome_ideogram(sample, proviruses_gr_features)
+    cat('In this circular plot, **"c"** indicates the contig, and the number that follows (e.g., **c1**) represents the contig number.
+If multiple contigs are present in the genome, each will be shown with a distinct label (e.g., **c1**, **c2**, etc.).\n\n')
+    cat("\n\n")
+
+    # Process phage genomes
+    cat("### Prophages {.tabset .tabset-fade} \n\n")
+    # No space before the closing "**", otherwise the bold marker is not rendered.
+    cat("**Select prophage to show:** \n\n")
+    for (i in seq_len(nrow(genomad_summary))) {
+      log_debug(paste("Processing phage", i, "of", nrow(genomad_summary), "for sample", sample))
+      process_phage(genomad_summary[i, ], genomad_summary, genomad_annotation, checkv_data, host_genome_size)
+    }
+
+    # Plot dREP if applicable
+    if (nrow(genomad_summary) > 1) {
+      cat("### vOTUs\n\n")
+      plot_drep(sample, genomad_summary)
+    }
+
+    # Table with Abricate data
+    if (has_rows(abricate_data)) {
+      cat("### Virulence Genes {.tabset .tabset-fade} \n\n")
+      cat("Screening of virulence genes present in the prophage contigs. \n\n")
+      abricate_data %>%
+        select(-any_of("number_file")) %>%
+        print_table()
+      cat("\n\n")
+    }
+
+    # Table with iPHOP
+    if (has_rows(iphop_data)) {
+      cat("### Prophage-Host Prediction {.tabset .tabset-fade} \n\n")
+      cat("Prediction of potential hosts for the prophage contigs. \n\n")
+      print_table(iphop_data)
+      cat("\n\n")
+    }
+
+    # Table with VIBRANT AMGs
+    if (has_rows(vibrant_data)) {
+      cat("### AMG Predictions {.tabset .tabset-fade} \n\n")
+      cat("Prediction of auxiliary metabolic genes in the prophage contigs. \n\n")
+      print_table(vibrant_data)
+      cat("\n\n")
+    }
+
+    log_debug(paste("Finished processing sample:", sample))
+  }, error = function(e) {
+    log_debug(paste("Error in process_sample for", sample, ":", conditionMessage(e)))
+    cat(paste("Error processing sample", sample, ":", conditionMessage(e), "\n\n"))
+  })
+}
+
+# Emit the report sub-section for a single virus: heading, phage-host circos
+# plot, and the table of its annotated genes.
+#   virus              : one-row slice of the geNomad summary.
+#   genomad_summary    : the full geNomad summary of the sample.
+#   genomad_annotation : geNomad gene table of the sample (column `gene`).
+#   checkv_data        : CheckV table, passed through to the plot.
+#   host_genome_size   : host size in bp, passed through to the plot.
+# Provirus coordinates are parsed from the "provirus_<start>_<end>" part of
+# seq_name; names without it yield NA coordinates.
+process_phage <- function(virus, genomad_summary, genomad_annotation, checkv_data, host_genome_size) {
+  cat(paste("#### Phage ID:", virus$seq_name, " {.tabset .tabset-fade} \n\n"))
+
+  provirus_start <- as.numeric(sub(".*provirus_(\\d+)_\\d+", "\\1", virus$seq_name))
+  provirus_end <- as.numeric(sub(".*provirus_\\d+_(\\d+)", "\\1", virus$seq_name))
+  virus_length <- provirus_end - provirus_start + 1
+
+  # Genes of this virus are the ids made of "<seq_name>_" plus a gene number
+  # (assumed geNomad id layout - TODO confirm). Matching the prefix literally
+  # keeps regex metacharacters in contig names from distorting the filter
+  # and also covers sequences that are not proviruses.
+  gene_prefix <- paste0(virus$seq_name, "_")
+  gene_ids <- as.character(genomad_annotation$gene)
+  belongs_to_virus <- startsWith(gene_ids, gene_prefix) &
+    grepl("^[0-9]+$", substring(gene_ids, nchar(gene_prefix) + 1L))
+
+  current_annotations <- genomad_annotation[belongs_to_virus, ] %>%
+    mutate(arrow_pos = ifelse(strand == -1, "start", "end"))
+
+  cat("\n\n**Phage–Host Genome Ideogram:**\n\n")
+
+  plot_phage_circos(virus, genomad_summary, current_annotations, virus_length, host_genome_size, provirus_start, provirus_end, checkv_data)
+
+  cat("\n\n")
+  cat("\n\n**Genes Annotation (geNomad):**\n\n")
+
+  current_annotations %>%
+    select(gene, length, marker, annotation_accessions, annotation_description) %>%
+    kbl() %>%
+    kable_styling(bootstrap_options = c("striped", "hover", "condensed", "responsive")) %>%
+    kable_paper() %>%
+    cat()
+  cat("\n\n")
+}
+
+# Draw the phage-host ideogram of one provirus with circlize.
+# Sector "Main" shows the host contig with every provirus found on it; sector
+# "Zoom" shows the selected provirus with one arrow per gene.
+# virus: record of the selected virus; `seq_name` and `taxonomy` are read.
+# genomad_summary: virus summary table; `seq_name` and `length` are read.
+# current_annotations: gene table of the provirus (`start`, `end`, `arrow_pos`,
+#   `annotation_description`); zero rows are allowed.
+# virus_length, host_genome_size, provirus_start, provirus_end: numeric scalars;
+#   the plot is skipped (NULL returned) when one is NA or out of range.
+# checkv_data: table with `contig_id` and the CheckV columns printed in the plot.
+# Called for its plotting side effect; errors are logged, never raised.
+plot_phage_circos <- function(virus, genomad_summary, current_annotations, virus_length, host_genome_size, provirus_start, provirus_end, checkv_data) {
+  tryCatch({
+    log_debug("Starting plot_phage_circos function")
+    log_debug(paste("Current virus:", virus$seq_name))
+    log_debug(paste("Virus length:", virus_length))
+    log_debug(paste("Host genome size:", host_genome_size))
+    log_debug(paste("Provirus start:", provirus_start))
+    log_debug(paste("Provirus end:", provirus_end))
+
+    # Check for NA or invalid values in input parameters
+    if (is.na(virus_length) || virus_length <= 0) {
+      log_debug("Error: Invalid virus length")
+      return(NULL)
+    }
+    if (is.na(host_genome_size) || host_genome_size <= 0) {
+      log_debug("Error: Invalid host genome size")
+      return(NULL)
+    }
+    if (is.na(provirus_start) || provirus_start < 0) {
+      log_debug("Error: Invalid provirus start position")
+      return(NULL)
+    }
+    if (is.na(provirus_end) || provirus_end <= provirus_start) {
+      log_debug("Error: Invalid provirus end position")
+      return(NULL)
+    }
+
+    # Extract contig information
+    current_contig <- sub("\\|.*", "", virus$seq_name)
+    log_debug(paste("Current contig:", current_contig))
+
+    # Match the contig id exactly: a regex prefix match would treat "." as a
+    # wildcard and would also select contigs that merely share the prefix.
+    contig_ids <- sub("\\|.*", "", genomad_summary$seq_name)
+    contig_viruses <- genomad_summary[contig_ids %in% current_contig, ]
+    if (nrow(contig_viruses) == 0) {
+      log_debug("Error: No viruses found for the current contig")
+      return(NULL)
+    }
+
+    # NOTE(review): this is the largest trailing number of the seq_names (the last provirus end), not a measured contig length - confirm intended.
+    contig_length <- max(as.numeric(sub(".*_(\\d+)$", "\\1", contig_viruses$seq_name)))
+    if (is.na(contig_length) || contig_length <= 0) {
+      contig_length <- virus_length # Use virus length as fallback if contig length is invalid
+      log_debug(paste("Using virus length as contig length:", contig_length))
+    } else {
+      log_debug(paste("Contig length:", contig_length))
+    }
+
+    if (provirus_end > contig_length) {
+      log_debug("Error: Provirus end position exceeds contig length")
+      return(NULL)
+    }
+
+    # Parse the provirus coordinates from the sequence names once; the Main track and the labels both use them.
+    start_positions <- as.numeric(sub(".*provirus_(\\d+)_\\d+", "\\1", contig_viruses$seq_name))
+    end_positions <- as.numeric(sub(".*provirus_\\d+_(\\d+)", "\\1", contig_viruses$seq_name))
+
+    log_debug("Clearing circos")
+    circos.clear()
+
+    log_debug("Setting circos parameters")
+    circos.par(start.degree = 180, gap.degree = 10, track.margin = c(0.01, 0.01))
+
+    main_color <- "#a58bc5"
+    zoom_color <- "#e9d27d"
+
+    zoom_start <- (provirus_start / contig_length) * 100
+    zoom_end <- (provirus_end / contig_length) * 100
+
+    log_debug(paste("Zoom start:", zoom_start))
+    log_debug(paste("Zoom end:", zoom_end))
+
+    log_debug("Initializing circos")
+    circos.initialize(factors = c("Zoom", "Main"), xlim = c(0, 100))
+
+    # Render base-pair positions with a Mb / Kb / bp unit (vectorised).
+    format_genome_labels <- function(x) {
+      ifelse(x >= 1e6, paste0(round(x / 1e6, 2), " Mb"),
+             ifelse(x >= 1e3, paste0(round(x / 1e3, 2), " Kb"),
+                    paste0(x, " bp")))
+    }
+
+    log_debug("Adding link")
+    tryCatch({
+      circos.link("Main", c(zoom_start, zoom_end), "Zoom", c(0, 100),
+                  rou1 = 0.8,
+                  rou2 = 0.97,
+                  h.ratio = 0.55, # width?
+                  lty = 2,
+                  lwd = 0.5,
+                  h2 = 1,
+                  col = "grey99", border = "grey80")
+    }, error = function(e) {
+      log_debug(paste("Error in circos.link:", e$message))
+    })
+
+    log_debug("Adding zoom track")
+    circos.track(factors = "Zoom", ylim = c(0, 1), track.height = 0.15,
+                 panel.fun = function(x, y) {
+                   circos.rect(0, 0, 100, 1, col = zoom_color, border = NA)
+                   axis_labels <- seq(0, virus_length, length.out = 6)
+                   axis_positions <- seq(0, 100, length.out = 6)
+                   circos.axis(h = "top", major.at = axis_positions,
+                               labels = format_genome_labels(axis_labels),
+                               labels.cex = 0.7, direction = "outside")
+
+                   # seq_len() draws nothing for a provirus without genes; 1:nrow() would visit rows 1 and 0 and abort the plot.
+                   for (i in seq_len(nrow(current_annotations))) {
+                     gene_start <- current_annotations$start[i]
+                     gene_end <- current_annotations$end[i]
+                     arrow_start <- (gene_start - provirus_start) / virus_length * 100
+                     arrow_end <- (gene_end - provirus_start) / virus_length * 100
+                     is_unknown <- is.na(current_annotations$annotation_description[i])
+
+                     circos.arrow(arrow_start, arrow_end, y1 = 0, y2 = 1,
+                                  arrow.head.width = 0.75, arrow.head.length = cm_x(0.1),
+                                  arrow.position = current_annotations$arrow_pos[i],
+                                  col = if (is_unknown) "grey" else "#7fbfff",
+                                  border = if (is_unknown) "grey20" else "darkblue")
+                   }
+                 }, bg.border = NA)
+
+    log_debug("Adding main track")
+    circos.track(factors = "Main", ylim = c(0, 1), track.height = 0.1,
+                 panel.fun = function(x, y) {
+                   circos.rect(xleft = 0, ybottom = 0, xright = 100, ytop = 1, col = main_color, border = NA)
+
+                   for (i in seq_len(nrow(contig_viruses))) {
+                     virus_start_percent <- (start_positions[i] / contig_length) * 100
+                     virus_end_percent <- (end_positions[i] / contig_length) * 100
+
+                     rect_color <- if (contig_viruses$seq_name[i] == virus$seq_name) zoom_color else adjustcolor(zoom_color, alpha.f = 0.7)
+
+                     circos.rect(xleft = virus_start_percent, ybottom = 0,
+                                 xright = virus_end_percent, ytop = 1,
+                                 col = rect_color, border = NA)
+                   }
+
+                   axis_labels <- seq(0, contig_length, length.out = 6)
+                   axis_positions <- seq(0, 100, length.out = 6)
+                   circos.axis(h = "top", major.at = axis_positions,
+                               labels = format_genome_labels(axis_labels),
+                               labels.cex = 0.7, direction = "outside")
+                 }, bg.border = NA)
+
+    log_debug("Locating phage positions")
+    phage_positions <- ((start_positions + end_positions) / 2 / contig_length) * 100
+
+    log_debug("Annotating names on phage positions")
+    # Create phage labels with the desired format
+    phage_labels <- paste0(round(contig_viruses$length / 1e3, 2), " Kb")
+
+    # Apply labels to circos plot
+    circos.labels(
+      sectors = "Main",
+      x = phage_positions,
+      labels = phage_labels,
+      facing = "reverse.clockwise",
+      niceFacing = TRUE,
+      col = "black",
+      cex = 0.6,
+      side = "inside",
+      connection_height = 0.02,
+      line_col = "gray"
+    )
+
+    center_x <- 50
+    taxonomy <- virus$taxonomy
+
+    log_debug("Adding taxonomy and virus name to the plot")
+    circos.text(x = center_x, y = -0.2, labels = taxonomy,
+                sector.index = "Zoom", track.index = 1,
+                facing = "bending.inside", niceFacing = TRUE,
+                adj = c(0.5, 0.7), cex = 0.8)
+
+    # %in% never yields NA, so rows with a missing contig_id are not selected.
+    checkv_info <- checkv_data[checkv_data$contig_id %in% virus$seq_name, ]
+    if (nrow(checkv_info) > 0) {
+      circos.text(
+        x = center_x, y = -0.5,
+        labels = paste("CheckV Quality:", checkv_info$checkv_quality, " - miuvig Quality:", checkv_info$miuvig_quality),
+        sector.index = "Zoom", track.index = 2,
+        facing = "bending.inside", niceFacing = TRUE,
+        adj = c(0.5, 0), cex = 0.7
+      )
+
+      circos.text(
+        x = center_x, y = -1.5,
+        labels = paste("Gene Count:", checkv_info$gene_count, " - Viral Genes:", checkv_info$viral_genes, " - Host Genes:", checkv_info$host_genes),
+        sector.index = "Zoom", track.index = 2,
+        facing = "bending.inside", niceFacing = TRUE,
+        adj = c(0.5, 0), cex = 0.7
+      )
+
+      circos.text(
+        x = center_x, y = -2.5,
+        labels = paste("Completeness:", checkv_info$completeness, " - Contamination:", checkv_info$contamination),
+        sector.index = "Zoom", track.index = 2,
+        facing = "bending.inside", niceFacing = TRUE,
+        adj = c(0.5, 0), cex = 0.7
+      )
+    }
+
+    log_debug("Adding legend")
+    legend("topright",
+           legend = c("Annotated gene", "Unknown gene"),
+           fill = c("#7fbfff", "grey"),
+           border = c("darkblue", "grey20"),
+           cex = 0.8,
+           bty = "n")
+
+    log_debug("Clearing circos")
+    circos.clear()
+    log_debug("Finished plot_phage_circos function successfully")
+  }, error = function(e) {
+    log_debug(paste("Error in plot_phage_circos:", conditionMessage(e)))
+    circos.clear()
+  })
+}
+
+# Report the dRep clustering of one sample: cluster table plus primary dendrogram.
+# sample: sub-directory name below <outdir>/virus_analyses/drep_compare.
+# genomad_summary: table whose seq_name column labels the rows of Cdb.csv.
+plot_drep <- function(sample, genomad_summary) {
+  drep_dir <- file.path(params$outdir, "virus_analyses", "drep_compare", sample)
+  drep_data <- read_csv(file.path(drep_dir, "data_tables", "Cdb.csv")) %>% clean_names()
+  # NOTE(review): assumes Cdb.csv rows are in genomad_summary order - confirm. Bind only on equal row counts so names are never recycled.
+  if (nrow(drep_data) == length(genomad_summary$seq_name)) {
+    drep_data <- cbind(seq_name = genomad_summary$seq_name, drep_data)
+  }
+  cat("When more than 1 phage is detected in the host genome, we perform a clustering step using the tool dRep.\n\n")
+  cat("A threshold of 0.95 was applied to the ANI similarity index to define clusters of virus operational taxonomic units (vOTUs).")
+  cat("\n\n**Final cluster designations**\n\n")
+  drep_data %>%
+    kbl() %>%
+    kable_styling(bootstrap_options = c("striped", "hover", "condensed", "responsive")) %>%
+    kable_paper("striped", full_width = TRUE) %>%
+    cat()
+  cat("\n\n")
+  # Embed the dendrogram as a base64 PNG data URI inside an <img> tag (the former empty sprintf format emitted nothing).
+  plot_path <- file.path(drep_dir, "figures", "Primary_clustering_dendrogram.pdf")
+  png_path <- file.path(drep_dir, "figures", "Primary_clustering_dendrogram.png")
+  if (file.exists(plot_path)) {
+    pdftools::pdf_convert(plot_path, format = "png", pages = 1, filenames = png_path, verbose = FALSE, dpi = 150)
+    base64_str <- base64enc::dataURI(file = png_path, mime = "image/png")
+    cat("**Primary clustering plot**\n\n")
+    cat('<img src="', base64_str, '" alt="Primary clustering dendrogram" style="max-width: 100%;">\n\n', sep = "")
+  } else {
+    cat("**No dRep clustering plot found.**\n\n")
+  }
+}
+# Keep only the ranges of `ideogram` (presumably a GRanges) lying on `contigs`, then limit seqlevels and seqinfo to `contigs`.
+subset_and_update_ideogram <- function(ideogram, contigs) {
+  kept <- ideogram[seqnames(ideogram) %in% contigs]
+  seqlevels(kept) <- contigs
+  seqinfo(kept) <- seqinfo(kept)[contigs]
+  kept
+}
+# Render the report section of every sample listed in combined_unique.
+# test_mode: when TRUE only one sample is processed (the 6th, or the last one
+#   when fewer than six exist) to keep test renders short.
+# Reads the chunk-level objects combined_unique, host_genomes_paths, genome_data.
+render_all_samples <- function(test_mode = FALSE) {
+  n_samples <- nrow(combined_unique)
+  if (n_samples == 0) {
+    cat("No samples can be further analysed.\n\n")
+    return(invisible(NULL))
+  }
+  cat("**Select sample to show:** \n\n\n")
+  # Clamp the historical test index 6 so it never selects a missing (NA) sample.
+  sample_rows <- if (test_mode) min(6L, n_samples) else seq_len(n_samples)
+  for (i in sample_rows) {
+    process_sample(combined_unique$Sample[i], combined_unique, host_genomes_paths, genome_data)
+  }
+  invisible(NULL)
+}
+
+# Execute the main function
+# Test mode processes one sample only; FALSE is spelled out because `F` can be reassigned
+render_all_samples(test_mode = FALSE)
+```
+
+# Citation
+
+Cite this work: XXXXX
+
+
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_000913.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_000913.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
+NC_000913.fasta NC_000913.3|provirus_2461306_2476510 6550 6912 + gtrA 1-363/363 =============== 0/0 100.00 88.70 vfdb NP_706257 (gtrA) bactoprenol-linked glucose translocase/flippase [LPS (VF0124)] [Shigella flexneri 2a str. 301]
+NC_000913.fasta NC_000913.3|provirus_2461306_2476510 6909 7813 + gtrB 1-905/930 =============== 0/0 97.31 80.66 vfdb NP_706258 (gtrB) bactoprenol glucosyl transferase [LPS (VF0124)] [Shigella flexneri 2a str. 301]
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_002737.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_002737.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,8 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
+NC_002737.fasta NC_002737.2|provirus_1186916_1222544 2808 3614 + mf3 1-807/807 =============== 0/0 100.00 100.00 vfdb NP_269520 (mf3) deoxyribonuclease [DNase (VF0252)] [Streptococcus pyogenes M1 GAS]
+NC_002737.fasta NC_002737.2|provirus_1186916_1222544 9081 10193 - hylP 1-1113/1113 =============== 0/0 100.00 100.00 vfdb NP_269528 (hylP) hyaluronidase phage associated [Hyaluronidase (VF0246)] [Streptococcus pyogenes M1 GAS]
+NC_002737.fasta NC_002737.2|provirus_529627_569283 33078 34091 + hylP 1-1014/1014 =============== 0/0 100.00 100.00 vfdb NP_268936 (hylP) hyaluronidase phage associated [Hyaluronidase (VF0246)] [Streptococcus pyogenes M1 GAS]
+NC_002737.fasta NC_002737.2|provirus_529627_569283 38950 39657 - spec 1-708/708 =============== 0/0 100.00 100.00 vfdb NP_268943 (spec) streptococcal exotoxin C precursor phage associated [Spes (VF0248)] [Streptococcus pyogenes M1 GAS]
+NC_002737.fasta NC_002737.2|provirus_777501_820593 35641 36759 + hylP 1-1119/1119 =============== 0/0 100.00 100.00 vfdb NP_269179 (hylP) hyaluronidase phage associated [Hyaluronidase (VF0246)] [Streptococcus pyogenes M1 GAS]
+NC_002737.fasta NC_002737.2|provirus_777501_820593 41680 42357 + spei 1-678/678 =============== 0/0 100.00 99.85 vfdb NP_269185 (spei) streptococcal exotoxin I precursor [Spes (VF0248)] [Streptococcus pyogenes M1 GAS]
+NC_002737.fasta NC_002737.2|provirus_777501_820593 42383 43093 + speh 1-711/711 =============== 0/0 100.00 100.00 vfdb NP_269186 (speh) streptococcal exotoxin H precursor [Spes (VF0248)] [Streptococcus pyogenes M1 GAS]
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_008261.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_008261.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_009012.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_009012.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_014168.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_014168.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_014212.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_014212.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_014364.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_014364.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_015761.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_015761.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
+NC_015761.fasta NC_015761.1|provirus_1007223_1045009 24347 26694 - sopA 1-2348/2349 =============== 0/0 99.96 89.91 vfdb NP_461011 (sopA) type III secretion system effector SopA E3 ubiquitin ligase [TTSS(SPI-1 encode) (VF0116)] [Salmonella enterica subsp. enterica serovar Typhimurium str. LT2]
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_017033.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_017033.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_018068.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_018068.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_018515.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_018515.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_019936.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_019936.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/abricate_results/NC_021184.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_021184.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE SEQUENCE START END STRAND GENE COVERAGE COVERAGE_MAP GAPS %COVERAGE %IDENTITY DATABASE ACCESSION PRODUCT RESISTANCE
diff -r 000000000000 -r 315c2ed31af1 test-data/checkm2.Quality_report.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkm2.Quality_report.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,23 @@
+Name Completeness Contamination Completeness_Model_Used Translation_Table_Used Coding_Density Contig_N50 Average_Gene_Length Genome_Size GC_Content Total_Coding_Sequences Total_Contigs Max_Contig_Length Additional_Notes
+NC_000913.fasta 100.0 0.13 Neural Network (Specific Model) 11 0.876 4641652 314.20629775410976 4641652 0.51 4319 1 4641652 None
+NC_002737.fasta 99.99 0.48 Neural Network (Specific Model) 11 0.856 1852433 298.1390765765766 1852433 0.39 1776 1 1852433 None
+NC_003450.fasta 100.0 0.29 Neural Network (Specific Model) 11 0.872 3309401 313.8808205796158 3309401 0.54 3071 1 3309401 None
+NC_008261.fasta 100.0 0.14 Neural Network (Specific Model) 11 0.837 3256683 316.0170197985412 3256683 0.28 2879 1 3256683 None
+NC_009012.fasta 100.0 1.09 Neural Network (Specific Model) 11 0.849 3843301 320.7092407298411 3843301 0.39 3398 1 3843301 None
+NC_012982.fasta 100.0 0.05 Neural Network (Specific Model) 11 0.897 3455622 328.879173290938 3455622 0.45 3145 1 3455622 None
+NC_014008.fasta 100.0 0.02 Neural Network (Specific Model) 11 0.902 3750771 358.93038779402417 3750771 0.54 3146 1 3750771 None
+NC_014168.fasta 99.99 0.03 Neural Network (Specific Model) 11 0.907 3157527 311.3860162601626 3157527 0.67 3075 1 3157527 None
+NC_014211.fasta 14.07 0.01 Neural Network (Specific Model) 11 0.836 775354 308.61626248216834 775354 0.72 701 1 775354 None
+NC_014212.fasta 99.99 0.16 Neural Network (Specific Model) 11 0.904 3249394 303.41267387944356 3249394 0.62 3235 1 3249394 None
+NC_014363.fasta 99.7 0.35 Neural Network (Specific Model) 11 0.874 2051896 337.48281690140846 2051896 0.65 1775 1 2051896 None
+NC_014364.fasta 99.98 1.88 Neural Network (Specific Model) 11 0.931 4653970 337.5459421641791 4653970 0.49 4288 1 4653970 None
+NC_015761.fasta 100.0 0.14 Neural Network (Specific Model) 11 0.871 4460105 320.1726352185725 4460105 0.51 4049 1 4460105 None
+NC_017033.fasta 99.99 0.04 Neural Network (Specific Model) 11 0.872 3603458 329.2016938519448 3603458 0.63 3188 1 3603458 None
+NC_017095.fasta 99.95 2.67 Neural Network (Specific Model) 11 0.916 2166381 329.75584286424663 2166381 0.39 2011 1 2166381 None
+NC_018014.fasta 99.99 9.38 Neural Network (Specific Model) 11 0.891 5227858 357.07764759935674 5227858 0.6 4353 1 5227858 None
+NC_018068.fasta 99.99 0.42 Neural Network (Specific Model) 11 0.824 4926837 296.0867001528718 4926837 0.42 4579 1 4926837 None
+NC_018515.fasta 100.0 1.83 Neural Network (Specific Model) 11 0.834 4873567 302.3391304347826 4873567 0.42 4485 1 4873567 None
+NC_019897.fasta 99.95 0.34 Neural Network (Specific Model) 11 0.874 4206343 318.1461139896373 4206343 0.61 3860 1 4206343 None
+NC_019904.fasta 100.0 0.23 Neural Network (Specific Model) 11 0.869 5608040 351.0986827898942 5608040 0.45 4631 1 5608040 None
+NC_019936.fasta 100.0 0.13 Neural Network (Specific Model) 11 0.896 4575057 320.7199437543942 4575057 0.63 4267 1 4575057 None
+NC_021184.fasta 100.0 3.04 Neural Network (Specific Model) 11 0.823 4855529 289.67620906527867 4855529 0.45 4611 1 4855529 None
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_000913.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_000913.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_000913.3|provirus_563848_584430 20583 Yes 9846 32 13 6 Low-quality Genome-fragment 16.3 HMM-based (lower-bound) 52.16 1.0 low-confidence Provirus
+NC_000913.3|provirus_1196867_1213107 16241 No NA 24 9 2 Low-quality Genome-fragment 42.32 AAI-based (high-confidence) 0.0 1.0
+NC_000913.3|provirus_1412000_1434224 22225 No NA 27 13 1 Low-quality Genome-fragment 34.35 HMM-based (lower-bound) 0.0 1.0
+NC_000913.3|provirus_1627517_1653915 26399 Yes 17700 41 10 9 Low-quality Genome-fragment 36.3 AAI-based (high-confidence) 32.95 1.0 low-confidence Provirus
+NC_000913.3|provirus_2461306_2476510 15205 No NA 20 12 1 Low-quality Genome-fragment 30.84 AAI-based (high-confidence) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_002737.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_002737.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_002737.2|provirus_529627_569283 39657 No NA 46 41 0 High-quality High-quality 96.74 AAI-based (high-confidence) 0.0 1.0
+NC_002737.2|provirus_777501_820593 43093 No NA 65 42 1 High-quality High-quality 96.04 AAI-based (high-confidence) 0.0 1.0
+NC_002737.2|provirus_1186916_1222544 35629 No NA 52 39 1 High-quality High-quality 100.0 AAI-based (high-confidence) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_003450.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_008261.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_008261.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_008261.1|provirus_1070550_1127691 57142 Yes 43960 68 25 10 High-quality High-quality 100.0 AAI-based (high-confidence) 23.07 1.0
+NC_008261.1|provirus_1784095_1821197 37103 No NA 44 21 1 Medium-quality Genome-fragment 63.2 HMM-based (lower-bound) 0.0 1.01
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_009012.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_009012.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_009012.1|provirus_1938476_1983993 45518 No NA 52 23 2 Medium-quality Genome-fragment 68.64 AAI-based (high-confidence) 0.0 1.0
+NC_009012.1|provirus_2022140_2067593 45454 No NA 54 21 0 Medium-quality Genome-fragment 87.05 AAI-based (high-confidence) 0.0 1.0
+NC_009012.1|provirus_2931283_2970170 38888 No NA 62 28 3 Medium-quality Genome-fragment 83.53 AAI-based (medium-confidence) 0.0 1.01
+NC_009012.1|provirus_3339258_3389049 49792 No NA 53 6 2 Medium-quality Genome-fragment 74.06 HMM-based (lower-bound) 0.0 1.51 high kmer_freq may indicate large duplication
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_012982.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_014008.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_014168.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_014168.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_014168.1|provirus_27479_67296 39818 No NA 60 29 0 Medium-quality Genome-fragment 88.69 AAI-based (high-confidence) 0.0 1.0
+NC_014168.1|provirus_1141631_1162952 21322 No NA 36 19 0 Medium-quality Genome-fragment 51.44 AAI-based (medium-confidence) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_014211.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_014212.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_014212.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_014212.1|provirus_1170297_1209132 38836 No NA 48 10 1 Medium-quality Genome-fragment 62.91 AAI-based (medium-confidence) 0.0 1.0
+NC_014212.1|provirus_1746722_1764354 17633 No NA 38 3 0 Medium-quality Genome-fragment 89.95 AAI-based (medium-confidence) 0.0 1.01
+NC_014212.1|provirus_1893193_1914973 21781 No NA 32 6 0 Medium-quality Genome-fragment 65.66 AAI-based (medium-confidence) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_014363.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_014364.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_014364.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_014364.1|provirus_2121424_2157334 35911 Yes 29611 44 12 3 Medium-quality Genome-fragment 63.36 AAI-based (medium-confidence) 17.54 1.0
+NC_014364.1|provirus_2329685_2350621 20937 No NA 29 6 1 Low-quality Genome-fragment 22.17 HMM-based (lower-bound) 0.0 1.01
+NC_014364.1|provirus_2666253_2703772 37520 No NA 56 15 0 Medium-quality Genome-fragment 73.62 AAI-based (high-confidence) 0.0 1.0
+NC_014364.1|provirus_2976748_3014759 38012 No NA 44 12 0 Medium-quality Genome-fragment 69.42 HMM-based (lower-bound) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_015761.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_015761.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_015761.1|provirus_847397_862760 15364 No NA 19 11 1 Low-quality Genome-fragment 44.56 AAI-based (high-confidence) 0.0 1.0
+NC_015761.1|provirus_1007223_1045009 37787 No NA 52 17 0 Medium-quality Genome-fragment 54.82 HMM-based (lower-bound) 0.0 1.03
+NC_015761.1|provirus_3084741_3115735 30995 No NA 41 32 0 High-quality High-quality 97.62 AAI-based (high-confidence) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_017033.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_017033.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_017033.1|provirus_1052334_1094910 42577 No NA 66 28 3 High-quality High-quality 100.0 AAI-based (medium-confidence) 0.0 1.0
+NC_017033.1|provirus_1557694_1600481 42788 No NA 71 28 0 Medium-quality Genome-fragment 89.2 AAI-based (medium-confidence) 0.0 1.01
+NC_017033.1|provirus_2089294_2107522 18229 No NA 25 3 0 Low-quality Genome-fragment 29.18 HMM-based (lower-bound) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_017095.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_018014.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_018068.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_018068.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_018068.1|provirus_1361108_1399802 38695 No NA 52 24 0 Medium-quality Genome-fragment 85.96 AAI-based (high-confidence) 0.0 1.0
+NC_018068.1|provirus_2072558_2098541 25984 No NA 36 4 1 High-quality High-quality 100.0 AAI-based (medium-confidence) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_018515.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_018515.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_018515.1|provirus_3418112_3436097 17986 No NA 25 18 2 Low-quality Genome-fragment 37.3 AAI-based (medium-confidence) 0.0 1.0
+NC_018515.1|provirus_4659544_4694673 35130 No NA 49 20 0 Medium-quality Genome-fragment 66.0 HMM-based (lower-bound) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_019897.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_019904.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_019936.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_019936.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_019936.1|provirus_2347508_2361929 14422 No NA 24 2 0 High-quality High-quality 100.0 AAI-based (high-confidence) 0.0 1.93 high kmer_freq may indicate large duplication; contig >1.5x longer than expected genome length
+NC_019936.1|provirus_3233292_3242961 9670 No NA 14 2 0 High-quality High-quality 100.0 AAI-based (high-confidence) 0.0 1.0
+NC_019936.1|provirus_4295725_4304306 8582 No NA 13 2 0 High-quality High-quality 100.0 AAI-based (medium-confidence) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/checkv_quality_summary/NC_021184.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_021184.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id contig_length provirus proviral_length gene_count viral_genes host_genes checkv_quality miuvig_quality completeness completeness_method contamination kmer_freq warnings
+NC_021184.1|provirus_19778_35564 15787 No NA 22 5 1 Low-quality Genome-fragment 40.5 AAI-based (medium-confidence) 0.0 1.0
+NC_021184.1|provirus_4466413_4519129 52717 No NA 62 22 3 High-quality High-quality 100.0 AAI-based (medium-confidence) 0.0 1.0
+NC_021184.1|provirus_4563831_4615358 51528 No NA 59 23 4 High-quality High-quality 100.0 AAI-based (high-confidence) 0.0 1.0
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_000913.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_000913.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,10 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_000913.3_Lit_3 Lit Lit Defense NC_000913.3_1111 NC_000913.3_1111 NC_000913.3_1111 1 Lit__Lit
+NC_000913.3_RM_Type_IV_9 RM RM_Type_IV Defense NC_000913.3_1130 NC_000913.3_1130 NC_000913.3_1130 1 RM_Type_IV__Type_IV_05
+NC_000913.3_Hachiman_1 Hachiman Hachiman Defense NC_000913.3_2589 NC_000913.3_2590 NC_000913.3_2589,NC_000913.3_2590 2 Hachiman__HamA_2,Hachiman__HamB
+NC_000913.3_RnlAB_6 RnlAB RnlAB Defense NC_000913.3_2591 NC_000913.3_2592 NC_000913.3_2591,NC_000913.3_2592 2 RnlAB__RnlA,RnlAB__RnlB
+NC_000913.3_CAS_Class1-Subtype-I-E_11 Cas CAS_Class1-Subtype-I-E Defense NC_000913.3_2706 NC_000913.3_2713 NC_000913.3_2706,NC_000913.3_2707,NC_000913.3_2708,NC_000913.3_2709,NC_000913.3_2710,NC_000913.3_2711,NC_000913.3_2712,NC_000913.3_2713 8 cas1_I-E_1,cas2_I-E_2,cas3_I_5,cas5_I-E_3,cas6e_I_II_III_IV_V_VI_1,cas7_I-E_2,cas8e_I-E_1,cse2gr11_I-E_1
+NC_000913.3_MazEF_4 MazEF MazEF Defense NC_000913.3_2734 NC_000913.3_2735 NC_000913.3_2734,NC_000913.3_2735 2 MazEF__MazE,MazEF__MazF
+NC_000913.3_MazEF_5 MazEF MazEF Defense NC_000913.3_4140 NC_000913.3_4141 NC_000913.3_4140,NC_000913.3_4141 2 MazEF__MazE,MazEF__MazF
+NC_000913.3_RM_Type_IV_10 RM RM_Type_IV Defense NC_000913.3_4262 NC_000913.3_4263 NC_000913.3_4262,NC_000913.3_4263 2 RM_Type_IV__FAM_1,RM_Type_IV__FAM_2
+NC_000913.3_RM_Type_I_8 RM RM_Type_I Defense NC_000913.3_4265 NC_000913.3_4267 NC_000913.3_4265,NC_000913.3_4266,NC_000913.3_4267 3 RM__Type_I_MTases_FAM_2,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_52
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_002737.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_002737.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_002737.2_AbiAlpha_1 AbiAlpha AbiAlpha Defense NC_002737.2_745 NC_002737.2_745 NC_002737.2_745 1 AbiAlpha__AbiAlpha
+NC_002737.2_VP1853_2 VP1853 VP1853 Defense NC_002737.2_750 NC_002737.2_750 NC_002737.2_750 1 VP1853__VP1853
+NC_002737.2_CAS_Class2-Subtype-II-A_7 Cas CAS_Class2-Subtype-II-A Defense NC_002737.2_832 NC_002737.2_835 NC_002737.2_832,NC_002737.2_833,NC_002737.2_834,NC_002737.2_835 4 cas1_I_II_III_IV_V_VI_5,cas2_I_II_III_IV_V_VI_6,cas9_II-A_II-B_II-C_3,csn2_II-A_4
+NC_002737.2_CAS_Class1-Subtype-I-C_5 Cas CAS_Class1-Subtype-I-C Defense NC_002737.2_1263 NC_002737.2_1269 NC_002737.2_1263,NC_002737.2_1264,NC_002737.2_1265,NC_002737.2_1266,NC_002737.2_1267,NC_002737.2_1268,NC_002737.2_1269 7 cas1_I_II_III_IV_V_VI_6,cas2_I_II_III_IV_V_VI_5,cas3_I_5,cas4_I_II_III_IV_V_VI_4,cas5_I-C_11,cas7_I-C_13,cas8c_I-C_1
+NC_002737.2_RM_Type_I_4 RM RM_Type_I Defense NC_002737.2_1533 NC_002737.2_1535 NC_002737.2_1533,NC_002737.2_1534,NC_002737.2_1535 3 RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_51
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_003450.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_003450.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_003450.3_RM_Type_IIG_2_7 RM RM_Type_IIG_2 Defense NC_003450.3_730 NC_003450.3_730 NC_003450.3_730 1 RM_Type_IIG__Type_IIG_FAM_0.einsi_trimmed
+NC_003450.3_Uzume_1 Uzume Uzume Defense NC_003450.3_1364 NC_003450.3_1364 NC_003450.3_1364 1 Uzume__UzuA
+NC_003450.3_RM_Type_II_4 RM RM_Type_II Defense NC_003450.3_1762 NC_003450.3_1764 NC_003450.3_1762,NC_003450.3_1763,NC_003450.3_1764 3 RM_Type_II__Type_II_MTases_FAM_0,RM_Type_II__Type_II_REase29,RM_Type_II__Type_II_REase38
+NC_003450.3_Wadjet_I_3 Wadjet Wadjet_I Defense NC_003450.3_2782 NC_003450.3_2785 NC_003450.3_2782,NC_003450.3_2783,NC_003450.3_2784,NC_003450.3_2785 4 Wadjet__JetA_I,Wadjet__JetB_I,Wadjet__JetC_I,Wadjet__JetD_I
+NC_003450.3_RM_Type_IIG_6 RM RM_Type_IIG Defense NC_003450.3_3041 NC_003450.3_3041 NC_003450.3_3041 1 RM_Type_IIG__Type_IIG_FAM_2.einsi_trimmed
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_008261.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_008261.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,8 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_008261.1_RM_Type_II_5 RM RM_Type_II Defense NC_008261.1_127 NC_008261.1_128 NC_008261.1_127,NC_008261.1_128 2 RM_Type_II__Type_II_MTases_FAM_0,RM_Type_II__Type_II_REase18
+NC_008261.1_RM_Type_III_7 RM RM_Type_III Defense NC_008261.1_340 NC_008261.1_341 NC_008261.1_340,NC_008261.1_341 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_008261.1_RM_Type_IV_8 RM RM_Type_IV Defense NC_008261.1_962 NC_008261.1_963 NC_008261.1_962,NC_008261.1_963 2 RM_Type_IV__FAM_1,RM_Type_IV__FAM_2
+NC_008261.1_DRT_2_1 DRT DRT_2 Defense NC_008261.1_983 NC_008261.1_983 NC_008261.1_983 1 DRT2__DRT2
+NC_008261.1_RM_Type_II_6 RM RM_Type_II Defense NC_008261.1_985 NC_008261.1_987 NC_008261.1_985,NC_008261.1_986,NC_008261.1_987 3 RM_Type_II__Type_II_MTases_FAM_0,RM_Type_II__Type_II_MTases_FAM_22,RM_Type_II__Type_II_REase34
+NC_008261.1_PD-Lambda-5_2 PD-Lambda-5 PD-Lambda-5 Defense NC_008261.1_1563 NC_008261.1_1564 NC_008261.1_1563,NC_008261.1_1564 2 PD-Lambda-5__PD-Lambda-5_A,PD-Lambda-5__PD-Lambda-5_B
+NC_008261.1_RM_Type_I_4 RM RM_Type_I Defense NC_008261.1_2512 NC_008261.1_2515 NC_008261.1_2512,NC_008261.1_2514,NC_008261.1_2515 3 RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_51
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_009012.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_009012.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,14 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_009012.1_RM_Type_III_8 RM RM_Type_III Defense NC_009012.1_532 NC_009012.1_533 NC_009012.1_532,NC_009012.1_533 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_009012.1_SEFIR_3 SEFIR SEFIR Defense NC_009012.1_1184 NC_009012.1_1184 NC_009012.1_1184 1 SEFIR__bSEFIR
+NC_009012.1_RloC_2 RloC RloC Defense NC_009012.1_1211 NC_009012.1_1211 NC_009012.1_1211 1 RloC__RloC
+NC_009012.1_RM_Type_II_4 RM RM_Type_II Defense NC_009012.1_1577 NC_009012.1_1579 NC_009012.1_1577,NC_009012.1_1578,NC_009012.1_1579 3 RM_Type_II__Type_II_MTases_FAM_38,RM_Type_II__Type_II_MTases_FAM_4,RM_Type_II__Type_II_REase32
+NC_009012.1_AbiU_1 AbiU AbiU Defense NC_009012.1_1698 NC_009012.1_1698 NC_009012.1_1698 1 AbiU__AbiU
+NC_009012.1_RM_Type_II_5 RM RM_Type_II Defense NC_009012.1_1826 NC_009012.1_1827 NC_009012.1_1826,NC_009012.1_1827 2 RM_Type_II__Type_II_MTases_FAM_16,RM_Type_II__Type_II_REase01
+NC_009012.1_CAS_Class1-Subtype-III-D_11 Cas CAS_Class1-Subtype-III-D Defense NC_009012.1_2140 NC_009012.1_2149 NC_009012.1_2140,NC_009012.1_2141,NC_009012.1_2142,NC_009012.1_2143,NC_009012.1_2144,NC_009012.1_2145,NC_009012.1_2146,NC_009012.1_2147,NC_009012.1_2149 9 cas10_III-D_3,csm2gr11_III-D_6,csm2gr11_III-D_7,csm3gr7_III-A_III-D_2,csm3gr7_III_1,csm3gr7_III_1,csm3gr7_III_IV,csx10gr5_III-D_2,csx1_III_9
+NC_009012.1_CAS_Class1-Subtype-I-B_9 Cas CAS_Class1-Subtype-I-B Defense NC_009012.1_2404 NC_009012.1_2411 NC_009012.1_2404,NC_009012.1_2405,NC_009012.1_2406,NC_009012.1_2407,NC_009012.1_2408,NC_009012.1_2409,NC_009012.1_2410,NC_009012.1_2411 8 cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-B_1,cas6_I_II_III_IV_V_VI_14,cas7_I-B_6,cas8b1_I-B_12
+NC_009012.1_RM_Type_II_6 RM RM_Type_II Defense NC_009012.1_2429 NC_009012.1_2430 NC_009012.1_2429,NC_009012.1_2430 2 RM_Type_II__Type_II_MTases_FAM_2,RM_Type_II__Type_II_REase30
+NC_009012.1_RM_Type_II_7 RM RM_Type_II Defense NC_009012.1_2587 NC_009012.1_2588 NC_009012.1_2587,NC_009012.1_2588 2 RM_Type_II__Type_II_MTases_FAM_4,RM_Type_II__Type_II_REase07
+NC_009012.1_CAS_Class1-Subtype-I-B_10 Cas CAS_Class1-Subtype-I-B Defense NC_009012.1_3357 NC_009012.1_3361 NC_009012.1_3357,NC_009012.1_3358,NC_009012.1_3359,NC_009012.1_3360,NC_009012.1_3361 5 cas3_I_5,cas5_I-B_17,cas6_I_II_III_IV_V_VI_12,cas7_I-B_8,cas8b1_I-B_4
+NC_009012.1_CAS_Class1-Subtype-III-D_12 Cas CAS_Class1-Subtype-III-D Defense NC_009012.1_3361 NC_009012.1_3378 NC_009012.1_3361,NC_009012.1_3365,NC_009012.1_3366,NC_009012.1_3367,NC_009012.1_3368,NC_009012.1_3369,NC_009012.1_3370,NC_009012.1_3372,NC_009012.1_3375,NC_009012.1_3376,NC_009012.1_3377,NC_009012.1_3378 12 cas10_III-D_3,cas1_I_II_III_IV_V_VI_10,cas2_I_II_III_IV_V_VI_3,cas4_I_II_III_IV_V_VI_1,cas6_I_II_III_IV_V_VI_12,csm3gr7_III-D_2,csm3gr7_III-D_3,csm3gr7_III_1,csx10gr5_III-D_3,csx19_III-D_11,csx1_III_21,csx1_III_9
+NC_009012.1_CAS_Class1-Subtype-III-D_12 Cas CAS_Class1-Subtype-III-D Defense NC_009012.1_3361 NC_009012.1_3378 NC_009012.1_3361,NC_009012.1_3365,NC_009012.1_3366,NC_009012.1_3367,NC_009012.1_3368,NC_009012.1_3369,NC_009012.1_3370,NC_009012.1_3372,NC_009012.1_3375,NC_009012.1_3376,NC_009012.1_3377,NC_009012.1_3378 12 cas10_III-D_3,cas1_I_II_III_IV_V_VI_10,cas2_I_II_III_IV_V_VI_3,cas4_I_II_III_IV_V_VI_1,cas6_I_II_III_IV_V_VI_12,csm3gr7_III-D_2,csm3gr7_III-D_3,csm3gr7_III_1,csx10gr5_III-D_3,csx19_III-D_11,csx1_III_21,csx1_III_9
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_012982.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_012982.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_012982.1_AbiC_1 AbiC AbiC Defense NC_012982.1_420 NC_012982.1_420 NC_012982.1_420 1 AbiC__AbiC
+NC_012982.1_RM_Type_IIG_5 RM RM_Type_IIG Defense NC_012982.1_623 NC_012982.1_623 NC_012982.1_623 1 RM_Type_IIG__Type_IIG_FAM_1.einsi_trimmed
+NC_012982.1_RM_Type_III_6 RM RM_Type_III Defense NC_012982.1_1629 NC_012982.1_1630 NC_012982.1_1629,NC_012982.1_1630 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_1.einsi_trimmed
+NC_012982.1_CBASS_I_3 CBASS CBASS_I Defense NC_012982.1_1825 NC_012982.1_1826 NC_012982.1_1825,NC_012982.1_1826 2 CBASS__Cyclase_II,CBASS__Phospholipase
+NC_012982.1_Rst_DUF4238_4 Rst_DUF4238 Rst_DUF4238 Defense NC_012982.1_2416 NC_012982.1_2416 NC_012982.1_2416 1 Rst_DUF4238__DUF4238_Pers
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_014008.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014008.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_014008.1_RM_Type_I_6 RM RM_Type_I Defense NC_014008.1_1177 NC_014008.1_1181 NC_014008.1_1177,NC_014008.1_1180,NC_014008.1_1181 3 RM__Type_I_MTases_FAM_3,RM__Type_I_REases_FAM_1.einsi_trimmed,RM__Type_I_S_52
+NC_014008.1_Viperin_3 Viperin Viperin Defense NC_014008.1_1182 NC_014008.1_1182 NC_014008.1_1182 1 Viperin__pVip
+NC_014008.1_dGTPase_4 dGTPase dGTPase Defense NC_014008.1_1769 NC_014008.1_1769 NC_014008.1_1769 1 dGTPase__Sp_dGTPase
+NC_014008.1_Ceres_1 Ceres Ceres Defense NC_014008.1_2641 NC_014008.1_2641 NC_014008.1_2641 1 Ceres__CrsA1
+NC_014008.1_Gao_Mza_2 Gao_Mza Gao_Mza Defense NC_014008.1_2741 NC_014008.1_2744 NC_014008.1_2741,NC_014008.1_2743,NC_014008.1_2744 3 Gao_Mza__MzaB,Gao_Mza__MzaC,Gao_Mza__MzaE
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_014168.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014168.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_014168.1_RM_Type_II_2 RM RM_Type_II Defense NC_014168.1_1355 NC_014168.1_1356 NC_014168.1_1355,NC_014168.1_1356 2 RM_Type_II__Type_II_MTases_FAM_41,RM_Type_II__Type_II_REase25
+NC_014168.1_RM_Type_IIG_3 RM RM_Type_IIG Defense NC_014168.1_1738 NC_014168.1_1738 NC_014168.1_1738 1 RM_Type_IIG__Type_IIG_FAM_2.einsi_trimmed
+NC_014168.1_DS-20_1 DS-20 DS-20 Defense NC_014168.1_2356 NC_014168.1_2356 NC_014168.1_2356 1 DS-20__DS-20
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_014211.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014211.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_014212.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014212.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_014212.1_Ceres_1 Ceres Ceres Defense NC_014212.1_142 NC_014212.1_142 NC_014212.1_142 1 Ceres__CrsA1
+NC_014212.1_RM_Type_III_2 RM RM_Type_III Defense NC_014212.1_571 NC_014212.1_572 NC_014212.1_571,NC_014212.1_572 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_014212.1_CAS_Class1-Subtype-III-A_4 Cas CAS_Class1-Subtype-III-A Defense NC_014212.1_712 NC_014212.1_723 NC_014212.1_712,NC_014212.1_713,NC_014212.1_714,NC_014212.1_715,NC_014212.1_716,NC_014212.1_719,NC_014212.1_720,NC_014212.1_721,NC_014212.1_722,NC_014212.1_723 10 cas10_III-A_1,cas1_I_II_III_IV_V_VI_1,cas2_I_II_III_IV_V_VI_8,cas6_I_II_III_IV_V_VI_22,csm2gr11_III-A_1,csm3gr7_III-A_1,csm4gr5_III-A_2,csm5gr7_III-A_2,csx1_III_21,csx1_III_21
+NC_014212.1_CAS_Class1-Subtype-I-E_3 Cas CAS_Class1-Subtype-I-E Defense NC_014212.1_1246 NC_014212.1_1255 NC_014212.1_1246,NC_014212.1_1248,NC_014212.1_1249,NC_014212.1_1251,NC_014212.1_1252,NC_014212.1_1253,NC_014212.1_1254,NC_014212.1_1255 8 cas1_I-E_1,cas2_I-E_1,cas3_I_2,cas5_I-E_2,cas6e_I_II_III_IV_V_VI_2,cas7_I-E_16,cas8e_I-E_5,cse2gr11_I-E_8
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_014363.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014363.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,7 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_014363.1_AbiE_1 AbiE AbiE Defense NC_014363.1_207 NC_014363.1_208 NC_014363.1_207,NC_014363.1_208 2 AbiEii__AbiEi_4,AbiEii__AbiEii
+NC_014363.1_AbiE_2 AbiE AbiE Defense NC_014363.1_473 NC_014363.1_474 NC_014363.1_473,NC_014363.1_474 2 AbiEii__AbiEi_4,AbiEii__AbiEii
+NC_014363.1_VP1839_3 VP1839 VP1839 Defense NC_014363.1_1184 NC_014363.1_1184 NC_014363.1_1184 1 VP1839__VP1839
+NC_014363.1_RM_Type_II_6 RM RM_Type_II Defense NC_014363.1_1186 NC_014363.1_1187 NC_014363.1_1186,NC_014363.1_1187 2 RM_Type_II__Type_II_MTases_FAM_0,RM_Type_II__Type_II_REase15
+NC_014363.1_CAS_Class2-Subtype-II-A_7 Cas CAS_Class2-Subtype-II-A Defense NC_014363.1_1233 NC_014363.1_1236 NC_014363.1_1233,NC_014363.1_1234,NC_014363.1_1235,NC_014363.1_1236 4 cas1_I_II_III_IV_V_VI_5,cas2_I_II_III_IV_V_VI_6,cas9_II-A_1,csn2_II-A_3
+NC_014363.1_RM_Type_I_5 RM RM_Type_I Defense NC_014363.1_1659 NC_014363.1_1664 NC_014363.1_1659,NC_014363.1_1662,NC_014363.1_1663,NC_014363.1_1664 4 RM__Type_I_MTases_FAM_2,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_04,RM__Type_I_S_04
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_014364.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014364.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,7 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_014364.1_TIR-IV_4 TIR-IV TIR-IV Defense NC_014364.1_392 NC_014364.1_393 NC_014364.1_392,NC_014364.1_393 2 TIR-IV__TIR-IV_A,TIR-IV__TIR-IV_B
+NC_014364.1_SoFic_3 SoFIC SoFic Defense NC_014364.1_418 NC_014364.1_418 NC_014364.1_418 1 SoFic__SoFic
+NC_014364.1_MazEF_2 MazEF MazEF Defense NC_014364.1_697 NC_014364.1_698 NC_014364.1_697,NC_014364.1_698 2 MazEF__MazE,MazEF__MazF
+NC_014364.1_CAS_Class1-Subtype-I-C_5 Cas CAS_Class1-Subtype-I-C Defense NC_014364.1_1062 NC_014364.1_1069 NC_014364.1_1062,NC_014364.1_1063,NC_014364.1_1064,NC_014364.1_1065,NC_014364.1_1066,NC_014364.1_1067,NC_014364.1_1068,NC_014364.1_1069 8 WYL_I_II_III_IV_V_VI_4,cas1_I_II_III_IV_V_VI_6,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-C_11,cas7_I-C_7,cas8c_I-C_4
+NC_014364.1_CAS_Class1-Subtype-IV-B_6 Cas CAS_Class1-Subtype-IV-B Defense NC_014364.1_2494 NC_014364.1_2499 NC_014364.1_2494,NC_014364.1_2496,NC_014364.1_2497,NC_014364.1_2498,NC_014364.1_2499 5 csf1gr8_IV-A_5,csf2gr7_IV_1,csf3gr5_IV-B_1,csf4gr11_IV-B_4,cysH_IV-B_1
+NC_014364.1_AbiE_1 AbiE AbiE Defense NC_014364.1_2619 NC_014364.1_2620 NC_014364.1_2619,NC_014364.1_2620 2 AbiEii__AbiEi_4,AbiEii__AbiEii
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_015761.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_015761.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,9 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_015761.1_PrrC_6 PrrC PrrC Defense NC_015761.1_263 NC_015761.1_265 NC_015761.1_263,NC_015761.1_264,NC_015761.1_265 3 PrrC__EcoprrI,PrrC__EcoprrI,RM__Type_I_REases_FAM_0.einsi_trimmed
+NC_015761.1_DarTG_2 DarTG DarTG Defense NC_015761.1_279 NC_015761.1_280 NC_015761.1_279,NC_015761.1_280 2 DarTG__DarG,DarTG__DarT
+NC_015761.1_RM_Type_III_7 RM RM_Type_III Defense NC_015761.1_310 NC_015761.1_311 NC_015761.1_310,NC_015761.1_311 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_015761.1_PfiAT_4 PfiAT PfiAT Defense NC_015761.1_932 NC_015761.1_933 NC_015761.1_932,NC_015761.1_933 2 PfiAT__PfiA,PfiAT__PfiT
+NC_015761.1_CAS_Class1-Subtype-I-E_8 Cas CAS_Class1-Subtype-I-E Defense NC_015761.1_2549 NC_015761.1_2556 NC_015761.1_2549,NC_015761.1_2550,NC_015761.1_2551,NC_015761.1_2552,NC_015761.1_2553,NC_015761.1_2554,NC_015761.1_2555,NC_015761.1_2556 8 cas1_I-E_1,cas2_I-E_2,cas3_I_5,cas5_I-E_3,cas6e_I_II_III_IV_V_VI_1,cas7_I-E_2,cas8e_I-E_1,cse2gr11_I-E_2
+NC_015761.1_dCTPdeaminase_5 dCTPdeaminase dCTPdeaminase Defense NC_015761.1_3620 NC_015761.1_3620 NC_015761.1_3620 1 dCTPdeaminase__dCTPdeaminase
+NC_015761.1_Mokosh_TypeII_3 Mokosh Mokosh_TypeII Defense NC_015761.1_3957 NC_015761.1_3957 NC_015761.1_3957 1 Mokosh_TypeII__MkoC
+NC_015761.1_DS-17_1 DS-17 DS-17 Defense NC_015761.1_3965 NC_015761.1_3965 NC_015761.1_3965 1 DS-17__DS-17
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_017033.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_017033.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_017033.1_PrrC_3 PrrC PrrC Defense NC_017033.1_586 NC_017033.1_589 NC_017033.1_586,NC_017033.1_587,NC_017033.1_588,NC_017033.1_589 4 PrrC__EcoprrI,PrrC__PrrC,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_02
+NC_017033.1_DS-6_1 DS-6 DS-6 Defense NC_017033.1_1067 NC_017033.1_1068 NC_017033.1_1067,NC_017033.1_1068 2 DS-6__DS-6A,DS-6__DS-6B
+NC_017033.1_Mokosh_TypeII_2 Mokosh Mokosh_TypeII Defense NC_017033.1_1863 NC_017033.1_1863 NC_017033.1_1863 1 Mokosh_TypeII__MkoC
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_017095.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_017095.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,8 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_017095.1_RM_Type_I_4 RM RM_Type_I Defense NC_017095.1_540 NC_017095.1_543 NC_017095.1_540,NC_017095.1_541,NC_017095.1_542,NC_017095.1_543 4 RM__Type_I_MTases_FAM_0,RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_51
+NC_017095.1_CAS_Class1-Subtype-III-B_7 Cas CAS_Class1-Subtype-III-B Defense NC_017095.1_1486 NC_017095.1_1502 NC_017095.1_1486,NC_017095.1_1487,NC_017095.1_1488,NC_017095.1_1489,NC_017095.1_1490,NC_017095.1_1491,NC_017095.1_1495,NC_017095.1_1497,NC_017095.1_1499,NC_017095.1_1500,NC_017095.1_1502 11 HTH_III_1,cas10_III_6,cas2_I_II_III_IV_V_VI_3,cas2_I_II_III_IV_V_VI_3,cas6_I_II_III_IV_V_VI_14,cmr1gr7_III-B_1,cmr3gr5_III-B_III-C_6,cmr4gr7_III-B_III-C_1,cmr5gr11_III-B_4,cmr6gr7_III-B_3,csx1_III_9
+NC_017095.1_CAS_Class1-Subtype-III-A_6 Cas CAS_Class1-Subtype-III-A Defense NC_017095.1_1495 NC_017095.1_1512 NC_017095.1_1495,NC_017095.1_1497,NC_017095.1_1499,NC_017095.1_1500,NC_017095.1_1502,NC_017095.1_1503,NC_017095.1_1504,NC_017095.1_1505,NC_017095.1_1506,NC_017095.1_1507,NC_017095.1_1508,NC_017095.1_1509,NC_017095.1_1512 13 HTH_III_1,cas10_III-A_1,cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas2_I_II_III_IV_V_VI_3,cas6_I_II_III_IV_V_VI_14,cas6_I_II_III_IV_V_VI_19,casR_III_1,csm2gr11_III-A_15,csm3gr7_III-A_1,csm4gr5_III-A_1,csm5gr7_III-A_2,csx1_III_9
+NC_017095.1_CAS_Class1-Subtype-III-A_6 Cas CAS_Class1-Subtype-III-A Defense NC_017095.1_1495 NC_017095.1_1512 NC_017095.1_1495,NC_017095.1_1497,NC_017095.1_1499,NC_017095.1_1500,NC_017095.1_1502,NC_017095.1_1503,NC_017095.1_1504,NC_017095.1_1505,NC_017095.1_1506,NC_017095.1_1507,NC_017095.1_1508,NC_017095.1_1509,NC_017095.1_1512 13 HTH_III_1,cas10_III-A_1,cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas2_I_II_III_IV_V_VI_3,cas6_I_II_III_IV_V_VI_14,cas6_I_II_III_IV_V_VI_19,casR_III_1,csm2gr11_III-A_15,csm3gr7_III-A_1,csm4gr5_III-A_1,csm5gr7_III-A_2,csx1_III_9
+NC_017095.1_Esos_1 Esos Esos Defense NC_017095.1_1541 NC_017095.1_1541 NC_017095.1_1541 1 Esos__VCA0450
+NC_017095.1_VP1840_2 VP1840 VP1840 Defense NC_017095.1_1651 NC_017095.1_1651 NC_017095.1_1651 1 VP1840__VP1840
+NC_017095.1_RM_Type_II_5 RM RM_Type_II Defense NC_017095.1_1662 NC_017095.1_1664 NC_017095.1_1662,NC_017095.1_1663,NC_017095.1_1664 3 RM_Type_II__Type_II_MTases_FAM_38,RM_Type_II__Type_II_MTases_FAM_4,RM_Type_II__Type_II_REase32
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_018014.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_018014.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_018014.1_DS-6_5 DS-6 DS-6 Defense NC_018014.1_132 NC_018014.1_133 NC_018014.1_132,NC_018014.1_133 2 DS-6__DS-6A,DS-6__DS-6B
+NC_018014.1_Pycsar_6 Pycsar Pycsar Defense NC_018014.1_571 NC_018014.1_573 NC_018014.1_571,NC_018014.1_572,NC_018014.1_573 3 CBASS__2TM_5,Pycsar__AG_cyclase,Pycsar__AG_cyclase
+NC_018014.1_DISARM_1_4 DISARM DISARM_1 Defense NC_018014.1_3050 NC_018014.1_3053 NC_018014.1_3050,NC_018014.1_3051,NC_018014.1_3052,NC_018014.1_3053 4 DISARM_1__drmMI,DISARM__drmA,DISARM__drmB,DISARM__drmC
+NC_018014.1_CBASS_III_3 CBASS CBASS_III Defense NC_018014.1_3068 NC_018014.1_3071 NC_018014.1_3068,NC_018014.1_3069,NC_018014.1_3070,NC_018014.1_3071 4 CBASS__Cyclase_II,CBASS__Endonuc_big,CBASS__TRIP13,CBASS__bacHORMA_1
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_018068.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_018068.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,13 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_018068.1_Hachiman_2 Hachiman Hachiman Defense NC_018068.1_1171 NC_018068.1_1172 NC_018068.1_1171,NC_018068.1_1172 2 Hachiman__HamA_1,Hachiman__HamB
+NC_018068.1_RM_Type_I_10 RM RM_Type_I Defense NC_018068.1_1178 NC_018068.1_1180 NC_018068.1_1178,NC_018068.1_1179,NC_018068.1_1180 3 RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_03
+NC_018068.1_RM_Type_IV_14 RM RM_Type_IV Defense NC_018068.1_1186 NC_018068.1_1186 NC_018068.1_1186 1 RM_Type_IV__Type_IV_03
+NC_018068.1_RM_Type_II_11 RM RM_Type_II Defense NC_018068.1_1192 NC_018068.1_1193 NC_018068.1_1192,NC_018068.1_1193 2 RM_Type_II__Type_II_MTases_FAM_7,RM_Type_II__Type_II_REase10
+NC_018068.1_CAS_Class1-Subtype-I-C_15 Cas CAS_Class1-Subtype-I-C Defense NC_018068.1_1411 NC_018068.1_1418 NC_018068.1_1411,NC_018068.1_1412,NC_018068.1_1413,NC_018068.1_1414,NC_018068.1_1415,NC_018068.1_1417,NC_018068.1_1418 7 cas1_I_II_III_IV_V_VI_6,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-C_11,cas7_I-C_13,cas8c_I-C_4
+NC_018068.1_RM_Type_III_13 RM RM_Type_III Defense NC_018068.1_1541 NC_018068.1_1542 NC_018068.1_1541,NC_018068.1_1542 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_018068.1_Ceres_1 Ceres Ceres Defense NC_018068.1_3152 NC_018068.1_3152 NC_018068.1_3152 1 Ceres__CrsA1
+NC_018068.1_MazEF_6 MazEF MazEF Defense NC_018068.1_3456 NC_018068.1_3457 NC_018068.1_3456,NC_018068.1_3457 2 MazEF__MazE,MazEF__MazF
+NC_018068.1_Rst_HelicaseDUF2290_7 Rst_HelicaseDUF2290 Rst_HelicaseDUF2290 Defense NC_018068.1_3757 NC_018068.1_3758 NC_018068.1_3757,NC_018068.1_3758 2 Rst_HelicaseDUF2290__DUF2290,Rst_HelicaseDUF2290__Helicase
+NC_018068.1_Hachiman_3 Hachiman Hachiman Defense NC_018068.1_3759 NC_018068.1_3760 NC_018068.1_3759,NC_018068.1_3760 2 Hachiman__HamA_1,Hachiman__HamB
+NC_018068.1_Septu_8 Septu Septu Defense NC_018068.1_4412 NC_018068.1_4413 NC_018068.1_4412,NC_018068.1_4413 2 Septu__PtuA,Septu__PtuB
+NC_018068.1_RM_Type_II_12 RM RM_Type_II Defense NC_018068.1_4429 NC_018068.1_4430 NC_018068.1_4429,NC_018068.1_4430 2 RM_Type_II__Type_II_MTases_FAM_25,RM_Type_II__Type_II_REase09
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_018515.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_018515.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,10 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_018515.1_AbiAlpha_1 AbiAlpha AbiAlpha Defense NC_018515.1_121 NC_018515.1_121 NC_018515.1_121 1 AbiAlpha__AbiAlpha
+NC_018515.1_VP1839_11 VP1839 VP1839 Defense NC_018515.1_122 NC_018515.1_122 NC_018515.1_122 1 VP1839__VP1839
+NC_018515.1_CBASS_IV_7 CBASS CBASS_IV Defense NC_018515.1_324 NC_018515.1_328 NC_018515.1_324,NC_018515.1_325,NC_018515.1_326,NC_018515.1_327,NC_018515.1_328 5 CBASS__2TM_type_IV,CBASS__Cyclase_SMODS,CBASS__OGG,CBASS__QueC,CBASS__TGT
+NC_018515.1_BREX_I_4 BREX BREX_I Defense NC_018515.1_329 NC_018515.1_335 NC_018515.1_329,NC_018515.1_330,NC_018515.1_331,NC_018515.1_332,NC_018515.1_334,NC_018515.1_335 6 BREX__brxA_DUF1819,BREX__brxB_DUF1788,BREX__brxC,BREX__brxL,BREX__pglX1,BREX__pglZA
+NC_018515.1_Prometheus_9 Prometheus Prometheus Defense NC_018515.1_337 NC_018515.1_337 NC_018515.1_337 1 Prometheus__ProA
+NC_018515.1_Azaca_2 Azaca Azaca Defense NC_018515.1_349 NC_018515.1_351 NC_018515.1_349,NC_018515.1_350,NC_018515.1_351 3 Azaca__ZacA,Azaca__ZacB,Azaca__ZacC
+NC_018515.1_Wadjet_III_13 Wadjet Wadjet_III Defense NC_018515.1_1811 NC_018515.1_1814 NC_018515.1_1811,NC_018515.1_1812,NC_018515.1_1813,NC_018515.1_1814 4 Wadjet__JetA_III,Wadjet__JetB_III,Wadjet__JetC_III,Wadjet__JetD_III
+NC_018515.1_SpbK_10 SpbK SpbK Defense NC_018515.1_2272 NC_018515.1_2272 NC_018515.1_2272 1 SpbK__SpbK
+NC_018515.1_Kiwa_8 Kiwa Kiwa Defense NC_018515.1_3261 NC_018515.1_3262 NC_018515.1_3261,NC_018515.1_3262 2 Kiwa__KwaA,Kiwa__KwaB_2
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_019897.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_019897.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,13 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_019897.1_RM_Type_III_11 RM RM_Type_III Defense NC_019897.1_86 NC_019897.1_87 NC_019897.1_86,NC_019897.1_87 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_019897.1_MazEF_3 MazEF MazEF Defense NC_019897.1_128 NC_019897.1_129 NC_019897.1_128,NC_019897.1_129 2 MazEF__MazE,MazEF__MazF
+NC_019897.1_RM_Type_II_9 RM RM_Type_II Defense NC_019897.1_789 NC_019897.1_790 NC_019897.1_789,NC_019897.1_790 2 RM_Type_II__Type_II_MTases_FAM_2,RM_Type_II__Type_II_REase27
+NC_019897.1_Mokosh_TypeII_4 Mokosh Mokosh_TypeII Defense NC_019897.1_913 NC_019897.1_913 NC_019897.1_913 1 Mokosh_TypeII__MkoC
+NC_019897.1_Druantia_I_2 Druantia Druantia_I Defense NC_019897.1_2741 NC_019897.1_2744 NC_019897.1_2741,NC_019897.1_2742,NC_019897.1_2743,NC_019897.1_2744 4 Druantia_I__DruB,Druantia_I__DruC,Druantia_I__DruD,Druantia__DruE_1
+NC_019897.1_CAS_Class1-Subtype-III-D_14 Cas CAS_Class1-Subtype-III-D Defense NC_019897.1_3030 NC_019897.1_3035 NC_019897.1_3030,NC_019897.1_3031,NC_019897.1_3032,NC_019897.1_3033,NC_019897.1_3034,NC_019897.1_3035 6 cas10_III-D_3,csm3gr7_III-D_2,csm3gr7_III-D_3,csm3gr7_III_1,csx19_III-D_17,csx1_III_11
+NC_019897.1_CAS_Class1-Subtype-I-B_12 Cas CAS_Class1-Subtype-I-B Defense NC_019897.1_3046 NC_019897.1_3053 NC_019897.1_3046,NC_019897.1_3047,NC_019897.1_3048,NC_019897.1_3049,NC_019897.1_3050,NC_019897.1_3051,NC_019897.1_3052,NC_019897.1_3053 8 cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas3_I_2,cas4_I_II_III_IV_V_VI_6,cas5_I-B_17,cas6_I_II_III_IV_V_VI_20,cas7b_I-B_I-C_2,cas8b1_I-B_8
+NC_019897.1_CAS_Class1-Subtype-I-C_13 Cas CAS_Class1-Subtype-I-C Defense NC_019897.1_3155 NC_019897.1_3158 NC_019897.1_3155,NC_019897.1_3156,NC_019897.1_3157,NC_019897.1_3158 4 cas3_I_5,cas5_I-C_5,cas7_I-C_7,cas8c_I-C_4
+NC_019897.1_Wadjet_II_6 Wadjet Wadjet_II Defense NC_019897.1_3286 NC_019897.1_3289 NC_019897.1_3286,NC_019897.1_3287,NC_019897.1_3288,NC_019897.1_3289 4 Wadjet__JetA_II,Wadjet__JetB_II,Wadjet__JetC_II,Wadjet__JetD_II
+NC_019897.1_RM_Type_I_8 RM RM_Type_I Defense NC_019897.1_3326 NC_019897.1_3328 NC_019897.1_3326,NC_019897.1_3327,NC_019897.1_3328 3 RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_51
+NC_019897.1_RM_Type_II_10 RM RM_Type_II Defense NC_019897.1_3527 NC_019897.1_3528 NC_019897.1_3527,NC_019897.1_3528 2 RM_Type_II__Type_II_MTases_FAM_16,RM_Type_II__Type_II_REase01
+NC_019897.1_Ceres_1 Ceres Ceres Defense NC_019897.1_3704 NC_019897.1_3704 NC_019897.1_3704 1 Ceres__CrsA1
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_019904.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_019904.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,18 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_019904.1_HEC-05_12 HEC-05 HEC-05 Defense NC_019904.1_318 NC_019904.1_318 NC_019904.1_318 1 HEC-05__HEC-05
+NC_019904.1_RM_Type_I_19 RM RM_Type_I Defense NC_019904.1_371 NC_019904.1_374 NC_019904.1_371,NC_019904.1_372,NC_019904.1_374 3 RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_01
+NC_019904.1_dCTPdeaminase_15 dCTPdeaminase dCTPdeaminase Defense NC_019904.1_408 NC_019904.1_408 NC_019904.1_408 1 dCTPdeaminase__dCTPdeaminase
+NC_019904.1_RM_Type_I_20 RM RM_Type_I Defense NC_019904.1_411 NC_019904.1_413 NC_019904.1_411,NC_019904.1_412,NC_019904.1_413 3 RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_03
+NC_019904.1_Gabija_8 Gabija Gabija Defense NC_019904.1_430 NC_019904.1_431 NC_019904.1_430,NC_019904.1_431 2 Gabija__GajA,Gabija__GajB_2
+NC_019904.1_Gao_Qat_11 Gao_Qat Gao_Qat Defense NC_019904.1_1323 NC_019904.1_1326 NC_019904.1_1323,NC_019904.1_1324,NC_019904.1_1325,NC_019904.1_1326 4 Gao_Qat__QatA,Gao_Qat__QatB,Gao_Qat__QatC,Gao_Qat__QatD
+NC_019904.1_SoFic_14 SoFIC SoFic Defense NC_019904.1_1676 NC_019904.1_1676 NC_019904.1_1676 1 SoFic__SoFic
+NC_019904.1_Gabija_9 Gabija Gabija Defense NC_019904.1_1900 NC_019904.1_1901 NC_019904.1_1900,NC_019904.1_1901 2 Gabija__GajA,Gabija__GajB_3
+NC_019904.1_RM_Type_II_22 RM RM_Type_II Defense NC_019904.1_1947 NC_019904.1_1949 NC_019904.1_1947,NC_019904.1_1948,NC_019904.1_1949 3 RM_Type_II__Type_II_MTases_FAM_2,RM_Type_II__Type_II_REase06,RM_Type_II__Type_II_REase38
+NC_019904.1_Sirona_13 Sirona Sirona Defense NC_019904.1_1950 NC_019904.1_1950 NC_019904.1_1950 1 Sirona__VCA0356
+NC_019904.1_CBASS_II_5 CBASS CBASS_II Defense NC_019904.1_3143 NC_019904.1_3145 NC_019904.1_3143,NC_019904.1_3144,NC_019904.1_3145 3 CBASS__Cyclase_II,CBASS__E2,CBASS__Effector_2TM_Sa_NUDIX
+NC_019904.1_AbiE_2 AbiE AbiE Defense NC_019904.1_3195 NC_019904.1_3196 NC_019904.1_3195,NC_019904.1_3196 2 AbiEii__AbiEi_3,AbiEii__AbiEii
+NC_019904.1_RM_Type_I_21 RM RM_Type_I Defense NC_019904.1_4383 NC_019904.1_4389 NC_019904.1_4383,NC_019904.1_4387,NC_019904.1_4388,NC_019904.1_4389 4 RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_01,RM__Type_I_S_51
+NC_019904.1_AbiD_1 AbiD AbiD Defense NC_019904.1_4385 NC_019904.1_4385 NC_019904.1_4385 1 AbiD__AbiD
+NC_019904.1_Cernunnos_7 Cernunnos Cernunnos Defense NC_019904.1_4390 NC_019904.1_4390 NC_019904.1_4390 1 Cernunnos__VCA0410
+NC_019904.1_Gabija_10 Gabija Gabija Defense NC_019904.1_4391 NC_019904.1_4392 NC_019904.1_4391,NC_019904.1_4392 2 Gabija__GajA,Gabija__GajB_1
+NC_019904.1_Ceres_6 Ceres Ceres Defense NC_019904.1_4414 NC_019904.1_4414 NC_019904.1_4414 1 Ceres__CrsA1
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_019936.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_019936.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,11 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_019936.1_Gabija_5 Gabija Gabija Defense NC_019936.1_617 NC_019936.1_618 NC_019936.1_617,NC_019936.1_618 2 Gabija__GajA,Gabija__GajB_3
+NC_019936.1_RM_Type_I_12 RM RM_Type_I Defense NC_019936.1_860 NC_019936.1_862 NC_019936.1_860,NC_019936.1_861,NC_019936.1_862 3 RM__Type_I_MTases_FAM_3,RM__Type_I_REases_FAM_1.einsi_trimmed,RM__Type_I_S_52
+NC_019936.1_Shango_6 Shango Shango Defense NC_019936.1_896 NC_019936.1_898 NC_019936.1_896,NC_019936.1_897,NC_019936.1_898 3 Shango__SngA,Shango__SngB,Shango__SngC
+NC_019936.1_RM_Type_I_13 RM RM_Type_I Defense NC_019936.1_1070 NC_019936.1_1072 NC_019936.1_1070,NC_019936.1_1071,NC_019936.1_1072 3 RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_03
+NC_019936.1_RM_Type_IV_16 RM RM_Type_IV Defense NC_019936.1_1377 NC_019936.1_1377 NC_019936.1_1377 1 RM_Type_IV__FAM_0
+NC_019936.1_AbiC_1 AbiC AbiC Defense NC_019936.1_2817 NC_019936.1_2817 NC_019936.1_2817 1 AbiC__AbiC
+NC_019936.1_RM_Type_I_14 RM RM_Type_I Defense NC_019936.1_3312 NC_019936.1_3317 NC_019936.1_3312,NC_019936.1_3313,NC_019936.1_3314,NC_019936.1_3317 4 RM__Type_I_MTases_FAM_3,RM__Type_I_REases_FAM_1.einsi_trimmed,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_52
+NC_019936.1_CBASS_III_4 CBASS CBASS_III Defense NC_019936.1_3322 NC_019936.1_3325 NC_019936.1_3322,NC_019936.1_3323,NC_019936.1_3324,NC_019936.1_3325 4 CBASS__Cyclase_II,CBASS__Endonuc_big,CBASS__TRIP13,CBASS__bacHORMA_1
+NC_019936.1_RM_Type_I_15 RM RM_Type_I Defense NC_019936.1_3936 NC_019936.1_3940 NC_019936.1_3936,NC_019936.1_3939,NC_019936.1_3940 3 RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_06
+NC_019936.1_dCTPdeaminase_7 dCTPdeaminase dCTPdeaminase Defense NC_019936.1_4004 NC_019936.1_4004 NC_019936.1_4004 1 dCTPdeaminase__dCTPdeaminase
diff -r 000000000000 -r 315c2ed31af1 test-data/defense_finder_systems/NC_021184.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_021184.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,25 @@
+sys_id type subtype activity sys_beg sys_end protein_in_syst genes_count name_of_profiles_in_sys
+NC_021184.1_SoFic_11 SoFIC SoFic Defense NC_021184.1_113 NC_021184.1_113 NC_021184.1_113 1 SoFic__SoFic
+NC_021184.1_RM_Type_I_21 RM RM_Type_I Defense NC_021184.1_221 NC_021184.1_224 NC_021184.1_221,NC_021184.1_223,NC_021184.1_224 3 RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_51
+NC_021184.1_RM_Type_I_22 RM RM_Type_I Defense NC_021184.1_242 NC_021184.1_244 NC_021184.1_242,NC_021184.1_243,NC_021184.1_244 3 RM__Type_I_MTases_FAM_2,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_52
+NC_021184.1_MazEF_8 MazEF MazEF Defense NC_021184.1_395 NC_021184.1_396 NC_021184.1_395,NC_021184.1_396 2 MazEF__MazE,MazEF__MazF
+NC_021184.1_CAS_Class1-Subtype-I-B_29 Cas CAS_Class1-Subtype-I-B Defense NC_021184.1_509 NC_021184.1_516 NC_021184.1_509,NC_021184.1_510,NC_021184.1_511,NC_021184.1_512,NC_021184.1_513,NC_021184.1_514,NC_021184.1_515,NC_021184.1_516 8 cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas3_I_2,cas4_I_II_III_IV_V_VI_6,cas5_I-B_17,cas6_I-B_III_1,cas7b_I-B_I-C_2,cas8b1_I-B_9
+NC_021184.1_CAS_Class1-Subtype-I-B_30 Cas CAS_Class1-Subtype-I-B Defense NC_021184.1_770 NC_021184.1_779 NC_021184.1_770,NC_021184.1_773,NC_021184.1_774,NC_021184.1_775,NC_021184.1_776,NC_021184.1_777,NC_021184.1_778,NC_021184.1_779 8 cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-B_17,cas6_I_II_III_IV_V_VI_20,cas7_I-B_8,cas8b1_I-B_14
+NC_021184.1_Wadjet_II_17 Wadjet Wadjet_II Defense NC_021184.1_925 NC_021184.1_928 NC_021184.1_925,NC_021184.1_926,NC_021184.1_927,NC_021184.1_928 4 Wadjet__JetA_II,Wadjet__JetB_II,Wadjet__JetC_II,Wadjet__JetD_II
+NC_021184.1_RM_Type_I_23 RM RM_Type_I Defense NC_021184.1_963 NC_021184.1_967 NC_021184.1_963,NC_021184.1_965,NC_021184.1_967 3 RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_06
+NC_021184.1_Kiwa_6 Kiwa Kiwa Defense NC_021184.1_1016 NC_021184.1_1017 NC_021184.1_1016,NC_021184.1_1017 2 Kiwa__KwaA,Kiwa__KwaB
+NC_021184.1_PfiAT_10 PfiAT PfiAT Defense NC_021184.1_1033 NC_021184.1_1034 NC_021184.1_1033,NC_021184.1_1034 2 PfiAT__PfiA,PfiAT__PfiT
+NC_021184.1_BREX_I_4 BREX BREX_I Defense NC_021184.1_1159 NC_021184.1_1165 NC_021184.1_1159,NC_021184.1_1160,NC_021184.1_1161,NC_021184.1_1162,NC_021184.1_1165 5 BREX__brxA_DUF1819,BREX__brxB_DUF1788,BREX__brxC,BREX__pglX1,BREX__pglZA
+NC_021184.1_AbiE_1 AbiE AbiE Defense NC_021184.1_1208 NC_021184.1_1209 NC_021184.1_1208,NC_021184.1_1209 2 AbiEii__AbiEi_4,AbiEii__AbiEii
+NC_021184.1_RM_Type_III_26 RM RM_Type_III Defense NC_021184.1_1419 NC_021184.1_1420 NC_021184.1_1419,NC_021184.1_1420 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_021184.1_Gabija_5 Gabija Gabija Defense NC_021184.1_1422 NC_021184.1_1423 NC_021184.1_1422,NC_021184.1_1423 2 Gabija__GajA,Gabija__GajB_2
+NC_021184.1_PD-T7-2_9 PD-T7-2 PD-T7-2 Defense NC_021184.1_1424 NC_021184.1_1428 NC_021184.1_1424,NC_021184.1_1428 2 PD-T7-2__PD-T7-2_A,PD-T7-2__PD-T7-2_B
+NC_021184.1_RM_Type_IV_28 RM RM_Type_IV Defense NC_021184.1_1656 NC_021184.1_1656 NC_021184.1_1656 1 RM_Type_IV__Type_IV_05
+NC_021184.1_RM_Type_II_24 RM RM_Type_II Defense NC_021184.1_3394 NC_021184.1_3396 NC_021184.1_3394,NC_021184.1_3395,NC_021184.1_3396 3 RM_Type_II__Type_II_MTases_FAM_16,RM_Type_II__Type_II_REase01,RM_Type_II__Type_II_REase17
+NC_021184.1_Wadjet_I_15 Wadjet Wadjet_I Defense NC_021184.1_3691 NC_021184.1_3693 NC_021184.1_3691,NC_021184.1_3692,NC_021184.1_3693 3 Wadjet__JetA_I,Wadjet__JetB_I,Wadjet__JetC_I
+NC_021184.1_Wadjet_I_16 Wadjet Wadjet_I Defense NC_021184.1_3803 NC_021184.1_3806 NC_021184.1_3803,NC_021184.1_3804,NC_021184.1_3805,NC_021184.1_3806 4 Wadjet__JetA_I,Wadjet__JetB_I,Wadjet__JetC_I,Wadjet__JetD_I
+NC_021184.1_CAS_Class1-Subtype-I-C_31 Cas CAS_Class1-Subtype-I-C Defense NC_021184.1_4025 NC_021184.1_4031 NC_021184.1_4025,NC_021184.1_4026,NC_021184.1_4027,NC_021184.1_4028,NC_021184.1_4029,NC_021184.1_4030,NC_021184.1_4031 7 cas1_I_II_III_IV_V_VI_6,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-C_11,cas7_I-C_7,cas8c_I-C_2
+NC_021184.1_RM_Type_III_27 RM RM_Type_III Defense NC_021184.1_4091 NC_021184.1_4092 NC_021184.1_4091,NC_021184.1_4092 2 RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_021184.1_Lamassu-Hypothetical_7 Lamassu-Fam Lamassu-Hypothetical Defense NC_021184.1_4235 NC_021184.1_4237 NC_021184.1_4235,NC_021184.1_4236,NC_021184.1_4237 3 Lamassu-Fam__LmuA_effector_hypothetical,Lamassu-Fam__LmuB_SMC_hypothetical,Lamassu-Fam__LmuC_acc_hypothetical
+NC_021184.1_AbiH_2 AbiH AbiH Defense NC_021184.1_4301 NC_021184.1_4301 NC_021184.1_4301 1 AbiH__AbiH
+NC_021184.1_RM_Type_II_25 RM RM_Type_II Defense NC_021184.1_4531 NC_021184.1_4532 NC_021184.1_4531,NC_021184.1_4532 2 RM_Type_II__Type_II_MTases_FAM_27,RM_Type_II__Type_II_REase01
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_000913.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_000913.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000002.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000003.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000000.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
+sequence_000001.fasta.fasta,4_0,0.010000000000000009,average,ANImf,4
+sequence_000004.fasta.fasta,5_0,0.010000000000000009,average,ANImf,5
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_002737.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_002737.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000001.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000000.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_008261.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_008261.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_009012.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_009012.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000002.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
+sequence_000003.fasta.fasta,4_0,0.010000000000000009,average,ANImf,4
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_014168.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_014168.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_014212.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_014212.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000001.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_014364.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_014364.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_1,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,1_2,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000003.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_015761.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_015761.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000002.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_017033.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_017033.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000001.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000000.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_018068.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_018068.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_018515.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_018515.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_019936.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_019936.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000001.fasta.fasta,1_1,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,1_2,0.010000000000000009,average,ANImf,1
+sequence_000000.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare/NC_021184.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_021184.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000001.fasta.fasta,1_1,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,1_2,0.010000000000000009,average,ANImf,1
+sequence_000000.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_000913.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_000913.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_002737.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_002737.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_008261.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_008261.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_009012.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_009012.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_014168.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_014168.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_014212.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_014212.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_014364.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_014364.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_015761.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_015761.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_017033.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_017033.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_018068.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_018068.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_018515.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_018515.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_019936.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_019936.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/drep_compare_clustering_dendrogram/NC_021184.fasta.pdf
Binary file test-data/drep_compare_clustering_dendrogram/NC_021184.fasta.pdf has changed
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_000913.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_000913.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1685 @@
+>NC_000913.3|provirus_563848_584430
+TTATATTAATTCGTATAATTTGGCGTAGTCGATAAGCTCTACAATTGAATGCAAACCTAG
+CTTGCCATAAATATTAGATTTATGCGCACTAACTGTTTTATTGCTAAGTAATAACTTATC
+GGCAATTTCTTTATTAGATAATCCGCTAACCAGATAACGTAATATGGTCACTTCACGATT
+AGATAGCACAGTGACCGTTGAACTATTCGTACTACATTTATTGCTTTTTATATAGTTAAG
+CGTTTCGCTGGGAAAAAACGTGTATCCGGAGAGGATCATCTGAACGGCATGAAAAATATC
+ATTCTGATCATTGCATTTACTGACAAAACCGTTAGCACCAGCTTGTATCGCTCTGCCAGC
+ATAAAAGCATTCTGATTTCGATGATAAAAATAACACTTTCACTGTGCTCTGGATTTGTTT
+GATCCTTTTCAGGAAGGTAAAACCGTCTGTTCCGGGCAAGTCTATATCCATAATGATTAA
+ATCAACAGGACGGGTTCGGAGATAATCGATGGTTATGCGATAATCATCCGTTTTCAGGAC
+AATCTGCAATTCACTGTTTTTTTGCAACAGAACTTCAATAGACATTCTGATGATAGGATG
+AGTATCCATAATGATCACCGACGTTGGTTTCATAGTTACCAGTCTCATAGGAGCGGACAA
+TTTTCCGTTAGGTCGGGAAATTGTACTTTGATACATGAAAATACGGGTTTTCTTGATTCA
+GACGCGCAGCGGTGTGCGTTTGTTTGCCGCTATAGCGAAATAAATCAGAAAATCAGACGC
+GGTCGTTCACTTGTTCAGCAACCAGATCAAAAGCCATTGACTCAGCAAGGGTTGACCGTA
+TAATTCACGCGATTACACCGCATTGCGGTATCAACGCGCCCTTAGCTCAGTTGGATAGAG
+CAACGACCTTCTAAGTCGTGGGCCGCAGGTTCGAATCCTGCAGGGCGCGCCATTACAATT
+CAATCAGTTACGCCTTCTTTATATCCTCCATAATTTCAGAGTGGGACATATTTGGGACAT
+TATCACCAAAAATGTCGTCTATTTTCCTCGCATGCTCTGTCAAATGATTAGGCGCAAGGT
+GAGCATACCTACGAACCATTTCTATGGACTCCCATCCGCCCATTTCCTGAAGCACTGATA
+ATGGGACGCCTGACTGAATCAGCCAGCTTGCCCAGGTGTGTCTGAGGTCATGGAAACGGA
+AATCTTCAATTCCTGCACGACGACAAGCTGATAGCCATGATGTCTTGCTGTCGATGCGCA
+TCTTCCTGACCGCAGGCGTTGATGTTCCATCTGCTCGCTTAGCCGCCTTGGTATGTACAA
+ACACCCATTTGTGATGCTTGCCTATTTGATCACGCAACACTTTACAGGCGGTATCGTTCA
+GCGCCACACCAATGGCGCGGTTTGATTTGCTCTCTTCTGGATTCACCCAGGCAACTCGTC
+GCTGCATGTCGATTTGTTGCCATTCCAGATTTATGATGTTCGACTTTCTCAGACCAGTTG
+CCAGCGCAAACTTGACGACAGATTTCAGTGGTTCGGGGCACTCATCAATAAGGCGTTTTG
+CTTCCTCCTTTTCCAGCCATCTGACTCGCTTGTTTCTGACCGCTGGTATCTTGATGACAG
+GCGCTTTTTCCAGCCACTTCCAGTCGCGTTCTGCAGCACGGAGAATGGCCTTTATCATGG
+CAAGATGCTTTGCCTTTGTCTGAGTTGATACTGGCTTTGGTTCATAAACAGGCAGTTCTT
+TACCTTTCCTGATGGCGGCCTGAACTTTCTGTTTCCATATTTCTTTCGTCTTTCTGTTAT
+GCATTCTGCTTACAGCAGAGTAAATCTTTGCCTCCGAGATATCTTTAAGCCTTATACCCT
+CAAAATGTTCAAGCCAGAACTCAATCCGGCTTTTATCTGAATCGAGAGATTTTTTATCAG
+CTTTTTCCTCAAGCCATCTTAGGCAGGCCTCTTCAAAAGTGACATCAGGTAAATCCCCTA
+GCTTTTCTACTCGCCAGAGTTCTGCTTTTCGCTTGTCGTGCAACTCCTGAGCTTGCCGTT
+TGTCCTTTGTGCCAAGAGATTCCTTAATTCGTTTCCCGCCCGGGAGCGAATACGAGGCAT
+ACCATATTTCATTTCTGCGGAAGAGTGACATTTTCTTTCCTCTGTTATGCCATCACCCGC
+GCTCACCTGGACAGTATGCAGCGGAGACTGAAGCGCCGCAATGCAGGCTTGCCGTGTTGT
+GAGGTACCCGGATATTATCGTGAGGATGCGTCATCGCCATTGCTCCCCAAATACAAAACC
+AATTTCAGCCAGTGCCTCGTCCATTTTTTCGATGAACTCCGGCACCATCTCGTCAAAACT
+CGCCATGTACTTTTCATTCCGCTCAATCACGACATAATGCAGGCCTTCACGCTTCATGCG
+CGGGTCATAGTTGGCAAAGTACCAGGCATCTTTTCGCGTCACCCACATGCTGTACTGCAC
+CTGGGCCATGTAAGCCGATTTTATTGCCTCGAAACCACCGAGCCGGAATTTCATGAAATC
+CCGGGAGGTACGAGTATTGCCGGAAGCGTGGCCTGTATCCGGATGCAGAGTCTTATCCGT
+GGAAATCGAACGCGCATTACTGGTTGGTTACCAACTTGTACCAGAACATGCGGGCCAATG
+CGCTGGCTGACGCGGAATTACGGCGCAAGGCTGCCGATGAACTGACCTGTATGACAGCGC
+GAATTAACCGTGGTGAGACGATACCTGAACCAGTAAAACAACTTCCTGTTATGGGCGGTA
+GACCTCTAAATCGTGCACAGGCTCTGGCGAAGATCGCAGAAATTAAAGCTAAGTTCGGAC
+TGAAAGGAGCAAGTGTATGACGGGCAAAGAGGCAATTATTCATTACCTGGGGACGCATAA
+GAGCTTCTGTGCACAGGACGTTGCCGCGGTAACAGGCGCAACCGTAATCTGATCTTACCC
+AGCAATAGTGGACACGCGGCTAAGTGAGTAAACTCTCAGTCAGAGGTGACTCACATGACA
+AAAACAGTATCAACCAGTAAAAAACCCCGTAAACAGCATTCGCCTGAATTTCGCAGTGAA
+GCCCTGAAGCTTGCTGAACGCATCGGTGTTACTGCCGCAGCCCGTGAACTCAGCCTGTAT
+GAATCACAACTCTACAACTGGCGCAGTAAACAGCAAAATCAGCAGACGTCTTCTGAACGT
+GAACTGGAGATGTCTACCGAGATTGCACGTCTCAAACGCCAGCTGGCAGAACGGGATGAA
+GAGCTGGCTATCCTCCAAAAGGCCGCGACATACTTCGCGAAGCGCCTGAAATGAAGTATG
+TCTTTATTGAAAAACATCAGGCTGAGTTCAGCATCAAAGCAATGTGCCGCGTGCTCCGGG
+TGGCCCGCAGCGGCTGGTATACGTGGTGTCAGCGGCGGACAAGGATAAGCACGCGTCAGC
+AGTTCCGCCAACACTGCGACAGCGTTGTCCTCGCGGCTTTTACCCGGTCAAAACAGCGTT
+ACGGTGCCCCACGCCTGACGGATGAACTGCGTGCTCAGGGTTACCCCTTTAACGTAAAAA
+CCGTGGCGGCAAGCCTGCGCCGTCAGGGACTGAGGGCAAAGGCCTCCCGGAAGTTCAGCC
+CGGTCAGCTACCGCGCACACGGCCTGCCTGTGTCAGAAAATCTGTTGGAGCAGGATTTTT
+ACGCCAGTGGCCCGAACCAGAAGTGGGCAGGAGACATCACGTACTTACGTACAGATGAAG
+GCTGGCTGTATCTGGCAGTGGTCATTGACCTGTGGTCACGTGCCGTTATTGGCTGGTCAA
+TGTCGCCACGCATGACGGCGCAACTGGCCTGCGATGCCCTGCAGATGGCGCTGTGGCGGC
+GTAAGAGGCCCCGGAACGTTATCGTTCACACGGACCGTGGAGGCCAGTACTGTTCAGCAG
+ATTATCAGGCGCAACTGAAGCGGCATAATCTGCGTGGAAGTATGAGCGCAAAAGGTTGCT
+GCTACGATAATGCCTGCGTGGAAAGCTTCTTTCATTCGCTGAAAGTGGAATGTATCCATG
+GAGAACACTTTATCAGCCGGGAAATAATGCGGGCAACGGTGTTTAATTATATCGAATGTG
+ATTACAATCGGTGGCGGCGGCACAGTTGGTGTGGCGGCCTCAGTCCGGAACAATTTGAAA
+ACAAGAACCTCGCTTAGGCCTGTGTCCATATTACGTGGGTAGGATCAACCAGCATAAATC
+AGGCTGCGGCTAAAATGGCGCGGGCAGGAATCCTGGTCGTTGATGGTAAGGTCTGGCGAA
+CGGTGTATTACCGGTTCGCTACCAGAGAAGAATGGGAAGGAAAGGTGAGCACGAATCTGA
+TTTTTAAGGAGTGTCGCCAGAGTGCCGCGATGAAACGGGTATTGAGGGTATATAAAAGAA
+CATCAATGGGAACACAATGATGAAACAGGTGAGTTGAGTTCAAACTGTAGTACAATTCTC
+TCCAGTTTGAACAGGAAAGAATATGCTATGAACCCTTATATTTATCTTGGTGGTGCAATA
+CTTGCAGAGGTCATTGGTACAACCTTAATGAAGTTTTCAGAAGGTTTTACACGGTTATGG
+CCATCTGTTGGTACAATTATTTGTTATTGTGCATCATTCTGGTTATTAGCTCAGACGCTG
+GCTTATATTCCTACAGGGATTGCTTATGCTATCTGGTCAGGAGTCGGTATTGTCCTGATT
+AGCTTACTGTCATGGGGATTTTTCGGCCAACGGCTGGACCTGCCAGCCATTATAGGCATG
+ATGTTGATTTGTGCCGGTGTGTTGATTATTAATTTATTGTCACGAAGCACACCACATTAA
+AATAATTTGTTTCTAAACGACTAAAATATGGAGGCTCTTATATTTATATGAGCCTCGTTT
+TATGCTTTTTGTTAATGTCTTTATTTTTTATGTATTCTTTTGTGCTTTCAAGATTATGGC
+GTAAGAAAATTGCAATACGATTATTGTTGTATATTCAAGATAATGTGACCTTAATTGTCT
+TTTTAAATAAAAAATAAACAAAAATTATATCCCACCACTAAGGTTTATAAAAGCATACGT
+TAGCAGGTGTCACCATGAAAAAAGCCATAGCATATATGCGATTTTCATCACCAGGTCAGA
+TGTCTGGCGACTCATTAAACCGACAGAGAAGACTTATTGCTGAATGGTTAAAGGTAAATA
+GTGATTATTATCTTGATACCATAACATATGAAGATTTAGGATTAAGTGCATTCAAAGGAA
+AGCATGCACAATCAGGAGCTTTTTCGGAATTTTTAGATGCTATAGAGCATGGTTATATAT
+TGCCAGGAACTACATTGTTAGTTGAAAGTCTGGACAGACTTTCAAGAGAAAAAGTCGGTG
+AAGCGATTGAACGTCTGAAATTGATTTTGAATCACGGTATTGATGTTATAACTCTTTGCG
+ACAATACAGTCTATAATATTGACTCTTTGAATGAGCCATATTCATTAATAAAAGCCATAC
+TTATAGCACAAAGGGCAAATGAAGAAAGCGAGATAAAGTCAAGTCGGGTTAAATTATCAT
+GGAAGAAAAAACGGCAGGATGCACTGGAATCAGGTACGATTATGACGGCGTCTTGTCCGA
+GATGGCTCTCCTTAGATGACAAAAGAACGGCTTTTGTTCCAGACCCCGACAGGGTGAAAA
+CTATTGAGCTAATTTTTAAACTCAGGATGGAAAGGCGCTCATTGAATGCAATAGCCAAGT
+ATTTAAATGATCATGCTGTAAAGAATTTCTCAGGAAAAGAAAGTGCATGGGGACCTTCTG
+TAATTGAAAAATTATTAGCGAATAAAGCTCTGATAGGTATTTGCGTACCTTCATATCGTG
+CAAGAGGGAAAGGGATAAGTGAAATCGCTGGCTATTATCCCAGAGTCATATCAGATGATT
+TGTTTTACGCTGTACAGGAAATTCGGTTGGCACCTTTTGGTATTAGCAATAGTAGCAAGA
+ATCCTATGCTAATAAATCTACTTCGAACAGTTATGAAGTGTGAGGCTTGTGGTAATACCA
+TGATTGTTCATGCGGTATCTGGAAGTTTGCATGGCTATTATGTTTGTCCGATGAGAAGAT
+TACATCGATGTGACAGGCCATCAATAAAAAGAGATTTGGTTGATTATAATATCATTAATG
+AATTGCTTTTTAATTGTAGCAAAATTCAACCAGTTGAAAACAAGAAAGATGCTAATGAAA
+CTTTAGAGTTAAAAATTATTGAGCTTCAGATGAAAATTAATAATTTAATCGTTGCATTGT
+CTGTCGCGCCTGAAGTTACCGCTATAGCAGAGAAAATAAGACTATTAGATAAGGAATTAC
+GAAGGGCTTCGGTATCATTGAAAACTTTGAAGAGTAAAGGTGTAAATTCATTCAGTGATT
+TTTATGCTATTGACTTAACCAGTAAAAATGGACGAGAGTTATGCCGTACACTTGCCTATA
+AAACATTCGAAAAAATCATAATTAATACGGATAATAAAACCTGTGATATCTATTTTATGA
+ATGGCATTGTTTTTAAACACTATCCTTTAATGAAAGTAATATCCGCCCAGCAGGCGATAA
+GTGCTCTCAAATATATGGTTGATGGTGAGATTTATTTCTAAATAATGATCTCGGATTTTA
+AGTTATGCTATGGTGATAAAGTGCAAGACAGAATTAATTATCTTTGACGAAACTTAATGG
+GTAATTACTTTGTTTGCTCCCACAAGCGAGTTTTGTACGGCTGTATTGGGGTAGTAAATG
+AGCTATACAATCTTAATCATTTGTTAGGTGAGAACTCTTGGTCGCAGATTCAAATACTGA
+AAATACGTGACAAATTATTATGAGCAAAATGGTGTATGTCACGTATTTTGAATGGTAGGT
+TAAAAAATAACACCGACTTTCGTAGGTGTTACTAATAATAAAGCAGAGTTTTTAGATAGT
+ATCAATGTGCTTTGTGTATATTGTGGCAAATAATTGGGTTGGGGGTACAATTGTGATTGC
+TTTTGCATGAACATTGCGCCTTTATGCATAATGAGATAAAGGAATATCAAATAAAATAAC
+GATAGGTCATAACAAAGAGGTTTTTATGAAAACACTTATCGTTTCAACTGTATTGGCATT
+CATAACATTTTCTGCGCAGGCTGCAGCATTTCAGGTCACTAGTAATGAAATAAAAACAGG
+AGAGCAACTTACAACGTCTCATGTCTTTTCTGGATTTGGGTGTGAAGGTGGTAATACATC
+GCCCTCATTAACCTGGTCTGGTGTTCCTGAAGGTACCAAAAGCTTTGCCGTAACTGTATA
+TGATCCAGATGCACCTACAGGCAGTGGTTGGTGGCATTGGACTGTTGTTAATATTCCAGC
+AACAGTAACATATTTGCCCGTTGATGCAGGGAGACGTGATGGAACAAAACTGCCGACTGG
+TGCTGTTCAAGGCCGAAATGATTTTGGCTATGCTGGGTTTGGTGGCGCATGTCCTCCTAA
+AGGAGATAAACCACATCATTACCAGTTTAAAGTATGGGCTCTAAAAACTGAAAAGATTCC
+TGTAGATTCTAACTCCAGCGGAGCGTTAGTTGGTTATATGCTTAATGCTAATAAAATCGC
+AACCGCTGAGATAACACCAGTTTATGAGATAAAGTAGGGTGAGAGTATGCTGGCAAGAGG
+TAAGACTAACTTAAAGATCGAAGAAATACGGATGCATAAACATCATGAGATTCATAGGGT
+TAAGCCTCTTATGCCAGCTTTGTGTCGTATCCGTCAGGGAAAGAAAGTTATCAATTGGGA
+GACGCATACTTTAACTGTTGATAATAATCAAATAATATTATTTCCTTGTGGTTATGAATT
+TTATATTGAGAATTATCCTGAAGCAGGGCTTTATCTTGCAGAAATGCTTTACTTACCCAT
+TGATTTAATTGAGAGTTTCCAAAAACTTTATACGGTAACTGATCAAATACGTAACAAAAC
+AAGTTTCTTTTTACCTCAGAATCCTGAGTTAATATATTGTTGGGAGCAACTAAAAACATC
+TGTTTCCCGAGGCTTCTCAACTAAAATTCAGGAGCACTTAGCAATGGGCGTTCTACTTTC
+GTTAGGAGTGAATCATGTTAATCATTTACTTTTATCATATAGTAAACAATCATTGATAAG
+TCGTTGTTATAACCTGCTGCTATCCGAACCCGGCACAAAATGGACAGCAAACAAGGTTGC
+TCGATATCTCTACATTTCTGTTTCTACATTACATCGCCGTCTAGCAAGCGAGGGGGTAAG
+TTTCCAAAGTATACTGGACGATGTGAGGTTAAATAATGCGTTGTCTGCTATACAAACGAC
+GGTAAAACCTATAAGCGAGATTGCCAGAGAAAATGGTTATAAGTGTCCTTCTCGTTTTAC
+TGAAAGATTTCATAATCGTTTTAATATAACACCAAGAGAGATAAGAAAAGCTTCCAGAGA
+GTAAAAGTGTTTTAAGAAGGAGCAATTCTATCGATTTTGATTTTGGGAAATCAACACGGC
+ATAATTATGTCACCGGAGCCTGAACAACTCCGGTGACTTCTGCGCTAAACGGGGACGTTT
+ATGCGCACATACAATCCAAACTCTCTTCTCCCTTCACAGATGCAGAAATGCACCTGCAAT
+TCTTTGCATCTAGCGTTTGACCTCTGCGGAGGGGAAGCGTGAACCTCTCACAAGACGGCA
+TCAAATTACATCGCGGCAACTTCACCGCTATCGGTCGGCAGATCCAGCCTTATCTGGAGG
+AGGGCAAATGCTTTCGCATGGTGCTTAAACCGTGGCGTGAGAAACGCAGTCTTTCCCAGA
+ATGCACTCAGCCACATGTGGTACAGCGAAATCAGTGAATACCTCATCAGCAGGGGTAAAA
+CGTTCGCCACTCCAGCTTGGGTAAAAGATGCTCTCAAACACACATATCTCGGTTATGAAA
+CCAAAGACCTGGTTGATGTCGTAACCGGTGATATCACCACTATCCAGTCGTTACGCCATA
+CCTCCGATCTTGATACCGGAGAGATGTATGTCTTCCTGTGTAAGGTTGAAGCCTGGGCGA
+TGAATATTGGTTGCCACCTGACTATTCCACAGAGCTGCGAGTTCCAGCTGCTGCGCGACA
+AGCAGGAGGCGTAATGGCTACACCGCTTATTCGTGTCATGAACGGACACATCTACAGAGT
+ACCAAATCGTCGTAAGCGTAAACCTGAGCTGAAGCCATCCGAAATACCAACACTGCTCGG
+ATATACCGCCAGCTTGGTTGATAAAAAATGGTTGCGACTGGCAGCAAGGAGGAGTCATGG
+CTGATTTGAGAAAAGCAGCGCGTGGTCGGGAATGCCAGGTAAGAATCCCTGGCGTATGTA
+ATGGCAACCCTGAAACGTCTGTACTGGCACATATCCGGCTGACTGGATTGTGCGGCACCG
+GTACGAAACCGCCAGACCTGATTGCCACCATTGCATGTTCTGCCTGCCACGACGAAATCG
+ACCGCCGCACGCATTTTGTTGACGCTGGATATGCAAAAGAATGCGCGCTGGAAGGTATGG
+CGAGAACACAGGTTATCTGGCTGAAAGAGGGGGTTATTAAGGCGTGAATACCTACAGCAT
+CACATTACCCTGGCCTCCGAGCAATAATCGCTATTACCGCCATAATCGCGGGCGCACGCA
+CGTCAGCGCAGAGGGGCAGGCATACCGCGATAACGTCGCCCGAATCATTAAAAACGCAAT
+GCTGGATATCGGCCTGGCTATGCCTGTGAAAATCCGCATTGAGTGCCACATGCCGGATCG
+CCGTCGCCGTGACCTGGATAATCTGCAAAAAGCCGCTTTTGACGCACTCACTAAAGCAGG
+TTTCTGGCTGGATGATGCTCAGGTCGTTGATTACCGCGTTGTGAAGATGCCTGTTACCAA
+AGGTGGGAGGCTGGAACTGACCATCACCGAAATGGGGAATGAATGATGTTTGAGTTTAAT
+ATGGCAGAACTTCTTCGCCACCGCTGGGGGCGTCTGCGCTTATATCGTTTCCCCGGTTCT
+GTTTTGACCGATTACCGAATACTGAAGAATTACGCCAAAACCCTGACAGGAGCAGGAGTA
+TGAAGTCAGAGATAACAATCAACTAATACTGTTTTGTTGATTTTTGCTTGTAATTGGCGT
+TCTGGTCTGATTTTTGTGGAGTAAGTTGATGCGTGATATTCAGATGGTTCTTGAGCGTTG
+GGGAGCGTGGGCGGCTAATAATCATGAAGATGTGACCTGGTCGTCCATTGCCGCCGGTTT
+TAAGGGATTAATTACTTCAAAAGTAAAATCTCGCCCGCAATGTTGTGACGATGACGCGAT
+GATCATTTGCGGGTGCATGGCCCGTCTGAAAAAGAACAACAGCGATTTGCACGATTTATT
+AGTAGATTATTATGTAGTCGGTATGACATTCATGTCACTGGCAGGTAAGCATTGCTGCTC
+TGATGGTTATATCGGGAAAAGGTTACAGAAGGCTGAGGGCATAATTGAAGGGATGTTAAT
+GGCATTAGATATCCGGTTAGAGATGGATATCGTTGTTAATAACTCTAATTAATATGCCAA
+TTGTTTACTAAAAATTATTAAAAATGGGGCGTTGAGACGCCCCCAAAAATAAAGGGTAAT
+ATATAACAGAAGGTTTATATAGTTAGAAGCAAGGTTGTGCTTCTAAAGGAAGTGGCTTGA
+GGGAGCCACTTATATGTTGGGGAGGCAACGCCTCCCGCAACATATCTTTTTCGTAATCAG
+ATTAGAACTGGTAAACCAGACCTACAGCAACGATGTCATCAGTGCTTACACCGAGTGCTT
+TAGGGAAGGTGCGAATAAGCGGGGAAATTCTTCTCGGCTGACTCAGTCATTTCATTTCTT
+CATGTTTGAGCCGATTTTTTCTCCCGTAAATGCCTTGAATCAGCCTATTTAGACCGTTTC
+TTCGCCATTTAAGGCGTTATCCCCAGTTTTTAGTGAGATCTCTCCCACTGACGTATCATT
+TGGTCCGCCCGAAACAGGTTGGCCAGCGTGAATAACATCGCCAGTTGGTTATCGTTTTTC
+AGCAACCCCTTGTATCTGGCTTTCACGAAGCCGAACTGTCGCTTGATGATGCGAAATGGG
+TGCTCCACCCTGGCCCGGATGCTGGCTTTCATGTATTCGATGTTGATGGCCGTTTTGTTC
+TTGCGTGGATGCTGTTTCAAGGTTCTTACCTTGCCGGGGCGCTCGGCGATCAGCCAGTCC
+ACATCCACCTCGGCCAGCTCCTCGCGCTGTGGCGCCCCTTGGTAGCCGGCATCGGCTGAG
+ACAAATTGCTCCTCTCCATGCAGCAGATTACCCAGCTGATTGAGGTCATGCTCGTTGGCC
+GCGGTGGTGACCAGGCTGTGGGTCAGGCCACTCTTGGCATCGACACCAATGTGGGCCTTC
+ATGCCAAAGTGCCACTGATTGCCTTTCTTGGTCTGATGCATCTCCGGATCGCGTTGCTGC
+TCTTTGTTCTTGGTCGAGCTGGGTGCCTCAATGATGGTGGCATCGACCAAGGTGCCTTGA
+GTCATCATGACGCCTGCTTCGGCCAGCCAGCGATTGATGGTCTTGAACAATTGGCGGGCC
+AGTTGATGCTGCTCCAGCAGGTGGCGGAAATTCATGATGGTGGTGCGGTCCGGCAAGGCG
+CTATCCAGGGATAACCGGGCAAACAGACGCATGGAGGCGATTTCGTACAGAGCATCTTCC
+ATCGCGCCATCGCTCAGGTTGTACCAATGCTGCATGCAGTGAATGCGTAGCATGGTTTCC
+AGCGGATAAGGTCGCCGGCCATTACCAGCCTTGGGGTAAAACGGCTCGATGACTTCCACC
+ATGTTTTGCCATGGCAGAATCTGCTCCATGCGGGACAAGAAAATCTCTTTTCTGGTCTGA
+CGGCGCTTACTGCTGAATTCACTGTCGGCGAAGGTAAGTTGATGACTCATGATGAACCCT
+GTTCTATGGCTCCAGATGACAAACATGATCTCATATCAGGGACTTGTTCGCACCTTCCTT
+AGTGAAGTCATTTTTGTCAAGCAGGTTGATTTTGTAATCAACGAAAGTAGACATATTTTT
+GTTGAAGTAATAGGTTGCACCTACATCAACATATTTGACTAAGTCCTGATCGCCCCATAC
+TCCAAGATCCTTACCTTTAGATTGCAGGTAAGCAACGGACGGACGCAGACCGAAATCGAA
+CTGATATTGTGCAACAGCTTCGAAGTTTTGGGCTTTATTAGCAACGAAGTGATCAGCAAA
+TACAGTCATATTCTGGGTTTCAGAATAGGTAGTGGCCAGGTAAATGTTGTTAGCGTCATA
+TTTCAGACCTGCGGCCCAAACTTCTGCATTTTTACCGGAAGCAAATACTTCAGGAAGAAC
+TTTCCCTGCATTAACTTGAGTGTCGGTACGATCAGATTTCGCATAAGTTGCACCGATACC
+GAATCCTTCGTATTCATAGGTAGCAGAGAAACCGAAGCCATCACCGTTACCTTCAGTGTA
+GTTATCGAAATCGCTACGATCGTTTTTGCCTTGGTACTGAGCAGCAAAGTTCAGACCATC
+AACCAGACCAAAGAAGTCGTTGTTACGATAGGTTGCAACACCAGTTGCACGTTGAGTCAT
+GAACACGTCGGTTTGAGTCCAAGTGTCACCACCGAATTCTGGCAGGACGTCAGTCCACGC
+ACCGATGTCGTATGCTACACCGTAGTTACGGCCGTAATCGATGGAGCCGTAGTCACCGAA
+TTTCAGGCCAGCGAAGGCAAGACGGGTTTTATCTTTGGAGGAACCTTGAGATTCAGCGCG
+GTTGCCTTTGAATTCATATTCCCACTGACCGAAACCAGTCAGTTGATCGTTGATTTGGGT
+TTCACCTTTGAAGCCAAGACGGGCATAAGTAGTATCACCATCATCTGCATCATTAGAGGA
+GAAGTAGTGCTTAGCATTAACTTTCCCGTACAGATCCAGCTTGTTACTGTCTTTATTATA
+AATTTCAGCTGCCTGAGCAGACATCGCCATTAGTACTGATGCAGCTACAGCAGAAATTGC
+CACTGTTAATTTTTTCATCGTGAGCCCTTTTTTTGAACTATTATTAAAAAATGATGTCAC
+TGCGCGATAAATATTCATCTAATCAATGTGATTATTTCAAGATGTAAGTTTTGGTTTCTC
+GTTTGATTTGTGAAGTAGATCTCTATTTTTATCTGAACTTTTTTCTATCGAATCCTATTC
+ATGGCTCTTGGCTGAATAAAAATAAATCTATTAGCCAATTTATATTAACGGCTGTTATTT
+ATAAGTGCTCTATAATTTGAAGGTTCAATTTAAACCGGCTAAAAATAACACTGGAAATTA
+TTTTTTGGTTATTTGTTGAGATTTGCTTATGTATTTGTAGTGGTGTTTTCAATACTCGGT
+AGCATTCTCTCAAATATCATTTAGTGGTTTACGTACGTAAAAAATTGGTTATGCTGTTAA
+GAGTGGTTACTTCGTCACACAGCTTAAACCCGCCGTCGAGCGGGTTTTTCCATTTTTTGA
+GTCTCGATATTAGCTGATAACCCAATACCTGAGTTATTCACTGACTCCGAGTCTGTTACG
+TTTCGTAGTATTCCCTCAATTTACACCCGCTTTGTCTGCGAGGTGGGGTTATGAAATCCA
+TGGATAAGTTAACAACGGGTGTCGCCTATGGCACCTCAGCAGGTAGTGCCGGGTACTGGT
+TTTTACAGCTGCTAGATAAAGTCACTCCCTCACAGTGGGCAGCAATAGGTGTGCTGGGTA
+GCCTGGTATTTGGCCTGCTGACGTACCTGACAAACCTTTATTTCAAGATTAAAGAAGATA
+AGCGCAAGGCTGCGAGAGGTGAATAATGCCTCCATCATTACGAAAAGCCGTTGCTGCTGC
+TATTGGTGGCGGAGCAATTGCTATAGCATCAGTGTTAATCACTGGCCCAAGTGGTAACGA
+TGGTCTGGAAGGTGTCAGCTACATACCATACAAAGATATTGTTGGTGTATGGACTGTATG
+TCACGGACACACCGGAAAAGACATCATGCTCGGTAAAACGTATACCAAAGCAGAATGCAA
+AGCACTCTTGAATAAAGACCTTGCCACTGTCGCCAGACAAATTAACCCGTATATCAAAGT
+CGATATACCGGAAACAACGCGCGGCGCTCTTTACTCATTCGTTTACAACGTGGGTGCTGG
+CAATTTTAGAACATCGACGCTTCTTCGCAAAATAAACCAGGGCGATATCAAAGGCGCATG
+TGATCAGCTGCGTCGCTGGACATACGCTGGCGGTAAGCAATGGAAAGGCCTGATGACTCG
+TCGTGAGATTGAGCGTGAAGTCTGTTTGTGGGGGCAACAGTGAGCAGAGTAACCGCGATT
+ATATCCGCTCTGATTATCTGCATCATCGTCAGCCTGTCATGGGCGGTCAATCATTACCGT
+GATAACGCAATCGCCTACAAAGTCCAGCGCGACAAAAATGCCAGAGAACTGAAGCTAGCG
+AACGCGGCAATTACTGACATGCAGATGCGTCAGCGTGATGTTGCTGCGCTCGATGCAAAA
+TACACGAAGGAGTTAGCTGATGCGAAAGCTGAAAATGATGCTCTGCGTGATGATGTTGCC
+GCTGGTCGTCGTCGGTTGCACATCAAAGCAGTCTGTCAGTCAGTGCGTGAAGCCACCACG
+GCCTCCGGCGTGGATAATGCAGCCTCCCCCCGACTGGCAGACACCGCTGAACGGGATTAT
+TTCACCCTCAGAGAGAGGCTGATCACTATGCAAAAACAACTGGAAGGAACCCAGAAGTAT
+ATTAATGAGCAGTGCAGATAGAGCTGACCATATCGATGGGCAACTCATGCAATTATTTTG
+AGCAATACACACGCGCTTCCAGCGGAGTATAAATGCCTAAAGTAATAAAACCGAGCAATC
+CATTTACGAATGTTTGCTGGGTTTCTGTTTTAACAACATTTTCTGCGCCGCCACAAATTT
+TAGCTGCATCGACAGTTTTCTTCTGCCCAATTCCAGAAACGAAGAAATGATGGGTGATGG
+TTTCCTTTGGTGCTACTGCTGTCTGTTTGTTTTGAACAGTAAATGTCTGTTGAGCACATC
+CTGTAATAAGCAGGGCCAGCGCAGTAGCGAGTAGCATTTTTTTCATGGTGTTATTCCCGA
+TGCTTTTTGAAGTTCGCAGAATCGTATGTGTAGAAAATTAAACAAACCCTAAACAATGAG
+TTGAAATTTCATATTGTTAATATTTATTAATGTATGCCAGGTGCGATGAATCGTCATTGT
+ATTCCCGGATTAACTATGTCCACAGCCCTGACGGGGAACTTCTCTGCGGGAGTGTCCGGG
+AATAATTAAAAACGATGCACACAGGGTTTAGCGCGTACATGTATTGTATTATGCCAACAC
+CCCGGTGCTGACACGGAAGAAACCGGACGTTATGATTTAGCGTGGAAAGATTTGTGTAGT
+GTTCTGAATGCTCTCAGTAAATAGTAATGAATTATCAAAGGTATAGTAATATCTTTTATG
+TTCGTGGATATTTGTAATCCATCGGAAAACTCCTGCTTTAGCAAGATTTTCCCTGTATTG
+CTGAAATGTGATTTCTCTTGATTTCAACCTATCATAGGACGTTTCTATAAGATGCGTATT
+TCTTGAGAATTTAACATTTACAACCTTTTTAAGTCCTTTTATTAACACGGTGTTATCGTT
+TTCTAACACAATGTGAATATTATCTGTGGCTAGATAGTAAATATAATGTGAGACATTGTG
+ACGTTTTAGTTCAGAATAAAACAATTCACAGTTTAAATCTTTTCGCACTTGATCGAATAT
+TTCTTTAAAAATGGCAACCTGAGCCATTGGTAAAACCTTCCATGTGATACGAGGGCGCGT
+AGTTTGCATTATCGTTTTTATCGCTTCAATCTGGTCTGACCTCTTTGTGTTTTGTTGATG
+ATTTATGTCAAATATTAGGAATGTTTTCAATTAATAGTATTGGTTGCGTAACAAAGTGCG
+GTCCTGCTGGCATTCTGGAGGGAAATACAACCGACAGATGTATGTAAGGCCAACGTGCTC
+AAACCTTCATACAGAAAGATTTGAAGTAATATTTTAACCGCTAGATGAAGAGCAAGCGCA
+TGGAGCGACAAAATGAATAAAGAACAATCTGCTGATGATCCCTCCGTGGATCTGATTCGT
+GTAAAAAATATGCTTAATAGCACCATTTCTATGAGTTACCCTGATGTTGTAATTGCATGT
+ATAGAACATAAGGTGTCTCTGGAAGCATTCAGGGCAATTGAGGCAGCGTTGGTGAAGCAC
+GATAATAATATGAAGGATTATTCCCTGGTGGTTGACTGATCACCATAACTGCTAATCATT
+CAAACTACTTAACCTGTGACAGAGCCAACACGCAGTCTGTCACTGTCAGGAAAGTGGTAA
+AACTGCAACTCAATTACTGCAATGCCCTCGTAATTAAGTGAATTTACAATATCGTCCTGT
+TCGGAGGGAAGAACGCGGGATGTTCATTCTTCATCACTTTTAATTGATGTATATGCTCTC
+TTTTCTGACGTTAGCCTCCGACGGCAGGCTTCAATGACCCAGGCTGAGAAATTCCCGGAC
+CCTTTTTGCTCAAGAGCGATGTTAATTTGTTCAATCATTTGGTTAGGAAAGCGGATGTTG
+CGGGTTGTTGTTCTGCGGGTTCTGTTCTTAGTTGACATGAGGTTGCCCCGTATTCAGTGT
+CGCTGATTTGTATTGTCTGAAGTTGTTTTTACGTTAAGTTGATGCAGATCAATTAATACG
+ATACCTGCGTCATAATTGATTATTTGACGTGGTTTGATGGCGTAGATGCACGTTGTGACA
+TGTAGATGATAATTATTATCATTTTGTGGGTCCTTTCCGGCGATCCGACAGGTTACGGGG
+CGGCGACCTCGCGGGTTTTCGCTATTTATGAAAATTTTCCGGTTTAAGGTGTTTCCGTTC
+TTCTTCGTCGTAACTTAATGTATTTATTTAAAATACCCCCTGAAAAGAAAGGAAACGACA
+GGTGCTGAAAGCGAGCTTTTTGGCCTCTGTCGTTTCCTTTCTCTGTTTTTGTCCGTGGAA
+TGTGCAATGGAAGTCAACAAAAAGCAGCTGGCTGACATTTTCGGTGCGAGTATCCGTACC
+ATTCAGAACTGGCAGGAACAGGGAATGCCCGTTCTGCGAGGCGGTGGCAAGGGTAATGAG
+GTGCTTTATGACTCTGCCGCCGTCATAAAATGGTATGCCGAAAGGGATGCTGAAATTGAG
+AACGAAAAGCTGCGCCGGGAGGTTGAAGAACTGCTGCAGGCCAGCGAGACAGATCTCCAG
+CCAGGGACTATTGAGTACGAACGCCATCGACTTACGCGTGCGCAGGCCGATGCACAGGAG
+CTGAAAAATGCCAGAGACTCCGCTGAAGTGGTGGAAACCGCATTCTGTACTTTCGTGCTG
+TCGCGGATCGCAGGTGAAATTGCCAGTATTCTCGACGGGATCCCCCTGTCGGTGCAGCGG
+CGTTTTCCGGAACTGGAAAACCGACATGTTGATTTCCTGAAACGGGATATCATCAAAGCC
+ATGAACAAAGCAGCCGCGCTGGATGAACTGATACCGGGGTTGCTGAGTGAATATATCGAA
+CAGTCAGGTTAACAGGCTGCGGCATTTTGTCCGCGCCGGGCTTCGCTCACTGTTCAGGCC
+GGAGCCACAGACCGCCGTTGAATGGGCGGATGCTAATTACTATCTCCCGAAAGAATCCGC
+ATACCAGGAAGGGCGCTGGGAAACACTGCCCTTTCAGCGGGCCATCATGAATGCGATGGG
+CAGCGACTACATCCGTGAGGTGAATGTGGTGAAGTCTGCCCGTGTCGGTTATTCCAAAAT
+GCTGCTGGGTGTTTATGCCTACTTTATAGAGCATAAGCAGCGCAACACCCTTATTCCAGC
+TGGCTTCGTGGCTGTTTTCAACAGTGATGAGTCATCGTGGCATCTCGTTGAAGATCATCG
+GGGTAAAACGGTTTATGACGTAGCGTCAGGGGACGCGTTATTTATTTCTGAACTCGGTCC
+GTTACCGGAAAATGTTACCTGGTTATCGCCGGAAGGGGAGTTTCAGAAGTGGAACGGTAC
+AGCCTGGGTGAAAGATGCAGAAGCAGAAAAACTGTTCCGGATTCGGGAGGCGGAAGAAAC
+AAAAAACAGCCTGATGCAGGTAGCCAGTGAGCATATTGCGCCACTTCAGGATGCTGTAGA
+TCTGGAAATCGCAACGGAGGAAGAAACCTCATTGCTGGAAGCCTGGAAAAAATATCGGGT
+GTTGCTGAACCGTGTTGATACATCAACTGCACCTGATATTGAGTGGCCTACGAACCCTGT
+CAGGGAGTAATCATTGGGATTATGCCGCAGCACGTCTTAAGCAAGAACATGCTGCGGTTG
+GATGCTATTTTTTTCCTGAAGCGGAAAACATTACTACAGTACCTTGAACCTTGGTTTTAA
+CATTCTCGAAATGCTCTGAGAGTATATGTGTTAAGCCTTCTTCGGAATCTTTTGTGTTTG
+AAAAGATGCCTTTCTGATTGTAAATGCGCATCAGTTTTTGACCGAAGCTATTGTGCACAA
+CTCCATCGCCAAGAATTGTGGCTCCGTATAGAGTTCCATCGTCAGTTAAGGCCTGCGCCG
+CATTGCGTATTACACAGCTTTTTGTAGATATATTTCCAGGCAGGCAGTGAAGAAGGTAAG
+ACATGGAAATGGAATCAAATTGACCATGTAACGCCGCGGGATAAGGTTCAAAAACATCAT
+GGCTAATTTTATGTTTAATTTTTGATTCCCCAGCCCTTGTAGATGCCGCGTTCAGGCTAG
+CTTCGTTCAAATCCATTAAAGATATCAGACTACTCTCAGGTACGTGAGTAAGGTAAAACC
+CAGTTCCAACACCAATATCCAGATGGTTGTTACCTAAATGTTCCAGAAAGTGTGGAAGAA
+GGTGTTCCTTTGTAGGACATCCCCATGCAAGCCGATTTGATACTCCCAAAACCCACCAGT
+CATAAAGCTTTAGGGTAAGTGGTGTGTAAATTCTAGCCCCATCATCTGTGTTTTTTTATT
+AATTTCACCATGTTATAGTTTTATTTGTGAATTAAATCAATTATGGCAATGAATTACAAG
+GGGTTAAATGCTGCCGCAGCATAGCGATATTGAAATAGCCTGGTATGCTTCAATACAGCA
+GGAGCCGAATGGCTGGAAGACCGTCACCACACAGTTCTACATCCAGGAATTCAGTGAGTA
+TATTGCGCCACTGCAGGATGCTGTAGATCTGGAAATCGCAACGGAGGAAGAAAGATCGTT
+GCTGGAAGCCTGAAAAAAGTATCGGGTGCTGCTAAACCGTGTGGACACTTCCGTAGCACC
+AGATATCGAGTGGCTTATTCAACCATAATAAACAGTATGTATATCATAGGTTATTAATTG
+TGAGTTTTTTCGGTGTGTTATTTGTTTGTTTGATGTTATGCTTTTGCGCCCCAAAAGGTT
+GTTTAGATGTATTTTATCAATTGATTTTCAATATCGTTTAATAAAGAAAAATTAAGCAAG
+CTGGATGTTGGTTTTTTGTTAATTGAATGGTTCTAATAATGTTTTTTTACTGTTGTTGAA
+TGTGACTTGATAAGAAATGCAAGTAAAAATGATACTCTTTTTATTTTAAATTCAAACGGT
+TGACATATATATAGCAAGAGGTTTCAGGTGCGTTGTAGTGAGTTTATGTTAATAAAAAGC
+ATAGTAAGCGTTGAAAAATGTAACTTTGAAATAAGTTAGAATAAAAAACAACATACATAT
+AATAATTTAATCTTAAATGAAATTTATTAAAATTTGCAAACTATAATTTTGTGTATAAAA
+ATATAAATGCACATCATCCTGATTATGATTGTGTATTTAATTGGTTGTTATTTGACTACT
+ATCAACTTGTTTTAATTTTATGATAGGTGCAAGATGGATTATGTTTGCTCCGTAGTTTTC
+ATCTGTCAATCATTTGATTTAATTATAAACAGGAGAGTTATCTCGTTCAAAAAAAATTCA
+TTGTTTATTGTAAGCGACAAAATTAGAAGGGAGTTACCAGTATGCCCCTCTAAACTAAGA
+ATTGTTGATATAGATAAGAAAACATGTTTATCCTTTTTTATCGACGTGAATAATGAGCTG
+CCTGGCAAATTTACTCTTGATAAGAATGGCTATATTGCTGAAGAGGAACCTCCATTATCG
+CTTGTTTTTTCTCTGTTTGAAGGGATTAAAATAGCAGACTCACACTCCCTTTGGTTAAAA
+GAAAGACTATGTATATCCTTACTTGCCATGTTCAAAAAACGCGAAAGTGTAAATTCATTT
+ATACTAACAAATATAAATACATTTACCTGTAAAATTACTGGAATAATCAGTTTTAATATT
+GAGCGGCAATGGCATTTAAAAGATATTGCGGAATTGATTTATACGAGTGAAAGTTTAATA
+AAAAAAAGATTAAGGGATGAAGGAACGTCATTTACTGAAATATTGAGAGATACTAGGATG
+AGGTATGCAAAAAAACTCATAACTTCAAACTCTTATTCTATCAATGTCGTAGCCCAGAAA
+TGTGGCTATAACAGTACTTCATATTTCATATGTGCATTTAAAGATTATTATGGTGTCACG
+CCATCTCATTATTTTGAGAAAATAATCGGCGTCACAGATGGAATAAACAAAACAATTGAC
+TGA
+>NC_000913.3|provirus_1196867_1213107
+TTATATTGCATTACAACTCCCAACAGTGACATATGAACTTCCTGCTTTACTCCACGACTT
+TAATATTTCAAGGCCATGTGAAGAACATATTTCTTGCACTGCGAGTTCATCGAGTAATCC
+ATAGTAAGAAACACTTTTTGAATTTTTGTAAATGTATCCGTAAAGATGTTTTCTTCCTGT
+TTCGTATTTTTTGAAGTATGAGCTTTTATATTGATTTACAATAAGAGTCTCACCTCCTGA
+TTTTAGTAATCTCTTGATGCTAAGAACTATTTTGTCGATTGTATCCCGACAAGGAACGGC
+AGAGAGAACATTAGAGCAAAGGATGAAATCGTAACCCCCAATTATTTTGTCGACATCCTC
+GAAAGCAACTGTATTTGCATTTTTATAATATCGTGGGACATAGTCAATAATTTTAGTTTT
+AATTCCTCTAATAATTTGCTCTCTTTCAAGTTGCCTTTTCGAGTCTAGAAAAGTAACTTC
+ATCAAATTTACTGATTAATTCATCAGAATATCTAAGTTTTCCGCAGCCAAAATCAAGGGC
+GTGGCCATTTTTCTCAATGCTTCTAATATACTCGCAAAGATATCTAGAGGGCATCGTATG
+AGGTTTTGCTGCATTCTCTGAGCGAATATTAACTCCGTGCATATTATAGTTCAAAGCAAG
+TACCATTCAATTAATGTTATTTTTAGTGAAAAATTCTTTTATTTTATCGTCCGGGATTTT
+TCCGACTTGACTTTCAGTTCTGGGCTTAACTGTCAAAGCAAAGATAATACCACTCACTGA
+GAATGATAAAATTACAAAAAAGAATAAAGACAGCAAAGAACCTTCAACATGAAAAATATC
+CATTTGTTTGCAAAAAAAGATTATTAGGAAGGAAATTAATGCAATTATCGAAAATTCAAA
+AAATATCCAAAAATAGTATACTTTATTCCAGAAGAGTTCAATATAATGTTTGTCTTCAAT
+TTTTCTTACTTCAGGGTAATATAGATTGCTCATTACATTGTGAGCTTCATCTTTATTTAA
+TTTTCTGTTGACTCCAGCTCTCCGTGATAACGGTTTTATAATTAGATGCTTATCCCAAAG
+ATATCGCACCCGAAGTAGTTTGGCTGCATTGTTATGTAGGTCTAACGCACCGCTAATTAA
+ATATGCAAAAATCGCAAAAGCACAAGGTAATATACCAAAAGATAGTGCCCAATTAATAAA
+GCTCTCATGATCTTTAATAGGTGGGACATACTTGGTTGGTAATGTTATTAAAGGGATGTA
+TTCGTAAATAACTAGAAGTATGCAATATATTAGCGTATTTAAGAAAGTTGCTTTATGAAG
+TTTAGGCAACATTTCATTATAATTTTTGGGGGGTTCGAACATATTATTCACCTGAGTCAC
+GCTTTAGGATAGTGTAATGGTAATATTTAATTAAGTGTCATTATATACTTTTCAGTAGGT
+TAGTTACAATTTTTTGTATCTGTTCAGGCTGACCTAGCTTCGCTGACAGACAATATTGTG
+ATCAGTAGCACGTATCGAGGAGGAGTAGCGCTACAAATTTGACGCTGGGTGAGAATCTGA
+AATTGATAGAAATGAAATAATGAAATAATGAAATGATGAAATGATGAAATGATGAAATGA
+TGAAATGATGAAATGATGACAGAGTGTCCAGTGGGCACGGATGGTGTCTTACGACATGCT
+TACCTTAATCGTTCCCAGTGTGCCTATAGCAGATATTCTAAACATGTCGATAATTCATTA
+CGCATATAGTATCGAACATAGAAAAAACTGAAGATTCATCTTATTTTGTATATACTACCT
+AGCCCAACAATGTAGAGGTTAACGAAAAATGCGCTCACCAATTTGTCATCTTTTCTCAGC
+AATTAATTCATCACCATTTAAGATTGCACCAGAGAAGGAGCAAGATCTTAAAACGATAGT
+TGACGACAAAAAAATTATAATTTCAGTTGTGAGTGAACCTGGTTTTAATATCCGAGTCAG
+GAAGAATGAGAGTAATAATTCACATGAAATAGTTCTAACAGTAGCTTCACTTGAATATAT
+TTGGGCATTTTCCAATTTCTTTTGGGTTTTTACGCAAGAGTACTCCAAATCTCAGAAAAA
+TAATGATGAGCACTTTGATTTAACAGGAAAAAATAGGCTTAAAAAGTCTGATGAACTTCT
+TAAATGGGCAAGGAAAAACTTGCAAACAACAGGTTGCGAATCATGGCCTAAAAAATGTCC
+CAAGCCAGAAGCATATTTACAAGGAAGCGAAGACTCACAAGTTGCTAGCGAGATATTTCT
+TTGTGCTATTGCTTGGATTCTTCATCATGAAATAAGTCATGTTGTTTTACAGCATCCATT
+GGTCACTACAGCATTCTCCACTCAAGAGGAGCGTGAAGCAGATTCACATGCTACAAAATG
+GATATTAGGCAACCTGTATGAATCCGCTCCTGAATTAAAGAAACGTGCACTTGGCATTGC
+TACGGCAGTGCTTTGTATACAAAGCTTAGAAGTTGAAAATTACTTCTGTTTACAAAATAC
+ACACCCAGCTGCATATGAGCGTATATATTCGAATATTTCATGCTACCCTGTCGGAAATGA
+AGAGTTGATTGAAGCTCTATGTACAGTGATGCTTCAATATCTTTTCCATGGCAAAAATAT
+CAATGTGAATCTAGATGGGGAGTCCTTTTCATCGATTTTAGGTGATCTTCTCTGTGATAT
+TTCACGTCTTACCAGTAACTGATATGGCTGTCCGCCGCTCGCTTAAAGTGGACTTTTTAG
+TTTTTATCATGTGCGGTGAGAAATTCAATGTGGCGTTGAGATGCTTAAAGGTTCACAACG
+CTACTTTGCTCCATCCTTTACCTCGATCATCATGATAACGATCGGTTTGTTGTTGTGTTT
+TATGACCAAGTAGTTTTTGTGTGTCTAACCCCTGTTCTTTATACAGACGTTCAGATAAAG
+ACCTTTGCTCATGGAATGTCGCAGGTGAACCCTCTCCCCAGTCAATTCTTGCTAAATCTC
+TCGCTTTACTAAAATTCATCGTCAATGTATTGGCTTTAACCTGCGCTCCGCGCTCTGCTT
+GTGAAGTTGAACGAAAAAAATGCACTAAGTATGCACTGACTGCATAGTCACGGCAGCGGG
+CTACTACATCGCGTAAACTCCAGTTAATCGCATTGAGGCGAAGAGAAAGAGGAATTGCGA
+TTTTGCTCCCGGTCTTTTCCTGAATGACATGAAGATGATCATCCCAAATATCGCTAAATT
+TCATACGCGAAATATCACCTAACCGCTGACCAGTAACCAGCGCTAACAGCATGGCATTTC
+CCATGTAACGATGAGTAGCGTCTGCGATATCGAAGATTTTTTTCCATTCTTCAAGGCTCA
+GCCGTTGTCGGGTAATTTTTCTTCTTGGTTGTTTAGTGGCTAATGCTGGGTTATAGCCAG
+GAGGTACTTCTCCGTAGTGCTGCGCCTCTTTGAAAACATCAATCAGGACGGAGCGAACTA
+CTTGTGCCATTCTTGGCCGCCCAGCGGCGATATACTCATCAAGCAATTGTGCTATATCTC
+TGACATCAACGGCTGAGATCAACTTCATTCCTGCTCGTTCTCTGAGCAAGGATACTGGTT
+TAGCTTTTTGTTTATAGGTGTTGAGTCTTATATCACCACTTTTAAGCCTGTCATCCTGGA
+TCGCTTGATAGCGATCTAACCAGGTTGACGTTGTGATAGCCTTTCCTTTGCTGGTTGCGA
+TCCTGTCACTGATAGCCAGAATCTGCCGGGTTCTTTGTTCAGCCAGGCGAGTGTTGGCCT
+CAGTGGCAATAGCGATAGCTTCAGCTTCGTTTGTTCCCAAAGCATGGAATTTTCCTGTCA
+CTGGATGCTTATACCGCCAATAGACTTTATTTACCTTCCTACTATAAAGCGGATATAAGT
+TAGGGACTGAAACATTATTCTTACGCGGTCTGGCTGCCATTACTCAAAATCCGTTGCAAA
+AGTAATGAGTCATTTTTCTTGATTACAGGTGTTACCAACTCCCCAACTAACTCGGCGTCC
+TCACGCACTCGCCATAACCGGCCTTGTTTCATGGCCGGTGGACAAAATAAATTCTGCTTA
+GCATAACGACGCAATGTGGACACACTTGGAGGATTACTTCTGTATTTTTCAGCAGCCCAT
+TCTTCAAGAGTTAACATTTGAAGCATATGCGATCACCTTATTACTACACTAACTGCTTAG
+TCTCAGCATATCGACCCTGCACGGTCGGTTAGTTTCTCCACAAAACAGAGAAGAGCACCT
+GTGGCCACAGCTATCAGGATGGGTCGGGTTATTAACCCGTCATCCGGGGATACTCTTCTC
+TGTTTTGTAAAAAGGGCGGTACCAGAAAGGACTAAGGAAAAAACTGGTACCGCCAAGACT
+ACACACAGCATAAAGTTGTGGTGTCGGGTGCCCCCGGTGCCTGGCGAAGGTTGCACACCA
+GGCGGGTGGGTATCCACAGAAGGTCGATTGTCAGCCTCAACCTTAACCCGCGTGCGCTGA
+GCCGCATTCACCACAACGCTAAGGATTCTCTCTGGTTGAAAATACTTAGCTGTTATGTGC
+CTGTCTTTTCACCACTTCAGGCTCGGTGGTATGCTGGAGTTCTCACACAGCCAGCAAGCA
+AGGAAACTTAATGAACCAGTTTTATGTTCACGTTCGTCTATTTGAAGACACAGCCGAACA
+GACCAAAAAATTTGAAGAATTAATGCTTAACTTTCTGTACCAGAAAACAGTTAAAGAGTC
+TGACGATAGCTGCTGCAGACTGATTCCAGAGGGATATATCCTCAAAAGTACAATGAACTG
+CCAACAAATCCTTGATCAAACATTTTCAATTGCTAACAGTGCCGGTGTTGACGCAAATAT
+ATTTGTCTGTAAATTTGAACAAAGCGCATGCTTACTTCCGTCTGCTTCCTTAGTTGGTAA
+CGATTTCGTTCATTACGATCTTACGCCTAAGCCCATCAAGCTCGATTCTTAAAGCCTTAA
+CCATTGTGTCGTGATAAACACGGCTCACCTTCTCTCCATTGCATGGCAGAGGGGTGAGTG
+TGTTAGCCATGAAATTCATGAACTCGGTTCGACCAGGGGCTTGCGCCCCGCAAGTCTTTA
+ATGCCTGTTTTGCTAACAAAATGCGGGCCTCAGTGCCTGCATTTGGCTCTATCTGCTGCA
+AACGTTTAGCGTCTTCCAGCAACAATGCGATCACATGCTTCAAATTCTGCTCATTCATCT
+ATTCTCTCCACTGAAATCATCCGCTAACGAATCATCCCGGTCTTCGTACGTACCGGGCGG
+GCTACTTCGTGGGCGTCCTGCCTGTTTGTTGTTTCTCTTGGGTACATTATGTATCTCAAA
+GGTACATTGTCAAGTATAAAAAAACCTGCCGAAGCAGGTTCATAAACATTGATTAGGCTT
+TGATTTTGTATCTTCTTGGTTTTCCTGAGAAAATCACAGTACCAATTATAGAGCAATTAC
+CGTTGATCTTAATGTAAGGCTCAGGCCAGTTTGGGTTTAACGCTTTGAGATAACGCTGTG
+TCCCATCTTCTATCAACCTTTTGAAGGTGGTTTCACCTGTATCGTGCATCAATGCAATAA
+CGTCGTCACCGTGGCAGGCAGGTACTTCAGGATCGACAAAAATCATGTCTCCCGGGCGGT
+ACTCATCAATCATTGAATCACCTATTACCCGCAAGATATAAGTCATTTCCCCACAGGGTA
+CAGGGCAGGGATACGTTTCTGCTGTGCTCAAATCAACCTCAGAATATCCAACTTCTTTCC
+ATGCTCCGGCCTGTACCCATGATATGACAGGGACTAATGTGATTTGTTTATTAGTGATTG
+AAACATCAGGTTTTTTTGTGATGTTCGTTGTCTGGTGTTCTTGATCGAGCCATCCTACAG
+GCAGGTCGAAACATTTTTCGATGTGTCGTGCCATGCTGTCACCGATATTTTTAGTAGCAC
+CATCTCCCATAAACCTGCTGGTCTGGGTTGGCTCGCGATCAATCATAGTGGCAAAGGAAG
+AATTCCCGCCAACACCATCTCTCAGTTTTCTGGCGTTAGACCGCCGGATGTCATGGATTG
+TTTTCATAACGAAATTAAAACCCTTGTACCGTTAAGGTACAAGTATCTTGAAGGTTCATT
+TCAATCATGTAATATGTACACCGGAGGTACATATTGTATGAAAGCGTATTGGGACTCTTT
+AACCAAAGAACAGCAGGGCGAGTTGGCCGGAAAAGTTGGCTCAACACCTGGCTACTTACG
+GCTGGTTTTCAATGGCTATAAAAAAGCCAGTTTTGTGCTGGCTAAAAAACTTGAGCAATA
+CACATCAGGTGCAATTACGAAATCTGACTTAAGACCGGATATCTATCCGAAAGATTAGCA
+GAACACTTTCAATTTTTAACCACAGAACGATGAGGCTAATCGTGGGTAAGCATCACTGGA
+AAATAGAAAAACAGCCTGAGTGGTACGTGAAAGCTGTCAGAAAAACTATCGCGGCGTTGC
+CGAGTGGTTACGCTGAAGCGGCTGACTGGCTCGATGTAACAGAAAACGCTTTATTCAACC
+GCCTTCGTGCAGATGGCGATCAGATTTTCCCGCTGGGATGGGCAATGGTTTTACAGCGTG
+CTGGTGGCACTCACTTCATTGCTGATGCTGTGGCGCAGTCTGCAAATGGCGTCTTTGTGT
+CTCTTCCTGACGTCGAGGATGTGGACAACGCCGATATTAACCAGCGTCTGCTGGAAGTCA
+TTGAACAGATCGGCAGTTATTCAAAACAGATTCGTTCAGCAATCGAAGACGGTGTAGTGG
+AACCGCATGAGAAGACAGCAATTAACGACGAGCTGTATCTCTCAATTTCGAAGCTGCAGG
+AGCATGCAGCACTTGTCTACAAAATTTTTTGCATTTCAGAAAGTAATGACGCCCGCGAGT
+GTGCAGCTCCGGGCGTCGTGGCGTCGATTGCTTCTGGTTGTGGAGAAACTAACGCATGAA
+CAGTTTAACAACACACTACCGTCGCTCGCAACTGATTGCGCTTCCTGTACCGGGTGGAAA
+AGCGAAGGTGGAATATTGCTATGCAGTGAATGTACCAGGTGACAGGGAAATTGTAACCCA
+CAGCTTTGCAGAGTGGGCTGTGGGTGATTTCAACCGGCAGAAGGAGACAGTCCTTTGCGA
+CAAGTTAACCGCTGGTTCAAAGATCACTACGGAGTGCCCGTCAGAGTCATTCGTTGGGAG
+CCGGAAACACAACGGGTTATCTACCTCCGCGAAGGTTATGAGCATGAATGCTTCAGCCCG
+CTCGAACAGTTTCGTCGTAAATTCAGGGAAATAGAGGTCGGTCATGAGCACTAAATTAAC
+CGGCTATGTATGGGATGGTTGCGCTGCATCAGGCATGAAGTTATCCAGCGTGGCAATTAT
+GGCCCGCCTGGCTGATTTCAGTAATGACGAAGGTGTGTGCTGGCCATCAATTGAAACCAT
+TGCCCGTCAGATTGGCGCGGGGATGAGTACCGTCAGAACGGCTATCGCACGGCTGGAAGC
+AGAAGGCTGGTTAACGCGTAAGGCGCGTCGCCAGGGTGATGGTTCATCACCCCACTGTGC
+CGTGGTGGATGAATATCACGAGCACGCCACAGATGCGCTTTACACCACGATGCTTACCGG
+GATGGGGGCGCGACGCCAGCCACTGATGTGGGCCATTACCACCGCCGGGTACAACATTGA
+GGGGCCGTGCTACGACAAACGGCGGGAAGTCATCGAGATGCTCAACGGCTCGGTGCCAAA
+CGATGAACTGTTCGGGATCATCTATACCGTTGATGAAGGTGACGACTGGACCGACCCGCA
+GGTGCTGGAAAAAGCCAATCCAAATATTGGCGTGTCGGTTTATCGCGAATTTTTGTTAAG
+TCAGCAGCAGCGTGCGAAAAATAACGCCCGTCTGGCAAACGTCTTTAAAACAAAACACCT
+CAATATCTGGGCGTCGGCGCGTTCGGCGTATTTCAACCTGGTGAGCTGGCAGAGCTGCGA
+GGATAAATCACTGACCCTTGAGCAGTTCGAGGGGCAGCCGTGCATTCTGGCCTTTGACCT
+GGCGCGTAAGCTGGATATGAACAGCATGGCGCGACTTTATACCCGCGAGATTGACGGTAA
+AACGCATTACTACAGTGTGGCCCCGCGTTTCTGGGTACCGTATGACACGGTGTACAGCGT
+CGAGAAAAATGAAGATCGCCGGACAGCCGAACGCTTTCAGAAATGGGTGGAAATGGGCGT
+TCTGACCGTTACCGATGGTGCGGAGGTGGATTATCGCTACATCCTCGAAGAGGCCAAAGC
+GGCGAACAAAATCAGCCCGGTCAGTGAGTCACCCATCGACCCCTTCGGGGCGACCGGGCT
+GTCACATGACCTTGCTGATGAAGACCTGAACCCCGTCACCATCATTCAGAACTACACCAA
+CATGTCCGATCCGATGAAAGAGCTGGAAGCGGCGATTGAATCGGGGCGCTTTCATCATGA
+CGGCAATCCCATCATGACCTGGTGTATCGGCAACGTGGTCGGCAAAACCATTCCGGGTAA
+CGATGATGTGGTGAAGCCCGTCAAGGAGCAGGCGGAAAACAAAATCGATGGTGCAGTTGC
+GCTGATTATGGCGGTTGGCAGAGCCATGCTGTACGAGAAAGAAGACACGCTGTCTGATCA
+CATTGAGTCCTACGGGATCCGCTCGCTTTAACTGAGGTAATTATGATCATGCTGATTCTC
+GCGCCTCTGGTGGGCGTGCTGGGTGCGCTTTTGCTGGCGTATGGTGCCTGGCTGATTTAT
+CCCCCGGCGGGTTTTGTTGTTGCCGGGGCGCTGTGCCTGTTCTGGTCGTGGCTGGTGGCG
+CGATATCTCGACCGTACACAGTCGTCTGTCGGCGGAGGTAAATAGTGTTCTTTTCGGGAT
+TATTTCAACGAAAAAGTGACGCACCGGTGACCACGCCAGCAGAGCTGGCGGATGCCATCG
+GGCTGTCGTATGACACCTATACCGGAAAGCAGATCAGCAGTCAGCGGGCTATGCGACTGA
+CGGCGGTTTTTTCCTGCGTCAGAGTGCTGGCAGAGTCGGTCGGGATGTTGCCCTGCAATC
+TGTATCACCTGAACGGCAGCCTGAAGCAGAGAGCCACCGGCGAACGTCTGCATAAACTGA
+TCTCCACGCATCCCAATGGCTATATGACGCCGCAGGAGTTCTGGGAGCTGGTGGTCACCT
+GTCTGTGCCTGAGGGGAAACTTTTACGCCTACAAAGTGAAAGCATTTGGCGAAGTGGCTG
+AACTGCTGCCCGTCGATCCCGGCTGTGTGGTATATGCGCTGGGAAGGTGTCAGCGATGGC
+CTGAAGGTGACCGCCGGGAGTGTTATTCAGCGCGATGACCTGGTGCAGTACACGACAACT
+GACGATGCAACCAGCTCCGGTGGTGTCCTGCGCGTGCCGATCGCCTGCTCAAGTGCAGGT
+GCGGTCGGTAACGCTGACGACGGTACGGCATTAATCCTGGTCACGCCGGTGAATGGTCTG
+CCGTCTTCCGGTGTGGCTGACACCCTGACAGGCGGATTTGATACTGAAGAGCTGGAAACG
+TGGCGCGCCCGCGTCATTGAGCGGTATTACTGGACGCCGCAGGGCGGGGCTGACGGGGAC
+TATGTCGTCTGGGCTAAAGAAGTGCCCGGCATTACCCGCGCATGGACATACCGTCACTTG
+ATGGGAACGGGAACTGTCGGTGTGATGATTGCCAGCAGTGACCTGATTAATCCCATTCCG
+GAAGAATCAACGGAAACGGCGGCAAGACAACATATCGGGCCACTGGCCCCGGTGGCAGGC
+TCTGATTTGTATGTGTTCAGGCCGGTGGCACATACGGTGGATTTTCATATCCGCGTGACG
+CCGGACACACCAGAAATACGGGCTGCCATTACCGCGGAGTTGCGTTCGTTCCTGCTGCGT
+GATGGTTATCCGCAGGGAGAACTCAAGGTATCGCGTATCAGTGAGGCGATTTCCGGTGCG
+AACGGGGAATACAGCCATCAGTTGCTTGCACCGGTGGACAATATCTCCATTGCGAAAAAC
+GAACTGGCGGTACTGGGGACGATTTCATGGACGTGACAAACGATGATTACATCCGCCTGT
+TATCGGCACTGTTGCCGCCCGGTCCGGTGTGGTCAGCCAGCGATCCGGCGATTGCCGGTG
+CGGCACCGTCATTAACCCGTGTTCATCAGCGTGCGGATGCCCTGATGCGGGAGCTGGATC
+CGCGCACCACCACTGAACTGATAAACCGCTGGGAGCGTCTGTGCGGTCTGCCGGATGAAT
+GTATTCCGGCGGGAACGCAGACCCTTCGCCAGCGTCAGCAACGGCTGGATGCGAAGGTTA
+ACCTGGCGGGCGGCATCAACGAGGATTTTTATCTTGCACAGCTTGCTGCCCTGGGCAGAC
+CAGATGCCACCATCACGCGATACGACAAAAGCACTTTCACCTGCTCATCGGCCTGTACTG
+ACGCGGTGAATGCGCCGGAATGGCGGTATTACTGGCAGGTCAACATGCCAGCCACCACCA
+ACTCCACCTGGATGACATGTGGCGATCCCTGTGATTCCGCACTGCGTATCTGGGGTGACA
+CCGTTGTCGAGTGTGTGCTTAACAAACTCTGCCCGTCGCATACCTACGTAATTTTTAAAT
+ATCCGGAGTAATCCATGCATCGTATAGACACGAAAACCGCGCAGAAGGATAAGTTCGGCG
+CGGGTAAGAACGGTTTTACCCGTGGTAACCCCCAGACCGGCACGCCTGCCACCGATCTGG
+ATGATGACTACTTTGACATGTTGCAGGAGGAACTTTGCAGCGTGGTGGAGGCATCCGGTG
+CCAGCCTGGAGAAGGGGCGGCACGACCAGTTACTTACCGCACTTCGCGCGCTGCTGTTAA
+GCCGCAAGAATCCGTTTGGCGATATCAAATCGGATGGCACTGTGCAAACGGCTCTCGAAA
+ACCTTGGTTTGGGAGAAGGAGCAAAACTCAATGCAGCAACGGCTACATTAGGACGCACCG
+GTTTCATAGCTATACCGGTTATGATTGGTGGTATTGAGCAATCAGTAATCATTCAGTGGG
+GGTGGAATGCCGCAAAAGCATCTGCCTCTGGGGGGGATGGAAATACAGTTGTATTCCCGG
+TTGCGTTTAATAATGCCTGTGTTGCCGTTGTTGCAAATTATGACAATGTCAGCGCACCTA
+TCAATGCAGTGGCAACGGGGGGATATACAACCACTTCGTTTTTATTACGGTGCGCAGCTC
+AAACGGGTAGTTATTACTATAACTGGATTGCTATTGGGTATTAAGATGAAAATATACTGT
+TGCTTAAATACCGTTGGTTTTTTTATGGATGGCTGTGGCGTCATTCCGCCAGATTCTAAA
+GAAATAACGGCAGAACACTGGCAGTCATTATTAAAATCTCAAGCTGAAGGAGGCGTGATC
+GATTTTTCTGTTTTTCCTCCTTCTATTAAAGAGGTTATCCGTACTCATGATGATGAAGTC
+GCAGATGCGAACTTTCAAAAGCAGATGCTTATCTCTGATGCAACTGATTTTATCAATAGC
+AGACAGTGGCAGGGTAAGGCTGCATTGGGAAGACTTAAAGAAGATGAGCTGAAACAATAT
+AATTTGTGGCTGGATTATCTGGAAGCACTGGAACTGGTTGATACATCCAGTGCGCCAGAT
+ATTGAATGGCCTACGCCTCCGGCAGTTCAGGCCAGATGACATCCGGCGCGGTGCTGGTAT
+CTGTTGCCGTCACCGCGTCAATGTAATCCAGCACAGCGTTAAGTCTGGTTGTTTCTGCCT
+GCGTCAGTTTACGTCCGGCCTGCAATTTCAGTTGAATCAGACTAATGGAAGCCATTGCAG
+CATCAATCAGTGACTGGCGCTGTGCTTCTGCCGCGTCTACTGCGGCGCTATGCTGTGCTT
+CAGTATCGGTCACCCATTTCTCACCATCCCATTTATCGTATGGAGATAAAGGGGCGATAG
+TGGTTGTATTTTCAGGGTAATCACCCGGAGCTTTGATTTCTTTTGATTCTCCAGTTTTGG
+TGCTATAGACCGTTTCACCGCGATGGTCTGGCACATATTCCCATGAGTTAAAATCTGCAG
+AACGGCAGATTGCATAACCAGCCTTATGTGTACCAGGGGCATCTAAACAGGAACATGCCG
+GAATGCCGACACCAACGGCAAGATATTCATTTGAAGTGGAAATATATTCCCGTGTTTCAC
+CATCGTAGTTATAAACGGTAACATCCCCTGCCTTTGTTGCAATAAGGTCACTATTTAATA
+TTGCTTTATGCATCAGGCTGCCCTCACGATATAGTTAAATGCAATATTACGCGGACGCGT
+TTCTGAGGCTGCGGCACCTAAACCATCCACTGATTGTTTATATGTTTTAAAGGTTCCATA
+ATCCGGGGCTGGTAATCCGGCATCGTTTGTGTTTCCTCTTTTGATAATGTCAGTGCCACT
+ATTTACCCATATTTCATCAAAATAGAAATTAATCGTTGCATCAGTCACAATCGTGGATCT
+TGACGGTAATCCATGAGCATGATCCTCCGTTGCATACCCCTGAATACTTAAAATAGAGCG
+ACCTGTATCAATCCCCCGCCCGTCATCCCAGCCACGAATAAACTCACCACGTAAATCAGG
+CAATTTATTTGTCGGATAAGCCTTTGCCAGTTCCGGGTATTCTTCAGCAGAAAAAGCGGC
+ACCATTGCATTTCAGCCAGCCTGTTGGCGGAGTGGCTGAAGGCCACGGAACCGGGACACC
+AACAGGTAATGCAGAGCCTTCTCCCAAACCAACGTTTATGAAAATGAAGAAATAACAAGC
+AAATGGCATCATTCCTGCTTTTACCAGGGGGATTTAACATGCTTATTGGCTATGTACGCG
+TATCAACAAATGACCAGAACACAGATCTACAACGTAATGCGCTGAACTGTGCAGGATGCG
+AGCTGATTTTTGAAGACAAGATAAGCGGCACAAAGTCCGAAAGGCCGGGACTGAAAAAAC
+TGCTCAGGACATTATCGGCAGGTGACACTCTGGTTGTCTGGAAGCTGGATCGGCTGGGGC
+GTAGTATGCGGCATCTTGTCGTGCTGGTGGAGGAGTTGCGCGAACGAGGCATCAACTTTC
+GTAGTCTGACGGATTCAATTGATACCAGCACACCAATGGGACGCTTTTTCTTTCATGTGA
+TGGGTGCCCTGGCTGAAATGGAGCGTGAACTGATTGTTGAACGAACAAAAGCTGGACTGG
+AAACTGCTCGTGCACAGGGACGAATTGGTGGACGTCGTCCCAAACTTACACCAGAACAAT
+GGGCACAAGCTGGACGATTAATTGCAGCAGGAACTCCTCGCCAGAAGGTGGCGATTATCT
+ATGATGTTGGTGTGTCAACTTTGTATAAGAGGTTTCCTGCAGGGGATAAATAAAGTTAAA
+GACACTTTGTGTACAAAAGAAAGTAAAACAACAGCAACTTGTTGCAATTTTATCAATAAA
+AGTAGTATTGTCGTGAAAAATTGATTAAAGATTAATATTATGCATGTTTTTGATAATAAT
+GGAATTGAACTGAAAGCTGAGTGTTCGATAGGTGAAGAGGATGGTGTTTATGGTCTAATC
+CTTGAGTCGTGGGGGCCGGGTGACAGAAACAAAGATTACAATATCGCTCTTGATTATATC
+ATTGAACGGTTGGTTGATTCTGGTGTATCCCAAGTCGTAGTATATCTGGCGTCATCATCA
+GTCAGAAAACATATGCATTCTTTGGATGAAAGAAAAATCCATCCTGGTGAATATTTTACT
+TTGATTGGTAATAGCCCCCGCGATATACGCTTGAAGATGTGTGGTTATCAGGCTTATTTT
+AGTCGTACGGGGAGAAAGGAAATTCCTTCCGGCAATAGAACGAAACGAATATTGATAAAT
+GTTCCAGGTATTTATAGTGACAGTTTTTGGGCGTCTATAATACGTGGAGAACTATCAGAG
+CTTTCACAGCCTACAGATGATGAATCGCTTCTGAATATGAGGGTTAGTAAATTAATTAAG
+AAAACGTTGAGTCAACCCGAGGGCTCCAGGAAACCAGTTGAGGTAGAAAGACTACAAAAA
+GTTTATGTCCGAGACCCGATGGTAAAAGCTTGGATTTTACAGCAAAGTAAAGGTATATGT
+GAAAACTGTGGTAAAAATGCTCCGTTTTATTTAAATGATGGAAACCCATATTTGGAAGTA
+CATCATGTAATTCCCCTGTCTTCAGGTGGTGCTGATACAACAGATAACTGTGTTGCCCTT
+TGTCCGAATTGCCATAGAGAATTGCACTATAGTAAAAATGCAAAAGAACTAATCGAGATG
+CTTTACGTTAATATAAACCGATTACAGAAATAAAATTATTTATTAAAGTCACATTTAAGA
+CGTAATACCCTACAGGGTAAAAATTTTCTCTGATCTTAACTTCTGCAAATGTTAACTGCT
+ATTTTTATGCTAAAAATGGTTATCAAAACTCAAAAACACATGTTTATAATCAATGAGTTA
+TAGAAATGCTAAGGGCTAATGAGTTATATGCAAATTAGTAAAATTATGTTGCTATGTCAG
+ATAGTTACGATTTAGTCATCTAACTAATGCTGCGCCATATGGGTTGGACTGAAGCGGCTG
+ACCTGATTGTTAAAGGTATGGAAGGCGCAATCAATGCCAAGACCGTAACTTATGACTTCG
+AACGTCTGATGGAAGGCGCTAAGCTGCTGAAATGTTCAGAGTTTGGTGAAGCGATCATCG
+AAAACATGTAATCTCTCCATGTGTTAAATATTGAAACGGGCGTATAACACGCCCGTTGTT
+TTATTTATGTGGATATTATTAATAGCATATCGAGCATATTTATATGAAGCCCATTACTTG
+AGCCCATATGGGCATATTTTTATAATGCAACTATTATGTAAACATTTATTTGTTATTTTG
+CTTTCTCCTGGAGGACACTCTTGACTGCTTTTGAGTAAACTCCATAAATCCTTGTTGAAT
+GGTGCGATGTGATAAATAGTAATAGGATATTCTTTATCCTTAAGGATAATACCAGACTTA
+ACCGGTGTAAATATACTGCCAGGAGGGAGAAATATAGTAGATTGATACCAGATGATCATT
+TTCATATTACCCCATATGGCTGAAAAAGATATACCACATGTAGGTTGAATTACCGTGTCA
+ATTACTATCCACTTCATTTGTTATGTCTTATCCCACGGTATTTAATATGGTTCATTAGGA
+TGTTTATTTCTTGATTTTGCATATGAGTATATTACCCCCCCCTCAAAAAAATAAATTAAT
+TAAAATGATGGCTTATATAAAATAAAATTTAAAGCAAGGAATCTCAATGGATGTTAAACA
+AAATGAGATTTTGTGAAAGCAATAAATTATTGACTTCGTTTTAGATTTGTTTAGCTATAA
+TGTTATACATTCAAATGACTGAACATCCTGTAATTAAAACATAGCCTTTATGCTACTTTG
+TGCCAATTTGCTAAACATTATGGTTGCCTTTTTATATAACGATAATAATGAATATAAGCA
+TGACATGAGAATAAGGTTTCAATTTTTGAGTTATATAGGAATGATTTAACCTGTTCCTGG
+CTAAAATACATATAACCGGATGATGACTAAACCAAAATACATGTGCGTTAAGTATTGAAA
+CGGACGTGTGGCACGGCCGTTGTTTTTATAAATATGTTAACCGTTATAAAATAACGTATC
+AAAAGTCAAGTGATCACATTTCAAATATCAAGTTGATAGTATTAGTCTGGTGATTATTTA
+TGGGTGACAATAAAAAGACAGTATTAATCATCCATAGAGATAGTCTCTGCACTTTTATTT
+CCATTATGCTAATGCCTTACTGAATTATGAAGCATTTCTTAAGTATCCAACTTTAGCTAG
+ATTAATGGTTTATTATTTTCTACATCTTCAATATATAAAAGCGTATTATCAATGGCGTAG
+TAACTGCGTTTGTTATGATTAACATCAGTAACCCACCGGAAAACGCCCGCGCCTGCCAGT
+GTTGAACAGTATTCCCGAAATGTAGATTTTCCGCAAATATGAAGCAATGCGGCCTCTTTT
+ATTTTAGCAGGGTTCTTGGTCGTACTAACTTTTAACAGGTTCCTGGTTCCTCTTAATAAC
+AAAACCGTATCATCGTGAGTAATAATTCTGATGTTATCCGTAGCCAGATAATAAATGTAA
+TGTGCAATACGGTGATGTTTTAATTCTGAATAAAACCAGGAGAAGTTTTGCTCTTTTCTC
+ACTTGCTCAAACATCTTTTGAAAAACAACGACCTGATCCAT
+>NC_000913.3|provirus_1412000_1434224
+CTACGATAACCGCGCATTCAACATGGCTATCTGTTCGTCGTTCATGTCATCAATCCACAT
+ACCGTAAATTTCATACACCATCTGCGCAGTTTCATGCCCCATTTGGCTGGCTATAAATGC
+CGGGTTCGCTCCTGCCGTCAACAGCCAGCAGGCAAAAGTATGCCGCGTATGGTACGGATT
+ACGGCGGCGAATACCAGCACGTTTTACTGCTGCATTCCACCTTGCCCCCAAACTGCTTAC
+CGAGTAATAAGGTTTTTGTTTTCCGTTACACACCCTGGGCATGAAAACAAAATGCAGTTT
+TTGCTTTTCGGTTCTGCCGTACTCCCGATGATAAAAGGTGATTTCGCTTTTGCGATGATG
+CCCGGTCAGTTTGTATTGCTCCTTCAGTGCTTCAAGAGCAGGCTGCAGTAGTGTTACTGT
+TCGGATCCCGGCATTTGTTTTTGGGGGACCGAACATATCAAGTATCGTCAGGTTTCTTCT
+GACATTCACTATTCCCTTTTCGAGATCCACATCCTCCCACGCCAGAGCTGCCAGTTCCCC
+GTGACGAAGTCCTGAGTAAACGGCAAATTTCCACAAGTTCTGGCTCTGTCCTTTTTCACT
+TTCCATTAATGCATTGAATTCTGTTTTAGATAACGGATCAGGCTTTATTCTGTTTCGCTG
+TAATTTTTTTACTCCTTCAAATGGTTTGGTTGATATAAATCCCGACTGATACGCAAAACG
+CAACAGCGAACAGAGCAGGGCGATATAGTTATCAACTGTGCGCACGGTTCTTCCTTTTTT
+GTTGGATCTTGGATTATCCAGGTAAAGCGTTTCTCCATGCAGCAGTTCATTCCGGTAGTT
+TAAGATATCGCTATAACGAATATGTGATATCGGGGTACTTTCACAAATTATTATTCTGAG
+TGTTTTTAATTGTGATTTCGTTTTCTTCATTGTGTTTGTTGTTAACTCTGTCTCTTTAAT
+TTTTGTCCAGATATCACAAAGCTCTCCGAACGTTTTTATGACTCTCGTTGTCACCATTTT
+TGCCCCAGTGCTGGACTGGGGAAAACGTCTTAAATACTCAAATTCACCGGAGTTTATTTC
+ATGAACTATCAGCGCTCTTAAATTTCCGGCCTTTTTAATATTACTGTTTGTAATCTCCCA
+GCCTTTTAATGTTTCCCGACATCGTTTTCCTCGAAACATGAACCAGATGCGAATGTATCT
+ACCTCTAATCTCGACACCTGTTGGTAATTTAGACATATCATGAGTCTTTGATAAACTGAT
+TTATCTTTGGATAGTTGTACCAGATAATCCCTCGTTTGCTGTCTGGCTTACCTAAAGGAG
+ATACTCGTTTGAAGTGGAAGCCCTCCACCCAACAGTTCTGGCGGTATGCTTCAATTTGTC
+TGGCCCCCAGACCAGTGCGAAGCATCAGGCCGTATTCAACCATCCACTCTTCATTAAAGA
+TTACTTGTGCCATCGCATCACCTCTGGCAGGCGCCAATGTTAGACTGAAATTGACGCCCG
+ATGTTGATTATTAATAATCAGCTATGAAGTTTTAATTTGAATACAATGCAATTCTCGAGG
+ACTGAAGTTTCTCGCAATTAAAATTTATCAGTTTTACTTTCTGCTCTCTGGAAACGCCTG
+CTTCTTTTTTACCTGAGAGCATTTTTTCGCATTCTGATTTCGTTAGTTTAGATTTTGAAT
+ATCTTGTCCAGTTAGTAGGAGTGCCACCTTCCTTTTCAATAGTGGCGGTAATTTTATACA
+TGAACACCTCCATTATTATTTCCAGTGGTTCGTTTATTCCATCTTTCGAGTGCTTCTTTT
+TCACTTCCACCATAACCGGTTCGGGATTCGCATCCGTTACACTTCGCTCGGTAATATCCT
+GAAATGGCTTTCACCGTTACTGATGGACAACCACAAAATGGACATGGTTTAACATTGTCA
+TATCTCATAATTTTTCTCATAAAAAATATTTCAAGTTGGCGGTGCATTACACCGCCAGGC
+TGAATTATTCCTCTGAATTATCGATTACACTGTATTCCCCGGTTAATACAGAGGAATCTG
+CAGGATCGATTGTCAGTGGTTCCTTTTCATCCATTGATACTGCACGCTGGATCTCAATTG
+ATACGGGCAAATATTTGAACAGGCGACGAATAGCCGTTTTCTTTGCCATTTCTTCCCAGT
+GAGTTACCCACGGCCCGTTATTACCAGCTTTACTCAGGCTGCGCACCAGCTCAATCTGTT
+TGCGCGTCATAACTTCAAACTGAGTACCTCCGTCTTTCAGTCTTGCGACAGCATAGACGT
+GGGTAACCGGGGCATCTTCGTTTTCTCCCGGGCGGTGTATTAACTTTTCATCAAGGCCAA
+ATTCGAAGCTAAACTCGTCACCTTCACGGACAACACGGGCTGACAGGCTGGCGATTTGAC
+CAGAACGGCGAGCCAGATCAATCATGCCGCGATAGCCAATGATTAGCTGAACGTTCTTTT
+TACCGCTCTTTTCGTTTTTATTACCAAAAGGCAGTAAATATGCATGACCGAGGGCGCTAC
+CTGGCTCAAGTCCGAGCTGTGAACACTGTACGATCGCACTGACAAAACTCATAGTGTCAC
+AGTTTCCTAACGCCGGAACTTTACGAATTTCTGTGGTGGCGATACGGATCATACGTTCAG
+CCGTCATATGGCGTGGAAGAGCTGCTGCCAGTTGCTCTTTCATTGATGGCTGGTTAATAA
+AACTAATCACGTCGCTATTTTTAACTGCTGCTGGTGCACGGTTTCCCTGAGTTTTTTGCA
+GATCGGCTTTTGCGATTGGTGGTTGCTTAGTCATTTGCATATTCCTTAGCCCAGCGGGGC
+AGTGATAATGTCTTAATAGCTGGCCATTCATCGGTATTCAGGCAGTCAGACAGGGTTCGC
+AGATTGCGGTGATATTCCTGTTGACCTGCCAGTTTTGCTTCTTCGCCCATCATGAAAATT
+TCAACCGGATAACGTCCGCATTCAATAGTTGTGCTGGCAACCAGAAAAACGAAAGTTGGC
+TGCACTCCAAACTGTGCTTCATAACCGTCACTGTAGAATGCATCCTGAACGTGATAGCGG
+TAGTCGTAATAAGCGGTTTTGAATCGTTGAATATCCGCCGTAGTTTTCACGTCCATGATC
+CAGTGAAATTCAGGGATAATTTTGTCCGGACGGCACCGACACAAAATTCCTGTTTCAGGA
+TCTTCCCAGTAAATTGATGATTCAGCGTGTCCGGCGCTTTCAACAAGCCATTGCCCCAGC
+GGCAAAGCCATAACGCTTTGATACATGAGTTCAATTTTCCGGCCTTCTTCCGCAGTGATA
+ACCGTTTTTCCTGTGCTTGCGCATTCCATCAGAAACGCTTTCTCTTCTTCTTTTCCGGCG
+TTTGTACGGCGGTTAAATTCAGGTGCTACGATAAAGCGGTTACTGAATTCTTCCGGTTCA
+AGTACCCGGCAGTGGAAAGCAGTTCCTAAATCGAGCGTTTTTGTCTTTGTGGTGTCCACG
+GGGGCATTTTTACGCCACAAATATAGTGCCGGAGTATCAGCAATGTCATCGAGCTGAGAC
+TTACTGATACCGGGACCCGCGTGGTAATTCTCATTCGAAATTCCGTAATAAATACCTGGC
+TCTATGTCTTCTACGATTACGGGATCTGCGACTTCGCCAGTTTCATCACTGCAATCGCGA
+TGCGGATCGCTGCCAGCATTCTCATTGTGCGGATGTTCAGCGCCTTCCATTTCCTCCGGA
+TCATTTTCCTTAGCTTCAACCTGACTCTCTTCATCGAATGTTTCCTGGTATGTTGCGTCG
+CCCATCACCGCACCACAGTCAGGGCAGTTATCCCCGCCAGTCTGGCCGCAGGCATTGCAG
+GCTATTTCCGGTTCCTGTTGCACTACTGGCTCAGGTTGATTCATATCTGGGCTGGTTTTT
+TCCGTTTCTGGCTGGTTCTGGTACACACAATCGCGAGTCTGGATCCCCTTTACCCATTTC
+GGATCGTTCGGGTCGCTAATTCCGTCAACAAATTCACCACGTGATGCAGCAAGCAATTTA
+TCGTCATCGACAGGATTTTTTGATGGAATGTTTTTCCGGGCTTCATGGAGTTCTGCCCGC
+AGTTCCTGATATTTCGCATCAACAGAATTTACCTGTGACTGAGCATCCAGCGGCTGCGTG
+TCCTGATGATGTTCAGTTGCGTCCGGTTCCATTGTTTCAGCCTCTCCCTGTTCAACTGCC
+GTTGTTCCAGATGGTTGCGGTTTTTCTTCATCATCCTGTTTTCCTTCTTCTGTTACTCGC
+TGCGGCATCGGGGCAGAGGAGCGACCGCAGGCAATATCCACGATTTCCGGATCAGGGTTG
+GCATGATCGGTTTCAGTCAGTACTTTGTTCAGATATTCAGTGACGTGCGCGGGGATGACC
+TCGATCCCAATTGGTGCTTCTTTTACGGACGCAACCACGATGGCGCGGGAATAATCCAGC
+CCGCCAGGCATGGTGATGAATTTGTCGCGGAAAACAGAAAAGGGCGGTTTATTTTCAGCG
+ATAATTTCCTCAATGCGTTTAGCGTGTGCCGGATGAAGGTTATAGATGTCCAGATCCATT
+GAACGGGCCAGTACGCCAGTGGCTACGTCGCGCGCCAGTGACGTCAGATCGTGTACGAAA
+CCTTCGCCGCGATCGGTGAGGTTTCCGCCGCCAGCATTAGCACCGGAAGCCGTGCGAGTG
+ATGTGTGAAACACGATTACCCTTCATCCACTCTTTTGTCAGCAGTCCTCGATCGGTGTAG
+TCAGCGTTCAGGTATGCTTCGAAAAAAGCAGTTATCAGTCCCAGGTTTGAATTACCAGGA
+TTAGGGAAAACTTTGTCAGTGTCACGAACCAGTTTGTGGAGTTCGCGAATTTCCAGCGGG
+TCGAGCAGGCTGGTTTTGTGGGAAACAGCCAGGGCAGTAACAGCCGGTAGTTCTTCAGCC
+CGAGCAATGTGTAATGCCTGGAGTCCGTCGCGTGAAACGTGCGTTACCGGTTTTTCGCTG
+CCGTGTTGAGCAAGCCAACGAATGGGCAGTTCCTGGCCAGAAATTGGGAGTAGCATATTC
+TCCTCAATCTCAGTCATGTCTTCGCCGTTGACGTTGGTATTGCCTTGATAGTGAGCGTTG
+TCTGGTGCTGCTCCCGGTTTTAGTTCCCATGTCATGGAGTCTTTGCTGAGTTGATAGCGT
+TCACTCCAGGTAAAATCGATCTCACCTTCAGCGGGCAGGTCATTAACGACAGGAAAATTC
+GTGGCAACAGCTTTAAAATAGCTGCTCAGTTTTTTACCTGACTTAACGATCAGGTAGTCC
+AGAGTGGCACAGGTCGATTCAAAATCGTTGCTTGCCCACAGGACGACGTCAGGTTCACCG
+GATGATTTTTTCGCTTTCCGTAACAGGAAGAGTGGTTTTGTGCTCATTGTTTTTTAACCT
+CAACTCAGATTAAAATTCGTTTTGTTCAGTGAATGATCTTGCCGGATACACACTGTTCAT
+AGCCTGCGCCATACGCAGGCTATTTCTTTCAGATTTCACCTTTTAATTTCATTGCAATTA
+GAGTTGCCAGAAATTCGGCTTTTTTTTCTGCGGGCAGATTCTTTCCGATATGCACCAGGC
+ACATTTTTTTGACACCTTCATCAAGTGTTTTTACGTTGCCTGATGGACCATCGATATCAA
+CCACAGTGAATGGGGTTTCTTTATTTTCTGTTTTAATTACGTAGCCAATGCGCTTTCCTT
+CCAGATTCACCTCGTGAACAATGTCATCGGTAGTTACAACAGTGGCTTCATAATTGGTAA
+TCATGTTTTTCTCCTTAATTAAGGTTGAGCGAATACCTGCCATTTCTGGCATAAATTCAG
+TTTCGAATAGTCAATTAATTAAAGTTCATGTGCCATCTGGTCTTTTTCGGCACAAGCTTC
+ACTGCAATATTTTCTCGGTTCGTCTTTTGATAAAATCCCGTGCATGAAGTGAAGCATTCT
+TTCAATAGCTTTGCTTTCTTCAACGTCTTTTTTGCAAAGGTGGTAAGCACATTTTATTTT
+CTTAGTCATCACCATGACTCCGCCTTTACAGGTAAACCATCACGACCGAGGAAGACTTTA
+ATCATGCGGTCAGTAATGAATGTTTTTGTGGTCAGGTTACGAATATATAGTTTTCGCTTT
+TTAATATTGTTTGCCGAGGCAATATATGTCCGGCCTTCATGAAGAACATAATCGCCAGGA
+GTCACACACTGACGTGGTATTTCATCAGTTCCGAAGTGATGTGCAATCATAATTATCTCC
+ATTTTTACAAATGAACTTTGTTGATGCGGTGTCTGGTGCCTCCAGGTGACTGCAACCAGT
+TAACAATTACAGTCGGCTTTCCCACCCAAACCAATAAGGACTAACATGACTTTTAACTGT
+GCCACGTGCGCTTAGCCGCATTCACCGCATCACAAAATTCACTTTAAAAAGGGCGGACAT
+CAGCCGAACTTCAAGAAAAAAACTGATGCCGCCAGGACTACACACAGCAATGTCGTTATT
+TACAACCGGAGGCGCACTCCCACCATTTAAATTTAACAGACAAGACCGACTCTTTATGGA
+TATCGGAAATGCGCCTTCGTGTTGTGCCCGGTTTTATTTCACCACCTCCGGGCTTCGGTG
+GTCTCGGCTATACCCCTACAGCGAGAGCTTGTGTTAACATTTCAATACCCTTACAGTTGA
+GAGTTATTGATATGTTGGATGTATTTACTCCATTGTTGAAACTTTTTGCTAACGAGCCAC
+TCGAAAGACTTATGTATACGATTATCATTTTTGGTCTCACTCTCTGGCTGATACCGAAAG
+AGTTTACTGTCGCATTCAATGCTTATACTGAAATACCTTGGCTCTTTCAGATTATCGTTT
+TTGCCTTTTCTTTCGTGGTCGCCATTTCCTTCTCAAGATTGCGAGCACATATTCAAAAGC
+ATTATTCATTACTACCAGAGCAACGAGTATTGCTTCGTTTATCTGAGAAAGAAATCGCTG
+TATTTAAAGATTTCCTTAAAACAGGAAATCTTATTATCACTTCTCCTTGCCGTAACCCGG
+TTATGAAAAAATTAGAACGGAAGGGCATCATTCAACATCAGAGTGATAGCGCAAACTGTT
+CTTATTATCTCGTCACCGAAAAATACTCCCATTTTATGAAGTTATTCTGGAACAGCAGGA
+GTAGACGTTTTAATCGTTAGCTTACTGTGTGCTTCTCCAACCATCGGCGCGCACCAGTTT
+CGGTTTTAAATGTTTTGCTTTTGGTATACGTCATGGCAGTGAACGTTCCATCCTGGTTGG
+GGAACACGCCGCACACCAGGGATTCGTTGTTGCCGAGGTCGATTTTTTGCATTTTGCGAA
+TCTCACATCTTGTTGCTACGTATAGCGACTTCTGCCTGCCAGAGATCCCAGTCGTTGCTG
+CGTAAAGCCTGCACAGCCTGGTTGTAAGTGATACCGCAACAATCCATCAAATACTGAACT
+ACTTCGTAATGCACCATCTTATCTCTCCCCTTAACGCCGGGTGGCGGAACTAACTGCTGC
+ACTGCAAAATTTGAATCCCGCCGTCATGTTCATACGCCTCGGGCTGGCTACTTAACCCCT
+TACCACTGCCTGGTAACTCGAAGTATTGCCCGGCGTTCTGTGGGGCGGGGTGGGTGGTAT
+GCTGGAACTATAGGTAATGCCTAATTGATTGTCAATAGGCTATGCCTAATGTTTTGAGCG
+TAACCTAATAGGTGATGGCGACAGCAGAAAGTGATGGGGGGGTTAAATAACGGAATCCAG
+GAGTTTTCCGTCAGACCATATAAGTTTAAGTTCCAGTTTTTGTGATGTTCTGGCTTTTCC
+GTTCAGATTCAAGAGCTTTCAGATACTTACCCACTTTCATTTCCATCGCTGCTATGTAGG
+CGCGAACATCGTGGTCAACCCAATCTGGTTCTGTAGCATTTCCAGATAACAGGAAAGCTA
+CAATCGCTCTTATTTCATCAGAGGCTGCTTGATAAAGGTTGTTTATATCTAAAAGTTCAC
+TTTTTGTATCTGAATTGGTGGGGGTTGGTATGGGGTATTCGTTAAGCCCCCAATGCTCTG
+GACCAACAACATCAGAAAAGAAACGCCATAATTCTGGAAGTTTATCTTTACTTATAGAGC
+CTTTCTTAATCCAGTCATAAATTGATGGTGGTTGGACTTTAAAGTGGCGTGCGACCTCCG
+CCTTTGATTTGACGGATCCCGATGCGATTTTTTTGTTAATGGCCTGCTCTATCGCTCGGC
+CTAAGTCTTTACCACTAAGCATTGCTTAATATTCTCCTATGCGCATTACATTAGGCAATC
+CCTACCCTTACTGCATTAGGCACAGCCTATTGACAATTGCGTTAGGCGTCGCCTAATATT
+TCTGTGTGTTTTTGGAGTTCATTCGATGAAAAAAGAGAACTATTCATTCAAGCAAGCTTG
+TGCTGTTGTCGGTGGGCAATCAGCAATGGCTAGGCTTTTAGGTGTATCACCTCCAAGCGT
+AAATCAATGGATCAAAGGGGTACGTCAATTGCCTGCCGAGAGATGTCCAGCAATTGAACG
+TGCAACAAGAGGTGAGGTTCTGTGCGAAGAACTTCGTCCTGATATTGACTGGTCATATTT
+ACGACGTTCGGCATGTTGTTCGCAGAATATGTCAGTGAAGCAACTAAATGACAGTAACAA
+ATCCTCATTTGATCATACCTGAAACATCAAGAGGCAAATGATTCATGAAAATCAAGCATG
+AGCACATCGAATCAGTGTTGTTTGCCCTAGCAGCCGAAAAAGGGCAGGCATGGGTAGCCA
+ATGCAATTACTGAAGAATATCTGCGCCAGGGGGGCGGCGAATTGCCCCTGGTTCCAGGCA
+AGGACTGGAACAATCAGCAGAATATCTATCACCGTTGGTTGAAAGGTGAAACGAAAACGC
+AAAGAGAAAAAATTCAGAAGCTGATCCCAGCAATTCTGGCAATCCTTCCGCGCGAGCTGC
+GTCACCGACTCTGCATCTTCGATACCCTGGAACGCCGTGCATTACTGGCGGCGCAGGAAG
+CGTTAAGTACGGCAATTGATGCGCATGATGATGCAGTCCAAGCCGTTTACCGGAAAGCGC
+ATTTCAGCGGCGGCGGTTCTTCCGACGATTCTGTCATTGTTCATTAAGCAAAAGTTTCCA
+TGCTGTTTGTGCTTATTCTAAGCCACCGGGCAGCATCATACGGGGCAATTATGGCCGCAT
+TACCATACATGCAACTGTACATAGCTGATTACCTGGCTGACACCATGCATTTGTCAGCAG
+AGGAGCATGGTGCGTATTTGTTGCTGATGTTCAATTACTGGCAAACAGGAAAGCCAATAC
+CTAAAAACAGGCTGGCAAAAATTGCCCGTCTGACTAACGAGCGATGGGCTGATGTTGAAC
+CATCCTTGCAGGAGTTTTTTTGCGATAACGGCGAGGAATGGGTGCATCTTCGGATTGAGG
+AAGATCTGGCATCAGTCAGGGAAAAATTAACCAAAAAATCAGCCGCAGGAAAAGCATCTG
+TTCAGGCCAGAAGAAGCAGAAAGGAAGCAGATGTTCAAACAAAACAAGAGAGAAATTTAA
+CAGGTGTTCAAACAGATGTTGAAGTGGTGTTTGAACATGATGTCAACACAAAGGCAACTA
+ATAAAGATACAGATAAAGATCTAAAAACAGATCCCCCCCTAAATCCCCCCCGGGGGAATC
+GAGGTGTCAAAAAGTTTGACCCTCTGGATATTACTTTGCCGAACTGGATTTCTGTCTCGC
+TTTGGCGTGAGTGGGTTGAATTTCGCCAGGCATTGCGAAAACCGATTCGAACGGAGCAGG
+GCGCTAACGGGGCGATACGGGAGCTGGAAAAATTCCGCCAGCAGGGTTTTTCACCTGAGC
+AGGTGATTCGACACAGCATCGCCAATGAATACCAGGGCTTGTTCGCGCCGAAAGGTGTTC
+GACCTGAGACGTTACTCCGACAGGTTAACACCGTCTCGTTACCGGATAGTGCGATCCCGC
+CAGGCTTCAGGGGGTAACTGACCATGAAAAATATTGCGACAGGCGATGTTCTTGAACGTA
+TCCGCAGACTGGCCCCGTCACATGTAACCGCGCCATTCAAGACGGTAGCGGAGTGGCGCG
+AGTGGCAACTTTCCGAAGGCCAGAAACGTTGTGAGGAGATCAACCGTCAGAATCGTCAGT
+TGCGGGTGGAAAAAATTCTGAATCGCTCTGGCATCCAGCCATTGCACCGCAAATGCTCGT
+TTTCGAATTACCAGGTGCAGAACGAAGGGCAGCGATACGCGTTGAGTCAGGCGAAATCCA
+TCGCTGATGAACTGATGACCGGGTGTACAAATTTTGCGTTCAGCGGAAAACCTGGTACCG
+GGAAGAACCACTTAGCGGCAGCTATCGGGAATCGCCTGCTGAAAGACGGTCAGACAGTGA
+TTGTGGTTACCGTGGCTGATGTTATGAGTGCCCTGCACGCCAGCTATGACGATGGGCAGT
+CAGGCGAAAAATTTTTGCGGGAACTGTGCGAAGTGGATCTGCTGGTTCTTGATGAAATTG
+GCATTCAGCGCGAGACGAAAAACGAGCAGGTGGTACTGCACCAGATTGTTGATCGCCGGA
+CAGCGTCGATGCGCAGCGTGGGGATGCTGACAAACCTGAACTATGAGGCCATGAAAACAT
+TGCTCGGCGAGCGGATTATGGATCGCATGACCATGAACGGCGGGCGATGGGTGAATTTTA
+ACTGGGAGAGCTGGCGTCCGAATGTCGTCCAGCCAGGAATTGCGAAGTAATTTTTACCGG
+GAGAAAAATTTAATGGAGACTGTTTTTGACGCACTGAAAGCAATGGGAAAAGCCACATCC
+ATAGAACTTGCTGCGCGACTTGATATCAGTCGTGAAGAAGTGCTGAACGAACTATGGGAA
+CTGAAAAAGGCTGGTTTTGTTGATAAAAGCGCGTACACCTGGCGTGTGGCTGATAACAAT
+GTTCAGCAGGAACAGCCAGCGCAGGCAGAACTGCCGGAAGAAATCACCACAGCAACAGTA
+GCGAAAATCTCAGAGTGCGATTTAACCGCGACGATTGAACAACGAGGACCACAAACGGCT
+GATGAGCTGGCTACATTGTTTGGTACCACATCACGCAAAGTGGCTTCAACGCTGGCAATG
+GCAATCAGCAAAGGTCGTCTGATTCGCGTAAATCAGGGCGGTAAATTTCGTTACTGCATA
+CCGGGCGATAATTTACCAGCAGAGCCGAAAGCAGCATCGGTATCTCCGCTCTGGTTATCT
+GCATCGTCGTCTGCCTGTCATGGGGTGTTAATCATTACCGTGATAACGCCATCGCCTACA
+AAGAACAGCGCGACAAAAATGCCAGAGAACTGAAGCTGGCGAACGCGGCAATTACTGAGA
+TGCAGATGCGTCAGCGTGATGTTGCTGCGCTCGATGCAAAATACACGAAGGAGTTAGCTG
+ATGCGAAAGCTGAAAATGATGCTCTGCGTGATGATGTTGCCGCTGGTCGTCGTCGGTTGC
+ACATCAAAGCAGTCTGTCAGTCAGTGCGTGAAGCCACCACCGCCTCCGGCGTGGATAATG
+CAGCCTCCCCCCGACTGGCAGACACCGCTGAACGGGATTATTTCACCCTCCGGGAACGAC
+TGGTAATGATGCAGGCCCAACTTGAAGGTGCTCAGCAATACATAACCGAGCAGTGTTTAA
+AGTAAAATCTTAACTACAATATGATTCATTTTGATGATTGTTTCATAAGGAACAGTGAAG
+TAAGATCTAAGAGGAGTTAAATTTTATACAGTATAATCATAATATTGCAGCAAGGTGGTT
+ATAATTGAAAGAATATTTAGATATGAATACATCTCATGTAAGAGTTGTTACTCATATGTG
+TGGGTTCCTGGTTTGGCTCTATAGTCTTTCAATGTTGCCACCAATGGTTGTAGCATTGTT
+TTATAAAGAAAAAAGCCTGTTTGTTTTCTTTATAACTTTCGTTATATTTTTTTGCATTGG
+TGGCGGAGCGTGGTATACAACTAAGAAATCTGGCATTCAATTACGTACCCGTGATGGGTT
+TATTATAATTGTAATGTTTTGGATTTTGTTTTCTGTTATTAGTGCATTCCCTTTATGGAT
+TGACTCAGAACTTAATTTAACGTTCATTGATGCTCTGTTTGAAGGGGTTTCTGGAATAAC
+AACAACAGGAGCAACTGTAATTGATGATGTTAGTTCATTACCTCGGGCATATTTGTACTA
+TCGGTCACAGTTAAATTTTATAGGTGGTTTAGGAGTTATTGTTCTGGCGGTTGCTGTATT
+GCCATTATTGGGTATTGGTGGTGCAAAGCTTTATCAGTCAGAAATGCCGGGGCCATTTAA
+GGATGACAAACTCACTCCCCGCCTGGCCGATACGTCACGGACACTGTGGATAACTTATTC
+TTTATTAGGTATTGCTTGTATTGTCTGTTATAGACTTGCAGGAATGCCTTTGTTTGATGC
+TATTTGTCACGGGATTTCCACAGTTTCGCTTGGTGGTTTCTCAACTCATAGCGAGAGTAT
+CGGATATTTTAATAACTATTTGGTTGAGCTGGTGGCTGGTTCTTTTTCCCTGCTATCGGC
+TTTCAACTTCACTCTTTGGTATATTGTTATTAGCAGGAAAACGATAAAACCTTTAATCAG
+AGATATTGAACTTCGTTTCTTTCTGTTAATAGCCTTAGGGGTGATCATTGTTACCTCTTT
+CCAGGTCTGGCATATAGGTATGTATGACTTGCATGGAAGTTTTATTCATTCGTTTTTTCT
+TGCCAGCTCCATGCTCACTGATAATGGTTTAGCTACGCAGGATTATGCAAGTTGGCCCAC
+GCACACGATAGTGTTTTTGCTGTTGTCAAGTTTCTTTGGGGGATGTATAGGTTCAACTTG
+TGGTGGAATTAAGTCACTTCGATTTCTTATACTTTTCAAACAAAGCAAACACGAGATAAA
+TCAGCTTTCTCATCCCAGAGCGTTGTTGAGTGTAAATGTAGGAGGGAAGATAGTTACAGA
+TCGTGTAATGAGGTCTGTATGGAGTTTCTTTTTTCTTTATACTCTCTTCACGGTGTTTTT
+TATACTGGTGTTAAATGGTATGGGATATGATTTTCTTACATCATTTGCAACAGTGGCTGC
+ATGTATTAATAATATGGGATTAGGTTTTGGGGCTACTGCATCGTCATTCGGAGTGCTTAA
+TGACATTGCAAAATGCTTAATGTGCATAGCTATGATTCTTGGTCGCCTTGAAATTTATCC
+TGTTATTATATTGTTTTCAGGTTTTTTTTGGCGCTCCTAATATATGGCTGATTTATAATT
+GTGAGTTTAATATTATGTTGACTCACTCATTGATCCAATACCTAACTTTACCAGCAACAC
+CTCCGTCCCCAGTAGCACTGGCTGCTGGGGTGCGTTTTATTCATAAAGCAAGGCTGTATG
+AGCGAGAAATTAAAGATAGTCTATCGCCCATTACAAGAATTGTCACCGTATGCGCACAAC
+GCCAGGACGCACAGTACTGAGCAGGTGGCACAACTGGTAGAAAGTATTAAGCAATTCGGC
+TGGACTAATCCGGTGCTGATTGACGAAAAGGGCGAAATTATTGCGGGTCACGGTCGTGTT
+ATGGCGGCTGAAATGCTCAAAATGGATTCTGTTCCGGTCATTGTTCTGTCTGGCCTGACG
+GATGAGCAGAAGCAGCGATAACGATCAGTATCGCTCCCGTAATGCATTAATCCGTCGCCA
+CATTGAGAAAATGGATGCCAGTTTGCACGTCGGAACGAAGGAGTTTGATATTTCAAAGGT
+TTCCGAGGTGGATTCTGTTGATGATTTACTCATTGATAATGCCGCTCGTTATCTGCTGAA
+AGACTGGAAAGGGGTTGGTGAACTGGTTAATGGTGTTGAGGTTGCACTGGAATATACGGC
+AGAACGAGGGATCGCGCTGCTTAAGCAGAATCCAGAGTTGTACTGGCAGATCCTTGCAGA
+AGCAGCCAGCATCGCCCAGGGTAAAGAGCAGCAGAAGCAGGATACGATAAAAAAGCCATA
+GCTGCCCAGCGGTGGTTATCGGAGTTCGGGGGAGAAAGGGGGGAAAAGGCAAGATGGAAG
+CGAGAAAAACTCAGGTTGCCACCGATACCGGAACCAGAAATAGACCCGGTGCTTAAGGAG
+TTGTTGTACGCCTATTCGGTAATATCCCGTGCCCGACGTTATGCTGGAATGGCTGGGGTG
+CCTTTGCCTTTATCTCTGACAGAGATAAATGAATATTTAGCCACTCATCCGGTATTGATT
+GAGCGCGATGAATTTGAAGCAGTGATCTTTGCACTGGATGACCAGTATTTTCAGGAGCAG
+TGTGTGTAGTTGTTAATTACGTACACTCTGTTACAGAGATGTGATGGTGTCTTTAATTAA
+ATCGATGATGCTCCTGGAGAAAAGCATTGCGTGGCCTCGTAATCGCTATATCTACTATTA
+TGTCGCCTGAAACCCACTTCGCGGTGGGTTTTTTGTTGTCAGGAGTTTTAATAAATGGCA
+GAGCAAACCTCGCGTCTCGCAATAATTATTGATAGCACTGGAGCGAAAAATAATGCTGAC
+AATCTGACCTCCTCATTAGTCAAAATGACGCAGGCTGGGGAAACTGCTGCAAATAGCGCA
+GGGAAAGTGACTAAGGCAACAGAAGATGAGAAGAACGCGCTCGCAAAATTAAAAGCAGCT
+ATTGATCCAGTTGGTGCCGCAATTGATACTGTCGGTCGACGCTATTCTGAATTAAAGAAA
+TTTTTCGATAAAGGGCTTATTGATAAAGAAGAATATGAATTTCTTGTCCGTAAACTTAAT
+GAAACCACAGAGGAATTGAGCGGGGTTGCGCAAGCGCAGAGAGAAGCCGAGAAGGCCGGA
+AAACTTGCTGCCGCTCAGCAGGAAGCGCAGGCTCAGGCCTTTCAAAGAATGCTGGACAAG
+ATCGACCCTCTGGCTGCGGCGCTAAGAAATCTTGAACAACAGCATGATGAACTTAATGCT
+GCGTTTGCATCCGGGAAAATAAATGGTTCTCAGTTTGAGAATTATAGCCGAAAAATACAG
+GAAACACGGCGAGAGCTTACCGGAGAGGCTCAGGCAGAGCGAGAAGCAGCAAAAGCGCAT
+GATGAACAGGTTGTTGCTTTGCAACGTCTGATTGCTCAACTTGATCCTGTCGGAACTGCT
+TTTAATCGTCTGGTAGAACAACAGAAACAGCTCAATGAAGCAAAAGCTAAGGGGATGCTT
+TCTCCTGAAATGTATGAGGAGCTTTCTGGAAAACTTCGTGCTATGCGGAGTGAGCTTGAG
+GTTACTCAATCACAATTAAGCAAAACCGGAATGTCGGCAAAACAAACGGCTTTTGCTATG
+CGCATGTTGCCTGCACAAATGACGGATATTGTTGTTGGGTTGTCCACTGGTCAGTCGCCA
+TTTATGGTGTTAATGCAGCAGGGCGGCCATTCAGCTATGCAGGAGACAAGAATCGCCAGC
+TTACCCGTTACAGCGATACCCGCTGGCATGAAGATTCCGTGCGTAACCGCTGGTTCAGCG
+TGATGGTGGGGCCGTCTGTGCGCGTGAATGAATGGTTCAGCGCGTATGCGATGGCGGGTA
+TGGCTTACAGCCGTGTGTCGACTTTCTCCGGGGATTATCTCCGCGTAACTGACAACAAGG
+GAAGGTGCGAATAAGCAGGTCATTTCTTCCCAAGCTGACTCGCTGATTAAAATTTCGCGG
+ATCTGGGCCGATTTTTTTCCCGCAAACACATCGAATCAGCCTATTTAGGCTATTTTTTCC
+ACCATTTCTGGCGTTATTTCCGGTTTTTACTGAGATCTCTCCCACTGACGTATCATTTGG
+TCCACCCGAAACAGGTTGGCCAGGGTGAATAACATCGCCAGTTGGTTATCGTTTTTCAGC
+AGCCCCTTGTATCTGGCTTTCACGAAGCCGAACTGCCGCTTGATGATGCGAAACGGGTGC
+TCCACCCTGGCACGGATGCTGGCTTTCATGTATTCGATGTTGATGGCCGTTTTGTTCTTG
+CGCGGATTCTGCTTCAAGGTTTTTACCTTGCCGGGACGCTCGGCGATCAGCCAGTCCACA
+TCCACCTCGGCCAGCTCCTCGCGCTGTGGCGCTCCTTGGTAGCCGGCATCGGCTGAGACA
+AATTGCTCCTCTCCATGAAGCAGATTACCCAGCTGATTGAGGTCATGCTCGTTGGCCGCG
+GTGGTGACCAGGCTGTGGGTCAGGCCACTCTTGGCATCGACACCAATGTGGGCCTTCATG
+CCAAAGTGCCACTGATTGCCTTTCTTGGTCTGATGCATCTCCGGATCGCGTTGCTGCTCT
+TTGTTCTTGGTAGAGCTGGGTGCCTCAATGATGGTGGCATCCACCAAAGTGCCTTGGGTC
+ATCATGACGCCTGCTTCGGCCAGCCAGCGATTGATGGTCTTGAACAATTGACGGGCCAGT
+TGATGCTGCTCGAGCAGGTGGCGGAAATTCATGATGGTGGTGCGATCCGGCAGGGCGCTA
+TCCAGGGATAATCGGGCAAACAGGCGCATGGAGGCGATTTCGTACAGGGCATCTTCCATG
+GCACCGTCGCTCAGGTTGTACCAATGCTGCATGCAGTGAATACGCAGCATGGTCTCCAGC
+GGATAGGGCCGTCGGCCATTGCCCGCCTTGGGATAAAACGGCTCGATGACAGCGGTCATA
+TTCTGCCATGGCAGAATCTGCTCCATGCGGGAGAGGAAAATCTCTTTTCGGGTCTGACGG
+CGCTTAGTGCTGAATTCACTATCGGCGAAGGTGAGTTGATGGCTCATGATGTCCCTCTGG
+GATGCGCTCCGGATGAATATGATGATCTCATATCAGGAACTTGTTCGCACCTTCCCAAGG
+GGAAAACGCACGACGTGCTGACCGGAAGTGATGACGGTCGCCACAGCAACACGTCTCTGG
+CGTGGGGAGCTGGCGTGCAGTTTAACCCGACCGAATCCGTGGCCATTGATATTGCTTATG
+AAGGCCCCGGCAGTGGCGACTGGCGCACTGACGGTTTCATCGTGGGTGTCGGTTATAAGT
+TCTGATTAGCCAGGTAACACAGTGTTATGACAGCCCGCCGGTTCAGGCGGGCTTTTTTGT
+GGGGTGAATATGGCAGTAAAGATTTCAGGTGTACTGAAAGACGGCACAGGAAAACCGGTA
+CAGAACTGCACAATCCAGCTGAAAGCAAAACGTAACAGCACCACGGTGGTGGTGAACACG
+CTGGCCTCAGAAAATCCGGATGAAGCCGGGCGTTACAGCATGGACGTTGAGTACGGTCAG
+TACAGCGTTATTCTGTTGGTGGAAGGATTCCCGCCGTCACATGCCGGGACCATTACCGTG
+TATGAAGATTCTCAACCCGGTACGCTGAATGATTTTCTCGGTGCCATGACGGAGGATGAT
+GCCCGTCCGGAGGCACTGCGCCGTTTTGAACTGATGGTGGAAGAGGTGGCGCGTAACGCG
+TCCGCGGTGGCACAGAACACGGCAGCCGCGAAGAAGTCAGCCAGTGATGCCAGCACATCA
+GCCCGTGAGGCGGCAACCCATGCGGCTGATGCTGCGGACTCAGCACGCGCAGCCAGCACG
+TCAGCCGGACAGGCCGCGTCGTCGGCTCAGTCAGCGTCTTCCAGCGCAGGAACGGCATCA
+ACAAAGGCCACTGAAGCATCAAAAAGTGCTGCCGCTGCAGAGTCCTCAAAAAGCGCGGCG
+GCCACCAGTGCCGGTGCGGCGAAAACGTCAGAAACGAATGCTTCAGCGTCACTACAATCA
+GCAGCCACATCTGCATCCACCGCGACCACGAAGGCATCAGAAGCTGCGACCTCGGCCCGG
+GATGCGGCGGCCTCAAAAGAAGCGGCAAAATCATCAGAAACGAACGCATCATCAAGCGCC
+AGTAGTGCAGCTTCCTCGGCAACGGCGGCAGGAAATTCCGCGAAGGCGGCAAAAACGTCC
+GAGACGAACGCCAGGTCTTCTGAAACGGCAGCGGGACAGAGCGCCTCGGCTGCGGCAGGC
+TCAAAAACAGCGGCTGCGTCGTCTGCCAGTGCAGCGTCAACAAGTGCCGGGCAGGCCTCA
+GCCAGTGCCACCGCCGCCGGAAAATCGGCAGAAAGCGCCGCATCGTCTGCTTCAACAGCC
+ACAACGAAGGCTGGCGAAGCCACTGAACAGGCCAGCGCAGCAGCGAGGTCTGCTTCCGCA
+GCGAAGACATCCGAAACGAACGCGAAAGCGTCGGAAACAAGCGCAGAATCCTCAAAAACG
+GCTGCCGCATCGTCAGCCAGTTCGGCGGCGTCATCGGCATCATCGGCGTCTGCTTCAAAA
+GATGAGGCGACCAGACAAGCGTCAGCAGCGAAGAGCAGCGCCACGACGGCATCCACGAAG
+GCGACAGAGGCTGCTGGCAGTGCGACGGCGGCAGCTCAGAGCAAAAGTACGGCGGAATCC
+GCGGCAACGCGCGCCGAGACAGCAGCTAAACGGGCAGAGGATATTGCATCCGCCGTGGCG
+CTTGAGGATGCAAGTACGACGAAAAAGGGGATAGTACAGCTCAGCAGTGCGACCAACAGT
+ACGTCTGAAACGCTGGCGGCAACGCCAAAGGCAGTAAAATCAGCCTATGACAATGCAGAG
+AAACGTCTGCAGAAAGACCAGAACGGCGCTGATATACCCGATAAGGGATGCTTCCTGAAC
+AACATTAACGCGGTCAGTAAAACAGACTTTGCTGATAAGCGTGGTATGCGTTATGTGCGG
+GTTAACGCTCCTGCAGGTGCAACATCTGGAAAATATTACCCTGTTGTTGTTATGCGTTCT
+GCTGGCTCAGTAAGCGAACTGGCATCAAGAGTCATTATCACCACGGCAACGCGAACCGCA
+GGCGATCCGATGAATAACTGCGAGTTTAACGGATTTGTTATGCCTGGTGGCTGGACTGAC
+AGGGGGCGTTATGCTTATGGCATGTTCTGGCAATATCAAAACAATGAACGAGCCATTCAC
+TCAATAATGATGAGTAATAAGGGCGATGATTTGCGCTCTGTGTTCTATGTTGATGGCGCT
+GCTTTCCCTGTTTTTGCGTTTATTGAAGATGGCCTGTCAATATCCGCACCTGGTGCTGAT
+CTCGTTGTTAATGATACGACCTATAAGTTTGGGGCAACAAATCCGGCGACTGAATGTATC
+GCGGCGGACGTTATCCTTGATTTTAAGAGTGGGCGTGGTTTTTATGAGTCTCATTCGTTA
+ATCGTTAACGATAACTTGTCGTGCAAAAAACTTTTTGCCACAGACGAAATTGTAGCGCGT
+GGTGGTAATCAGATTCGAATGATAGGTGGGGAGTATGGTGCATTATGGCGTAATGATGGC
+GCTAAAACTTACCTGCTGCTTACCAATCAAGGTGATGTTTATGGTGGCTGGAATACATTA
+AGACCGTTTGCTATTGATAACGCAACCGGCGAACTGGTTATTGGAACCAAACTGTCCGCA
+AGTCTGAACGGTAATGCATTAACAGCAACAAAGCTGCAAACGCCAAGACGGGTTTCTGGT
+GTTGAGTTTGATGGTTCCAAAGATATTACTTTAACCGCCGCGCATGTGGCTGCTTTTGCC
+AGAAGGGCAACGGATACATATGCCGATGCGGATGGTGGCGTTCCATGGAATGCCGAATCT
+GGCGCTTACAATGTCACCCGCTCTGGCGACAGCTATATTCTGGTTAACTTCTATACCGGA
+GTCGGAAGTTGCCGGACCCTGCAGATGAAGGCGCATTACAGAAATGGTGGTCTGTTCTAC
+CGTTCTTCAAGAGACGGTTATGGTTTTGAGGAAGACTGGGCAGAAGTTTATACCTCGAAA
+AATCTTCCACCAGAAAGCTACCCAGTCGGCGCACCAATCCCGTGGCCATCAGATACCGTT
+CCGTCTGGTTATGCCCTGATGCAGGGGCAGGCTTTTGACAAATCTGCTTACCCGAAACTT
+GCAGCCGCTTATCCGTCAGGCGTGATCCCTGATATGCGTGGCTGGACGATTAAGGGCAAA
+CCTGCCAGTGGTCGGGCCGTATTGTCTCAGGAACAGGACGGCATTAAATCGCATACCCAC
+AGCGCCAGCGCATCCAGTACAGATTTGGGGACGAAAACCACATCGTCGTTTGATTACGGC
+ACTAAATCCACGAATAACACCGGGGCACATACACACAGTGTGAGCGGCTCTACAAACTCG
+GCTGGAGCACACACACACTCACTAGCCAACGTGAACACGGCTAGTGCTAACTCCGGTGCT
+GGTAGTGCATCAACAAGATTGTCTGTTGTGCATAATCAAAACTATGCAACATCATCTGCT
+GGCGCACATACCCACTCACTGTCCGGCACTGCTGCAAGCGCAGGTGCACACGCGCATACT
+GTCGGTATTGGTGCTCATACGCACTCCGTTGCGATTGGTTCACATGGACACACCATCACC
+GTTAACGCTGCTGGTAACGCGGAAAACACCGTCAAAAACATCGCATTTAACTATATTGTG
+AGGCTTGCATAATGGCATTCAGAATGAGTGAACAACCACGGACCATAAAAATTTATAATC
+TGCTGGCCGGAACTAATGAATTTATTGGTGAAGGTGATGCATATATTCCGCCTCATACAG
+GTCTGCCAGCAAACAGTACCGATATTGCACCGCCAGATATTCCGGCTGGCTTCGTGGCTG
+TTTTCAACAGTGATGAGTCATCGTGGCATCTCGTTGAAGATCATCGGGGTAAAACGGTTT
+ATGACGTGGCTTCCGGCAACGCGTTATTTATTTCTGAACTCGGTCCGTTACCGGAAAATG
+TTACCTGGTTATCGCCGGAAGGGGAGTTTCAGAAGTGGAACGGCACAGCCTGGGTGAAGG
+ATACGGAAGCAGAAAAACTGTTCCGGATCCGGGAGGCGGAAGAAACAAAAAACAACCTGA
+TGCAGGTAGCCAGTGAGCATATTGCGCCGCTTCAGGATGCTGCAGATCTGGAAATTGCAA
+CGGAGGAAGAAATCTCGTTGCTGGAAGCATGGAAAAAGTATCGGGTATTGCTGAACCGTG
+TTGATACGTCAACTGCACAGGATATTGAATGGCCAGCACTGCCGTAGGGTAAAACATATA
+AATTCTATAATTAGATGTATCTTTCCATTTACGGCAAGGAAGGGGGCTTGGAAGACGTAA
+AGCATCTCACACCGAGATTATTTTTTATATGTCAGGTGTCTGAAGTTTTGCTTTGGCTCT
+TAAAATGGTTTGCCGCGAGGTTTTGAATTCCCGGGCAATGGCACTTATACTTACACCTGA
+CTTAATTCGTTCGAATACCACCTGTTTCTGTTCTTCATTTAACACAGGAGGTCGACCAAA
+ACGTTTCCCTGCGCCGCGGGCTCTTACTATCCCGGAATGAGTGCGTTCAAGTAAAAGGTC
+TCGTTCAAATTCAGCGACTGCTGAAATTACTTGCATCATCATTTTTCCTGTTGGACTGGT
+CAGGTCAATGCCACCCAATGCTAAGCAATGCACTCTGATACCTGTTTCGGTCAGTTGTTC
+CACTGTTTTCCTGATATCCATTGCATTACAACCAAGGCGATCCAGTTTTGTCACAATCAA
+TTGATCACCACATTTCAGGCGAGCAAGCAACCGGTTAAAACCAGGACGCTCACTGGTTGC
+TGCTGAGCCGCTAATGTGTTCTTCGATTATTTGCTGAGGTTTGATTTTAAAACCTGCACT
+TTCGATTTCCCGGCGTTGATTTTCGGTGGTCTGATCCAGCGTTGATATCCGACAGTAAGC
+AAAAATTCGAGACATAGTGAGACTCTATACGAAATTGGTGTTCATATCATAATGCATCTC
+AGAAAATAATTATGATTATTTTTGTGCATATTTGTATGTACACGTTCGAAAATAAACGAA
+TGCGTATGCAACCCCGTAATTTTGGTGAGACCCAAAATCGATTTTGTGAAAAATGGCTTT
+AACTCGGTTTGTTTTTCGAGTTCCGGGCGGACTCAAGGAAGAAGAATAGTGTTGCGTGTT
+ATTTTAACCAGATTTCAAGTTGTTTGGTCGTGGAAAAGTGGAGCAAAATGTTGTTAAAGT
+GGAAAAATGATAAAAAAGTAAGTTTATTATATTACATTTTACCATTTAAATTTTGGTTGT
+CTTTAAGAACTGATATCGCTGTTTGTAATAATTCTTTGTTATCCAGCCATGATGTTTTCT
+TTATGTTTCCTTCAATGTAATCAAGCAATGTTCTGGTATTGATAGGTCTTCCCTGTTTTG
+CTACTTCCACTACAGCATCCCCTAGGATAATTCTTACTTCAGGAAGCTGCGCAGGGAACC
+ACTTTAGGGTGTCTTTTGATTTCAT
+>NC_000913.3|provirus_1627517_1653915
+ATGATCGTTTTAGTAACTGGAGCAACGGCAGGTTTTGGTGAATGCATTACTCGTCGTTTT
+ATTCAACAAGGGCATAAAGTTATCGCCACTGGCCGTCGCCAGGAACGGTTGCAGGAGTTA
+AAAGACGAACTGGGAGATAATCTGTATATCGCCCAACTGGACGTTCGCAACCGCGCCGCT
+ATTGAAGAGATGCTGGCATCGCTTCCTGCCGAGTGGTGCAATATTGATATCCTGGTAAAT
+AATGCCGGCCTGGCGTTGGGCATGGAGCCTGCGCATAAAGCCAGCGTTGAAGACTGGGAA
+ACGATGATTGATACCAACAACAAAGGCCTGGTATATATGACGCGCGCCGTCTTACCGGGT
+ATGGTTGAACGTAATCATGGTCATATTATTAACATTGGCTCAACGGCAGGTAGCTGGCCG
+TATGCCGGTGGTAACGTTTACGGTGCGACGAAAGCGTTTGTTCGTCAGTTTAGCCTGAAT
+CTGCGTACGGATCTGCATGGTACGGCGGTGCGCGTCACCGACATCGAACCGGGTCTGGTG
+GGTGGTACCGAGTTTTCCAATGTCCGCTTTAAAGGCGATGACGGTAAAGCAGAAAAAACC
+TATCAAAATACCGTTGCATTGACGCCAGAAGATGTCAGCGAAGCCGTCTGGTGGGTGTCA
+ACGCTGCCTGCTCACGTCAATATCAATACCCTGGAAATGATGCCGGTTACCCAAAGCTAT
+GCCGGACTGAATGTCCACCGTCAGTAATTTTTATACCCGGCGTAACTGCCGGGTTATTGC
+TTGTCACAAAAAAGTGGTAGACTCATGCAGTTAACTCACTCACAAGCAAGAACGAATGAC
+CGTCGAAACGCAACTTAATCCCACACAGCCTGTCAATCAGCAGATTTATCGTATTCTTCG
+TCGCGACATTGTCCATTGCCTGATTGCTCCAGGCACACCGTTGTCGGAAAAAGAAGTTTC
+TGTTCGTTTCAATGTGTCACGCCAGCCGGTTCGTGAAGCCTTTATTAAACTGGCGGAAAA
+CGGCCTGATTCAAATTCGTCCGCAACGTGGCAGCTACGTCAACAAAATTTCCATGGCCCA
+GGTGCGCAACGGCAGTTTTATCCGTCAGGCCATTGAGTGCGCGGTGGCGCGTCGGGCGGC
+GAGCATGATTACCGAAAGCCAGTGCTATCAACTGGAACAAAATCTTCACCAGCAACGCAT
+TGCCATTGAGCGCAAGCAACTGGATGATTTTTTTGAACTTGATGACAACTTCCATCAACT
+CCTGACGCAGATTGCCGACTGTCAACTGGCGTGGGATACCATTGAGAACCTGAAAGCGAC
+CGTTGATCGCGTGCGCTATATGAGTTTCGACCACGTTTCTCCACCAGAAATGCTGTTACG
+CCAGCATCTTGATATTTTCTCTGCCCTGCAAAAACGTGATGGCGATGCGGTAGAACGTGC
+AATGACGCAACATTTGCAGGAAATCAGCGAATCCGTGCGCCAGATCCGCCAGGAAAACAG
+CGACTGGTTTAGCGAAGAGTAATTCATTTCCTCTCATCCCATCCGGGGTGAGAGTCTTTT
+CCCCCGCCTTATGGCTCATGCATGCATCAAAAAAGATGTGAGCTTGATCAAAAACAAAAA
+ATATTTCACTCGACAGGAGTATTTATATTGCGCCCGTTACGTGGGCTTCGACTGTAAATC
+AGAAAGGAGAAAACACCTATGACGACCTACGATCGTAACCGTAACGCAATCACCACTGGC
+AGCCGTGTTATGGTTAGCGGCACCGGTCACACTGGCAAGATCCTGTCGATTGATACTGAA
+GGTCTGACCGCTGAGCAAATCCGCCGCGGAAAAACCGTAGTTGTTGAAGGTTGTGAAGAG
+AAACTGGCACCACTGGACCTGATTCGTCTCGGCATGAACTAAGCGTGTGAATGCCGCCGA
+TGGCGGCATTGCTTTTTTACTTCACGGAATATTTTGCCACGGTCGCTTTCGCGCCATGCG
+CTAATAAAGACAAGTACGTTTCCGTCACTCTTGCAGTAAACAAACTATTGTCTGGCAAAT
+CATCACCAAAGATCGCCTTAATCGCCAGCAATGACTGGACGCGCGCTTTCCCTTCGGCAC
+TACTTTGTACAGCCTTCTGAATAACAGGTAACAGTGGGTCACTGATTTCTATCGGATTTC
+CCTGTTCATCAACACCACCGACATAACGCATCCAACCCGCGACGCCCAGCGCCAGCAGAT
+CGAACTTGCTGTCATGCGCCAGATGCCAGCGAACAGAATCCAACATCCGCTGTGGCAATT
+TCTGGCTACCATCCATCGCAATCTGCCAGGTTCGATGACGTAACGCCGGGTTGCTATAGC
+GTGCAATTAATCGGTTAGCGTAATCTTGCAAATCAACGCCCTGCACTTTCAACGTCGGCG
+CTTGTTCCTGCAACATCAAGCCATACGCCGCATAACGATAATGTTCATCTTCCATACAGT
+CATTAATGTGCTGATATCCTGCAAGATACCCCAGATACGCCAGGAATGAATGACTGCCGT
+TGAGCATGCGCAACTTCATCTCTTCATAAGGCAGCACATCGCTAACCAGTTCGGCTCCCG
+CTTTTTCCCATTCCGGACGTCCGGCAACAAAGTTATCTTCTATTACCCACTGGCGGAAAG
+GTTCACAGGCAACGCCCGCAGGATCGCGCACACCGGTAAGTTGTTCGATTTTCGCCAGCG
+TATCCTCTGTCACTGCGGGCACAATACGGTCCACCATTGTTGATGGGAAAGTCACGTTAT
+CTTCGATCCATTGTGCCAGTTTTACATCAACGGCTTGTGCGTAGGAAGTGACAACGTCAC
+GCATAACATGACCGTTTTCTGGCATGTTGTCACATGACATGACGGTAAATGCGGGAAGTC
+CTGCCGCTTTACGGCGAGCCAGCGCCTCAACAATCACCCCTGTTGCTGTTTTCGGCTGGT
+GGGGATTTTGCACGTCGGCAGCTACCATCGGGTGATCGAGCATTAACTGTCCGGTCGCCG
+GAGAGTGGAAATACCCTTTTTCGGTGATTGTCAGAGAGACAATCGCGATTTGCGGTTCAC
+ACATCGCTGCCAACACGGTTTCTAAGCCATCTATCTGTACGTGCAAGGCTTTTTTAACGA
+CGCCAACGACGCGAGCCGTCCACACATCGGCCGACATTTCCGCAACGGTATAAAGATTAT
+CTTGCTGTTGTAAATCGGCAATTTGCTGTTCGCCGCCGATTAAGTTGACCTCATAATATC
+CCCAGTCACTGAAATGTTCCGTAGCAAGAATATCGGCATACACACCCTGATGCGCACGGT
+GAAATGCACCAAAGCCTAAATGAACAATTCTTGGAGCCAGGTTATTAAGATCATAAACAG
+GGAGTGTCGCTTTTGCTGATAACAAATTATTTCCCATAACAATTCCTTAAATATAAATAT
+GGCAAGCTATATGTTTTGTTATATGAATAAAAATCCCCTCTCCGGTAAGAGAAGGGATTA
+AGGGTTTACAGACTTCTGGAAGGTTGCGCAGCTCTTACAACACGCGGTTGATCTTCCGCA
+GCGTCTTCCAGCGCACTTAAATCACGGTCTTTCACCTCTGGCATTTTCAGCGCAGAGATT
+AAACCAATCACTGAATATGCCATGATCATAATGGCGATCGGATACCAGGATTCCGTCATG
+GTGCAGAAAATACCCGCCAGGATAGGACCAAAACCGGAAGCGATAAGACCACCAATTTCT
+TTAGAAATAGCCATCCGGGTAAAGCGGTTTTTACAGCCGAACATTTCTGCCATGGTAATG
+TTTTCCAGAGCAAATAATCCCAGCACCGCACAGTTATGAATCACAATCAGTGCAACCATA
+ATGGTGCTCGGGGCATAGCTTTTATCTACAATGATAGAAAGCATTGGCCATGCCAGCACA
+ATCGCGGAGGTATTCATAATAATATACGGGATCCGGCGACCAATTTTATCGGATAACCAA
+CCAAGGAACGGAATGGTCATAAAGCCGAGAATCGAACTGATCATCAATGCATCTGTTGGA
+ATTGCTTTGTTAAACAATAACGTCTGCACTAAATAGCCTGCAAGGAAAGTCTGAATTAAC
+CCGGAGTTACCCGCCTGACCAAAACGCAGCCCTGTTGCCAGCCAGAAGGATTTGCTCTGG
+AACATGCTACCAGCAGGTGCAGGTTTTGCTGTCGGTTGGTTACTGTCGTTAACCTTCTCA
+AAGACCGGGCTTTCTTTCAGATTCATACGCAACCAGATAGCAAAGACCATCACGACAACA
+CTCGCCAGGAACGGTATACGCCATCCCCACGCCAGCAGTTCCTCTTTACTGAGAATGAAG
+AACATAAAGGCCCAGATTGCCGTTGCGCTCAAGGTTCCGCAGTTAGTTCCCATAGCCACA
+AATGAGGAGATAATTCCGCGCTTACCTTTTGGCGCATATTCCGCCAGCATCGTACCGGCA
+CCGGAAATTTCCGCACCTGCACCCAACCCCTGAATAATACGCAACGTCACCAGCAAGATG
+GGTGCAAAAACACCAATCTGTGCATAGGTCGGTAACACACCAATTAAGGTGGTACAGATC
+CCCATCATGGTGATGGTAATAAAGAGCACTTTTTTACGCCCTATTCTGTCGCCCATTTTG
+CCGAAAATAAATGCTCCGACAATACGCGCCACATAACCTGCACCGTAGGTTCCCATTGCC
+AGAATTAACGCCATTGCCGTTGATGATTCAGGAAAAAATATTTCATGAAACACTAACGCT
+GCGCCGAGCGAATATAACTGGAAATCCATAATTCACAGGTGTTTTTTCCCATCCTGTGGT
+TTCCTTGGCGTTTTCTAGGTTTTTTCAGATAGTTGCATTTTTTTAAAAAGCATCCTAAGT
+TCGATCTCAGTGTCTATCTGGGGCCTATTTCTGTCCCATATATGCCCCAAAAAAACTCCC
+CAACAGATAAGTAGTTTTTTCATGGATTTATGCGTAAAATCAAGAACGGCTGGAAATCAT
+TCAATACTCACACTATCGAAAAATTTACCAGCCAATCGCAGCACGTTCTTGCATAAGGTG
+TGTCTGCGGTTTTTCAACTATTCAGATACATCACTCCCATCACATTCATTCCTCCGCATC
+AAAGGCATATAGGCTATATCACCTTGATATTTTTCTTTTTCAGATAAAAACTGTTATCTA
+TGTATACTTTTAAACCCAATCCGTGTAGAGTCTCTACATAAGATAGTTTGCAGTTGCCGC
+TTCAGCTTGCGCCATAAACCGCCTGATTTTTGCTGCCACCTGTTAGCATTCCTGTATACC
+TGAAACGACAATGTTTATCTACGAACTTTAAGAACACCCAAGATAAAAATTGTCAACTAT
+ATCATATATAACACATTACTAATTCGAGGCTATATGAACAGCATACTGATAATCACATCT
+CTCCTTATCATATTCAGCATTTTTAGTCATGCCCTAATAAAATTAGGGATTGGCATATCC
+AATAACCCAGACAAAACCGATGTATAAGTCAACATATCCTGAATCAGACATACAATATCG
+CAATGAAAATCAATAATATTTTAAGGAATATCTTCATGAAATCAAAAGACACCCTAAAGT
+GGTTCCCTGCGCAGCTTCCTGAAGTAAGAATTATCCTAGGGGATGCTGTAGTGGAAGTAG
+CAAAACAGGGAAGACCTATCAATACCAGAACATTGCTTGATTACATTGAAGGAAACATAA
+AGAAAAAATCATGGCTGGATAACAAAGAATTATTACAAACAGCGATATCAGTTCTTAAAG
+ACAACCAAAATTTAAATGGTAAAATGTAATATAATAAACTTACTTTTTTATCATTTTTCC
+ACTTTAACAACATTTTGCTCCACTTTTCCACGACCAAACAACTTGAAATCTGGTTAAAAT
+AACACGCAACACTATTCTTCTTCCTTGAGTCCGCCCGGAACTCGAAAAACAAACCGAGTT
+AAAGCCATTTTTCACAAAATCGATTTTGGGTCTCACCAAAATTACGGGGTTGCATACGCA
+TTCGTTTATTTTCGAACGTGTACATACAAATATGCACAAAAATAATCATAATTATTTTCT
+GAGATGCATTATGATATGAACACCAATTTCGTATAGAGTCTCACTATGTCTCAAATTTTT
+GCTTACTGTCGGATATCAACGCTGGATCAGACCACCGAAAATCAACGCCGGGAAATCGAA
+AGTGCAGGTTTTAAAATCAAACCTCAGCAAATAATCGAAGAACACATTAGCGGCTCAGCA
+GCAACCAGTGAGCGTCCTGGTTTTAACCGGTTGCTTGCTCGCCTGAAATGTGGTGATCAA
+TTGATTGTGACAAAACTGGATCGCCTTGGTTGTAATGCAATGGATATCAGGAAAACAGTG
+GAACAACTGACCGAAACAGGTATCAGAGTGCATTGCTTAGCATTGGGGGGCATTGACCTG
+ACCAGTCCAACAGGAAAAATGATGATGCAAGTAATTTCAGCAGTCGCTGAATTTGAACGA
+GACCTTTTACTTGAACGCACTCATTCCGGGATAGTAAGAGCCCGCGGCGCAGGGAAACGT
+TTTGGTCGACCACCTGTGTTAAATGAAGAACAGAAACAGGCGGTATTCGAACGAATTAAG
+TCAGGTGTAAGTATAAGTGCCATTGCCCGGGAATTCAAAACCTCGCGGCAAACCATTTTA
+AGAGCCAAAGCAAAACTTCAGACACCTGACATATAAAAAATAATCTCGGTGTGAGATGCT
+TTACGTCTTCCAAGCCCCCTTCCTTGCCGTAAATGGAAAGATACATCTAATTATAGAATT
+TATATGTTTTACCCTACGGCAGTGCTGGCCATTCAATATCCTGTGCAGTTGACGTATCAA
+CACGGTTCAGCAATACCCGATACTTTTTCCATGCTTCCAGCAACGAGATTTCTTCCTCCG
+TTGCAATTTCCAGATCTGCAGCATCCTGAAGCGGCGCAATATGCTCACTGGCTACCTGCA
+TCAGGTTGTTTTTTGTTTCTTCCGCCTCCCGGATCCGGAACAGTTTTTCTGCTTCCGTAT
+CCTTCACCCAGGCTGTGCCGTTCCACTTCTGAAACTCCCCTTCCGGCGATAACCAGGTAA
+CATTTTCCGGTAACGGACCGAGTTCAGAAATAAATAACGCGTCGCCGGAAGCCACGTCAT
+AAACCGTTTTACCCCGATGATCTTCAACGAGATGCCACGATGACTCATCACTGTTGAAAA
+CAGCCACGAAGCCAGCCGGAATATCTGGCGGTGCAATATCGGTACTGTTTGCTGGCAGAC
+CTGTATGAGGCGGAATATATGCATCACCTTCACCAATAAATTCATTAGTTCCGGCCAGCA
+GATTATAAATTTTTATGGTCCGTGGTTGTTCACTCATTCTGAATGCCATTATGCAAGCCT
+CACAATATAGTTAAATGCGATGTTTTTGACGGTGTTTTCCGCGTTACCAGCAGCGTTAAC
+GGTGATGGTGTGTCCATGTGAACCAATCGCAACGGAGTGCGTATGAGCACCAATACCGAC
+AGTATGTGCATGCGCGCCTGCGCTTGCAGCAGTGCCGGACAGCGAGTGGGTATGAGCACC
+ATCTGATGATGTCTTCCCTGCATTACGAGTCTGGCCACTACCGCTTGTTGTGCTCATAAT
+CCCCGCGCTTAGATTTGAAATCGCGGTATAACCATTAGGGAAAATGCTCGTGTTCGTGCC
+ACCAAATGCACCGGAACTCTTGTGTTGGTGCGCACCGGCACTATTTGCGGTCCCGCTAAT
+ACTATGGGTATGCGCCCCGGTGTTATTCGTGGATTTGGTTCCGTAATCAAACGACGATGT
+GGTTTCCGTCCCCAAATCCGTACTGGATGCGCTGGCGCTGTGGGTGTGCGATTTAATGCC
+GTCCTGTTCCTGAGATAATACGGCCCGACCACTGGCGGGCTTGCCCTTAATCGTCCAGCC
+ACGCATATCAGGGATCACGCCTGACGGATAAGCAACTGCAAGTTTCGGGTATGCAGATTT
+GTCAAAAGTCTGCCCCTGCATCAGGGCATAACCAGACGGAACGGTATCTGATGGCCACGG
+GATTGGTGCACCGACTGGATAAAACTCTGCAGGAGGATGAGCCGAGGTGTAAAGCTGCGC
+CCACGGCGACCAGTTTGCGTCGGTCGTATCCCGTCGTGAACGAATAAATGCCGGAGCATG
+AGCACCGCTTGTACCACTCCAGCCGATGAGTAACTCACCTTCGCCAACGGCTGTCATCCC
+TTTCAGGTGAATGATATTTCCATACGCTGTTGGATATCCGTTGTTATACACCTCGTATAA
+CTCAAGACCTGCTGCCCCCTGCGTATTGTCTGTCAGCGCGGTTATATTCACTCAGCAACC
+CCGGTATCAGTTCATCCAGCGCGGCTGCTTTGTTCATGGCTTTGATGATATCCCGTTTCA
+GGAAATCAACATGTCGGTTTTCCAGTTCCGGAAAACGCCGCTGCACCGACAGGGGGATCC
+CGTCGAGAATACTGGCAATTTCACCTGCGATCCGCGACAGCACGAAAGTACAGAATGCGG
+TTTCCACCACTTCAGCGGAGTCTCTGGCATTTTTCAGCTCCTGTGCGTCGGCCTGCGCAC
+GCGTAAGTCGATGGCGTTCGTACTCAATAGTCCCTGGCTGGAGATCTGTCTCGCTGGCCT
+GCCGCAGTTCTTCAACTTCCCGGCGCAGCTTTTCGTTCTCAATTTCAGCATCCCTTTCGG
+CATACCATCTTATAACGGCGGCAGAGTCATAAAGCACCTCATTACCCTTGCCACCGCCTC
+GCAGAACGGGCATTCCCTGTTCCTGCCAGTTCTGAATGGTACGGATACTCGCACCGAAAA
+TGTCAGCCAGCTGCTTTTTGTTGACTTCCATTGTTCATTCCACGGCCAAAAACAGAGAAA
+GGAAACGACAGAGGCCCAAAAGCTCGTTTTCAGCACCTGTCGTTTCCTTTCTTTTCAGGG
+GGTATTTTAAATAAAAACATTAAGTTACGACGAAGAAGAACGGAAATGCCTTAAACCGGA
+AAATTTTCATAAATAGCGAAAACCCGCGAGGTCGCCGCCCCGTAACCTGTCGGATCACCG
+GAAAGGACCCGTAAAGTGATAATGATTATCATCTACATATCACAACGTGCGTGGAGGCCA
+TCAAACCACGTCAAATAATCAATTATGACGCAGGTATCGTATTAATTGATCTGCATCAAC
+TTAACGTAAAAACAACTTCAGACAATACAAATCAGCGACACTGAATACGGGGCAACCTCA
+TGTCAACGAAGAACAGAACCCGCAGAACAACAACCCGCAACATCCGCTTTCCTAACCAAA
+TGATTGAACAAATTAACATCGCTCTTGAGCAAAAAGGGTCCGGGAATTTCTCAGCCTGGG
+TCATTGAAGCCTGCCGCCGGAGACTGTGCTCAGAAAAAAGAGTTTCTTCTGAAGCAAACA
+AAGAAAAGAGTGACATTACTGAATTGCTCAGAAAACAGGTCAGACCAGATTGAAGCAATT
+TAGATAATCGTGCAGACTACGCCCCCTCATATCACATGGAAGGTTTATCTATGGATCAGG
+TAGTCATTTTTAAACAAATATTTGATAAAGTTCGAAACGATTTAAACTATCAATGGTTTT
+ATTCTGAGCTAAAACGTCACAATGTCTCACATTACATTTACTATTTAGCCACAGAGAATG
+TTCATATTGTATTAAAAAATGATAATACAGTGTTATTAAAGGGCCTAAAAAACATTGTGT
+CTGTCAAATTTTCAAAGGATAGGCATCTTATAGAAACGACCTCTAATAAGCTGAAATCCA
+GAGAGATCACATTTCAGGAATACAGAAGAAACCTTGCTAAAGCAGGAGTTTTTCGGTGGG
+TTACAAATATCCACGAACAAAAAAGATATTACTATACCTTTGATAATTCATTACTATTTA
+CTGAAAGCATCCAGAAAACTACACAGATCTTACCACGCTAAACCATAACGTCCGGCTTCT
+CTCACTCCTGAGCCGGACTGCATTGGTTTAATAAAAACCATCAACAATTGTGATTTAGAT
+ATTCGGAACCATTCAAATATAACAAAACCCCGTAAAAACGAGGTTTATGGATAAATTTTA
+TTATTGAATACATCAGATTAAATTAATCTTGACATCATAGCTTTCAAGACCCGTCATTTT
+TTCCCGTGCGGTAAACTGAATACTGGTAACTTCTTTCCCGGTCTTTTTCTTAAGTTCAAT
+AATTTTTTTTGTTATATATTCAGAAATATCTGCTTCTGCTTTTGTTTTTAAGTTTTCAAT
+ATTCATCATTTCCTCTTTTAGTCTGTTATGACTTTCCAGTTACACAGTAAGTCGATTATA
+TGGTGCAAACGTGTAAAAGATAAGATGAAACATCGCAATAATCAACATACGATAGTCTAA
+ATTTTACACAAACAGACAAAGAGAATTTTCCTGAATTATCAATGCAATAGCATCAAATCA
+ACTCAAGAGCCTTATTGCTGCTTCCAGAATTTCTTCTGAAGTAACATGTCGATCCGCGGC
+TACATAAATGACTTTATGATCTCCGGTCAGAGATGGAAACCCTGCGGCCATTACAGTAAG
+GTGTGTTTTTTCGCCATTTGGATATTCACGCATGATGGTGTTAACTCCAGTCATCGCTGG
+CACTACCACTGCTGGTTCAGAGTTAAAAAAACTATGATTTTTTTCATGATGTTACCGTAG
+TATGTGAGTATCCATCGAATAGACACCAAGCAAAAAAGCTCCCGAAGGAGCCTTCATTTT
+CACTTTTTTAAATCCAACGACAGACGGCTGGCATTTAAGTATTGTGAAATATTATCAAAT
+GTAATCATCATTGATTTACAAAAGATACATTTTGCCCCGAAAGGATTCATGTCAGAAACA
+TCAAAAGATGATGTTCTATACTGGGAACCATGACAACACGGGCATCTAAAGTGAATATGG
+TTTGTAATATTGTCTACCTCAAAGCGCCACTACATGAACAGCGGCAGGACCTTTAGGTCC
+GTTCTCAATACCAAATTCAACTTCCTGATTCTCAGTTAATGTTTTGAAATCGTTGCTCTG
+AATTGCTGAGAAATGGACAAACACATCTTTGCTGCCATCTTTCGGCGTGATGAAACCAAA
+ACCTTTTTCAGGGTTAAACCATTTCACTAAACCAGTCATTTTGTTAGACATAATTATTAC
+CTTTTGAAGAAATTAGCCCTTGGGCAGAATGGTCCGAAAAAAAATATCAGAGAGAAAAAC
+CAACAAGGAAATCTCAAGAGGTACAAATAATAAAATTATAACAATGACTGCTTCAGATAA
+ATTTGTAACAAACCAGAACACCATTAACGCATGATTAACCACCCATAGCAAGGATTACTT
+TTGTAAAGAAAAACACAGCAATGAAAGAATAGCTTTATTTATTAATAAAACGTGTCATTC
+TGATTAAGACCTTTTATCTTACCCTTAAGATTTCAGGAATTTTGGCTCATGGAAGAGTCC
+TTTTTATTTAAATTTTACATTCCGCGATGTAAATGTTCCGATTTAATATTACCCTACATT
+TGATGCTTTTTATCTCTTAAAGATTCATAGATCTGTTGACAAGTCACTCCTGCGATGTAG
+CGTTCGTCAGCAATTTCAGCATAAAGCTGAGCTTCTGCTGCAATATCTCCGAGCATGTTG
+GTGAGCATTCCTTCGGCGGTTTTGGTTGTTTTGCCTCTGACGGCAGCGGCAAGATCTGCG
+GTATGCTTCGCTGCGTCAAGGCGTATGGCATATTTTTTTGCTTCGGCACGCAACTGGTTA
+ACACTATCAGACAGATAAGCAGCCCTGGCAGAAATTTCAGCAGATTTCTGTTGCGCATCT
+TTAACAGCCTCATCACGGGCTATAGTTCGCCCCTGTTCAATTATTCGAGCAGCAAATTGA
+GCATTTACCTCTTGTGATAATGCGGCAGCATCACGTTCCGCCCATTTTTTTTGCCATCCT
+CGGTCGCTCCAGACATTTCCGACGATAAATCCTGACAACACGAGAAAAATCACCATGAAT
+ATCTGATTCACTGTTCTATCCCCCAGCAGGTTAATGCGCTCTCCTGGTCACGACGAATAA
+CCTGACCGTAACAGTTATTTGAACGAATGCGGCAATCGCGTCCGCCATCCTTAATCCACC
+AGCGAATCGCTTCGCATGCACCTTTACGATCACCAGCATTCAGCCGCTTATAAAACGTCG
+ACGGGAAACACTTACCGGGGCCAATGTTATAGGGACAAAATGACGCGATACCCGCTTTTT
+GTGGTTCGGTCAGTGGTACTTTAATATTGCGCTCCACCCATGCCAGCGCCTTATCACGCT
+CAATGGCGTTGACCTGGTCGCATTTTTCCTTCGACAGTTTCATATTGGGAAAAACGGTTT
+TTCCATCCACCACTGTGGCACCCCGACAGATGGTCCATATGCCAGAACCATCGCGGTATG
+CCATTGTGTGGTTACCTTCTTTTTCGTCCAGAAACTGGTCAAGTATCTGAGGAGCAGATG
+CGCCAGCACCAATCAGCGCCAGAACGGCAGCCGACAGGCCGTATCTGATTTTTGTGTTCA
+TAGATATTTATGATGAGGACGCTCGTGCTTATTGGCAGGATTTTCAATCTTAAAGGAGTA
+CTGATGCTGCAGATAAGACTCAACTTTTTCTGACAATTTTTCTGCTACTTCCAGGAAGAC
+TTGCCGGACGCTCCTTCTGGCTGCTGCCTCATAAAACTCCAGCGCAGCTCCTTCAACACG
+GTCCATGGCGACATCCAGGTCAAAAATTTCACCGTCAAAGCGTTCTTTGTCCTGTAAGGC
+TACAGTTACCGTAACTTTATTCTCAAAATTACGGACTCCTTTCACAACCAGTTCATAGTC
+TTGAGTCATTGGATTACTCTCCTCTCGCAGCCTTACGCCTGTCTTCTTTAATCTTGAAAT
+AAAGATTTGTCAGATACGTCAGCAGGCCAAAAACCAGGCTACCCAGCACACCGATTGCAG
+CCCACTGTGACGGAGTTACTTTATCGAGTAACTGCAATGCCCAGAAACCAGCATTACCCG
+CCGATGTGCCATAGGCAACACCTGTTGTTAACTTATCCATTGATTTCATATCCTCACCCC
+GATGTACACGGATGGTGCAATATGTTTGAAAAGATCGGAGTCTACGGGGTAGTTTTGACA
+GCACACGTTGTTCTCAACGGCGCTAAAAAAACATACACATTAAAAATGTGGGTAATTATT
+TTGAAAGAAAGTCATATATAAAATAATAATACGAGAAATGTTTTCATATTTAGTGTACTG
+TATACGGCCATTTATACAGGAAAAGCCTATGTCAGAACGTAAAAACTCAAAATCACGCCG
+TAATTATCTCGTTAAATGTTCCTGCCCAAACTGCACCCAAGAGTCAGAACACAGTTTTTC
+AAGAGTACAAAAAGGTGCCCTTTTGATCTGCCCTCATTGCAACAAAGTATTCCAGACAAA
+TCTTAAAGCTGTAGCCTGATTGATTTTATTAGTAACAAGTATTTTTTATATTTTAATAAT
+ATATTTAAAGCAGATAATAAAAAACCCGCCTGAGCGGGTTTGAGATTGTGGTGCTTTTTG
+TGGGAGTCATCCACTTACGCACTTTGTTTTGCCATGCCAGCAGTTAGCTTCTGCTGTAAA
+ACTATTCATGCAGCAAACCTGCACTTCACCACAATGGTTAGCATACTTTTCCTGATTAAG
+ATTTTGCCAAATATGCTAGCCATTGTTTCATGTATTGGACCTCCTTACTTTTTATTAAAG
+AGATCCAATATTCACTACTCTGTCCGTATCTCTACTCAGGCATCAGCCTTCTTCGTTATC
+GTATACAGACGAGCGATGAATTTTAATCAGTAATGATGACATTTGCTGCTGCAGGACCTT
+TAGCACCACTCTCTATAGAGAAGGTAACCTTTTGACCTTCAAATAAGGTTCGATAATTAT
+CATTCTGAATCGCAGAAAAATGCACAAACACATCTTTACTACCATCAACAGGAGAAATAA
+AGCCGAAACCTTTATCAGCGTTAAACCATTTTACTAAACCAGTCATTTTATTTGACATTC
+TACATTCCTTAACTTGAGCCTTTCGGCATAAATGGTTTGCATAACAGAAACGACTTCGTA
+CTTAATTGGAGAGACTCAAAGAAGGAATAAGTGAATAACACCTGAAATGAGAACTGCTTT
+AGTAAACTACTTCGTATATCGTCTGTTCTTCAAACCGACGCAATCATTAACGCATAGTTG
+AACATATGAAGCAATGTTTATTTTAGACATCCAGCCATCTTCAACCCCATCAAAAAACTA
+TAGCTTTCTTCAGGAACGTGTGTATAGTGCGCCAAGTTATCAGTATTAAGGAATTTTTTT
+GTCCCGTAAAATGACAGGAATTGTCAAAACCTTTGACGGCAAAAGCGGCAAGGGTCTTAT
+CACCCCATCCGATGGTCGTATCGATGTCCAGCTTCATGTTTCAGCGCTCAATCTCCGCGA
+TGCAGAAGAAATTACCACCGGATTACGCGTGGAATTTTGCCGGATAAATGGTCTGCGTGG
+CCCTTCAGCTGCCAATGTTTACCTTTCATGAGCTATATTAAAGCTTTAATTTCAGGCCCC
+ATCGGATCACACATGGAGAGTTTTTATGAATAACCCCGTCTGTCTTGATGACTGGTTGAT
+TGGCTTTAAAAGCTTATGCTGTACTTTGGCCGTAATAGCTCTGCTAATAATATAATAAGC
+AGACTCATTGTGTTTAGGGACATTGTACTGGAAGAAAACATTTTAAACATCAGGCAAATA
+ACCAAGTCACCAGCTAAATAATAAGTTAACAGACATGAGTCCCGGGATGAGATTCAACAT
+TACCATTGCCCCATTTAAAGCACAAAACCCGCTCATCAGCGGGTTTTCTACTTTTTCTTA
+ACGTCGGGTATACAAAGCCCATCGTTGAAAAAATTTTATCCATATTTTTTGAAAAATGCA
+AACATCATGTCGCCATCTTCAGCAAAAATCATTTATCTCGTCACCTTCCTCAATTGCGCT
+TCCGCGTATGCTTCTTCCTGCCAGCACTTTGTTACCAGTTTACCAATGACGTCCGCATAC
+CCCTTATACCACTGATAATCGGTCAGGTCTGGTACCAGCTTCTGGACATGACGTCGTGCC
+AGCGTGGTCGGTAAACGACTAAACCGGTTTCCATTACAACGCCCACAAATCTTATATACC
+GGTACGCCATGAAACCGGGTTCTTTTTTCATCCAGAACAATCCCTTTACCCTTACACCCT
+CTGCACGCTGTGCTGGCTTCGCCCTTACCATGGCAATGCTGACATAGTTCCTTCACCCAT
+TCTTCCTTGATTACAGATTCCCCGCGTCTGTAGTGTTTCACCACTTCGCGCAATACATTA
+TAAAATCCCGTACCTGAACAATGCTCACAGCGAGCCTTACTTGCCGCAGACCTGGAGTAA
+TCAGCAAAGGCAAAACTCACGAGGTAAGGAATAATCTGTAACCGGATTTCTTCACTCAAT
+TTGTTCAATGTCGGGTTATCCAGTGCCATCGCGTAATTTAGCAGGCCTTCAATCGCAAAC
+TGAGGGTCCTGAACACCAACTTTTGCCAGAAATAAGGCCAACCCAAGTGGTGCTTTCGAC
+TGCACCATCCCCTGCGCTGCCATTACATCCGTAATTGTTAAACAACCGGTGCCTGTCGCT
+GGAGCGTCATCGCTCAATTTTGGAGATTTTGGGGAGTAATATTTTGGTAAGGCTTCAAGG
+TTCATGCTCGTTCTCCACTTACGCCAGTACGCCAATTGCCAGCGCGCGATCGATAAAACG
+AAATATCAGCTCCAGTTGGGAGCCATACTTATCTTCAAATGCCACTGTATCCGTATGCAG
+CTCGTTGTGATGCTTTCTGCACAAAGGCAACACAAAGAGATCATGTGCTTTTGTTCCCAT
+TCCGCCCTGCCCGTGACCAATCAGATGATGCGGATCGTCGGCTGGCATACCGCAGCAAGC
+ACACGGCTGTGTCTTAACCCAACGTGTGTATTTCTCCTTAACCCAGCGGCGACGTTTAGG
+CAGCTTCATGAAAGATTCCGGAGACTCTGGATCAACGGTGATGCTTACCACCGTCTTTTC
+CTGTGGTGATTTTTGTTGCTGGTGGGCGTAAGGCAACGGTGCAAGATTTTTTGTGCGTTG
+TTTCAATATGCTGGTGGCGGTCAGCTCTCCCGGTACGATGTCGCTTTCGCGGTACACCGA
+GCAGATTTTTTCCGCTGGTAATCCCAGCGAACGACGCGATACAGCCTCAGGTAGTGCATC
+CACCACCTGATTGCAGACCGCCCACCAGGATAATTCAGCCAAAGATAATTCCCGCTCCTG
+CGTACCGCTTATTGCGTGACGGATGACGTCAATCACCCATGCTGTCAGATTTTGTTGAGC
+AAGCAGCTCCAGTGATTCCGATGTCTGGTCACGCAGTTGGTTGTCGCAGTGCCAGCACAA
+CACCATTGCGCCGGTACCATAACGGTGAATGACTGTTTCAGTGTGATGGTAATCGCCATT
+AGGCCACTGGCAGGATGTAACATGACGTAATAGCCAGTCGGACAATGCGCCAACGCCGCC
+AGCAGCACGAATCACCCGTTCGTTACTAAAAAACGGCAGCAATGTTTTGTCTTCCGCCAG
+CGGCTGGCGAACGGCAGGAACGACTCCGGATGGCAGATTACGCATGCTTTTTGGTTCCGG
+TTCCACCAGCACTCGAGGATTATGAAATATCTGTATGGATTCACGGCCCGGCTTAAGGAC
+CACCAGCCCAAGCTCAGGCACCAGAACAGGTCTAAGTAATACCCGCACGTTACCTCCAGA
+TCCGTTGCTGGAAAGTGCGGGACGCACGTGGTGGGCGTTCGGAATAAGGCAGCCTGACAG
+AGATTATCCAGTGCCGATAGTCGAGACTGAGAGCTTTCTTAACCTCGAACCCGCGCCTGC
+GGTAAGAATGAATCAGCCATTCGGCCTGTTCTGCAGTGCATGGAGGGTGCTGGAACCATT
+CAGACTTGAATGCGTGAGAATACCGCCCGTGCGTGCAGGCAAGAACGGGCGAATTATCAG
+AATTGTAATATTTTGCGTTGCGTGCCATCGGTTTTCTCCGGTGGCACGGTGTTACTCAGC
+GGGAGTTCAGCCCCGCGCAAGATTGTAGATGAGTTTATTCTCCTGAAAAAGCAGAAAAGC
+CAGCTTTTATTCCGATCTCTTTCAATGCCTGTAATGAAGTGACAAACTCACCTTCGCGCA
+AGATAAATCCGTCCGTGACCCGAGCATCCACAAAATTAATTAACGCAGCCCCATTCTTTC
+GCAAACACATAATGCGGTAATGACTAACAAGATTTCCATTTTCAACGCACACAGCATAGA
+GGCCATCTTCACAAAAAATTTTACGCAGTTCTTCGATGTTCATCATCAGAATCCTTCCGG
+ATAATTAGCTCTCCCCTTTAAGGGACCATCCCTCTTATCCCTGCGCGCTACTTAAGTATT
+TTTGATTCTATTCCGGCACCGTCCAGAACTTCAAACGCGTTGAAAATAAAAACAAAAACC
+CGCCGAAGCGGGTTAAGTGCGGGTGCGTTGAGGATGCCTGCCACATCAGAGGTGGCGAGG
+GATTTCTCCCCCGCCGGGTCTCTTACTCCTCAGGTTCGTAAGCTGTGAAGACAGCGACCT
+CCGTCTGGCCGGTTCGGATTCGTACCTCGCAGAGGTCTTTCCTCGTTACCAGTGCCGTCA
+CTATGACGGTTAAACAGATGACGATCAGGGCGATTAACATCGCCTTTTGCTGCTTCATAG
+CCTGCTTCTCCTGTCAACGCAAAGCAGAAGTGTCACCTTCGGTGCGAAACAGAGATGTCA
+TGCTTTGGTTCAGAGAATGCGTTTGACCGCCTCGCTATATACTTCCGAGCGTTCTCTTTT
+CCCAACAGAAATCACGAAAACGACAACTTTCTCGTCTATAACCTGGTATACAAGGCGATA
+GCCTGAAGACCGGAGCTTAATCTTGTAACAATCAGGCATACCACGGAGCTTGTTTGCTTC
+AATCCGGGGTGACTCAAGTACTTCAACCAGCTTCTTTTTCAACTGTTCACGTACCGTCGA
+GCCCAGCTTTCGCCATTCCTTTAGTGCCCGCTCGTCAAAATCCAGAAAATACGCCATCAG
+AGTTCATCCAGCGTCACACGTACTGGCTTAGGATTACGAAGCCGTTCTTTCACTATCTCC
+ACAAGTTCAGCATCTTCATCACTCAGGAGTGTCTGTTTGAACGGCAAGCGTTCATTGTCA
+GCGATATACTCGAGCATGAGACGAAGCGCTTCAGAAGGAGTTACACCCATTTTTTCAAGC
+GCGGCGTAAGAACGCGCTTTAAGTTCATCGTCAATACGCAGGTTAATGCTACCCATGTCT
+TACACCTCTTGTAATTACAAATGTCATTACAAGTATCGCACTACAACATGCTTAGGGCAA
+GTCACGAAGGAAGTCAGAAAGTAGTCGTAAGAACGGTGATCACTGTCCGCTTTGTGCCAG
+GAGCAGCCATTGCTAAGTCCATCCTGTATTGTGCAGGTCAGCTCGTTTTTAAAGAGTCCG
+GCCATCATCTTACTGGTACAGACACCATATACTTTGTGACGGTCAGGCTACATATGCACA
+ACTCAACTTATTCATCTATTTTTTGCTTTAGCATGTCAGTGTTGCTTTCTCGTCGGCGGG
+TGAGCGGTGACCTGACCTGTCGATAAAGGAACGTAACACGTTTTATGCAACACCCGCATG
+CGGCAGAAAATTATTGCCGAACGTTTACCCCTGTCAACAAGCTTTACTTTCTGAGGCGCG
+CCAGCCCGCGAGGAAAACAATCTGAACATCAAACAATTAATGACACAAGAAATACGATTA
+AAGATTTTTTTGTGCATGCCGATAGTGCTTTTTTAAAAGGAGAAATCTATGTCTGTCACA
+ATTCAGGGAAATACCTCAACCGTTATTTCAAACAACTCCGCCCCGGAAGGAACATCAGAA
+ATAGCCAAAATCACAAGACAAATTCAGGTGCTGACTGAAAAGCTTGGGAAAATCTCATCG
+GAAGAGGGGATGACGACACAGCAGAAAAAAGAAATGGCTGCATTGGTACAGAAGCAAATT
+GAAAGCCTCTGGGCTCAACTGGAGCAGTTGTTAAGGCAGCAGGCAGAGAAAAAGAATGAA
+GACGCGACAGTTCAGCCTGATAAAAAAGAAGAGAAAAAAGACGATACAAATACCGCTGGC
+ACCATTGATATTTACGTCTAAGTGACAGCCGTATTGTGGCCCTCATCGGGCCACTTTTCG
+CCATCAGCCTTTTCTTTAAAGACATATTATCTTTGTATCATTTCTGATAGTTAACATTAC
+AAGATATAAGTAATGGACGCACTCCCAATTAGTCTATTTAAATCGCCACGAGTTTAACTG
+ACAACCCATGATCAATTATGAATTGCAACTATTTCTGTAGTCACTTTTGTGGGGACAGTC
+CACAAAACTGCCAACTTCCGCTTCTTGCTCTTAGCGGACATTAGCATAGGCTATTTACCA
+TAACGCCTCATTACGCGCACCGCCCAGACTGACTCAGCGCGTTTCTGGCATATCCCCGGT
+AAAACAAGTAACAAACCACCCGAAAATGAACACCAGAAACGCGACTTAAGAATCTACCCT
+ATGAATGGATATGCACTCAACCGAATCGATCTTGGTTTCAATCTTTTTTATCGGGATCAG
+GCTTCTTTTTAGGTAACTTCGGGGGCTTAACTTGCTGATGACTTTGCGTTCGGCGCGTAA
+GCCAGGGATGGTCAGCTTTAGGTTTAACATAGTATTTTGAGCGTAAATCAATACGGGCAT
+TATCCACTCGTTCATGGACACTCTTTTCATCATCCAGTGGTAGCCTCCATAATTGCAGGC
+ACTAGCGCCGTGAACTTTTCACGCTTATCCCTGGTGTCGATAGCCTTCCAGCGTTCAAAT
+ATCTTCACTCGATTAACGCCAAGCGCTCGCTGATCAATCGCGCCACCTTCATATGTGACA
+CGCTGAACATCGATGTTCGGGCGCTCTTTCAAAGCCCAGAATGCTTCAGTGATTAATATC
+GTCGCCTGCTCCTGTGTCATTCCTGGTCGACATATCCAGGCATCCAGAGCCTCACGAGCC
+TGTTCAGGAGTGATTTTCATTGTTCAACCGCCCCGCCCGCTTCGTCTTACGATATTCATC
+ATAAACTTTGGGATCATACTGAAGCTCCCCGCCAGATGCCTCCTGTAGACGCATCGCGCG
+ACCTTCGGGAACTAAATCCCCTTTCCAGCTATAAAGCGAAGCCAAACGAATACCTGCTGC
+TTGTGCAAGTTTTGTTTTTGAACCGAAATACAAAAGAGCGTCAGTTTTAAGCATTTAAAA
+CACCTTTATTGTTAGTCATAACTAACAAGATAGATGTTAACAAAAACATAGTCAATACGA
+TTTAGCATTAGCTAACTATGGAAACAAAAAATTTAACTATCGGCGAACGCATCAGGTATC
+GTCGGAAAAACCTCAAACACACCCAAAGGTCTCTTGCTAAAGCCCTGAAAATCTCCCATG
+TGTCTGTATCACAATGGGAACGGGGTGATAGTGAACCTACAGGGAAGAACCTTTTTGCCC
+TCAGTAAAGTATTGCAATGCTCACCAACATGGATTCTATTTGGCGATGAAGACAAGCAAC
+CAACACCACCTGTTGAGAAGCCAGTTGCCTTATCCCCCAAAGAACTAGAGCTCCTTGAGC
+TGTTTAATGCACTGCCAGAATCAGAACAGGATACCCAGCTCGCCGAAATGCGAGCTCGAG
+TAAAAAACTTCAATAAACTCTTTGAAGAATTACTAAAAGCCCGTCAGCGGACAAATAAAA
+GATAACATCATCAATGAGTTATCTTTTACCACATCAATTATGTTAGCTATAGCATACAAA
+ATCACTTGACCGATATGTTAGTCATGGCTAATCTTGTTTGCATCAACACACCGCACGGTG
+TTCTCAGCAAACAGTTCCGCTACCCCAGCGTTAAGGGGAAATGAGGTCAGCATGGATACT
+ATCGATCTTGGCAACAACGAATCTCTGGTGTACGGCGTGTTTCCAAACCAGGACGGCACG
+TTCACCGCAATGACGTATACCAAAAGCAAAACGTTTAAAACCGAAAATGGTGCCCGTCGC
+TGGCTGGAAAGAAACTCAGGTGAGTGATATGGATTTCGACACAATCATGGAAAAGGCTTA
+CGAAGAATACTTCGAAGGCCTTGCCGAAGGCGAAGAAGCTCTCAGCTTCAGTGAGTTTAA
+ACAGGCGCTTTCCAGTTCGGCAAAATCTAACGGCTGATAAGCGAAACAGCACCGCGAGGA
+ATCAGTATGCAGAAACGAGAACCCGTCATCATCGCGCCAGACTATACCGATGATGAACTT
+TATGAGTGGATGCGCCAGAAAATTAATGCAGCGCAGGATCTGAAATGGGCTAATGAAGCC
+AGGGCTAAGCAGGCTGAAAATCTGTCCGCTCTGGAGCAGGATATCACCAATCTGGAAAAA
+GCAGCGGCATTAAGCATTGCCAGAATGATTACATACCCGCGTTAGTAGCTAATCAACAAA
+GCTAAGGTTAGTAATTAAGGAGTTCTCCACGGGTGAGGTGGAGTGCGTGCGCCGGACACG
+GGTGCGCATCCGGAACTGACAGTTTACTGAAAGGATATTTCCCTGAAAAGTCAGACCATA
+ACGCGAAAGCGCATGGCGAGGTAGCTGGTTCATAGATAGCCTGTCGTTAAATTTTCGTCG
+ACCGTGCGCTTCCGGTTGTGGCAACCCGCGAAATGGCGCGGCGGTAAGTATGGCGGGGTT
+ATTCCTTCCCCGTTGAGGACACCGGGTTGTCAGGTTGACCATACGCTTAAGTGACAACCC
+CGCTGCAACGCCCTCTGTTATCAATTTTCTGGTGACGTTTGGCGGTATCAGTTTTACTCC
+GTGACTGCTCTGCCGCCCTTTTTAAAGTGAATTTTGTGATGTGGTGAATGCGGCTGAGCG
+CACGCGGAACAGTTAAAACCAAAAACAGTGTTATGGGTGGATTCTCTGTATCCGGCGTTA
+ATTGTTAACTGGTTAACGTCACCTGGAGGCACCAGGCACTGCATCACAAAATTCATTGTT
+GAGGACGCGATAATGAAAACGTTATTACCAAACGTTAATACGTCTGAAGGTTGTTTTGAA
+ATTGGTGTCACTATCAGTAACCCAGTATTTACTGAAGATGCCATTAACAAGAGAAAACAA
+GAACGGGAGCTATTAAATAAAATATGCATTGTTTCAATGCTGGCTCGTTTACGTCTGATG
+CCAAAAGGATGTGCACAATGAATTCAGCATTTGTGCTTGTTCTGACAGTTTTTCTTGTTT
+CCGGAGAGCCAGTTGATATTGCAGTCAGTGTTCACAGGACAATGCAGGAGTGTATGACTG
+CAGCAACCGAACAGAAAATTCCCGGTAACTGTTACCCGGTCGATAAAGTTATTCACCAGG
+ATAATATCGAAATCCCGGCAGGTCTTTAAAACAGTTCCGTAATAAATATCCGGTTTCATT
+CTTATATGCCAGCAATGGCAGGGATTTGTTCATCCTTAAATCTGTCATGAGGTTAAAACA
+AATGAGTAAAGTCTTTATTTGCGCCGCTATTCCTGACGAACTGGCAACAAGGGAAGAAGG
+CGCTGTGGCTGTAGCCACAGCCATTGAAGCTGGCGACGAACGCCGTGCTCGAGCAAAATT
+TCACTGGCAATTCCTGGAACATTATCCGGCTGCTCAGGACTGCGCTTATAAATTTATTGT
+CTGCGAGGATAAACCTGGCATACCCCGCCCTGCCCTCGATTCATGGGATGCTGAATATAT
+GCAGGAAAACCGCTGGGATGAGGAGTCTGCTTCTTTTGTCCCGGTTGAGACTGAATCCGA
+TCCGATGAACGTCACTTTTGACAAGCTGGCCCCTGAAGTACAGAACGCTGTCATGGTTAA
+GTTCGACACATGTGAAAACATCACCGTTGATATGGTTATTAGCGCACAGGAATTGTTGCA
+GGAAGACATGGCAACATTCGACGGACATATCGTTGAAGCGTTGATGAAAATGCCAGAAGT
+TAACGCCATGTATCCGGAGCTTAAGTTGCACGCCATTGGGTGGGTTAAGCATAAATGTAT
+TCCTGGTGCTAAATGGCCCGAAATTCAGGCAGAGATGCGCATCTGGAAAAAACGTCGCGA
+AGGTGAACGCAAGGAAACCGGAAAATACACGTCTGTTGTTGATCTCGCCCGCGCCAGAGC
+CAATCAACAGTACACTGAAAATTCAACAGGAAAAATCAGCCCGGTCATTGCTGCCATTCA
+TCGCGAATACAAGCAGACATGGAAAACACTGGATGACGAACTGGCCTATGGGCGCTGCTT
+CGCAGACAGGCAGAACTTGATGGTATGCCTGCGATCAATGCCAAACGTGTTTACCGGATC
+ATGCGCCAGAATGCGCTGTTGCTTGAGCGAAAACCTGCTGTACCGCCATCGAAACGGGCA
+CATACAGGCAGAGTGGCCGTGAAAGAAAGCAATCAGCGATGGTGCTCTGACGGGTTCGAG
+TTCTGCTGTGATAACGGAGAGAGACTGCGTGTCACGTTCGCGCTGGACTGCTGTGATCGT
+GAGGCACTGCACTGGGCGGTCACTACCGGCGGCTTCAACAGTGAAACAGTACAGGACGTC
+ATGCTGGGAGCGGTGGAACGCCGCTTCGGCAACGATCTTCCGTCGTCTCCAGTGGAGTGG
+CTGACGGATAATGGTTCATGCTACCGGGCTAATGAAACACGCCAGTTCGCCCGGATGTTG
+GGACTTGAACCGAAGAACACGGCGGTGCGGAGTCCGGAGAGTAACGGAATAGCAGAGAGC
+TTCGTGAAAACGATAAAGCGTGACTACATCAGTATCATGCCCAAACCAGACGGGTTAACG
+GCAGCAAAGAACCTTGCAGAGGCGTTCGAGCATTATAACGAATGGCATCCGCATAGTGCG
+CTGGGTTATCGCTCGCCACGGGAATATCTGCGGCAGCGGGCTTGTAATGGGTTAAGTGAT
+AACAGATGTCTGGAAATATAGGGGCAAATCCACAGGTGAACTACGCTCCTCTGTTTGTTA
+CGCAATAAAAACTGGTGTTTTCGACTATGCAAAACAGTTTCCCTCCTCACGCAATCTGGA
+AAAATTTGGTGAGGCCCGACAAGATTTAACCATAAAAGAACTGGCTGAAAAATTTCTGGC
+ACTGAAAGAAACTGAAGTCGCCAAAACATCACTCAACACATACCGTGCCGTCATCAAAAA
+TATCCTGAGCATAATCGGTGAAAAAAATCTTGCCTCATCGATTAATAAAGAAAAATTACT
+GGAGGTTCGTAAAGAGTTACTGACTGGATACCAGATCCCCAAAAGTAACTATATTGTTAC
+ACAACCAGGGAGATCGGCTGTAACTGTAAATAATTACATGACAAATCTTAACGCCGTGTT
+CCAGTTTGGTGTTGATAACGGTTACCTGGCAGATAATCCGTTTAAGGGGATCTCGCCATT
+AAAGGAATCAAGAACCATTCCGGATCCTCTTTCGCGGGAAGAATTTATCCGTCTTATCGA
+TGCGTGCAGAAATCAGCAAGCAAAAAATTTATGGTGTGTTTCTGTTTATACTGGAGTTCG
+CCCTGGTGAGCTGTGTGCACTTGGATGGGAGGACATAGATCTGAAAAATGGAACAATGAT
+GATCAGGAGAAATTTAGCAAAAGACCGTTTCACGGTACCAAAAACACAGGCGGGAACCAA
+TCGGGTCATTCATCTTATTAAGCCAGCAATCGACGCTCTCCGGAGTCAGATGACATTAAC
+GAGACTGAGCAAAGAGCATATCATTGATGTTCACTTCAGAGAGTATGGCAGAACAGAAAA
+ACAAAAATGCACCTTTGTTTTTCAACCTGAAGTGTCAGCGAGAGTAAAAAATTATGGTGA
+CCATTTTACCGTTGACTCAATAAGGCAGATGTGGGACGCAGCGATAAAACGTGCCGGACT
+CCGCCATCGAAAATCATATCAGTCGAGACATACTTATGCCTGCTGGTCGCTGACAGCTGG
+TGCTAACCCGGCATTTATAGCAAACCAGATGGGCCATGCAGATGCGCAAATGGTATTTCA
+GGTATACGGAAAATGGATGTCTGAAAACAATAATGCACAGGTAGCTTTGTTAAATACACA
+GTTAAGCGAGTTTGCCCCAACCATGCCCCATAACGAAGCAATGAAAAATTAATTTAATAT
+TTATCAAATAGTTAACACGCATGACTCTTGAAATCCATAAATTCAAGCGCAGTGCCCAGC
+CATCCCGATACTGCTGCTTTCACCAAATCCTTAGTGCTTCTTTCGTGTTTTTCTATTGTC
+ATAATGGTTATCTCTAAAAAAGAGGTAAGATGCGTACTACTTACTCGCCGTTATTGGTAT
+TATTCAGAAAAAGTGAGTAAGACTTTGCAGCAATGTTTTTGATCCTGTTCAAATAAACTA
+ATGGCATCAGCAACATGCTGGAAATCAAACGTATGGGTAATTAATTTTTCTGGTTTAATT
+AACCCTTTACTTAACCAGTCGATAACGATCGGGAATTTATTTGCATTTAAGCGTGAAGAG
+AAAATAGAGAGTTCTTTTCCGGTAATTCCTTGCTGAATCACTTCAGACGGTTCACTGGAG
+AACCCCATCAATACAATACGTGCCGCTGGAGAAGCCAGCGTTACGGCCTCTTTCAGGATA
+GAAGGATGACAAGCCGCATCGATAATTAATGTCGGCTTGATGCCTTTTTCAGTGAAAATC
+TCGCCAAGCGGTGTCTGGCTGTTATTAATCGCCCAGTCAGCCCCGCTCTCTTTCGCTTTT
+TCCAGTCGTTCATCAATGCGATCGGCAACAATCACATTTTTAACGTTATAGACGCCTTTT
+AATACCTGAACGATCGTCAGGCCGATTGGACCGGCACCATAAACCAGAACGGTATCATTT
+TCAGTCGGTTGACCATGTCCGGTTACGTTAGCCGCAATGGTAAAAGGTTCGATCATTACC
+GCATATTGATCGGCCACTGCTTCAGGAATTTTCCACGCATTTTTTGCCGGAACCACGGCA
+TATTCACTGAAACCACCGTCAGCGTGCACACCTAATACAGCCAGTGTCGTACAAACGTTC
+GGTTTACCTATAGAGCACGGATAGCAATGCCCACAGCTGACCACCGGATCGACAGCAACA
+CGTTCACCGACTCTGGCGCTTTCCACGCCTTCACCCACTGCATCAATGACGCCAAAGAAT
+TCATGACCAATGACGCGCGGATATTTCGCAAAAGGATTATGCCCACGATAAATATGGCTA
+TCTGAACCACAAATTCCGGCAAGTTTCACTTTTACTCGTACTTCACCCGCTGACGGGGTG
+GGTATTTCACGTTCGACAATCGCCAGTTGATTCGGTTTTTCAATTAATATGCTTTTCAT
+>NC_000913.3|provirus_2461306_2476510
+ATGAGCCAGAAAACCCTGTTTACAAAGTCTGCTCTCGCAGTCGCAGTGGCACTTATCTCC
+ACCCAGGCCTGGTCGGCAGGCTTTCAGTTAAACGAATTTTCTTCCTCTGGCCTGGGCCGG
+GCTTATTCAGGGGAAGGCGCAATTGCCGATGATGCAGGTAACGTCAGCCGTAACCCCGCA
+TTGATTACTATGTTTGACCGCCCGACATTTTCTGCGGGTGCGGTTTATATTGACCCGGAT
+GTAAATATCAGCGGAACGTCTCCATCTGGTCGTAGCCTGAAAGCCGATAACATCGCGCCT
+ACGGCATGGGTTCCGAACATGCACTTTGTTGCACCGATTAACGACCAATTTGGTTGGGGC
+GCTTCTATTACCTCTAACTATGGTCTGGCTACAGAGTTTAACGATACTTATGCAGGCGGC
+TCTGTCGGGGGTACAACCGACCTTGAAACCATGAACCTGAACTTAAGCGGTGCGTATCGC
+TTAAATAATGCATGGAGCTTTGGTCTTGGTTTCAACGCCGTCTACGCTCGCGCGAAAATT
+GAACGTTTCGCAGGCGATCTGGGGCAGTTGGTTGCTGGCCAAATTATGCAATCTCCTGCT
+GGCCAAACTCAGCAAGGGCAAGCATTGGCAGCTACCGCCAACGGTATTGACAGTAATACC
+AAAATCGCTCATCTGAACGGTAACCAGTGGGGCTTTGGCTGGAACGCCGGAATCCTGTAT
+GAACTGGATAAAAATAACCGCTATGCACTGACCTACCGTTCTGAAGTGAAAATTGACTTC
+AAAGGTAACTACAGCAGCGATCTTAATCGTGCGTTTAATAACTACGGTTTGCCAATTCCT
+ACCGCGACAGGTGGCGCAACGCAATCGGGTTATCTGACGCTGAACCTGCCTGAAATGTGG
+GAAGTGTCAGGTTATAACCGTGTTGATCCACAGTGGGCGATTCACTATAGCCTGGCTTAC
+ACCAGCTGGAGTCAGTTCCAGCAGCTGAAAGCGACCTCAACCAGTGGCGACACGCTGTTC
+CAGAAACATGAAGGCTTTAAAGATGCTTACCGCATCGCGTTGGGTACCACTTATTACTAC
+GATGATAACTGGACCTTCCGTACCGGTATCGCCTTTGATGACAGCCCAGTTCCTGCACAG
+AATCGTTCTATCTCCATTCCGGACCAGGACCGTTTCTGGCTGAGTGCAGGTACGACTTAC
+GCATTTAATAAAGATGCTTCAGTCGACGTTGGTGTTTCTTATATGCACGGTCAGAGCGTG
+AAAATTAACGAAGGCCCATACCAGTTCGAGTCTGAAGGTAAAGCCTGGCTGTTCGGTACT
+AACTTTAACTACGCGTTCTGATAACGCGTTCGCCTGGATAAAGTCACCTGCATAGCAGGT
+GACTTTAACTCCCCCACTTCACCGAAAGTAGTGTCCTCATTGCTTACCTCCTGAGTTTTG
+CAAACAGCCTGTTGGCAGCTTGCCCTTTCAAATCAATAAGCGGTATCCACAGACAAACCT
+GAAGGGAAAGGCATATTTTCAGGCGTTCTGCTCGTCCTTCTCAAAGAGTTTACTTTTCTG
+CATTTCCAGGATACTCCCCCCCCCTGGCTATTGTGCGCTCATACACTCAAATTAAAGATA
+GGTTCTAAATAAATGAGCGTTTTTTGATAGTCTATTTCATTAGGTAATATATATTTGTAA
+CAAATCAATCAAAATGGAATAAAATCATGCTACCATCTATTTCAATCAACAATACCAGCG
+CAGCTTACCCAGAATCCATCAATGAAAATAACAATGATGAAGTTAATGGATTAGTACAAG
+AGTTCAAAAACCTTTTTAATGGTAAGGAAGGAATAAGCACCTGTATTAAACATCTACTTG
+AGCTTATAAAAAACGCCATACGAGTAAACGACGATCCTTATAGATTTAATATTAATAATT
+CCTCAGTTACTTATATTGATATTGACTCCAATGATACAGACCATATTACTATTGGTATCG
+ACAACCAAGAACCAATAGAATTACCTGCGAACTATAAAGACAAAGAACTCGTCCGTACTA
+TCATTAATGACAACATAGTTGAGAAGACTCATGATATCAATAACAAGGAAATGATCTTCA
+GCGCATTAAAAGAAATATATGATGGAGATCCTGGTTTTATCTTCGATAAGATATCACACA
+AACTCAGACATACGGTAACGGAATTTGATGAGAGCGGGAAAAGCGAACCAACGGACTTAT
+TTACCTGGTACGGTAAAGATAAAAAAGGCGACTCTCTCGCTATTGTAATTAAAAATAAAA
+ACGGAAATGATTACTTATCTCTCGGTTACTACGATCAGGACGACTACCACATTCAAAGAG
+GAATTCGTATTAATGGTGATAGTCTCACCCAATATTGTAGTGAAAACGCCAGGAGTGCTT
+CAGCGTGGTTTGAAAGCAGTAAAGCTATCATGGCAGAATCATTTGCAACTGGTTCCGATC
+ATCAGGTTGTAAACGAGCTCAACGGGGAAAGACTGAGAGAACCAAACGACGTTTTTAAAC
+GTTATGGTCGAGCAATAAGATATGATTTTCAAGTGGACGATGCAAAATATAAATGCGACC
+ATCTAAAAGAAATAGTTTCTACTTTAGTCGGTAACAAAATTAACGTTGGCCATTCTCAAA
+AAATATATAAGCATTTTAAGGATCTCGAAGGTAAAATTGAAGAAAGGCTTCAAAATCGCC
+AGGCTGAATATCAAAATGAAATTAATCAACCATCTGCGCCAGGTGTTAATTTTGATGATA
+TTTAAAATTATTTTTCCAGTTTTTTGATTTTTCAACAGCTGAATATCGGAAATAGTCAGT
+GACGAACATCAGTATTTTTACATAATTACGTCTAGGTCATTGTCGGTTTATCTCCTTTTA
+CTTGTGGTAATTGAGGGATAACAACAAAAAAGGTGAGTTTTGCGACTCACCTTTTTTATT
+TGTTTCTTATTCAGAATCAATATCTTTTAAATCATCCTGAATCGCTTGTGCGTTCGGATT
+TTCCTGCGGTTTGAGTTCGCCGCCATTAGCGATGAAATCATGACGCTGGAAGTACGCTTC
+GCGCACCATAATATAAGGATCGGACGACTGACGCAGCAGACCATCGGAATCCAGCAGCTG
+AGCGCGGGTTTCGATCCCTTCAAGCGTCCATTTACCCACAGACATCGGCCAGGTCAGCCA
+GGAAAGAACCGGGTAAAAACCATCCGCCATATCACCACCGTCATCACGCAGCGTGAAGCT
+ACCGTAGAACGGTAACTGAACGTAAGGCCCATAACCCACGCCATAATGACCAAGCGTACT
+ACCGAAGCGGTGAGGTTCAGTCCGTTGCAGTTTCGGGTTCGCCATCCCTGCAACATCAAT
+AAAACCGCCCATCCCCAAAATGGTGTTCAGGAAAAAGCGGGTAAAGTGGACCATCCCCTG
+ATAAGGGTCGCCCTGCAAGAAGTAGTTAACCATCACCGCAGGTTCTTCAAGGTTGCCAGT
+AAAGTTGCTCAAACCGTTACGCGCCGGTTGCGGAACATAATCACGCCAGGCGACAGCGAC
+CGGTCGAACAATATACGGGTCTAATACATTGAAGTTGAAGTTGTACATGGTGCGGTTGAA
+CCCTTCTAACGGGTCAGAACGCCCTTGCTGATCTGTACCGGAACTCGCACACCCCACCAG
+AAGCGTAGTTCCCAGAGCAAGCGCCGACAGGCGAAGCTTCATAAATGTCTCCCTGTTTTT
+TTATGGCTTATGCAGTTTGCCATCCATGACGGAACGATACCGTATCCGCCTGTTTAGGTG
+TGGGCGATTGTAACAGCACGTCAACTGATGTCCAGACGCCCTGATTTGCTGATTTGATCA
+TAGCCTGGTAATCGCCGCCCTGTAGGCTACTTGATTCTATAGAAACAGAAAAAGGCAAAC
+GCAGCCTTTTCTACATTTTCAGAGTAACTCCCGTCAGTTGCGAGCAAAAAAGCCGCTACG
+CTTTAGCTATACGTGCTAATTCAAGAGAAGAGACCATGGACAACGACAAAATTGATCAAC
+ACAGCGACGAAATTGAAGTTGAGAGCGAAGAAAAAGAGCGCGGCAAAAAAATAGAAATAG
+ATGAAGACCGACTCCCCTCCCGGGCGATGGCAATTCATGAGCATATCCGCCAGGATGGTG
+AAAAAGAGCTGGAACGCGACGCAATGGCGCTACTGTGGTCAGCCATTGCGGCGGGTCTGT
+CGATGGGCGCTTCGTTACTGGCAAAAGGGATATTTCAAGTCGAACTGGAAGGTGTGCCGG
+GCAGCTTCTTGCTGGAGAATCTCGGTTATACCTTTGGTTTTATTATCGTCATTATGGCCC
+GCCAGCAATTATTTACCGAAAATACCGTGACTGCGGTACTACCCGTCATGCAAAAACCGA
+CAATGAGCAACGTCGGCTTACTTATACGGTTATGGGGCGTCGTGCTGCTGGGTAATATTC
+TCGGGACAGGTATTGCGGCGTGGGCATTTGAATATATGCCTATCTTCAATGAAGAAACTC
+GCGATGCATTTGTCAAAATCGGCATGGATGTGATGAAGAACACCCCCAGCGAGATGTTTG
+CCAACGCGATCATTTCCGGCTGGCTGATCGCCACTATGGTTTGGATGTTTCCTGCAGCGG
+GTGCGGCAAAGATTGTGGTGATTATATTGATGACCTGGCTTATTGCCCTGGGTGACACCA
+CCCATATCGTGGTCGGTTCTGTTGAAATCCTCTATCTGGTGTTTAACGGTACGCTGCACT
+GGAGCGATTTCATCTGGCCCTTCGCACTACCTACTTTAGCGGGGAACATCTGCGGCGGCA
+CCTTTATCTTCGCGTTAATGAGTCATGCACAGATTCGTAACGACATGAGCAATAAGCGTA
+AAGCAGAAGCACGCCAAAAAGCAGAACGTGCGGAAAACATTAAGAAAAATTATAAAAACC
+CGGCATAAATGGCGAGGGTTTAAGCAATCGAGCGGCAGCGTACTTACCCCGCACTCCATT
+AGCGGGTATACTCATGCCGCATTGTCCTCTTAGTTAAATGGATATAACGAGCCCCTCCTA
+AGGGCTAATTGCAGGTTCGATTCCTGCAGGGGACACCATTTATCAGTTCGCTCCCATCCG
+TACCAGTCCGCAAAATCCCCTGAATATCAAGCATTCCGTAGATTTACAGTTCGTCATGGT
+TCGCTTCAGATCGTTGACAGCCGCACTCCATGACGGGTAAAAAGTGGATAAAATAATTTT
+ACCCACCGGATTTTTACCCATGCTCACCGTTAAGCAGATTGAAGCAGCAAAGCCGAAAGA
+AAAACCATACCGCCTTCTCGATGGTAATGGCCTGTACCTTTATGTCCCTGTGTCAGGGAA
+AAAGGTATGGCAGCTTCGCTACAAGATTGACGGTAAGGAGAAAATCCTGACCGTCGGAAA
+ATATCCGCTTATGACTTTGCAGGAGGCAAGGGATAAAGCATGGACTGCGAGGAAAGACAT
+CTCGGTTGGCATCGATCCTGTAAAGGCGAAAAAGGCTTCGTCTAACAACAATTCCTTTAG
+TGCGATTTACAAGGAATGGTACGAGCACAAGAAGCAAGTATGGTCAGTAGGGTATGCAAC
+TGAACTTGCCAAAATGTTTGACGACGACATTTTACCTATCATTGGCGGCCTTGAAATTCA
+GGATATTGAGCCGATGCAACTGCTGGAAGTAATCCGCAGGTTTGAAGATCGCGGTGCAAT
+GGAACGAGCCAACAAAGCACGCAGAAGATGCGGCGAGGTTTTCCGTTACGCTATTGTCAC
+CGGAAGGGCTAAATATAACCCGGCACCTGACCTTGCTGACGCCATGAAGGGATACCGCAA
+GAAGAACTTCCCGTTTCTTCCTGCAGACCAGATCCCGGCATTCAACAAAGCACTGGCAAC
+ATTTTCAGGAAGTATCGTATCGCTCATTGCGACCAAAGTTTTACGCTACACAGCCCTAAG
+AACGAAAGAGCTTCGTTCCATGCTATGGAAGAACGTCGATTTTGAAAATAGGATTATCAC
+CATCGACGCCAGTGTGATGAAAGGACGCAAAATTCATGTGGTTCCTATGTCAGACCAGGT
+AGTTGAACTTCTCACTACGCTAAGCTCCATCACCAAACCAGTCTCAGAGTTTGTTTTTGC
+CGGGCGCAACGATAAGAAGAAGCCAATCTGCGAGAACGCGGTACTGCTTGTGATCAAACA
+AATCGGCTATGAGGGTCTGGAAAGCGGTCACGGATTCAGGCATGAATTCAGCACGATTAT
+GAACGAGCACGAATGGCCTGCTGACGCTATTGAAGTGCAACTGGCACATGCAAACGGCGG
+ATCTGTGCGTGGGATTTACAACCATGCTCAGTATCTCGATAAACGCAGAGAAATGATGCA
+ATGGTGGGCGGACTGGCTTGATGAGAAGGTGGAGTGAGCGACCTTAACAACTATCGAATA
+GCACAAAGTCTTGCAATCCAGTGCAAAGCTTTGTGTGTATAAGTTTTGTCTCATCAACCA
+CAGCAAGTATCGATCGATTAAGACTTGGATGATAGACTTCATTCCTTTGATTATTAGCTG
+ATAGAAGAAATGTTAAAGCTATTTGCAAAGTACACCTCTATTGGTGTGCTGAACACCCTT
+ATACACTGGGTGGTTTTTGGTGTTTGTATCTATGTCGCGCATACAAACCAAGCTCTTGCA
+AACTTCGCAGGTTTCGTTGTGGCTGTGAGCTTTAGCTTCTTCGCGAATGCAAAATTCACA
+TTCAAGGCATCGACTACAACGATGCGCTACATGCTATATGTTGGGTTCATGGGGACACTG
+AGTGCTACTGTTGGATGGGCTGCTGATAGATGCGCACTTCCCCCGATGATAACTCTTGTC
+ACCTTCTCCGCCATCAGCCTGGTGTGCGGTTTCGTCTATTCAAAGTTCATTGTCTTTAGG
+GATGCGAAATGAAGATATCTCTTGTAGTTCCTGTCTTCAATGAAGAAGAAGCGATACCAA
+TTTTTTATAAAACGGTACGTGAATTCGAAGAATTGAAGTCATATGAAGTGGAAATCGTTT
+TCATAAATGACGGCAGCAAAGACGCTACGGAGTCAATCATTAATGCTCTGGCTGTTTCAG
+ATCCTCTAGTTGTTCCGCTGTCATTTACACGCAACTTTGGTAAAGAACCAGCATTGTTTG
+CAGGGTTAGACCATGCAACCGGGGATGCGATAATCCCAATTGATGTTGACCTGCAAGACC
+CGATTGAGGTTATTCCTCATCTTATTGAAAAATGGCAAGCAGGTGCTGATATGGTTCTTG
+CTAAAAGATCTGACCGCTCAACTGATGGACGCCTGAAGCGAAAAACGGCTGAGTGGTTCT
+ATAAGCTCCACAATAAAATAAGCAATCCTAAAATTGAAGAGAATGTTGGTGATTTCAGGC
+TGATGAGCCGTGATGTTGTCGAAAATATTAAACTTATGCCAGAACGAAACCTTTTCATGA
+AAGGTATTCTGAGCTGGGTAGGAGGAAAGACAGATATTGTTGAATACGTGCGAGCGGAAA
+GAATTGCTGGAGATACAAAATTTAATGGATGGAAACTTTGGAATTTAGCACTTGAGGGTA
+TTACAAGCTTTTCCACATTCCCTCTTCGCATCTGGACATACATAGGGTTAGTGGTAGCCA
+GTGTAGCATTTATTTATGGGGCGTGGATGATTTTAGATACTATCATATTTGGAAATGCTG
+TTAGGGGATATCCTTCACTACTTGTTTCAATACTGTTTTTAGGTGGAATTCAGATGATTG
+GAATAGGAGTATTAGGTGAATATATTGGACGCACATACATTGAAACCAAAAAACGCCCGA
+AATACATCATCAAGAGAGTCAAAAAATGAATAAAGCAATAAAAGTATCATTGTATATATC
+TTTTGTTTTGATTATTTGCGCCTTATCTAAAAACATAATGATGTTAAATACATCTGATTT
+CGGAAGAGCCATTAAGCCATTAATTGAAGACATACCAGCATTTACATATGACTTACCTTT
+ATTGTATAAATTGAAAGGTCATATTGATTCAATTGATAGCTATGAGTATATAAGTTCATA
+TAGTTATATTTTGTATACATACGTCCTGTTTATTAGCATTTTTACTGAATATCTTGATGC
+TAGGGTGTTATCGTTATTTCTAAAAGTAATATATATTTATTCATTATATGCGATATTTAC
+TTCATATATAAAAACAGAAAGGTATGTAACTTTATTTACATTCTTTATTTTAGCTTTTCT
+TATGTGTTCTTCATCAACACTGTCAATGTTTGCATCATTCTATCAAGAGCAAATAGTTAT
+AATTTTCCTTCCATTTTTGGTGTATTCATTAACATGCAAAAACAATAAATCTATGCTTTT
+GCTATTTTTTTCGTTGCTAATAATATCTACTGCTAAAAATCAATTTATATTAACCCCACT
+AATAGTGTATTCATATTATATTTTTTTTGATAGACACAAACTAATTATTAAATCTGTAAT
+ATGCGTGGTGTGCTTGCTTGCGTCAATATTTGCAATATCTTATTCAAAAGGTGTTGTTGA
+ATTAAATAAGTACCATGCAACATACTTCGGTAGTTATCTTTATATGAAAAACAACGGGTA
+TAAAATGCCATCGTATGTTGATGATAAGTGTGTTGGGTTAGATGCCTGGGGTAATAAATT
+CGACATATCATTTGGCGCAACCCCAACAGAAGTTGGAACGGAATGTTTCGAATCTCATAA
+AGATGAAACGTTTTCGAATGCACTCTTTTTATTGGTTAGCAAACCAAGCACCATCTTCAA
+ACTTCCATTTGATGATGGTGTGATGTCTCAGTATAAAGAAAATTATTTCCATGTATATAA
+AAAACTACACGTAATATATGGAGAATCAAACATACTAACGACTATTACTAACATAAAAGA
+CAATATATTTAAAAACATTAGATTTATATCATTGTTATTATTTTTTATTGCTTCTATTTT
+TATTAGAAATAATAAAATAAAGGCATCTTTATTTGTAGTATCTCTTTTTGGAATATCTCA
+ATTTTATGTGTCATTTTTCGGGGAAGGATATAGAGATTTAAGCAAGCATTTATTTGGAAT
+GTATTTTTCGTTCGACCTTTGCTTATACATAACAGTCGTTTTTTTAATTTATAAAATAAT
+TCAAAGAAATCAAGACAATAGCGATGTAAAGCACTAAGTTTAAATTGCGCGCCAATCATG
+GCGCGCACAAGCTATAATACCAACCTAATTTCTCCTCCTCTTAGAGTGACTATATCTCCT
+GATAGAATTGCGGTATTGACTATCAAATGCCCTGATTCGTTGTTTATTGTAATATCTCCT
+CTATCTGCAGACGATAACTTAAATGCATCATTGCCCACAACAAACCCCCTCCAGAACCAA
+GTGCTGATATTATCATCAACAGTGATAGATACATATACTAACTGATTATCGTTATAAGTG
+ATTCCTGTCTTATACTTAACATAAGGACTTCCACTTTGATTCTCGATAGACACATAACAT
+CCAGGGGTTATGTTTGTATGCGTCCCGCGACTATCGCCCCATTAACGCCATACGATAAAT
+GGGATGGTGAGAAATGGGTGACGGATACCGAGGCACAGCATAGCGTCGCAGTAGATGCAG
+CAGAAGCACAGCGCCAGTCGCTGATTGATACTGCAATGGCTTCCATTAGTCTGATTCAAC
+TGAAATTACAGGCTGGGCGGAAGCTGATGCAGGCAGAGACCTCCCGACTTAACACTGTGC
+TGGATTACATTGACGCGGTGACGGCAACAGATACCAGCACCGCGCCGGATGTCATCTGGC
+CTGAACTGCCGGAGGAGTAGGCCATTCAATATCTGGCGCACTGGAAGTATCGACCAGCTC
+CAGTGCGTCCAGATAATCCAGCCACAAATTATATTGCGCCAGTTCCTCACCTTTCAGACG
+ACCAATAGCCGCTTTACCAGCCCATTGTTTACTGTTCATATAATCGTTGGCCTGATTAAT
+CAATTGCTGCTTTTTCAGTTCGGCTGCAGCAATCTGTTCCTCATGTGTTGGTGGTGGAAT
+TTCAGACCATGCAGGAAAACCATTTTCTCCAGCGATACGGATTTTTCCTTTCGGCGGTAA
+TCCGGAAAACTCAATATACACTTGCTCATCAACTTCAACAGCATCATCTGGCCATGAGCC
+AGCTTGCGTGTAATCCTCTTTCATCTCCAAGGGATAGAAAGAGTTTGTAGTCGCGGAATA
+TATGTAATTCATTTTTCACTCCATAAAGTTAAAAGAAATTAACACCCTAATGCGAAAAAT
+GAAGCACCGATACCGGGTACGCCTGCTCTGGAAATAAATTTCACCGGGTCCTGGTTATAA
+CCGGCACAAGCTATATAGCCAACATTTGCACTGCCGGGAGTGTAATCCTGAGTCGCAAAT
+ACCCGCAGACATCTATTCGGAAATGCAATCGGAAAATAGGTTACTGTGTCCTGAGACGTC
+AGCGGAACATCAATTGGCCCCCATTGAATAATTAAACCGGATGGCAATTTTTGATATCCA
+GGAACTGAAGCAGAAAGCATAAAACTACCCATATCAGGTATCTGATTCGCCCCTGTCCCT
+ACATTTCTTTTAGCCGCTTCTCCCAAACCAAGGTTTTCGAGAGCCTTTTGCACCGTGCCG
+TCCAATTTGATATCGCCAAACGGATTCTTGCGGCTTAACAGCAGCGCACGAAGCGCGGTA
+AGCAGCTGGTCATGCCGCCCCTTCTCCAGGCTGGCACCGGAGGCCTCCACAACGCTGCAA
+AGCTCCTCCTGCAACATGTCAAAGTAGTCATCATCCAGATCGGTGGCAGGCGTGCCGGTC
+TGGGGGTTACCACGGGTACGGGGGATTACCAAAGGCAGCACCTTTAAGCTCCGCAAGACG
+TTCTGACCAGTCATGCGCCAGCGCGTTGTCTTCCGCAGTGTAATACGCGGCACATTTGGC
+GTTATCACCATCAGTAAACAGATCCAGAACAAACGGGCCAAACAGGGTGTTAATTCCCCA
+GAAAATGTTGTCCGGCGTGCGCCACTGATCGCCCACTTCCTTCAGTTCATGGGCTGGTTT
+GTTCCGCAGCTCCACCAGCGCCTGGCAATATTTATTACTCATTAAGCCCCCACGTAATTC
+CCTGAGAGATACCACTCTTCACCTGATGCAGCCCGCTTACTGCTTTTCCGTAAACACCGT
+TCACGACGCGCCAGAAAATTGTTTCGTTCTGGCTGGGAGTGGCTTTCACGGAATGCCGCC
+ATCCACACCGTTGCAGCACGACGGTATAAGCCCCTGGACTCCAGTTCTTCCGCCTGGCGG
+GTCAGGCACAAAATCACCCGCGGGTCGTTAGTGCCGACATAGAAATTGCGCACAGGTCTG
+GTTTCACGAACTGGTTGTGGTTCCGGATCCTGCGCTCTCTCAGTCAGGCGCGGGAAATGT
+CTGTGTGTATCTCCTTCACAACGGTGAGCCACACGCCCACTCTGACGTAACTTGCTTGCT
+GACTGCAGAACGCGCTGCCGTGAGTAACCTGCAAAAGCATCCGCAATGTCTCCGGAAGTA
+CAGCCCGGATGGGCTTCAATGAATTTCTGAACGTCATTCAAAAGACTCATGCTCACCCCC
+TGAATCCTGCCGGGATCTGGCTGTAGTCCACATTGTCGTAACTGGCTTTGAAGTACGGGT
+CTTCGCGTTTTTCTGTGTACGTGCTGACGGACGGCGATAAGCGCAGGGAAAGCTCATCCC
+ATTTTTCCCGCAGCTTCGACGGGCTGAGCACGTTACGGCACCAGAACGGATCGCGGCTGA
+CGCGGCTGTACATCTCGCAGATTTGTTTGTGAGTACGACCATCCTGCACACACATCAGGC
+GAATTTCGTTTGCCCAGGCTGTCCAGTTCGGTTCTTTGGGACGAACCACCTCGCCGTCAC
+ATTCGGCGGCCTGCTCGTACAGGGCGATGATTTTTTTCCAGAGCCACTGTGCGCAGGTCA
+AATCATCCTGCGTTCCCCACTGGCGCTTTTTAGGGCTGAATACAACCGCATCAGGATGGC
+GAGTTAAAAAATCCTGTTCATCCGTCTGCGTGTCCGGTTGCGAAGCGTCCGGACGAGAAG
+GTTTTTTATCTGACGGATCATGTTTTGATTTTACTGACGGATCCCCGCCAGATTCTGACG
+GGTGAAAACCCGATTTTTTGCCAGATTTCGACGCATCAAATTTTGACGGGTCAGATTTTG
+ATGCGTCAGATTTTGACGGGTCAGAGTCTGACAGTTGAGAAAATGCCGCTGCCTGAAGCT
+TCGCAACGTTAAGCTGATAAACATTCGACGCATTGCGGTTATGATGAGGAGCAGCAAAAT
+GGCTAGCGAACGCAGTACTGATGTGCAGGCATTTATCGGGGAGCTGGACGGCGGCGTATT
+TGAAACCAAAATCGGCGCAGTTCTCAGTGAAGTCGCTTCCGGTGTGATGAACACGAAAAC
+CAAAGGTAAGGTCTCACTCAACCTGGAAATCGAACCATTTGATGAGAACCGTCTGAAAAT
+CAAACACAAACTCTCATATGTTCGCCCGACTAACCGTGGGAAAATTTCCGAAGAAGACAC
+CACCGAAACGCCGATGTATGTCAATCGCGGTGGTCGCCTGACTATTCTGCAGGAAGACCA
+GGGACAATTACTGACTCTTGCCGGTGAGCCTGACGGAAAACTCCGCGCAGCAGGTCATTA
+ATATCATTCTTAATTAACTAATTATTTATCTCATCACTGAATATCTTAATATAGTGAGGA
+CTTATTATGTCTCAGAACTTAGACGCAACCGCAATTAATCAAATCCATGCCCTTATTTCT
+GCTCAGGGTGTTAATGAAATTATCAGTAAGATTGGTGCCGATGCTGTGGCATTGCCTGAG
+AATTTCCGCATTCATGATCTGGAAAAATTTAATTTAAATCGCTTCCGTTTCCGTGGTGCG
+CTTTCCACTGCCAGCATCGATGACTTTACCCGTTATTCTAAAGATCTTGCAGATGAAGGC
+ACCCGCTGCTTTATCGATGCTGATAATATGCGTGCCGTCAGTGTGCTTAACCTGGGTACT
+ATTGATGAACCAGGTCACGCAGATAACACCGCCACTCTCAAACTGAAAAAGACAGCACCG
+TTCTCTGCCCTGTTGTCTGTTAACGGCGAGCGTAACTCCCAGAAATCACTGGCAGAATGG
+ATTGAAGACTGGGCCGACTACCTTGTGGGCTTTGATGCTAATGGTGACGCCATTCAGGCA
+ACAAAAGCGGCTGCGGCAATCCGTAAAATCACGATTGAAGCAAACCAGACCGCTGATTTT
+GAAGATAATGACTTCAGCGGCAAACGCTCCCTGATGGAATCTGTCGAAGCGAAGACCAAA
+GACATTATGCCAGTGGCATTTGAATTTAAATGCGTTCCGTTTGAAGGTCTGAAAGAACGT
+CCGTTTAAATTACGCCTCAGCATTATCACTGGCGATCGTCCTGTACTGGTTCTGCGCATT
+ATTCAGCTGGAAGCGGTGCAGGAAGATATGGCTAACGAATTTCGTGATCTGCTTGTTGAG
+AAATTCAAAGACAGCAAAGTAGAAACCTTTATTGGTACTTTCACCGCCTGATTTCATTAC
+TGCAAATGCCCCTGCGGGGGCATTTATGGAAACGTAATTAACTCAATAATCACCGGATGG
+TGAGGGCTTCCTTTTACCCAAACTCAGCGCGGTGCAGCGCATATACGTGGAGAACAAAAT
+GTCATTTATTAAAACTTTTTCCGGGAAGCATTTTTATTATGACAAGATAAATAAAGACGA
+CATCGTGATTAACGATATCGCGGTTTCCCTTTCAAATATCTGCCGCTTTGCCGGTCATCT
+TTCTCACTTCTACAGTGTCGCCCAACATGCGGTGCTTTGCAGCCAGCTGGTGCCGCAGGA
+ATTTGCTTTTGAAGCATTAATGCATGATGCAACAGAAGCGTATTGCCAGGACATCCCCGC
+ACCACTGAAACGCCTTCTTCCTGACTATAAACGGATGGAAGAAAAAATAGATGCAGTAAT
+CCGTGAGAAATACGGGTTACCTCCTGTTATGAGCACGCCAGTGAAATATGCCGATCTCAT
+TATGCTGGCAACCGAACGCCGTGATCTCGGGCTTGATGATGGCTCTTTCTGGCCTGTACT
+GGAAGGCATCCCGGCAACAGAGATGTTCAACGTGATTCCACTGGCACCGGGTCATGCCTA
+CGGGATGTTTATGGAACGTTTTAACGATTTATCGGAGTTACGCAAATGCGCATGAATGTT
+TTCGAAATGGAAGGGTTTCTTCGCGGGAAATGTGTACCGCGAGATCTGAAAGTGAACGAA
+ACAAATGCTGAGTACCTGGTACGTAAATTCGACGCGCTTGAAGCTAAATGTGCGGCACTG
+GAAAACAAAATAATACCAGTGTCAGCTGAACTGCCACCAGCAAATGAAAGTGTTCTGTTA
+TTTGATGCTAACGGAGAAGGCTGGCTGATTGGCTGGCGTTCTCTCTGGTACACCTGGGGA
+CAAAAAGAAACCGGAGAATGGCAGTGGACATTTCAGGTTGGGGACCTTGAAAACGTCAAT
+ATCACTCACTGGGCAGTAATGCCAAAAGCACCGGAGGCTGGAGCATAATGACCACATTTA
+CCAATAAAGAACTGATTAAAGAAATCAAAGAACGAATCAGCAGCCTAGAGGTTCGAGACG
+ATATTGAGCGCCGTGCTTATGAAATCGCACTCGTATCTCTGGAAGTAGAGCCAGATGAAC
+GCGAAGCCTATGAATTATTCATGGAAAAGCGTTTCGGTGACTTAGTAGATCGTCGGAGAG
+CAAAAAACGGCGATAACGAATACATGGCATGGGATATGACTCTCGGTTGGATCATCTGGC
+AGCAACGAGCTGGTATCCATTTTTCAACAATGTCACAACAAGAGGTGAAATAATAGAGCC
+ATACAGCCTCACACTCGATGAGGCCTGTCAGTTTCTTAAAATATCCTGATCTACCATCGC
+CGTCATAGAGCGTATTTTTATTACCTGATTTGCAGGTTCGATTCCCTATTCGGAGATAGC
+ACTCATGCAACACGAACTACAGCCTGATTCACTGGTTGATTTGAAATTCATCATGGCTGA
+TACTGGCTTTGGTAAAACCTTCATCTATGACCGGATTAAGTCAGGCGACCTGCCAAAAGC
+CAAAGTTATCCACGGGCGAGCAAGATGGTTATATCGTGACCATTGTGAATTCAAAAATAA
+GCTCTTAAGCCGCGCCAATGGGTAA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_002737.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_002737.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1977 @@
+>NC_002737.2|provirus_529627_569283
+TTAAAACTTAAAAATAATATCGATGTTATCCATAGTAACCTCGACTCTATCTATCAATTG
+CTTAACTATCCTAGATTGAACATCATACGAAGATTTTCTAATGTCAAGGTTATCCATCAG
+CATTCCAAGAGAGTCTTCGTTTTTCTTGTCTAAATAATTCAATTTAATTGCTTTGTTATA
+ATCATCTTTTAAATGATTGAGTTCTTCGATGTCTTTTTTTAGTTTTGGTAGGTCAATCAA
+ATCATTAATATATAAATCGTTTAGACGATTGATTTTTTTATCGATTATCTCTATTTCTTT
+TTTTAAAGGTGTAATATCAATTATATTGTCATCTTTTTTTATTTTTTTAAGATATTCTTT
+ATCGTGTTGAAGTTTATAAAGAACATCAATAACATATTTTTCGATGTGTTTTTTTTCATA
+TCGACCAGTGTTACAAATCTTTTGGTTATTATAATTATTAACACTTCGTCTAGCCAAACT
+TTCTGTTTTATTAACACAAACGTAAGTTTGCCTTCTCGTACCATCGTTCTTAGCTCTTCC
+TGTGCATACTTTTAAAGGGGCACCACAATAACCGCATTTTGCTATGTGAGAAAGCATATA
+TTTCCCTTGAAAAGGTCTAGTATTTGTTTTCGTATCTGTCCTATGTGCTAAAGCTATTTG
+CGCTTTATTATATGTTTTTTCGTCGATAATGGCTTGATGATCACCTGAGAAAGTTTGTTC
+CCTATACTTCACTAATCCTTTATATGTTTCGTTTTCTAATATTCTTTTTACTTTTACATG
+TGTCCACGTATTCCCGACGAAATTGTCTCTCGCGTAATTTGTAATTGACATGATTGAGCA
+GCCAGAGATTATCATGTCAAACATCTGCCTGACATTAGCAGCCTCTAACTCGTTGACCGA
+CAATGTTTTTTCGTCTTTGTTGTATCTATATCCATAAGGTGGTGTTTTCCAAGCCGTTGT
+TTTTCCAGATTTTGCTCTATTCATAACACCAAACTGCATTCGCTCTTTAATCTGTTCTCT
+TTCAAACTCTGCAATAGCTGACAAGAGAGTGAGAAAGAGATTTCCCATTGCTGAAGAAGT
+GTCGATATTTTCTTTTAAGCTGACAAAATGGATATTGTTAGCAGTAAATACATCTTTGAC
+TAAGTAAAGTGTGTCTTTTACATTTCTTGATAGCCTGTCTAGTTTATAGACTAAAATAGT
+ATCAAATTTATTGTTTTTACCGTCTTCAATCAATTCTGTTATTGCCGGTCGTTCAAGTTT
+ACCGCCTGAAAAACCTGCATCAGAGTAGTTTTTGTAAATTTTCCATTCCATTGCCTCACA
+ATACTTTGTTAAAGCTTCAATCTGTCCTTGAATGGAATATCCTTCTTCGGCTTGATTTAT
+TGTTGATACTCTAGAGTAAATAGCTACTTTTCTCATTGTTTTTTACCTCATTTTTTGTTA
+AAATGAGTACAGTAAAGAGACCTACTTAAAGCAGGTTTTTACTATACTAGATTCGCCTCA
+CGCTCGCACCGACCAAAGTTGAGCGGGGGGCTTTTTTTATTTTGTCTCAAATATACAGCT
+GCACTCGTTACAGTGCCATTGCTTCTTCCCTTTTTCTCCTAAAAATCCCATAACTGTTCC
+ACCTATTAAAAGAGTTCCTGCGACGGCCTTTTTAACAGAAAATGTCTTTTTACCTTGCTG
+CATAAATCCAACATTAGTACTTTTACATTTTGGACATCTTACCGCCTCTTTTTCTTTTTT
+TATCACTTGTTTTATTTCGCTATTTAATTGGGTCTGTCGTACTGAGTTTTTCATTACTTG
+CTTTAAGCCACGGTTTTCAATCTCATTCATCTTTTCTGCATTGTTTTTTGCTTCAAAATA
+TTCTCCCAGATTTTTTGATTTTAAAAGTTGTTTTAACGTCATATCATTGTCCTCTCTAAA
+AACATTAGTTAAAATTCAATCGGTGTAAAACTACCAACAACGTCATATATTTTAATGTAT
+GTATCTTCTGCTGGTGGATAGCCAATAAAAATATCGCTATATTTTTTATTAAGTGATACT
+AATCGAAGTCCATCATGTTCAGTGTAAACTTTTTTAAAATAAGTGTTCCCGTTATGTACA
+ACAATACATAATTGTCCGCTGTATGTTGACATTCCTTTATCAACGATATAAAGCATATCT
+CCTTGCTCGTACTTTGGTAACATGCTATCGCCTCTTATGCCAATAGCATAATCATAATGT
+GGAGGTTCTTCGTCTGTATAAACTGTATAAGTATCATAGTCATCTGCTTCAAAACCTCTA
+CCAAATCCGCTTGCTGCTGCAGCAAAAGTCGTTCCTTTAACTTCAAAAATATCTTCGATA
+TCAGTTTTTTTATCACTGAAATTGATGATTTTTGTTTGTTCTTCCAATTGCTCTTTTGCT
+GTATCTAAAACAATTACTCTTCGTTGTTCTTCTAATTCGCGGTATATTCCAAGCAGTTCC
+GAACCATCTACTTCGCTATTTAAATCAATACCAAGTAAAAACTCTGTTGATATATTAAGT
+GCTTTAGCAAAATCATCTGCCCTGTTTAAAGGAAATTCTCTTGTTTTATTAAAATATCTA
+GACATCGTTGATTTTGCAATACCAACATTTCTAGCCAACTCACTCATTGACATCTTTCTT
+TCTTCTACTTTGCTCTGTATCAAAGAAATAATTTCGCTGTTTGTTCTCATGTTTTGTTAT
+CCTTAATGTTATTTAGTAATATCATTATACCATCGTTCCCAAAAAAATACAATAAAACGC
+TAAAAAACAAATAAACGTATTTTTTTTAGAAAAAATCGTTGACAATTTGGAACGTAGGTT
+TTATAATAAAGGTGTTCCAAAACGGGAACAAAAATAAAAAAAGGAGTATGTATATGACAA
+TCAATTTGAAGCGACTAAAAGCCGAGCGAATTGCTAGCGGTATGACACAATGTGAAGTTG
+CACAATCTATGGGGTGGAAAACACGAACACCATATGCAAAAAGAGAGAACGGTATTGTTT
+CAATTGGAGCTGATGAGCTTGCAAAAATTACTTTGATTTTTGGATTACCAATCGAAAAAA
+TAGCAATTTTTTTTGATAAAGACGTTCCCGTAATGGAACGATGATGCAAATAAAAAAGCC
+CTGTAAAATAGCAGTTTACGGGACAGACAGATTCTTATGAGGCAATTTTACCATGAAAAA
+CAAAAAAGAGCAATGGACCCCAAAAGTTCACTGTTTTCGAAAAGATGGTTCACAATGTGA
+GCCAGAAAATATAACAGTGCCAATTTCTTTTGCAGGTTACTATCAAATTTTATTAGAACT
+AGGAGTATAACATGAAACTATTAGATTTTATTTTTACAAAACCAAAAAAACAGGAACCGA
+TTAAACACGATACTAAGCGATTGTCATCTGAAAAGCAGTATGATGCATTCCACGCTTATA
+TGAGAAAAAAAGTATGAAACAACAACTAATTAACGACAACGAATTTTTGCGAGACGAAAA
+TCGCAGGTTAAATAATGAATTGGCGGAACATTACTTTGTAGTTACAGCTAAAGCAAATTT
+ATTAGATGTCATTATTGCTAGTGATTTTATCTTGAAAAGTACGCTAGATAAATGCATTGC
+TGAATTGGATGAAATTGATCAAATAGCCCTGTTAAAAGCATGGAACAAGGGAGAATTATA
+ATGTCAATAACAATAAACAAACTTGAAATCGAAAACGTTAAGCGTATTAAAGCGGTAAAG
+ATTGAACCATCTGCAACAGGCTTGACCATTATCGGTGGTAATAATAACCAAGGCAAAACA
+AGCGTATTAGATGCTATTGCTTGGGCACTAGGCGGTAATAAATACAAGCCTAGTCAAGCT
+ATGCGCGAAGGATCGCAAGTGCCACCTACGCTTAAAATTACCATGTCAAATGGACTTATT
+GTTGAACGGAAAGGCAAAAATGCCAGTCTTAAAGTAATTGATCCAAACGGCCAAAAAGGT
+GGTCAGCAGTTGCTAGATAGCTTTGTAGAAGAATTGGCTATTAACTTGCCGAAATTTATG
+GATAGTACACCAAAAGAGAAAGCAGATGTCTTGCTTGAAATTATTGGTGTCGGTGATCAG
+CTAGCAGAGTTAGAGCTAAAAGAAAAAGAAATATACAATCAACGTCACGCTATCGGTGTT
+ATAGCAGACCAAAAAGAAAAGTTTGCTAAGGAGATGACATATTATCCTGACGCACCTAAA
+CAACTGGTAAGTATTTCTGAGCTTATCCAACAACACCAAGCTATCTTAGCCAAAAACGGA
+GAGAATGCTCAAAAGCGTCAAAATGTAGAACGTATTCGCTATGATTATAATCAATCTATC
+TTGGAAGTTGACCGTTTACGCAAGTTATTAGCAGATGCAGAAGCTAAGACGAATAAGTTA
+AGCGAGGATTTAAAAATAGCAAATACTGACGCTATGGATTTACATGATGAATCAACAGCT
+GAAATCGAGGCGAATATTGCCGATATTGATGAAGTCAACCGCAAAGTGCGCGCTAACTTT
+GATAAAGATAAAGCTGAAGAAGATGCTAAACAGCAGCGTGAACAATATAACATATTGACT
+AATGATATTGAGTCAATTCGTCAACAAAAAAGAGACTTATTGATTAATGCAGATTTGCCG
+CTTGAAGGCTTATCAGTAGATGATGGAAAGTTACTTTACCTTGGTCAAGAGTGGGATAAC
+ATGTCAGGCAGCCAACAACTAATAGTAGCAACTGCTATTGTACGTAAACTAAAACCAGAT
+TGTGGCTTTGTTTTGATTGATAAACTCGAACAGATGGACAACATCACACTTGAACAATTT
+GGTAAACGGCTAGAGCAGGAGGGTTTGCAAGCTATTGCAACCCGTGTATCAATTGGTGAA
+GAGTGTGCCATCATTATAGAAGATGGATACTCAGTGGAAAACAAAGCTCATAACTTTAAA
+ACAGCAGAGGGTGGTAATTTTGCTGAAACAGTAGCACCGACTTGGAAAGGTGAGTTTTAG
+AAAGAGAGGTAAATATGCAAATTACAAGAGGTAAACGAGCACGTGCTCAACGTGTCATCA
+TTTATGGACCAGAAGGAATCGGTAAATCTAGTTTTGCTGCTAATTTTCCTGAACCATTGT
+TCATTGATACGGAGGGATCAACAGACAATATGGATGTGGCCCGTATGGATAAACCAACAA
+GCTACACTATGCTAAAAAATCAAATTGCATGGATTAAAGCGAATCCAACATGTTGCAAGA
+CACTGGTCATTGACACAATCGATTGGGCAGAAAGCTTAATAGTAGATGATGTCTGTGCTC
+AACATGGCAAGAAAGGTATCGAGGACTTTGGTTGGGGCAATGGTTATACCTACACAAAAG
+AGGAAGTAGGTCGATTCTTGAATATGCTCCAAGAACTGATTGAACTCGGTATCAATATTG
+TATTAACTGCCCATGCACAAATGAGAAAATTTGAACAACCTGACGAGATGGGAGCTTATG
+ACCGTTGGGAGTTGAAACTTGGTAAAAAGACAAGCTCACAGACTGCCCCCTTGGTCAAAG
+AATGGGCTGATATGGTCTTGTTTGCCAACTACAAAACAGTAGTTATGACTAGCGAATCAA
+AAAAGAAAAAGGCAACTGGTGGTCAACGTGTGCTATACACGCAACATCACCCAGCGTGGG
+ATGCAAAAAACCGTCATGGGTTACCAGACGAAATGCCTCTTGACTATGCAGTAATCGCAC
+ATCTATTCGCACAAGTACCAACTCAACCAGTGCCACAAACGCCACCAGTACAGGAAACTC
+CTGCATCACAAACCGCACATGAATCCGTACATGAGCAAGCTGAAAAAGCACCAGAACAAC
+CACCTATGCAACCGACATCTGCGCCGGTAGCCTACCCACCAAGTATGCCAAAAGCATTGA
+CTGACTTGATGTCGGCAGAGCAGGTCACTCCTGATGAGCTTGTGGCAGTAGCAAACATCC
+GAGGACACTTCCCGCCAATGACACCAATTGAAAACTTCCCGTCAGATTATTGGAATATGA
+TTGTGGCCAATTGGTTAGCTACGTTAGAAGTGATTAAAACGCAAGTGCGTACTGTCGAGC
+CACCCTTTACTGTGGAAGGCGCATAGGTTTTGGGAATTAGAAATTATAGCGAGGTATAAC
+AAACAATGAATAAAACAATCAAATTAGACTTGTCTGCCATCGGAGAAGGTGGCTTACAAG
+AAAAAGTAGACAAGGAATTGGAAAAAGTCTTTGACAATATCTTAGATCCTAATACAGAAA
+CAAAAGTAGCCCGTAAAGTAACTATTACGTTAACTATGAAACCAGACGATGCCCGTCAAA
+CTGTTTCAACAGCTATGGAAGTTAAGTCAACGCTAGCACCACAGACAGGCGTGGCTACAA
+CGGTCCTTGTTGGTCAAAAAGATGGTAAGGTTTATGCTAACGAGCTCAAAAGCGCGATGC
+CTGGTCAAACTTATTTTGACGATGAGGCAGTGCTAAGAACTGACATCGGTGAACCAATTG
+ATCACCTTGAAAAAGGTATTAATGAAGATGTTATTGATTTTAATAAGCAAAAGAAAGTAG
+GAAACTAACATGACAGAAAACATTAAAGAAGCTTTGGAATATGCAGTAAATACAGCTCAC
+GAAAAACCTAAGACTATCTTGGGTAGTGATGGTAAAGAGTATTATGATCGCAACAAATAT
+TCTTTGGTTGAACTTAAAACTAAGTATTATCCAAAAACATTGAATTTAAACACGCTTGAC
+AGTTTAATTGATTATCTTAAATCAGATATGAACAATATTAATTCCAAGCGTCTTATGGTC
+ATTGTAGAAGGCCCTCGTGAAGTTATTGTTTGCGAAGAAGATGATGACGACCTTAATCGA
+AATGTGTTAGTAACTGTGGAGGCAATTATTCCAAATGTTCAATTTGGCCACTATGATTCA
+CCTTCTGATTTTAATATTAGTCTGCAATCATTATTCGTTAACGCTGACGATCGTAACACA
+GTTATTGAATTCGCTAGTGCATTAAAAATCGAAAATGGCTCAGAAATTGTTGATGATGGC
+ATTGGTCAAACTGCCACAATTAAACAAGGTGTGGCAAGCCTTGCAAAAGCTAAGGCGCCA
+AACCCAGTTACATTACGTCCATACCGCACATTTTCTGAAGTAGAACAACCTTCAAGTGAG
+TTCATTTTCCGCATTAATCAACTTGCTAATATGGCTTTGTTTGAAGCAGATGGTGGAAAG
+TGGCGCTTAGATGCTATCAATAATATTGCTAACTACTTAAAAGAAGAACTTGCTGATCAA
+ACTAACATTACAATTTTAGCTTAATAGAAAATAGGAGAAATAAAAATGACTGAATACAAT
+AACAACTTTGACCGTGAATTGGGATGGGATGATGAAATTACACAAGACAGTGTAGGTTTT
+GTTCAATTAGTGCCTGGTGATTATCAATTCACAGTAACCAATATGGAGCGTGCTCGTCAC
+ACACCTAATCCGAAGAGTCCAGGAAAATTACCAGCGTGTAACAAGGCGGTCGTTACGATT
+CAAATAGAAACATCAGAAGGAATCGCGCAATTAACTCATAACTTATTCCTACATACTACA
+ACAGAAGGTATGCTATCAGCTTTCTTTGGAGCTATTGGTCAAAAGAAACATGGGGAACCA
+CTTAAAATGAACTGGAATACCGTCATCGGAGCTAAGGGGGTTGCTCGTATTAATAAACGT
+AAAGGCACCGGCGATTATGCTGATCGCGAATACGATAACATCAAATCTATGATTTACGCT
+GATGAAGTTGATTGGACAAAAGTATTAAATAAAGATGTCGCACAACCACAGCAAATGACA
+CATCAACAATCTGCTCAACCTACATATCAGGGACAACAGGCACAAGGCACTAATTTTGCA
+CAACAACCAGCAACGCAGTCATATCAACAAGGTCAAATGCAAACACCTCAACAACCTCAA
+GGCGGATGGGGAGGATTCTAATGCAGCTTAGACCTTACCAAGAAGAGGCAAGGTCAGCAG
+TGCAACACGAGTGGGAAGACGGCAAGAAGAGAACTCTTCTTGTCCTTCCAACTGGTTGCG
+GTAAAACTATTGTCTTTTCGAAAATTATCGAAGACCGTGTAAGGCTCGGAGAGAGAGTTT
+TGGTTCTGGCTCATAGGTCCGAACTTTTAGAACAGGCTAGTGATAAATTGATGACAGCAA
+CTGGATTAGGGACAGCATTAGAAAAAGCAGAGAATACTTCTTTAGGGTCATGGTTCAGGG
+TTGTAGTTGGATCAGTTCAAACGATGCAGAGAGAGAAGCGTTTGAGTAAGTTTCCTACAA
+ATCATTTTGACACAATTATTATTGATGAAGCCCATCATGCCATCTCTGATGGTTACCAAA
+GAGTTTTGCAACACTTTGATAGTAGCAATGTTTTGGGAGTGACAGCGACACCAGATCGCG
+GTGACAAACAAAATCTAGGTAAGTATTTCGATAGTTTAGCTTATGAATATTCCTTAGTAG
+ATGCCATCAAGTCTGGTTACTTATCTAAAATTACCGCAGTTACTATCCCGTTGACTTTGG
+ACTTATCTACAGTTAGTCAGCAAGCTGGAGATTTTAAAGCAAGTGAGATTGGGACGGCGC
+TTGACCCGTACCTAGAACAAATTGCCGATGAAATGGTGAAGCAATGCGCAAACCGTAAAA
+CAGTTGTATTTCTTCCGCTTGTTAAAACTTCCCAAAAATTTCGTGATATTCTAAACCAAA
+AAGGATTTAAAGCAGCAGAGGTCAATGGGGAATCGAAAGACCGCGCTGAAGTCCTAGAAG
+ACTTTGATAATGATAAATATAATGTACTATGCAATTCAATGCTTTTAACGGAGGGGTGGG
+ATTGCCCGACAGTCGATTGCGTAGTTGTACTGAGACCCACAAAAGTAAGAGCTCTTTATA
+GTCAAATGGTTGGTCGTGGCACACGATTAGCGCCGGGGAAAGAAAATCTACTATTATTAG
+ATTTTTTATGGCATACCGAACGCCATGAACTTTGTCGTCCTGCTCATCTAATTGCAAAGA
+CACCAGAAGTTGCTCAAAAAATGGTCGATAACATGACAGAGGAAACTGAAGTAACCTTTG
+AATTGTTAGAAGCTGAAGAAGTAGCTAGCAAAGATGTTGTCGCAGAACGAGAAGAAGCAC
+TCGCTAAGCAGTTAGCAGAAATGCGTAAGCGTAAACGTGCATTAGTTGATCCGTTGCAAT
+TTGAAATGTCTATCAATGCTGAAGACTTAGTGGACTATGTACCAGAATTCGGCTGGGAAA
+TGGCTCCTGTTTCTGATAAACAAAAGAACGCTTTAGAAAAATTTGGTATTTTTACCGACG
+ACATTGGAAATGCAGGTAAAGCTACTAAATTATTGGAGCGATTGGCCAAGAGGAGAGAAA
+CTGGCCTAACAACACCTAAACAAATCAGAATGCTAGAACGATACGGATTTAAAAACGTTG
+GAATGTGGAAATTTGAAGTAGCATCAAACATGATTAACCGCATTGCTGCTAGCGGATGGC
+GCCTACCAAAAGGCATCAATGCTCGAGAATACCAACCTGAATAGGAGACAAAAATGGGAG
+AATATTGTCACTTAAAAGAATTAGATGGACTTAGATTTGGATCATTGACAGTCATTAATA
+GAAACCGTAACAATTCTAAGGGTGGCAATGCACGATGGAATTGTCTTTGCGACTGCGGAA
+ATAAAACAGTTGTTATTGGAAGTAAATTAAGAAGTGGTTATACAAAATCATGTGGATGTG
+CACGTAAAAATGACAACGCTAAAGGTTATTCATCTACAAGACTTTACAGAATTTGGAAAG
+GCATGATGAATAGATGCTATAACCACAAAAACGATAATTACAAATATTATGGTGGAAAAG
+GTATTTCAATCTGTGATGAATGGCTAACTTTTATTAATTTTAGAACATGGTCGCTCTCTA
+ATGGATATAAAGAATCATTAACCATTGATAGAATAAATCCAAAAGGTAACTATACTCCAC
+TAAATTGCAGATGGGTAAGTATGAAAATGCAGCAAAACAATAAAACGAATAATAGGTATT
+TATCATATTTAGGTCAAGAATATACTATTGCTGAATTTTCAGAGAAGTTAAATGTTACCT
+ATTGGACTGTAATAAATCAATTGAAATTAGGTTGGAGTGTAGAAAGAATAGTAGAAGAAG
+CGAGAATGAAAAATGACAGATGATAAATTTGATTTATTACCTTTACTTGATTATATTGAT
+CCATCAAAACTATCATATCAAGACTGGGTGAATGTTGGTTTTGCCCTAAAACACGAAGGA
+TATACTGCTATGGATTGGGACATTTGGTCACAGTCTGACAGTAGATACAAAAAGGGTGAA
+TGTTTCGCTAAATGGGATAGTTTCCAAGGTAATGGACTTGGGACTGTCACTGGCGCAACT
+ATCACACAGTTAGCGAAAGAAAACGGGTGGACATCTGACTACCGTACGAGTGATGAAGCC
+CACGAGCTTGATTGGGATAGCACTATTGATCGTGACTATAAAATTATTGACAAGAACTGG
+ATCGAAGCAAAAGAAATTAGAGAACCTACTAACTGGTCACCCGTTCACGATTTGATTACT
+TACATCAACACTCTTTTTGAATCAACTGACAAAGTCGGATATGTAACAGAAACATACCCG
+ATTGAAATAGATAAGGGCATTATCTATAAACCAACAAAAGGAGCCTATGACAGGACAGCT
+GGTCAGCTTATCCAAGAATTACAAAAAAATCCTAATGACATTGGTGCTGTCCTCGGTGAC
+TATAAAGAAGAAGCTGGTGCATGGATACGATTTAACCCTTTAGATGGCAATGGTGTCAAA
+AACGACAATGTAACAGACTTTAGGTATGCCTTGGTTGAATCCGATAGTATGGAACTTGGT
+AAGCAGTATGCTTTATTTAAAGAACTAGAATTGCCAATAGCGACATTGGTCCATAGCGGT
+AAAAAATCATTACACGCTATTGTCAAAGTAGATGCTAAAGATTATCAGGAGTACCGCAAA
+CGGGTTGATTACATCTATCAAATCTGTAAGAAAAACGGCCTTGATATTGACACACAGAAT
+CGTAATCCAAGTCGTCTATCACGAATGCCAGGTATTATGCGAAATGGTCACAAGCAATTT
+TTGATTGATACAAATATTGGTAAAACCAATTATGAAGAATGGTATCAATGGATTGAAGAT
+TTAAATGATGATTTACCAGAGCCAGAAACGCTAGCTGATGAATGGGATAATTTGCCAGAG
+CTGGCTCCTGAATTAATTAAAGGAGTGTTACGCCAAGGACATAAAATGCTAATTGCAGGA
+CCATCAAAAGCCGGTAAGTCATTTGCATTGATTGAGTTATCTATTGCTTTGGCTGAGGGA
+CAGAAATGGTTAGGTTGGCAATGTGAACAAGGGAAAGTCCTCTATGTCAATTTGGAGCTA
+GACAGACCATCAGCTTTGCACCGCTTTAAAGATGTTTATGATGCGATGGGATTACCTCCC
+GCTAATGTGGCAAACATTGACATTTGGAACCTCCGTGGAAAAACAGTACCAATGGATAAA
+TTAGCACCTAAACTTATCAGACGCTCACTGAAGAAAAATTACCAAGCTGTTATTATCGAC
+CCTATTTATAAAGTTCTCACTGGCGATGAAAACAGTGCTGATCAGATGGCCCATTTTACA
+AATCAATTTGATAAGGTGGCCACTGAACTTGGATGTAGCGTAATTTATTGCCACCACCAT
+TCTAAAGGAAGTCAAGGTGGCAAAAAATCCATGGACAGGGCAAGTGGTTCTGGAGTATTT
+GCTCGTGACCCTGATGCATTGATTGACTTAGTGGAGCTTGAGTTGACTGAAGACCTTATC
+AAGGCACGCTCAGAAAAAGCAGCTGCTAAGATTTACCAACAAGCGTTGCAGGAAAAAGCT
+CTAGGATACTATCAACAGGAAGTAACGCTAGACGACCTAGAAAGTCGTTATCAGATGCAA
+CAACATTTTGACAAAGCTATCAAGGATATCATGGTTAAACAGCCATATCTTGAGGCCGTC
+AAAAAAGCCCAGCATGAGGTAGAAATTGCCACAGCGTGGCGAGTTGATGGAACGCTACGT
+GAGTTTGCGAAGTTTCAGCCAGTTAATATGTGGTTTAGTTATCCCAAGCACGAGGTGGAT
+ACAACTGGCGTGTTGGCTGATATTCAGTTGGAAGATAGTAAACCTCTTTGGAAAAAAGCT
+AAAGAAGCTAGGAAAAGTAAAGAAGAGAATCTCAAGGAACGGAACCAAAAACTTGAGACA
+GCTTATAGCGCCTTATTTGATGGTTCAACACCGGTTACAGTGCAAGAAATTCGTGAATAC
+TTGGATTTAAAATCCAATAAAAGCGTTGAAAATTATATCAAGGAACACGATGGTTACGAT
+GTCAAAAAAGGTGTTGTGTTCCAAATTTCTGATAACAAAGAAACGGAAAAGAAAGAAAAT
+AACTAGAAGAATTCTAAAGAAAAATTACGTTATTTTCTTTTCTCAAATCAGAAAAATACT
+AGTTAATTTCTTTTCTGTTTAATTTTAGAAAAACAAGAAAAATACTAGTTAATTTCTAAG
+AAAATACAGCCTATAACTCTTTCAGAGTTATTATAAAATGTTTTTCCTTCGTCAAAAGTC
+AAAGGGAAAAGGAAGAGGGGCGACTGAGCTACGCCCCCTCTGTCCTTTGTCCCATATTTG
+ACAAAGGCGCATATAAAAAACACAAATTGGAGATGAGGTAAAAATGGAAATTTACAAACA
+AAGAATGATTGAAGAATATAAACAGTTAAAAAAACGCGCAGAAAAACTATCTATTGTGCT
+AAACAGATACTACCTTGATGAGTTAGATTTTGAATTATCTTGCCCAATTGAACTTTTACA
+AACGCAATGGCATATTATGGGAGCGTATTTGAAAATTCTAGAACAAAGATTTTTGGTTGA
+AGGGATTTATTTTAATGATTGAATTTTTTTTGCCTATGGATAAAATCCCGACGACAACTC
+ATCAGCAAAAGAAAGTGACTGTCATAAATGGCAAGCCTCACTTTTACGAGCCTGAGAGTT
+TGAAAAATGCTAGGGATAAGTTTACAAGTCTTTTGGCTCAGCATGTACCACCCAGTAAGT
+TAGATGGTCCTATCCGTCTGACAGTCAAGTGGCTATTTCCCAAAATCAAGGGCAGCACAA
+ACGGACAGTACAAAACGACAAAACCAGATACCGACAACCTGCAGAAGCTGCTTAAAGACT
+GCATGACCGAATTGGGATTTTGGAATGATGATGCGCAGGTTGCTTCGGAAATTATTGAGA
+AGTTCTGGGCTGATACAGTAGGAATATACGTAAAGGTGGAAGAGTTATGAAAATTGATTA
+TATTAATTTTTTTGAACAAGTGGTTCCTGACTGGATGAGAGAGAGTAATGTCAAAATGCA
+AGAAGTTGGATTTAATACTGAAGCGTATTGGCAATGGGCAAATCAATCTATTGTTGCAAT
+CTGCGAAAAGTACGGAAATGACAGTCTGATCAATGGGCAGTTTCATCTGATTTGGGAATG
+GTTGGAGGATAAAGCAAACGGAGGTTAACGATGACTGAAGAGCAAGAACTAATAAAACCG
+CTGCTAGAAGAGATAGAGCGGAAAGATGATAGATTGTATATGCAGTCTAATGTAATTGCC
+GTCTTAATGACAGCAGTTCTTATGTTACTGATGATAAGTATAGCCTTACAAAACCACTAC
+GAGTCGCAAATCACAGGACTACGTACACAGCTAAGCAGGACACAAAAGCAGCTTAAACGT
+GCTAGCGAAGATAGAGCTAGACAGACAAAGCGAATTGCGGAACTTACGCACAACGGAGGG
+TAACATGATTAAGATCGATGAGATACATCGCATACTAGGCATCGACGAAGTTTATAAAGC
+ACCCAAACGACTTACGGACATACTCTTTGATAAAGATAGTCGTGAGGATATATTTAGACA
+GTTTTTGAAATATGAAACAGATGTATCTTACGACTGGTTTATGCAATATTTTGAGGAAGA
+ACAAGCTGACCGCAAAAATAAAAAGCAAGACTTTACTCCTAAATCGGTTAGTACACTATT
+ATCTAAAATAATAAGTGGTAATCAATACTACGAGGTAGCAGTCGGGACGGGTGGGATACT
+TATCCAAGCATGGCAAGAACAACGATTAAATGACAGTCCATTTACTTATCGTCCGAGTAA
+ATACTGGTATCACGTAGAAGAGTTATCGGACAAAGCAGTACCGTTTCTACTCTTTAATAT
+GTCTATAAGAGGGATAAATGGTGTGGTGGTGCATGGCGACTCTTTAACAAGACAAGTTAA
+AAACATTTATTTTTTGCAAAATACAAAAGACGACATGCTGAGTTTTAGTGATATTAACGT
+TATGCCAAGGACTCAAGATATTGAGCGAGAATTTAATGTCAAAGAGTGGATTGGTGATGG
+GATAGAACACATTGAAAATCCACTAATTGAATGGATATAACCAATAACGGTATCCCGCAC
+GTTCGACTCGTGCGGTTGGTATTGACCGAAATTGAAAAATAGAAACGAGGACCTCCTTAC
+ACCAAAACAAAATCTAACGCTGGTTATCGGTCACTGGCTATTATTTAAGGCGCTAATACT
+GACATCGTACGCCTGTGTCAAAATAAAAAAAGGAAGAGAGGGCTTTTCTCCACAAAACAA
+AAAGACGTCCACACGGAACGCCCCCTTGGTTAAATTTAAGCTTAAATAAATTATACCATA
+CTGGAGGCTTTCATGACGTTTTTTCCTGAGATTGATATCCAAAAAACAAAATCCAATGCC
+AAGCGTAAATTGAGAGAGTATCCACGCTGGCGAAGGATAGCTAATGACGTAGATACTCAA
+AAAGTTACAGCTACTTACTCCTTTGAGCCAAGGCAATCACATGGGGTTCCTAGCAAACCG
+GTTGAGAGACTAGCGCTAAACCGTGTGTCAGCAGAACAAGAGCTGGATGCGATTGAGCAA
+GCCGTCAGTATGATACTAGAGCCAGAGAGACGCAGGATTTTGTATGACAAATACTTAGCG
+CCTTATAAAAAGGCAGATAAGGTTATTTATACAGAATTGTGTATGTCAGAGAGCTTTTAC
+TATGATACACTTGACATTGCTTTGTTAGCTTTTGCAGAGCTGTACAGAGAGGGTGTGTTG
+CTTGTTGAGGAAGGAGTTTTTAGCTAGTTTTTATACAGTAATAAGATAGTTTATACATAT
+TTTTACATGTTATTATAGTATTATCAAAATAACAAGAAGAGATAACCTTTTAATCACTGA
+CTATTTTATTTAGTCGCCAACTTTAACTACGATCAAACTTGTTATTTTATGGTATGTGGG
+ACGTGCAGGTTCGATTCCGACTGTTCCTGTGAAAAGCTCTAAGAAGCCTACGGGCCTTAG
+GAGCGATGAAGTTAGAGAATTGCATATCGCTCTAACTCAATATGCACTAGTCATCACACC
+GTGGTGGCTTTTTATTATGTAAAAAAGGAATAAAACATGGAGTTTGTGGACAAAAAATTA
+AGTGAAATAACACCTTATAAAAATAACCCTAGAAACAATGATGAGGCTGTTGGACCAGTT
+GCTGAATCTATTAAAGAGTTTGGTTTTAAAGTGCCTATTGTCGTTGATAAAAACGGCGAA
+ATCGTAAACGGCCACACTCGTTATAAAGCAGCCCAAAAATTAGGGCTAGAAACAGTTCCT
+GTTATTGTCGCAGATGACTTATCTGAAGAGCAAATTAAAGCGTTCAGACTTGCTGACAAT
+AAAGTTGGTGAGATTGCGGTTTGGGATTTAGATTTGTTAAACGAAGAATTAAACGACATT
+TTAGACCTCGATATGTCTGCTTTTGGATTTGACGTTTTAGATAATTTAGATGATTTAATC
+GAAGATGAAAAAGATTTAGACGATTTTACAGGGACTGTGCCAGATGAGCCAAAGTCAAAA
+CTTGGTGACATTTATCAACTTGGTAGTCACAAGTTGATGTGCGGCGACAGTACAAATGGA
+GCCGATGTTAAAAAACTTATGAATGGAGAATTAGCTGATTTACTACTTACAGACCCACCA
+TACAACGTGGCTTATGAGGGTAAAACAAAAGATAGTTTAACTATAAAAAACGACAGTATG
+GATAATGACAGTTTTAGACAGTTCTTGGTTAATGCTTTTAGTTCTGCAAATGAAGTTATG
+AAGCCAGGCGCTGTTTTTTATATTTGGCATGCTGATTCAGAAGGCTATAATTTTAGAGGT
+GCTTGTTTTGATATCGGTTGGACAGTACGTCAATGCTTAATTTGGAATAAAAACTCAATG
+GTTCTCGGTCGCCAAGATTATCATTGGAAGCACGAACCTTGTCTTTATGGCTGGAAAGAT
+GGCGCTGGTCACTTGTGGGCTTCAGACAGAAAGCAAACATCAGTTATTGATTATGAGAAA
+CCTCAACGAAATGGCGTTCATCCAACAATGAAACCTGTCGGACTTTTTGATTACCAAATC
+AAAAACAACACAAAGGGAAGCGACATTGTCCTTGATTTGTTTGGTGGCTCTGGGACAACG
+TTAATTGCTTGTGAGTCAAATGGTCGTCACGCTAGATTAATGGAATATGACCCAAAATAT
+GTAGATGTCATTATAAAACGCTGGGAAGAATTAACTGGAGAAAGTGTTATACAACTAAAC
+TAAAAATCCCTTAAAACCGTTGACTTAACAGTGTTTCAGAGCTATCATGTGATCACAAAG
+ACAAAGAGGTAAATAACATGCTAGTAACAAAAGTAATTCACAAAATCTAAAATATTGAAC
+CAAGCGAAAAAGATTCGGCCTTAAAATATAGATACGCCAACGAACTTGAGTATCTCGTTT
+ACAATCTGTTTTATAGCGCAATTAAAGAAATAACTGCAAAAGATATCAAAAATAACTTTT
+TTTATCAAGATGATCAAGCCTTTATTATTAATTGGCTAGGACTATAAAATAATTTTAAAA
+GGGCGAAAGCCTTTTTTTTATATTTAAAAGTAAGGAAGTGAGGCGATGGCAAATGAAGAT
+AATTTGATACCAAACTCCAAACGAACCCCGAGCGAACTCCGAGAAATTGCAAAAAAAGGA
+GGCATAGCTTCCGGCAAAGCTAGGAGGGAAAAAGCGAATTTGAGAAAAGCTGTGGAGCTG
+GTGTTAGGATCAACTGTACCAAGCGCCTTGCTTCGAGAACAATTAGAACAATTGGATATT
+TCCCCCACAAATCAATCAGCTATTGCACTCAAGCTTGTGGAAAATGCTTTAAAGGGTGAT
+GTTAGATCTGCAGAGCTATTAGCTAAAATTACAACTACCGAGGTCAAAGATAGCCTGGAT
+AGAAAAGAACAAAGACAGCGAATTAAGGCCGCGGAGCTCGCCACAGACGAGCAACGAACG
+CGCATCGAGCTGCTTAAAGTCAAACTTGACGCAGAGAAGGGCGCTAAGCCTGATACTAGC
+TTAATGAGAGCCTTGTTAGATGCTGTGGAAGGAGGTGATTAGCCTTGGAGATTATCTTTT
+CAAATAAACAAAAAGACGTCATTAGACGCCCTTTTAACTACGAATTAGAGGTCAACGAGG
+GCACTTGACCCCTCGTAGCGGAAAGACCACAGCTGGGCATTTTCGTTATGCTAGGTATCT
+GATTGAGTCAGAAGATGAAAATCACCTTGTGACTGCTTATAATCAAGAACAAGCTTATCG
+TTTGTTTATCGACGGCGATGGTACGGGTTTGATGCATATATTTGACGGTAACTGTGAAAT
+AAAACACGACGAGCGTGGAGATCACTTGTTAATCACGACACCAAAAGGCAATAAGCGCGT
+TTATTATAAAGGCGGCGGTAAAGTTAACAGTGTTGGTGCTATTACAGGTATGTCTTTAGG
+ATCAGTAGTATTCTGCGAGATTAACTTACTGCACATGGATTTTATCCAGGAGTGTTTTAG
+GCGTACTTGGGCGGCTAAGCTACGTTATCATCTAGCAGATTTAAATCCCCCAGCACCTCA
+ACATCCAGTAATTAAAGATGTCTTTGATGTTCAGAACACGAGGTGGACTCATTGGACCAT
+GGATGATAACCCAATACTAACCGCAGAGCGTAAACAAAACATTATCAACAGTCTTAAAAA
+AAATCCATATCTATACAAACGAGATGTACTTGGACAGCGGGTCATGCCTCAGGGAGTTAT
+TTATGGCCTTTTTGACACGGAAAAAAATGTTTTGGATGCTTTGATTGGCGAACCAGTAGA
+GATGTATTTCTGTGCAGATGGAGGTCAATCAGATGCCACCTCTATGTCTTGTAATATCGT
+AACAAGAGTTAGAGATAACGGTAGGATAAGCTTCAGACTTAATCGTGTAGCTCACTACTA
+CCACAGCGGAGCTGACACTGGCCAAGTAAAAGCTATGTCAACCTACGCTTTAGAGTTAAA
+AGTTTTTATAGACTGGTGCGTTAAAAAGTATCAGATGCGCTATACAGAGGTATTTGTGGA
+TCCTGCCTGTAAATCTTTGAGAGAGGAGCTGCATAAGTTAGGAGTATTTACTCTGGGAGC
+TCCGAACAATTCTAAAGATGTATCTAGCAAAGCAAAAGGTATTGAGGTCGGTATCGAACG
+CGGCCAAAACATTATCTCAGATGGCGCTTTTTATCTTGTTAATCATAGCGAAGAAGAGTA
+TGACCACTACCACTTTTTAAAAGAGATAGGGCTGTACAGTCGTGACGACAATGGCAAACC
+TATTGATAAAGATAACCATGCCATGGACGAGTTTAGATACAGCGTCAACGTGTTTGTGCA
+TCGGTATTACAACTAAAGGAGTTGCTTAAATGGGAGTAATCCAAAAAATAAAAAATCTTG
+TTACAAGGAGTAAATACGTGATGACAACGCAGAGTCTTACAAATATAACTGATCATCCTA
+AAATAGCTATCAGTAAGCTAGAGTACGATCGTATAACAACCAATCTAAAGTATTATAAGA
+GCGATTGGGATAGTGTTTTATACTTAAACACGGACGGCGAGACTAAAAAAAGAGATCTTA
+ACCATCTACCAATTGCACGGACAGCTGCTAAAAAGATTGCCAGTCTAGTCTTTAACGAGC
+AGGCAGAGATTAAGGTTGATGATGATGCGGCTAACGAATTTATTAGTGAGACACTAAAAA
+ACGACAGGTTTAATAAAAACTTCGAGCGGTATCTGGAGAGTTGTTTAGCGTTAGGCGGAT
+TAGCTATGAGGCCTTATGTGGATGGTGATAAAGTTAGGGTAGCATTTGTTCAAGCGCCTG
+TTTTTTTGCCGCTGCAGAGTAATACGCAAGACGTTTCGAGTGCCGCCGTCGTCATTAAGT
+CCGTTAAGACAATCAACGGCAAAGAGGTCTACTATACCTTGATAGAGTTCCATGAGTGGC
+AGAGCTCTGATGATTATGTTATCTCAAATGAGTTATATCGCTCGGATGATAAAGCCAAAG
+TAGGTAGCCGAGTGCCGTTATCTGAGGTATACAAGGACTTAAAAGACGAGGCAAAAGTTA
+CAGATGTGACTAGGCCTATCTTTACTTATCTCAAGACCCCTGGAATGAATAACAAGGATA
+TTAATAGCCCACTTGGGCTATCTATCTTTGATAACGCCAAGACAACGATTGACTTTATCA
+ATACGACCTATGACGAATTTATGTGGGAAGTTAAGATGGGTCAACGTCGAGTTGCTGTGC
+CAGAGAGTTTGACCGCTTTAACTGTTCGTACCGCTGATGGCGATGTTGTTCCAAGGCCTC
+GGTTCGAGTCTGATCAAAACGTTTATATCCGTATGGGCGGCAGGGATTTAGACTCAAGCG
+CAATACAGGACCTAACAACCCCTATTAGAGCTGATGACTATATCAAGGCTATCAACGAGG
+GCTTGTCGTTGTTTGAAATGCAAATAGGCGTATCCGCTGGGTTATTTAGTTTTGATGGCA
+AAAGCATGAAGACTGCAACAGAAATCGTCTCTGAAAACTCAGACACCTACCAAATGCGTA
+ACAGTATTGTTACTTTAGTAGAGCAATCGCTAAAAGAGTTAGTTATCTCTATTTTTGAGA
+TTGCTAAAGCTTATGATTTGTACCAAAGCGAAGTTCCAAGCATGGATAACATCAGCATAA
+GTCTTGATGACGGTGTTTTTACAGATCGAGACGCTGAGTTAGACTACTGGATAAAAGTTG
+TTAATGCTGGCTTTGGCACTCGTGAGATGGCCATCCAAAAAGTGCTAAACGTGACAGAGG
+AAAAAGCCCAAGAAATAGCTGCAGAAATTAATACTGGAATCGTTGACGAAATCAATCAAC
+AGCGCACTGATACACATTTATACGGAGAGTGATTAGATGAAAAAGAAGCCTATTAAGTTA
+AATGACGAACAGCTTCTTTTGGAAGCTAGTCAGTTATCTGATATGTATCATCAGCTGACT
+CTTGATTTATTTGATCAAGTGATTGAGAGGATAAAAGCCAGAGGCTCAGCGAGCTTAGCC
+GATAATCCTTATCTTTGGCAAGCTAATAAGTTACATGACGTTGGACTGCTTAATGCAGAT
+AACATCAAGCTTATTGCAAAGTATTCTGGCATTGCGGAAGCTCAACTTCGCTATATTATC
+AAGAATGAAGGATTTAAAATTTATAAAAACACGTCTGAGCAGCTAGAAGAGGCTCTAGGT
+AGAGAGTCTGGGGTAAACAGTACTATCCAAGACGACCTATCTAACTATGCTAGACAAGCT
+ATTGATGATGTGCATAATTTGACTAACACCACCTTGCCATTTAGTGTTATAGGAGCTTAT
+CAAGGGATAATCCAAGACGCTGTTGCTGGTGTGGTGACAGGCTTAAAAACGCCTGACCAA
+GCTATCAATCAAACTGTGATTAAATGGTTTAAAAAGGGGTTTTATGGTTTTACAGATAAA
+GCTGGGAGAAAGTGGAGAGCAGACTCTTATGCTCGTACCGTTATCAATACTACGACTTGG
+CGAGTCTTTAACGAAGCCAAAGAAGCCCCTGCTAGGGAGTTTGGCATTGATACCTTCTAT
+TACTCAAAAAAAGCTACAGCTAGAGAGATGTGTGCACCTTTGCAACATCAAATTGTCACT
+ACTGGCGAAGCGAGAGAAGAAGGAGGGATAAAAATCTTAGCTTTATCTGATTACGGGCAT
+GGTGAGCCTGATGGATGCTTGGGAATCAACTGCAAGCACACTAAAACGCCGTTTGTCGTC
+GGTGTGAATAGTAAGCCAGAATTGCCAGAGCATCTAAAAAATATCACTCCTGCACAAGCT
+AAAGCTAATGCGAATGCGCAAGCTAAGCAGAGGGCAATCGAGAGATCAATACGTAAGAGT
+AAAGAGCTACTGCACGTTGCGAAGCAATTGGGTGATAAAGAGTTGATTAGGCAATATCAA
+TCGGATGTTAGAAGTAAACAAGATGCACTCAATTATCTGATAAACAACAATGCCTTTTTA
+CATCGCAATCAAGCCAGAGAAAAGCGTTACAATAATCCTTATACCAAAACTCAAAGTGAA
+GTCGAAGTTAGAAAAGAAAAAGCTAAATTAGATAAACGTAGGGATGTTGAAAGTGCTATA
+ATAGGAGTAGAAACTAGTGAAGGGATACCGCTAAAAATAACAAAGCATTTAGCCGAAAGG
+GCGGTGCTGAGAAATATAGCACCTATTGATATTGTCGATTCTATAAAAGAACCGTTGAAG
+ATAGCTCCTATTAAGTACGATAACCTTGATAGACCTTCCCAGAAATACATTGGTAAGTGT
+GTCTCGACAGTAATAAACCCGATAGACGGAAATATTGTTACAGTTCATGCTACTAGCACG
+AGAATCCGCAAAAAATATGGAGGAAATTGATGAAATTAAAAAGTATTTTAAATGATAGTC
+AAATCGATTTTGTCAAAAATGAACTTCCGGGATTACCTGTGGATATAGATGTTAATTCCG
+AAAAGTATGATGTTTTTTGTGAAGGTATAGAGACTTACTACCAGACAGAAAGCTTTGATG
+AAAAGTACAATATAACAGCTAAAGGTAAACTAGCTGAGAGTATTATTGATTTACTGACTG
+ATAAAGGTTATTGGTGACTAGTACACCAAACTACGACTTATTAAATCTAGAGCATTTAGC
+TAAAAGCTAGGTGCTTTTTTGTACTTAAAAAATAGGAGGGAACATGAATAAACGCATTAA
+GAAAAAACGTAAACTAGAAACAGCAGTTGTGATGCTTGTTGCAGAAAATGCCATGCAGGT
+TGAAGCAATTAAAAATCAAAACAAACAAATCATGGAGCTAAAATCAATCGTTCAACGAAA
+CGCTCTGGCAACAAACGAAGAGTTAGCGACTGTTAAAGCTGCTACTTTAGATAACCAATC
+AGTTATCAAGGCAATTGGTGACACGGTTGACTATATTAAGAAAAACTACAAACGGAAGTG
+GGGGAAATAAAGTTTAACCGTGTCGAATTCGACCCCTTTAGAAATCAAAGTCGTAGCAAT
+ACGGCTTTTTATTATGCCTTTATCCGCAGGCGTTAAAGAACGGAAATCAGCGACCTATCG
+CATTTATAGGAGGGAATGCACATGGAAAATGTGACAAACGAAAATGTCGACCAAGAGACT
+ACTGACTTGGAAAATAATCAACAAGAAGATAAAGCATTTACACAAGATGATCTCAACCGA
+GTGGGAACTAAAGAGCATTCTAAAGGCTATAACAAAGCAGTTAAAGACTTGGGTTTTGAT
+GATGTAGAGTCTGCCAAGGATGCACTAAAAGCCTTCCAAGAGTGGCAAGAGTCACAAAGA
+AGCGAGTCAGAAAAACAAACAGAAATCTTGAATGCTAAAGACAAAGAGCTTGAGGAAGCT
+CGGGCAAACAATAAGGCTCTTAATGCAAAGCTAGCAGCAATGTCTTTAGGTGTGAACGCT
+GAATCTATTGATGATGTGATTGCACTATCTGAGCGTCTTGTCACTGACGAGACAAGCATA
+GAGGATGCAATCAAAACGGTTTTGGGTAAGTATCCTCACTTTGGCCAAACAAAGGATAAA
+GCTCCCAAAATCACAGTGGCAGGCAACCCGTCTGCTGATAACGGACAAGGTTCGGTGTCT
+AAGGAAGACTTTGCAAAGATGTCTTACCAAGAAAAACTGGACCTAAAACTAAAAAATAAG
+AATCTTTATGACCAATTGAAAGGAAATTAAAAAATGGCAGTAGGAACAACTAAAATGGCA
+CAAATGCTAGACCCTGAGGTTCTAGCGGATATGATTGACGCAGAGGTAGGGAAAGCGATT
+CGCTTTGCTCCTCTTGCTGAAGTAGATACAACTTTAGAAGGACAACCAGGTACAACTTTA
+ACAGTGCCTAAATGGGATTACATTGGTGACGCAGAAGATGTTGCCGAGGGTGAAGCTATC
+CCAATGACTCAACTTGGCTTCAAAAAGACTACTATGACCATTAAAAAAGCCGGAAAAGGT
+GTAGAAATCACTGACGAAGCTATCTTATCTGGGTATGGGGATCCTGTAGGTCAGGCAGCA
+AAGCAAATCGTTGAGGCTATTGACCACAAAGTCGATGCAGACGTGCTTGATGCGTTAAGT
+AAATCGACTCAAACTGTGGAAGCTACTGCTACGGTTGATGGTGTATCTAAAGCGCTAGAT
+ATTTTTAATGACGAAGATGACGCAGAGACAGTCATTGTCATGAATCCGGCGGATGCCTCT
+ACCCTACGTTTAGATGCCGCGAAGGAGTGGTTAGGTGCTACCGAGGTTGGAGCAAATCGT
+GTTGTCTCTGGTGTTTATGGTGAAGTTTTAGGGGTACAAATTGTGCGTTCTCGCAAATGC
+CCTAAAGGAACTGCCTACATGGTTCGCAAAGGTGCACTACGTATCATGCTTAAACGTAAC
+ACAATGGTTGAAACAGACCGAGATATCACAAAAGCGATTAATCAAATCGTAGCTAATAAG
+CATTATGGTGTTTATCTTTATAAGGCAGAAAAAGCCGTCAAAATTACACTTAAAGATGCC
+GCAAAAAAGTAGCTAAGGCTAAGGCTGCCAAGAGAGAGGAAGATGACGCTCTCGAGTCTT
+AGCCGATGGAGGTGGTTATTATCGCTTTTTTAACGCAAAAAGAATTTGAAGATTTGGGTT
+TTGACGAGGTAGAAGATTTTGAAAAAATGGAAAAACGTGCTAGCCACGCTGTCAATCTTT
+ACTGTCGTAATCGCTATGATTACAAAGATTTAAAAAAAGAAATAGCCCTAGTGCAAAAGG
+CTGTAAAGCGGGCAATCGCTTATCAGATAGCATATTTAAATGACTCAGGAGTAATGACAG
+CAGAGGATAAACAATCCTTTGCTGGAATATCTCTAGGACGGACAAGTATTAGCTACACTG
+TCGGGCATGGCCAAGGCAGCCAACAAAAAACTCTGGCAGACAGGTTTAATCTCTGTCTAG
+ATGCAGAGAATGAGTTACTAGCTGTTGGGTTGGGATATACGGGTATTAGCTATGATCGAT
+AAAAGACTGCTTATTGACGAACTGCAGGTAAAACTTGTCAAAGATAAAGGTGATTATGGA
+GGGTTTGTCTATGACGAACCTTTTACACTCTCTCCCGTTAGGTTTGACCGTAATCTTGCA
+ACCGCAGGTAAAGATAATGCAAGGCAAGAGACTAAGCCGTCGGTTATCTTTATTTATCCT
+AAATACTGTAAGACAGTAGCCGATAGGTCATGGGTTGATGCTGTTGTCATTGATGGTGAT
+ACTGAGTACACCGTTGATAAAGTGATACCAGTCTACCACCCACTAACAAACAAAATTTTT
+TGTTTTGAAGTGGAGGTTATCTAATGGCTAAGGTAGTGGTAGAGTTGGGAGGCATCAAGC
+GTAAAGTATCTCCGCAAGCATTAGCTAAAGGAAAGCTCATCATGAACAACCAAGTCATGA
+TGTCCATGAACCCTTATGTTCCTTACAGAGACGGAGCTTTGAGAGGAAGCTCGAGAGCTA
+ACAGTGTAGGTGTAACGTGGAGCGGACCACACGCCAGAGCCCAGTTTTATGGTGGTGCTT
+ACAACAAGTACAAGTCCTTTAAATTTAAAAAGTACACAACACCAGGTACAGGCAAACGTT
+GGGATAAACGTGCGTTAGCTAATGCAACAATTGTCAAGGATTGGGAAAAATCCTTACTGA
+GAGGAATGGGATTTAAATGACAAATGACTTTGCAACTGTTTTGAGGCAATTTGTCGAAGG
+ATTAGACTTAGGCATAAAGCCCAGACTTGACTATCTAACAAGACAAGAAGATTTAGCCAT
+TTATCCAATGCCAGGTGGGAAGGTAAATAACGAGTACATGGACGGTACTCGTGAGATAAG
+CCTGCCTTTTGAGATTGCAATCAAAACTAAAAATCAGGAGTTAGCAAGCACTGTGATGTG
+GACTATTAACAGTGCTTTGTCTAACTTTGACTTAAAATTACCAAGTCTTAATCATTCGTA
+CACATTTATTAGCCTTGATGTCGAAAAGCCGTTTTTAAATGACTTAAGCGATCAAGGTTT
+TTATATTTATGTGCTGGATATTACAGCACACTTAGAAATAGAAGGGAATAACTAATGAGA
+CAAAAGAACGCCCTACGTGGGCATTTTATCGCACCTTATGTAAAAGGTGAGGAAAAGACA
+GAAGTTACAAAAGAGAAGCTTTTGGAATTGGCTAGATGGATTAAAGACATCTCAGACGAT
+ACCGACGAAAAGACAGAAGATGAGGCGTACTATGACGGAGATGGAACAGAAGAAACAACC
+GTTGTAGGAGTTAAGGGCGCGTACACTTTCGAAGGGACGTATGATCCAGAAGACAAAGCT
+CAAGCTCACATTGCAAGTCTTAAGTATAAGCTAGGAGATGAGCGAAAAGTTTGGCATTTG
+ATTGTATCGGCTGATGGGAAAACCCAGTGGCTAGGGGTTGCAACAGTGACAGAAATTATT
+GCTGGTTCTGGTGCTGCCGCCGATTTTGAAGCCTTTGGTTGCAAGATTACTTATAACTCT
+CTGCCAAAGGAAAGCAAGGAAATTATACCTAAAAAAATGAATTGAGCGTAGCGATGTGAG
+ACAAGGGTGGGCTAAACCACCCTTTTAAGGAGGAATTATGTCTGGAATTGTAGTTGACCT
+AAAGCGCACAGGGTTTCCGGTCAAAATTGGGCAGGTAGAGCTTTGGTTTGATACAAGCCA
+AGAGCGATTGATTGAGTTTTTTGATATTGAGACAGAAGTAAATCGTCGCCTCAATGAATA
+CGAAAAACAGGTTATCGAAGCCAACTTAGACAACGAAATTGAAGATAAAGGGGTTACGAA
+AGATGTTGCCCAAAGTGCTTTAGATTTGGAAGCTAAATACTTAGAAATCAATTATGATCT
+ACTATTCGGAGAAGGTACATTTGCACAGCTCTACGCGGAGTATCCCGACAAAGAAGCACT
+CGAGAATACTCTGGAAATTGTTTGCAGGGAAATCGAGGTCAAACTCAAAGAGTTAGCTAT
+CGAAAGAGAAAAAATCGTTAAGCAGAAAACGAAAAAGTACAAAAAGGAGTAGCCTATGAA
+ACTAAACGATCCATTAGTAGAGTCGTTTGAGTTTAGAGGTGAAATCTATCCTATTGATTT
+GAGCTTTAACAAGGTTTTAGATGTCTTTGATGTTATTGATGATGATTTTTTAAACGAGGC
+GGAAAAGTGTTTTTTGTGCCTTGATATTTTGCTAGATAGGACAGATTTACCTTTTACTTA
+CGCGGTGGATCTTTGGGTTTATATCAAAACCAATTTTATCGATGCAGAAAGGCCCGAGAA
+ACCTCAGCTCGACATCAAAGGGAATCCAATGCCTGTAGTAAAAGAAAAAGAGGATAACAA
+AAAAGTCATTGATTTGAGTTTAGACGCTGAGTTTATCTATGCGAGCTTTAGGCAAGCCTA
+CCAAATCAATCTTTTAAAAGAGCAAAACAGATTGTCTTGGATTGAATTCAAGGCTCTTTT
+AAATGCTCTTCCAGACGATACTGTCATGCAGCGTATCATAGCCATTAGACAGTGGGAAGA
+TGATGGTGAAGGCAGTAAAAAATACAGAGATAACATGCGTAAGCTAAAGGCTAAGTACAG
+TTTAGATGAAAGAGAGGAGGAGGACGATGGCAGCTGATGGTAAGGTAACGATACTTGTTG
+ACGTTGATGGTAAGCAGGTAAAGGTACTCAATAGTGAGTTAGATAAAGTTGCCAAGCACG
+GTGACAAAGGCAGCTCCTCTCTTAAAAAATTTGCGGTTGGTGCAGGAGTCTTTAAATTAG
+CTTCGGCTGCAGTTGATTTGGTTAGTCAATCTCTTGGCAAGGCTATCACAAGATTTGACA
+CGCTTGAAAAATATCCAAGGGTCATGAAAGCTATGGGGCATAGCGCTGAGTATGTTGCTA
+GATCAACTGATAAGTTAGCGAACGGAATTGATGGACTACCAACAACTTTAGACGAGGTTG
+TCGGAACCGCTCAACGTTTGACCTCTATTACTAAGGATATCAATAAATCAACTAATCTCA
+CACTAGCATTAAATAATGCCTTTTTAGCTTCAGGAGCTTCATCAGAGGCTGCAAGCCGAG
+GGCTGGAGCAGTATGCCCAAATGCTATCAGCTGGTAAGGTTGATATGCAAGCTTGGAAAA
+CCCTCCAAGAAACAATGCCTTATGCCTTGCAACAAACTGCGGAAGCTTTTGGATTTGCAG
+GGGCATCAGCTCAAAAGGATTTTTATGAGGCATTAAAAAACGGGCAAATAACATTTGACC
+AATTTTCTAATAAGTTGATTGAGTTAAATGATGGTGTCGGCGGTTTTGCAGAACTAGCCA
+AAGAAAATAGTAAAGGGATTGAAACCTCTTTTAACAACATCAAGAACGCTATTGCAAAAG
+GTGTGGCCAACAGCATTAAGGCTTTGGATGATTTATCTAAGGCTGCAACAGGTAAGGGCA
+TAGCTGATCATTTTGATAGTTTGAAAGTTGTTATCAATGCCTCTTTTAGCGCCATCAATG
+CAAGTATTAAAGCTAGTACATCGCTATTTAAACTTTTGTTTAGTGTTATTGGTGCTGGAA
+TATCAGTCGTCAAAGCTCTGTCGCCTGCCTTAGTTGGTGTAGCATCTGGTCTAGCTGCCA
+TGAGGGCAGTTAATGAGACTATAACAATGATTAAAGCGCTAAATAGAGCTTGGGTTATGG
+CATCTGCATCAATGAGTATTGGAGCAACAACCATTAAGACTGTGACTGCGGTACAAGCGG
+TAAGTACCACGATGACTAAAGCAGATATGGTTGCAAGACTATCTCAGTTAGGTGTCTTAA
+AAGCCAGTACCGTGATTTATGGTGTTATGACAGGCGCTATCAGTTTATCTACTGCTGCAA
+CCATAGCCAGTACTGCTGCGGTAACTGCGTTAAAAGCAGCACTTGTAGCCTTAACAGGTC
+CCGTTGGTTGGGTAGTTGGAGCTATCGGTGCTTTAGTTGCTGTCGGAGTAAGCTTATGGT
+CATGGCTAACTAAAGAGTCAGACGAGACCAAAAAGCTGAAAAAAGAGCAGGAGGGGCTAG
+TCGAAAGCAACAAACAGCTAAGAGATTCTGTCCGTGAGGGCGTGCAAGAGCGTAAGAAGG
+GCCTTGAGTCCGTCAAAGAGAGCACTGCAGCTCATCAAAAATTAGCTGACGAAATCATTA
+AGTTAGCCGCCAAAGAAAACAAAACTGCAGGCGAAAAACAAAACTTAAAAAATAAGATTG
+ATCAGCTTAATGGGTCTATTGATGGCTTAAACTTGGCCTATGACAAAAACTCCAATTCTC
+TTTCTCACAATGCAGATCAAATTAAGTCACGCATTAGTGCCATGGAAGCAGAAAGCACAT
+GGCAAACAGCACAACAAAACCTGTTAAATATTGAACAGAAACGTAGTGAGGTTAGTAAAA
+AGCTAGCTGAAAATGCCGAGCTACGTAAAAAGTGGAATGAAGAAGCTAACGTCTCCGACT
+CTGTCCGAAAAGAAAAGATTGCCGAACTCACAGAAGAAGAGGGTAAGCTTAAAAATATGC
+AGACTCAATTGCAGGAGGAGTATAACAAGACATCAGCTACTCAACAAGCTGCTGCAGACG
+CTATGGCTGCCGCTGAAGAATCAGGATCAGCAAGACAGGTTATAGCGTACGAAAATATGT
+CAGAAGCTCAACGAACTGCCATAGACAATATGCGCACTAAGTACTCTGAACTTTTAGAGA
+CAACGACATCTATTTTTGATGCTATCGAACAAAAGACTGCTCTGTCAGTGGAGCAAATGA
+ATGCCAACCTTGAAAAAAATAGAGCTGCTACTGAACAATGGGCTACGAATTTGGAAATTT
+TAGCTCAGCGTGGTGTAGACCAAGGCATCTTGGAACAGCTTAGGCGGATGGGACCTGAGG
+GGGCAACACAGACACAGGTTTTTGTGGATGCCACAGATGCCGAGCTAGCACCCTTGCAGG
+AAAACTTTAGAGCAGCCACAGAAACTGCTAAAAATGCAATGGGGAGCGTTTTAGACTCAG
+CAGGTGTGGAAATGCCAGAAAAAGTTAAAGGGATGGTCACTAATGTTTCTACGGGATTAC
+AGGCGGAACTGCAAGCTGCTAACTTTGCTCAACTTGGTCAAGAAATCCCTAATGGGGTTT
+CTCAAGGTATAAGTCAAGGGGCAGGTAAAGCAAGTGACGCAAGTGTCAAAATGGGTCAAG
+AAGTTAAACGCTCTTTCCAAGGAGAGTTGGGTATCCACTCGCCATCGCGAGTATTTACTG
+AGTACGGTGGCCATATTACTGATGGCTTGAGTAATGGTGTGACAAATGGAACGTCAAAAG
+TTATGCAAACCATGCAGAGCTTGGCTCAACAGATGTCTCAAAAAGGACAGCAGATTGTTA
+ATGACATGCGTAGCAAGTCGAACCAAATCACAGATGCTTTTAGCACGATGAGTGGTCCAA
+TGCACTCTCATGGTGTTAATGCCATGCAAGGTTTGGCCAATGGTATTTATGCAGGGTCGG
+GGGCAGCTTTAGCGGCAGCTCAAAGCATTGCGGCACGTATCACCGCAACAATTCAAAGTG
+CCTTAGATATCCACTCGCCATCTCGTGTTATGAGGGATGAGGTTGGACGTTTTATCCCTC
+AGGGTATCGCTGTAGGTATTGATGCGGATAGAAAAGTCATTGACTCATCTATGCAAAAGC
+TAAAAGAGTCAATGACGATTAATGCGACCCCAGAAATAGCCTCTGGATTTGGCGGAGGAG
+TTGCGGGGATTGCTAATCAGACCACAAATAACTCAAATAACAGTTTTACCCTTAATGTCA
+AGGTTGATGAATCCGACGGTAATAGCCGCGAGAAATATCAACGCTTATTCAGAGAATTTA
+GCTGGTATATTCAACAACAACAAGGAAGGTTAGGTGATGTTAAATGACAGCTTTTATCAA
+GTTTGATGGTAAAAAATCTTCAGATTTTGATTTGAGAATTATTAATGACGTTGAGCATGA
+CTCGTCCTTTTACGATGTTGATCAAGTTAAGGTACCTGGTCGTGATGGTGTGGTTTTAAA
+GGACAATAAAAGGCTTGAGGCTATTGAACGGTCTTACCCTTTACGTCTATATAGCAAAAG
+ACGACTCACCGAAGTAGAAACTGACATAAGCAATTGGCTGAATGTAAAAGGTTGGAAAGA
+CTTAGAGTTGTCATGGGAGCCTGATTATATCTATAAAGCAACACATATCACCCCTTTTAG
+CATAAAGGAGGTTTTAAGGAATTTCGGCAGACTGAAAATCAACTTCTTAATCCACCCTAT
+CAAATATTTAAAAACAGGTAAGCAAGAGGTGCCTCTCGTTAATGGCGGTACTCTACAAAA
+TCCCGGCAATGTTCAAGCTAAACCTATCCTAAAAATCAAAGGCACAGGCAATGGTATTTT
+AACCATTAATGACTTTGAGACAGGACTTGAAAATGTGCAGAGCGAGCTTGTTATAGATAT
+GGAAAGGCACCTAGTCTATAAAGATGTCCTATCTGCTTGGGATAATATCGTAAGAACAGA
+ACGCCACCGCATGCCGTTATTTGACGTTGGACAAAATAAAATCTCGTGGACTGGTAGCTT
+TACAATTACCGCAGTGCCAAACTGGGGGGTTAAAGTATGATACCAGTTTTGTATGAGGCT
+AAGGAAACCAAGTTTAGGACTTTTGGTCTCGGTGAGATTGCGGATGCTTATGAGGTTAAA
+GCCACTCGTGAGCGCAATGGTAATTACTCACTGTACATCAAATATCCGCTAGATGGTGTC
+TTTGCCTCAGTTTTTAAAGAGGAAATGAAGATTAAGTCTGACGCTGGTCGTAGAACCAAA
+TGGCAGACTTTTGAGATTAATCGGGTACTACGAAATAGTAAAGACCACATCGAGATTTTT
+GCGCGTCATATCTCTATGCGCACACAGGATATTGCTTTAAAACCGTTTGTAAACGGTGCG
+AGCGTAGGAGCCGAATCAGCTTTAGAAATCTGGAAGAAAAACCTTGTCGGTGATGATAAG
+TTTGACGTTAAAAGCGACATCTTAACGCTTGGTAGCTTTAACTGGGAAATTGATAAAATC
+GGCAATGCCCGTGGTGCTCTAGGAGGTGTCGCTGGCTCTATCCTAGATGTTTACGGTGGT
+GAGTACGAGTTTGACAACCGTACAATCATCTTACGCAAGCAAATGGGGCGTAAAGCTCCC
+ACGGTATTGGAGTATGGCCGTAATATCGTCAGCGTAGAGGAGGAGCGATTGCTAGATGGC
+AATTACACCTCTATCTATCCTTACGTAAGATATACGCCACAACCAAAACCGCAAGAGGAA
+CCCCCTGGTAAGCCGCATGTAGGCGAGCATAAACAACCCGAAGAACAGCTAGTGACATTG
+CCTGAATTTATCCTAGATGGTCAGTATCTCAGCTTATATGCTCAGCGCAGAATCCAAATG
+GTTGATTTATCAAGTCATTTTAACGATGACAAAAATAAAAAAGAGCCAACGATCGAAGAA
+ATCCGAAAGCTGGCTCAGAAATACCTTAAGGATAATAACGTTGGTGCACCAAAAGTCAGC
+ATTGAGGTTGATTATATTGACTTGTCACAAACGCTTGACTATCAAGATTTTAGAGTCATG
+GAAGAGGTTGAGCTTTGCGACATTGTACCACTTTATTATCCAAAGTTTGGCATCACAACT
+GAGTCTGAAAAAGTCGTTGAGATTGTCTATGACGTCTATACAGATAGCAACCATACAATA
+AAACTTGGCACGATTGGTCAGTCCATCTCTAAGAGTTTGACAGGTGGGGTCTCAGAGCGT
+ATCAATGCTTTGGAAAATAACCAAAAGGTTATCACCAACAGCCAGAAGCAGTTTGAACTC
+AATCTGCCTAAATACCTCAATGACCTCAATGGTAAACGCGTTTGGTACGAAAAACCAGAT
+GACAATATTGAGCACAAGATAGGCGACTATTGGTTTGAAAAAAATGGCAAGTATCAGCGT
+ACTTGGATTTGGGATGGCAATCAATGGGTCAAGGTACTAGATACAGAGGATTTAAACCCC
+AATCAACGAGCTTTTGATGCCGCAATAGCCGAACTCGAAAAAGCAAAAAAAGCGCAAGAA
+GAAATCAACCAGCGTACTGACAAAGAGCTTGAAGAATTTAGAGCCACCCTCAAAAACCTA
+GCTTTACCAGAAGAAGCGATTAAAAAAATCACAGAGGCTATCAAAGTTGATGACATCCCG
+TCTATTAAACAAAGCTTTGATGACCTCAAAAATAGAGTGAGTGAGACAAGCGAAGAATCT
+CGTTTAACTGCCGAAATTTTAGGAAACAACGGTAAAACCCGCTACAACAAAAATTTATTG
+GTTGGTGAGCCTAATCGCACGAAGTCTTACGACCAGGATTACATCGAGGTAGAAGCCAAC
+GACGGTGGTTTCAAGCGTGGCGAGACCTATACGATTAGCTTTAGCCAGACATGTGAGCCA
+CTCAAAAAAGTGGCTATCACGCTGACACAGGCTAACAACAAGGGAGTTAAGTTAGTGCTG
+ACACCAACTAAAGCAAAAATGGAGTCGCAGACCTTTGACCTCACTAAAGATAAAGAGGCT
+ATCAGTGTTTATCCGTTTAGCTACACAGTGCTTGTAACCAGCGACTGGTATAAATCTAAG
+CAGATAGATTTAAACGCGTCGGAGGTGAAGGAATTGGCTCTGGAGATGGATTATAAAGAG
+ATTGCAGATGCCAAAGGTGCAACTATCACAGGGGCATGGTCAGACAGTCCACAAATTATA
+TTAGACGGAGGTAAAAAATGAGTGAAAATATACCGCTGCGAGTCCAATTTAAGCGCATGA
+AAGCCGCCGAGTGGGCTCGTAGTGATGTCATCTTACTGGAGAGCGAGATAGGCTTTGAGA
+CAGACACAGGTTTTGCCAGAGCAGGTGATGGCCACAATCGATTTAGTGACCTTGGATACA
+TTAGCCCACTCGATTACAATCTACTGACTAACAAGCCAAATATCGATGGATTAGCGACAA
+AAGTCGAGACCGCTCAGAAACTACAACAAAAAGCAGATAAAGAGACCGTCTATACAAAAG
+CTGAATCGAAGCAAGAGCTTGACAAGAAATTAAATCTCAAAGGTGGCGTTATGACAGGTC
+AACTAAAATTTAAGCCAGCCGCCACTGTTGCTTATTCCTCGTCAACGGGTGGAGCGGTCA
+ATATTGACTTGTCGTCTACCAGAGGTGCTGGTGTTGTTGTCTATTCTGACAATGATACCA
+GTGATGGGCCGTTAATGAGCTTGCGGACGGGTAAAGAGACCTTTAATCAATCGGCGCTTT
+TTGTCGACTATAAGGGGACAACAAATGCTGTTAATATTGCGATGCGTCAGCCAACCACCC
+CCAATTTTTCATCGGCGCTTAATATTACTAGCGGCAATGAAAATGGTAGTGCAATGCAGC
+TACGAGGGTCAGAAAAAGCGCTAGGAACGCTAAAAATTACTCATGAGAACCCAAGTATTG
+GAGCGGATTATGATAAAAATGCGGCAGCGTTATCCATTGATATTGTCAAAAAGACAAACG
+GTGCAGGAACAGCCGCTCAGGGAATCTACATTAACTCAACCTCAGGCACGACAGGGAAGT
+TGCTTAGGATTAGAAACCTTAGTGATGATAAGTTCTACGTCAAGTCTGACGGTGGTTTTT
+ATGCCAAGGAAACTTCGCAGATTGATGGCAACCTGAAACTCAAGGACCCCACAGCGAATG
+ATCATGCGGCAACCAAAGCTTATGTAGATAAAGCAATTTCTGAGTTAAAAAAACTCATAC
+TAAAAAAATAGATTAAGGAGGATAAATGAGCAGAGACCCAACACTTATTTTAGACGAGTC
+AAACCTCGTTATTGGTAAGGATGGACGTGTGCATTACACATTTACCACAGAGGACGACAA
+CCCAAAAGTCAGACTAGCTAGCAAGTGTCTAGGCACAGCGCATTTTAATCAGCTCATGAT
+TGAGCGAGGAGACCAAGCTACTAGCTATGTTGCGCCAGTAGTAGTTGAGGGTACAGGTAA
+TCCGACTGGACTATTTAAAGACCTCAAAGAGATTAGCTTAGAGCTGACAGATACTGCTAA
+TTCCCAGCTTTGGTCAAAAATCAAGCTGACTAACCGTGGTATGTTGCAGGAATACTACGA
+CGGTAAGATCAAGACCGAGATAGTCAACTCCGCCAGAGGTGTCGCTACACGTATCAGCGA
+GGATACTGATAAAAAGCTAGCGCTCATCAATGACACCATTGATGGTATCAGGCGTGAGTA
+TCGAGATGCTGATAGGAAGCTATCCGCAAGCTATCAGGCAGGCATCGAGGGGCTAAAAGC
+CACAATGGCCAATGATAAAATCGGTTTACAAGCTGAGATTAAAGCCTCAGCACAAGGGCT
+ATCGCAAAAGTATGATGATGAGTTGCGCAAGCTATCGGCTAAGATCACAACAACCTCAAG
+CGGCACTACAGAGGCCTACGAGAGTAAGCTTGCGGGCTTACGTGCTGAGTTTACTCGCTC
+AAATCAAGGCACGAGGACAGAGCTCGAGTCACAAATTAGCGGGCTAAGAGCGGTACAGCA
+GTCAACAGCTAGCCAAATCTCTCAAGAGATTAGAGACCGTGAAGGTGCTGTCAGTCGTGT
+GCAGCAGAGTTTGGAGAGTTACCAAAGGCGGATGCAGGACGCAGAAGAAAACTATAGTAG
+CTTGACCCATACGGTTAGAGGGCTACAGAGCGACGTTGGATCTCCGACTGGTAAAATCCA
+ATCGCGCCTTACTCAACTAGCAGGACAAATTGAGCAGCGGGTTACTAGAGATGGTGTCAT
+GAGTATTATTAGTGGCGCTGGAGACAGCATTAAATTAGCTATCCAAAAGGCTGGCGGCAT
+TAATGCCAAAATGTCTGGTAATGAGATTATCTCAGCAATTAACCTCAACTCCTACGGAGT
+AACAATCGCAGGTAAACACATCGCTCTCGATGGGAATACGACGGTTAATGGCACCTTTAC
+CACAAAAATAGCCGAGGCTATCAAGATTAGGGCTGATCAGATTATTGCAGGCACGATTGA
+CGCTGCTAGGATTAGAGTGATTAACCTTAACGCAAGTAGTATCGTTGGTTTAGACGCTAA
+CTTTATCAAAGCTAAAATTGGCTATGCTATCACTGATTTGCTCGAGGGTAAGGTCATTAA
+GGCTCGTAATGGAGCGATGCTTATCGACTTAAATACAGCTAAGATGGACTTTAATAGCGA
+TGCCACAATTAATTTTAATAGCAAAAACAATGCCTTAGTACGTAAAGATGGCACACATAC
+TGCCTTTGTACATTTTAGTAATGCGACGCCCAAAGGTTATACAGGGTCAGCGTTGTATGC
+ATCGATCGGGATAACCTCATCTGGTGACGGTGTTAACTCGGCTTCTTCCGGTCGTTTTGC
+AGGGCTAAGGTCATTTAGGTACGCTACGGGATATAATCACACTGCGGCAGTCGACCAGAC
+TGAAATTTACGGTGATAATGTTTTAGTTGTGGATGATTTTAATATTACTCGGGGATTTAA
+GTTTAGACCAGACAAGATGCAAAAAATGCTTGACATGAACGACTTGTATGCGGCTGTAGT
+AGCCTTAGGCCGCTGTTGGGGGCACTTGGCTAACGTCGGCTGGAATACTGCTCATAGCAA
+TTTTACAAGTGCTGTGAATAGGGAATTGAATAACTACATCACAAAAATTTAACAGGAGAT
+AATATGCAATTAACTATTAAAAACAAAGATTTAAACACACTATATCGTGTACTAGACAAA
+ATCAAAATCACTAATATGCGTGCTAATCGTGGCCGTGCTAAGCTACTCGCAAAAGTAGTC
+GATAAAATCAACGAGTATGCAAAAGATGAGACCGACTTAATTGATATGTATGCAGCTAAG
+GATAAAGATGACAAATTTGTCATTGATGAGCACAAAAACATCAAGCTAGCAGACCCCGCT
+AAACTCGACGAGCTCAACGACCTACTCAACGAGCTAGCAGACGAAGAAATTGTGATTAAA
+GGGGGTGAGTACTCCAAGCGATTTATTGACTTTTTAAACTTTTTAGAAGAGTGTGAAGAT
+GAATTTACATCATCTGAAATCATTCTTATCGACAACATTTTGGAACAATTTGAAGAAAGT
+AAAAAAGGAGAATAACCATGAGAAATTGGAAAGTGACAGGAAAATACCCACAATTTGACA
+GCACAGGAGCAGTCGCAAGCACACATATTATTATCACTGCTGAGGATGGCTCAGTCATCT
+CTCAACCAATCAAGCAGGACTTAACCTCAACTAATGACACAGAGATTATCAAAGCTACTT
+TGGAAGAATTTAAAAAATCTGAATACGTTGAAATCGCTATGGGCGAAGCCGTGCAAAAAG
+TAGACGACCTTGAAAAAATCTCACAGGAAACCGCTAAGACCGCTAAAACAGCCCAAACAG
+CCGCAGGATTAGCTAAGGTGTCCGCAGAGCGTACACAGCGAATGATTAACTTGCAAACCA
+TCCACATGTTAACGAGCGGCGGCAAGATTGATTCTGACATTTATAAAGGCATGCTTGAGC
+TAATCGAGCCAGCCCAAAAAGGTGAGTATCAAGCCTATGATGTCTTTACGGTGGTCGACA
+GTACTAAAGAGGAAGACGGAGAGGCTGGTGAAGGTAACCTAGTCTTCGTACACGTTAACG
+AAGCATTTGAGTATGACAAACAAACCTTAGAGGAGCTAGAGTCAGAAGCCAAAGTAACAG
+TTATCAAGTACGCTGATTTGGTTAAACAAGATTAGAGGTGGTTTATGGCAACAGAGTTGA
+TATTTGGCGTTGGTGGCTTTATTTTAGCTATCGTCACGACTTACAATATTTTTAATGCAA
+AATCCATCAAGCATGCGACAGATATTACTTTGTTGCAATCTGAGGTAGAGCATTTAAAAA
+TTGTTACACGCCAAAATGCTCGGCGGCTTGAAGAGCACGCTGAGCAAAATAAAACGTTGA
+TTACAATGACAGAGCAAATTAAAAATTTAACAGATGATGTTAAAGATTTAAAAGATATGA
+TGAGAGGAGAAATCAAATGATCAATTTAAAATTACGACTACAAAACAAAGTAACCTTGAT
+GGCTATTTTGGGAGCTATCTTTTTACTGGCACAGCAATTAGGTATTAAACTACCATCAAA
+CATCGCAGATATTGCAAACACAGCTGTAACGCTTTTGGTATTGCTCGGTGTTGTCACAGA
+TCCAACCACGAAAGGCCTGTCAGATAGTGAGCAAGCATTGACTTACCATGAGCCCAAAAA
+ATAGGAGGAGCCATGCGAGCAATCACACGATTAGCGTTAATACTAGCAATCGCAATACTG
+TATGTGCCATTATCTGTGGTTGCTCTTATCTTTTATCCGTTTTTAGATAAGGAGGACAGA
+TGACCTTTTTAGATAAAATTAAACAAGGCTGTTTAGATGGCTGGGCTAAGTACAAAATCT
+TGCCATCCTTGACCGCAGCACAAGCTATCTTAGAGAGCGGGTGGGGCAAACATGCCCCAC
+ACAACGCTCTGTTTGGTATTAAGGCAGATAGCTCTTGGACTGGTAAATCATTTGATACCA
+AAACCCAAGAGGAATATCAAGCAGGTGTTGTCACGGATATTGTGGACCGATTTAGGGCGT
+ATGATAGTTGGGATGAGTCGATAGCTGATCACGGACAATTTTTAGTTGATAATCCACGCT
+ATGAGGCAGTTATTGGGGAGACTGACTATAAAAAGGCTTGTTACGCTATTAAAGCAGCTG
+GATACGCTACGGCAAGTAGCTATGTCGAACTTTTAATCCAACTGATTGAGGAAAACGACT
+TACAAAGTTGGGATAGAGAAGCTCTTAAAAATAATAAGGAGGAAACGATGACAACCGCAA
+ACGAAATTGTACAATACTGTGTTAACCTTGCTAATTCAGGCATGGGTGTTGACAAAGACG
+GTGCTCACGGGACGCAATGCTGTGACTTGCCTTGTTTTGTCGCTAAAAATTGGTTTGGTG
+TTGATCTTTGGGGCAATGCGATTGATTTATTAGACAGCGCAAGTGCGCAAGGCTGGGAAG
+TCCATCGTATGCCAACAGAGGCAAACCCAAAAGCAGGCGCTACATTTGTCCAATCAGTGC
+CGTATCATCAATTTGGACATACGGGAATTGTTATCGAGGATAGTGACGGTTACACCATGC
+GCACTGTCGAGCAAAACATTGATGGCAATCCTGATGCTTTGTATGTCGGTGCACCAGCTC
+GTTTTAACACTCGTGACTTTACTGGCGTGATAGGTTGGTTTTACCCACCATATCAAGGGG
+ATACAGTCACGCAACCAGTCAGCACCGAGCCGCAAACTTCTGACACTATCGTAGAGACAG
+CAAAAACAGGCACCTTTACCCTTGATGTTGCAGAGATCAATATCAGACGCTGGCCAAGTC
+TAGCCAGCGAGGTTGTAGGTATCTACAAGCAAGGTGATACTGTCAGCTTTGATAGCGAGG
+GCTACGCTAATGGCTATTATTGGATTAGCTATGTTGGAGGCTCAGGTATGCGTAACTACC
+TAGGTATTGGACAGACTGATAAAGATGGGAATCGCATCAGCCTTTGGGGTAAATTAAATT
+AGGAGGTAAAGCTCCGAGATAAGACAAAACCGCTCAGATTATTCTGGGCGGTTTTTTGTG
+TATGATGAATTATTTTTCAAGATAAATATCGAAATGACTAAAGTTCTTCATATTGATAAT
+TCTATTATCTTTATATTTTGCAAAAATATCTGATCTAGTCCCTTCATTTGGTGAGTCAAA
+TAAGTCTATTTGCTCATGTTTCCCATCTTTTGTGCCAATTTCGATTCTGCCGCTTACATA
+AGGAGAAGTAGCGTCATAAATTTTATAATTATCCATAAGGTATTTTCTGATTTTAAAGTC
+AATTTCCTGGAAAGTTACGATATCTTTTTCTAGAATAATTTTGTTATTTAAGTTCTGTTG
+AGATTCTCCCGAAATAAATAGATTTCCCAATAATTTATGATTTACTTTATTATTTTGAGC
+AGGCGTAATTCCTCCATAGATGTACTCACCGGTGTGAGAATTAAGAATATAAAATAATCC
+AAAAACATCTACATGATCATCTCGTTTAAATTTTTGAGAGGCCTCATAAGACATTTCGGA
+ACTAATATAATAGTCTTTCCCTCTATATTTTTGAGTATCAATGTTTAATGTGTGTGTCGT
+TGAAAAATTTACCCTGCAATTTTTATAATCATAAGGAGTTATAGTGTATGCATAAAGTAA
+ATCACTTTTAACATTCGAAATGTCTTTCTTAGAGTCACTTTTGATGATAGGTGAAATAGT
+AGAAATCAGTATGACTGTAATTATGAAAACTATTTTGATGATGTTAATCTTTTTCAT
+>NC_002737.2|provirus_777501_820593
+ATGTATAAAAATATTATCGTAACTGGTGGAGCTGGTTTCATCGGATCTAACTTTGTGCAC
+TATGTCTACAATAACCACCCAGATGTTCATGTAACTGTCCTTGATAAATTGACATATGCA
+GGTAACCGTGCTAACATTGAAGCTATTCTTGGTGATCGTGTTGAGTTAGTTGTTGGTGAT
+ATCGCTGACGCTGAATTGGTAGATAAATTGGCTGCCAAAACGGATGCTATTGTTCACTAT
+GCGGCTGAGAGCCACAACGATAACTCATTGGAAGATCCAAGTCCATTTATCCATACAAAC
+TTTATCGGAACTTACACTTTGCTTGAAGCAGCTCGTAAATACGATATCCGTTTCCACCAC
+GTGTCAACTGATGAAGTTTATGGAGATCTTCCACTTCGTGAAGACCTTCCAGGACAGGGT
+GAAGGACCAGGTGAAAAATTCACTGCTGAAACAAAATACAATCCATCATCACCTTACTCA
+TCAACTAAGGCAGCTTCTGACCTTATCGTTAAGGCATGGGTACGTTCCTTCGGTGTGAAA
+GCGACCATTTCGAACTGTTCAAATAACTATGGACCATACCAACACATCGAAAAATTCATT
+CCACGTCAAATTACAAATATCTTGGCAGGAATCAAACCAAAACTTTATGGTGAAGGTAAA
+AACGTCCGTGACTGGATTCATACTAATGATCATTCTACAGGAGTATGGGCTATTTTGACT
+AAGGGTCGTATCGGTGAAACATACCTTATTGGTGCCGACGGCGAGAAAAACAACAAGGAA
+GTTCTTGAGCTTATCCTTGAGAAAATGGGTCAACCAAAAGACGCTTATGATCACGTAACT
+GACCGTGCTGGTCACGATCTTCGTTACGCTATTGATTCTACAAAATTGCGTGAAGAACTC
+GGCTGGGAACCACAATTTACAAACTTTTCAGAAGGTTTGGAAGAAACTATTAAGTGGTAC
+ACAGAAAATGAGACATGGTGGAAAGCAGAAAAAGATGCTGTAGAAGCCAAGTATGCTAAA
+ACTCAAGAAGTGATTAAATAAAACATTAAAGAACCTTGTCATATCAACGTTTGTTGAAGA
+TATCAAGGTTTTTTCTTGTGTTTTGGGGCATTTTTGGGGCATATTTGGGGTATATTATAG
+CCGGTTTAAGATGTCGACGACTTCATTTTTCATGCTTTTCGTGACGTGGGTATAGATTTG
+TTGAGTAGTTTTCGAGTCAGCATGTCCAACTCTATCCATGATAGTTTTTAAGGGCACTTT
+GTTTTCTGCAAGGCGACTCACCAGGGTGTGACGGAAGATGTGGCTGGTGAGTTCTTTTTG
+AATCGGTTTTTCTAGTCTCTTATTTGCCGCTCTGATAGAGGTGTTGAGGGCGTTGTCTTG
+AATAGGAACACCATTTCTGGAAATGAAGATGTAGCCCATGTCCTTGTAATTAGGATTAGT
+ATTTTTTTCAAGAGCATTAATTTTCAGTATATCCTGAATAATTTCTTTTTCACGTTTGGT
+TATCAATGTTTCACGCCAACTGGAATTTGTTTTAGGGGTGGTTTTGATAGCGTTTCTATA
+GCCATTTGAGGTGTAGTCAAGAGTTCCGTGGATTTCAATGATATCATTTTTGATATTGTC
+TGGCTGTATAGCTAGAGCTTCTCCAATGCGGCAGCCATTTAAGCTCATAAATTCTGCCAG
+ATAAGCCATTTTAATCGATCCTTTACGTCTATACATTTCATCTAATAGCCTTTTGAGTTC
+ATCTTTTTCTAAAAACTTCTGGGCAACGTCTTCAAAGTCTTTGATGGTCTTAACAGGTTT
+TGCGAGTTGGGTACTAATAACTGGATTGATTGAGACATACTCTAAAGCGATAGCGTAGTC
+GAAGGTTTGTTTGAGCAGCTGCCGTGCTCGTTTACGTTTGTCATAACTACCTGGTATTTT
+GTCGATAATACTTTGCAGGTATTTCGTGGTTATCTTGGCAATCATCACTTCTGGATCAAT
+TAAGTTTCGCAATTCTCTTATTCTAAAATCAAGAGAGCGGACAGAAGTTGATTTGAGTGA
+TTTCTGATGATGTTCCCACCATTCGTTCATGACATCTAGTAGGTAGGCATCGGTTGTGGT
+AAGACTTGTTAAGATTTTAGATATTTTTTCGTCAAGATATTTTTGGGCTTCTTTTCGTAT
+TCGTGGCGTGTCTTTTTCCATAAGGACAGAAGCTCTGCACCACTTGCCAGTGTATGGGTG
+TTTGTACCGTTCTACAAAATTTACTTTTCCGCTTTTGTGTTTTTCTGACCACATTGTTTT
+TTACCTCATTTTCTGTTAAAATAGGTATAGTAAAGAGACCTACGGCAAAGCAGGTTTTTA
+CTATACTAGATTTGCCTCGCGCTCAGAGTCGCCAAACTTTGAGAGCGTGGGGCTTTTTTA
+TTTTTCTAAAACAAAAAAGAGCACTTATTCGAAAACAGGCGCTCACAGTGGAGTTGGACA
+CTCCAAAATAATGTTTCAGTGGTAGCGAGGCTACCAAGATTACACCTTAATTCTAACATA
+GTGATATTTAATTGTCAAGTTTCCCCCACTGGCCAGATAATAACTGCCTTGCGAGAGCTT
+TATCAATGTTGTCCATGATTTCTTTAGACAATGTTATTTTTCCGACAGGGTCAAGATCGT
+TAATTGGTTTAGCGATTTTTAGTTTACTGACAGAAGTGATTGAGTCCAGCTTGGCGTAGG
+ACACCTTGTCATAATTTGCATATCTTTTTTTGAGGAAGTTAATTTTGTCTAAGTCTGATT
+GTATCCATTTTCGGACGGTAATGTTTGCTACGGGGACATGAATCCCTTTAGGGTCATTCC
+TATTGTAATATTTCATCCATATATCATGATATTTATTTTCTTTTTTAATCTGAAAAAACG
+CTGGGGGAACTGGTAACGAGTGGTGTATCCGTTCTACTTCAGTTGTTAGGTTTAGCACAT
+TTTGAACTGTTTGAACTGTTTTTTCGGCATCATCCATTATGCTCGTAAAAATCTCTTTGT
+TAATTGACAGACTCTCTTTAGAGTTTTTTGATGTTAGCGGTAAGATAGTTAGCTTTCCGT
+TATTGGGATGATCTTTTTTATTCAGCACAATCCCAAAGTGCGAATCGGAAAATTCATTGC
+CGATATTTACTCCAAAATGAATAAAGACGATAGTTCCTCGTTTGTATCTCTGATATTTTT
+GAGATTTAATTAAGTTTTCTGTTTTAAAAATTTTAGCGCGCTCGAGTTCTTGTCTTGATA
+ATTTGTAAAATTTGGGATTTTTCGGATTATCAGAGATATTCAACAGAATTTTCTTGCTAC
+GGCTTAAATTTTGTTTATTCAATGCTTTACTATCCATTTCTGCTCCTGCCTATCTCTCCC
+TATAACTCCCCATAACTTCACCAATAATCCTAAAGTCGCTATCTCTATCTATCGGTATAT
+CTGGATAATCACCGCATTGATTTAAACTGTGTAAAAACGCCCCCTTGTCATTTATAAGTA
+GCTGTTTGATATAAGCGTCACCATAGTATTCAAAGACGCCTATATCGCCATCTGTAAGCT
+CTACGGATAGCTTAACAAATACATAATCCCCAGAGTGATACTTCGGTTCCATGGAATCAC
+CATAAACAGGGATAACAAAGTCTGCGTCATAATCGACTGGTAATTCAATTGTTTCTACTT
+GTACATCATTTAGATACTGACCTGTACCAGCTGAAGCTGCGTGGTCGTAGTAATTGTAGG
+TGTAGTAGGTGGCTTGTGGTTCTTCTACTGTGTTTTGTTGTTCTAATTGTGTTTCGGCAT
+AATCAAGCACGTTTAGTTGTCGCTTGTGTTCTAATTGAGAAGAAGTAGAGTTTATTTTTT
+GTAGGGTAGATGGGATGAGTTCAACTTGGGGGGCGGTGGGAGTGGGATTATCTCCAAACA
+TCATTTTCTTAGGCTCTACACCGAAGAATTTTGCTATCTCTTCAATCTCATATATTTTAG
+GAGAACGCGTCCCTTTTTCCCATTTTGATATTGTCGACTTTGTTTTTCCAACTTCTTCTG
+CCAACTGTTCCATGGTCAAATTCTTACTAAGTCTAAGTTCTTTGACCATTGCCGGAAATG
+CAATAGTGGAAGCCATATAAATTCTCCTTTTTATAGCTTATTTATCTACATTATAATTAC
+ATGTTTACAAAATGTCAACAAAAATGGCAAATAATCAAATCCAAAAAAGTTGACATTTTT
+AACACAAAATAGTTGACAAAAAGGAAACTCGGAGTTATACTATAATCAAGCTTAAGGAAT
+TAAGCAAAACGAAAGGAGGTACAAAATGAATTGGAAAAAACTAATGTTTGGCGATTTAGA
+ACACACGTTTACTAATCATGATGGCAAAGAAAAAACAAGCATCGAATTTGAAGGTGGAGT
+TTTACCAGCTCTGTTAGTGTTGGGCGGTATTGCTTGGATGATCGCTTGGTTTATTACAAA
+ATAAAAACTCCCAAGAGGGAGTGGAAAGGAGGAAAATATGATATTCATAGCAATAATTCT
+ATCTGTATTAATATCGTTTCTGGTATCACTGGTTATGATGAAATGGCATATATGGAATGC
+CAATAAATTACTGAATAAATATTTCGATATTGAACAATCAAATATAGAGAAGTTTTCAAA
+ATCTATTCTAGACAAACTGAAATAAATTTTTTTCCGAAATCTGTTAAGGAGACCTTTCCT
+TTTTCAATCTTAATATCATATTTTGTGTTTGATGTTTTGAATAAATTAAGAGTGTTAATT
+TCACTTTCAAGAGATTTGTAAATTGTTGTTTGTTTAATTGATTCATAATTTGAATCCAAT
+GGATAATGAAGATAATCAACTTTGATTAGCCCTAATCTGGTTAAATTATCAATAGAAGAA
+GCAATAATATCTGGTGAGTAATCTAACTTTGATAAGTATATATTATTTGCCTTGTTAACG
+GTTCCTGAAAGGTTTTCTTTACTGTAGTGTACTCCTATTTGTAGATTTGCAATGAGATTA
+TTTCCCTCTTGATTTATCAATAATAGATTTTGTGCATCAAGTGGTGTCATTTGTTTGATG
+ATTTGAACAAAAGCTGAGTGAAGATCCTTTTCTTTGTCCTGATTAAATGTTGAAGCTATC
+GTTCTAGCGAACATATTTCTAAGTGTTTCGTTACTTAAATATTGCTCTGACTCATTTATC
+GCAGGATATAAGATATACTCAACGGGTTCTTTTAAACTAGTTTGCGGTATTTTAGAAAAT
+TCGCAATCAATCTCATTTTTGAATTTTTCTTGATTTTCTAATTTTCTTTTTTCAATCTCA
+TAGATGTATTCATTTTCAATCTCTTTTAATTTTGCTTTTCGCTCAGTTAGGTATCCATAT
+TTTGAATACCACATGTGGTTTAGCGATGTAAAGATAGGTTTCAGACCACCTTGGGTAATA
+AACAAACCAAAAGCACTAGAAGTCATTGGCCAATATGTTTCGATATTACTAAAATCAATC
+ATACTTTTTTTGCCTCACATTTTTATTTCAATTATACCACAGAAAGGGGGTGGGGGAGAA
+AATGGAGAAAATGAAAGCACCTAGCCTAGAAGTTAATCTACGGCTAGGCGAAAAGGAAAT
+CAAGGCAGTTGTTTCTGGATCAACTCATCAATCCTCTGAGCAATCAAAGGTTGAAGTTGA
+TGAGCAAAATCTTGAGAAATAGAAATCGAAAGCTCTTCTGTTAGTTCTTGCAGATTACTA
+AAACTGTCTAATTGTGGCAATTCAGAAGGTTCAAAAGTATTTGCAAGTTTTAAAACAACT
+TGACGGAAATCGCCGTCAAACTTTATGTTAATTTTTAATGGATCCATCACATTCACCTCC
+TTTCTGCTCACATTATAGCAGATTAGAGGTACTAAAAACAGATAGAAAGGAGGTGGGGGA
+ATGCAGGAAAATGCTTTCGAGCAATTAATTGATGATAGCGGAATTAAAAAGAAAGTTATC
+GCAACTAAAATGGGTTTTACGCGCTCTGGATTTTATCAGAAACGTAAAAAACCCAAAAAA
+TCATTCGATGCGTCAGAAGTGGCAATGCTAGCGGATATTTTAGGGGTAGACCCCGGAAAA
+GTCCTGGAAGCCATTTTAATTTCATAGAAAAGTTGACAAAAATAACACAACACTGGAAAG
+GACAATATGAATCAACTAATTAACGTAACACTAAACGAAAATCAAGAACCAGTTGTCAGT
+GGTCGTGATTTGCACAAAGTACTTGAAATTAAAACACAATATACAAAATGGCTTGAGCGA
+ATGAGCGAATATGGTTTCGTTGAAAACGAAGACTTCATGGCTATTAGTCAAAAAAGACTA
+ACAGCTCAGGGCAATCAAACAGAATATACAGACCACGTTCTAAAACTAGACATGGCAAAA
+GAAATAGCTATGCTTCAACGCAATGAAAAATCTAAAGAAGTCCGTAAATACTTCATCCAG
+GTTGAAAAAGATTTCAACAGTCCTGAGAAAATCATGGCAAGGGCGTTGCTGATGGCGGAC
+AAGAAAGTGCATAAATTAGAGGCTCAGATTGAGGCAGACCGTCCAAAGGTGCTATTTGCT
+GATGCCGTAAGTGCTAGCCATACCTCTATATTGGTCGGAGAACTTGCAAAGTTACTCAAG
+CAGAATGGGGTAAATATTGGAGCGACTCGTCTCTTCACTTGGCTTCGTAAACACGGCTAT
+CTTATCAAGCGTAATGGCCGAGATTGGAATATGCCTACTCAGAAAAGCGTAGAGCTTGGA
+CTTATAAGGGTCAAGGAAACTAGCATCACCCATTCTGATGGCCATATTACAGTAAGCAAG
+ACACCTCTGGTAACCGGAAAAGGTCAGCAATACTTTATCAACAAATTTCTTAATCAGGAA
+TATCTACCAGTTTAGAAACGTAACAAAACTAACGAAGGGAGAAAATATGGAAGAGAAAAA
+ATTTTTTACTACATATGAAATGGATCTGATGAATTCAGTTGTAACTCTTCAAAAATCAAT
+CTTAACGCAAACGGAACATTTGTCAGATCAACTAACAAAAAAGCTTCATCACCTAGAAGA
+CTACAATAGTCCGATTGATGATGAAGCAATTAGATTGGCTGAGGTAACAGCAGAATTTTA
+CAAGTTGTTAATCAAGTCTCCTAGTGTTGGAGCAACTGTCAAGGAGATTGTGAGCGAGGG
+ACATAAGCGTTAAGGCCGTAAGAGCGTCATTGAGATTATCTGGATTGTAGTATTTGAGTT
+TGTGAGCTTTAGAGTTGCGATAAAGGTGAGCGATTGCAAGTAGCAAATTTTTTAATCCCT
+TATACTCACTTTGTTCGTCTAGAGTCTGCAATTTATTACCGTTGATAATCACAATGGGTT
+CTCCGGGTTTGAAACATTGATCTATCAGACTAGCTGAGTCCATTGCTGAGCCCGTTAGCA
+GACGAATACGATGAAAAACACCTTTACTTGCTTCAAATACGGCATGAAAATAGTTTTCTT
+GTAAGAGCTCTTGAGTGCAGAATTTTAAAACGTGAGGGTGTACTTTTAATTCTTTTAATC
+TACTATCAAGTGTTTCGAAGCGTTTTTTGGCCTCTGATAAAGTTTTTGAAGTAGTAGTAG
+TAACAATTTGTCCGCTATCTGATACAATCAAACCTTTTAGCGAGAGCGGAATGTTAATGG
+CGGTTCTTAACTGTTCAAAAATTGAAACTTCATTAATGTATCTTAAAGGATTACAGACGT
+ATTCAATCACAAGTTTTATATTATCTGTATTCTGTGTCCTATTTAATATATCGGACACGA
+GATTGTGCACCCGTTTGTGCTTGTTAAATCCAGAATTTTGGTCGTTTTGGGGATAACCTA
+AAACTTCGCCCATTCGGGTTATTTCAGAATGCGAAACATAGTCAGATAGTATTTTACCGA
+TTGTATCAACGAATTGGGTGTCAATATTTAACATAACAAACCTCGTTTTTATTTAAATTA
+TACCACAGAAAGGAGAACCACATGAGACCAAAACGATATCCGTATAGCGGAGAGAAAAAG
+AGAGCCTATCATAAGATAGACCCTGAACTGATAAAAACCGGTAAAGTTGATTGCATCAAT
+CTCCCTTAAGTACGCCAAGCTCTAACAATGCATTTGTCATAGCTGCGATAGTAGATTTAG
+AGGTTGACTTAGAGACATACTCCAAAATATTAACGATATGCTGAGCTTGCTTTTGTGTAA
+TAGGTGCATTCATTTGATTAAGTTCCGCAACGACAAATTCAACTAATTGGTTGTCAACAT
+TGAAATTTTGGTTGATATGTTTTGAGACAACAGAAAGGAAGAAAAAAATCATTGAAATTT
+GATGATGTCGTTAAAATCGCCGATGTCTTAGGTGTCAGCTTGGACGAATTCAGATAACAA
+AAAAAGTCCGACGGCAATCGGACTCAAAACTAGATTAATTTACTTAATTATACCACAAGA
+GAGAGGATATTAATATGCCGCAGAAATTACTTATAGAGCAGTTGATGTTAATGAAACAGC
+TTCTCATGGTGATTATAAACACTTGATTCAACAATGGGAGGGGTTGACAGTTGCTACTGC
+AAAGCAGTGGGCGACAGAAATGCGTGATCATCCAGACTTTAAACAGTTTGTATTAAATCC
+AACGCATAGAATCGTATTCATTGATTACGAAGGATTCAAACTGTTTGTACAGTGGAAATC
+TCGCAATCGTTATAAAACAAAAAAAGAGACACTGTCAGAAATGCTTGAAAATATTAAATT
+CGAAAAAAGAGTAGGAGCATAACATGAACAAATTAGAACTATTTTTATTAGTAACAACGA
+TCATCTTAGCAATCATCACTAGAGTACAACACGAAGTCATTAAAAAACATAATTCGCCAG
+AGAATAAACGCAGAATTTTTAGAGAAGTGGCTTTAGAAAACAGCAAAGGGTGGAGCGAGA
+AGCGTTCTGGAGGAAAGGTGGTCAGCTGATGCAGTACATTTTTCAAAAATACGACAAGTA
+GCTATACATCCGTTAGCAACGAATTTATAGATGATTGTGAATTATCCCTAAAATCAAAAG
+GCCTGCTTATGGTAATTCTTAGAAATAAAGAAGATTGGAGAGTATATCCAGAGGAATTGG
+CTAGAAGGTCCAGAGATAGCGTGAGAGTTGTAAGGACTTGCTTAGAAGAATTAGAGAGAG
+TCGGATATGTGAGAACTTACAGAAAATCTTTAGGGCGAGGGAAAGGCATACAATATTATA
+GATTTTGCTCAGATAAAAAGATATCCGAACAAGCATTTAAAAAAATGATTAGTGATTTTA
+CAACTTAACGTTTTACAAAGTTGTATTTTACAAAGTTGTATTTTACAAAGTTGTAAAACG
+TAACACTAATAATTACTAACTTATAAATAAATACTAAATAACAATAAATACTAACAGATA
+ATAAGCATCATCATCAACATCAGGAGGAGCTATGGACGAAAAAAAGCTTTTTGAAAATTT
+CCAATTAACTTTTGGACGGATGATATCGCCATTTGAAATCGAAGATATTCAAAAGTGGAT
+TCACGAAGATAACATGCCAATTGAAGTTGTCAACCTTGCCTTAAGAGAAGCGGTAGAAAA
+CAACAAAATCAGTTGGAAGTATATCAATAAAATCTTAGTTGATTGGTATAAATCTGGAGA
+TACGACAGTAGAAAAGGTCAGAGACAGGTTGCAACGGTTTGACGATAGTAAAAAACAACG
+AAGTGTAACTACCTCAAACGTCCCAAGCTGGTCGAATCCAGACTACAAAGAACCAGATTT
+AGAAGAATTTGCTCTAGGAAGCATGGACGGTATAGAAGATGGATCAGGAGATTTTTAATT
+TTTTTAACAAACAAATCAAAAAAGATTTTGGTAAAACGGCGAGTAAAGAGACTTTTGCTA
+AGTTTGCTAGTTACTGCGCCGAAGGAATCGAAAAAAATGGAGTTAAGCCAATTTTTAATT
+GGATAAACCTATACGCTTTTGGAACTGGTATGACAACAGCAGAAGCAGACCGGTTGAGAA
+TAGAGCGATATAAACAGGAGAATGCGTTATGACAAAACAACATAGAGAAACACTTATCTG
+GTACCGAGCAAGTCATCAAGAGCGTGAGAGATTGCTTGATTTTGGACTAGTTGATAAAGC
+ACGGTACGTGACACTATTGCGGCAATTGCGTAAGAAATATGCGATTTAGGAGGAAATATG
+ACACCAGAACAAGTAGAAAAAGCAAAAATCAGAGCTAAACAAGAACTTGAAACGTTTAGC
+ATATACCTTGACCAGGCAGTTGATGAACTCGGTGGAGTTTTAACTTCGCGAGAAGTCTTT
+TTGGCAGCGGGATTCACCTACCTTGGCGCAGGTCAGACAGATATACATGCTGCAGTCGAG
+GGATTATGTGAGCAAATCCAATGATTTTAAATTTAGTGAAGACTGGGAGAGCAACTAAAA
+CACAAAAAGAGGAAATGAAATGAACATCAAAGAAAAAATTGTAGTGCTAAGAAACACTGA
+AGACGGAAGTTTTTTAAAGAGTTTCAAAAACAAAAAAGATGTACTTGCTTATAATGTGGA
+ACTTACAGATAGCATTCAACTGGCATCATTTTTACCAGAAGAAGCTTACAACATACAAAA
+AGAAAAAATTGATAATTTGGCAGAAACGCTTGGGTGTGATGTTGTAGTTATCGAAGCATC
+ATATGACCTAAAATTTGTTGATGGCGAGGATGTTCCAGAGTTAACAAAAGAGCAAAAAGT
+TAAAAGTATGGTAAACGGAATGTTTGAGCAGGTTTTTGGAGGTGAATAGAGATGGCAAAT
+CAATTATCAACACAACAAGTTAAACGTGATATCACAACTGATCCAACTTTGCTGACAGGA
+GCTGATATTAAAAAATATTTTGATCCTCAGAACTTGCTTAGCGAAAAACAAGTAGGGCAA
+GCTCTGGCTTTGTGTAAGGGGCGCAACCTTAATCCATTTGCAAACGAAGTTTATATTGTG
+GCCTATAAAAATAATAGCGGCACAGATTTCAGTTTGATTGTATCTAAAGAGGCATTTATG
+AAACGTGCTGAACGTTGTGAAGGATATGATGGATTCGAGGCTGGCATTACTGTTATGAGA
+AATGGTGAGATGGTTGAAATTGAGGGCTCTCTAAAACTACCTGATGATGTTTTGATAGGT
+GGATGGGCCATTGTTTACCGCAAAGACCGCTCACATCGATACAAAGTTACTGTTGACTTT
+AACGAATATGTCAAACTTGACAAATATGGTAATCCACGAAGTACTTGGAAATCAATGCCA
+GGAACAATGATTAGAAAAACAGCACTTGTTCAGACACTTAGAGAGGCTTTTCCTGATGAA
+CTCGGTAATATGTACACCGATATTGACGGTGGCGATACTTTTGATGCTATTAAAGATGTG
+ACTCCTCAGGAAACACAGGAAGAAGTCAGAGCACGGAAGATGGCACAGATTGAGCAGTAC
+AAGCAAGAACAGACTCAGAAACAAACTCAAAAAGCAGACACTAGCTATCCCGTTGATGAA
+GTGTCTGAACATACTGATGATCCAGTACAAGGAGAACTACTTGATGGAGAACTGGAGTAT
+TAGGAGGAAACCATGCAAGAATTACAATTAAAAGTCACACAGGCACAAGTTGAAATTATT
+GATCGTGAAAAATTTGAACAAAACATCAACGAAGTTGTGGCAAAATACCAAAATTATGCA
+GTCACAGCTGGAACTATCAAAGATGACAAGCAAGTCCTAGCTGATCTACGCAAGCTCAAA
+AAACAGTTGTCTGATGAGCGTATCAAAGTAAAAAAGGAACTCTCAAAGCCTGCTGACGAC
+ATTGATGGATATATCAAACAGGCAAGCAAGCCACTAGATGACACGATTGACAAGATTGCA
+ACTGATGTCAAAGAATTCGAAGACCATCAAAAAGCGCTGCGATTAGATACAGTAAAGAGC
+TACTTGTCTAATAAGGCATCCGAGTATATGCTTGACCCCCGTATTTTTGACGAAAAAGCT
+ATGGAGTACACCAAAGCTGGCAATTTTATGGCGGACGGTGTAACCCTCAAAAAAGTCACC
+ATGAAATCTCTTGAGGACTTGGTTACCTTTGAATATCAAAAGGAGCAAGAGGTCGAAAAA
+GCAAAAGCTACCATCTCAGGACAATGTGCTGAGTATGGTATGACTGACCAACCTTACATC
+CGTATGCTAAAAGAGATGACGCTTGTAGAGGTGCTAGGTCAGATTAAAGCTGATTATCTC
+GCTGAAAAGCAAAAGTAGGAAATGCGAAAAGCCGAGGAGGAAAGAGAGCAACTTTTAGCA
+GCTCAGCAAACTAAAGAACAAGAACAGGCTCAGAAATCAGCAGAAATACCACAAATCGAC
+AAGGAAACAGGCGAAATCTTGGATGGTTGGCAATTATCCCAAAACAACCAAGAAACGCTC
+ACAGGAGCTGAAAACGAGTTTAAAAAGTACAATCAAAAAATGACACTTGAGGTGTACTTT
+GAAGATACGGCTGAAAAAGACCGTTTCAAGACCGGTCTAACTCAGCTAGGTTTTGATTTT
+AAAAAAAATTATCAAGTCAGCGGTTATCAAAATATAGAGCCTCTTACTCAAGCTGAATTG
+GCTCGGCGGTGCGGATGGTAAATAAAAAATAGTTTTTTAACAACCTATTGCAAAGTGAAG
+CTCAGCCTTTGCAGTATCAATATTTTCCGAGTGAGAAAGGAAAGTTGGAATATCGTCAAG
+TTAACAGGATTGATGATATAAAAAATTGCTACACTCGTCCTTGCCAATGCTCACACACAA
+TTTTAGGGCGAGTGTGGATTTTAAAAGGTGAGAAATATGGAACAAATCAAAATTACAGAA
+ACAGGAATGGTCGTTATAAGCGATAAAGCACTCAAAACTTTTGTGATTGCAGGACATTTA
+TCGGAGAGGTGGGAATTTACCTCTAAATTTAAAAAATTAGATGAGCCATCACTTGATGAA
+AACGGAGATTTGTTTGAGCCTGTATACGAGTTGATGCTTGAAGCCAGGTCGAAGGGACAA
+ATTAGCATAACATCATCATATTGTGGCAAAAATCACAAAAAAGACACAGACGAAATCATA
+AAAGTATTCTCGTTTATCGAAGATAACAAGAGAAATATTTTTGAAAACCTTGGTATTCGT
+GGGGTGCTTGAATGAGCAATCTAGTTTTATCGTTAGACATCTCAACATCTGGAACAGGGT
+GGGCCTTATTTAAAGGCTCAGACCTTATCCAGAGTGGTGTCTTAAAACATAAGAGTAAAT
+CCTACTTTGAGCGCGGACGCTATATGGCTAGCCAATTAGGACTAATCCAGTCACGAGCAT
+TAAAAAAATACGATTGCTATTTTAGTACAATCGCAGTCGAAAAAAATTCAGTTATGGGAC
+CTAACCAGCAATCCATGCTTAAAATCGGTATTGTTACAGGAATTATCTTAGGAAGATTAA
+TAGCTGATAACGTCGCCTTTATAAATGTATCAACGTGGCGTAAGCACTGGAAGTTTAGCT
+ACAAAGACCGCTCTAAAAAAGCGATGAAAGCACAATCGAAAGAAAAAGCTCTCGAATATT
+GCGGAAAAACAGTAAAAGATGATGAAGCGGATGCTATTTTGATTGGCTCATACTATGTCA
+ATCAAGGCTATCTTGATGAATTGGAGACACATGACTACTACTAAAAAACACGTTGTGAGA
+GTTTACAACAAAGGTATTACAGCGACTTACGCGATCTATGACAAAAAACTGTTTAAGGAG
+CACGAGTTCGCAACCAAAAACGAAGCGATGCGGTTTATTAGACAGCTAGAGTTAGCTAAT
+GATAAGCGAGCGACAGAATATTATTTGAGAGAGGTAGAGAAATGATACCAAATTTTAGAG
+GGTTTAACAAAAAAACTAAAAAAATGTATAGCATTGATGGCTTTAAATCAAGTGAACGCA
+AAATATACAGATGCAGCTTAGCAGATGATGAGTTTCGCTCTGGTCGCTTAGAGACATTCC
+ATTTTGTAGAGGATAATCTTGTGGAAAAGTGCAACAGACCACCTGAACGATTTTATCGAC
+AAAAACAAGTACGCAAAAGTGACAGGCGACTTATGGCAAGGCAGTGATCAAGTCATTGCT
+GAGCAGTGTTTTTTAAAAGTATTAGAGGAGATGCAAAAATGAATATAGAAGAAGCGAAAG
+AATTAGTAGATAATTCAAAATTTTATGGAAAGACTAGCAGTGTTATAAAAGCCGAGGTTC
+GCGACATTATAGACCAGTTAAACCAACCAAAACCAGAAGTACCGCAGTGTGTGGCGGATT
+GGATAGAAGAGTGCAAAGAAGAAGATTTAACTTTAAAAGGCTTGTTTTCTAACAGCGATA
+TGCCTGCAAAAATTTTTGATTGGATTTTTGGTAGTGACGAAAATTGTAGGTTAATGGCTG
+AAGCATGGATTAACGGCTACACAGTAGAAAAAGAAAAGCTCTACACTGTCGACTTACCAA
+ACGGTCAACCTTTAGTGCGCGGCATAAACACTTTGTATTTTAGTCAAAATCTAGCAACCG
+AAAATGTAAAACTCACCGAATCCGAAATCCGCAAAGATTTTGAATGGGCGTGGCAGTTTG
+CTGAAGAGGTGACTGAATGACTGAAGAGTTAGGAGTGTTATATAGCGAAAAATGGCATAA
+GTATTATTTATATAAAACTTGCAGGTATATATCTTATGTTGATAATCCACATCAGGCTAC
+TAAATGCACCCGCAAACAAGCAGAACAGTTTCCACAGTTTAAATGGGTATCGCTGACAAA
+ATTATAACCCCACGCAAGCGCTCAAGAGCCTGCGATGGCTCTGTGGGGGTGGACCGAAAT
+TAAAAAATAGAAACGAGAACCTCCTTACACCAAAACAAATCTAAAGCGGGTTATCGGTCA
+TCCGTGATTATCCAAGGCGTCGCTAATGCTTTAACACGACATCGTGCGCCTGTGTCAAAA
+AACAAAGGAAAGAGAGGACTTTTCTCCACAAAACAAAAAGACGTCCATACGGAACGCCCC
+CTTGGTTAAATTTAAGCTTAAATAAATTATACCACATTGGGGGGCTTTCATGACGTTTTT
+TCCTGAGATTGATATCCAAAAAACAAAATCCAACGCCAAGCGTAAATTGAGAGAGTATCC
+ACGCTGGCGGAGGATAGCTAATGATGTAGATACTCAAAAAGTTACAGCTACTTACTCCTT
+TGAGCCAAGACAACCGCATGGAACGCCAAGCAAGCCTGTTGAGAGACTAGCGCTCAACCG
+TGTGTCGGCAGAACAGGAGCTGGATACGATTGAGAGAGCAGTCAACGGGATATTTGATCC
+AGAGTATAGATTGATACTGATTGACAAGTATTTGCTCACATATCCAAAGACTGATTGTGA
+TATTTATACAAAACTTGGTTATGAAAAAAGCCAGTATTACAACATGCTAGATAATGCTTT
+GTTGTCGTTCTCAGAGCTATATAAAGAGGGAATGTTGCTTGTCGAAAAATTGGAAAAAAG
+CTGGAATTAATATGGAATAATTATGTACTTTATATATAATTATTCATGTTATTATAGTAC
+TATCAAAATAACAAGAAGAGATAACCTTTTAATCAATTGGCTATTTATTTAGTCGCCAAC
+TTTAACTACAATCAAACTTGTTATTTTGTAGCCTGATGGCGGTACAGCGAGTTGAGACGA
+CAACTGGGTATGCAGGTTCGATTCCGACTGTTCCTGTTGCATTTAATGCAAACTCCATAT
+TTTTATTAAAAAGCCTATTATACCTATTGTGTAAGGGCTTTTTTAATAGTATTATTAAAG
+TGATAAAAAATATGGAGATAAAATATGGAAAACAAACCCGCAAAAGCAAGTTTCTTTAAA
+TTAAGTTCTTCTAAAGAATCTAATTTAAAATTGTTTATCGAAAAGATGGAGGAAATGTTT
+GATAATTTTAGAAAAAAACAATATAGTAACATTCCAACATTAGAGATAAATGATCTTATG
+TATTATATAAATGCAATGCAGAAGGTAACAAGTGAAGAAGAATTAAATGGAACGAATCTA
+TTTTATTGGTTAGTCACCATTTCACGGGTGGACACAGAATCTCCAATTATTCTTGCGAAT
+CTTGAAAAAAATATTGATGTAAGAAAAAGGGAAATTGAACATGGGGATAATGAGGGCCTT
+GTGGTTGATACAAGATTATTATTTGATCCATTTAGACAAATTTTAGTTGTTTATAATCAA
+AGAGGTACAATTAATAATTACGACTTAAGAAGGTTTTTTTGTCAAATAATTGGAGTTAGA
+GGATTGAAGTTTGATATTATATTAAACAGTGATGCTTTCAAAAGGGTTGGTAAGCTTGAC
+GTTGTAAATTCAATTAGTTATACTGTTGCAAGCCCAACAAACTTTAAGGAGTTTCGAGAT
+GATACTCAAAGTGAAAATGCCGATTTAAAGTTTGCAAATTCTATGCTAGGAGAGTCAATG
+CAGGTTGTTATAAAGTCAAACCATCTTTCTAAAAAAAATATATTTGATAAATTTTCAGAT
+ATGTTAGTTAATGACTCAGTTAATGTAAAAAATGCTAAAGTTGAAGGTTTTACCGATGGT
+CATCCGGAATTAATAGACTTAATAAAAAATAAATTGGAATATAAGGGAACTATTTTTTAT
+GAAAATACTTTAGACGATGAGGCTGTTTATGCATTTCTGAATACCGCGTATAGCTTTCAT
+TTTAGTCATTTAAAAAGAATGTTTACTATAACTTTATAACTTATATTGAGGTATGCGATG
+AAAAAAGGAAGGTTTAAAAGAAACTGGCCGATTATACTATTTGGTATAATAGTTTTTATA
+TTTAGTTTTTATTTTAAAATTTCTCCAAAAAGTTTAAAAAATTTTACTGATATAATGTCG
+GCATCTCTATCATTTTCAGCAATTGTAACCGCAATATTCTTTGCTAGTTTTTCATTGATA
+CCAACTTCCGGTTCTAATAAATTAGTAGTGATGATGGAAGATTTAGGGACAGAGATAAAA
+ATAATGGACCGCCTATTAGTTGCTACTTTTTTATCTTTCATTAGTTCTTTATTATCTTTT
+ATTTCTCTATTCTTTAGTAAGACTGATACTGATTTAATTTCAATTTTAGTAGTTTCAAGT
+TGGTTGAGCTCAACAGTAATGATGTTCCTAAGTTCGTTCTTTGTGCTAAGAACATTAATT
+TTGTTAGTTGAAACTTATAATAATTTCAAAAATAAATAGGTCATCACATTGTGGTGGCTT
+TTTATTATGGATTGGAGGTGGTGGAAAATCGCATACGAGGAATTAACCGAAAAACAACAG
+CGTTTTGTGGATAAGTACATCACCACATTTAACGCTACTGAGTCTGCAAAACAAGCTGGA
+TATTCTGAAAAAAGCGCTTATAGCCAAGGTCAACGCTTGTTGAAAAATGTTGAAATTCAA
+AAAGCAATGAAGGAACGTTTTTTGGAGGCAAAAGATACTAAAGGAGACCGTATTCAAGAT
+GTTGCAGAAACGTTGGAACAAGATACATCGATAGCCCGTGGAGAAATCCAAATATCTGAA
+TTCAAAGAAACAGATATGCTGACAGGTCAAGTGGTTATCCACACGAAAAGAGAATATACC
+CCAAGTCACGAAGAACAGGGTAGGGCTAGGGATAGAATTTATAAAGTTAATGGAGCTTAC
+TCAGAAAAACGTGAATTAGAGCATTCTGGAACGGTGGTGTTTGCAAATGAAGACAACATC
+CCTGATTAAAGTAGATTTGCCATCAACAATCGGTATAGGTTATGGCGCTTTTTGGCGGTC
+TAGAAATTTTTATCGAGTAGTTAAAGGCAGCCGTGGATCTAAAAAATCTAAAACGACTGC
+TTTAAATTTTATCGTCAGACTGCTGAAGTACCCTTGGGCTAACTTATTGGTCATCCGTAG
+ATACTCAAACACTAACAAACAATCTACTTATACCGATTTTAAATGGGCGTGTAATCAATT
+AAAGGTTACACACCTTTTTAAGTTTAATGAGAGTTTGCCAGAAATAACTGTAAAGGCAAC
+GGGCCAAAAGATACTGTTCCGTGGACTTGATGATGAGTTAAAAATCACATCTATTACTGT
+CGATGTTGGCGCTTTGTGCTGGGCTTGGTTTGAAGAGGCTTATCAAATTGAGACCGAAGA
+TAAGTTTTCAACAGTTGTCGAATCAATCCGCGGTAGTTTAGATGCTCCTGATTTTTTTAA
+ACAGATAACAGTCACGTTTAACCCGTGGTCAGAAAGACATTGGCTTAAACGTGTCTTTTT
+TGATGAAGAAACTAAACGGGCTGATACATTTTCTGGGACTACAACATTTAGAGTAAACGA
+ATGGCTTGATGATGTCGATAAAAGACGCTACGAAGATTTGTACAAGACTAATCCAAGGCG
+GGCTAGAATCGTGTGCGATGGTGAATGGGGCGTTGCTGAAGGTCTTGTTTTTGATAACTT
+TGAAGTCGTAGATTTTGATGTTGAAAAAACAATTCAACGCGTTAAAGAGACCTCGGCCGG
+TATGGACTTTGGGTTTACTCAAGACCCTACAACTCTTATATGTGTTGCAGTTGACCTCGC
+AAACAAAGAGTTATGGCTTTACAACGAACATTATCAAAAGGCTATGTTAACAGATCATAT
+TGTCAAAATGATAAGAGATAAAAACTTGCATAGGTCTTACATCGCAGGGGATAGCGCCGA
+AAAACGCCTCATTGCAGAAATAAAAAGTAAAGGGGTGTCTGGAATTGTCCCGAGTATTAA
+AGGTAAAGGGTCAATCATGCAAGGGATTCAATTCATGCAGGGGTTTAAGATATATATTCA
+CCCATCTTGCGAACACACAATAGAAGAGTTTAATACTTACACTTTTAAGCAAGACAAAGA
+AGGTAATTGGTTAAACGAACCGATAGATAAGAATAACCACGTTATTGATGCGATTAGATA
+TGCGCTTGAAAAATACCATATCAGAAGCAACGAGTCAAATCAGTTTGAAGTTCTTAGGGC
+TGGTTTTGGTTACTAGAAAGGAAAATAATGTACACAGAATCATTTAGAGATAGTACGGGA
+AAGACTAAAACATTAGAGTTTAGGTTCCACCGTGAAGCTCGCATGAGGTATCAAGCGGAA
+AGTCTAGAAAGCTTGTTAACCGAAAAATATAAGCTACTCCGTGAAATGATTGAACACCAC
+GATAAAGTCCAAAAACCACGCATACAAGAGCTTCTAGATTATGCAGAGGGAAATAACCAC
+ACCATCAGCGAAATAGGCCGTAGGAAAGACGATGACATGGCTGATGTTCGTGCTGTGCAT
+AACTATGGTAAGTATATTTCAACGCTCAAACAGGGCTATTTGGTGGGTAATCCTATTCGT
+GTAGAGTATATTGATGGTACCGAGCAGTAGCAAGACCTATTAAAGGACCTATCTGTTAAA
+AACAATTTCCACCAGCTGAACCGCAGATTAGTAAAAGACCTATCCAAGGTTGGTCGAGCG
+TTTGAATTGATTTATCGCAGCATGGATGACAAGACAGAGGTCGTTAGACTAGATCCACGG
+GAAGTATTTGTTATCTATCAAAATAACCTAGAGCAATCAAGCTTAGCTGGTGTGCGGTAC
+TATAACAAAAATCAATTAGATGGTACTACAAAAATTGTCGAGCTTTACACCGATAATAAA
+ATCCTGAAGTTTGAATATGATGGTGATTTAACACCTATCGGAGAGACTTCCTCTCATGCG
+TTTGGTTCGGTGCCAATCACGGAGTACCTCAACACAGATGACGGCATGGGTGACTACGAG
+ACAGAGTTGTCTTTAATCGACTTGTATGATGCAGCGCAGTCTGACACAGCTAACTACATG
+CAGGATTTGTCAGACGCGATTCTGGCAATCATTGGTCGTGTATCATTCCCTGGCTATGTC
+GACACTGCCGAAAAAGCCATTGAATACTTACGTAAGATGCGTAAAGCTAGATTACTTAAC
+TTAGAGCCTCCTGTCGACCAAGACGGGCGTGAGGGATCTGTAGATGCCAAATATCTATAT
+AAACAATATGACGTACAAGGAACCGAAGCCTATAAAAATCGTATTGTGTCCGACATCCAT
+AAATTTACCAATACGCCAGACATGACAGACAGTAAGTTTGCCGGTCAACAATCTGGCGAG
+GCGTTGAAATGGAAGGTGTTTGGACTTGACCAGGAACGTGTAGATATGCAAGCTTTATTT
+GAGCAATCTCTTAAACGTAGGTACAAACTAATCGCTCGTGTAAGCCAACTGCTTAAAGAG
+ATTGATGACTTTGACATCAGCAAGCTTAAAATCACATTTACGCCAAACCTACCTAAGTCG
+CTACAAGAAAAGATTGAAGCCTTTAAAGCATTGGGTGGAGAGTTGTCGCAAGAGACAGCT
+ATGGCTATTACAGACATCGTGGAAGATGCTAAGAAAGAAATTAGCCTTATCAACAGCGAG
+TCGAAATCACGTAGTCAACTAGCGCAGAAGTTAGAAGAAACCAGTAGATTGACTGATAGG
+GAGTTAGCTCATGACCACCAGAAAGAGTAAATACTGGCGTGACCGTATCAAGAAAGAAAT
+GGATGCTAAAGAGGCAGACGATATCTCTCTTGAGCAATCCATGAAGCAATTGCACGATTA
+TCATTTCAGGAATATCGAAAAAGAAATTGAGTCGTTTTATCAACGTTATGCTGACAAAGA
+GAAAATAGACCTTTCAGAAGCCCGTAAGAGAGCTTCTGAGCTTGATATTTCTGCTTACCA
+GAAGAAAGCTAAGGAACTTGTTGCAAAGGCTGAGAAACTACGAAGAGAAGGTAAGATAGT
+AACAAGAGATGACTTTACCCACCAAGAAAATGCAGACATGTCTATTTACAACTTAGCCAT
+GAAAACGAATGCTTTGGAACTATTGCGCTTAAACATTGATTTAGAAATGCAAGAACTTGC
+CAACGGCGAACACAAGCTAACCAAGAAATTTCTTGATGAAGGCTATCGCAAAGAAACCGA
+GTTTCAAGCTGGGCTATTAGGATTATCAGTTGCTAGCCAAGCGAGTGTGAAAAGCTTAGC
+TGATGCCGTTATTAATGCTAATTTCAAAGGAGCAAAATGGTCAGATAACATTTGGGACAG
+ACAAGATAAGTTACGTAGCATCATATCTCAAAGCGTCCAAAGTGCTATCCTAAAAGGTAA
+AAATGGCTTAACTATTGCAAGGGATATCAGACGAGAATTTGATGTGTCAGCGTCTTACGC
+AAAGCGACTAGCGATAACGGAGCATGCAAGGGTTCAGATGGAAGTTGGTAGATTATCCAT
+GGCGGAGAATGGCTTTGCTATGTTTGATATATTGCCTGAGCCTAAAGCATGTGATGTTTG
+CAAGGATATAGCTAAGCATGGTCCATATCACCTTGACAAGTGGAGAATAGGGGAAAACTC
+TCCGCCGTTTCATCCGTATTGTCGTTGTGCGATTGTAGGGGTAGATGAAAGTGGTGTTGC
+AACAGACAGGCAATTGGACTATAATCGAAACATGAACAATATTGATTTGATGGCTAAAAC
+TCAATCTTTTATCATTAACAAAGATGTCCGAGTAAGTGCCAAGAAAGTTGTCGGCACAAG
+ATATGATTTTTGGGCGCAAGATAATACCAAAAAAATTAGAGATACGATTCAAAGTGTTGG
+AGAGCACTTAGACAACTTAGAAGGGTATAGCATTCCTAAAATTGTATTTGTTAAAAAAGC
+TAAGCTCCAAGGCTGGGCGGGATATGATTATAAACAAGACACTTTGTTTATAAGTGATTT
+GTTGAATTCAAAAGCCGCTGTGAGTGATATGCTGCTGGATAACTACTTTGCGGCTGTCGA
+CTTAAACGGTATTCTAGTGCATGAGTTAACCCACAAAAAACATTGGGATACTGCTAAACA
+ATTTTACAAACATAATAAAAAGCGTTATAATACACTTGAAGAGGCAAAAAATGCACTTGA
+TTCGTCTCTAGTTTCCTATATTAAAGAACAAAAGCAATCTGATTATAATTATTTATATAA
+AATAAGCGAGTATGCTGATGTTGCTAGTTTACAAGGGAAATATAACGAAGTTATAGCCGA
+GGCAATGACTGCGGGAGATAAATTATCAGATCCGCTATTGTTAGAAAAAATAAAGGAGGT
+ATTCAGATGGAAATGATGTCAAGACCGACTCAAGAAGTGCTAACGTTTTCTAAAATCATC
+CGCCGATGGATTGTAGGCGATGAAACCATTGGCGGCAAGAAAAAATTCATTTTCAGAGAT
+GATACTCCGGAAGATGTTTTAGAGCTATATCAAAAAATAAAAAATAAGTTAGATTTTGCA
+TATTAATTAAGCGCTTAGCTATTATAGTTAAGTGCTTTTCTTATGCTTAAAAACAGGAGG
+AAAACGTGAATAAACGAATCAAGAAAAAACATAAATTGGAAACAGCAGTTGTGTTGCTTA
+TCGCAGAAAATGCTATGCAGGCTGAAGCTATTAAGAATCAAAACAGACAAATTGCAGAGC
+TGAGATCGATTATACAACAAAACGCCCAAGCAATAAATAGAGAGTTTGCAGCAGTTAAAG
+GTGTGTGTCTTGATAATCAAGCAGCTATTACAAACATTGCAGTTGATATTAACTACGTCA
+AGAAAAACTACAAACGGAAGTGGGGGAAGAAATAGGCTTTTTCATATTTTTAAAAATTTT
+TTAAAAATCGCTTGACAAATGTCGACAATAGTTTTATTATACTTATGTCGGCAAAAGTGA
+GGTGATGAACTTGACTGACAAAAAGAAAATGGGGCGACCTACTAGCGACCCTAAGACTGT
+TAAATTGACTGTTAGAATTAACGAGGATACGAACAAAACTTTGGAAGAATATTGTAAGAA
+TAATAATGTTTCCAAAGCTGACGGTGTTAGAGAAGCTATTAGTCGTCTGAAATAACAAAT
+ACCGTCTAGCTCTCGGTCGGCAAACTTGCGAGCTAAACGGTATCACCACAGAAGTGTTTC
+TGCATGAAATATTATATCATGTAGAGACGCTCTTTTCAAGATACACGAAGGAGTGTTTTT
+ATTATGGCGAAAATTGATATTATTGATAATTATGAGACATTGCTAATTAGTGTCGAAGAA
+ATTAGAGCAAGTTTGGAATCCTTGCATGCCTGGCTGGATAAAGACATTGATTGGGATAGT
+CAGTGTGATTGGTACGATTTTATTTCTCAACACAGTTCCCAAATTGCGATTCTAAACTTG
+ATTATGTACCGTTTAGACAGTTTAGAAGTGGAACACAGAAGCGTTATCGAAAACACAATG
+AAAGGTAAATAATATGGAATTACAAGTATTTACTAATGAACAGTTTGGAGAAGTGCGTAC
+AGCGACAATCAACAATCAAATTTATTTCAATCTTAACGATTGTTGTCAGATTTTGGAATT
+AAGCAATCCTCGTAAAACAATTGAAAGACTTAATAAAGATGGTGTAACTACTAGTGACAT
+CATCGACAGTCTTGGTCGAACTCAACAAGCCAACTTCATCAACGAAAGCAACTTCTACAA
+GCTAGTCTTCCAATCTCGCAAGCCAGAAGCTGAAAAGTTTGCGGACTGGGTAACATCGGA
+AGTCCTACCATCAATCCGCAAACATGGCGCATATATGACCGAACAGACTTTAGAGCAGGC
+GCTGACAAGCCCAGACTTCCTCATACGGCTTGCCAATGAGTTAAAAGAGGAAAAGGAGCG
+CAGTCGTCAGTTAGAGGCTGAGAAGTCAATTTTGAGCGTTGAGAACATGGTTATGAAGCC
+AAAGGCTGATTATTTTGATGATTTGGTTGACCGCAATTTATTGACTAGTTTCCGTGAAAC
+TGCTAAACAATTAAAAGTTAAGGAACGACGATTCATTCAATTTCTACTTGATAAGAAATA
+CGTTTACAGAGACAAGAAAGGTAAGCTTATGCCGTTTGCAGATAAAAATAACGGGTTATT
+TGAAGTCAAGGAAAGTGTTAACGAAAAGACCAACTGGGCAGGAACTCAAACCTTAATAAC
+TCCAAAAGGTCGTGAAACTTTTAGACTGTTATTTATTTAATTCACTTTAAAGTCGTAGCA
+ATACGGCTTTTTATTATGTCCAAGCATTGACGACGTAAAAAGCTATGGATTTTATAGTCG
+GGGACGACTTAAAACATAGGAGGTGCCAACCATGGCAGAAGAAACACAAACAGTTGAAAC
+GGTTGAAGAGCAAGTGGTACCAGAAGCAAAACAACCGCAAGACGAAAAAAAGTACACAGA
+TGCAGATGTGGACGCTATCATCGACAAAAAGTTTGCGAAGTGGAAGTCAGAACAAGAAGC
+GGAGAAATCGGAAGCTAAAAAAATGGCTAAGATGAATGAAAAAGAGAAAGCAGACTACGA
+AAAGCAGAAGCTGTTAGACGAATTGCAAGAGCTAAAAAACGATAAGACACGCAATGAGTT
+AACAGCAGTAGCTCGTCAAATGTTTGCAGAATCTGAAATCAACGTCAACGATGACGTACT
+TGGTTTAGTTGTGACTTTGGACGCAGAACAAACAAAAGCAAATGTAACAACGCTAGCAAA
+CGCATTTGCTAAAGTTATCGCTGATGACCGCAAGGCTCTTGTACGCCAGACTACTCCGTC
+AACAGGTGGTGGATTGAGCAAACAAACCAATTACGGTGCTAACTTGGCTAGTAAGGCAGC
+ACAACAAAGCACCAAACTTTTTTAGGAGGAAATTATGAATAAACGTAAAGTAACAACATC
+TAAAGAGATTCTACACAATCTCGACTATGAAGCTATTTCAGTAACTTTGGATTCAAACAA
+AATCGGCAAGAAAGTTGTTCCAGCTGGGACAATTTTGGCAGGCAAAGATAAATCCATTTT
+TGAAGACCGCAAACAGAAAGTAGAAACCGTGACAAATGAAGAAGTCTCTACAAAAGAATA
+TGTCGATGGTATTTTACTTACAGATGTCGATTTAACAAATGGCGATGCAGTCGGTTCCTG
+TGTTTATCGTGGGACTATCAATGCAGACAAGCTTGCTGATTCATCTGTTGCGGAAAATTA
+TGATGATTTGGAAGAAGTACTACCACACATTGTCTTTATCAAAGGAGGTAAATAAACATG
+GCATTGATCCACGAAATTATCACATCGGAAAATATCAAAGGTTTTTATAACGCTAAAAAC
+GAAAATGTTGAAAATACATTGGGAGAAAAAGCATTCCCGCCAAAACAACAACTGGGCCTT
+AAGTTGTCATTTATTAAAGGTGCAGCAGGAAAACCGGTTACTCTTAAAGCGGCCGCTTTT
+GACACTAAGGTGCCTCTACGTGACCGCATGGCTGTTGAATTGATTGACGAAGAAATGCCA
+TTCTTTAAAGAGGCTATGCTTGTTAAAGAGGCTGACCGTCAACAACTCAACATGTTAGCG
+CAAACTAAAAATAACGAACTTATCGACACCATCTTGGCATCTATCTACAATGACCAGGCT
+ACGCTTATTGCAGGTGCTAAAGCACGCCTTGAAGCAATGCGCATGGAAGTGTTATCTAAA
+GGTAAAATTCATATCCAGTCTAACGGCGTGATGAAAGACATCGACTATGGATTGGCCGAA
+GATCAAACGACCAAACCAGACGCCAAATGGGATAGCGCAGGAACAGCTACACCACTTAAA
+GACATTGAAAAGGCTATCGAAAAAATGGCAGAGCGTGGTTTTGTGCCAGAAGCTATCATC
+ATGAACTCTAAGACATTTAGTTTGATTAAAAACGCAGAGAGCACCTTAGATGTCGTGAAG
+CCTATGGCACCAAATGGGGCAGCGGTTACTAAACGTGACCTAAACACATATCTTGAAGAT
+GAACTACAAATCAAAGTCATCCTAAAAGATGGCATGTTTGTTGGTGATGATGGTGAATCT
+CGTAAATACTTCCCAGATGGTTTTGCAACATTAGTACCTAACGGCAACCTTGGCTACACT
+GTATTTGGCACAACTCCAGAACAGTCAGACTTGCTTGGTGGTGAAGCGACAGATGCAAAT
+GTCTCAATTGTCGAAACTGGTATCGCAATCACAACAACCAAGACAACTGATCCAGTAAAC
+GTCCAAACCAAGGTATCTATGATTGCCTTGCCATCATTTGAACGCTTGGAAGAAGTACAT
+ATTATTAATGGCTTGCAAGATGCATAAGGAGGTGCTTTATGGCCAAAGTTATTAAGACTT
+TTAGAGATAAAGTGACGACTAATGCTTATTATGTAGGCGATGATTACAAAGGAGATCGTA
+TCGAGGAATTGACAGCCAATGGTTACTTGGCCGGAAATACTCCTAAACTGGATACTGTCG
+AAGAAGTTGACCTAGATAAACTCAAAAGCGATGAAATCAAGGCAAAACTTGACGAATTGG
+GCATTGAGCACGATTCTAAGCTTAAAAAGGCGGAATTGTTGGAGCTTTTAAAAGCTAACA
+TTTAACGGAGGTGTTTATGGCAAATGTAAACACATTTAGCATTGTAAAAAATGTCAAGCT
+CGATTTAGGCATTGAGGACGACAATCAAGACCAGTTGTTGGAGATGTTGCTAAATCGTAT
+TACAGACCACTTCAAAGCAAATTATGGCGTGTTAGAAATTGACAATGCTTTTTCTTTTGT
+CTTGGAAGATTGTCTGATTGCTCGTTTTAACCGTAGAGGTTCAGAGCGTGCCAAAACAGA
+GGAAGTGGAAGGTCATAAAACAACCTACTACGACCATTTGAATGAGTTTGAACCCTACGA
+TGCCATGATTATGGCAAAGCTTAATTTAATCAAAGACAAATCTCGTAAAGGGGGACTGTA
+CTTTTTATGAGATATGCAGATAGAGTTACATTTGTTAAAACGACGGATGAGCAATACAAT
+CCCGATTTAGGTGAGTATACGCACACAGAGGTCATAAGTATCACAAAACCTTGTTTTGTG
+ATGGACATGGGCATGGAAAAGTCCGTACAGATTTTTGGAGATTATCAAAAGGATCGTAAA
+GTTATCTACCTAAAGCAGCCTTATACAAAAGCATTTGATTATTGCGAGTATGAGGGCAGG
+AGATACAAAACGCAGGCAAATAAGCTTGGCGCTATTGTTTTTTATCTGGAAGGAGATGAC
+TCTATTGGTGGCTGATATATCTTTAAAAGTAGTTGGAACAGCTGGTTTAAAAAAGAAACT
+TGAGCTTATTATCAAAAAAGATGCCGTCAAGAAGATTGTCAGAGACAATGGGACGCAGCT
+TCAAAGGAAAATGATTAATAAAGCGGTATTTACAAAAGGCTATTCAACAGGTGCAACTAG
+ACGTTCTATTACCATGCAAATCGGCGATGGTGGATTGAGTGTCAAGGTTAAACCAGGAAC
+TCATTATGCCGGCTACCTTGAAAGAGGAACTCGCCTTATGAGCAAACAACCGTTTGTTTT
+GCCAGCTCTAAAAGAGCAAAAAGTAAAATTTAGAAAAGATTTGGAGGCGCTTGTCAAATG
+ATTAAAACTAGAGATCAGTCTATTTTTGACGAAATGTTTAAACGCATCCAGTCTTTAGGT
+TTTAAGGTTTACGATTATAAACCGATGACGGAAGTTCCATATCCATTTGTGGAAATGGAA
+TCTACTGATGCGGAATATATTCCAAATAAAGATGACATTAAAGGTTCTGTTGAACTTATG
+TTGTCTGTTTGGGGGGTGCAGAAAAAACGGAAGCAGGTGTCTGACATGGCATCTGCTATT
+TTTTCGCAAGCTTTGACAGTAGAGAGTTCTGACGTTTTCCGCTGGTCATTAAATACTCGT
+CAATCATCTATTCAAATGTTAGATGACACAACAACTGTGACACCTCTTAAACGAGCGATT
+GTCACACTTAGATTTAATTTGAGATAGGAGGTAGAAATGCCAGAATCAGAAACATTATCC
+CCTGACATTCATACCAAAAGTCACGAAGATAGTCCAAATACTGTAAAAAAACAGGAGGAA
+GTAATGGAAACACAATTAGAAGCAAAACAAGGGATTCATTCAATCTTGTTATTTCGTTTG
+TTGAAAGAAGCATCTAGTGAGGCAGCAACTAAACTTGCTTTTCAAACAGAGCATGAAGTA
+GGTAAAAGCCGTGACGTAGATGGACAAAAAACTAAAGATGGTATTATCCAGTCCGTGGGG
+GCTTTGGAGTACGACTTTAAAGCAACATCTATTTTAGCTAAAGGTGACGTACTAGCAGCT
+AAACTAGAAAAAGCCATGGAGAATGGTGAGCTTGTAGAAATTTGGGATATTGATTTAGAA
+GAAACAAGCAAAAACGGCGACAGCGACAATAAGCTTGCAAACGTTTGGGGTATTGATAAA
+AATGGAACAAACAGAGGAAACGGTAAATACCTAGCGACTTATTACCAAGGGTACATCTCA
+AGCTTCAGTGCTAAGAAAAATGCTGAGGAAAATATTGAAATTGAAATGGAATTTGCCATC
+AACGGTGTTGGCCAAAAAGGATTCGCTACATTAACAGATGCCCAAAAAGCAGCTGTACAG
+TACGCATTTAAAGATACAACGAAAGGTTAATCAACAAGGCCAGTTAATTACTGGTCTTTT
+ATTTTTAAGTTTTTAAAGGAGAAAGAATAATGCAATTGGAAATTAAAGGTAAAACTCATA
+ACGTAAAATTTGGTACACGATTTGTTGCCGAGATGGACAAAAATCATATAGCAGAACGTC
+AGGGATTTAAATTTGGAGCTGGTCTACAATCTAGCGTTCCGTTTTTAATCGACCACAGCG
+TTGTTACTCTTGCGGAAGTAATTTATACAGGTACAATCACCGAACCACCACGTCCTAGTT
+TGAATGATATTTACGACTATATTGACGAAGTTGAAGATATTGAAAAGCTTTTTGATGATG
+TTTTAGACGAACTACGTCAATCAAACGCATCAAAGTTGTTTATGGCTCAGGTGGAAAAAG
+ACCTGGCGGAAGCCAAAGCGTAACAAATATAAAAAAGAGTTATTCTTCTCAAGAAAGCTT
+TGAGATGATTGTGCTTAATTGCATTAGATACCTTGGCATGACTGACATCAATGAAATCGG
+GCGATTAACTTTGTATGAATATGATTTATTAATGACAGGCAAAGCACTAGCGGCTGTTGA
+TGAATCACATAAAGCTCACAAACAAGCTTGGATAAACCACCAAGTTACGGCAACAAAACT
+TGTTGGTGGCAAGAAAAATAAAAAAGAAGTCCCTGTTTATAAAAAATTCAAGGACTTTTT
+TGATTATGAGGAAGAAATCCGAAAAATCACTCAAGAAATTGATGAAGGTTACGACAAGAA
+AGGTATGGATTTACTTCTCAAAGCTAACCTTTAAAGAAAGGAGGTTAAATGGGAGAATCT
+TATTCTGTTGAAGCGGTTTTGACAGCTGTTGATAAAACCTTTGGCAAAACATTACAATCG
+GCAATCCGTTCAATCGATGGCTTGGAAAAGCGTTCAACCGGTTTTTCATCGGTGTCTCAA
+AAAGCTAGTTCCATGTTTAAATCCATGTTAGGAGCGAATTTAGCCGGACAAGCTATCTCA
+GCAATGACAAGGACAGTGTCATCAGGCCTTGGCTCTATGCTTGGCGAGATGAATAGTTCA
+GCGAAAGCGTGGAAAACTTTTGACGCCAATTTAGCGGACATTGGGTTTGGAAAAAAACAA
+ATTTTGGCAGCTAAAACGGCGATGCAAGACTATGCAACTAAAACAATCTACTCGGCATCA
+GATATGGCTAGCACGTATGCACAGTTAGCGGCAGTTGGTGTGAAAGATACCGGAAAGCTC
+GTAAAAGCTTTTGGCGGTTTAGCTGCATCTGCTGAAAACCCGAAGCAGGCCATGAAGTCT
+ATCAGTCAACAAATGACGCAAGCAGTAGGAAGACCAACAGTTGCATGGCAAGACTTTAGG
+ATAATGCTGGAACAGGCGCCTGCAGGGATGGCTAAAGTCGCTAAATCTATGGGTAAAAAT
+CTTGATGAACTCGTCGCCGATATCCAGGCGGGTAGGGTTAAAACCAGCGATTTTTTGGAA
+GCGGTAAAAAAAGCAGGCAATGATAAGAGTTTCCAAAAGATGGCAACTGAGTTCAAAACT
+GTTGACCAAGCCATCGACGGTATGCGAGAAGGCTTATCCAACAAATTGCAACCAGCGTTT
+GAAAAAGTGAACCAATTTGGAATTAGAGCGATCGAAGCAATCGGTAAACAACTCGATAAA
+GTTGATTTTTCTAAGTTTGCTAGTAATCTTGGGAAATTCCTTGAAGGAATTAATATCGAT
+AAAATTGTATCTAATATTTCATCGGCGATTTCATCTGTCACTTCAAAGGTTAAAGAATTT
+TGGGGCGGTTTCAAACAAACTGGAGCAATTAGTGCTTTTTCAGGAGCTTTAAAAAGTGTT
+TGGGGAGCGTTAAAAAATGTAGCTAGCGCTATGAGTGGAGGCAGTTGGAAAAACTTTGGC
+TCTATTGTAGGCGGAATTGTAAAGCATGTGTCTAATTTTGCAAAAGCTATTGCTGATGTT
+GTCGGTAAAATGGAACCTGGCAGATTGCAAAGCTGGATAGCCACTTTTGCAGCAGTCGGG
+GGAGGGTTAAAGTTATTTGAAAAGCTAACAGGACAAAGCGTTGTTGGCTCTTTTTTAGAT
+AAAATCAGTACAAAATTTGGATTATTTGGCAAAAAAGCTAAAGAAGGAACCGATCAAGCA
+GCGAATGGCTCTCGTAAAAGTGGTGGAATCATCAGCCAAATCTTTAATGGCTTGGGTAAT
+ATCGTTAAGTCTGCTGGTACAGCCATATCAACAGCTGCAAAAGGTATCGGTACAGGGATT
+AAAACCGCCTTGTCTGGGGCACCTCCTATCATTAGTTCTCTAGGAACCGCAATATCAACA
+GTTGCGCAAGGTATAGGCACTGGGCTAGCAATCGCTTTTAGAGGTTTAGGAGCTGCAATC
+GCTATGGTGCCTCCCACCACTTGGCTAGCTTTAGGAACGGCTATTTTAATGGTAGGAGCG
+GCTTTTGCCTTAGCAGGAACTCAGGCTGATGGCATTAGTCAAATTTTAAGGACTATTGGC
+GATGTTGTTGTACAAGTTTTACAACAGGTCACTGATAGTCTAGCCACTTTACTAACTATT
+ATCGCAAACGCTATTGGCTCTATGTTGCCAATTGTAGCTGGAGCTATCTCTCAGATTGTA
+GGCGCAGTAGCGGGCGGATTATCTCAGCTCATTATAGCCGTTTCAACAGGGGTATCTCTC
+GTTATAGGAGCTTTCACAGGACTTCTTGGTGGTATTTCTGGGGTTATTAACTCCATTAGC
+GCTGTTATCCAATCGCTAACTGGTGTGATTACCGCAGTATTCAATGGCATAGCTACTGTT
+ATTTCATCTGTCGGTTCGACTATCAAAGATGTATTGACGGGTCTAGGAACCGCTTTTGAA
+GGATTTGGGAATGGTGTAAAATCAGCTCTAGAAGGTGTTGGGGCAGTAATTGAATCATTT
+GGTAGTGCAGTTAGGAATGTCCTTGACGGTGTTGCAAATATCCTTGATTCTATGGGGACT
+GCGGCACTTAATGCAGGCCGTGGCGTCAAAGAGATGGCTAAAGGTATTAAGATGCTTGTT
+GATTTATCCCTTGGAGATTTGGTTGCTACATTAGCAGCTGTGGCAAGCGGTCTAGGGAAG
+ATGGCTAGCTCAGCTGGCGAAATGACAACATTAGGTTCTGCTATGAGCAAAGTAGCCAAT
+GGTATGACACGTCTAGCAACAAGTGCTACGATAGCAATTACTGGATTAACAGTCTTTGCC
+ACCACCATGGCAACTATTAAGACAGCAGTTGCAACTCTACCGCCAGTCCTAACGATGGCA
+GCGAGTGGGTTTACCACATTTACTACTCAGGCGGTGGCAGCAGTGACTGGATTGGCTGCA
+ATTAATGCTCCAATCACTATGTTTAAAGCTCAACTAATGACAATAACACCAGCTCTAGCA
+CAAGCTGGCGCTGGCTTTGCCGCGTTTGTTGCTCAATCATCAACATTTAGTACAGGTTTA
+GCATCTGCCGGTCCTACAATAGCAGCATTCAATGCTAATTTGATGAGCTTATCTGCAACA
+ACAGGAGTGCTAGTTGCATCAATAGCTGGTTTATCAGCTGTGCTTTCTGTTGTATCAGCT
+GGCTTTAGCCAAATAGGGGCTTCTGCGACAGCAACTGTTGGTCAAATACAAGCTTTTGCT
+TCTAGTACAACAGTTGTTTCGTCAGCATTTGCTAGCATGCAATCTATGATTCAATCTGCC
+ATGGCTGCAATAGTAAGCAGCATTATAACATCATTTAATCAAGCGGCCTCTCAAATGCAA
+TCAATCTTATCTCGAATGCTATCTCAGGCCAGGACATTTGGGTCTCAACTAGAGCAACAA
+ATGAGACAATCGGGACAGCGTTCAGGACAAAATCTTGCTCGGGGGCTATCTTCTCAACAA
+GGTGCTGTTATTAATGCTATTTCTAGCATGGTTAATGCTGCGGTATCAAGAGCCAACGCG
+GGAGCTGGTCCTATGCGTCAAGCTGGAGCGTACATCGGACAAGGGCTTGCGCAAGGAATG
+TATTCAGCGCTAGGAGCTGTAACAGCTGCAGCAAACGCCCTTGTAGCACAAGCCGAGAGA
+GCAGCAAGAGCCAAGGCGATGATTCATTCGCCGTCAAGGTTGTTTGCAAAACGAGTTGGT
+CAATATATCCCGCAAGGGGTAGCTATGGGTATCGACAAAAACGCTGATGTCGTTGACGAC
+TCTGTTGGCGGGTTATTTGATAGCATCAATAGCTTTGATTTTAATATCGCAGATAGACTG
+ACTAGCATTGGAGCTAAATTCCAAGGTGTTGTCAAATCAGAGAGTTCGCAATCGTTATCG
+CAGCAACAAGAGTTTGTACATACAGCTCAACCAGCGTATATAAACTTTAGTTTAGGCGGA
+AACGAATACGAAGCATTTGTAAGTGACATCACTAATCAACAAGCAAAAATTGAAAAAATC
+AGACTAAAGAGAAGCAGCTGGTAGTTGTTTCTCTTAGTTTTTTTGAAAGGAGTAAAATGT
+ACGAATTTAACGATACTATCAGAGGTACTCCGAAAGTTACTTTTAATTTAAAGACAACAA
+TTGGTGGAAAGGTATTAGAAGACGAACTCAATAATGGTTTCGGTACCTTTAGGACATTGA
+CTGTTTCTGGTCGTGATGTGGTGGACTTAGAGCATCAAACAACAAGTGTGTTAGGACGAA
+ACGGAGAGTATTTCCACAATGCCACAGTTGAAGTCAGAAAACTAGAAATAAAAGCTAAAA
+TCAGTGGAAAAGATAACAAGTCAATGCGTTTACAATATGAAAAATTAAACAAATTAATTG
+TTAGTCACAATCAAGTTTTTTTATCATTTTCAGACGAACCTGACAGAAATTATCTAGGCA
+TCTTTAAATCTAAAGATGTCCCAGAAGAAGTTTCTAACGAGCAGATTATAGGACTAACAT
+TCATCTGCTACAATCCGTTTAAAATGTCTGATGTAAAAACTAAAAAAGGAACATCTATCC
+AAAATGGTGGGTTATTTCAAACAAAGCCTATCATCACTCTCAACCTATCATCACCAACAA
+AAGAAATTAAGTTGTTGCATGTCGAAAGCCAGAAGTATATCAGATTGACTGGAACTTATA
+CCACTGACGAAATCAAGATTGATATGGCCACGGGTAAGATTACCCAGAACGGACGCAATA
+TCCTTGGCGATTTAGATATGATTAATAGTAGGTATTTTGAGCTATTACCTGGTAATAATA
+CATTACAGTGTGCCAATGCCGCCATAACCGCAGAGTTTAGAGAGGTTTATCTATGATATA
+CCTGTTTGATAAACTTGAGCGATTGGTCGCTACTGTTGGTACTGATGACTTGCTCTCATG
+GCACTTTAAGGTCAAAAACAATGATTGGGACCAGGCTAGTTTTGAGGTGCCAGTTGATTA
+TGACGTAGAGCCATTTGTCTACTTTGGTTTTTTTAACTACGACCCTCATCAAAAAGAAGA
+TGTCTTTAAGCTCTTTAAAGTCATTGATTACAACCTAGAAGATAGCAAGTTTTACAAAGG
+CTTAGACAAAGCTGAGAGTGATCTTGATACCATTGCCATTATCAAAGATAAGCGATTTAG
+ACAATCGTCCGCAGATGCTTGTATTGATGGTGCTTTAGAGGGTACGGGTTATCAAGTCGG
+CAAAGTTGAGGGAATAACAAATGTTAGAACACTTAGTTATTACTACATCAGTCCACGAGC
+GGCTCTGATTAAGATTGTGGAAGCTTTTAACTGCGAGTTCAATGTCAGGTATACCTTTAT
+TAATAACAAAATCACTAGTCGTTATATCGACCTCAAAAAGCGCTTTGGAAAGCCAACAGG
+CAAGCAATTTGAACATGGCAACAACCTACTAAAAGTCGTCTACGAGGAATCAACAGATGA
+CATTGTGACTTGTCTGATTGGCAGAGGTAAGGGTGAGGAAATCCAACACGAAGAAGCTGA
+GCCTAAAGATGTCGAGGGACACTTGCCACAGGAAGAAAGGCGGCAAGGCTACGGTCGAAG
+AATCGAATTTACTGATGTTGTCTGGTCGGTCGAAAAAGGCGACCCGATAGACAAACCAGC
+TGGTCAAAACTTTGTAGCACTAGATAGTGCAAGGGAAGAATACGGTTTGTCTCAAAATGG
+TGAGCTAAAACACCGCTGGGGTGTCTTTGTCAATGAGGAAATCGAGGATAAGACAGAACT
+CTTAAAAGCAACTTGGGAAGAATTGCAGCGTTTGTCAATCCCTATCAGAATTTACAAGGC
+AGAAATCTTAGACATTGGTCCAGAGACGTGGAAAGGCGACTCAGTAGCCATTATCTATGA
+TGAGGTAAAAATAGCTTTTGAAACTCGGGTTGATGAGATTGATATTGACAAGCTTAATTT
+TAACAGGTCAGTCGTAACACTTGGTGATTACAGCGTTGTCCAAAATCGTGAGTCACGGTC
+TCGTAAAGAGGCTGTCCAAAACATGATAGATGAATCTTTAGAGACTATCACAGACTTAGG
+GATGACATTTCAGGAATTTTTGCAAGGCATCGAAAAACGCATCGAGACTGGCAAAAAGGA
+GATGGAAGACAATTGGCGCAAAGTTAACCTTGAATTTGATAACTTTAAAAAGAAGGTTGA
+GCAAGAAGGCTTGCAATTCAACACCTTGAAAGAACAAATCAAAGAAGTTGATGAACGCAC
+CGATAAAGAGCTTGAAGAGTTCCGAGCCACCCTCAAAAACCTAGCGTTACCGGAAGAAGC
+CATCAAAAAAATCACCGAGGCTATCAAAGTTGATGACATCCCGTCTATTAAACAAAGCTT
+TGATGACCTAAAAAACAAAGTCAGTGAAACGAGCGAGACGTCCCGTCTAAACGCCGAAAT
+TTTAGGTAACAACGGTAAGACCCGCTACAACAAAAATTTGCTGGTTGGCGACCCTAACCG
+CACCAAAACCTATGATGAGGATTACATAGAAGTAGAAGCTAACGACGGTGGTTTTAAGCG
+TGGCGAGACCTACACGATTAGCTTTAGCCAGACTTGTGAGCTACTCAAAAAAGTGGCTGT
+CACGCTGACACAGGCTAACAACAAGGGAGTTAAGTTAGTGCTGACACCTACCAAGGCTAA
+GATGGAAGCACAGACGTTTGAGGTCGCTAAGGATAAACAGTCTATAGAGGTTTATCCTTT
+GAGCTACACGGCTGTTTTAACTGGCGACTGGTATAAATCTAAGCAGATAGATTTAAACGC
+GTCGGAGGTGCAGGAATTGGCCCTGGATATGAGCTATAAAGATGTTGTGGACGGTAAAGG
+AGCAACTATCACAGGGGCATGGTCAGACAGCCCACAAATTATATTAGACGGAGGTAATTA
+ATGGCTGAAAATATACCGCTACGAGTCCAATTTAAGCGGATGAAAGCCGCCGAGTGGGCA
+AGTAGTGATGTCGTCTTACTGGAGGGTGAGATTGGCTTTGAGACTGACACTGGTTTTGCT
+AAGTTTGGCGATGGTCAAAACACTTTTAGTAAGCTTAAGTACCTTACTGGTCCCAAAGGT
+CCTAAAGGAGACACTGGTCTCCAAGGTAAAACTGGAGGAACTGGTTCTCGGGGCCCTGCT
+GGCAAGCCTGGAACGACAGATTATGATCAACTCCAAAATAAACCAGATCTAGGTGCGTTT
+GCACAAAAAGAAGAAACTAATAGTAAAATCACCAAATTAGAATCAAGCAAAGCAGATAAA
+AACGCTGTTTACTTAAAAGCAGAGTCAAATGCAAAGCTAGACGAAAAATTAAATCTCAAA
+GGCGGCGTCATGACAGGACAACTACAGTTTAAACCTAATAGTGGTATTAAACCCTCATCT
+TCCGTAGGAGGAGCGATTAACATTGATATGTCTAAATCGGAAGGTGCTGCTATGGTGATG
+TATACAAATAAAGATACTACTGATGGACCATTGATGATTTTACGCTCTAACAAAGATACG
+TTTGATCAGTCAGTTCAATTTGTCGATTATAAGGGAACAACAAATGCCGTTAATATTGTG
+ATGCGTCAGCCAACCACCCCCAATTTTTCATCGGCACTTAATATAACCAGTGCTAACGAA
+GGCGGTAGTGCGATGCAAATTAGAGGCGTCGAAAAAGCATTGGGAACGCTCAAAATCACA
+CACGAAAACCCAAGCGTTGACAAAGAATACGATAAAAACGCTGCAGCGTTATCCATTGAT
+ATTGTCAAAAAACAGAAAGGCGGAAAAGGTACTGCTGCCCAAGGAATCTACATTAACTCA
+ACATCAGGCACGACAGGGAAGTTGCTTAGGATTAGAAACCTTAATGATGATAAGTTCTAC
+GTCAAGCCTGACGGTGGTTTTTATGCCAAGGAAACTTCGCAGATTGATGGCAACCTGAAA
+CTCAAGGATCCCATAGCGAATGATCATGCGGCAACCAAAGCTTATGTTGATGGTGAAGTC
+GAAAAATTAAAAGCACTCTTAGCGGCTAAGCAAATGTAAAAAGGAGGATAAATGAGTAGA
+GATCCAACGTTGACATTAGACGAGTCAAATCTCGTTATTGGTAAGGATGGACGTGTGCAT
+TATACATTTACTGCTAGTCAAGACAACCAAACAGTTAGACTAGCCAGCAACTGCTTAGGC
+ACAGCGCACTTTAATCAGCTCATGATTGAGCGAGGGGATAAAGCGACTGGCTATGTGGCG
+CCTGTGGTTGTTGAGGGTAGCGGTGAGTTGACAGGTGTGTTTAAAAGTCTTGAGGAGATG
+CTTAGTAGCTTGAGATCTATTAATTTAGAGCTGACAGACACCAAAGACTCTAAGCTTTGG
+TCAAAAATCAAGTTGACTAACCGTGGCATGTTGCAGGAGTACTATGACGGTAAGATCAAG
+ACTGAGATAGTCAACTCCGCACAAGGTGTGGCTACTCGTATCACAGAGGAGACTGGCAAA
+AAGCTAGCACTTATCAATGAGTCTATCAACGGTATAAGGCGAGAGTATCAAAACGCTGAT
+AAAAAGCTATCAGCTAGCTATCAGCTGGGCATAGATGGTCTCAAAGCCACCATGCGTAGT
+GATAAAATCGGCTTACAAGCTGAGATACAAACAACCGCTCAAGGCTTGTATCAAAGGTAT
+GATAACGAGATACGCAAGCTGTCCGCTAAAATAACCACTACCTCGTCAGGCACTACAGAG
+GCCTATGAAAGCAAGCTCGATGGCTTACGAGCTGAGTTTACTCATAGTAATCAAGGTATG
+CGCGTAGAGCTGGAGTCAAAAATCAGTGGGTTGCAATCAACGCAACAAGCAACTGCCAGG
+CAAATCTCACAAGAGATAAGTAACCGCGAAGGTGCTGTCAGTCGTGTACAACAGGGCCTA
+GACAGTTACCAACGACGATTACAGTCCGCAGAGGGTAATTACAATAGTTTGAGAGAGACT
+GTAGCGGGTTATGAGCGCAGGATATCCAATCAGGATAACACTATCTCCTCTAACTTTACA
+CAGCTAAAAAGCTTGATAAATCAGTCTGTGACCTTAGGAAAAATACAGTCCCTCTTGCGG
+CAATCTGGCGACAGTATCATGCTTGCGATTAAAGACAAAATCCCGCAAAGTAAAATGTCT
+GGCAGCGATATTATCTCAGCGATTAACTTGAATTCCCGCGGTGTGCAAATAGCTGGTAAA
+AACATCGCTCTTGATGGCAATACGACGGTTAATGGAGCTTTTGGGGCTAAGTTAGGGGAG
+TTTATCAAGCTAAGAGCCGACCAGATTATCGGTGGGACAATCGATGCAAACAAAATCAAT
+GTGATTAATCTCAAAGCTAGCAGTATTGTTGGTTTAGACGCTAATTTTATCAAGGCAAGA
+ATTAGCTATGCTATCACTGATTTGCTTGAGGGTAAAGTTATTAAGGCTCGTAATGGTGCG
+ATGACAATAGACTTGCAAAGCGGTCAAATCAACCATTACACAAATGAGTCAGCCATGAGA
+CGTATCGATAGCAGTACAGCTAGTCAGTTTATAAAGATGACAAAGTCAGGCTTTATATCT
+GAGATAGGTAACATGCAAGCTGCAATGACGGTTATAGGCTCTAATAGCGATGGGTCAGAA
+AACCATGAAAATAAAACCTTCGGAGGCATAAGAATTTGGAACGGGAAGTCATCTTATCAA
+TCGACAAGTTTTGTTGAATTAGTTGGTAACCGTGTAGCAATCTATGGAAATAAAAATCGT
+AGTCCATGGCTCTTTGACTCAACAACGTCAGGATATGCTTACCTTATCCCTCAAAATGAC
+AGAGGTATAAAGCATGTCATAGGGAGAGCTGATCGTAAGATAGACCAAATCCACGTTGGA
+GATATCTATGTGCAAGGCGAACGTGTAGCCATGATGTTAAAAGATTTAGCACTTAAAATT
+GGCTATATAGGTACAGGTGGTTGGGCTAACCGCATAGGATAAATTAGGAGAAACAATGCA
+AGAAAAATTATTAGGTAAAATTATTAACGATTTAGCACTTAAAGTTGCTAATTTAACGCT
+AGAAAATGCTCAATTAAAAGCACAGCATGAAATCGAATTGGAAGAACTAAACGCACAATT
+GGATGAAGCAACAGCACCGAAGGAAGAAGGTAAATAAACATGAGAAATTGGAAAGTAACA
+GGAAAATATCCACAACTTGATGGCACAGGAGCAGTCGCAAGCACACATATTATTATCGCT
+GCTGAGGATGGAGCTGTTATCCCGCAACTTATTAAGCAAGACTTAACCTCAACTAATGAC
+ACAGAGATTATCAAAGCCGCTTTGGAAGAATTTAAAAAATCTGAATACGTTGAAATTGCA
+ATGGGCGAAGCCGTGCAAAAAGTAGACGACCTTGAAAAAATCTCACAGGAAACCGCTAAG
+ACCGCTAAAACAGCCCAAACAGCCGCAGGATTAGCTAAGGTGTCCGCAGAGCGTACACAG
+CGAATGATTAACTTGCAAACCATCCACGTATTGACAAGTGGTGGGAACGTTGAACCCGAT
+ATCTACAAAGGTATGTTAGAGCTTATTGAGCCTGCTAAACAAGGCGAGTATCAGGCTTAT
+GACGTGTTTACTGTTGTAGATGAGTCGCACGAAGATCAAGCGGTAGAAGGGAACCTTGTC
+TTTGTACATGTCAACGAGCCGTTTACTTATGAGGCGCAAACTCTTAAAGATTTGGAATCA
+GAGGATAAAGTCACAGTTATTAAATATGCGGATTTGGTTAAACAAGATTAGAGGTGGTTA
+GATGATAGATTTTGTACAAATTGGTGCTTTTTGTGGCGCTGCTTTGTCTATCTTGGGTGT
+TTGGGGATTTATCGTCAATCCCTTTAAAAAAGCCATGGAAGCTAATGAGTTTGCCATGGC
+TCAACTCAAGGACTCAATTAAGGAGTTAGCTTATGAGCTTAAAAATCTTGATCGTGAACG
+TGAGATTACCAAAAAAATTATCGACAGACACGAGGAGCGTTTAGGTCGCGTAGAAGACGA
+AGTTATTATCAACAAGGAGCGTATTATTACGCTATTTAAAAAAGGAGAAGAAAAATGAAT
+AACTGGTTTAAAAAAGTAGCAATTAAAACAATTAAAACAATGGCACAAATGGCCGTTGGT
+CTAATCGGGTCAAGCGTGTTAATCACGGATATTAATTGGCCAACAATGTTGTCAGCAGTG
+CTGTTGTCAGGACTAACATGTATCCTGATGAATGTGTCACAAATCAAGGAAGAGGAATAG
+GTCATGCGAGCAATCACACGATTAGCATTAGTTATAGCAATCGCAATACTGTATGTGCCA
+TTATCTGTGGTTGCTTTGATTTTTTATCCATTTTTAGATAAGGAGGGATAAATGGCTACA
+TATCAGGAATATAAAAGTCGTTCAAATGGCAATGCTTACGATATTGATGGATCGCTTGGT
+GCGCAATGTTGGGATGGCTACGCAGACTACTGTAAGTATCTAGGACTGCCATACGCAAAC
+TGTACAAATACAGGATATGCAAAGGATATATGGGAACAACGTCACAAAAATGGTATTTTA
+AACTACTTTGACGAAGTAGAGACTATGCAAGCTGGAGATGTCGCAATTTTTATGGTAGTT
+GCAGGTGTTACACCGTATAGCCATGTGGCTATTTTTGATAGTGATGCAGGTAGTGGATAC
+GGATGGTTTTTAGGTCAAAACCAGGGTGGAGCAAACGGAGCATATAATTTAGTAAAAATA
+CCATATTCAACGACTTATCCTACTGCATTTAGACCAAAAGTTTTTAAAAATGCAGTTACT
+GTTATAGGTAATATAGGACTAAATAAAGGCGATTATTTTATTGATGTATCAGCTTATCAA
+CAAGCAGACTTAACCGCTACTTGTCAGCAAGCTGGCACTACTAAAACGATTATCAAAGTA
+TCCGAGTCACTCGCTTGGCTGTCTGATAGGCATCAGCAACAAGCTAATACTAGTGACCCT
+ATTGGTTATTATCACTTTGGACGATTTGGAGGAGATAGCAACTTAGCGCAACGAGAAGCA
+GATTTATTTCTGTCCAATTTACCAACCAAAAAAGTCTCTTACTTAGTCATTGATTATGAA
+GACTCTGCAAGTGCCGACAAAGAAGCTAACACTAATGCAGTTATTGCGTTTATGGATAAA
+ATTGCAAACGCTGGATATAAGCCTGTTTATTACAGCTATAAACCATTTACGCTTAATAAT
+ATTGATTATCAGCAAATTATCGCTAAGTACCCAAACAGCATTTGGATAGCTGGTTATCCA
+GACTACGAAGTACGAACAGAGCCACTTTGGGAGTTCTTCCCTTCAATGGATGGTGTGCGC
+TGGTGGCAGTTCACAAGTGTAGGAGTAGCAGGTGGTTTAGATAAAAATATTGTATTATTA
+GCAGATGATAGTAGCAAAGTGGATATACCTAAGATTGACAAACCACAAAGCCAGCTTACT
+TTTAATCAAAAGCTAGATACTAACACTAAATTAGACAACTCGAATGTACCTTACTACGAA
+GCAACCCTTAGAACAGACTATTATGTAGAGTCTAAGCCAAACGCAAGTAGCGCTGATAAA
+GAATTTATCAAGGCAGGAACTCGTGTAAGAGTCTATGAAAAAGTGAATGGATGGTCACGT
+ATTAACGCTTCTCAGTCTGACCAGTGGGTCGAAGATAAGTATTTATCTAATGCAACACAA
+GTATAAAATAGGAGGTAAAGCTCCTTTAGATAAGACAAATGCCCTCGCTTTTGCGGGGGC
+TGTTTTTGTTATAAAGATTTTAATTGTTATTTAAGCATTTTCGTTGATTTTTTTCTTTTT
+TGTGCTAAAATATTTTGTGATTTCTTATTATTAAAGAAGAATAGGGTACACTTATAAGTG
+AGAAAAATTGTAAATGTTAATTTTAAAAAGTTTTTAACTTCATCTTTTCTATTGTGGGTA
+TTTATATCAGCTATAATTCCAACGTGTTACGCGTATGAGATGAGTAGTGTGGGAGTTATT
+AATTTAAGGAATTTATACTCTACATATGATCCAACAGAAGTAAAAGGAAAAATAAATGAA
+GGTCCGCCATTTTCAGGTAGTTTGTTCTACAAAAATATTCCTTATGGCAATAGTTCGATT
+GAATTAAAAGTAGAACTTAATAGCGTAGAAAAAGCTAATTTTTTTTCTGGTAAAAGGGTG
+GATATATTTACTTTGGAGTATTCTCCTCCCTGTAACTCTAATATAAAAAAGAATTCATAT
+GGAGGTATTACTTTAAGCGACGGTAATAGAATTGATAAAAAAAATATACCTGTTAATATT
+TTCATAGACGGCGTTCAACAAAAATATAGCTATACAGATATAAGTACAGTGAGTACTGAT
+AAGAAAGAGGTTACGATTCAGGAACTTGATGTGAAATCAAGATATTATCTTCAAAAACAT
+TTTAATATATACGGATTCGGTGATGTTAAAGATTTTGGCCGCTCCTCTAGATTTCAATCT
+GGCTTTGAGGAAGGAAATATTATTTTTCATTTGAATAGTGGAGAGAGAATTTCTTATAAT
+CTTTTTGATACAGGACATGGTGACAGAGAGAGTATGCTAAAAAAATACAGTGATAATAAG
+ACCGCTTATTCTGATCAACTTCATATTGATATATACTTAGTTAAATTTAATAAATAAAAC
+TCTCACTTCTTAAGGAGAAAAAATGAGATATAATTGTCGCTACTCACATATTGATAAGAA
+AATCTACAGCATGATTATATGTTTGTCATTTCTTTTATATTCCAATGTTGTTCAAGCAAA
+TTCTTATAATACAACCAATAGACATAATCTAGAATCGCTTTATAAGCATGATTCTAACTT
+GATTGAAGCCGATAGTATAAAAAATTCTCCAGATATTGTAACAAGCCATATGTTGAAATA
+TAGTGTCAAGGATAAAAATTTGTCAGTTTTTTTTGAGAAAGATTGGATATCACAGGAATT
+CAAAGATAAAGAAGTAGATATTTATGCTCTATCTGCACAAGAGGTTTGTGAATGTCCAGG
+GAAAAGGTATGAAGCGTTTGGTGGAATTACATTAACTAATTCAGAAAAAAAAGAAATTAA
+AGTTCCTGTAAACGTGTGGGATAAAAGTAAACAACAGCCGCCTATGTTTATTACAGTCAA
+TAAACCGAAAGTAACCGCTCAGGAAGTGGATATAAAAGTTAGAAAGTTATTGATTAAGAA
+ATACGATATCTATAATAACCGGGAACAAAAATACTCTAAAGGAACTGTTACCTTAGATTT
+AAATTCAGGTAAAGATATTGTTTTTGATTTGTATTATTTTGGCAATGGAGACTTTAATAG
+CATGCTAAAAATATATTCCAATAACGAGAGAATAGACTCAACTCAATTTCATGTAGATGT
+GTCAATCAGCTAA
+>NC_002737.2|provirus_1186916_1222544
+TTATTTAAAAGAAAGTAAACGCAAGCCATTTAAAATCACTAAAATCGTTGAGCCTTCGTG
+TCCAACAACACCAAGCGGCAAGTTAACTACCTGAAAAACATTGGCTAAAATCAATAAGGT
+AATCACAGATAAGGCAAAAACAATATTTTGTTTGATAATGGTCTTCATTGTGCGGGAAAG
+TTGAATCGAAAATGGAATACGAGTCAAGTCATCCATAATCACACTGTCTGCACTTTCCAT
+TGCAATATCTGTTCCTGATCCAATAGCATAAGAAACATCTGCTTGAGCAAGGGCAGGAGC
+ATCATTAATACCATCTCCTACCATAGCCACAAAACCATATTTAGTCTTTAATTCTGCTAA
+CTTAGCCACCTTATCTTGAGGCATACAGTTGGCTACCACTTCATCAATACCAAGTTTTTG
+TGCCACATAATTGGCGGTTCGTTCTTGGTCACCTGTTAACATGACTGTTTTGATTCCCAT
+GGCATGAAGAGACTTAATAGCACGTTTTGATTCTATTTTGATATCATCCAAGAGGGCATA
+GTAAGCTATCAATTGATGGTCACGTGAAACAAAGATTAGGGTTTTCCCTTGATTTTCTTC
+CACTTGAATAGTTTCTTCAAAAGCTGATAGGTCTTGAACCTTTTCCAAAATGTAGGTTTT
+CTTGCCAATTCGCCATTCTTGCCCTTGATAGAAGCCCTGAAAACCTTTCCCAGAAATTTC
+TTCTAAGTGGTCAAAGGTCAGTGGCTCCAATTTTTCAGTGTATTCAAGAAGGGCTTTAGA
+AATAGGATGGGTACTAGCAGTCTCTGCTCCTTTTACCAGTCTATTCACGAGCAACTCATC
+TTCCAAATAATGAGCATTCACAACAGAAGGTTTTCCTTGGGTGAGCGTTCCCGTTTTATC
+CATGACAACAGCCTTAATATCTCCCATGTTATCGACAATATCCCCTCCTTTGATAATCAA
+TCCCTTTCTGGCTGCACGAGAAATAGCAGCCAAGCTAGCAGGTGTGGAACTGGCAATTAG
+GGCACATGGTGAAGCTACTGTTAAGAGAATCATCCCTCGGTAAAAAGCAGCCAACCAAGT
+CCAAGAAAGCACAAAGTGGCTAAAGAGGATAAAGGCAGGAATAAGGACGAGCACAAATTT
+GACATAACCATCTTCTAAGCTTTCGATAAAGGTGGCGGTTTTGCTTTTCTTTTCTTGGGC
+AGATTCCACCAGATTAATAATCTTGGCAAAGAGAGTATCGTCATTTTCAATAGTAACCAA
+CATATCTATGGTTTGTCCTTGGTTAATGGTTCCCCCAATCAGATCCTGGCCTTCTGCCTT
+ATCAACAGTGATAGGCTCACCAGTGACCATAGATTCATCAAATTGACCAAAAGGACTAAG
+CAACTGCCCGTCAATTGGAACAGCTTCGCCTTTACGAACTTGTAAACGGTCACCAACACT
+CAAGGATCTGGTCTCAACTTCTAAAATATGGCCATCTTCTTGGTATTGACGAGCTGTATC
+TGGCGTCAAGGACATCAAGGCTGAAATAGCATCCTTACTTTTTTCCATGGCCATTTCTTC
+AAGCGTATTGGACAACGAAAAGATAAAAATAAGCAGAGCACCCTCCAGCCAATAGCCGAT
+AATTCCAGCACCGATAGCTGCCAAAATCATCAAAATATCCACTGACAAGTGTTTGTTCTT
+CACCAAATCCAATATACCCGTTTTTGCAGACGCATATCCTCCAATCAAGAAGGCTGTAAT
+GAAAATAGCGGAAGCCACTTGTGGAAATGAGTGTAAAAAGGCTAGGCCAATTATTATTAA
+TACCAAACACGCTAAAGTCTCCATCAAATGAAGATGGTCTGCCATCCATTGTCTGATTGT
+CATTTTTAGTTCCCTCGCAATTAAAAGTTATTCAATCTTTAAGATATATTAATTATAATA
+ATTCTAAATAAATAAGTCAAGTAATTTAGAAACATTCTAAATAAACTTTTTTAAACTTAC
+CTTTTGCTTTCAAAAATCCTAACTTCAACTATTTGCAAATATGAAAAAAACTCCCCCTAC
+CTGCGGAAATGATATACTAATAGAAGGATGACTGACCATTATAGAGTGCATGCTTTAGAA
+CTTGGCTTAACTGAAGAGAAAACTACTAACTTTATGCCCCAAATATAAAAAAAGAACCTT
+GTCGCTATCAATAAACATCGATAGCAACAAGATTTTTCTAGACGAATTATTTAACAGCGT
+CTTTTAAAGATTACTTAATATTGTGCACATATAATATAATAAACTTTGATTTTATAAAGC
+TACAAAATAACGAAACTTTATATAATTGCTTCGAATCAACTATGTAAGTTTTAAACTTAT
+GCCCCCTATTTACCCCTTTAATAAAACTACTTCTCAGGGGGCAAAGAAAATACTTATCTC
+GAAAGCTCCACCAGCACCTCTTCCACTTTTTCCTTAGTCACAACTTCTCCATTCTTTACT
+TTCTCATGTGGCAACACATAATCAAAAATCTGTCCGTCTTTACGCACGATCGCTACTGTA
+TCGCCTGCGATATATCCATTGTCAATCGCTTGCTTAAACTCGTCGTATGTTAGCATTTTT
+ACCCTCCTACTTATTTATTCGTATTTTACAGGAAATAATATAATTAAATTTAAAGGTCGT
+TTAAATTTAATTAACATCTTTTTTGTTACAAACTAAAATATTGATTGTTAGCGAATATTA
+AATAAAAAGAAATTTTAGCGTAATATTATTGATAAATTAATTTTATTAATTTTAAGTTTT
+TTTAATTTAAAGTGATATAATTAACCTGTAAATAATAAAAGGAGGACATGGATATGTCTA
+AATCAAATCGTCGTACTTGGCAAGGTTTAGTTGTTATTTTAATAGCTATTCTCACCACTT
+TTACCACAAGTACTGTTACGGCAGCCAGAAAAATTAGAAATTTCCCTGATACCACGGAAA
+TTTTGTTAGGAACGAAGGCGACTGAGACACCAGGAATCTTACCATTCACTGGTAGCTACC
+AATTAGTTTTGGGCGATCTTGACAATCTGCAAAGGCCAACCTTCGCACACATCCAGCTAA
+AAGATCAAGATGAGCCTAATATTAAACGAAAAGGACTTAAATTCAATCCTCCTGGCTGGC
+ATAATTACAAATTGACTGACGCTAATGGAAAAACAACTTGGTTAATGGACCGTGGCCATT
+TAGTTGGTTACCAATTTAGCGGCTTAAATGACGAGCCTAAAAACCTAGTTACAATGACAA
+AATATCTTAATACTGGCTTTAGTGACAAAAATCCTTTAGGAATGCTCTATTATGAAAATA
+GATTAGATAGCTGGTTAGCTCTACACCCTAACTTCTGGCTAGACTATAAAGTTACTCCTG
+TTTATCATAAAAATGAGTTAGTTCCTCGCCAAGTAGTTCTACAGTATGTTGGAATTGATG
+AAAATGGAGATCTACTTCAAATTAAGTTAGGTAGTGAAAAAGAAAGTGTAGACAACTTTG
+GAGTAACATCAGTTACATTAGATAACGTATCTCCTTTAGCTGAATTGGATTACCAAACAG
+GAATGATGCTAGATTCAACTCAAAACGAAGAAGATAGTAATTTAGAAACCGAAGAGTTTG
+AAGAAGCGGCTTAACATAAACTTATACTTAATAAAAATATCTAGATTGTGAACATTATCC
+CAAATGTTAGATTATTTATTTAATATTTGGGGTAATTTGTATAAAGTTAAATTTTGAAGA
+AAAATTAGTATAGGCTACTATCTGTGCTATTTTTTAAAAAAACAACGTCTATTTAGAAAG
+TCCCTTAAATAGGACTTTGAGAAATTAGTCTGTTTTAACGGCCTTTGTTGAGGATGATTG
+AATCGAGTAATATGTATAGTAGATTGAAAAAAAAGGGTGATTTTATGAAAAGGTCCAAAA
+AAGCATCGTTACTTAGTGTTATTGTTGGAATGGCTTTAGCTGTGATACCAATTTATATTG
+TTAATTATGACAATGAACTTATCGTTCTTTTAATGAGTATTTTTTTTAATGGGATAATTG
+TTTCCGCTTTTGAACTTATTAAAACATATGATGGTTTGCAGGAAGAATATAAAAAGCTAA
+CTGTAGATAGATGGAAGAATACTATTTTACTGGCTTTCAATTCATTATATTTTGCTTCTA
+TTTTGACAAATAGTCTATCAAATAATTTATCGACCATTTTATCAACTAATCGTTCTGACA
+AAGTAAGTGCAATATTTCTTACAGGTTGTTCTATTTTAGCACTACTTCCATTCCTCCTTC
+ATAGGTTAATAAAACGAGAAATAGAAATTGAAAATGAAAGAAAAAAATTAAAAAAATAAT
+TACTTAAACACAAAAAACCGCCCTCGATTAAGAGAGCGGTTTTGTCTTATCTAAAGGAGC
+TTTATCTCCTAATTTAATTTGCCCCAAAGGCTGATAATGTTACCGTCTTTGTCAGTTATC
+CCAATAGCCGTGTAGTTTCGCATACCCGAGCCGCCAACGTAGCTAATCCAGTAGTAACCA
+TTGGCGTAACCCTCACTATCAAAGCTGATAGTATCACCTTGTTTATAGCTACCTACTACC
+TCGCTAGTTAAACTTGGCCAACGTCTGATATTGATTTCTGCGACATCAAGCGTAAAAGTA
+CCTGTTTTTGCTGTCTCTACGATAGTGTCAGACGTTTGTGGCTCGGTGCTGACTGGTTGC
+GTGACAATATCTCCTTGGTAAGGAGGGTAAAACCATCCTGTCACGCCGGTAAAATCACGA
+GTATTAAAACGAGCTGGTGCACCGACATACAAAGCATCAGGATTGCCATCAATGTTTTGC
+TCGATAGTTCGCATGGTATAACCGTCGCTATCCTCAATGACAACTCCTGTGTGACCAAAT
+TGATGATATGGCACTGATTGGACAAAAAATGCTCCAGTCTGTGGATTTGCATCTGTCGGC
+ATGCGGTGGACTTCCCAACCTACGGCAGCAGCGCTATCTAGTAAGTCAATCGCATTTCCC
+CAAAGATCAACACCAAACCAGTGCTTTGCTGCATAACAAGGCACATCTGTGCATTGCCAG
+CCCGCAAAACCATCTTTATCCACGCCAACCCCAGCATTTACCAAGTTAATAAAAAATTCA
+ATGACTTCTCGACATTGAGAACTAATCATTTGCTTCTCCTTTCTGACAATAGCCTCTTCA
+TCCCATTCCTGAAGGTCATTTTCCTCGATTAGTTGGATAAGCAACTCTGCATAACCGCTA
+GCTGTGGCATAACCTGCATCTTTTATAGCGTGACAAGCTTTTTTGTAATCAGTCTCACCA
+ATCACAGCCTGATACCGTGGATTATCGTTTAAAAATTTACCGTGATCAATAATGCTGTCA
+GTCCAACTATCATACGCCCTAAATCGGTCCACAATATCCGTGACAACACCTGCTTGATAT
+TCCTCTTGGGTTTTGGTATCAAATGATTTACCAGTCCAAGAGCTATCTGCCTTAATACCA
+AACAGAGCGTTGTGTGGGGCATGTTTGCCCCACCCGCTTTCTAAGATTGTCTGCGCTGCG
+GTCAAGGATGGCAAGATTTTGTACGTTGTCCAGCCATCTAAACAGCCTTGTTTAATTTTA
+TCTAAAAAGGTCATCTGTCCTCCTTATCTAAAAATGGATAAAAGATCAGAGCAACAACAG
+ATATCGGCACATACAGTATTGCGATTGCTATAACTAATGCTAATCGTGTGATTGCTCGCA
+TGGCTCCTCCTATTGTTTTGGTTCGTGGTAAGTCAATGCTTGCTCACTGTCTGACAGGCC
+TTTTGTGGTTGGATCTGTGACAACACCGAGCAATACCAAAAGCGTTACAGCTGTGTTGGC
+AATATCCGCGATGTTTGATGGTAGTTTAATACCTAATTGTTGCGCTAACAAAAAGATAGC
+TCCCAAAATAGCCATCAAGGTTACTTTGTTTTGTAGTCGTAATTTTAAATTGATCATTTG
+ATTTCTCCTCTCATCATATCTTTTAAATCTTTAACATCATCTGTTAAATTTTTAATTTGC
+TCTGTCATTGTAATCAACGTTTTATTTTGCTCAGCGTGCTCTTCAAGCCGCCGAGCATTT
+TGGCGTGTAACAATTTTTAAATGCTCTACCTCAGATTGCAACAAAGTAATATCTGTCGCA
+TGCTTGATGGATTTTGCATTAAAAATATTGTAAGTCGTGACGATAGCTAAAATAAAGCCA
+CCGACGCCAAATATCAACTCTGTTGCCATAAACCACCTCTAATCTTGTTTAACCAAATCA
+GCGTACTTGATAACTGTTACTTTGGCTTCTGACTCTAGCTCCTCTAAGGTTTGTTTGTCA
+TACTCAAATGCTTCATTAACGTGTACAAAGACTAGGTTCCCTTCGCCTGCTTCACCGTCT
+TCCTCTTTAGTACTGTCGACCACCGTAAAGACATCATAGGCTTGATACTCACCTTTTTTG
+GCTGGCTCGATTAGCTCAAGCATGCCTTTATAAATGTCAGGATCAATCTTGCCGCCGCTC
+GTTAACATGTGGATGGTTTGCAAGTTAATCATTCGCTGTGTACGCTCTGCGGACACCTTA
+GCTAGTCCAGCAGCTGTTTGAGCAGTTTTGGCAGTCTTAGCGGTTTCCTGTGAGATTTTT
+TCAAGGTCGTCTACCTTTTGCACGGCTTCGCCCATTGCAATTTCAACGTATTCAGATTTT
+TTAAATTCTTCCAAAGTAGCTTTGATAATCTCTGTGTCATTATTTGAGGTTAAGTCCTGC
+TTGATTGGTTGAGAGATGACTGAGCCATCCTCAGCAGTGATAATAATATGTGTGCTTGCG
+ACTGCTCCTGTGCTGTCAAATTGTGGGTATTTTCCTGTCACTTTCCAATTTCTCATGGTT
+ATTCTCCTTTTTTACTTTCTTCAAATTGTTCCAAAATGTTGTCGATAAGAATGATTTCAG
+ATGATGTAAATTCATCTTCACACTCTTCTAAAAAGTTTAAAAAGTCAATAAATCGCTTGG
+AGTACTCACCCCCTTTAATCACAATTTCTTCATCAGCTAGCTCGTTGAGTAGGCCGTTGA
+ACTCGTCGAGTTTAGCGGGGTCTGCTAGCTTGATGTTTTTGTGCTCATCAATGACAAACT
+TGCCATCTTTGTCTTTTTGAGCATACAGATCAATAAGGTCACCCTCATCCTTGGCGTACT
+CTTTGAATTTATCTACTACTTTTGCGAGTAGCTTAGCACGTCCGCGGTTTGCTCGCATGT
+TCGTGACTTTGATTTTGTCTAGTACACGATATAGTGTGTTTAAATCTTTGTTTTTAATAG
+TTAATTGCATATTATCTCCTGTTAAATTTTAGTGATGTAGTTATTCAATTCCCTACTCAC
+AGCACTTGTAAAATTGCTATGAGCAGTATTCCAGCCGACGTTAGCCAAGTGCCCCCAACA
+GCGGCCTAAGGCTACTACAGCCGCATACAAGTCGTTCATGTCGAGCACTTTTTCCATTTT
+GTCTGGTCTAAATTTAAATCCTCGATTGATGTTAAAGTCATCTGCAATCAAGACATTATC
+ACCGTATAGCTCGGTTTGGTCGACTGCAGCAGTATGGTTATATCCCGTAGCGTACCTAAA
+TGACCTTAGCCCTGCAAAACGACCGGAAGAAGCGCTGTCGATGCCATCTCCTGATGAGGT
+AATGCCGATAGAGGCATATAACGCTGAGCCTCTATAGCCTTTTGGTGTGGCATTACTAAA
+ATGTACAAAAGCAGTATGTGTGCCATCTTTACGTACTAAGGCATTGTTTTTGCTATTAAA
+ATTAATTGTGGCATCTCGATTAAAGGTCATATTGGCATTATTTAGGTCCCACTGACTTGC
+CCCATTTGTAGCGGCTAATACACCTCCAGTAATTTTGCTAGCTGATAGTGTTACAGATTG
+GACTGATGTTGCAAAGATGTCTTTGGCAAACAACGTCCTAAAATATCCCTCGTTAGCAGT
+GAGTTTATTAAAAAAGGCATAGTCCATCTTAATTTTCTCACCAGTAATGGCCTCGGTTGC
+AATCCTATTAGCATTAAGATAACCAGTATTAATCTTACCGGCATCCATGTTAGCAATATG
+AGCATCTTTGATGACAGCGTTGCTGATGTAGCTGTTACCATCAAGAGTGATATTTTTTCC
+AGTGATTTTAACCCCAGACCTATCAAGATTGATTGCCGAGATAATCTCACTGCCAGACAT
+TTTGCTTGCTGGGAGTTTATCCCTGATTGCGAAGGCTATCTTGTCGTAACTCTGAGCAAT
+AGTTGTCTCAACATCACCTTTTGATACCTTTGTGCTGATCAGGTCACTTAACTGATTAAT
+CCGACTTGTAGCATTTGATTGATTATCACGTACAGTTGTTTGTAGTCCCTGTACAGTCTG
+AGACAAACTGCTGTAATTTTGGTTTGCATTTGTGATTTGTGACTGCAATCCTTGTGCTGT
+CTGAGACAATCGAGAAACATCATTAGCTGCATTACTAACTCGTAAATCAATGCCACTTAC
+CTTTTGAGATAGCGTTGAGTAGTTACCAACACCATCATCAAGACGACTGCTAAGACTATC
+AATTGTTTGGCTCAAACGACTGTATTTGCCATCAAGTCCACTAATACGACTATCAAACAT
+TGATGCTAGCTGAGTACGTGCGGATTCAACTGACTCACTTTTGACAGTTTGTTTGATACC
+ATTCAGAGTTTGCTCAAATTTGGAATATCGTTCATCATCAATAGACTTGACTTGTAACAA
+TATCTGCTCAGCTGATTGCGCAATGGCACTTGACATCTCTTTGTTGGCGTACTCGACTAG
+CATTGCCTTATTATTGAACTTGATTTTGCCCCACAAATCTGACTTAGGGTCTTTTAGCTG
+TAAATCAAGCTCTTTGACCTGCTGAGCTAGTCCAAAAGCTTGTTGAGTGGTAACTTTAGG
+CTTTACAAAGTCGTGCATTGTATTGTCATCCTCGACCTGTAGCTTTTTGATTATGGTATT
+GCCAAGGCAACTACTGTTAAGTCTCACAGTCTCACTTGACTTATCTGCCTTAAAGGTCAC
+ATAAAAACGACCATCTGCAAAAGATAAGTCGTGCTCGTTTATTGTATATGTTGGGTCTCT
+GCTCATTTATCCTCCTTAATCTATTTTTTTAGTATGAGTTTTTTTAACTCAGCAATTTTT
+TCATCTACGTAATCTTTAGTCGCAGCATGTTTTCCAGATGTTGGATCTTTAACTGTTAGA
+TTACCATCCACAATTGAACTTGCACATGACCAAAAGTCACCATCTGGACCTACATAAAAT
+TTGTCTTTATTTTTATTTCTGATTCTGAGCATTTTACCAGCTGTGCCTGATGTTGAGTTA
+ATGTAGATTCCTTGAGCAGCAGTACCTTTTCCGCCTTTCTGTTTTTTAACGATATCAATA
+GATAACGCTGCAGCGTTTTCATCGTATTCTTTGTCAACGCTTGGGTTTTCGTGTGTGATT
+TTGAGCGTTCCCAATGCTTTTTCGACGCCTCTAATTTGCATCGCACTACCGCCTTCGTTA
+GCACTGGTTATATTAAGTGCCGATGAAAAATTGGGGGTGGTTGGCTGACGCATCACAATA
+TTAACGGCATTTGTTGTTCCCTTATAATCGACAAATTGAACTGACTGATCAAACGTATCT
+TTGTTAGAGCGTAAAATCATCAATGGTCCATCAGTAGTATCTTTATTTGTATACATCACC
+ATAGCAGCACCTTCCGATTTAGACATATCAATGTTAATCGCTCCTCCTACGGAAGATGAG
+GGTTTAATACCACTATTAGGTTTAAACTGTAGTTGTCCTGTCATGACGCCGCCTTTGAGA
+TTTAATTTTTCGTCTAGCTTTGCATTTGACTCTGCTTTTAAGTAAACAGCGTTTTTATCT
+GCTTTGCTTGATTCTAATTTGGTGATTTTACTATTAGTTTCTTCTTTTTGTGCAAACGCA
+CCTAGATCTGGTTTATTTTGGAGTTGATCATAATCTGTCGTTCCAGGCTTGCCAGCAGGG
+CCCCGAGAACCAGTTCCTCCAGTTTTACCTTGGAGACCAGTGTCTCCTTTAGGACCTTTG
+GGACCAGTAAGGTACTTAAGCTTACTAAAAGTGTTTTGACCATCGCCAAACTTAGCAAAA
+CCAGTGTCAGTCTCAAAGCCAATCTCACCCTCCAGTAAGACGACATCACTACTTGCCCAC
+TCGGCGGCTTTCATCCGCTTAAATTGGACTCGTAGCGGTATATTTTCAGCCATTAATTAC
+CTCCGTCTAATATAATTTGTGGGCTGTCTGACCACTGCCCTGTGATTGTGGCATTATTAC
+CGTCAACAACATCTTTATAATCCATCTCCAGAGCCAATTCCTGCACCTCCGACGCGTTTA
+AATCTATCTGCTTAGATTTATACCAGTCGCTGGTTACAAGCACTGTGTAGCTAAACGGAT
+AGACATTGATAGTCTCAGTATCCTTAGTCAAGCCAAAACTCTCGACAACTAATTTGGGAT
+TTTTAGGTGTTAACACTAAGCGAGCACCTTTCATGTTAGCCTGTGTCACTGTGATTCCTA
+CTTTACGCAGTAGCTCACAGGTTGCCTCAAAGCTGATAGTGTATGTCTTGCCTTCTTCAA
+AACCTTCACCATTATGGGCAATGTCAATATAACCTTGTTCAAAAGTGATAACTTTGTCAG
+TATCACCATCCAGTCTGTTGCGATTGTAAAACGTGCCGCCAGTTGATCCAACAATGTTAG
+CTGTAACTGTGGCAGTTTCAGACGTGTCTTCCAGTTTAGCTTTAATGTCAGCTAAGCTAT
+CCTTGCTAAAACCGGCTTTGGCCAAAGCATCATCAATCTGCTTTTCATCAACTTCAAGGT
+CTTTAAGAGACGTTCTAAATTCTTCAAGTTTTTTATCAAAATCTTGCTCTTTAGTGTCAG
+CATCAGATAAAAATTTTTTGAGTCGCTCATCGACTGCCTTGGCTAGCTCCTCAGCTTCCA
+GCACTTTAGCGTTAACCTCAGCAACTTTGACCTCTGCATTAGCTTCAGCTTTTTTGATGC
+CATCTTCAATCTCTTCACGGAGTTTAGCTTCTTTTGTGTCAAAAATACGATTAGCATTAT
+CAATCTGCTTTTGTAATTTTGCTTCAAATGCTGCGTCATGTTGAGCAGTTGATTCAGCTA
+CCTTATTGTCAATTTGATTGCTAATTTGTTTTGCTAAGTTGGTCTTAATCTCTCCAAAGA
+TGATGGATTTTAACCGATTAGCCATAGGGGCGAACCGATAGCCAGTGATTTGCATTCGTA
+AGTCTCTGTCATAGAGCTCGTGGAAGACAATTGCTGTGTCAAATAGCCTAACAGCGCCCT
+CGTAGTTATTAGTAACATCAATTTTTAAACTATTACCTGGTATGTCGCAAAGAGTTTTTT
+CAAAGTATTTCTTACCATATGCAAGCAAGTCCTCTTCTGTTTTGACATCTTGATCCTGCA
+CCTTGATAGTCTTTTCAACAATTATCGGATGAGTGTCTTTGAGCTTGCTCTCAACAGATA
+CCCTAATTGTTTTCTTTTTCGGTGATTCACTATGACCAATGTTTCCATCTGAAGCTTCTC
+TGGTTTCTACTTCATGTTCTTCTTCTACTTCAGCAACTAAATGAAGGATAGAGACAAGCC
+CTTTGATAGTATCTGTTTCCTCATAAGATTTGAGGTTTTTCTTGTACATGAACAAGGTTT
+CGGTATCTTTGCCAGCTTTTTTGAGCAAGTTAATTTGGTATTTATTTCGTACAAGTTCGC
+CACCCCACTGCCCCATGATTGAGTGCTTGCCATTAGCTAAAGCGTCCATAACAGATACGT
+CTGATTGATTAAATGTGTGACGACCGTCAATATCACTAAAAAAGCTAAAAGGATGCTCAC
+GCTTGATACTACCTGCTAACTCTGACATTACTGTCATGCCTTGCACCCTATCAACACTGA
+TAGTGTCAATTGCATAGCCATTTAAGTCATCAGCGACCTGATTAGCGTAAACGTTAATAT
+AGCCATGCCGCTTAGTAATTTCAAAAATCCTAAAAAGCTGAGAACCATGCAGATCATCAG
+CTTCTAAGATTATTCCTTTTTTTATTAAAGGGCGATACTCGTGTTTAGCAGGATACTTAA
+AATTTAGTTTGTAATCACTATTGGCCTCCTGTGTAATCTCATCTTCAAAGGCTGCTACAA
+GAGGGGTATTATCATCTTTAATCGATATCAAACCTTATACCTCCACCTTGGACTAATTAT
+TGTTCTAGTAATGCCTCCACTGACGGCAATACCTTGTGTGCCAGGTTGTATTTCAAAAAA
+ACTTCCTCTTATTCGGATTGAGTTTTTCACATTACCTTCAGCATCATAGACGCATTGTTG
+GCCATGTTTGCACTCAATCGTTGCTTTACCTGACAAATTTAATTCCATGACCTGTTTGCC
+AATGGTTAGCGTTCCTTTACCAGTACCCTCAACAACTATCTTAGGTTCGCTGAAAACATT
+TCCTGCATTGTTAATGTTTCCGTTGCCTGCAATTACTACATCTGAGACACCTTTTGCGTA
+TCTAAATGGATAAAGAGCAAGTTTGAGAGTCACACGCCATGATGACATGGTTACCGCATT
+GATTTTGACAGATAAGCAATCATAGTAATAAATAGAGTTAGGTATGTGCCAAAATTCGAT
+TTTTTTACTAAGGCCGTCTAAATGATTAATTAGATTAACTGCATCATCAAAAGTACTCAA
+ATGCCACATTATGGTTGGTTTAGATTCATTATATGACTCCAATTCCCTACTAGTTCCATT
+CATGCCATAAGCTTCATTTTCGACAAAACTAGGGGATAGAATATCCCCCACATCGTAACC
+GGTCAAAACACAATTAGGGATTGAAGATGTGTCAAAATCATCAATAATAACTTTAGGTAT
+CATACAATCCCCTCTCTAGCCATAATTTTGGCAAATTCTTCGTATAAAATAGCGCTGACT
+TTTTCTTTGTCTAGATAGACATCCGTATTTTTATCAAGGATATCTTGCAACAGAGCAAGC
+ACCTTAACAAAGAATAATGACAAGTCACTTGTAGCAGAACCGACTGTAGTTTTAGTACTA
+ATATTGCTTGATAGTAAGTCATCAGCTGTGACGCTTGGTTTAGCATCGATACCGAGAGAT
+AGACTTTTACCTGTCATGGTGCTTGCAAGGTCGTCAGCCATGCCAGAGACATTTGATTTA
+ACCTCTTTAAAGCCGTCAATCAAGCTTGTATTAAGTCCACCCATAATTGCTTTACCAGCA
+GGTTTTAGTAGAACTCTATCATAAGAGATAGGTCCTTTATGTTCTGCAATCCAGTTGGCG
+ATACCGCTCACAAAACTTTTGACGGCTCCCCAAGCTGATTTCAAACCGTTTAAGAAACCA
+TTCATAATTGCGGCACCAGCTCCAGAAATATCAATGTTTGCCAAACCTCTAATTGTGCTT
+GAGATTGAATCGATAACTCCATTTACTGCTGAACCAACACTAGACACTAAGCTACTAAAA
+CTACTGAAGGCTGATTTTATGCCATTTATAACAGAGCTTATGATACCCTTAGCCACATTT
+ATTGCGTCTCCCATTGCCATCCAAGCAAGTGAGAAAATGTTTTTTAGGACGCCAACTGCA
+GAACCGGCACCACTGAACGCTAATTTTATGTAGTCAATAACCGTAGATATGATTGTTCCA
+GCAGTTGAAATTGCAGTCTGAATGTTAGTCCAAGCGCTCTTAATAAAAGCGCTCAAGCCT
+TGGCCGGCTGTGCCTAAATTACCAAACATACCGATAGCAACTCCAATCCATTCTGCAATG
+ACACTGAGAACAGGTTGTACAAAATTAAGACCTTGAACCAGCAAGTCAATAATTGGTGTG
+ACTAGTTGTATAGCCACTTTAACTGCATCAAAGGCAAAGCTAACTCCCATAAGCGCACCT
+TTTACAACACCACCTAAGAAAGACCCTAAAATTTGAAATACTGGCATCAAGGCATCACTT
+AGTATCGAAATTAAAGGTTGTGCTGCATTCCACATGCCAACAAACGAGTCAACAACTCCT
+GAGATAGCTGGTCCAACAATCGCAGCGAAGTTAGAAAAACCTGCCTGTAGGGCTGGTAAA
+ATTGCTGAAATTAAAGCCTCAAAACCACTGAAATCTAATCTGGCTAATCCGCTAATAATA
+GTGTCTATTACTGGTGCAACTGCACTACCAATGCTAGTAAAAAATGATGGCAACTGACTA
+AAAGCCGTTTTTAAACCGTTAAAAACAGGTTGTAAATTTTGGCCAATCTGTGCAAATTTA
+GCAGTAATAGGACTTAAATCAATACTAATTCCAAGGCTACTCATTAGACCTTGGAATTGA
+CTTGTGATAATAGGAGCTGCGGCTCCAATAAAAGTACCAATTGCCGATGGTAATCCTTTA
+AAGATATTTGCCACCATCGGAATAAAGTTACCAAATAAGAAATTAGAAGTTGTCTCAGCC
+AGTCCTCGTAAAGCCGGTCTGATATCATCTCCTAGTGATAAACCTGCCATTACATTTGTA
+AAAGAGGACTTCATAGCAGCTAGTGAGCCTGAAAATGTAGTTTTTGCTTCTTCAGCAGCA
+ACTCCAGCGATACCCATGTTATCCTGTACCAAGTGTATAGCCTCAACCACATCAGCATAA
+TTACTCAAATCAAACTTCTTGCCCATAGCGGCAGGTAACTTTTCAGCGTCTGATAAAAGA
+CGCTTCATCTCTTCTTTTGTGCCGCCGTACCCAAGTCTTAGGTTATCAAGCATTGTATAG
+TTTTGCTTAGCAAATCCCTGGTAAGCCATTTGGATTGATGTGATATCAGTACCCATCTTA
+GCCGAGTTGTCGGCCATATCCATGATTGCCATGTTAGCAGCCTTGGCAGCCGCGACAGCA
+TCACCTCCAAGTGATTGCTTTAGAGATGCACCCATTGAAACTGCTTGCTCTGCATAAGTA
+TTTGCTGATATTCCAGCTTTGTATGCCTCTTTAGCAAACCCTTTGACAGCAGTCTCAGCG
+CCCTTATACAATGTGTCAATACCACCAAAAGATTGCTGCAAATCAGCACCAGCGGACAAG
+GCAGACGAAATCATCTTACCGATTCCAGCAGCTGCAATGGCACCACCAATCATTTTAACG
+AGATTACCACCAATGAGCGAACCAGCGCTCAATCCAGCCGACCTTGCTTCGGGATCAAGT
+TGCTTCGAGATTGCTCCACTTATTCCACGAGCGGATGGCATAATTTGCACATACGCTTGA
+CCAAGTTCTGTTGCCATTAGCCATCACCTCCTAGTAATTGTTTACGTGCATTTTCAAAAT
+CCTCGCCAGACACAAAAGAAATGACATCATTAGCTTTTTGTGATTTAGATCCAGATATAG
+CTTCCACCACGGATTTAGGTTTGTTTTGACCAGATTGACCATCCTTAGTTTTAGACCAAA
+ACAGCAAATTAGTATTATCATAAATACCAGCTAACAAAACAGTATCCAAAGCCTCAGTCT
+CTCCAGATAATGCCATTTTTATCCTAGAGTTAGATCTCAAACCGACAGCAAAAACAGCCA
+CCTGATAAGCAGGTAGCTGTCTGTAATCATATATGCCGTATGTTTCAGCTAAATCACAAG
+TCAATGCATCATCATCTTTTGCTATCATCTGAGCGAGGATTGCTAGTTTTTTAAATCTTT
+TTGACTTTCAAAAATTTCTTTGATTTCTACTCCGATAGCTTCAACGTCTACGATACCTTC
+TGCATCTCGTACATGTTCTTTTAGAGACTTAGCAGCATCACCAAGTAACAAATTAACGAT
+TTTAACTACCGCTGTTGGATCAGTTTCCTCTTCTGCAATAGCTTCAACAAGTTCAAAGTT
+TTTTAATCGTTTTTTAGGAATTTCGTATTCAAATCCTGATGTTGTTTTTCCTTTTAAGAT
+TTCCATTTACTCCCCTTTACATTTCAAAGCTGTTTTCTTTTTTATTAGCTTCTCCAGGTT
+TTACAATATACTCACGGTGTGTATCACCATCCTTGTCCGGGAAACATTTTAGTGTTGTTT
+CATAACCAACGACTTCGCCGTCAACATACTTAATTTCACCTACCTCATCGACTTTTGCAT
+TTGGTAAGACAATTCGTTTAAGAATGCCGCCATTCATGATCATGTCAACAACAATTACGT
+GAGCTTCTAACTCTTTTGAATTTGATTTAATCTGGATTCCCCCACTTAAATCTCCAGTAA
+CATTGACAGCGCCATAAACTTCTTTTAAGACTTCTACATTTAGTGACTCAATCAGCTTAT
+AAGTAAATTTATCCTCTTTTTCTGTCTGTACAGCCCCGACAATATCTCCACCCCACGCTT
+TAATATTTTCGGATGAACGTGTATCTTCATTGACCACACCATCCTCGGATACATAACCCA
+AATTCTTAAATTTAGTATTTAATTCTGATTTTGCATCCTTGGGCAATTCAGTACCAAGCG
+GTGCCGAATAAATCGCCCCACCGGTCTTGGGCTTTGCAGATGTTACATTTTTAGTATCAT
+TCTTATTCATCAATATCTCCTTTAATAATGATTAATATCAAATACAGCTTGATAACGATA
+GCGCTTAGTTGCTGTATCTGTAAAATTGTAGTCAGCGTTAAGATGTACACCAGAAACTTG
+TGGCAAGACATCAAGCTGCTCAATTACTTGCTTTACTTTGTCATTAAGTAAAGCCGCCTC
+ATACAACGATTCGGCATAACTTTGAAAAGCAAACGTGGAACTTAGCAAATGATTTTGCTT
+AGCCCCACTAGTCTTTTCTAAGATGATGAATCGTGCAGGTTCATCTTTTTGATGTTCAAA
+AAAAGACGGCACATCTAAGTGCTCGTCTAAATATTTTTTGATAATTACTTCAATCAATCA
+TCGCACCGCCTTCAACAGTGTGTTATTTTTTGAGTTATCTTTCTTGGCCTTTATGGTTTT
+AGTACTGACCATAGCATTAGCCCTATTTTTCCCAACATGGATATCTTGGACATAACCATC
+ACCACAACGTTCTCTGATGGCTGTGGCCTTAGTGGTTAATACCTGCTGCATTTCTGATGA
+TTTCATCAATTCGGCAACACCAGCTCTATTAAGCTTGAATTTAAACTTACTCATATCTTT
+CCACCATAACTTTCTTATTCCAGTCTAGTGGTATAAGCTCTTCAATACCTTCTAGTGGAA
+TTCCTACTGTGCGCCATTTTTTGCCGAAAAATCTAACTTCCTTATTTTCCCAATCGTGTT
+CGTCTCCTTTTGGTATAGCCAAGACATATTCAACCTTTTTTCCGGTCAAAGATAACTGAT
+TAGTGATATCTTCGGTAGTTGCTGGTGCAACAAGCACATTCTCAATTTTGATATCAAAAT
+CAACTGTTACAGGATTTCCAAAAGGGTCTTTTCCGCTAATCGACTTATCGGCTAAAGCAA
+CTGTTATCCCTTTCAATTTCGCCATAAAGTTCAATTCCTCCATATCGTTGTTTTTTTAGT
+CCAAGACGCTTCAACTCACTGTCCTTAATAAAAAGACCGCCGCCTGGAACTAAATAAGTG
+CCTGACCATGTGTATCCTAAAGCTGATTGGCTCTCTTGGGCCATTGGTTCGCCTCGAGTA
+GATGTCATCAGCGTTCTCGCTACAATGTCAACCGTAACCGATTTAATAACATTAACAAAA
+TAAGGCTTATCAACCATCGTTTTATCTAAGTCTTTGCCAACTTTGTCAGCTTCCATTCTT
+AATGTATCTGATACGACTTTCAAGAGTGCATTTGCACGTTTCAATTCGTCAACAGATAAG
+GGACGCCATAACAAAATGACGTCATCTGTTGTTGCGAAATTGCCCACTTTTACCTCCTAA
+CCAGGCAAGAGTGCCTCTAATTCAGGTTTCTTAGCTTTAGAGCTATATTTTATCCCAGCA
+GCATCTAACTGACGTTTAATTTCTGCTACTGTTTTTGCTTTTTCGCCTGTCTGCTGTTCA
+ACCAAAGTCCAATCTCCACCACAAACAGGGACGGAGCTATAAAAACTAGCTCCAGTCTTA
+CTGTTAACGTATAACATTATACTTCTCCTTTAGTGACACGAGCAAAGCTCTTAGCGTCCA
+AAATACCCCAGCCGATATACGCCTCAGCACGTAAGTAAATTTGGTTATACCCTTTAAGGT
+CTTTCCCCGAATTATCAGGATCACCGTATTTAATGATTTCCATTGGAATTTGTTTTGCAT
+AACCCCACTTAAACATGCTTTCAAAATCGCCAATAATTACTAAATCTTTGGATTCTGCTT
+CATCAGCTCCAGCACCAACAGTAGTATTGACGGACGATTTCAAGCCATTGATGCTATCTG
+GATTCGCTCCCCAAGCAAGTTCAGGGTACATTTTAGGCCCCATCTCCCCATTGGTAACTT
+TCGCCAGTGCTGTTGAAAACTCTGTATCCATCGCAAGCCCTGTCACTACACCTTCAGACC
+CCTGAATTAGATTAACAGCTGCTTCGATATTTGCATCAGCGTCTTCGCTCTCTGTAAATT
+TAACCACTTGCGTCACTTTACTATCAAAGTGATTCGTGCCGATAACGTCAGACGCTTTTT
+TTGTACGTGGATTGATACCATGCATCGCCATTAGGTCAATACCACGAGCGAGTTTTTTCG
+CAAACCCTTCGTTAAAAGCTTTCAAAATATCAATCTTTTCCTCTTCTGTTGCATATAAAA
+ATTCATCAGAAAGACGAGCACCATACTCAACCTTGATTGGTACGATAGTAACAGGCTCTA
+GCGATAAGCCACCGTGTGTTTTTTTACCGTTTTCAGCAACCACATCAATATCAGAATCTA
+ATGTAAACGTAAATTCTTTAGATCCGTTAAACGGAATAGGTTTTTGGCTAGATAGTTTAG
+CTAGTGAGCTATGCCCCTTAACTTTATTGATAAGATCTGATACTAAATGTTTGTCAAATA
+AGCTCGCTTTTGATGTTTCTGTTCCCATATTTTTTCTCCTTTAATTAATCTTCTAATCTT
+CTGTACTTAATCCTTGCACTAACGCTCTGTAATTTGCGTCTGCATTACTATCGATATTTG
+GTTCGTTTGATTTTGCTGGCGGTTGTGGTTGGGATGGCTTAATAAAGGATGCTAAGCGTT
+CTGCATCTACTTTGAGTCCATCTTCATCATCTCCTTGCAAACGATCAGCTAAATCAATCG
+GTAAGCCATACTGTAACGCTACCTTTGTCCGTAAATTTGCCGTCTCATAATCGGCAATTT
+GATTCTTCAGGGTGCTAATCTCTTCCGTATAGCTATCAGTGTTTGATTTAGCATCATTCA
+AAGCAGTTTGTAAGCTGCTGTTTTCGGTTTCTAGTTCTTCAACACGAGTTTTCAGTTGGT
+CGTAATCTTGATATTTCTCACGTTCTCGAGCAATGCGAGCTTTCACAATCGTGTCCAACT
+CTTCTTGTGTTTCAATAACTTTAAATTCTGACATATTAACGTCCTTTCTCCTGCTTTCCC
+GGCAGTTCGGTAGATTTTTTAGCAGTAAAAAAACACCCTTTCGGATGTCGTTTTTTAACA
+GCTGGTTCTTTGCTTTCTTTTTGGCTTCGTTGTGTAACAAATCCAGTGCGCAAGCAATGC
+ACTGTCCATTAAGCTAATGTCTCTATCATCATAAAGCGATTTATACCCAAAACCACCATT
+AGAGCCAATTTGCCTCTTTTCACAGTTTGTGACTACTGCTGTCAAAGATGGCTGATCACT
+ATGACAAATGGTTTCCTGCATGATCCCCTGCTCCCACATCATGTTAGCTGTGATAATTTC
+AGCAACTTTAGGCAATTCTGGTTTCTTTAGACCTTGATCTTTCATCTCCTGAGCAAGTAA
+TTCTTGACCACTTGCACCATCAATGACAACCTTAGCGATATCAGCCGATTTCAAAAAATT
+AATAATCCATTGAGTTCCATTTCTGACCGATAAACAGTCAATAGTCTCAACAAATACCTT
+ATTTTCTGATGTTCTTGCTGCAATTGATAGTGATACGTTGTTGCCATCTTGACCAAACTT
+GATACCGACAAAAAGCTTGCTTTTGAGTTCTGGCACTTGCTCAACTTTGAGTTTTGCCCA
+TTCTTTTTCGGATATAACTGATTTTTGGTTAAAGGATGGCCAATAACCTAAGCGTTGGAT
+GTTGTGATCAATCTCATCTTCACCTAATTCAGCTTCGATTTTCCTCTCGTTGAGGTGGAA
+TCCCATAGATGGGTTGGAAATATACCAGGAAGATACATCGTTAATCTTAACCATCTCAGG
+AACTGACCATTCAGCCCAACCAGAATAACGCTTATTGCCTTTTAAGCAATCTTTCCGATA
+TGCTTCAAATACTGTACCAGTAGATACCATCGTTGGCGGCGTTCCACACATAATAGTCAT
+TGGATTATCACTATCAGTAACTGTGTACTTCAATGCTGATTCTTGCTCAGATGTGTATTC
+TTGTGCCTCGTCAATGATAAGTAAGTCAAATCCCTCACCAAGTCCACCGTTTGATGTCCT
+AGTTCGGAACTGGATAACAGCGCCGCTGGCTTTGAACTCTATACGCTCTTGACCCTTGGC
+TTTATTTGATATAAAGTCTTCTCCATCAACATAACCTGACATCTCAAGGTATTTTTTTAC
+CTTTTCGAATGATGCATGAGATGTGCTAATTCGATGAGCTGTATGCAAGATTTTTAAACC
+TTTATGCAAAGCCCACAGCTCAACAATATAGACTACTTCCGTCTTACCGTTACGCCGTGG
+GATAGCATACCCATACTTTTGATGAACCCACAGACCATTTTCATCTATGGCCATAATTGG
+GATAAGCATATTTACTTGCCATGGATAGCAGCTTAGCCCTGTTTTTTTGTAGTAATTAAT
+AGCTTCATGCGCTAGAGATTTAGCAAAATGTAAATTTACCGATTGAGTAGGTCGCTGATT
+GCCAAGCTTTGTTTTCGTCTTAGTAACCATACTTATTCCTTTCAATCGTACTGCCTAGTT
+TTTAGCCATGCGACAGGGCACAATAAAAAGCCGTATTGCTACGACTTTGATTTCTAAAGG
+GGTCGAATTCGTTTAAAATTTATTTTCCCCATTTTCGCTTGTAATTTTTCTTAATATAGT
+TAACGTCAATTGCAATATCTGCAATAGCTGATTGGTTATCTAAAGTAGCAGCTTTAACAG
+ACGCAAACTCTTCGTTTGTTGCCAGAGCGTTTCGTTGAACGATTGATTTTAGCTCCATGA
+TTTCTTTGTTTTGATTTTTAATTGCTTCTGCTTGCATAGCATTTTCCGCAACCAGCATCA
+CAATAGCCCGTTCGAGTTTACGTTTCTTTTTGATTCGCTTATTCATCGCCTTCTCCTTTA
+TTTAACTTTGTTGCACACGACATTTTAGGGACAAAATTTTCCGCAGCTTCTAAGGCTTTT
+TCGTAAGCTTCTTTTGTTTCATTGACTTTATTCATGATTTGTTGAAATTCGTCTTTGTTT
+TCCCAAGTCATTTCGACATTTAATGATATTTTATTCATATTTTTCTCCTTTTTGGGCATA
+AGAAAAGCACCAGATTGCTCTAGGTGCTTAATATATTGCGTTTTCTGGATCTGGACCAAT
+CGCCACCCCGCTATTAATAGCTTTGTTTAATTCCAGTGTTGCATCTGGTAGAACCTTTTT
+CCACTCATCAAAGTAAACGTCTGGCTCCCAAAAAAATACTCTATCAAGCGAGTCTTCTCC
+AAACTTTTCAAGATATTGTTTTTCAGCGTCGTCATATTTTTGACGCAGTTGCCGATGTAA
+TTTTGGTTCCATATTTATCACACTTTCACAAATAATCCAATAATAAAATTCAAAAATTCA
+GGGTCGTCATTGATTGTCTTGTAGTCATATTTCCATGTTTTTTTGTCAAAGGACTTAGCA
+AATCGTTCTTCAGGAACAAAAATACCTTGTAATCCCATAGTGAAAACTTCAGCTGCATCG
+CTGTAGTATTTACCAATATATGGTGATATAAAGTCATCTTTCTTAGTAACTTCCCCAATA
+CCATAATTTGAACTTGGAAAAATATCTTTCAAGCGAACCTCAGCTTCATTAGCAGTTCTT
+TTATCTACCCAGGCTTTCTCTAATCTTACTAAATCAGGATTAACCAGTTCAATCATATGT
+CCTATCTCATGGTAAGGTGTTGTTTTTCTTGTTCCATTTGTAGCAATAACTAAATCTTCA
+TCATATCCATCGAAGTAACCGCGCTTCCTTTTTATAGCTTTTAGTTTTTTACCAATACCG
+TCCGGAACAGCTGCCCACTCAGTTGGATAATTTTGAAAAGCCTCTTGTAGCTGGTCTTTA
+ACAAGTTTAGATGAACCTTTTGCCCAAGTATTTTTAGGTATTTCTCCACCGATTTCACGA
+AAATTTGAGAAAATTTCTTTTAATTTCTCTTTATCTCCTATATGTTCTGAAACTCTAAAG
+TGATAATTGATACGTTTCCCTATATCAATTATATCACTCGGACCAACCTTTGTCATATCT
+AACTTAGCGATATCATTTTTGATAGATTCTACTAGAGCACTTTCCTTAAATTTTTCAACC
+CTTTCTATAGATTCTTGAGTTTTTTCTTTCTTTCGCCAGATTTTACTCCAAGCACTCTGA
+ACTTTTCCATTCTTCGGGTCATAGTCAAGCGTACATCGACACCGCTGATGTCTTCTCCAT
+ACGTCCTTAGGGACTTTTGGATAACTATAAGTGCCAACAACCTCACGACACCATTCACAA
+CAGTTGCCACTTTCTGTTCTGACAACCTGTGGCGTCATACCTGTTTTATATTGTAAATCC
+GCATTTGCCTTGATGGTATCATCCACAATGGACTGCGAAAAATTAACAATCGGTTCACCA
+AACAGCCATTTTACATCATCAAATGTATTCTCGCTATCCAAACGATTTACCATCCCGTTA
+ATCTTGTCTCGATTTAGCGGTGGACGTTGCACCTTTAGACCAATCTGAGCATTCTCATTT
+AAAATCCGCTGAACATCACCAGCATAACCTGAAATCAATTTGTAATTCCGTCCCATAGTC
+TCATCTAAGAGACGCTTAGCGATATTGTAATACATTTTACCGTCTGGTAATTTATCCGAG
+CTAACAGAACCTGTCAGAGCCAAAGATAAAAGTCTTCCGACTTCAATAGCAAACTCATTG
+ACTGTTTTATAGGTCACTTTTTTAGCTTGCAATTCTGCAAAAGCCTTGGTTACAACATCA
+CTTTCGCCAAAATACTTTTCAAAATCTTGTCGAACAGATTTTAGTAGCTTAGGTAAGACA
+TCATCAACCATCAGTTGTTACCTCCGTGATAGCAGGTATAGGTTTATCAGCCCCTTTTAC
+TCCCGTTAAATCACGGATAACATCTGCATCCATGAAACCAGGGATAGCTTGATTAAGTTT
+GATAGCTCCATCCCCTACTAAAGTTAGCATATTTGCATCAGCTTCAAAGAGAGGCTCCCA
+TTTAATTACTGTATCCATGAATTGATTACGAAGATAAGGAAATTCATCTCTTAAACAAAC
+AGCAATATACGCCACATTTAGAAATCCAGAAGAAAAAGAACGTTGAGCTTTGCGTCCTGC
+TGCTCTCAAATTCTCATGTGCCGCTTTTATTGACTCAACAGACGATGGGTTGTCAGATGG
+AAAACCAAGGTCATCAAGAGTGAGACCGGAACCACCAGCAAATAGCGAAGCATACATTTT
+CAAGTGTTCCATGAAAGGGGCCATGCTTGCTGTTGTGAATTGCCCAACTGTTGGCTTGTC
+GCCATCCTCGTCTTTTGAGATTTCGAGTAACGTTGACACCGTAGCACGCCACTTTTCCAT
+CGGTTCAGCGTCTGGATCCATTCCCAAAACATATTTTTGTGGGAATGAGTAAAACTCAGC
+CGTAACCTCTGCTCTCTCAAGCGTTCTCTTCGCTGCCTTTTGATGATACATTCCAGCCTT
+GGTAATGCGACTGCGACCAAATGGTCTAACTGCGTCTGGTCTGTGAATGATAGGTACAAG
+CAAGGGGTGACCTGTTGGATTTTTAATATTATATGGTTTCCCTTTTTTTGGATAATACCA
+GATGTCTTTGTCTGTGAAATAGGCCTCTAACGTAGGATTACCGTTTGAGTCAGACTCTAA
+AATTGCATAACCCTCTGTTAATAAAAATGTAGTTGGGTCAAGTATCCCCGTCGCTTTACT
+AGCTTCGATAACTTGCATTTTAGGTAAGCCGTCTTCCGCTCCTGGCATGATGTACACAAA
+GCAACAAGATGCAATTAATGCTGACTGTATGGCTGTATCAAAAAAGATATCAGGGTTATT
+CGCTTTAAAAATTTCCCAAGCATTAAAATCATCGTTGGTAAACTCCCTGAAAATAATACG
+GTCCGCAAGGCTATCAACCCCTTTAGCGGTCCATTCTAACACAGACCTGTACATTTCACG
+CACATTATTTGGCATGACAATACTTCGTGTGTCGTCTCTGTCATCCATGGCATAATAACG
+ATATCTTTTATCAACTCCAGTTTTAAAAAGAGCTAACTTCCTACGAAGATAGCCCATACC
+CATATAATTCATTTCTGCTCCTTTATTTTTTGCATGACTAAATCTACAAAGTTTTCTTCA
+TGTACATCTATTCCTTCAATAAGTGTTATTCCAGTAAAACCAAATTCAGATTCATTTGCC
+AAAATTTCCTTTTTTAGTTTTTTATAGTGCTGCGCTAAATTACGTATTTTTTTAGGCTTT
+TCTGTCACATCTGTGTTAGGATTTAGGACTTTCTTTTTTTCTTTCCTCTGTTCAGCCCGT
+TTTTGTTTCATCAATTTACGTTGTTTCTCACGATTGCCTTTCTTACGGCATTCTTCAGAG
+CAATATAAAGTTCTATTGGTTTTTGCTTGGAAGTTTTTTTTGCAAATTAAGCATTTCTTT
+TTCAATGAAATTCAACCTCCAAAATTTTCTAAATCCTAACGTGAGAAAAAATGTACAGTG
+ACGGCGTGAAGCTCGGCCGACCGACCGGGTAGGGAGATACCCCCCATTTCGCTTCTAAGA
+GCTTTTAGTATAAATCAATATATTTGCCTAAAATCACTTTTTAAATGCAAAAGATGACCA
+GTCTCGACTTTGAGGAAGGTTTCTGTTGCCAATTGTCTTTGGCTCGTTGCTTGCTTGGTT
+AGCAAACAACTTATCAGACTTCTGCCTGTTGCACTGCCAGTGAGTTAACTGTAAGTTCTC
+AAGCGCTGATGGATGACCACCTTTTGCGATAGGAACTATATGATCTATTGCTGCGCTTAA
+TGGATGTGGATACTTAAGAGACTTGTCCACTGGCTTGCCACAGATACCACAGACAGTGGC
+TGCCTTTAGTAACTTCTTTTTATTTCTGTCAAATGCTACCCGGTGGGTACCTTTTTTATC
+TGCCCTTAACTGAGACATGGATGGGCCTTTCTAAATTTAAAAGAGGGGGGTATTTTCTTA
+CCTGTCCCTCATTTCTTGATAATACTATATTATCACTTTAAAACTGTCATGCACTGTTAT
+TCACTGTCAATCGCTGTCATTTACTGTCAAATTATTTAATTCCTTAGTTGCAACTCTTAA
+CAGTCTGAAATAGGTGCTTTCGCTGCAATTTAGCTCATCAATCACTTGCCATCTAGTCAT
+CTTATCAATATAGACCATGCTCAAAATCGTTTGACTGTCTGTATTTTCAAGGCTATCAAT
+CAGGTTTTGAAGCTCTCTTTGTTTTCTTATAGCTTCAGCAGTCTTCTTTTCAATATCTTT
+GGCAGTTGCAATCAACTCTACGTAAACATCATCTTGCTTACGTTTTATACCACCATTCAC
+CTTATCAGACGACCATTTAGGGCTAGAAAGCAACGAAGCCTCAATCTTATCTCGACGTCT
+GATTAAACTAGCGATATATAAATCTAAATTGCGTAAGTCTTTTAAAATTGCCTTAGCTTT
+GCTCACTAACTAGCTCCTTTTTGATATAATAGATTTGTCAAATTATTAACTAAGGAGTCA
+GCTGTGAGCTGGCTTTTTTGTGGAGAAAAGCCCTCTCTTCCTTTTTTTTATTTTGACACA
+GGCGCAGGATGTCAGTATTAGCGCCTTAAATAATAGCCAGTGACCGATAACCAGCGTTAG
+ATTTTGTTTTGGTGTAAGGAGGTTCTCGTTTCTATTTTTTAATTTCGGTCAATACCAACC
+GCACGAGTCGAACGTGCGTGATACCGTTATTGGTTATATCCATTCAATTAGTGGATTTTC
+AATGTGTTCTATCCCATCACCAATCCACTCTTTGACATTAAATTCTCGCTCAATATCTTG
+AGTCCTTGGCATAACGTTAATATCACTAAAACTCAGCATGTCGTCTTTTGTATTTTGCAA
+AAAATAAATGTTTTTAACTTGTCTTGTTAAAGAGTCGCCATGCACCACCACACCATTTAT
+CCCTCTTATAGACATATTAAAGAGTAGAAACGGTACTGCTTTGTCCGATAACTCTTCTAC
+GTGATACCAGTATTTACTCGGACGATAAGTAAATGGACTGTCATTTAATCGTTGTTCTTG
+CCATGCTTGGATAAGTATCCCACCCGTCCCGACTGCTACCTCGTAGTATTGATTACCACT
+TATTATTTTAGATAATAGTGTACTAACCGATTTAGGAGTAAAGTCTTGCTTTTTATTTTT
+GCGGTCAGCTTGTTCTTCCTCAAAATATTGCATAAACCAGTCGTAAGATACATCTGTTTC
+ATATTTCAAAAACTGTCTAAATATATCCTCACGACTATCTTTATCAAAGAGTATGTCCGT
+AAGTCGTTTGGGTGCTTTATAAACTTCGTCGATGCCTAGTATGCGATGTATCTCATCGAT
+CTTAATCATGTTACCCTCCGTTATTCGTTAAATCAGCAATCCGCTTTGTCTGTCTCTGAT
+TTTGCTCACTCGCACGTTTAAGCTGCTTTTGTGTCCTGCTTAGCTGTGTACGTAGTCCGT
+ATATTTGCGGTTCATAATAGCTTTTAAGCGATACGCAAAGCCCTGATACGACAATCAGCA
+TAACTGTTAGTGCAGCGATAATGATGCTTTTCTTTTTGATTGCTTTGTCTTTTTTTACTA
+ACTCATAAAGCAAGCAATCAATCATCTGTTCTTCAGTCATCCGTTTACCCCTTCATGTAG
+TACTCGTTTACGCGCTTGCCGCTAGCTAACTCTAGCTGTCTAATAAACCGCATCGCTTCG
+TTTTTAGTAGTAGTCATGTGTCTCCAATTCATCAAGATAGCCTTGATTGACATAGTATGA
+GCCAATCAAAATAGCGTCTGCTTCGTCGTCTTTGACCGATTTATTAAATTCTTGCTCCAC
+TTTTATTTTTGACTGTAATTTCATGGACTTCTTGCTTCGGTCTTTGTAGCTAAACTTCCA
+ATACTTACGCCACGTTGATACATTGATAAACACGACGTTATCAGCTATTAATCTTCCTAA
+GATAATTCCTGTAACAATACCGATTTTAAGCATGGATTGCTGGTTAGGTCCCATAACCGA
+GTTTTTTTCGACTGCGATTGTACTAAAATAGCAATCGTATTTTTTTAATGCTCGTGACTG
+GATTAGCCTTAATTGACTAGCCATATAGCGGCCGCGCTCAAAGTAGGATTTACTCTTATG
+TTTTAAGACACCACTCTGGATAAGATCTGAGCCTTTAAATAAGGCCCACCCTGTTCCAGA
+TGTTGAGATGTCTAACGATAAAACTAGATTGCTCATTCAAGCACCCCGCGAATGCCAAGG
+GTTTCAAAGATATTTCTCTTGTTATCTTCGATAAACGAGAATACTTTTATGATTTCGTCT
+GCGTCTTTCTTATACTCTTTAGCAAAATATGATGATGTTAGATTGATTTTAGTTTTGGGT
+TTAGCTTCAAGAATGAGGTCGTAGGCTGTTTCGAATAACTCTCCATCTTCATCAAGTGAC
+GGTTCGTCGTCAATCTTTTTAAAATCACTAATAAAATCCCATTGCATAGTCAAACTGCCA
+GAGATGGCAAAGATTCGGTTTACTCTATCTAAAATTAGTGCTGTTCCTGTTCCTGTAATT
+TTGATTTGTTCCATATTTTTCACCTTTTTAAAATCCACACTCGCCCTAAAATTGTGTGTG
+AGCATTGGCAAGGACGAGTGTAGCAATTCTTCATATCATCAATCCTGTTGACTTGACGAT
+ATTCCAACTTTCCTTTCTCGCTCGGAAAATTTAAACTTGCAAAGGCCAAGCTTCACTTTG
+CAATAGGTTATTAAAAAATCTCTACCCTTACAGACAATTTATTTTGTCTGCAATATTCGC
+ATTTTCCACAAGGCTTAGGCTTTTCTATGCCTTTTTTAACGTCATCTAATCGCTTAATGC
+TTTGTGCTAGGCTATCTAACTCTATCTGCATAGCATCTACATTTTGGATCCTGATGGCTC
+TTGTATCTGGTGGTGTCTCTTTAGTAACTGCGTAAATAATCGGTTCAAACGGCTTATTGT
+ATTTAGCTTCTAGCATGGTTTTGTAAGCAGCCATCTGCAAAATATATCCATAAGCTTCAA
+ACCATCTGACACGCTCTTCTCTATTCCAGATTGTGTCGTCAATCGGCCCTTTTGTTGTTT
+TGATGTCTACAAAATAGCCACGTTCAACATTCAAGCAGTCGATTTTACCCTTGAATTCAA
+CCTCGCCAAGAAATCCTGTGATTGCTGCTTCTTTTTCTCCTTGGTATATGGCCATGAAGT
+TACTGTCATTTTTAAGTGCTTCAATCATCTGTTCTGCGACTAAATAGTCTTTTTTGAGCT
+GACCTTTAGTTGTTCCTCTGGTCGAAATCATTTCAGAGCCGTTTTGGGCTTTGAATTCTT
+CATGAGCTTCTTTACTCTCAAAGTAAGAGTGGACATAGTTCCCGACGAGCAGCGCAGTGT
+TATCTCTGGTATCTGTCCAATTCCCTTGTAATTCAGCAAGCCCCCTCGCTTCGCACTCTC
+TAAAACGCTTGTACTGACTAATAGACCAGTATCTGATAGCTGATTCACGACTATAATAAT
+CCTTTCCGAGTAAATCTAAACTAGTCATCTAGCAACCTCTTAATTACTTCATCAATAGGT
+GTATCGCAAAAGACAAACTCTTCTCTTTCCCTATCTCCAACGAATTGAACAACCACTACT
+TTTTCATCTAAATTGTCAAAATTTAAAGCAGATCTTTCCCAAACGCCAACAACATATTCT
+GGATTAATATAATATCCTTCGATTTTTACAAGTTTAATCATATTAAGTCTCCGAGGTTAT
+CAAATAAGTTGCCTTCGCTAGCTTTAATTTCCCCTGTTTCTTGGTCAAAATCAGGAATCT
+CATCTGCTGGATAAGAGGTGTCTTCTAAAACCGTCTTATTTTCGTCTGTGAGCGTTTTTT
+CTGGTTCTGAATGTAAATCTTTAATTACATCTTTTAAATTGCTAGGAGCGTCCTTTTTTT
+CGTTCTGCGTGCCGATTAAGTCATCAAGGCTGTTTGTTTCTTGTGGTGTGACATCTTTTG
+GAATGACAATCGTTGAATCTGCGTTATCCGCTTCTAGAGCATCCTGCATTTCAACAGAAA
+GAGGGGCATACTTGCTCAGTAATTCCTTGAGTAATGTCTTGATAGCCATTGGATCAAATT
+CTGTCGCCCAAGGCGTTCCTGGTTTAAAATCTCCTGTTTTCTTATCAAAAGTTTTAGAAT
+ACTTTTTGGCATGTTCGTACACTTTTTCTTTCGGCCAGAAAATCATCTTGTAAAAGCCGC
+TGATTAGTTCTAAACTTGCAAAGTAGCCTTTTACAACACCAGAGTCAACGTAGTCGCCCG
+TTAGCTTCAACTGCCCTCTAATCTTGTCATAACCAAGGAATTCCTCTTCGTATATGATTC
+CGTGTTCAATATTTCGGACTTGTCCACTTCTTTGAGCTAGCTGTATAAGTCCTCTATATC
+CGATTTGAAATTGCGCTTCGTTTACTGTGATCCAACGATTTCCATCCTTGTAATTTCGGT
+TGTACGGCACCACGTAAGCAAAACCAAGACTAGGCTCGATTGGTAAATTAAGCACTGCTG
+CTTTCATAGCCGCTCCCATAATTGACTCAGATGTTGCTTTGGCTAGAAGGTTATTATTGC
+TGATGATTGATAATAAGCTAGTTGTAAATTGTTCGGCTCGTGCGCCGACAACCTGCTCAA
+TCCTGTTTTTTACTGCTGGCGATTTAAAAAAGCTGTTGTGGTTGTTTTGTGCTAATTGAT
+TTGTCATTAGATACTACCTCTTAAAATTTCGTCAAACATTCCGTTTACCATACTTTTAAC
+TTTTTGCTCTTTTGTTAACTCTGGAACATCCTCGCCATCAATAAATTTTAGGTCATATGA
+TGCTTCGATAACTACAACATCACACCCAAGCGTTTCTGCCAAATTATCAATTTTTTCTTT
+TTGTATGTTGTAAGCTTCTTCTGGTAAAAATGATGCCAGTTGAATGCTATCTGTAAGTTC
+CACATTATAAGCAAGTACATCTTTTTTGTTTTTGAAACTCTTTAAAAAACTTCCGTCTTC
+AGTGTTTCTTAGCACTACAATTTTTTCTTTGATGTTCATTTCATTTCCTCTTTTTGTGTT
+TTAGTTGCTCTCCCAGTCTTCACTAAATTTAAAATCATTGGATTTGCTCACATAATCCCT
+CGACTGCAGCATGTATATCTGTCTGACCTGCGCCAAGATATGTTATTCCCGCTGCTAAAA
+AGACTTCTCGTGAAGTTAGAACTCCACCGAGATCATCAATTGCCTGATCAAGGTATATGC
+TAAACGTTTCAAGTTCTTGTTTAGCTCTGATTTTTGCTTTTTCTACTTGTTCTGGTGTCA
+TATTTCCTCCTAAATCGCATATTTCTTACGCAATTGCCGCAATAGTGTCACGTACCGTGC
+TTTATCAACTAGTCCAAAATCAAGCAATCTCTCACGCTCTTGATGACTTGCTCGGTACCA
+GATAAGTGTTTCTCTATGTTGTTTTGTCATAACGCATTCTCCTGTTTATATCGCTCTATT
+CTCAACCGGTCTGCTTCTGCTGTTGTCATACCAGTTCCAAAAGCGTATAGGTTTATCCAA
+TTAAAAATTGGCTTAACTCCATTTTTTTCGATTCCTTCGGCGCAGTAACTAGCAAACTTA
+GCAAAAGTCTCTTTACTCGCCGTTTTACCAAAATCTTTTTTGATTTGTTTGTTAAAAAAA
+TTAAAAATCTCCTGATCCATCTTCTATACCGTCCATGCTTCCTAGAGCAAATTCTTCTAA
+ATCTGGTTCTTTGTAGTCTGGATTCGACCAGCTTGGGACGTTTGAGGTAGTTACACTTCG
+TTGTTTTTTACTATCGTCAAACCGTTGCAACCTGTCTCTGACCTTTTCTACTGTCGTATC
+TCCAGATTTATACCAATCAACTAAGATTTTATTGATATACTTCCAACTGATTTTGTTGTT
+TTCTACCGCTTCTCTTAAGGCAAGGTTGACAACTTCAATTGGCATGTTATCTTCGTGAAT
+CCACTTTTGAATATCTTCGATTTCAAATGGCGATATCATCCGTCCAAAAGTTAATTGGAA
+ATTTTCAAAAAGCTTTTTTTCGTCCATAGCTCCTCCTGATGTTGATGATGATGCTTATTA
+TCTGTTAGTATTTATTGTTATTTAGTATTTATTTATAAGTTAGTATTTATTAGTTGGCTA
+ATTTGTTGATTAGCAAATTGCACATTAGCAAATTAGGTATTAGCAATTTTTTCTAGTTCT
+AAGTCCTGTTCTGCCTTCAAAGTATTGAACGCCTCGTCGCTTATTTTTCTGTCAGAACAG
+AATCTATAGGCTTCGGTACCATATCGCCCGCCAAATGATTTTCTATAAGTTCTGATATAC
+TTGGCATTCTCTAACGCTTTCAACTGGCTTCTGATTGCAGATTCGCTATCCTTACAACGT
+CTAGCGAGTTCTTCAGGATAGACTCTCCATTCGTCTGCATTACTCAAAATGGTTAGCAGC
+AGTCCTTTTTCCTTATTGAAAAGTTCTTTGTCCTGAATAAATTCATTGCTAACAGCTGTG
+TAACTACCTGTTAATGTCTTGAAAAATGTACTGCATTAGCTGACAACCCCTCCTCTTGCA
+CGCTTCTTGCTCCATCCTTTGCTGTTTTTTAAAGCTACTTCCCTAAAAATTTTCCGCTTA
+TTCTCTGGCGAATTGTGTTTTTTAATGACTTCGTGTTGCACCCTAGCAATGACCGCTAAG
+ATAACGGTTGTTGCTAACAAAAATAATTCTAATTTGTTCATGTTATACTCCTACTCTTTT
+TTCAAATTTAATATTTTCAAGCATTTCTGGCAGTGTCTCTTTTTTTGTTTTGTAACGATT
+GCGAGATTTCCACTGTACAAACAGTTTGAATCCTTTGTAATCAATGAATACGATTCTATG
+CGTTGGATTTAATACAAACTGTTTAAAGTCTGGATGATCACGCATTTCTGTCGCCCACTG
+CTTTGCAGTAGCAACTGTCAACCCCTCCCATTGTTGAATCAAGTGTTTATAATCACCATG
+AGAAGCTGTTTCATTAACATCAACTGCTCTATAAGTAATTTCTGCTTTTGGCATATTAAT
+ATCCTCTCTCTTGTGTTATAATTAAGTAAATATTTTTTGTTTGGAGTCCGATTCCCGTCG
+GACTTTTTATTATCTAATTAAGTTGGTTCTATTAGTAAAACTCAGGCTTAATGTTTACAT
+TGAATCGAAGTCTATCCTTTGGATGGGCTTCTTTTAGTTTCTTTACTTCCGTGATTGCTT
+CTTCAGATGTTGTGCAATATAGGGTAAATGTTATTTCGTTCATGTGTGTCCTTTCTACTA
+TATGATTTTAAATCATATAGTGTTTAAAATTTTTGTGTTGCTTGCTTGTTTATCCCAAGA
+ATGTCATCGGTAGATACATCGAAAAACAAAGCTAGACTAATAAGATACTCACCTGAAATC
+TTTGTCTGGTCTTTTTCCCAGTTGCTGATAGATGTTTGAGTAACACCTAATTCTTTTGCC
+AATTCACGCTGTGACATCTTATTATGTTTAGCTCTTAATTCTGCAATAGTTACCATAGCT
+GAGTCGCTCCTTTCTTGATGATGATTACATTCTATATGATTTTAAATCTTGCGTCAAGTG
+TTTTATATGATTTATTTTCTGTTTTTTTGAAAAAATCGTAAATCATATAGTTTATTTAAA
+ACTTTTTTCTTATATGGTTGATTTATAATCATGGTTTTGATATAATTTACTTATCAAAAT
+TAAAAAGGAGGTATCCTATGGAGCAATTAGGGGACCGAATAAGAAAGTTGAGAGAAGGGC
+GCAACATGACTCAGACTGAACTTTCAGAAATATTGGGCATGAAAACCTATACTACTGTTT
+CAAAGTGGGAGAAGAATGAAAATTTTCCAAAAGGTAAAGACCTAAAAAAACTAGCAGAGA
+TTTTCAACGTTACCTCTGACTATCTTTTAGGACTCACAGATAGTAAACTTGGGAAAATCA
+CAATACAGAACGAACAACCTGAAATCGTTTCTATATACAACCAACTAGAACAACCTAGAC
+AAGAAAAAGTCCTCAACTTCGCTAACGAACAATTAGAAGAACAAAATAAAACCGTTTCTA
+TATTCGATAAAAAATCTGAGGAGACAGAAGATTATATCACTGACTACGTTGAGGGATTGG
+TTGCCGCTGGTCTTGGGGCATACCAAGAAGACAATTTACACATGAAAGTTAAACTACGTT
+CTGATGATGTCCCCGATGAGTATGATACTATTGCAAAAGTAGCTGGCGATTCAATGGAAC
+CACTTATTCAAGACAACGATTTGCTATTCATCAAGGTATCTAGCCAAGTCGATATGAATG
+ATATAGGGATATTCCAAGTCAATGGTAAAAACTTTGTAAAAAAACTCAAGCGTGATTATG
+ATGGCGCTTGGTACTTGCAAAGTTTAAATAAAAGCTATGAGGAAATCTATCTATCAAAGG
+ATGACGACATCCGCACAATCGGTGAAGTTGTGGATATTTATAGGGAATATTAAAGGAGAC
+TGTTATGGCAAAAGTCATATTCCAAGATAACTTTCTCTTAATGGGAACAAATTATCATGA
+AAAAGAAGCTAATAAAGTTATGGCTGAAATTGGTAAGAAATCACCATACTGGGATAAGGA
+TAAAGATTTTATTTCTGACTACATAAAATCAAACTTCAAGGATATCTACAAGTATTACAG
+GGTCTCAACAAAAGATGTAGAGATTGTCAGAGAACCTCTTAATCGTCACGATCCAAATGC
+CATAAAAGTCATGGTAAACAAAACTTTTGTTGGCTACTTTCCAGCAGACTTAGCTAAACG
+ATTAACCCCTTATGTAAAAAAATCTAGTCATTACCAAATGGAAGCAACCCTTACTGGTCG
+TGGTGGACAATACAAAACACTCAAAAACGATTTAAAGACCGTGGTTACTAAAAAGAAAGA
+TATAACTTATAAGTTACGATTGACTATTTTAAAAGTAGATAGAGTATCAAAAAGTAAAAA
+TGCTGGATTATTAGAGTCGATAGCATCTTGGTTTCTCAACTAACAAAAAAGCCCCACGCT
+CAAATTTGGCGAGGAGAGCGTGAGGCGAATCTAGTATAGTAAAAACCTGCTTCGCAGTAG
+GTCTCTTTACTATACCTATTTTAACAGAAAATGAGGTAAAAAACAAATGTGGATAGAAGA
+AACTGATAACGGTAAATTCAAATTTCGTGAAAATTATAAAGATCCTTACACTGGAACATG
+GAAACCTGTATCCGTTACTATGGAGAAGGATAATTCAAGAGCTTATAAAGCAGCTCGAAA
+AATCCTTGAACAAAAAATAACAGAAAAAATAGCGCAATTAAAGGCCTCTGAGTTACTTTT
+CACGGAACTTTTAGATGAATGGTGGGCGTTTTATAAGAAAGAACTTAAAAGGTCGTCTGT
+AGCTTCTCTGAGAGGTAATATCGAAGAGATAAGGGAAACTTTTGGAATAGGTGTTAAAGT
+AGTGAATATTGATCCTAAATACGTTCAGAATTATCTCGATAACCTAGATTGCTCTAGGAA
+TAAAAAAGAGCGTAATAAGTCTATGCTAAACTTAGCATTTGATTATGCTGTTGGTTTGGA
+TATTATCCAAGATAATCCTGCAAGACGTGCTAAACTCCCAAGGGTAAAGAAAACTCTTGA
+AGACTGGAAAAAGGCTGAAGAAAAATATCTTGAAGAAGATGAAATTAAACCATTATTGAA
+AGAATTGTACAGAAGACCTAGCACTTACCGACTTGGTTTGTTGGCTGAGTTTATCAGTTT
+GAACGGTTGTCGTATCGGTGAAGCTGTCAGCATTGAGCCGTGCAACTACGAATCTAAGTC
+AAGAATATTGCAGTTGCACGGAACATTTGATCATACAGAAGGATATCGTAACGGGGAAAA
+GACAGCACCAAAGACATTAGCTTCTTATCGTGAAACCATCATGACAAGTAGAGAACTTGA
+AATTCTACAAGAGTTAGAATTTATGAACGAACTAGAAAAAAATACAAATCATAGATATAG
+AGATATGGGATACCTTTTTACAACAAAAAACGGTGTTCCAATTCAGACTAACTCATTCAA
+CTTAGCTTTAAAAAAAGCTAATGAAAGATTGGAAGACCCAATTACAAAAAAACTTACTAG
+CCACATCTTCCGTCACACTCTTATTAGCCGTCTAGCAGAGAATAACGTGCCGCTAAAATC
+AATCATGGAACGTGTAGGACATGCAGACGCTAAAACTACTGCCCAAATTTATACTCATGT
+CACAAAGAAAATGAAATCAAGTGTAGCTGATATTATGGAAAACTATTAA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_003450.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_008261.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_008261.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1574 @@
+>NC_008261.1|provirus_1070550_1127691
+ATGAAAAAAAGGGTGTTTTGGGTAAGTATAGTATTTTTAATAATTATAACGGTTTTAGGT
+ATTACAATTAAATTTGATGGTAAGAAAGTTAATTGTAACAGAAAAACAGTTAAAGTAGGA
+TTTTATGAATATTATCCTTATTATTATCTTAATAAAAATTCTATGCCAGATGGCTATTAT
+AATGAAATACTAGAATTAATATGTAATAAGTTAGATTTAAATTATAAGTATGTAGATTGT
+AATGTAACAGATGCTTTAGAAAAGCTTAAATCTGGACAGATAGATTTAGTCTTTGGAATA
+AGTAAGACTCCTGATAGAGAAAAGGAATATGAATTTACTGACCACTATCTAAATAATGAT
+AACTTTGCCATATATACTAATAAGAATATAAAAAATGGTGATTTAAAAGCTTTAAATGGA
+TTAAAAATGGGATTTTTAAAAGGAGAAGAAAATAATGAGTGGATTTTAAGGCTTTTAAAG
+GATAAAGGCATAAATGTGAAACCTATAGATGTTTCTAATTATCCTGAAGATGAGGAATAT
+TTGTATAATAATAAAGTGGACTTTGTAGTAGAAAATACAAGAAGCAATATAAATTATGAA
+AATAAAAATATTAAAAAGATTTTTGAATTTTCTTCTGGACCAGTTTATATAGTTAGTAGA
+AAAGGTAATGAAAAATTAATTGAAGGAATAGATTCTGTCCTTGGAGAGCTTGAGGAAGAT
+GAGGAACAAAAAGATATTAATTTATATTCTAAGTATTTTGATGAGCATTTAGATAAATTA
+AAAAATGAGAAATTACTAGTTGTAATATTTTTAATTATAATATCATTATTTATTTATAAA
+AAAAGAAAAAATAAAATATTCGCTATAAGAACTAAAAGAAAAATTAGAGACTATATTAAA
+AATGATAAATATATATTATATTATCAACCTATAGTAGATCCAAAGAAAAATAGAGTAAAG
+GGATTTGAATCTCTTTTGAGATTAAATAAGGATGGAAAAATTTTAACTCCCTATAGCTTT
+ATAAAGGAAATTGAAGACAATAATATGTCTTTAGAGGTTTCTTTATGGCTTTTAAAGAAG
+GTTATTTTAGATTACAGAATAATAAAAGATTATGATATGGTTAAAGGAAGAGATTTTTAT
+ATATCCTTAAATGTTTCATTTAAAGAAATAGAAAATCCTAAGTTTTTAAGATCCTTAATG
+AAAATTGCAAAAGATTATAAGATTGATGATTGTAATATTTGTTTAGAGATAGTAGAAAAG
+TTTGGTATGGAGGATATAGGAAGAATACAAAGTGCAATAAGAATAATAAAGGAATATGGA
+TTTTTAATAGCTATAGACGATTTTGGAGTGGAATATTCTAATTTAGATTTATTAAATAAA
+ATTGATTCTGATATAGTGAAGCTAGACAAGTACTTTGCTGATAATTTAGACAAGTCTATT
+ATAAATGAAAAAACAGTGGAATTTATATCAGAAATATGTATCATAGCTAATAGAACTATA
+GTATTTGAAGGGATAGAGGAACAGTATCAGGTTGACATTGTTAAGGCATTTCCATATGAA
+AAAATATATATTCAGGGATATTTCTATTCAAAGCCAGTAGATATTGAGAATTTAAAGGAT
+TTTAAATTTAAGGATAGTTAATTTTCAAAGGATAGAAATAGTAAGAATTAATGAGAAGGA
+TTTATAATATAATAAGGTGGTTATAATTAGGAGGTACAAAAAATGAAAGTATTATTAGTT
+AATGGAAGTCCCAATAAAGAGGGATGTACTTATACAGCATTAAAGGAAGTAAGTAAAACT
+CTAGAGGAAAATGGAATAGATACTGAAATATTTCAAGTAGGGAATAAGCCTATAGGTGGA
+TGCATAGGATGTGGTTCTTGTAAAAAAACAGGGGAATGTTTTATGAAGGATGGTGTAAAT
+GAATTTGTAGAAAAAGCTAAGGATGTAGATGGATTTGTATTTGGTTCACCAGTTTATTAT
+GCAGCAGCTTCAGGTTCAATAACTTCATTTTTAGATAGAGCATTTTATTCTGGGGGTAAA
+CATATGGCATTTAAGCCAGGGGCAGTTATATGTAGCGCAAGACGTGCTGGGACAACCTCT
+ACTTTAGATCAATTAAGTAAGTATCTTACAATATGCAATATGCCAGTTGTAAGTTCACAA
+TACTGGAATATGGTTCATGGAAATACTCCAGAGGAGGTTAAAAAGGACCTAGAAGGTATG
+CAAACAATGAGAGTGCTAGGAAGAAATATGGCATGGCTTATTAAGTGTATAGAATTAGGT
+AAGAATAATAATATTCTTAAACCAGAATTAGAAGAAAGAGAAAGAACTAATTTTATTAGA
+TAATGGGACTATAAAGAGTTATATCATCAAAAGATATAACTCTTTATTTTTTATATAATT
+ATACTTTGGTTGTTTTTTAAAATTTTCATATAAAAATATTTATATATTTTAAAACAAAAC
+AATAAGGGAAATAAATTAATATTATTTTTATTATTTTGTTTTTTTAGTAATAAAAATACA
+TAGTCTTTAATAATGTTTATATAGATTTAAACTTTAAAATTAAAAAATATATTTTATAGG
+AGAGTGATTATGAATAGTGTACGTAAAATAAAGTGTTTATTTCTAATATTCTTAGATATT
+TTATTTATAAATTTAGGGTATTTCATAAGTTTATGTTTTGAATATGGAAAAGAAATGAAA
+ATAGAGTATTTTTTTAATATTAGAAATTTAATTATATTAGCAATTTTTACGAATATATTG
+ATATTTTGCTTTTTTAATCTTTATAAAAATATTTGGCACATGGCAGGGATTAGCGAGTGT
+ATAAGGTGTTTAATAGCGTCTTCAATAAGTTCTATATTATTAATATTATATAAATTTATT
+TTTAATATGGATGTAACAATAGTATTTTTAATTAATAGTAGCATTTTAATTTGTATGTTT
+TCATTACTTACACGTATGTCTATAAGAATTTTTAGGAAAATATATTTTCCTTATAAACTT
+GAATCCAACTTAAGAAAAAATGTTCTTATAGTTGGAGCTGGTCACTGTGGACGTATTGTT
+ATAGATGAGATGAATAAAAATAATAAATTTAATCCTATTGGTATAGTTGATGATGATTTA
+AATAAAAAAGGAACTTTTTTAAATGGTGTGAAGGTACTTGGAAATAGAGATGATATAGAA
+AAAATATGTAAAAGAATAAAAGTAGATATTATTTTAATTGCGATTTCAAATTTATCATCA
+AATGACAAGGATGAAATTATAAAAAGATGTGAAAATACAAAGATAAAAGTAAAAATAATT
+CCAAGTATATATGATTTAATTGATGGAAATGTTAAATTAACTAATATTAGAGACATTGAT
+TTAAGAGATTTATTAGGAAGAGATGAAACTAGATTAGACAAAGAGGAGGTAAATAATTAT
+ATAAAAGAAAAAATTGTTATTGTAACTGGAGGAGGAGGTTCTATTGGTTCAGAACTTTGT
+AGGCAGATAGCAGTGTTTAATCCTAAAAAGCTTATTATATTAGATATTTATGAAAATTAT
+GCTTATGAATTAGAAAATGAATTAAAAAGAAATTTTAAAAATTTAGATTTAGAAGTTATT
+ATAGCTTCTATAAGAGACAAATCTAGATTAAAGAAAATATTTGATAAGTATAAACCAGAT
+TTAATATTTCATGCGGCAGCCCATAAGCATGTACCTTTGATGGAAAATAATCCAGAAGAA
+GCTATAAAAAATAATGTTTTAGGAACTTTAAATGTAGCAGAATGTGCTGATGAATTTAAT
+TTAGAGAAGTTTGTATTTATATCTACTGATAAGGCAGTTAATCCAACTAATATAATGGGG
+GCAACTAAAAGAATTGGTGAGATGATAATACAAGCTATGAATGAAGTTAGTAAAACAGAT
+TTTGTTGCAGTAAGATTTGGAAATGTATTAGGAAGTAATGGTTCAGTTATTCCACTATTT
+ATAGAACAAATAAAAAATGGAGGACCTGTTACTTTAACTCATAAGGATATAACAAGATAT
+TTTATGTTAATTCCAGAAGCAGCACAACTTGTACTTCAGGCAGGAGCTTATGCAAAAGGT
+GGAGAAATTTTTGTTCTTGATATGGGAAAACCAGTAAAAATTTATGATTTAACAGAAAAA
+TTAATAAGATTATCAGGGTTTGAACCGAATAAAGATATACAAATAAAGATTGTGGGACTT
+AGACCAGGAGAAAAGCTTTATGAGGAACTTATTTTAAGTGAAGAAGAGCTTAAAAAGACT
+AAGAATGAAAAAATATTTATATTAAGTCCATTTAAGTTTGATATTAAAGAGATTAAAAAG
+AAAATAGTAGAACTTTTAAATGTAGCTTTAAATGAAGATAAAAAAGCCATTAAAGAGAAG
+CTTAAAGAAATTGTGAAAAATTATAGAGATTTAGAGCAAATAGATTTTATATAAAAGTGT
+ATTAATATATAAACTTTATAAATTAGCTTTTGTCATAATTGTTAATTTTTTATCAATTTA
+AGATGTAATAAAAATAGTTTTAAAATAAAAAAGGAGATAAATCTTAATGAATATACCATT
+TTCACCCCCAGATATTAGAGAAAAAGAAATTAATAATGTAATTGAAGTATTAAAATCAGG
+TTGGATAACTACAGGAAATAAAACCAAAGAATTTGAAAGAAAAATAGCAAAATATTGTGA
+AACTAAAAAAGCTATATGCTTAAATTCAGCAACAGCTGGATTAGAACTTATTTTAAGAGT
+TTTGGATATAGGAGAGGATGATGAGGTAATAACAACAGCATATACTTACACTGCGTCAGC
+AAGTGTAATAAATCATGTTGGAGCTAAAATTGTTTTAGCAGATACTTCAAAAGATACCTA
+TGAAATAGATTATGAAAGATTAGAAAAATTAATAAATGAGAGAACAAAGGCAATAATTTT
+AGTGGATTTGGCAGGAATACCTTGTGATTATGATAAAGTGTTTGAAATTGTAAATTATAA
+AAAGAAAAATTTTAAAGCCAAAGGTATTATTCAAGAATTTTTAGGAAGAATTGCAATTAT
+ATCAGATGCTGCACATTCTTTCGGAGCAATCTATAAAGGAAAAATAAGTGGAAGTATAGC
+AGATTTCACTAGTTTTTCATTTCATGCAGTAAAGAATTTAACAACTGCTGAGGGAGGGGC
+AGTAACTTGGAATATTAAAGATAATGAATTAAATGATATTTTATATAAAAAATTCAGTTT
+ATTTTCTTTGCATGGTCAGACAAAAGATGCTTTATCTAAAACTCAAGTAGGAAATTGGGA
+GTATGACATAGTCTCTTTAGGATATAAATTTAATATGACAGATATAATGGCAGCAATAGG
+GTTAGCACAATTTGAAAGATATGATGAGATACTTAAATATAGGAGAAAAAATATTGAATT
+ATACGATAAATTATTAAATGTTGAAAATATAAAAGTTTTAGATCATTTTAATAATACATT
+AAAATCTAGTGGCCATTTATATTTCATAAATATAAATGGAAAAGATGAAAATTTTAGAAA
+TAATATAATAAAGAAACTTGCAGAAAGAGGGATTTCAACTAATGTACATTATAAGCCTTT
+ACCTATGTTTACAGCATATAAAAAATTAGGATTTAAAATTGAAGATTATAAAAATGCATA
+TAATTTATATAAAAACGAAATAACTCTTCCTCTTAATACTATATTAACAGAAAGTCAAAT
+TGAATATATATGTAATGAGTTAAAAGGAGCTTTAATTTAAATGATATGTTAAATATTGCA
+AAAAGGACGTTTGATTTATTTTTCTCTTTGATAGGAATAATTATTACAATACCTATTTTT
+ATTTTAGTAAGTATTATGATAAAACTTACTTCCAAAGGACCTATTATATTTAAACAAGAG
+AGAGTTGGTAAAAACAAAAAAATATTTTATATATATAAACTTAGAACTATGACAGATTGT
+GATGTTAAAGCTAGTGATAGACAAGTAACTGTTATAAATGATCAAAGGATAACAAGAATA
+GGAAGAATACTTAGAAAATATAAAATAGATGAATTACCTCAATTATATAATGTATTAAAA
+GGGGATATGAGTTTTGTAGGGCCTAGGCCTGAAGTTAAAAAGTATGTAAAGTTTTACGAG
+GAAGAATATGATGAAATATTAAAAATTAAACCAGGTATAACAGATTTAGCTTCAATAGAA
+TATATAGATGAAAATACAATCATATCTAAATATAGTGATCCTGAAAAAGTATATATTGAA
+GAAGTATTGCCTAAAAAACTAATGTTAAATAAAAGGTATATAGAAGAAATGTCTATAAAA
+AATGATATTCTTTTAATTTTAAAAACTATTAAAAAAATAATTAATTGATTATAAATTAAG
+GGGTAAACTTATGTTAGTTTCATTTATTATAATAGCTCATAATGAGGAAAAAAATTTAAA
+AAATTTATTAGAAGATTTAAATGGACAAACTTATCCTAAGAAATTAATTGAAGTGATATT
+AATTGATAGTATATCTAGTGATAATACTAAGAATGTAATGAATGAATTCAGAAATTCAAA
+TAAGGAATTTAATAAAATAATAATAAAAAGCAATGTTAAAAAAATACTACCTTGTGGATG
+GAATATTGCAATATCAGAATCTAAAGGGGATATCCTTTTAAGGGTAGATGCTCATTCTAG
+AATTCCTAAAAATTTTATTGAAGAAAATGTTAATTGTATAAAAAGTGGTGAAAAAATTTG
+TGGTGGATATAGAGAAAATATTATATTAAATAAAAATAATTGGAAAGAGACGTTGTTATT
+AGCTGAAAAATCTATTTTTGGTAGTAGTATTGCACCATATAGAAGAAATATAGGTAAAAG
+GTATGTATCTTCTATATTTCATGGTGCTTATTCTAGAGAAGTTTTTGAGAATACAGGACT
+TTTCAATGAAAATTTAGCTAGAACTGAAGATAATGAAATGAATTATAGAATAAGAAAAAA
+TGGATATAAAATATGTTTTAATCCTAATATAAAATCATATCAATACACTAGAAATAATCT
+TTTAAAAATGTTAGAACAAAAATTTTTAAATGGTTATTGGATAGGACTAACTTTAGGGGT
+ATGTCCTAAATGCATTTCCATATATCATTTAATTCCATTTTTATTTGTGTTAGCCTTAGC
+ATTTACAACCATTAATATATTTTTAAATTCATACGGGCTATTTATAATTTTAGGAATGTT
+ATATAGTTTTTTAATAATAATAAATACTTTATTTATTATTAAAAATAATGAATTTAATAT
+ATTTTATATTTTTTTACCTATTATATTTCTACTATTACATCTAAGTTATGGAATAGGTAC
+ATTTATAGGAATTATAAAATTACCATTTTTTAAGATTAAAGTTTATAAGGGGAGAAAAAT
+AAATGAACAAAATTAGAGTTTTGCATATGGTTTCAACTTTAAGTAATGGAAGTGGAGTAA
+TGGGCTTTATAATGAATGCTTATAGAAATATTGATAGAAATAAAATTCAGTTTGATTTCA
+TTTATTTTGATAATGAAGAGAGAAGTATAACCTATATAGATGAAATATTAAAGCTTGGTG
+GAAAAGTAAATTATATAACAAAACCAAATAATTTAAGGAATATAAATGAATTTAAAAATG
+AATTAAGTGAAATTTTAAAGAAAGAAAATTATAAAATAATTCATTTACATGAAGTATATT
+TAAATAAATTTGTAAATGATGAAGCGAAAAAAGTAGTAGGTGCTAAGGTAATAGCCCATA
+GCCATGCAACAAAATATTCAGATAACAAAATAAAGGCTATTAGAAATAAAATATTATGTT
+TTAATTTAAAGAAGAATGTAGATATATTTTTTGCTTGTTCTAAGGCGGCAGGAAAGTTCT
+TATATGGGAAAAAAGCTTTTTATGATAATAGAGTATTTGTAATTAATAATGCAATTGAAA
+TTGATAAGTTTAAATATAATGAGAATATAAGAAATAAAGTAAGAAAAGAACTTAATTTAG
+AAGAAAAATTTGTTATTGGTAATATAGGAAGATTTGCTAAACAAAAGAATCATAAGTTTT
+TAATTGATATTTTTTATGAGGTTAAAAAGAAAAAAGAAAATGCTTTTTTATTATTAATAG
+GAGAAGGAGACTTAAGAGAAAGTATAGAAAGAAAATTAGAAAAATTAAATCTAAGAAATT
+CTGTTTTATTTTTAAGCTCTAGAAAAGATGTTAATGAAATTTTACAAGGTATGGATGTTT
+TTGTATTACCATCATTATATGAGGGACTTCCGGTATCCGTAATTGAGGCGCAAACTTCAG
+GGTTACCTTGTATTATTTCTAATAAGGTAACTGATGAGGTCAATATAATTGATTGTAAGT
+TTTTAAGTATTACTAATGCGAAAGTATGGTGTAAATATATTTTAAAGTCAGAGGATCACC
+TTAGAGTAGATACTAATGAAAGTATTACAAAAGCAGGATATGATATCAAATATGAAGCTT
+TGAGAATTCAAAACATTTATGAAAAACTTTATGCAGGAAGGGATATTTAAAGTATGTATC
+TTTATTATTTTTTCATAATATATATCTTTTTATGTGCATTAATTATATATAACAAAAAAA
+ACAAATTAAAATTAAGTGAAAAAAATAATATATATTTATTCTTAAATTTTAGCATGTTTA
+TTTTTATTAGTGCTTTTAGGGGAAGAAATATAGGAAATGATACTTGTAAATATTTAGATT
+TATTTAATAAGGTCAGATTTAAAAGTATAACTGAGCTAAAAGATAGGTATGAAATAGGAT
+ATTTATATTTAAATAAGATGCTTTCATTAATATCTGATAACCAGCAAATAATATTAATAG
+TAACCAGCTGTATTATATTAATTTGTTATGCATATTTTATAAAAAAATATTCTGCAAATG
+TTTGGTTGAGTGTATTTCTATTTTTTATATTAGGTTACTTTACATCAAGTATGAATACAA
+TAAGACATCAAATTGCCTTAGGATTAGTATTAATTTCTTATAAATATATAAAAGAAAATA
+AAATTTTTAAATTTTTAATTTTAATTTTAGTTGCATCAACATTTCATAGTACCTCAATTA
+TATTTTTAATTTCATATCCAATATCTAAATTGAAAATTAATTTTAGAAATATTATGATGT
+TTTTTTGGTTTGCTATATTAGGATATGCTCTATTTGATAAGATATTTAGATTTATATTAT
+TAGGAACAAAGTATGAATATTATTTAAAAACTGATTATCTAAATGGTGATGTAAGATTAG
+CGACTGTAGTTAATATATTAATAATAAGTACAGTTTTATTATTTGGAATTATTTCATCAA
+ATAATATAAAAAAGAGTAGAGATTATAATATTATGTGTTTATTTTTGTTTACAAGTCTAT
+CAATAAGTATAATATCACTAAAGTTTAATTTATTGGATAGAGTTGCTGATTATTTTCAAG
+TCTTTATTATAGTATATCTCCCTAATGTTATTAGTAAAATAAGTAATCAAAAGAAAAGGA
+TTATTGCAATATATTTAGTTATTGTTATGTTTTTTTTATATGGAATATCAATACAGTATT
+TAAAACCAGAGTGGAATAAAGTATTTCCATATAGCTTTTTTTGGAATTAGAATTATATAA
+ATATACAAATTTAAAGAGGTATTTAAATGAATATAAAAGAAAATATATTAAGGATATTTT
+CAGCTAACTTTTTAGAAGTTATTTCACGTATAATCATATCTTTTATTATTCCAATTATAT
+TATCTATAACTGAATATTCTAATTTAAAAACATATATGTTATACATTTCATATATAACTG
+TTTTTACATTAGGATTTGAAGAAGGAATGTATATAAAATATGGAGGAAAAGAGTTTAATG
+AAATAAATTTAGAAACATTTAAGTATGAACATAGGTTATATATATTATTACAAATAGTAT
+TTTCAACTATAGTTTTCCTTTTGGGAGTATTTAGTGAAAATTTAATCTTAATTCTTATGG
+CAATAACAATAGTTCCTTATAATATAGTAGTTTTTTTTAAGGCTAATTATAAGGCTTTAG
+GAGAATTTAAAATATACACTAAAATAGTATATTTACAGACAATTTTAGATTTAATATTAA
+ATATATTATTAGTTTTTTTTATAAAAAGTAGTAGTTATATAATGTTTTGTTTAGCTATTA
+TAGTTATTAATTTAGCTGGAGCTTTTTATGTTGAAGGAAATTTTTATAAAAAATTAAAGG
+GTATAAAATGTGTTTATAATAAAAAAATAAAAAATAACTTTAAAGTTGGATTTGTTATAC
+TAATTGCTAATTTATCTATAATGATATTTTACGGTTTAGATCGTTGGTTTATAAAAATAT
+TCTTTACTGAGTATGATTTTGCGTATTATTCATTTGCTATATCTATGCTAAATTTAATAA
+ATATTTTAATAAATTCTATATCAGTAATATTTTATAATTATATAGCTAAAGATGAAAATA
+AAACTATAATAAATAATTTAAAAAGGTATTTATTAATTTTAGGAGCTTTTGCAAGTTTAT
+CTTATTTTGGATTTGCAGCAGTTATTAATATATTTATAAAAAAATATATACCTTCTTTGA
+ATATAATAGCAATATCTTTTTCTGCATATCCTTACATCATAGTAATAAATATAGTAATTG
+TTAACTTATATAAGGCAAGAAAAGAAGAAAGAAAATATTTGAAAGTAGTATTAAAAATGC
+TTGGAATAGCATTTCTATATAATTTAATTACAACAATTCTATTTAAAAATTCAATATTAA
+TAGCGGCATCTACAACAGCTTCATTTATTACGTGGTATTTTTATTCTTTAAAGGATTTTA
+GTTATTTATTTAAAGATAAGAAAGAATTAAAATTTTTAACTATTAATTTAATAGGATTCT
+TGATATCATCCCATTTATTTAATTGGTTTTTAGGAGGAATAATCTACTTAGCAATTATAT
+TATTAACAGTGAAAATATTCTTTAAAAATGAATTCTTAAAAGGAATGGATTATATAAGGA
+ATAATAGATATTTAAATTAAATAAAATTATATCGGGGGAATAAATGAGAAATTTAGGGGA
+ACTTCAAAAAATAAATTTAGAAATGCTTTTAGAAACAAAAAGAATTTGTGAAAAAAATAA
+TATAAAATATTTTTTGATTGGAGGATCTTTAATAGGGGCAGTAAGACATAAAGGGTTCAT
+ACCTTGGGATGATGATTTAGATATAGGAATGCTTAGAGAAGATTATGAAAAATTTTTAAG
+TGTTTGTAAAAATGAATTAAGCAATGATTATTTTTTACAGAATAAAGATACAGATAGCAA
+TTTTGGTTTCTGTTTCACTAAAATGCTTAAGAATAATACTTTGTTAATTGAAAAAGCAAC
+AGTAACCTCAATGTGTAAAAAGGGAATATTTATAGATATAGTACCTTTTGATAATGTACC
+TAATAATTTTTTGCTTAAAATATTACAAGCTTTGAGAATAGACGTACTAAAAAGATTAAT
+TTTATTAAAAACTAATTATGATATATCCATGGGGAGAAGAGGAATAAAAAGAATTATATT
+TGTATTTTTTAAGTGGTTGTGTAAATTTTGGAGTAAAGAGTTTCTTTTCAAAAAAATATT
+TACCTATATAAAAAAATATAATACAAAAGAATCAAAAGAAGTTGTTTATATAAGTGGTGC
+ATATGACTATTTAAAAGTTTGCGTCAATAAAAAATGGGTTGAAGAAACTATATATTTAGA
+TTTTGAAAATGAAAAAATAAGTTGTCCAAAAGGATACCATAATTATCTTAAAAAGGTATA
+TGGAGATTATATGAAGTTTCCATCTAAAAATAAAAGAGGAAATAAGCATAATATTATAAA
+ATTGGAAATAAATTAATTAGGAGAATTTGATTTGAGAGAGGATAATATAGGTATAGAAAG
+ATATATTAATATCTTTAGGAGTAAAGCTAAAGTTATATTTTTAATAATGATGATTTTTGT
+ATTAACATCTACATTAATAAATTTTTGTTTAATAAAACCAAAGTATGAGATAAAGTCTAA
+AATATTTATAGGAAAAGAAGATAAACAAAATAATGGAAATTATGATAATAATGATGTTGA
+AATGTATAGAAGACTTGTAGGAACATATTCAGAAATTATGAAATCGGAAGATTTAATTAT
+TAATGTTATAGAATCAAAAAACTTAAATTTAAATTCAGAAGAGGTTTATAAAAAATTAAA
+GGTAATACCAAGAGATGAGACTCAAATTATTGAAATTTCGTATAGAGATATTGATAAGGA
+ACGGGGGTTAACTTTAATAAATGGTATTATAAATGATTTTACTGAAAAATCAAAAGAATT
+AATTCCAAACGGAAATGTCCAAGTTATAGAAAAAGCAAAACTTCCAACAAAACCAGTTAG
+TCCCAATAAATTTTTAAATATATTTATAGCTTTTATTTTAGGAATAGTCTTTAGTATAGG
+GTTAATTTTAGTTTTAGATTTTTTTGATAATACAATTAAAACTAGAGAAGATATTGAAGA
+TGATATAGGGCTTATACTTATAGGAGATATACCGGAAATAAGAGGAAATGATATTAAAAA
+TTTAAAGGAGGAGCTAAAAGAATAATGTTAATAAATAAAGAAACAAGTTGTTCTACAGCA
+GAAAGCTATAGAAAATTAAGAACTAATATAAAATATTTATTTAAGGATAAAAGTTTAAAA
+AAAGTATTGGTAACAAGTACAGAAAAAGGAGAAGGAAAATCAACTGTATCCTCAAATTTA
+GCTTGTATTTTTGCAAAAGATAGTAAAAAGACTTTAATAATTGATTGTGATTTAAGATCT
+CCTAGTATACATGAAAATTTTGAAGTTTCTAATGAAATAGGGTTTTCAGATGTGATTATA
+GATATTACAAAATTAGAAAAGTCAATAATAAATTATTGTGAATATTTAGATATACTTCCA
+TCAGGAAAAATTCCTAAAAGTCCTTCAGAACTTTTAGGTTCAACCAATATGGATATTTTA
+CTAGAAAAACTTTCGGAGAGTTATGATTTAATAATAATAGATAGTACTCCTTTACTTTCA
+GTAACAGATGCTCAAATTATATCAACTAAAGTAGACGGAACTTTACTTGTAATTAAAGCT
+AATAAAGTATCTAAAAAAAATGTTTTAGTATCAAAATCTATATTAGAGAAATTAAATTCA
+AAAATTTTAGGAGCAGTTTTAAATTGTTCTTATAAAAAATAAAATAGATAGATAATTATA
+TAATATTTATGATAAAATACAATTAAGGAAATGATTACATTAATATATATAATATGGGAT
+TAAAGTGTTTTATTGTTTATTATAATATATTAAGTAGTTTTATTTTAATTTAAGGTTTAT
+TTTAGAAGATTAAGGAGTTTACTATGGAATCAAAGGAAATGAGATTAGCTAAAAAAGCAA
+AAAAACTTATAGATGAGTTTGAAAGGGTTCAATCGGTTCTTCTAAGTGGAGAATTATCTG
+ATCAAGAAGTGGAAATAAGAGATGATGGAGCTACTATTGTTCTTAAAAATATAATGCCAG
+GATATAGTGGAGAAGCTATGTTTAAGTTAACTCACATATCTGATGTGGTTAAAGCTTACA
+TTGATCATATGGATGAAGAAAATGATGAAATGATTAAGAGTTACGAAGTTGAAAATACTA
+ATTGGCATGAAAGTGATTTAGGAGATATTTACAGAGAATCTGCTATGGAACATTTAGAAA
+AAGTTGAAGTAGTAGGAGATAAAGTTAGACATACGTATAAGGAACTTAAAAAGATAGAAG
+AGAAAGCTAGAGAAATAGAAGGACTATAGGATTTAGTTTTTATTTGTAAAGTAAGGTTAT
+ATATTAAATAAACCTTACTTTATTTTATTTATAAATAAAATAACAATATTAATTAAATAC
+ACATTTAGGAGATATATTTTTTTGGATTCTATATAGTAAATAAAAGAATAATGAGAGTTA
+AGTACTTTAAAATAAGGAGAAGATAATTTTGAGGGGAATAGTTTTAGATAAAGGGCAAGA
+ATATTACACAAATTTAAGAAAGGTTTTTAAAGCTTTTAATAACATTCATCTTGAGTATAA
+CTGGCTTATTACAGATTGTTGTGCTTATCCAGAGAATGAAGATATAGAGGAGCTATTATC
+AAGAGAATATTGTTTTATATCTGGAGAAGAACTAAATAGCATAATTAAAAAAGAAGATTT
+TCAATTGATTTGGGGTGTTTTAAGTGGTTTCAATAAGAAAATCACTTTAGAAGAGATTAT
+GAAATATAATTTACCATACGCAGAAGATAATAAAAATATTTGGGAGAATCCAGTTTGCAT
+TCAACATCCTCTTTCAGAGATAGAGATAATTTCATGTGATAGCGATAAAACAGTTTTAAT
+AAGCAAAGATGAAAATTTATTAGGTAGTTTTAAAAGCAATTTTCCCTTAAGTGAAGATTT
+AGAATTTTACAATAGAAAATTAAAAAATAGATTATAAAACTTTAATAAAAAAAGAAATTA
+TTAAAAAATTTATGTTTTTTAGAAAGTAGGAAAATACAATGTTTCATTATGTTTTTAATA
+GTTTAACTAAAATTTTCTTTGAGTTTTTTGAAAAAAGTTAAGAGGTTCAAAGAACTTAGA
+TTATAAGAGACATTAAGAGTATTTCCATAAAAAACAAATAATTAATTGATTATAAACATA
+TAGGTATATGAGTATTTATTATAATACTTTGAACTGATGTATAATGTCAGTATAAATAAA
+AGGGATGTAAAAAAGGATGTGAAAAATATGTTATCTAGTAAGAAAATAGTAGATGATTAT
+ATTAAAAAAATAGACTGGAGAGTCAATGAAAATTCCAATTCACCATATAGTTTTGGGAGT
+CTCAATAAACATATAATAGCTGAGGTTTCTAAAGATTACTGGCTTAATGAAGTTTATAAG
+GATAAAAGAATAATAGATGCTTATAAAAATGGAGATATGCATATTCATGATCTAGGAGGA
+TTAACACTTTATTGTTGTGGATATTCCTTAAGAAACATAATTTTAATGGGAGTACAGGGA
+ATTCCTAATATTCCAACTAGTAGTCCTGCAAAACATTTTGATGCTATATTAAATCAAATA
+GCTAATTTGGTTACAATATATCAAAATGAGATTATGGGAGCCGTTGCTTTTAATTCATTT
+GATACATTATTAGCACCTTATATAAAGAAGGATAATTTAACATATGAAGAGGTTAAACAA
+AATCTACAAAACTTTATATTTAGTATAAATAGTAATAGTAGGGCAGGAGCTGAACCAGCT
+TTCACTAATATTACCTTTGATCTTTTTCCACCAAAAGACTTAGAAAATGACCCTGCTTTA
+ATTGGAGATAAAATTCAAGAGTTCACATATAAGGAATGTCAAAAAGAAATGGATATGTTA
+AATAAGGCATTTTATGAACTTATGAATGAGGGAGATTATAATGGAAGACCATTTTCTTAT
+CCAATACCAACTTATAATATAAACAGTAATTTTGATTTTGATAATCCTAATAATGATATG
+TTATTTGAGATGACAGGGAAGTTTGGGTATCCTTACTTTGCAAACTTTGTTAATTCAGAT
+ATGGATCAAAGTGATGTAAGATCAATGTGTTGTAGACTAAATCTTGATTTAAGAGAGCTT
+AGAAAGAGAAATGGTGGTCTTTTTGGAAGTGGAGATAGTACAGGAAGTATAGGTGTTGTT
+ACAATAAACTTACCAAGATTGGCATATAAACACAAAAATAATGAAAAAGAGTTTTTTAAT
+GCTTTAAAAGAAATATTGATTATAGCAAAAGATAGCTTAGAAAAGAAGAGAAAATGGTTA
+AATGACAATATTATAAATAAAGATATGTTGCCGGCATTTTCAACTTATGTAGGAACCTTG
+AAAAATCATTTCAGCACTATAGGAATAGTTGGATTAAATGAGATGTGTGAAAACTTTAAT
+GGAAATAATATATTAACTGAAGAAGGAATGGAGTTTTCAATAAAGGTTTGTAATTTCATA
+AGAGAAGAATTAATAAACTTTCAAGAAGAAACAGGAAATCTTTATAATTTTGAGGCTACT
+CCAGCTGAATCAACTTGTTATAGATTAGCTAAAAAGGATGTAGAGGACTTTGAGGATATT
+ATAGTTAGAGGGGGAAGAGAATATCCATACTATACAAACTCATGTCATATGCCGCCTAAT
+GAAGTTAAAAACTTAAAGCAATTATTTGATCACCAAGATAAGCTTCAAGTGTTATTCACA
+GGAGGAACTGTGGTGCATATTTATTGTGATGGAGCTATAAGTGGAGAAAAGTCAAAACAC
+ATAGTAAATACAGTTTGTAAGAAATATAGAACACCTTATGTAAGTATTTCTCCTTTAAAT
+AGATACTGTAAAGAGCATGGATATGTAAAGGAAAGGGTAGAAGAGTGTCCTATATGTGGC
+AAAAAGCTAGATTTATATCAAAGAATAACAGGCTACTTAAGAAAAGTTGAATTCTTTAAT
+GATGGTAAAAAATCAGAATTTAAGGATAGAAATCAGTTAAGCCTATGATTATAAAAACAA
+AGGGCATTGTTCATGAGAGAGTAGAGGATGCGCCTTTTATGGGAGCATTAATAAGTGCAG
+TAGATTGTAACTTAAACTGCAAAGGATGCTTTAATCAACATTTAAAGGATTTACCAAACA
+TAGAGATGGATTCAGAAGATATATTAGATAAAGTGACAAATGATCCTTTTAATGAAGGAA
+TTATACTTGCAGGACTTGAATGGTCACTTCAACCTAAGGAGTTAAGGGAAATGGTTAATT
+CGGCAAGGAAGAGAAACCTTAAGGTTATAGTTTATTCTGGACTAAGTGAAGAAGATTTTA
+AGAAAAAGTTCCCTGATATATATGGTTTAAAAGGAGACATGTACTTTAAGTTTGGAAAGT
+ATGATGAAAAATTAAAGGTGAATAATAATATTCAATATGATGTTAAGTTAGCCACATCAA
+ATCAAAAGATATTAAAGAAATAAAGATAAAGAACTGTACCAAGTATTATATAAGTTTTTA
+TACTTTGGTATAGTTCTTTTATTTTGTAAAAATTATTTAGAATAATATTGTTAACTAAAT
+AAAAAAGTTTCATAAATTATATATAAGATTTAAATGATATATATCCCAATAAATATTCAT
+ATAATTTTACTATAGATTATTAATAAAAGGTGAATTTATGAAAGATAGAAAAGCTTCAAA
+GTACCATAGTAGAAGTTCAAGAGTATTTGCACCAGTTCATATTAATTCAAAGGGAGTTAT
+AGACTATAAACTCCCTTTATGTGATTTAATGGATAGTATTCTTAGCAAAAAGAGTTTTAA
+TACAAGTGTAATAACAGAAACATTAGATGGAAATCAATATTATTATGATTATGATTTTGA
+TGGAAAGAATATTATAGTATCTAAAAGTCAGATAATTAATGATTCTCCTGGATTAAAGTT
+AATTGAGAGATATAAAGGGAATTACTTAGAAAAAGAATTATATAATGACTTAGTTGTTTT
+AGTATTATATAAGGATGATAAAAAGGTTACAGACACTATCTCTTACAAAAAAGATTTAGG
+TTTAAATGTTGATATGGTTATAGAGGTAGGGAGTTATTTTTATAGACTACCATTATGTGA
+GTTTATAGACAATATTATAAGGAAAACTCCAGATATTTTAAATTTTATATATTTTGGATT
+TGAAGGTGATATGTATTATATTACTCTTGAGTTTGATGGAAAAGATATAAATTACATAAA
+ATATAGTGTTAATAATTCTAAGCTAGATGAAATTGAAAAAGCTATAGGTAATAGATTGGT
+TAAAGAATTTAGTGGTCATAATAATATTATTCTTAGTTTATATGATGATAATACTCGTGT
+AAAAGATATTGTTGCTTATAGTAGTAAGTTTTTATATTGAATATTATAAGTAAGCAAAGA
+ATTTATGGTGATATTTTAAAAGGATGGGTTATTGAAGAGTATAAAAATAAATGATTATAA
+TTTAAGATTTGAGCATCTTATTTAAAATAATATTTAGAAGAAACTCAGTTATTACTGAGT
+TTTTTATGTATTTTATAAAGAAATCTACTAAAAGATTTTTAGAATATTATAGAAATATAA
+ACTTCTTAATTGTTTTTATTTTTAGTTTTTCCTCTAATGAAATTTTTTAAGCTAGATATA
+ACTAATACTAAAACTACAAAATACATTAATATGTAGTTTAAGGATAATAGATTACCATTT
+CTATCAAAACCGAATCGGTATAATAAAAATGATATTGTTACTAATATGATAAAAATTAAA
+TTAACTTTATTTTGGTATTTTATATTAATCTTTTCGTCTTTCATATAAAAGCTCCTTTTT
+TTAAGATTATTAAATATATTCTTGCATTAATTTTTAAAATTTTCAATTACATGTGTAAAA
+CTGGCAATATTTTATGAATAATTGGGCAAATATAGAGTTTTATAGTGATTAAAAGTATGA
+CATTGCTTACAGCATACCTTTCAAATATGTAAGAATGATATTTCGCTATAAATGGCTAGA
+AATAAAGGATTTATATTGAATCGTCAAAAGTTTCGTCAAAAATAAATTTAAAAAATATTT
+TCTATGATAGAATGTGCTTTATTAAACATATCATTATTGACATGAGAGTATACTTTCATA
+GTTTGTTCTACTGAATGACCTAATATTTTTGCAGCAGTTTTAAAATCAACTCCATTAGCA
+ATTAATTTAGTAGCGTATGTGTGTCTTAATTCATGAAGAGAAATGTTGAAACCATATTCT
+TTTAAAAGTATGTTTACTCTTGAAAGAATAGTGTTTTTACTTTTAAAATTGAAAACTCTA
+TTATCTATATTTATTATAGTTTTATATTTTAATAGTTCTTCAGAAACTGAATTAGAAATG
+GGAATAATTCTAATTGAATTTTTACTTTTAACACTACCTAATCCCCATGAATTATCTTTT
+AGTATTTTCCATTGTTTATTAACACTTATTAGACAATTATTAAAATCTATATCATTCCAT
+GTTAAACCTAGAATTTCACCGATTCTCATACCTGTATTAACAGCTAAATATACTACTAGA
+TAATATTTATTATTTTTAAATTTTAATAATAAATCGTTAATTTCATCATCATTCAGTGCC
+TTTTTCTTAGTTGGTATTGGTTTACCTATTTTTATATATTTACTTGGAACTTCATCTAGT
+ATATTGTATTTAAATTTTGCACATAAAAATATGCTATTTAATATTTTTAAATAATATCTT
+ATTGTATTATTATTAAGATGTTCCTTAGTCATATTATCTATTAATTTTTGTATATCTAAG
+TTAGTTATTTTGCAAAGTTCTTTGTCATTTAAATCTTGAAACCTATGAAGCACTGTTACT
+AAGCCGTCTATTGTCTTAGGTTCTTTGTATAGCTTTTCATGCTCTAGATACATATCTGAA
+AAAGCTTTAAAAGTTATTTTCCCAAAACTATTATTGCTTGTTTTTATATTTTTCTTTAAA
+TCTTGTAGCATCTTTTCAGCAATAGGTTTAGCTTCTTTTTTTGTCTTAAATCCTTGTTTA
+GATTTTTGCCTCCATTTTCCATTGTAATCCTTATAGCTTATTATAAATTGCCATCCTTTA
+TCTTTTTGCCTATAAGTTACGTTATACTCCATATCTAACACCTCTTTTAAAATTAAAATA
+AAATTTTTTGATACGAATATATGTTCTATAAAATCTATAAAATAAACAGTTGAAAATCAA
+CTGGTTAAAACATTTTACATATTCCTAATGATGGAATAAAGTATATTATGTAATTATCAA
+TTTTATACATAACGCCATATTTAGCTCTGTAATAATCAATTGCTTGATCAAAGTATTCTT
+TAGTTACACCTAAAAAATCAGCTATTTCAAAAGCATTTCTACAATTATTTTCAAAAGCGT
+TAATTAATCCAACTAAGCCAACAGCTTTATCAAACCCCCAGCGCCTGGCAACTAATTCTT
+GTTTTTTATTACATATTTCAGTTTGATCAGTAATATCACCTAAATTTTTAATATAGTGTC
+CAAGTTCTTCAGCTAAAATACATGTTTTTTCTTTGGTATTTATATTACTATTAATAACTA
+TTATATTATCAACGCATTTTCCGCAAGGTTTATCTGTGCCAAGATCAATTTCAATGACCT
+TAGCACCATGACATTCGGCTTCATACATTAATCTTTCGTATTTAGTCATATAAACCCACC
+TAACTTATTTGAGATTTTTTAAAGCTTTATTTATTTTTTCATTCATTAAAGCTTTTTCTT
+CATCAGTTAAATTGTCATCATGACAAGCTACTAAATAAGGAGTTTTTTGATTTTCTATTA
+GAGTAGCAGCAAATTCAGTATCTAAAGAATACTTAGGCATTTCTAATAAATCCTTAGTAT
+ACGAAAAAACTTTATCTTTTCCTAAGTCATTAAGTTTTCTTAAGTCTTCTATATGTATTT
+CTTCATCTTTAGATAAGTTGTTTGAATTTTCGCCAACTTCATCTAAACCTAAAAGCCATA
+TAGGACTTACGTCTAAAGCAGCAGCTATAACTCCTAATTTATCTACAGGCATATTTTTTA
+TTGATCCTGTCTCATATCTTTGTAGAGTAGATTTACTCATATTAGTTTTAGAAGCTAAAT
+CTTGATATGAAAGCTTTAGTTCTAATCTTCTACTTTGTATTCTATTCATTATCATTTGCA
+TGTTTGAGTCATCAAGTAAATTTTTCATTTAATCACCTCATAGTTTAATTATAAAATATT
+TTTTCATAAATGCAACGATTTTTTGAAAAAACTTAAAGAAAAGTTGCATAAATGGGTTGA
+CTACATTTTTCAGAAGTGTTATGATTTAATCATCCTAAATATGCAACGGAGGTGAGAAAA
+TGGTTTATAGCAAATTAAAAGGGATTATGAAAGAAAATGCTTATTCTCAGGGTAAGTTAG
+CAAAAGAATTAAATATAACCACTCAGAGTTTAAATGCTAAGTTAAATGGGAGAAGTCAAT
+TTACCATTAAAGAGGCTATAAATATTATATCTATTTTTAATATAAAAAATCCAAATGATA
+TATTTGAAATTTTTTTTGCAAATAATATCCCAAATATGCAACGAGATATAAGTTAAGGAG
+GAAATAAATGAATAACTTAATGATTTTCAAAAATGAAGATTTATCAATCGATGTAAGAAC
+AATTAAAAATGAAGATGGAAGTATTTCAATTAATGCTGAAGATACTGCTAGAGGGCTTGG
+ATTTATTCAAAATCAAAATAAGAATGGAAAACTTTATATAAGTATAAGATGGGAAACAAT
+CAATAATTATTGTAAGGAATTTAATTTCCCCAACAAGTTGGGGAAAGATGATTTCATTCC
+TGAGAGCTTATTTTATTTATTAGCAATGAAAGCTAATAATGAGGTGGCAAGAAAGTTTCA
+GACTTGGCTAGCTGTGGATGTAATACCTCAGATAAGGAAAAATGGACAATATCAAATGAA
+ACCAACATCTAATTTAGAACTTTTAGAGTTACAAGTTAAAGCGTTAAGAGAAGTTGAAGA
+GAGGGTAATTGAAGTAGATAAGAAGTTTGATGATTTACCGCTATTTGAAATAGACAGTAA
+AGATTTAAAGAAGAAAGTTAATAGAGTTGTAGTTTCATTACTAGGTGGTAAGAAGTCTAA
+TGCATATAAGCCTTTAAGTAAAAAAGTGTTTTCAGATTTATATGGACAGATTCATAGAGA
+ATTTGGAGTTGATACTTGTGCAGCTATTAAGAGAAAAGATTTAGATTTAGCTAAAGAGAT
+AGTTGATAGTTATACATTACCAAGAGTATTAAAAGAAGAAATTGAACTTGCTAATAGCCA
+ATTAGCATTTGCTCAATGATAAAGAAATGAAAGGAAAGATTAAGATGGAAAATAAAATAA
+CTGCCCAAGTCAATAAAGAGCAGTTAAAAGTTAAATCTATAATACAAACTGTATTAAATT
+GTTTATTAATTATTACTGTTTTAGTAAATATAGTTTCTCTTTTTAAAAGAGAGAATATAA
+ATAAGCAATTACAAATGCAGATTGAAGAAAATAAATTGGCTATACAAAAGGTTGATTTAA
+TAGTTGACCAGCTTGAAAAAGAAATTACTAATCTTCAGAAGAAAGGTTCTTTAGATTAGA
+GTTTAATTTTTCTAATTCTTTAGTTAACTTAATATTGGTTTCAGTATTTTGTTGAATAGT
+TTTAGTCATATGTTCATTAGATATATTACTTTGTGTATCAGAATAAAGTCCATATACAAA
+AAATAATAGGGTAACAACAATATTAATAATATTTAAAATATCTGATTTACTAAGTTTACT
+ATTTTCAAAAGTTTCCTTTGTCGAGTCTATAGAACTAACATAAGAATCGATATCACTATT
+GACTATATTATTTTCATTACAAAATTCTTTAAGTGAATCAGTGAATGAATATATGCTTTC
+AGCTAATTCATTTGAAAACAAATTATAGTTTATATTTGAAGTTAATTTAGTTAATTGATT
+TAAGTTAATAAATGAGTCATTATATATTGCTTTTACCATAGAACTAATATTTTCAATATT
+TAAAGTATTAAAATCTTTAACCATTTGTTGGAGTTGTAAATTAATATTTGGCAATGGAAA
+AGTAATTTTACTAAGTTGAGAAATTTGTTTCATGCAACTTTCGATTGAGTAAACACTAGA
+AGCAAGAGTGAAATTTGGCTTGTAAATTGGAGTAGGAATTTTTATAGAGTTTCTAATTAA
+TTTACTATAAATTTCATTATTAGATTTCATATTAACCATAATTATACCACCTTTCATAAT
+TTATTTCGACTTGGCGGAGCCGATACTTAAATTATAAAGGTTGGAAATATATAGGACAAG
+TATCAGTAAACAGCGAATCCCTCTGATACTAAGGGAATGAATAAGACAAGCTTTAATTAA
+AACCTAAGGATAAGTAAATCGAAGGAGGGCAAGAAATGGCACAACTATTAACACAAAAAG
+ACTTAGCAGAACGTTGGCAAATGAGTGTTAAGTCTATTGAGGAGTATAGAAAAGCAGGAA
+TTATCCCTACTGTAGAAGGGATTCCTGCAATAAGATTTAATTTACAAACTATTTTGGAGC
+TAGAAGGAACTAAATTAGAAAGATTTAGTCCATTAGAACGTAGACGTATGGAAATGGAGT
+TAGATGAAGTAAAAGAAGAGAACCAAAAGTTAAAAGATATCTTAAGTAATGTACTAAGTA
+ATTTAGCACCAATAATAAGTCTTGTAAAGGAGGTTTGATATGTTTACGCCAGGAGGAAAA
+ATAGTCTTTGGAATAATAACAACAGCAACAACTTTATTTTTAAGTGTTTATTTTTTAGAT
+AAATCTATAAATGAGAAAGATCCTAAAAAAAGTTTTAAGTATTTAATGTTATTTGTTGGA
+TGTACTTTAAGTTTTATCTTTTCAATAAATGTAAGTTAGGGGTGATGTTATGAACTTTAA
+AGATATACAGAGTTTAAAGGCTAGACATAGTAAAGAAGAGTTTGAAAGTATCTTGTTAGC
+TGTAGAGCAGGATTTAAAATTTAATAATATTAGATTTAAGAAACCTATTCCAAAGAAAAA
+GTTTTTAGAGGTTCTTAACATAACAGAAAGTTTGTTTAGGAGGATTATATGAAGAAAGTA
+AATATAGGATGTTTAGTAACTGTAATAGGTTTAGTTATTATATGGTGTTTCTTTTACTAT
+TTATCTTATAAGGTTTGGTGTTGGTTATGGACTTAGTAAAAGTATCAAAGAACATAGCTG
+ATAGAGTACAAGAAAGGTTTAGCGATTTAAAAGTAGACAAGCCTTTAAGTAATTTAATAG
+AGGAAGAAATAAAAAGAGAGTGCATTGGCACCGACCAAAGTAACCAATGTACTCATAAAA
+AATAAATTTCAAAGAAAGTTTAACATAATAAATTTAAGGAGGCAAGTTATGATTAATATA
+CCAGATTGTTGTTATGAATACGGAAATGATGAAAAAGAGCCAAAAGTAGCTTTTGAGTGT
+AGTTGGTGTGGTGAGTGTATATATGTTGGAGATGATTATTACGATATAGGGGATATAAAA
+ATGTGCTGTGAATGTAATGATGAATGTAAGTCAGTAGCAGAGGAGGGATTCTAATGGAAG
+AGAGATTAGAGTGGCTTAGAGAAAGACAGAAAGGAATAGGAGGCTCCGATATAGGAGCTA
+TCCTAGGATTAAATAAATATAAAACAGCTTTTGAAGTTTATTTAGAAAAAACAGAACCTA
+TTTTAGAAGTAGGAGAGCAATCAGAATCAGCCTATTGGGGAGATCAATTTGAAGAAGTAG
+TTGCTAAAGAATTTGAAAAGAGAACTGGTAAGAAAGTAAGAAGAGATAGAAGGCACTTTC
+AAAATAAAGATTATCCATTTATGGTTGCTAACATAGATAGAAGAATTGTAGGAGAAAATT
+CAATTTTAGAATGTAAAACAGCTAATCAGTATTTAGCTAAGGAATGGGAAGAGGAAGAGG
+TACCTGCTAGTTATTTAGTACAAGTTCAACACTACTTAGCAGTTACAGGAGCAACTAAAG
+GATATATAGCAGTTTTGATTGGTGGACAAAAGTTTATTTGGAAAGAAGTTGAGCGTGATG
+ATGAACTTATAGAATACATTATTGAAGCTGAAAAAGATTTTTGGAAAATGGTCAAAGACA
+AAACACCACCTGCATTAGATGGTTCAAGTGCTGCTGAAAAATGGGTTAATGAGAGATATA
+AAAAAGTTAATGAAGGTGAAGTTATAAAACTAGATTCATCATGGAAGGAGTTACTTAATA
+AAAGAAAAGAACTCAAAGAATATAAAGATAATGTAGAGCAAGAAATTAAAGAGATAGAGA
+ACCAATTAAAGCAAAACATAGGATATGCAGAGTATGCTAATGTTCCTGGATATAGCATTA
+GTTTAAAACAATCAGTAAGAAAAAATTTAGATAGTTCAAAAATTAAAGAATTACTTAAAG
+ATGATTATGAAAAATATTTAAAAGAAAGTATAAGCAGAAGATTAATAATTAAGGAGGAAA
+AATAATATGGCAACAGCATCAAGTTTAAAAAATCAATTAGCAAAGAAGGGAACTGGTAAT
+AGTTTATCAGTTGGAAATACAGTTAAAGGATTAATGGATAGTCCAACTATAAAGAAAAGG
+TTTGAAGAGGTATTAAATGAAAAGGCACCTCAATATATGAGTTCAATAGTTAACTTAGTT
+AATTCAGATACTAACTTACAAAAATGTGAAGGAATGAGTGTAATAGCAAGTTGTATGGTA
+GCAGCAACAATGGATTTACCAGTGGATAAGAATTTAGGGTATGCATGGGTAGTCCCATAT
+GGTAATAGAGCTCAATTTCAAATGGGTTATAAAGGGTATATTCAATTAGCATTAAGAACA
+GGTCAATATAAGTCTATAAATGTAGTTGAAATAAGAGAAGGCGAATTAGTTTCATGGAAT
+CCATTAACAGAAGAAATTGAGGTTGACTTTAGCAAACGTGAGAGCGATGCAGTAATTGGA
+TATGCAGGATATTTTAAATTAATAAATGGATTTGAAAAGACAGTATTCTGGACCAAAGAA
+GAAGTTAATAATCATGCTAATAAATTTTCAAAGACAGTTAATTCAAAAAATTCTGTTTGG
+AAAAGCAACTTTGATGCGATGGCCAAGAAAACAGTTCTAAGAAACCTACTATCTAAATGG
+GGAATTTTAAGTATAGAAATGCAAAAAGCATATACAGCAGATGAAAACTTAATTAATAAA
+GGTCTAATGGATGATATAGAAAATGTACAAGCTAACATTGAAGGTATTCAAGAAAACAAT
+GAGAATGAAGGTGTTATTGAAGCTGATTATACAGTTGATAGTAACAATGAAGTGCTTGAA
+GGGCAACAAGATATATTTGAAGGAGCATCATTATAAGATAGGAGGGGTTAGTTATGGCAG
+AAGGATGGATAAAGCTTTATAGAAATATTCAAGAACATTGGATATGGCAAGATCCACAAA
+AGTTAAAATGGTGGCTAGACATTCTTCTTCTAGCTAACCATAAGGAAAATAAATTTTTGC
+TAGGGAATGAATTAATGGAAGTTGAGAGAGGGGAACATCACACATCAGAGTTAAAATTAG
+CCGAAAGATGGGGTGTATCAAAAACAACAGTAAGAAAGTTCTTAAAGTTACTTGAAAGTG
+AACAAATGATTGAACTTAAAAAATCGAAAAAGGGTACCACCTTGAAAGTTAGTAATTACA
+ACGATTATCAAGATTTTTCAGAGGGTGAAAAAACCATAAAAAAACCACAAAAAAACCATA
+GCGTATACCACAAAGAAACCATAGAAGAACCATATGCTATACCACAAAAAAACCATGAGG
+TATACACAAACAATAATGAAAAGAATGAGAAGAATGAAAAAAATGAGAAAGAAGGAGAAG
+AAGTAGTAAAATCAACCTCACCTCGTTCCTATCCTTCTCCTAGTCATAAATTATTAGCTA
+ATTACTTAACAGATGTATGTTATAGAACTTTCTTTAACAATGCAGATATTGTTGAAGAAA
+ATGAAGTTATAAAAATTAAACCAGAGAATGATTTTTCTAGAGGAGCTATTGAGAAGTATG
+TTCCAACACTAGAAATTCAAACTCATAAAAAAATAGAGGTGATTTAAGTGAAAGTTAATT
+TACTAGAAGTTTATTCAGTACATGAGCTAGCATTAAAGACCTACAGAGATTTAGCTAAAA
+GAAAAATAGAAAGAAATAGAGAAGTAGATGCTTATTTAAAAGTTAGAGAAATAAGTGGAA
+GAAAGAAATGGAATGTTAGATTTGGAGGATATAGGTGGTAGTAGTTACAGGAAAGATAAG
+AGGAAAGGCTAGGCCGAGAGTTTGTAGAGGCCATGCCTTTACTCCTAAAGATACAATTGA
+GTATGAAAAGTTAGTAAGAGAGTGTTATAAGAAACAAGATGGAAGATACCTAGAAGGAGC
+TATAAAGGCTTTGATAATTGCTTACTATAAAATACCTAAGTCTTATACTAAAAAACGTGT
+ACAAGTCATAAGGGATGGATTAGAAAAGCCAACAAAGAAACCAGATGCGGACAATATAGG
+AAAGGTTATATTAGATAGTTTAAATGGAGTAGCTTATAAGGATGATAGCCAGATTATAGA
+TCTTAGAATTAAAAAAGAATATACGGAAGAACTTGAGAGAGTTGAATTTGAATTTAGATA
+AATAGAAAATGTTCTTTTTAAATTTAATAATGCGGTATTGAGGGCATATACATGCCAAGC
+AACAATTAGTATAATTTTATTATTATGTAAGTTTATTATTCAATAAACTATATGATAATT
+TCAAATTTATTAGGAAGGAGTTAATCTATAATGAAAATAGACTGGAATTTTTTACTTTCA
+GTAATAACTATTATTGTTGCTAGTTATGCACTAATACAAACCCACCATCAAATGAAATTG
+AGCAACAAACAACATTTATTTGATAAGCGTATGGAAAACTATCTAATTGCTATGGGATTG
+ATACAGTTATATAGAAATAACTGTAAGGATTTCGATAAGGATTTCGATGAAGAAAAAGAT
+GAACCAATTTTTGCTTTAAAGTCATACTTTATATGGTTGACAAATAACACTTATTTGGAA
+GAAATCACTACTGCAATAGATAATCCACTAAAAAACCCAGGTCATAAAGAGTTTTTAATT
+AAATTGGAGAAATTAAAGGAAGTTGGAACTAAGATCAAATTTTTATTTCCTGATAATGCA
+TCTGATGCATTAGGAGACTTTGTTTTTAGTTATCAGGAATTGCTATTTTCAATGTATCAG
+TATCAAATACTTTTAAATAATATGTATGAAATTAATAAAGATCATAAATTAAGTCTTGAG
+GAAATACAACAAAAATTTGGGGAACCAAAGCATAGGCTTAAGCTGCAAAGGTCTTTTCAA
+AATTTAAAACAAGCAGACGATTTATTAAAAAAGAAAAATGTTGAAGAAAAAATTAAAAAT
+CAAATAAAATTATTATAGATAACAGTTTGTTAATTAATTACTTAAATAAAAAAATAAATC
+AAATATATTATTAAAATACCGTATTATTCAAAATGAATATGCGGTATTTTTATTTAAATT
+CAGAGATTAAGAGAAGTGATATATATGACAAAGAATCAAATAGGTTTCTTTGATAAACCT
+AAAATAAAGTTGTTGGAGGATTGGACAAGGCTCCATCCTCTATTAACTAAAAATAGCGTT
+CATGAGGTTTTTATTGAAAGGGAGAACTATTGCATCATCTTGATAGATAAAACTTTCTAT
+GGCGTTTATAAGAAGGATATAGAGCGGTGTTAGATTTTAGCCATGTATTAAAATTTATTT
+TATATAATAAAAAAACGGATACTTAAAGTATCCGTAAACTATCACACGAGGGGATTCGAA
+CCCCCACGGCCATATGACCGACAAGTTGGCAACTTGTTGCGTCTGCCTATTCCGCCACAT
+GTAGAAAATGAATTATTTCTAATTCATTTATATTTTAGATCAAATGAACAAAAATGTCAA
+CAAAAATACAAATATAATAAAATTTAGGAGGTATATATGAATAAAGAGCTATTCAGAAAA
+ACAGAAAATTTACTTAAGAATTACAATAGATTAGAAACTGAAATTAAATTAATAAAAGCA
+GAAATTGAAGATATTAAAGAATCTTATACTGGTTGTGTGGCCATTGGATATAGTGAGAAA
+AGTGGATCAACAAATAAATTTAGCAGTATGGTTGAGGATGAAATTATAAGAAAAGAGAAA
+GATCTATTCTATCTTAAGAGAGATTTAGAGTATAAGGTTAAGTTGAAAAGAAGAATAGAC
+TTAGCTATACAAACACTTAGAACTAAAGAAGAGAAAGATTTAGTTAAATTAAAGTATATT
+AATCAGCCCAATGTTAGTTGGGGGAATGTGGCTTACATTTTAAGATATAATAAGGATTAC
+TGCAGGAAAGAACTAAGGAATAAGATAATAAGGCAGATTGCAGATTTTATATTCTATAAT
+CCAGGAGTTCAAGAAAGGTTTATTATATAAATATACCCCATATCTATACCCGTTTAATAC
+CCACCATATACCTACTTTTATATGTTATTATGTAATTGTGGATAGGGTAAAGCGTTCATT
+GATGATCCTCCTGGATGTAAATTAAAACTTAACTAACGGAAAGAGCAAGGTGTAAAAGCC
+TTGCACGTGGAAGGAAGAGTATTAATAAAGGTGCAACTCCTTTACCTTCCTAAATAATAC
+TTCCTTTTAAGTTTATTTTTTCATACAAAGTCTAAGCTGGATTAAGTTCCTGCTAATATG
+GGGAGATAGTTTAATTGGTAAAACATTGGTCTCCAAAACCAAAGTATGAGGTTCAAATCC
+TTGTCACCCCGCCATTAAAAATTAAATAACCTCTGGATTACGGAAAAGAATTTAGTTTAG
+ACTAGGTTCTTTTTTATTTTGATTTTTGTAAAACTTTACCTTATAATAATTATGTGAAAT
+TTTATTATATATTAAGTGTTGGGAGGGGAACTATGAGAAAAGCTTTTTGGGGGTATATTC
+CATATGATGATAAGACTTTTGAAAAATTGTGGGAAACTGCAGATTTTGTTTTAGATGCTA
+ATATACTATTAAATCTATATAGATATTCGAATAATACAAAAGAAAAAGTGTTAAATAGTT
+TAGACAAAATATCTGAGAGGATATGGATACCAAATCAAACTGGTATAGAATATTTTAATA
+ATAGAGTCTCAATAATTTTAGAGCAAAGTAAGATTTATGATGAGGTTTTAGAAGAATTAA
+GTTTTTCTAAAAGTATAGATTATATAAAAGCTTTAAGACATTCAACTTTAGAAGATAAAA
+AGCCGGAAATTATAGAACTTTTACAAAAGTGTGAAAATAAAATAAAAGAAATTATAAATG
+AGGATAAGAAGAAATCTGAAAATATAATTGAAGATGATTACATTTTAAAAAAAATAGTTA
+ATATATTTGATGGTAAAGTGGGTTCGTCTTTAACTGATAAAGATTTAGAAAGCTATAAAA
+AAGATATTGATATAAGATATTCTAAAAAGATACCACCTGGATACAAGGATAATAAGAAAA
+ATGATGATAAAAAATATGGTGATGCTATAAATTGGTTAGAAATAATAAAATACAGTAAAA
+ATAATAAAAAAAATATTATTTATATAACAGATGATAGAAAAGAAGATTGGATTGAGATAA
+TAGAGGGTAAAAAAATTGGTCCAAGAAAAGAATTATTAAATGAGTTTTATCGTTCAACTG
+ATGGAAATATTATATACATATATAATACCTATAGTTTTTTAGAAGCATTCAATAAATATA
+TTAATACGGAGAATAACATAGGAAAAGATGTAATGGATGAAATAAAAGACTTAGATACTA
+TTTTAAATGATTTTGATAGTAAAAAAATTAGTATAATGAGCAAAAAAATATTTGATAAAT
+TTGTAGGATTGGGTGTAGAACCTAATTGTTTGATAATGATTAATCAAGAAAAATTCAATA
+AATATATGGAAATCATTAAAGATTGTCAAGAAGGTGGAGCAGATTTTCATTTATTTATAG
+ATGATTTAAAATTTTTGGAGTTCGTAGATAATTTATTAGTGTTGGAACCAACGATTTCAT
+TATCTAAAAATAAATATTATTATGAGTTGTATAAGAATTTTATAATAAAAAATAAAGTAA
+CTGTATAAATTTAAGTAGATAGAGTTTTTTTAATAAAAGCTCTATTTTTATTCTACTAAA
+GAAAGGTGGTGTTGTTATGAAGCTTACACCAAAACAGAAGGCGTTTGCTGAATATTATAT
+TGAAACAGGCAACGCCACAGAATCAGCTATTAAGGCAGGATATAGTAAAAAGACAGCTAG
+GGTAATAGGACAAGAGAACTTGCTAAAACCTGCCTTGAAATCTTATATAGATGAAAAGAT
+GAAAGAATTAGAAAGCAAAAGGATAGCTAAAGCAGAGGAAGTGCTAGAGTATCTAACTAG
+AGTTCTAAGAGGAGAAGAAACAGAACAAGTAGTAGTTACTGAAAATATAGGTGATTTTAT
+GAGTGAGGCTAAAGTTGTTGATAAGGAAATTTCGGCTAAAGATAAAATCAAAGCAGCAGA
+ATTATTAGGTAAAAGATATAGATTGTTTGTTGATAAAGTTGAAAAGGATAGTAACGTAAA
+TGTTAATTCTACAACTAAACTAGATTCTATACTTAACCAGTTAAAGGATGATGACGATGA
+GTGATGAATACAAGTTATCAGATAAGTATTTAGCTTTTTTAAAACATAGAGCACCAGTAG
+AAGCATTGGAGGGAACAACAGCAGCAGGAAAAACTACAGTAGGAATATTAAAGTTTATGC
+TGATGGTTGCAGAATCTCCTAAGAAAATGCATGTTATTGCTGCTAAAACAACTGGCGTTG
+CTGAGAAAAACTTAATACAAAAAGAATATGGAATTACTGATGTATTTGGTGATTTAGTCA
+AGTATAACGGTAATGGTGATAAAGATAATAAAATACCTCATATAAGATATATAACTCCTA
+ATGGTGAGAAAATAATATATATACTAGGTTATGATAACGTAGATAAATGGAAGATGGCCT
+TAGGTTCTCAATTCGGTTGTGTACTTATAGATGAGGTTAACACAGCTAGTATTGAATTTG
+TAAGAGAAATATGTACTAGAAATGATTATCTTATGATGACACTTAATCCAGATGATCCTA
+ACTTACCTATATATTCAGAATTTATTAATTGTTGTAGACCATTAGAAAAATATAAGAAAG
+ATGTTCCAAAAGAGATAATGGAGCAGTTAAATTCGGAACCAAAGCCTAACTGGACTTATT
+GGTTCTTTTCTTTTTATGATAATGCATCATTAAGTGAGGAAGCTATTGAAAAGAAAAAGA
+CGAGTGCTCCTAAAGGTACTAAGCTATATAAGAATAAGATACTAGGGTTAAGAGGAAGAG
+CAACAGGATTAATATTCTCTAATTTTGAAAGAAAGAATAATGTATTATCTAAAGAACAGG
+TTATTAAACAAATAAAAGATAAGAAATTAAAGTTTGTTCAATTTACAGCAGGATTAGATA
+CCTCATATTCTCAAAATAGTCCTGATACCTTTGCATTTACTTTCTTAGGTATTACAGATA
+AGAAAGAATTAGTAATGCTAGATGAAGAGGTGTATAACAATAAAGACCTAGAAACTCCAT
+TAGCTCCTAGTGATATAGCTCCTAAATACTTTAAGTTCTTAGAGAAGAATAGAAATGAAT
+GGGGATTTGCTAGAGATGTATTTGTAGATTCAGCAGACCAAGCAACTATAACGGAGCTTA
+AGAAGTTTAAGAGAACTAATCCATGTATGTATAACTTTATTAACTCTTATAAGAAAGTAA
+CTATATTGGATAGAATACATTTAGCTTTAGGTTGGATTAATACCAATGGTAAAGTATTTT
+ATTATGTTTTAGATACTTGTAAAGAGCATATAAGAGAACTTGAATGTTATTCATGGAAAG
+AGGATAAGTATGAGCCAGAGGATGCAAATGATCATACAATTAACTCTAGTCAGTATGCAT
+GGATACCTTTTAGAAAGATAGTAGGAGATTATATAACATAAGCACTTTCCTTAATTGTAT
+ATTTATTGTAAAATTACAATGAACGGAGGTGATAATTTGAATAAAATAATAAAATGTTTG
+AAAAAAATAATAAATTTTTTAAAATTAATACTCATTATTATTGCTATAGTATTTTCGTCT
+ATAGTATTAATAGCAAGTATTGTTTATTTATGTTTTGCTATAATATATTTACTACCTATA
+GGAATTGAATTTATAAATGGCAATTATGTTGCTACATCTACTATGATGCCAAATTACTCA
+ACAGTTTTCCAATCAATCTTTACATTGGTTAGTATATTTACTTCTTTATCAGTTAGTTTA
+TTATTATATAAGTTAAATAAACAACAAAATGCAGTTAAGTATAATAAAGAATTAGTAGCT
+CCTGCTAATTTAGTTTATTTTAAGATAAAATATTATCTTATACATCATTTAATTGAAGAG
+TTACGAAGAAATAGGAATAGGATAAGTAATGATCAATATCGAACTCAAAATGGATTAGAA
+GAAAGTGATTCAATAATTTATGAAAATATTGCTCAAGTTAATGTTGATACTTTAGAAAAT
+AATATTTATAAAATTTTATGTGAGTTAAATGATGATAGAAGTATAAATAAACTATTAGGT
+CTATATGAGGATATGAGAAGAAGTAATTCAATAATATATATTTTAAAAGATGAATTAACA
+AACTCATGTAATCTTGTTGAAACTAGGGGATATGAATGGGTTAAGGTACTAGTAGGTCTA
+CATAATAATAACTTTGAGTGTTTAAATGAAGATTATAAAAAAATCATGTATAGATTATTA
+GAATTAAGCAAAAGGAAAAAATAAACCGATAAAAATTTATCGGTTTATTTTTTGTAAGGA
+GGAGTAGAAGTGGGGTGGTTTAAGAGTATGTTAACTAAAGCAGCAATTAAATATTTAAAT
+GTTCAACCAGCATTAATTAATCCTATTACTATACAAGAAGCTTATACCTATGAAACTAAT
+GTGATTAGAAATAAGCTTTGGTATAGGGGAGAACCATACGAATTGGACCAATTCTTTAAG
+AATATATCAAGTGATCCAGTAAATAAAGCTAGGTTTTGGAGTGCTGTTCCAAGTGAAGAT
+TTAAGTATAAGAAAAATACATAGTGGATTACCTGCAATGATAGCTGATAAGTTAAGTGAT
+ATAGTTGTAGCTGACTTAGATAGTATAGAAGTTACAGGAGAGAATTATAACACATTATGG
+GAAGAAATAAGAAAAGATAATAAGTTTGATGATATGCTAGGTGATATAATTGCTACTACA
+TTAGTTAGTGGTGATGGAGCTTTTAAACTATCTATAGATACAGAGATAAGCAAATATCCA
+ATAATAGAGTTTTTCGATGGTGATAAGGTTGAATATATAACTCAAAGAGGAAGATTAAAA
+GAAATAAAGTTCTATACTTTTTATACTAAAAATAATAGACAATATAAATTAAGTGAAACT
+TATGGAAAAGGATATATAAACTATAATTTATATGATAGTAATGGAAATGAAGTTTCTTTA
+AATACACTTGATGAAACTAGAGAACTTGCAGATGTAACATATAAAGATGATTTTATAATG
+GGAGTACCATTAATGTTCTTTAAATCTCCTAAGTTTGAAGGAAGAGGGAAGAGTATATTT
+GATAATAAATCAGATGCCTTTGATGCATTAGATGAAGTTATATCTCAATGGATAGATGCC
+ATAAGGGATGGGAGAGTCCAAAAGTATATACCAGAGGATTTAGTTCCAAAAGATATTAAT
+GGTAATTTAATGAAACCTAATCCTTTTGATAATAGATTCTTAAAAGTAGGTTCTAGCCTT
+GCAGAAGATGCAAAGAATGAGATAGATATGAAGCAAGCTAATATAAATTATGAGGCTTAT
+GTTGAAAGTTATTCTAATGCTATTGATATGTGTCTACAAGGTATAATAAGTCCTAGCACT
+TTAGGAATAGACCTTAAAAAAACAGATAATGCAGAAGCTCAAAGAGAGAAAGAAAAAACT
+ACTTTATATACTAGAGGAAAAATGGTTGATATATTAACAGAGGTTATACCAGAGTTAGTT
+AATATAATCTTAAAGACCAATGATGTATTAAATAAAAAGAATACTGGAGAATATGAAGTA
+AGTATTGTATTTGGAGAATATGCAAGTCCTAGCTTTGATACAGTAGTAGAAACTGTAGGG
+AAAGCTAAAACCTATGGAGTAATGTCTATAGAGCAATGTATTGAGGAAATGTATGGAGAT
+ACATGGACAGATGAAGAAAAGGAAGAAGAGATAAAAAGAATAAAGGAACAGAATGGCTAT
+CTTGTAGCTGAAGAACCTAAGACAGTAGATGATTCTGATATTTCATATACTGATGATAAT
+GAGGTTGAAACAGATGGACAAGAGGGATAAGGATATACAATTATTAGCTGATATACTTAG
+AGGAATTACTGAAAATAAAATAAAAGAAAATGCTAAAAAGGAAAGAGATAAGTCTTATGA
+TATTAGAAATATATTCGAGCAAATGGAGCTTGATTTAATTTCTAGTATGCATAGGGCTTT
+TTATTTTCACCAAGCCGAGCAGAGTAAAGAAGGATTTCAATGGGAACAATGGCAAAGGAC
+TAAGCTTAGAGAAATTGAAAAGTATAGAAAGAGAAATAAGAAACTAGTTGAGGAATATAA
+CAAGCCTATCCAAGAAGCTATAAACAGAGAGATTCAAGGGGATTTTACTAAAGGTCAAGA
+AAATGCAGAAAAGTTAATAGATGAAGTAAAGATAAAGTTTCCAGAGAATATAAAAGAACC
+TCAAACAGTTAGAGAGTATATTGCTAAAGAACTAGGGAAAAAGACTAATCCACAAGTTGA
+AGAAAACTTCTTTGGTATTAACGAAAAGAAACTTAATGCATTACAAGAAACTGTTACAAA
+TGATTTAAAAAAGGCTCAAATGTCAGTTTTAAGAAAGATGGATGATGTATATAGGCAAAT
+AATATTTAAAACTCATGTATATTTGCAAAGTGGTACTAAGACTATTAATCAAGCTATAGA
+TATGGCTACTAAGGATTTTCTTGAGAAAGGTATAAATAGTATAACTTATAAGAATGGTAA
+ACAAGTTAATATTACTAGTTATGCAGAGATGTGTTTAAGAACAGCAAGTCAAAGAGCTAC
+ATTTTTAGGTGAAGGAAAGAAAAGAGATGAATATGGAATACATTTAGTAGTTGTTACGGC
+TCATGCTAACACTTGTAAAATGTGTGAACCATGGCAAGGAAAAGTATTGATTGATGATAT
+ATTTTCTCATGGTACTAAAGAGGATGGAGATTATCCATTATTAAGTGAGGCTGTAGGAAA
+AGGATTCTTACATCCTAACTGTAGGCATACATTAGCAACTTATTTCCCTGGTGTAACAAG
+ACTTCCAGTAGTTCCTAATGGTGAAGATGCTATTAAACTTTATGAGGTTGAACAGAAACA
+GAGATATTATGAAAGACAATTAAGAAAGTGGAAGAGATTCAAGGCTGGTACTTGTGATGA
+AGAGAATAAAGAAATAGCAAGTAAAAAGGTTAAAGAATTAGAAAAAGCTTTAAAGGATCA
+TTTAGAAAGTAATAAAGAGCTTAGAAGAAATAATTATAGAGAAAAAGCTAGAGAAGGCTT
+AAATATTAAGGATGCTAATATAGAGGCAGAAGTATTGAAGCAAAAGTTTCAAAATGCTAA
+AATTAAAGAAATAAGAGATTTCATTAAGAATAATCAACCTTTAAAAATAGAGGTTGGGAA
+ACAAGGTAAACATATTTTAGGACATAACAACTACATTGAAGGTAGAAGTTATTTAACCAT
+ATCTTTAGAAGAGGCACAAGAACTTATTAATAAGTATGCTGGTACTGGTGCTTTAGATAT
+GGATTCTAAAGGTAACTGGAGAAAAAAAGAAATAATAAAAACAGATAAGAAAATAGGTGT
+TAATGTAAGTATGTTAGATGGTTCAGAAAACAAAACAAATAACTTTAAAATACATTATTC
+TAAAAAAGGAACTCATATAGTTCCTAATTAAAGAGGTGATTCCATGTTTAACTTAGTAGA
+GACATTAAGAGATATAATGAAAACTCATAAGCTAGATAATAATCTTAAGTTAAAAATAAA
+AACTGTTGATGGGAATATCATTATTGGACCATATGAAGGATTTACACAAGCTTTAGATAA
+TGAACCAGAGATAGCAAGTATAGAAATAAAAAAAGATGAATATAACATAGAGCTATATGA
+AAATGAAATAGCTTCAATAGAAGTGTAGTAAGTTAATTTTGTTTTGGGGGATAAAATGGA
+AAGAAAAGTATTTATAGAAGGTAAAAATAAAAGTGAACAAGCTTATATAGGTTGGGAGTC
+AGAAGAATTATACCTAATTGGAGTAAAGGATGGATATAAAAGTTCAGCTGATGATCTTCT
+TGACAAAGCAATATTAGAAGGCCATAAAAATAGAATTGATATATTAGATAAATATATATT
+TCCAATAATGTTCTTATATAGACATAGTATAGAAATAAGCTTAAAACTTATATATAGAAG
+AGTTAATGGAAAGATACCAACTGGACATAATCTTATGACATTATGGGATAGAGTTGACAA
+GGATGTTTTAAACCTTTTAAATAATGATATTAAATTAAAAAAGCTTGAAGAAAAATATAA
+TACTAAAATTTATAGATTAAATATTGATAAAAAGTTATTAAATGAGATTAAAAACTTGAT
+AAAAGAATTACAAGGTATTGATTCTAATGGAGATGTTTGGAGATATCTTATCAATAAAAA
+TGGAGATTTATATTTTAATAAGTGGAAATTTATAGATTATCCGAATTTAAAAAATACTAT
+TAATTATATCTATGAGTTTTTAGATGGTTTATATTGTGAAGTTGATGAAATTCTAGTAGT
+AAGAAAGTCTTAGGAAACTAAGGCTTTTTTATTTTGTCCAAAACTTGCTTAAGACCTTAA
+ACTGTGCATGGAATTAACAGCCGACAGGCTATAAATGGAGGTATTTATGTCTATATCAAA
+TTTAAATTTAAGAAAAAGATTAGGTATGAAACTAGCACAAGATGATGGAGCAGGTAATGG
+GGGAGTAGGTTTAGAAACTAATCCAACTGATGGTGCAGGTGGAGAAGGTGAAGGAACAGA
+AACTAATCCAACAGAAGAAAAGACTTTTACTCAAGAAGAAGTAAATAGGATGATTAAGGA
+TAGGGTGGCAAGAGAAAAGAAAGGCCAACTATCTAAAGAAGAACTTAAAGCTTATCAAGA
+TTGGAAAGAAAGCCAAAAAACAGAAGCAGAAAAGCAAAGTGAAGCTTTAACTAATGCAGA
+AAAAGCTAAACAAGATGCAGAGGAGAGAGCTAATACATTAGAGGCAAAAGTAACTTGTTT
+ATCTAAAGGTGTTTTAGCTGATAGTGTTGACGATGTTGTTATATTAGCTAAAGCTATGGT
+AAGTGATGATGTTACTATGGATCAAGCAGTAGATAAAGTTTTAGAAAAATATCCAAGCTT
+TAAAGGAGTGCAGCAACAAGATGAAAACAAAGGCTTTAAAATAGGTGCTGATGGTGGAAA
+ACAAAAAGGAAATGTTGATGATGCATTAGCAAGAGCCTTTGGAAATAAATAATAAAAAGA
+TTAGGAGTGATATAAAATGGCAGTATACAGTTATGCTGAACAATTTGAAAGACAATTACA
+ACAAAAATATGCAAGAGAATTAACTTCATATGCATTAGAGCAATCTAATCCACAAGTTAA
+ATTCATTAATGCACAAACTATTAAATTACCTAATATAACAGTAAGTGGATATAAGGATCA
+TAATAGAAGTGCTATGGGATTTAATACAGGTTCAATGTCAAATGATTGGGAACCAAAGAA
+GCTATCTCATGATAGAGATATTGAGTTTGCAATAGATCCCATGGATGTTGATGAAACAAA
+CTTAACATTAGAGATGGCTAATATTCAAAATGTTTTTGAAACAGAACAGGCGATACCAGA
+AAAGGATAGTTATAGATATTCTAAGCTTTATGCAGAAGCTAAAACATATAAAGCAAATGG
+TGCTGTTATAGATAATACAGTTTTAACAACAGCAAATATATTAGATTGGTTTGATACTCA
+AATGGAGAAAATGGATGACTTAGGAGTACCAAGTGAAGGTAGAATACTTTATGTTACACC
+AGCTATTAATAAACTTCTTAAAAATGCGGAAGGATTAACAAGAACTATTAATTCTGATAA
+GAATACTGGAAAAGTTGATAGAAGAGTTTATTCATTAGATGATGTGACTATTACTAAAGT
+TCCAAGTGCGAGAATGAAAACAAAATATGATTTTACAAATGGATGTGTTCCAGCAGGTGA
+TGCAAAGCAAATAAATATTATACTTATTCATCCATCATGCCAAGTAACAAGAAGTAAGTA
+TTCTTATATTAAAGTGTTCACTCCTGGAACAGATAGTAGAACAGCAGATAAGTATGTATT
+CCAAAATAGAAGTTATGGAGATACATTCTTAATTAAAAATAAAGCTTGTGGTATTGCTAT
+TAATGCAGAATCAGAAGGTTAGAAAGGAGAATACATATGAAGGCTATTAAAGAAAATAAA
+GTTTATACAATAACTGAATCTGAACAGAACTTTTATAAACAACAAGGATATGACATAGTT
+AATGATGAAGGGGAAGTTATAGAACGTGGAGCAGGGAAATCTATTTCTTATGAGGAATAT
+ATAAAGTTAAAAGATGAATTAGATCCATTAAAAGATGAAAACTATACTTTAAAGCAAGAA
+AATGAGAAATTAAAAGAAGAAAATAAAAAGCTTAAAGCTGAAAATAAAGAGTTAAAGAAG
+TCTTAGTTAAGGCTTCTTTTTCTTTATAAGGATGTGAGTATATGTCTTATGTAGATATTT
+CATATTATAAAGATAATTTCAAAGGTGATATCCTTAATGATGATACTTTAGAAAATAGAT
+TAGAAAGAGCATCAGATCAAATTGATAAATTGACATATAACAGAATAATAGGAGTAGAAT
+TTAAAAATTTATCTCCATTTCAACAAGATAAAATTAAAAAAGCAGTTTGTTTACAGGCTG
+AATTTATAGAGCAATATGGTGAGTTTATTAATATGCCTTTAAGTGGATTTTCAGCTGGTA
+GTACTTCGGTATCTTTTAATGGAAGTATTGTAAATGGCATAACAACCACACAGGAAGTTA
+TTAATTATATATATCAAACTGGTTTAAATAGTAGGAGGATCTAAACTATGGGAATTAAAT
+TACCATTTCCTAAATGGCTTTTAAAAACACCAGTAGAGGTTTACCATACTTATATGAATG
+AGGATGGTGAACCAGTAGAAGAGTTAATTTATAAAGGATTAAGTATATATAATGAAAAGG
+GAAAGAATACTCTCGATGCAGAGCGTAGACTTGTAACTTTAAGTGGGACCGTAACAATTG
+AAGGTGATATTTATCCTAATAAATTAATTGAAGGATATATAAAGGTTGGAGATGTTAAAA
+AAGATATTTATAAGTCATCAAGGCCACGTAATCCAGATGGAAGTGTATTTTCTACTGAAT
+TGGAGCTTATCTAATGAAGGCTAAAGTAACAATAAAATTAGATAGAACTAAGATAAACAC
+TTTAATAAATGCTAGAAATAAAGCTTTAGAGGAAACTACAGAGGCCATGTTAAGTGATAT
+TAAGACAAGTGCTATAGTTCCTAAGGATACTGGAGAACTTGAAAGAAGTGGTTTTGTTGA
+TTTATCTAAGTTAGATGATGGAATAGCATCTATAATTTTTGATACACCATATGCTAGAAG
+ATTATATTGGCATCCAGAATATAATTTTAGACAAGATAAAAATATAAATGCACAAGGTAA
+ATGGATGCAATCTTATATTGATGGAGATAATAAAGAATTTGTAACAGAGACTTATTTTAA
+ATTCTTAAAAATATTTAGCAAAGGATTGATTAAATAATGTTGCTAAGTGAAGTAAGAGAA
+TATTTAAAAACTAAAATAGAATGCCCTCAATGGTATATAGGAAAGATAGATGCAACTAAA
+GAGCAATGTATAGGTATCTATAGCATAAGAGGACCAAGAAATCATATAGCCTTAGGTGGT
+TTAGAAAATACAAGCTATTCCACTAAGGCTATTTCTATATTAGTTCATTGGGGAAAGAAT
+GCTAATATAGCAGAGCAAAAAGCTCAAGAAGTATTTAATGTTTTATTTGGACAAGATGCT
+GTTATAGGTGGGAAAAGAGTTATAGATTTTAAAATGATAACTACTGAACCTATAGGAGTT
+GGAACAGATAAAAATAACATATATGAATATGTAATAGAAGTAAATATAATACATGAAAGG
+TAGTGAATAATTATGGCATTTACAGGAGTTTTTCCAGTATATAATCTTAAATTTAAGATA
+GGAACAAAAGGGAAAGCAAGTCAATCTCAAGATATGCAGACTATAGCTGATATGGAGAAC
+TTTGGTATAAAGATTGATGGTAAGGTAGAAGATTGGACACCAATGGATACAGCAGGTTGG
+GCAAGAAGTTTAATGACAGGAAAAAGTTTCTCAATATCTTTAAAAGGCAAAAGAAATGTA
+GGTGATCCAGGAAATGATTATGTTGCAGCAACTGCATGGAAGGATGGATTAGATTGTAGT
+ACAAAAGGAGAAATGGAGTTCCCAGATGGGTCTAAACTTACATTTAATTGTGTAATTGAT
+ATTAAAAATGTAGGTGGAGATGATAGTACAAAGGTTGCTCCATTAGAATTTGACTTAAAA
+GGTGACGGAAAACCAGAATATACAGAAGCACCATCAAGCTTAGGACATTAGGAGGTATAA
+ACAATGGCAAAAGTATATGACATAATGAATAAGTTAGTTAATGTAAAACCAACAGTAAAG
+ATAGATGAAGATCACGAATATAAAATTAATAATACGAAGAATAATGCTATATATATTCAA
+TCATTAGTTAAAGAAAATAAGAAAAAAGATGATAAAAAACAGGATGAGATGGAGCTTATT
+AATAAAATAATAAAAGCTTCCCTAGGTAAAGAAGCTTTTGAATATATAGATAGTAAAGGT
+GATGAATGGAGCATGTCAGCATATAATGCAATAATAAATGTAATAATGGCTGCTATATCT
+AATGTTGAATTAGAAGAAATTGAAGAAATGAGTGAGAAAGAGGCAAAGCGATTTCAAGAA
+AGTAAAGAATAATCAATGGTATGATTTATTTGAAGATTGGGAGCTTATAGAAGCTTCTTT
+TACAGCTCAATACGGAATTAGATTAAGAAATGAAACTAATATGACTTGGGATGAATTCTG
+TACATTGCTTAGTGGAATAATGCCTAAAACACCACTAGGTCAAATTGTTTCAATAAGAAG
+TGAAGAAGATGAAAATATGCTTAAGAACTTTACAGAAGAACAACATAGGATTCGTAATGA
+ATGGAGAAGTAGACAAGTAGAGCAAATGACAGATGAAGAAAAAGAGGAACAAATAAAAGA
+AATACAAGAAATTCTTAAAAAGGCGTTTAGTTAAAACTAAATGTCTTTTTTATTTTAAGA
+AAGGTGGTGAGGTAATGGCAGATGCAGATTCGGTAGGGAAAATTGGTCTTGATTTAGAGA
+TACAAGATGGTGATATAGGAAAACAAATAGAAAAGATGGCTAGTGCTATAGGTAGTCAAA
+TAAGTAAGTCGCTAGAAGGAATAACAGAAAAATTTGATTTTAATTCAATAACAAAAGGAA
+TTTCTGAATCTTTAAATAAAGGAATGAATAATATTGATGAAACTATAAAATCTAGTGTTG
+AGAAAAGTAAAGCTAATATTCTTAAGACAATAGAAGAAATAAAATCAAAAGCTTTAGATG
+CTATAAGAAGTATAATAGCTAAATCTAAAGAAATAAAAATTCCTATTCAGTTTTCTCCAG
+TTAGTAATATTGCAATGCCTAGTAGCAAGGTAGCAACGCAACCAATAAGTAGAAGAGGAC
+CACCAAAAAGTAATGTTGGAGATTTAGAATCTATAAAATCTAAGATTGAAAATCTTTCTA
+ATAGTTTAGAGATAACTAATAGATCAATAGAGCAGCAACAAGAAAAATTATCAGGATTGA
+AGGCTGCTTATAATTCTACATTTAATCAAGCTAGAAAAAACAAATTACAGGAGCAAATAT
+TAAAAACAGAAGCTGTTATAAATAAACTTATAGCTAAATCTGATGCAACAGGGTTTAAAT
+TAGCTGATTTAGATAGGCAGTTTGAGAAATTAGGTAATTCAGCTAAGAATTCTACTTTAG
+GATTAAATGAAGCAAGTAATAGTATGAAGAGGCTTGAAAATACTACAAGTAGAACAAATA
+GAAATTTAAGAAATGCTAATAACTCTACTAGACGATATAGAGAAAATATGAATGGTGCTA
+GAAGTGCAACAGGGATGTTTATTGATAGTATGTTTAGGTGGGGAATAGTATTCCCTTTAG
+TAATGAAGGGGATAAACACTGTTGCTAGTTATATAGGAAGTGCTTTAATGACTAATGCTC
+AGTTTGCAAACAGTTTAGCACAAATTAGAACTAATCTTATGGTTGCATTTATGCCAATCT
+ATCAAGCAGTTCTACCAGCACTTAATGCTCTTATGAGTGCATTAGCAACAGTAACCGCAT
+ATATTGCAGCTTTTATAAGTGCTATATTTGGTAAAACATATCAAGCTAGTTTTGGTGCTG
+CTAAAAGTATGAATGCTTCTATAGCTTCAATGAAGAATATGGAAAAGCAAGGTAAAAAAA
+CATCTGGAGCAGTAGATAAAATAGGAGATTCGGCAGAAAAGACAAAAAAGAAAATACAAA
+GGTCCTTAGCTGGATTTGATGAAATAAATAAATTAAGTATTCCAGATGATTCTGATAAAG
+CTCCAAAGGCTCCAAAAGGAGGAGGCGGTGGTGGAGGAATAGATCCGATACCAATGGTTG
+CTCCAGATATAGATTTAAGTCCAACAAGTGTAGCAATGCAAAAAATAAATGCTATGGTAG
+AAAAGCTAAAAGATATTATATCTAAAATATTTCAACCTTTTAAAAATGCATGGGCAAGAG
+AAGGAGCTGCAACAATTGCAAGTATTAAATATGCATTACATGGAGTTTGGGAGCTTATAA
+AAGCTATAGGTATTAGTTTTTTAGAAGTATGGACTAATGGAACGGGAGAAAAAATACTTG
+TAGTTATTCTACAAATTTTACAAAACATATTTAATATAGTTGGAGATATAGCAATTACAT
+TTGCAGATGCTTGGAATGCTGGAGGAATAGGAACAGCTATAGTTCAATCTTTAGCAAATG
+CTCTTTTAAATGCACTTACATTAATTAAGCATATGGGAGATTCTTTAAGGCAAGTTTGGG
+GAGAAATTGGTCCTGGATTAGCAACTACATTCATGCAAATATTAAATGCAACATCAGGAG
+TATTAGAAAATTTAACTCAAAAATTAATTTATGTTTGGGATAATGGAGGTAGTCATTTAT
+TCCAGGGATTTATAAGGCTAGGTGCAAAAATATTTGAATTAGCTGGGTATATTTATACTA
+ATTTTGTTGCTCCTATGGTTAATTGGTTTGTAAACATGATAGCTCCAGTTCTAGCTAAAT
+TAGCAGATATATTAGGAATTGTTTTAGATGCGTTTAGCAACTTAATAAATTGGTTAATGG
+GTAGTGGAAAGCCAGTATTAGATACAATTATTATTGTTTTAGGAAGTCTTGGTGCTTCTA
+TACTAATAGTTAAAGGAGCATTAACTTTATGGACAATAGCTCAAACAATTTGGACAACTG
+TAGCAAAAACAAGTACTATAGCAACAACATTACTAGGTGGAGCAATAGCATTTTTAACAA
+GTCCAATAGGAATTGCAATAGTTGCTATAACAGCAATAATAGCTAGTGGAGTAGCTTTAT
+ATAAAAATTGGGACTTTGTAAAAGCTAAAGCTATAGAAATATGGGGAAAAATAAAAGACA
+TATTTAATAGCTTTAAAGAATGGTTAAGGAATGTTTTCCAAACAGATTGGTCAAATTGTT
+TTGGAGTATTAGGGAATCTATTAAATCTTTTCTTAAAAAATGTAGATAATGTTTTTCAAT
+CTATCAAAAAAATATTTGGTGGAATAATAGACTTTGTAACCGGAGTATTTACTGGAAACT
+GGAGCAGAGCTTGGCATGGCGTTGTAGATATTTTCAAAGGTATAATGAGTGGATTAGGTT
+CTGTAATTAAAGCGCCTCTAAACTCCGTTATTGGGCTAATTAATATGGCTATAGATGGTT
+TAAACAAAATTAGTTTTACTACTCCAGATTGGATTCCTGGTATTGGTGGTAAGCACTTTG
+GAGTTAACATAGCTAAAATGCCTTATTTGGCTAAAGGCGGTATAGTAGATAAACCAACAC
+AAGCCGTAATAGGAGAGGCTGGAACAGAGGCAGTAGTACCACTAGAAAATAATACTGGTG
+GATTAAATTTACTTGCTATTAAACTTTCAGAAAGAATTAATAATATGTTATTACTTTCTA
+ATAATGCATTAAAACAACCTGATTTAACAATGTTAGGTCAAAATATTAATAGTAATGAAA
+AGAAGAGTATTAATGATCCAGAGTTCATAGAAAAAATAAAAGAAGTTATAATAGAAGCTA
+TTTTAGAAGCGATGAAGAATAAAAAAGATAATAGCTATAATAATTCAGGGCCTCAAGAGA
+GTGGTGATTTAATATTAAGAATAAGAGATACTGATTTAGGTAGAATTGCAATAGAAGCTA
+TAAATAAAGTGAATAGACAAGCTGGAGAGCAATTATTAAATCTTTAGGAGGTGGCAACTA
+TAGGAATTAGTATAAATGGAGTAGCAGTTGCTTCTCCAAAGAGTTTTAAGGTTAACATAA
+TGGATTTAGATGGAGAAAATACAGGAAGAAATTTATTAGGTGTAATGCTTAGAGATAGGA
+TAAGAGTTACTAGAAAACTTGAGTGTGAATGGGGTCCTTTAACATCTAATGAGATTAAAA
+CAATATTACAATCAGTAAGTGGAACAGAGTTTCCAGTTACTTATCCTGATCCAATGGAAG
+GAGTTACAACTAAAAATTTTTATGTAGGAGATAGAAGTACACCAGCTGTTGATTTTAATA
+AGAATGTATGGCAAGGTCTGTCTATGAATTTAATAGAAATATAAATAAAAGAAAGAAGGA
+ATTGAAATGTCAGAAGAAAATATAAAAGTAACAAGCACAATAACAGAATCTACTAACTTA
+AATGGAACAGTAAATATAGAAAAGGATGGAATGAAGCAAACAGTATTAACAATGAGTTGT
+AGTTTAACTCAAAATACTATCGCAAATATTCAAACATATCCTACTAATATGGAGTTGTTC
+TTAGCAAATTCTCAATTAGTTCAAGCTGAGGTTCAAAAATTTAGAACAAAGGCTACGGAA
+GTTGGCAAAAGCTTAAATTGTTTTATACTTTAGTTTATAAGAGCTTACAAAATGTAGGTT
+CTTTTTTAATGAAATTTTTAAAAGAAAGAGGTGTTCAAAATGGTTAAAATGACAAATAAA
+GAAATATTAGAAAAAGTTAATGTATTAGGAGAAATAAGTTTAAGAAAGTTACCAGTTAAA
+GTTTCTTATGCTATAGGCAAGAATATATCTAAAGTTGAAAGAGAATTAAAACACTATAAT
+AAAGAAAGGCAAAAATTAATAGAAGAATATTGTTTAAAAGAAGATGATGGAACTCTAAAA
+ATAACAGATGGAAATTATGATATTGATCCAGAAAGATTAGAGTATTTTAATAAAGAAATT
+AATGAATTACAAGAAATTGAAGTTGAAATGAATATACATAAATTTAATATTGAATTATTA
+AATGGTTATGAAATGAGTCCAGGAGATTTAATGTGTATTGACTTTATGATAGAGGAATAA
+TATAAATATTAATCTTTAGGAAAGGGGGTTAGTATTTGTTTAAAGTATCAGAAGCATTTA
+ATAAAGAAATAAATAAGTTACAAGGAAGAAAATTTAATGCTAAGGTTATTATAAGAGATA
+AAGAATATAGTGGAAATCAAATATATGAAATGAATTTAGAGGAATCAGTTAATCCTAGTG
+ATAGTTTTTCTATAGGATCAATTTGTTCTAACAGTTTCGATATAAAACTAATTAATACAG
+GAGATATATTTGATAATGCTATTGTAAAACCATATGTAGGATTGTATATAGGAGATGATA
+TAGAATATATACCTTTAGGTGTATTTACTGTAATTAAGACTAGTGTAAAAGGAAAATTTA
+TAAATCTTGAGTGTGTAGATAATATGCTAGGGTTAGAAAAAGTATATTTTTCAGATTTAT
+CTTATCCAGCAGATATAAACGATATTGCTAAAGAAATATGTAAAAAGGCAGGCGTTAATT
+TAGCCAGTAAATTACCTAATTATAGAGTTAATAAAATAGAGGGATATTCATTAAGGGAAG
+CTATAGGATTTATAGCTTCCCTTTGTGGTTCATTTGCTAGATTTAATAGGATAGGTGACT
+TAGAAGTTAGAGATTATGAGGTAGTAAAGCAGGAAATGACACCTCATAATTTATTTAAAT
+TAGATATTGAAGCTAATGAGTGCATTATAAAAAAAGTAATAGCCAAAAAAGGTGAAGAAG
+AATTAAGTACTGGTACAGATGATGGAAATAAAATTGTATTCAATAATCCAATAATAACTA
+AAGAAATTTTAAGTGATATATATACTAAATATAATGGATTTAAATATATATCATATACAG
+CTAAGTGGAAAGGTAACCCAGCTATAATGGCTGGAGATATATTAAATTTAACTGATTTAA
+ATGGGAATAAATATAATGCTTTAATAATGGAGCAAAAGTTTACCTATAAGAATGGTATTT
+CATCAGAAGTAAAGGCTAAAGGAAAAACTAGACAAGATTCTAGCTTTGATAGTAAAGGAT
+CAGTTGCTCAATCAATGGAGAGATATTCTATTGAACAAGCAAATATAAAAAAGGCTTTAA
+TAGATAAGGCTAGTATAAATGATTTAACAGCTGTTGATGCTAAAATACAGAGGTTATATA
+CAGAGGATTTAACAGCTATAAGAGCAGATATAGTTACTTTAAATTCTCAAAAAGCTAATA
+TTATCGAATTAAATTCTGTAAGAGCAGATTTACAACAGGCTATAATTGGTAAAGCTAATA
+TAACAGATTTAAACGCAGCAGTTGGAAAATTAAATGTATTAGAATCTAAAACAGCTAGTA
+TAGAAAATGCACTTAATAAAAATCTTACAGCAGAAAATATAGCGACAGGAGCAATAACAG
+CTAGTTCTGGAATAATAGCAGAAGGAGCTATAGGAGATGCAGAAATAAGTTCTTTATCTG
+TAAATAAGTTAAAAGCTGGAGATATAACAACTAGCAAACATAGAATTGTTAGTGCAGATG
+GAACCATAGAAATTGTAGGAAATCAAATTCTTATTAATAGAAATAATGTTAATAGAGTTA
+TATTAGGAGAGTATAGGAAAACAGATGGTACTACAGATTATGGACTACTTATCAGAGGTA
+AAGATGGTAAAACCATAATGCTTGATTCAGACGGAGTTCATAATGCAGGGATAACTAATG
+GAGCTATAGATAATAATAAAGTAGCTGACAACGCTAATATAAGTGGTAATAAGCTAGATA
+TAAATAGTGTTATTAGAGAAGTAAACAATAATGGTACTGAAACTATTAAGGGTACTAAGG
+TTACTGTAGGTGATAGAACTTTAGATGTAGAATTATCTACACAAAATAATACTATTACAG
+AGCATAGCAAAGAACTATCTAGTCAAAAAGCTTCCTTAACCGCTTTAGATAATGCATTAA
+AGTTTAAAGTAGATTCACAAACTTTTAATCAGAGTACAACTACTATAAATAATAATATTA
+ATAGAGCCAAGGAAGAAGCTATAAACAGTTCTAATTCTCACGCTGATAGTAAAGTTAATG
+AAGCTCTTAATAATGCTAAAGCTTTTGTTAATTCAGAAATTACTAATGTTAATACTCATT
+TGAATAAAAACACTAGCGAGATAAATATTTTAAAAGGTCAGATAGAAAGTAAAGTTTCTC
+AATCAGATATAGATAAATCTATTCAAAATATTGAGTTTGGTGGAAGAAATCTATTTTTAA
+AAAGTAAAGGTCCATTTAAAAGCTCTAATGAATATGTAGGGATTTCAATAACTTCTGTTG
+TAGAAAAATATTTAAATAAAAAAATTACAATATCAGCAGATGTAAAAGCTAATAAAGTTG
+GGAAAATTAGATTTTATTCTCTTGGTGGATATTCTGTAGGATTTTGGGTTGAGAGAGATG
+TAACTACAGAATGGACAAGAATAAAAGCTACTGGAAAGTTTACACTTAATGATGAAAAAC
+AAAAGTGGTGTGATTTAAGTTTTTATGGTACTTATGGAAGTGGACTATTTACTGAAGTTA
+GAAATGTAAAAATAGAATTAGGAGAATTGGCTAGTGATTATACAGAGGCTCCAGAAGATA
+CTGACAAGCTAATTATAGACAATATAAAAACAGTAACAGATAAAATATCTACAGTAGAAA
+GTAAACTTACACAAGAAAATAATAGTATAAAAGCTAGTGTTCAAGATTTAAATTCTACAA
+CTCAAAGTATTACAACTAATGTAAGTAATATAAATAGAGATTTAATAAGTAAAATAAATT
+CTAATTTAGCTGTAGCTAAAAATTTTGCTACAGATATAGCTATAGCAAAAGCTAATCTTG
+CAAGAGAACAAGCTATAGCTTCAGCTGATGGCAAGATTACAGAAGAAGAAAGAAAGAGAA
+TACAACAAGCACAGGAAAATCTTGATACGGCTATAGCAAGAGCAGATAAAGCTAAACAAG
+ATGCAATTAATGCAGCAAGTACAGATGCAACTAACAAAGCAAATAATGCTTTAAATAGTG
+CTAAGGCGTTTGTTAATGCAGAAATAACAACAGTTAATAATAAAGTGCATAACGTAGAAA
+GTAATATTGATATATTAAAAAATAAAATTGCTCTTAAAGTTGAACAATCAGACATAGATA
+AAACAAAAACAGAGTTAATTAATAAGATAAATGTTGTAGATAATTTAGCTAATAACGCTA
+AAGATTTAGCTAGTGCCATGAGCTTAGGTAAAATGTTATTTAGTGATCCTACATTTAAAA
+ATAGTTCTAACAATATTAAAACTTACAATAACAATGGAAATGGAACAGTAACAACTTCAA
+GAATTTCTAAAATAAATGGATGTCCAACTGATTCACAATATTGTATAGAAGTAAAAACTG
+TTGGAAGTGCAAGTCCTAACCATGGTGGATTTTATTTTGGAAATATGACTAGAGCAAATG
+CAATATTTGTAACGAAAATTATTGCTAAAATTCCAGTTGGATTAAGAATAGGGTGGTATT
+CAAATTCAACAGGGAATAATGGGAGTTCTAAATGGTTAACATCAGTAAATGGAACAGGTA
+AGTGGGAAGAGTATATACATTTATTAAAATGTGGTGATACAGGAAGTTTTTCTAGTACCA
+GTTTCTTTGCATTAGATGGAGGGGGAACTCCAACATCTAGCAATCCAATAATTTGGCATA
+TAGCTTATGCAACTGTTTTTGATATAACTGAAAATGATGAATCAGTTAATGTATTAAAAA
+CTGAAATGTCAACAGCTAAGAATAAGGTGGCAATAATAGAAACTAATTTAGACAGTATAA
+CTCAAAGAATAAGTTCTACTGAAAGTAAAACACATTCTATAGAAACTACATTAGGTGGAA
+AAGCATCTAAACAAGAAGTTGCAGAAGTTAATAATAGAATTGCTACTATTAAAGCTAACT
+TAGATTCTATTACACAAAGAGTTTCTAATACAGAAAGTAAAACAAATAGCTTAGAAACAA
+ATATAAATGGTAAAGCTAGTAAGCAAGAATTAACAGTAGTTAATAACAAAGTTACAGAAG
+TTACAGCTAGTTTGAATGGAATCACTCAAAGAGTAGGAAACACGGAAAGTAGAATAAATG
+CTTTAGATGGAAAAGTAGCTGGAGCTGTAACATTACAACAATTTACAGAATTCAAACAAA
+GCAATGATAAATTTAAATTTACTGTAGAACAAAGAAGTAGTGTATCAAATATACTTCCAA
+ACAGTTCTTTTCATGGTGGAGATCGTGGGTGGCTTCATGGTGGAAATGAATTTTGGTCTG
+GTCCTTATAGTGGGTATGGATTTAAGGGAAGAATTACTGGTGCAATAAAAAATAGAGCAG
+CATATAACAATCCAGAAAGATACTTACAAACTCATAAAGCTTATAAAGTTAAAAAGAACA
+CTACTTATACAATAAACTTCCATTATATTTGTGAAAAGAATGTTCAATCAATGGATGCTT
+TTGTTGTTTTAAGTGATACTGAACATGGTGATTATGCACAACCAATTTATGTATTAACAG
+CTCAAGGTGGTTCTCAAAGTAATGCAACTGAAGAAAAACCATTTACATATAAATTTAATA
+CAGGTAACCATGAGTGGGTATGGATTAGATTTGACCATAATGGAATGAAAAGTGGCGTTA
+ATTGGGATGAATTTTGTTGGGTTTATGTTAGTGAAATTGGAATCTATGAAGGTGATGTCG
+GAGCTGTTAAGTGGACACCAAAAGGTGGAGAAGTTTATTCAGCTAACTATCAAATGGATG
+GTCTAGGATTCAAAGGGACTTTTGAAGATGGTACTTATGCATCTTTAGGTAAAGATGGAC
+TTGAATGGTTTAACGCTGGTACTGGACATGCATATCATGCATTAACATACGTAACCTCAT
+TCGACATTCCAATTGGTAATCCAGGTAAAGCATATATAAAACTACCAGCTGAATTTACTA
+AAAGAAGAAACTCTCTTAAATGGACAGTCGCATTAAGAGGATATTATTACTCAACAAGTG
+GCGATTTCTTCCCATTCCATATACATTGTACTGGTGGGAGGGATTATATAGAAAATGGAC
+TTGTTGTATGTGAAGTTCAAGGTTACTGTAAAATACAAAATGCCCAAAATGCTGGTGATG
+TACAGTTTAGACCACTTACAGCTATGTTAATAGCTATAGCTTAAATAGAAAGGAGGGTTA
+TTATGGATAATTCTATAAAAAACTTTGAAAATAAAGTTACTTTATTTTATTCTCAATCAA
+CTGGAGATATAAAACTTCATGCTGGTGGAATACAAGATATGAGTTATTTTGGTCCTGAAA
+GAGATGACTATAATTATAAATTTATAGTTGTAGATAAAGATTATTATTTACTTAATAATT
+TAGAAAATTTTAAGGTTGAAAATGGAAAGTTAAAATTAAAAAGTAATAGTATATTAGCTA
+AATACATGTAGGAAGGAATAGACTATGGAAAATATATTTGATTATTTAAAGATGGGGATT
+GTAGCAATAGGAACTTTATTTACATGGCTATTAGGAGCATGGGATACCCCTTTAGTTATA
+CTTATAGTTTTAATGTCTTTAGATTATATTACTGGTATTACTAAAGGTTATGTTAATAAA
+GATTTAAGCAGCAATATAGGACTTAAAGGAATAGCAAGAAAGGGAATTATTTTCACTATT
+CTTATAGTAGCTGTAATGTTAGACAGACTTTTAAATACAGGAAATTGGATATTTAGAACT
+TTGGTATGCTATTTTTACATAGCTAATGAAGGTATAAGTATTATAGAAAATGCAAGTAAA
+CTAGGTGTACCAGTACCATCTAAATTAAAAAATGCGTTAATACAACTTAAAGAAGATAAA
+GAGGATCATAAGAAATTATGATTCTTTTTTTATAAATAAAATTAAGAAAGAAGGAATTAA
+AATGTTAAAAACAATTTTAAAATTAGTAATTAAAGTATTAGAAAGTAAATTACAAAAAAG
+TGGGTTAGAAGAAAAGATAATAAAAAATAAACAGTATATAGATATAGCAAAGCAAGTGTG
+GAATGTAGTTGAAGAAAACTTCCGTATCACAGAATCAGTAGAAAAGAAATTAAGTTCTAA
+AGCTTATGAATTTGACAAAATGATGATGGATAAGTTTCCAGAGTTATCACCAACAGATGT
+AAAAGAATTAAGACAAAGTATTGCTGGAGAAGTTAATAAAGGGAAAGAAGCTGTTTTAGA
+AAATTCAGAGATATTAAAGAAGTTACAAGAAGAAAACCAAGAGCTTAAGTCTAAGAACAC
+TGATTTAGAAAGTAAACTAGCTGCAATATCAAACTATGTGCCAGTGGAAAACAAATAGTT
+TATTAATGTAATACATAGGACTAGAGATAGTCTTTTTTTATTGGATTTAATTATATAAAT
+TTAAAAGAAAGAAGGAATTAATAATGCAAAGTAGAAACAATAATAATTTAAAAGGAATTG
+ATGTATCAAACTGGAAAGGAAATATAAATTTTCAAAGTGTAAAAAATGATGGTGTAGAAG
+TAGTTTATATTAAAGCTACAGAAGGTAATTACTTTAAGGATAAATATGCTAAACAAAATT
+ATGAGAGAGCGAAAGAACAAGGATTAAGAGTAGGATTTTATCATTTCTTTAGAGCTAATA
+AAGGAGCCAAGGATCAAGCAAATTTTTTCGTAAATTATTTGAATGAAATAGGAGCAGTTA
+ATTATGATTGTAAATTAGCTTTAGATATAGAAACTACTGAAGGGGTAGGAGCAAGAGATT
+TAACTTCTATGTGTATAGAATTCTTAGAAGAGGTAAAAAGAATTACTGGAAAAGAAGTTG
+TTGTATATACATATACAAGCTTTGCAAATAATAATTTAGATAGTAGATTATCCAGTTATC
+CAGTTTGGATAGCTCATTATGGTGTAAACACTCCTGGAGCTAACAATATATGGAGTGAAT
+GGGTTGGGTTCCAATATTCAGAGAATGGAAGTGTAGCTGGTGTAAGTGGTGGATGTGATA
+TGAATGAGTTCACTAATGGAATATTCATTGATTCAAATAATTTTACTTTAGACAATGCTA
+CTACTAAAAATGTAAGTATTAAATTAAATATAAGAGCTAAAGGAACTACTAATTCTAAAG
+TAATTGGTTCAATACCAGCCAATGAGAAGTTTAAAATAAAATGGGTTGATGAAGATTATC
+TTGGTTGGTATTACGTTGAGTATAATGGAATAGTTGGCTATGTAAATGCAGATTATGTAG
+AAAAGCTACAAATGGCTACTACTCATAATGTAAGTACTTTTTTAAATGTAAGAGAAGAAG
+GATCATTAAATTCTAGAATAGTAGATAAGATAAATACAGGTGATATTTTTAGAATAGATT
+GGGTGGATTCCGATTTTATAGGTTGGTATAGAGTAACAACTAAAAATGGAAAAGTTGGAT
+TTGTTAATGCTGAATTTGTTAAGAAATTATAATTTTAAGGTTAGTTAGAGTAATATCTGA
+CTAACCTTTTATTTTTTTGTTCATAATCATAATGAGGTGATTATGAACAAAAAAGATAAT
+ATTAGAATTGATTTAATAATTTTATTAGCTATTATTTCTATAATATTACTTTTAGTATAA
+TTTATATAAACTTTTAAAATTAACAATAGTTAAGGCTAGGTAGATTAATTCCTATTTAGT
+CTTTTTTATATTCTTAAAATAAAAAAGCTACACTTAAATGTGTAGCTAAAAAAGGAGTGT
+GATATATTATCTCTGTATCATTTAAAATAAAAATCTATCTTAATTATAGACATTATTTTC
+AATTATATACATATTAACAAAAAACTTTTTTTATTTACAATAATGTTATATAATGTTAAT
+AAAAACACAATTAAAAAGGAGTATTTAAAGTGAACAAAAAAGAAAATGTTAATTTAATTT
+ATTTAATAAAATCTTTTTCAAAAAAAGTGTACAATATATTTAATATCAGTAAAGGATTTA
+AGAAAGTTAAAAAAATTGTAGAATTTAATAATTTAAATCAAATTGAACAATTAAATATAA
+TTAAAGAAAATGATAAGTTATTATCTAAAAAAGATAAAGAAGTTAAAAATAAAGTTGTAG
+CTAATAATATAGATACATTTTTTAAGTTAACAAAAGATAAATATTATGGGTGTAATATAC
+CTATAGAGAAAGCTAGAATAAATCAATATTTTTTAGGTGATAGAAAAAAGAAATCCAATT
+CCGAATTTTTAAATAATATATTTTGCTCAGCTATATTAGGAAGTTTTTTAGCTGCATTTT
+TAAGTATTGAAATCAATGAAAGCTTAATAAAAATATCCGGTTTTTTGCTTTTAATTATAG
+TTATTTTATCAATTATAATAGTTATGCTTTCAATAATTTTTATAGATTTTTTCTTAGAAA
+TATCAGAAAAAGACACTGTTAATAAAGATCTATATTATAATATTGTACTTGAAATATTGT
+CAGAACTTGAGTTTGAGGAAACAAAGAAAAAAATAAATGATTCAAAGGAAATAAATATGG
+ATTTTAATCTAAATTTTTTAAAACTAAAATAGATAATTTTTAAATAGTATGTTAGTAAAC
+ATACTATTTTTATATTTGTATGCAAAAATATGTTTTGTATAAAGGAAAAAGTTGAGTGAT
+TTTATAATTTAAGGTAAAATTAAAAGCAAGTATAATAGGAATATACTTGCTTTTAATAGA
+GTATTTATAAAAATTAGTTATTTTATTATATCATAATACTCTATTAAAGAAAATAATAAA
+TGAGATGGAGGACTTATGAAACTAAAGTTAATAGAAAATAAAATACTTAGAGACTCACCT
+AATAGTTTAAAACAAAAGGTAATAAATGAGGTTGTTAAAAAAGGAATAGCAACATATAAA
+TATAAAACAGAGCCTGATTTAATACAATTATATAAAAAAACTATAGAAGAAAAAATTAGT
+GAATGTCTTGAAAAAGATCAGTCAACAATAAAAATAATAGATTTAATAGAAATGAAAAAA
+GGATATAAGCATTCAATACTTTATGATTATAAAAATTTAGATACAAATTTAGCAAAAAAG
+AAATGTATAGATATTGAGACAGAATATTATAAAAATGTAGGAATTACTTTAAGTGAATTA
+GAAACTCTTTGTTATGAAACAGAGAATGAATTTTTTATTAAGTTTCATAATGAAATTGAT
+ATATTAGAGAAAGTTGATTTACCAAAGTGGTTTAAAGTTAGATATCCAATTTTATTTGTT
+TTTCATAAAAAGTTTAATATTTTAGAAGTTAAATTTGACAAAATAAGTACAGACAAGGAA
+AGAAAATATTATAAAATTGCTATTAGTAAATGTTTTAAGTGGTTAGAAGAAAATTTAAAG
+TGTAAATGCAGTTATCTTAACCTAGATAAATATATTAGAAATTTACTAGAAGATCCTAAT
+GGAATAGTTAAAGAAATAGTTTGGACCGGTGAGCTTGCTAAATCTCAAGGGATAACATTA
+AAAGCTGGAGAAGATATGTCAATGCCATTTTTTCAACAATTAGAGAAAGAAATAATAAGT
+TGGAAGGAAAAATACGCACATAAAGAAGATGCACTGGATTGCTTAAAAGATATTGAGGAT
+TATTTAAATAAAACAAAAAAATTTGCTAATGATAAGTTAAGAACTTTAAGGTTTGTAAAA
+TATAAAGAAAATAATATTTTAAAGACTTTAGAAAAATATATAGAATTAAAAATAACATAT
+AATTACTCAGGAACTTCAGCCGATTTAATAGATGTTATTGAAAGTGAAGTAAATGATTTG
+GAGAGGATGAATTATGTCATTGAGCTTATTGGAACTAGAAAGATTAATAAACCAATGGAA
+GAAAGTATCGCAAAATCAAGTTAAAGATTTGTATGAATTACTAGAATATTTTAGTGGTGG
+AGTGTTGCCTATTAATACAGTAAAAAGAATTTTGGAATTAGACAACGATGAAGTAGAAGA
+ATTAATGATTTTTTTAGAAACTAAAGGAATTTTAAAAAGTGCATTTAAAGTCCTTTGTCC
+TGACAAATTTGAAAGTATTAGAGAAGAAATTTATGATGATATACGAAAGGTTCCTAAAAA
+GTATTGCGATAAATGTGAAAAAGGATGTATGTATTTAGAAAATATTGTAGTTGTTTTTAA
+GGTGGTATAAAATTTAATGAGTAATTATGAAATGTGTATGACTGATGAAGAATTTATTAG
+ATATAATAGTTATTTAAGAAAAATGTCTAAAATTAATCCAAAATTTATTTTAGATAAAAC
+ATTTTCTGTTTCAGATGAAGATATAGAAAAAGGAAAAAGTTTAATAAATGAGATTGAAAA
+TTTAGCTAAAGATATTAAAAAGGCTAAAACTCCAAAAGAGAGAAATGCAATTAATAGAGA
+AAAGGGTAAGAAATTAGAAGAGTTGGCTGGAGTTATGTTTAATTCAGCTGGACTATATTC
+TGAAAGAAATAATTTAAGGGATCATACTAATGAAATAGATCTATTATTAATTGCCGATGA
+CTATAATAAACTTCATAAAACTATTTTACCAGAGTATTTACAGAACGATATATTAATTGA
+ATGTAAAAATTATAATAAAACTATAAAAGTTGATTGGGTGGGTAAATTCTTTTCCTTATT
+AACTACTCATGATGGTGAATTAGGAATAATTTTTTCATTCGATAGTTTTTCAGGACCAGG
+GGAATGGCAATCTGCTAAAGGATTAGCAAAAAAAATATTTTTGTCAGAGAAAAGAGCTAT
+TTTAAATATAGAGTTAAAAGATATTAAGGAAATGTTAGATAATAAAGGAAATATAGTTTC
+TTTAATAAAGGAAAAATATGATGCTTTGAAACATCATGTTGATTTTAAAGCTTTAATAAA
+AAGACATCCAGCTGAAAAATAA
+>NC_008261.1|provirus_1784095_1821197
+CTATTTTATTAGATTTTCAAATTTACCAGATACTACTTCTACTAAGTCATTGGGATTTAA
+TTTTATTTGATGTCCTATCTTTCCTGCACTTACTATCATGAAATCTAAGCCTTTAGCACT
+CTCATGTATAAATGTTCTGTAATCACGTTTTAAACCGATAGGGGAACATCCACCACGAAT
+ATAACCAGTGTATTTTAATATATCCTTAACTGCTATCATTTCAACTTTCTTTTCTCCAGC
+TATCTTAGCAGCATTCTTTAAATTTAATTCTTCTGCAACTGGTATAACAAAAACATATAA
+CTCTTTGCTTGTTCCTTGAGCTACTAATGTTTTAAATACATTTTTCTCATCTACTCCAAT
+TTTATGAGCTACTGAAATCCCATCTATCTTTCCATCTTCACTTTCATAACTTAACATTTC
+ATATGAAACCTTTTTAGAATCTAATATTCTCATAGCATTTGTCTTAAGCTTCTTATCTTT
+TGCCATAATTTTCACCTCTTAAAATTAAATCATTTATAATTATACAATAAACACTTAAAA
+TATATAACTCTAATGCAAAAAGGACTAGTTAAACCTAGTCTTTTTATACTAATTTAAATG
+TTAAATCATAATCACTTATATTACCATCATAATATTCAATCCCATATTCACTTTATAATA
+TTAAAAATATAATTATAAATAATATAATTATAATAAAAGCTATACATCCACAACTTAGAC
+AAGTTACAACATCATCATCTGTATTAGAACTATCATTTTTTAATCCATCCATAGCATCAA
+AGCTTGTCTTATTATATACTTTATTGTAAGCTGCCTTTTTAGGATCATTAACCCATCCCA
+TGCCCTTTTTACCATATGTAGGATTTATAGATTTTTTTACTTGTCTTTTTACTTTTCCAG
+TTGTTCTTGATTTTACACTTTTTTTTAAGCTTGGTTTTCTAGGACCTATCTTCATAACTA
+CCTCCTAATTTATCATTTTCCGTTTAACATTATATAATATTTTTATTAATATAAAAAGTT
+TATATCCTTATCGGTATAAAGTTTTATAGCATGACAATAATTAAAATATAGATTAACTTT
+ATTTGTATAAATAGCTTCAAAAATGAAAAAAGTGATAGATAATATTAATTATCTATCACT
+TCTTAATTAGATCTTCTTAACAAATTCAGAATTAACAAATCCAACTTTTCCATTTTTAGT
+TGTTACTCTATACCAACCTATAAAATCGGAATCCACCCAATCTATTCTAAAAATATCACC
+TGCATTTATCTTATCTACTATTCTAGAATTTAATGATCCTTCTTCTCTTACATTTAAAAA
+AGTACTTACATTATGAGTAGTAGCCATTTGTAGCTTTTCTACATAATCTGCATTTACATA
+ACCAACTATTCCATTATACTCAACGTAATACCAACCAAGATAATCTTCATCAACCCATTT
+TATTTTAAAGGTTTCATTTGCTGGTATTGAACCAATTACTTTAGAATTAGTAGTTCCTTT
+AGCTCTTATATTTAATTTAGTGCTTACATTTTTAGTAGTAGCATTATCTAAATTAAAGTT
+ACTTGAATCAATAAATATTTCTTCTGTAAACTCATTCATATCACATCCACCGCTTACACC
+ATCTACACTTCCATTCTCTGAATATTGAAATCCAACCCATTCACTCCAAATATTATTAGC
+TCCAGGAGTGTTCACCCCATAATGTGCTATCCAAACTGGATAATTAGATAATCTACTATC
+TAAATTATTATTTGAAAAACTTGTATAAGTATATACAACAACTTCTTTTCCTGTAAGTCT
+TTTTACCTCTTCTAAAAATTCTATACACATAGATGTTAAATCTCTTGCTCCTACTCCTTC
+AGTAGTTTCTATATCTAAAGCTAATTTACAATCATAATTAACAGCTCCTATTTCATTTAA
+ATAATCTATAAAGAAATTAGCTTGATCCTTAGCCCCTTTATTAGCTCTAAAGAAATGGTA
+AAACCCTACACTTAATCCTTGTTCTTTTGCTCCCTCATAATTTTGTTTAGCGTATTTATC
+CTTAAAGTAATTACCTTCTGTAGCTTTAATATAAACTACTTCTACGCCATCATTTTTTAC
+ACTCTCAAAATTTATATTTCCTTTCCAGTTTGATACATCAATTCCTTTTAAATTATTATT
+GTTTCTACTTTGCATTATTAATTCCTTCTTTCTTTAAAATATTTTTTATAGAAAAAAGAG
+AACCTAAATTATAGGCTCTCATTTAAGCTTTTTACTGCTGCTAATTTATTTTCTGTTTCT
+GCATTTAATAATTTTAACTTCTCATTTTCTTCTACTAATTGTGTAGCTTGTTGTTTTAAA
+CTATCTTCATATAGCATAGCTTTTCCTTTGTTATATTCTCCTGCTATAGCTTGTCTAATT
+TGTATTAATTCATCTTTGGTTAAGTATGGACAGTTTTCTAAAAGCATTTTATCAAATAAA
+TCAGCTTTTGATTTAGCAAGATTTTCTATATTCTCTGTAATTCTATATTTTTCTTCTATA
+GCAAAGAATATTTTTTTACCAGTTTCATATGCTTCATTAAATTTAGAAGCTTTAAGCTTT
+TGGTCTGTAGCTTCTATCTTGACTTTAATTAGTTGTATTAATTGGTCACCTAGAGTTTTT
+ATTATTGTAGCTAAAAAAAGTGTAATAGCAGCAGCTAAAGCACTTAAAATTGGGTCTAAT
+ATCTTTTCCATTTTACATTCCTTCTTTCTTTTTATTTAAATAAATGATTTTGTATTGCAT
+AAAAAAAGAAGCCTACTATAGAGCCTCCAAACATTGTTATAAATATCTTTAATATCATTA
+TTAAAGTATCTATACTTTTTATTAAGTTAGTTATTTGAACTTCTTTTTTAGCATCACTTT
+GCTCTAACTTATCCAATCTATCAGCATGATTATTTAATCTTTTATCATGTGTTTTTAATT
+TATCTTCTACTAATTCTTCATGCATATCGCTACCCTTTCTTTTTTATGTAATTTAAGAGA
+ATAAAAAAAGACTATCTCTAGCCTTAATTATTCCCCTTCTATTTTATTAAGCTTGAATTG
+TTTCATGATCTGTTGGTAATGAAGTTACTAACAGATTAGATAACTCAATATATTGTTCAG
+GTGTTATTTCATGAGTCATCATGAAGCAGCCTAAAAATTGCTTCATTTCCTCTCTTTCCT
+TCTCTGTTTTACATCTATTTTCTATTTGTCTTTTACATAATTCATACATCATAATTAATC
+ATCCTTTCATTTATTTTAAATTATTATTTAATTTAATCATAGCAAGATTTCCGTTAGCTT
+TTAATATACCTGGTACTAATAAATTATTAATAACATCCCAGATATTATTAACTTCTTTAG
+CTAAGTTTTGCAAAGAGCTTCCTAGGTTTGAAGGTACTTTAAAGTCTAAAGTTCCTGGTA
+AACTATTTTCTATAGAAAAATAAGTTTTTTCTTGATAGGTATCTAAATCTATATCTATTA
+CCCCATCTACAACTTCTGTTACTGGTGTAGCTAATTGATAAACCACGGTTGTTGGATTCT
+CTTTTAGCCATGCTTTGAAGCCTTCTACATCTTGTGTTGTTAGCTTGGATTTATTTATTC
+TGATATAAAGATTACCACCAGAAATTTGCATATTTTCCTTATCTTTATCCCATGTTGATT
+CTGAAAGTATTGGGAAGTTTGAAATTATTCCTTTTCCGCCTTTAGAATTTAAACTATTTG
+GTAATTGTGCTGAAAAACGGATAGTGTTAATATCTGTGCCACTAGCTACACTAGACTTCA
+TAAAATTTAATGTAGCTAACTTAACCTCAAAATCATTTCTATAAACTTTAACTTGTCCAT
+TATCCTCATAAAGATAATCATCTTCACGAAGTGGTTCTTTAATTAAAATATCTTTTTTAT
+AACATTTATAAAGTTCGTATGGTTGATTTTCAGTTCCATCTATAACATAACAAAATAAAT
+CTTTTGCCACAAAATTAACTTGTGTATTATGTGGATTTTCTATTCTTATACTACTATTAG
+TATCAATATAGGCAATTCTTTGTCCAACTTGAAAATCATTAAGATTATTATTCCAATTGT
+TAGTATCTATCATATTTCTAAATTCGCCACTTTCTAACCAACAATTATTTATTATTAATC
+TACAACCTTTTAATTTAGCCTTAATCAATACTTTTGTTTTTTTATCAATGCTTATTTTAG
+CTGATGTTGTTCCATTATATTGATTAGCAATTCCACTTATAACGCCATTTTCATTTTTAA
+AATTAGTTACTGCACCTTGTTGAATTTTTTGTATATCAAAAAGATTTTTACCAGTACTTA
+AAACACTAATTTTATACTTATCTTCAACCTTTTCTGCTTCTCCAAAGCTTTTTAAGCCTT
+CAAAATATTTTTTAGGCATATAAGTTTCTTCTCTGTCAAGTACTATGCAAGTATTTCTTA
+GCAATTCCTTATCAGTTTCACTATTAGTCCACCCTCTATCATACATACCTAGAAAACCAG
+TTAATCTTTTACCAGTTAAGTCTAATTTAGTTATAGAATTTTCTTTTAAAATAGGGTTGC
+TATCCCATCCTCCACCTATTTTATACACATTCAATAAAAGTATTTTGTTAGTATTATTCA
+CTACATAAACAATTCTGTCTTTCGGTTCATTCTTCACAAGCGTATCAACAAGTATATAGT
+TTCCTCCAGCATCATCTCTTGTATTATTTGGTTTATATAGGTTATTCAAAGTTCTACCCT
+TAATTTTCATACTTTCTGTTCTACCTTCTAGTGTGTCATTTGCACTTATAGAACTCCCTT
+CATAACTTAAAGCTTGATTACTTTTAAGTCCATTCTGTAGTTCCGTTACATCCATACGAA
+TTTGAGGAATGTTTTGACTTCCATCCAACCCTTCTATGAATTCTTTAGTCTTTTCCAAAG
+AAGCTTGAAGTTCTGTATTTTTAGAAGTAGCTTCTTGGTTAGTTGCTGCAAGATTTGTGT
+TAGCAACTTTAGCTGATTCAACATTTTTAATTAATTCTGAATTTAAAGGTAGTCCTTTAT
+TTATATTATTTGATAGTTCTTCAGCTTTAGAATTTAATCCAGTTAGTGTTTCTATTTTCT
+CTGTAGATTCTATATTTTTAGTATCTAAATCTTTTATAGTTTCTTTAACTTCTTTAGCTA
+GATCTATGTTAGATTCTAAATTTTTATTTAAAGAAGTAGCAGTAGAAGTATTTTCTAAGA
+GCTTAGAATTAATATTATTAGCTTCTGTTATATTAGATTCTAAATTACTATTTGCATTAG
+TAGCACTAGAAGTATTTTCTTTTAACTTTTCATTTAATTTACTAGCTTTGTCTAGTATAT
+TTTCTAAATAAGTAAAGTCTTTACTATCTGCTATTTCTCCAGCTATTTTAGTAAATATAT
+TAGCTTCTACAGTTAATCCAAATGTTGCTGTATGCTCTAAAAATCCATCTGCTCCATAAA
+TAGCTAATTGACAACTATAGACACCATCTTGTTTAGATATTCTATTAGTTATTGGGAAAG
+TTATTTCTCCTTGCTCTGCATTTGTAATATTTAAATTTTCTATTATGTCTCCTTTGGTTG
+TTCCAGCCATTACATAGCCAAGTTTAACAGTCTTACCTGTTAAATTTAATCTTCTCTTAT
+TCTGTAATACACATATTTTATAGATTTCAGCATTATTATTGCCTTTTATTGTTTTAATGC
+CTTCGTTATTATAAGAATCAACATTAACTTTTAGTTCAATTTCTCTCATAATTCACGCTC
+CTTTCTATTTAGCTTTTGTATCTCTTCCAGCACTTGGATTAGTACATACTCCACTTCCAT
+TAAAGTCGTACCATTTACCTTCGATAAATAAGGTTTCCTCGGAAGCCATTACCCCATTAA
+ATTTTAGCCAATAGTAGTTAGAATCTTTATAAAGCCATTCATTCTTCTTTAATGCTCCAC
+CTTTACCAGCATAATAATAGTTAGCTTGGTATTCATAAAACTCTTCTTCTGCCATTAATG
+TATTAGACTTAATTAAATAAGTATTATTGTTATAATAAATAAGTTTAGGCTCTATAACCA
+TTTTGCAATTTTCATCTATCCAATAATAACAAGGTTTTTCATTAAAAGTACCTTGAATAA
+AGCAATTTCTATCTAAAGCACCTGAAGAACTTGCATGATAATCAATCCCATCATGTTTTA
+TCCACTCATTTTTAGCAATAAATCCATCATCTTTTACGAAATAGAAATCACTCTTATAAG
+GGTAAATTCCTTTAGTTGCAATTCCACCAGCTTCATTAGTCATTTTATATTTGCCGCTAT
+AGTAATCCAGGAATTGAAGTGGTAATTTATACTCATGACAACATGGATAAATAGCACCTC
+GACTTATCTTAAATACTGTCATATCATTATTATCGTTGGAGTAAACTTTACCGCCATATT
+TTAGACATTTTAAAGCAAAGTTTTTTATTATATCTTTCTTATAAACATCCAATCTATCTA
+TTAAACAATACCTAGCTTGTAATTCTTCAAATCGCCTGTCTGAGTTACCACCGTCTGCTC
+CGTGATGACTTAATTTGTATAAATCAATTTTCCCTATTCTGTTTTGTAAATGTGTTTCAG
+TAGCTACTGTACTATCACCAGGAAACAATGATTTAGTTCCATGAGATACTAGAAGATAAT
+TAACACTCATATTATTTTCATTGCTATAATCATAGAATTTAGATGCGAAAGCTTCTATAT
+AATCATTTTTCCCAATTCTGAACTGTTGGTCATTAGCAACTATTTTTTGTACATTGAATT
+TATCTGCTGCTGCTAACATTCTATCATGGTACCCTTTAGTGTCCCATTCAGTTTCTTGTG
+ATGGTAACCTAGAATAATCTATTCCATCTTTATATACAATGTATTGTGGTCTATATTTTT
+CTATAATGGCTGGTGCATTCCCTATATGATCAGAATGATCATGAGTAGCAAAAAAATATT
+TTAATTTATTTACTCCAATTTTATCTAGTTGTTGAATCATTATTTGAAAATTTTCTTCCA
+TGAAACAATCTATCATCGAAAATGTTCCATCGTCGCTCTTTATTACTATACAATCTCCAT
+AAGAGCCTTCTTTGTTTTTAAGGTTATAAATAATAGTTTCTGTATTATCCTGCATTCTTT
+CTGCTGTATAATCCAATTTTTTAGTCATTTCAGTTATGTTAGAAGCATTTTCTTTACTTC
+TTACATCTACCTCATTAAAATTATCTACTTTTGCAAGAGCCTTATCTAACGCAGAAAATT
+TATTAGAACTTTGTATAGCTTCAGTATCTACTAAACTTTCGGAAATAATTAATCTAACTA
+AGCAAAGCGGTGTAAGATGGCTACCAGTAGAATCACTAATTGTTAATTGATAATCTGCTG
+TTCCTGGAATTAAAAAATCATCTGTTAATTCTAATCTTGCAATTCCTTTTTTACCATCAA
+CTATAGTTAACTCATCAAAAATAGAAAAATGTTTGGGGTTTATACCAGAAATTCTAACTG
+TACTATATGTTAAATCTATAATATTAATTTCACCTAGAAACTTAAAATCTATAAACCTTG
+ATTTAATATCATGCTCAACCGCTTTAATTTCTATTGGATCATCTCGATTAATATAAATTT
+TTCTAGGTGGTTCTAAATATTGCATAAATTATTTCTCCTTTCTTGTAATAAAAAAGATAG
+TAGAAAACTACTCTCTTACACTAAATCTCCAACTTTTAAAGAAGGAGCTATATTTTGAGC
+TGTACCATTAACTCTAAGTTCCCAATGACAATGTGGGCCTGATGAATTTCCAGTATTACC
+ACTTCTAGATATAACTTGTCCTGCTTTTACTGTATCACCTTCATTTACTAGCAACTCGCT
+ATTATGAGCGTAAATAGTAACTAATCCACCGCCATGATCTATAAATAAATATTTACCATA
+GCTTGTAGTTAATTCTCTTCTTTTTATAACTTTACCTGACTTTGAAGCTCTAACTGGCGT
+ACCTATAGGAACACCAAAATCTATTCCTGAATGTTGAGCCCCTGAAGGATAATAAGGGAA
+TGTTGCTGTTACATGTCCATTACTTACTGGAATAATCCAACCATTACCATACTCATTATT
+TATTGTTTTAAAGTTACTACTTTCTATAGGTGGGAAGTATCCATCACCTTTTACTGTGCC
+TATTTGATTTCCACTTGCGTTTAAAATTCCAATAGGAGACATAATGTAGTTAGCATTTTT
+AAACATTTCAGCTTCTTCCTTTCTTCTACGCTTTAATCCTTTTTCAAAAATTGTTCCAGG
+CATAGTTGCATATGTTAGCCAATCATTATAAATTTCATCAATACTAGCACCCCTTATCCA
+AGCTCTGTACATACGAGAATTATAATATCCTGAGTTATAGCATAAATCTACAAATGCATC
+AAAAACATTTATATTAACTTTACTAAGGTCTAAACCATCTTTAAGCATTTGATTTTTAAC
+TAAAGAGCCATATCTGTCTGGTATTAATTCAAATAAAACTTTAGATGCAGTTTCTTCAGA
+ACAAGGTGGATTACCTAATTTAGCAAAGTATGTTGGCTCATTAGCTTTAGTAACTCCATA
+ACCATATGTTATTTGGCCATCTCCAATATTACCTGGATATTGTTGTAGGCCTTCTATTCC
+TTTGACATACCTGAAATATTTTCTTGAAGGTATTCCTTTACTAACATTCCCTAGGGTATC
+TACACCACCTCCTATAGGAGAGTTTGGGTCAAATACAGTAGTACCACTTGTATTTTTAAT
+AACACCATCTAATACTAGGTCATTACATCTCAATTCTCCAGTTCTAGCATCATAATATAA
+AGATTTATCTTTTCCTATCCTTGTTCCTGAACCTGCAACTACAATTTCATTATCAGGTGT
+AGTTATATTAATAAAATGATCTCCAACATGAATGCTATTTGTACCATTATCAGAACGAAT
+ATCTATGTTATAAACTTTGTTCCCTTTAAAATCTACTTCTTCATATATTCTTACTGGCTT
+TCCACCTGAATCATCTAAAATGTTATATTTGTCAAGCGCAATATAAGAAGGAACTTTTGT
+CTTACCTTCAACAGCATACCCAAGAGACATTGCACTATCAATATCATTTGCTAACCCAAT
+CAAAGGCTTATTTTCATCATCTCCTTGAACCAATGACATTAACGCACCTATATAATCGCC
+GTTCTTTTTCCAATTGTAAAGCTTAATCATATTATTTTCTATCTTTATTGCATCTTTTCC
+ATTGTTTCTAAATAAAGCTCCACCAGGTTTCTTTAAATCTATCTCAAAGCTTTTATCCAT
+ATTCCGTATTAAAACTGTTGTTAAAATACCTATTAATTCGTCAGCTATTATTCCTTTTGG
+AGTTATAGCTGTTTTAAAGTCCCACCCTGAATTATCGCTTAATCTTTTATCAGATAAAAG
+AATCCCTTTTGTCCCACCTTGAACACATCCAAAATCAGGATCATTTGGATCCAAAACTTC
+TTGAATCCAAGCAACTATATCTAATTTTTTTGCTCTATCTCTTTGTGCTAATAATGGAGC
+TTTCATAGCATTTATTGCTCCAATTATATTTTCGCCACCTAAATTCCCATCACCATCAAA
+GCTTCCTGCAATAGTATCAAATGTTACACTCTTATCTGCTTGTGCTGATGCATATGTGTC
+TAAATAATTTCCTATTTCACAATTCAACATTTCTTCATTTAAACAATCATATTCAAGTGA
+TATACATCTAGCTTTAATATTAATATCTAATGGTTTATGTTCTATATATACTGTATCTCC
+TAATAAAATCTCTTCTAGTGACTTATACTCTTTATATTCTTCAGTACTTGATAAAGGAAT
+AAATTGAACACTATAATTTACTAACGGCTTATCTATTCCTTTACTTATAAGCTCCTTACC
+TTTATTTTTTAACGCTTCATTAACCTGCTCTTGTGTATCAAACCCCTCTGCATTTTCACC
+TTTATTGTTTGGTGTCCCTTTTAACTTAATATCTTCAAATCTTTGCTCTGATTCAAACAC
+ATGACTATAATTATTAATTAATGGAGAATCTACCCATGGAGTTGTTCCACTTATACAGAT
+ACCATCATAACCAGTTGGTATTACTCTAGTTATTAAACTATCCATATCTATTGTTTCAAC
+TAAACCTGTTAAATTCTTTTTATATGCAATTCTAACATTATTATCTTCTCCTACTCTTTT
+ATTTAAGTAAATATCAAAATTATTTAAAAATAATTCTCCTCCCCATCTACTTAAAAAAGA
+ATTTTCTTTATCATCTCCACCTATTGCTTGTACTATCTTCTTTCTAAAATAATAAGATGT
+TGCTATCTTTTCTATATCTGAATGTCCTTTAAACTCTGTCCCTTTTAAAATTTTATCTAA
+TGCTTGTTGTCCATTACAATTTACACATCTAACATCAAATATATTTTCCTCTCTAGTTAA
+ATCCTTAATATATATGTCAACTAAGTCATAGAATATATGCCTTGCTTTTACACTCATATA
+ATCTAAGTTTTTTTCTATATCGTAGATTCTATAAAGCTGTTCTGGTATTTTTTTATATGG
+TGTACTAACTTTTATAACATCATCTCTAGAAATATATTTCCATCTTTCCTCTTCATCATA
+TTCATGCTCCATTGCTACTTCATTTAATCCAGTTACTAATTCCATTTTCAAAGTACATTT
+AGAAGGTTCTAATATCATATCTCCATTATTAACAAAATTCTTATTATTAAATTTATATAA
+TTGTACTTTCCCCATAAGCTTAATAATAAATATAATTAGGAATTATATTTATACTCTCTA
+TATTTCCTTCCCATCTAATTGTATTTTCCTCTAATTTTAAAATAGGAAAATCTCCCTTCA
+TGTACTTATTAGTTGGATTATCTAAAGTATCTTTATAACATAATTCAAGTTTAGAATTTA
+TAGTTGTTTTTCCCATGGTTAAATTTAATTCTATTAAACTTTCATTTATCCATAACTTTA
+TATCTCCTTCTCCTTGTATAGTTATTATTGGTTTACTTTCAAAATCTCCACTATTATAAA
+GCATGTCCCCATTATTTATTTCTAATTCTTCAGCTCCATAAAAACTATATGCAAAAGGTT
+CTAGTGTAAAAGTAACTTTGAATTTACCTATTGTTTTTAATTTTCTTTCTATATCATCAT
+ATTCAACTTTCTTAACTATATAAAAATAAGAAGGATCATCTCCTTCCCATAATTTTTTGT
+CTTTAATATTATCTAGCCATCTTCTTATTCTTCTTACTTTTTCATGAATATTTTTCCTAT
+CAATAAAGTTATACTCTACAACCAAAATTCTATTTTCATAACCTATAATTTTATAGTCAG
+TCCCATCCTTACCATCAATTTGTTGTTCTCTATATCTCTTTTTTAGTGAAGGGAAGAATG
+GTCTTTTTATTGCCTTAATTCCTATTTCTAAATCTGTGCAATTATTGAACCAAATAAAAT
+ATTTATGCACATATTCGACCTCCCTTCTTTCCTTTAGTAACTCTATAACTATTTTCATCA
+CTTTTCATTTGTTTAGCTACTTTCTTATATACTTTAGTACTGATTACTTCACCATCTAAA
+TTAGTTACATTTTCAATTACAACTACTATATTATTATTGTTTGTATTATTAAGTTTTGTA
+TTTATTTTTTCTAAGTCAACATTTGATATAGAAGGTACTATATTAGTATTTATAGTTCTA
+TCCAAACTTTGCTTTATATCTAAATTTATATCTTCCATTTCATTGACAAAACCTACTCCA
+ACACCTTGAGCCATAAATTTACCAACCTGATCTCTTAACACCCTAGATGGAGAATGTATA
+TCTAAAGAACTTTTAAATCCTTCTACAATTCCATCACAAAATTGTTTTATCTTACTTTTT
+ATCCATCCAATAGCACCTGTTATACCATCCCAAATCCCATGAACTATATTTTTACCTATC
+TCTTTCATTTGTCCTGGTATAGCTTTTACTGTATCTACTATAGAATCAACTAACTTTTTA
+CCACTCTCTTTACCAGCAGTCTTTAAATCTTCTCCCCATGCACTTACCTTATTCCAAGAT
+TCTTTTAACCAATTTTTAAATCTTGTTGGTAGTTCTTTAACATGATCTACTATAGAATCA
+ACAAATTCCTTTCCCACTTTCTTAGCTTCTTGGTACATATTATTTCCCCATGTAGTAACT
+CCATCATAAGCTTCAGTAATCTTATTCCAAATTTTATGTGGTAGTTCCTTAACATAATCT
+ATCACTCCATATATAAAATCCTTACCTGTCTTTTTTGCTGAAATATATAAATTATTTCCC
+CATGTCTTTACTTTCATATATGAATCAAGTAATTGTTTCCCTATTGCTTCAGGAAGCTGT
+GCAAACCATTGCTTTATAGAATTTATTGCATCTGGAATAGTTTTAGTGATAAATATTTTT
+ATGTTTAAAAATCCCTTATAAATTTCTCCTGCAATTTTTCCTATCAATATCCCCATAAGT
+TTAGGTAAATTACTAAATATAAATTTTACTTCTTCTATATAATTTTTTATTCTAGTTTTT
+ATTATAGTACCAAACTCTTTTATTTTATTTATGAAGTCTGTTTTAAATTGTGTAAGTTTA
+GATATTAACCACTTAAAGAAATCAGGAATACTTTTAGTAAAAAACTCTTTAATATTTGAA
+AATAATTTGTCCACTCCATTCCTAAATCCTTCACAATGCTTGTAAGCTAATGCAAAAGCT
+CCAGCAAAAGGATTAACTATAAGCAACAAAATTTCCTTCCAATCATTTTTAAAGAAATTT
+ATTAACTGCTTTAATTTATTAGGTACTGTTTCTGTAAAAAACTTTATAAGTCCACTAAAT
+ATTTTATTAACTCCATTTCTAAACCACTCGCAATGATTATATAAATAAGTTAAAGCTCCT
+ACTACTAATCCAACGACTAATATAATTTTTCCTACTGGAGATATTTCAGTAACAAAATTT
+AAAGCTTTCTGTGCTGCTGTTTGTAACTTTGTAGCAATTTTTAATTTTTCCATAACATCT
+CTAAATGCTTTATAATCTTTAATGGCATTTCTTATTGTTCCTGTAACTTTAGTTGTTACT
+GCTAAAGCTCCATAAGAACCAACTACAAAAGCTCCTATTCCCACTACTGCCTTTTTTTGC
+CCTTCACTTAATCCACCAAAAGCTTTAGCTATACCACCTATTCCCTTAGCAGCTAAAGAA
+ATAAATGGTGCTAATACTTCACCAAATCCAACTAGACTATTTTTAGCTAAGTTTAAAGAT
+GTTCTTAAATCATTTCCAGTAGTATTATTTATTTTTGCAAGAGCTGAATCAGTTGTTCCT
+ATAGCCTCATTCATTTTCTTAGACTTATCTGCCAACGTATCAAACTGTGAACTTGTTAAT
+GCTGTAATTGCTGTTAGTCCTTCAGTACTACTAAAAAGTTTTCCCATTTTATCTGATTGT
+CCACCAGTTTCTTTTTGTAATATTTTTAAAGTACCAATTAAGCCCTCACTTTTTAACATT
+GCTTGACCATTTTGGAAGCCATATTTCTCCATTAATTTTTGCATATCTGCTGTTGGTTTA
+ATTAAGTTACTAAATACTGCTTTTAACTGGGTACATACTTCTGAAGTGTTTCCTGTAACC
+CCTGTTAATGTAGCCATATTAGTAAATAAATCTGTCATTGATAAATTTAAATTGCTTGCT
+AGTGGGAATAATGGTTGCATGCTTGAAGCCATTTCTGGAAAAGTTGTTACTCCCAACTTA
+GCTGTTTGGAAGGCTAAATCACTTATCTTCTTTGCTGTTTCATCATTAACTTGATTATAT
+CCTTTCATTCCTGCACTAATTAAAGCAACTGCATCTTTAACCTCTGCTCCACCAGCCTTA
+GCACTTTTAGCCATAGTATCAAATATCTTCTCTGTTTCTGCTCCTCCATCTCCAATTGAT
+GAAATAGCCTGATACATACCATCTGTTACAATCTTCAAATCAATTCCTGTTTGGTTTGAT
+ACTTCCATTATTTTATTTTTATATCCTTCTAAATGACTTTGGTCATCTAAAAGAGTATTT
+ATATTTGCTATACCATCCTGAAACTTCATTTCTGTCACTGCAGCAGCAACACCAAATCCA
+GTAACAGCTATTGCTGCTGGTTTTAAAGCACTAGCTGCCTTCCCTGTAGCATTGCTTACC
+TTGTCCATTTTTTGAGAGAATTTATCTAAATTGATATCTTTTAATTTCTTATCAACCTCT
+TCTAAAGCTTTTTTATTTTCTAATAGCTCTGTCTTAGATTTATTCATTTTCATATTTGCA
+GTATCTATTTTTCTATTAGATGAATCTATTGCTCTTTCATTCCTAGCATATTCTTCTTTT
+AAATCAGCTAAAGATTTTCCTAACTTTTTTGTTTCCTCGCTATTCTTTCCAGTAGCTTCA
+GAACTTTCTTTATATTTTTTAGTTACTTCTTCTATTTTTTTAGATAATTCTTCTCTTTTT
+TCTTTTTGCTTCTGAACATCATTAGTCAACTTATTAATTGCTTCTTTTTGTAAATTAATC
+ATTCTATTTTGAAGTTTCATTTTTTCAGTAAGCTCAGCCTGTTTTACTTTTAATTGTTCA
+TTAGCATTACCAAATAATTTAGCCTGAGTACTTGCTAAATTAAATGTACTGCCAAGAGAT
+TTAAGCTCTCTTACCATATCCTTCATTTGCTTTTGAAAGTCAGATGTATTTGCTCCTATT
+TTTACATTAGCACCCATTAATCAACCTCCTTTCTTCAACAAAATAAAAAGGACTATACAT
+CTGTATAATCCTTGTCTTTATTCTCTTCTAAATATTCAAATTCTGAATTTATATAATCTA
+ATAAATCAACTATAGAAATATCTAAACATTCTTTTAAACTCATGTTACATTGTTTTCTAG
+CAAATCTAAAAATACTATATAATGTGTCAAGAAGATTTTCATATATTGTTATTTCTCTTT
+CTTCTTCATATCCTTCTTCTTTGTCATATTCTTCAAAGATACTTTTTTCAATTTTAATTT
+CCTGTACTGATCCTAAAGATTTAAATCTTTCTACAACTTCATTCTTGATATAAATTTCTA
+TAAAATTAAAAATGTAATACAAATCTTTTATATCTAATCTTTCCAAATTATTTTTTTTAA
+TATTTCCATCAAATATTAAATCTATAATTCTATATATTAAATCTAATCCATTAATCGTAT
+TTTTATATTCAAGATATTTTTTATACTTATATCCAGTTATATCAGTTGCATAAATTCTTT
+TTCTATTGCAAGAAATATTTAAATCACTTATTTCTTGCCCTTCGTAAAAGCCTTTTGTGC
+CTTATCTATATTCTTATCTAGTTTTCCTACTATCTCTATATCACACTTCATAAATTCAAA
+TATGATTTCAGCAACATCTAAATTGTCATCTATATCTTCTTTGGTAAATTGATTATCATA
+TATAGTTACTATTGTATCTTCCATTAATTCTAAATCATCATCGGTATAATCAATTTTCTT
+TTCCTCTTTTTCATTTATCTTAGCTTTAGCTTCAGTATATGTTCTATACTTTTTTCTTAC
+TATTTTTCCACTATCATATGTAGTACCATTTATCTCTATCTTCATAGTTACTCACTCACT
+TTCTTTTCTGTTCCTAAACTTTTAGGTTCTTGAACTTGTCCAAACCATCCATCTAAAACC
+TCTTTTGCACTTCCTGCATCAGCAAGATCCATTTCATCTGCATCCACACCAATATTACGA
+TCTTTTTTTCGTGGTATTATAGTTCCTTTTATTTTTGCATTTTGTCTTTTTCCTTTTTTA
+GCTATTGTTTCTGCCTCTTCATCCTCTTCTTCGCCAAAATTAACTCTATACCACCAATAA
+AATTTATATAATCCATTAGTTAATTTTGTTCTATATCCTATAGCTACATCTTTAGCTTTA
+TCGTCAGCATTTATAGCAGTCATTCCACCTAAATTTTTATGACCTCTTATCATTTCTCTT
+ATTTTTCTTGATAGATAATCCCCTTCGATTTCTATAGTTCCCTCTTCAAAATCATTGTCA
+CTTTCATCTTGAACATCATCAAAATATACTGGTTCATTCGTATATTTTAATTTTGTTTTT
+ACACTAGCTGCCTTCATTAATCTAACTGGTTTACCAGTAGTATAATTTTCAGCACTATCT
+TCTGTTATTGGTGCTACATATAAATCTTTTAATCCTTTTGGTTGTGCCATATCAACGCCA
+CCTTTCTTAATCTAATTCTTCGCTATAATTAAATCTCATAGCTTTATGATAAATTTTCAC
+ATCTACTTCAAATTGATCATTACTATCCTCTAATAAAAATCCATTATCTTTTAATAATTT
+CTTGACCTTATTTTTTAACTTCAATCCTTCTTCACTATTAGTTGTCCATATATCAACTTG
+TATATTATGAGTAATTGAAACTTCTTCATCATCTAAAAAATCCTCTGGAGCTTCTAAATA
+TTCAAAGAATGTAATATGTGTTTTTTTTAGCTCTTCATCATACCAACCTTCAAATACTGG
+AATATCTAAACTACTTAAACTATCAGCTACCAAAGCAATAATATCAAACTCCAATATATC
+ACCTACTTTTCTAATTTCTTCACAAGAGCTTCATAATGATACATAGCAATAGTATCATAT
+TTAGTTTTCAGCAATTTATTAACAGTACCAAAACTATGATGTGGAGGTCTTTTAGTTGTT
+CCCCACTCTTCCATCTTCATATAATAATAAGGACTATTATCCGTTTTATCCCATCCTATA
+ATTACATATAAGTTTCCATTCTTCTTTCTAAATTTAGGTTTAGGAATATTATCACTTGCA
+TGCCCTGGTGGTCTGCTTCCTTTCCTCCCACTCTTAGAATTATCTTTACTTTTATGAATT
+TTAGGCTTTACAGTATCATAAGCTAATTCACTACAATCTTTAAGTATATCTTTATTTACT
+CTTTCTAACCCTTCATTTGTAGAAATGCTCTCTGCTGTTTTTATAAGTTCATCTAATCCA
+ACAAACTCCATATTAATCATTAAAGCACCTCTTTACATTTTAGTTTTATAAAATCCTTTT
+TATATCCTAAGAAATCAGGATAATATATTTCATATTGTCTACCTTGCCATTCAACTATAA
+AATTTTCTTTATTCCTAAGCTCTTCTAACTTTTTGCAATATCTAACTTTAAATATTACTG
+TATTCTCTAATTTCATAGCCATAGCTTCATATAATTCTTTACCATATAAATCTAATACTT
+TTGCTCTACAATCATAAAAGGGAGTTGGCTCCCTTGGTGGTTGCCTTCTCCCTTTAATAA
+TTACTTCTTCTATTTTCTTTATATATATTCTTTCTCTTAGCCTAGACATTATTATCACCA
+CAATATTTCAATTGAGTTATTATTGAATTTAATGCAAATTGAGCTTTATCATTTTTATTG
+CCAATACTAATACTTTCTTCATCATCATACCAGTTCTTTACAAGTAATTTTACTGCTAAT
+GAATAAAGTTTCTTTCTATAATCTTTTTTCACGCCAGCATTTGTTAAATATTCTTCTGCT
+GCTTCTAAAAGACCTAATAAAAGATCATCATCTTCATCACAATCAATACATAGATATTTT
+TTTAATTCTTCCAAGCTCATTTTTAATCACTCTACGCTTTAGCTTCATTTACTTTTACTA
+TTAATCCAAATTTTCTTATTACTGCTGCATCTTCTGATTTTTTTAATGGTGATTCAACAT
+CAAATCTTTCTATAATTCTAGCTATAGTTTGATTCTTAGTATATCCAGCTTCTTTTGATT
+GATCTATTAAATATTGTTTTCTATCCATAAATTTAATTAATGTCTTTAAATCTGCAATTA
+TAAACTTGATTTCCTCTCCTGTATTAAATGTAGTTGAGTCTAATTCAACCACATCTCTTC
+CCTTAAATATTAAACTTCCTCCATCTGATAATTCTTTTAAAAGTGGTCTACCTTGCTTAT
+CCATTAATGCATCTAAATAACCTCTACCTAAAGAATTAGTAACAATAACAGCTCTACTTC
+TTGCATTAGGAACTAATGAATTTATTTTCTCAACCATTTCTATATAATCTTTCACTTCTT
+CAGTAGCTAGTAATTTATTAGCTTGATCTACTACTTCGCTATTTTCAGTATTAACTGCAT
+ATTCTACGAATTCTTCATTTACAAATTCTAAAAAGTTTATTTCACTATCTTCAAGTAATG
+AGTTATCTATCGGTGCAAGTAATCCATAATCATTTATATCATATGACATAGGTTTAGTTT
+TCATCATAGCCTTAACTAATTCTGTATCTTCTTCTAAATTTGCAAGTTTAGTAACACTTC
+CCCCAGCTCTTACAGGTAACTTTCCTGAATTTCTTGCAACTGGTATTACATGACAGTATG
+ATTTTAAAGCTGGATATCCCTCTTTTAATTTTTCAAATTCATTAACAAATTCTTGAGGTA
+TTACAGCTCCATTATTTGTTGCTGACATAACATCTCTTTCTTCTTCACTTAAAGATATTC
+CTCTTACAACTTTACTCATTGCGCTTAATTGTAAACTTCTTTTTTCTTCTTTTGAACCTT
+CTCCACCTAAAACTCTTCCACCTGAAAAGTTACTGTTGCTTCTTTCCTCTTCAATGGCTT
+CCATAACTGATTCTATTTCTTCCTCAATTATTTCCATTCTAGCCTCTATCTTTTCTCTTT
+CAATAGCTTTACTTCTTATTTCCTCTTCCTTCTCTTCTTTAGCTAATGATCTAATCTCTT
+CTACTATTACTTTTCTTCTTTCCTCTAAGTCTTTCTTCTTTGCTCTTAATTCTTTTAATC
+TTTCAAATAATTTCATTTATAAAATCCTCCTAAATTTAAATAATAAAAAAAGAGCTTTAA
+CAATATATAAGCTCTAATAAATTACTTCTTTTTTCTTCTTTTTTCTTTGCATTTATTTTT
+ATTTTTTCTAAGCTTCTACAATCTACTTCAGTATCTTCATAAGCAGGAAATGGTGTTGGT
+GATATTTCATATAACTCAACTTCTAATAAAGTCCTTTTCATTATTTCTTCACCATCTTTT
+TCAACTTTACTCCATTTATCGTCAAGTACCTTGAATCCAAATGAAGTACCATCAACATCC
+CCACGCTTTACACTTTCATATAAATCATTAGCAACTGTTGTATTAGGTAAATCAATATCA
+AACCTTAATCCTACTGAATCACTTTCTAACCTTAAAGTACCACTTTTTGTTGAACCTAAT
+ACATTATCAGTATTATGATTATATAAAGCTTTTATAGTATTGTTTCTTAAACTATTATCA
+AAAGCTCCCTCAGCAACAACTTCTACAAACTTATCTCCCCACCAATCTCTTAATACTTGT
+GATTCAACATTATACTTTGATGCATAACCTGATATTGTTTTAACTCCTGTTTCATCATTT
+GACCTTGCTTCAAAATTTGAAATTATATTTCTTACTTCTCTTTTAACTTCCTTATGCTCC
+ACTATTATCACCACCTTTCAAATATTGTTTTCCAGCCATAGCTATAGGCATCATATTACC
+ATTTATAAGTAATTCATTTCCTCCATCTTTTGGTGGTAAATTTTCTTTTTTTCTCACCTC
+ATTGGAAGCTATAAATCCACTTTGAATACCAATTCTATAAGCTTCATATCTTGTTTTTAT
+ATCACTTCTTAAAATACTATCTACATTAAACTCAATTTTCACATTATTTAAAGTTTCATA
+TTGACTTAATAATTTATCTTGCATCTCTTGTTCATAATTAGTAAGAGATGGTTGAAGTGT
+TGTTATATAAAAATCTTTCTGTTGTTCTGTAAGATTATTAAATGTTGCTCTCTCTAAATC
+ATTAAGATGATATGACTTCATTCCAAATGCTGCTGCTAATTCTCTTTTAGTTAATTTTGC
+ATTTTCTAAAAATTGTGCATCTGCCATGCTTAATGACAAAGGTTGAAATTGATACCCTAA
+AGGAAGTAATGAAACCGAATGAGCATTTGCTAGACCATTACTCATAGATTCAAATTCTTT
+TATAAAAGTTTTCTTTGCCTTTTCGTCTAGCTCTCCTACATATTGAATTATTCCTTTTGT
+AGTTAATCCACTTTTAAAGAATTTATTTATAAACTCCTGAGTAGCTCTTCCATTCTCAAT
+AGTACATTTCAAATAATCAAGTGGAGCTATTCCTATTAATCCATCTAAAGTAATATCTCC
+AATAAAATGTAGTATTTCATCAGGAAGTAACTTATGTTTAATCCCTTTATTGTCAGTTAC
+TATATACCAAACTTTAGTTAAACTACTTAAAAAGTTATTATCATCCATAACTTTAGTTAC
+ATTATCTGAATCAATAGGATATAAACCAATTATCTTTCCTCTTCTATCTCTTTCTATATA
+TGTATACGCATTACCTTTTAAAGTTCTTTGTGCTTCTAAGCACTTCCAAAAATTAATTGA
+GTTCATTAATGGATTAGGCTTATATCTTAAAAGATAATAAAGTTCATGTTCTTTATACTC
+TTCTCTATCCTTGTAAATCTTTAAAGATAATTTACCTATGCTTTCAGCTCTTACCTTAGT
+ACATATATAAACTGTATTTTCTTTTAATACTCTCTTACCTGATATTAAAAATTTTAATTT
+AATACCAAACTTCTCCCAAAAGTTAGAATCAGATATATTAATACCAATCTCTTCATCATA
+ATTACTTCTTTTATTAAATAACTTTTTAAAAAACTTCATCTATTTTCTCCCCCATAATCT
+CTTTAAGAAATCTTCTTCTGCAAATTCACTCACATTTAAGTTTTCTCTTTTCCAATATGT
+TATAGCTCTAACATGAGCGAATATACAACTTGCTAATGGGTCAATTCTTTTAAATCTGCT
+TTTTTTACTTATTTTTATTTCTCCAAAAGAGTTGGAATCAATCTCTGCATTTTGAACACA
+CCAAGTCATAAGTTTATTATCATCATGTTCAAGTTGCTTAACTTTCATTAAATCTCTAAA
+ATTTACAGTAGCTTCATTTAGTTTTGCACAACTTTGTCCACATTCTACACAGGTATAATC
+CTTTCTTTCTAGTTCTCCAACTAACATTGCAGCTCCATGAGGGTCATAACTAACTTCTAT
+AACATTTAGTTCATATTCTTTTACAATACTTTCTATAGTATTTAGAACTGCCCAAAAATC
+TACTATTAAACCATCATTAGCTTCTGTCTTTATTAACCAACCTTTTTTACTCCATAATTC
+ATATGGTACATTGTCAGTTATCATTTTTTCTTTAACTACTTCTGATGGTATAAATGATTG
+TCCAAATAAAGCATATCGTCTAATATTCCCATCTAAATAAGGAAACTCAAAAGCAATTGA
+AGTTAAATCCCCTGACTTTGATAAATCTATTCCAATATAACAATCATGTCCTCTGAAATC
+CTCTAAGGTTAATTCCTTTTTACAAGCTTTCCAGTATTCAACATCAACATACCTTTTTTC
+TCCTGCTGCAACATATATATTACAATTCTTAGTAAAGAACTCTATTCTCTTCTTTTCATT
+ACTTGTATTCTTAGCTAATTTAGCATTTTCCCTCATGCTTTGTATTCCTTCAGGATAAGT
+ACATAAAATTGGATTAGCCTTTAACCAAACTTCTTCATCAAAAGGATCATCTTCTTTTTC
+TAGCTCACAAATCATTACAAAGTATTTATCATTCTCAAAAGTTCCATCTAATATTGAACA
+ACAATCTAAATATTCATAATAACAAGCCGTTTCTTCGTAGTCCATTCCAGCCGTAGTTAT
+TATTACTAATAATGGCTCTGTTCTTGCCATCATACCTGATTTCATAACATCATACATATC
+TGAATTAGGATGTGCATGATACTCATCTATAATAGCCATTTGTGGATTCTTACCATCACC
+AGTTTTACCAGCTTTTTTACTTAAATGCTTCATAAAACTATTACTATTTCTATGTCGTAT
+TTCTTTTTGAGTAAACTTAAATTTCTTCTTTAATGGTTTAGAAGTCATTAGCTCCCATTC
+ATCAAAAACAATTTTAGCCTGATCTCTTTCAACTCCTAAAGTATAAACTTCTGCTGCATT
+ATACCCTTTTGCTCCTATTTCATAACCAGCCATTCCAGCTTCCATTTGAGATTTTGCATT
+TTTTCTCCCTACTTGAATAAAAGCAAATCTAAACCTTCTATAATTTGTATCCTTATGCTT
+CCAAGCTTCTATATTACAAATTACAAACTTTGACCATGAATTTAATATTATTGGTTGTCC
+CTCTAATACTCCTTTTGAATGTTTACAGTAACTATACCACTTAACAATTTTTTGAGCTTC
+CTCTTCATCCCAATAATACTCGAAATCTTCATGCTCCATTCTTTCTAAATCATTTAGAAA
+TCTCTGACAAGCTTGTTTATGTCTTTTACAAGCAACAATTTCACAATTTAGTATTTTATT
+AGAATAATCAATAAGCTCTTCAAGAACTGTATTATACATTTCCAAAATCCTTATTAAATG
+CTTTTTCATCATCATCAATATCAGATGCTTCTTGAATAATTTTTAATCTTGCTGCTGGAC
+TTAATCCAAACTCTGCACCTAACTTTTTAATAACATCAGCATATTGAATTTGAATAGAAA
+TCAAAGGATTCTTTTGAGTTGTTAAAGATCCTTGTTTATTAATATGTGTTACTGTAAGCT
+CATCACAATTTAACTTCATGGTACATTCTATATATTTTTCTATAGAGTTAGCCAAAACAG
+CTAAATTATAATTATCAATATTAGCAAGTATATCTACAGCTTCTAACTCTTTAACAATTT
+TCTTAAAAATACTTTTACCATCTTTGGATAACCATGTTGGTGGTCTTATTTTATCTCTAG
+GTAATTTTTTTAATTTTTCTTCTTGTTCTTGTCTTTTTTCAATTTCTTCATTAGTCAAAT
+GGCTCTTATTACCATTTGCAATAATTTGAGAAACTGAAATCATCTTTCTTCCCAAACCTA
+ACATTACCCCCCTTTAGTTCAAAAAACGAAAAAATTTTTTCTGACATAGATACTGCGACC
+TTTTGACACTCCTTAAAAACTTTTTATACACCCCCTACCCTTTAGGAATTAGCTTAAATA
+ACTCTTCCTGAGTATTTCTTTTAGTAACCATACCTTTTCTATATTTAGCATGTATCTCTT
+GGTGACATGAATTACATAAAGAAAGCAGGTTGCTTGTCCTTAATCCAAGCTCCCTGCTTT
+CCTTTAACTCTATTATGTGATGTACAACATCAGCAACTCTTATTCTATTCTTACTTAAAC
+AAACCTTACATAAACCTAAATCCCTAGCAATAACGTTAGTCCTAACTATATGCCATTCTT
+TAGAATTATAAAAAGCTTGTTCATCTTTATCTTTTCTTCTTACCTTATAATTCTTATGTC
+TATCCTTATTATCAAATGAATGCTTACTACAATAAGTTTCATTTAATTTTATAAGGTTAT
+TACATCCACTATAGTTACAAACTTTTTTAATTTTTAATCGCTCCTAATAAATATTTTAAT
+GCACCTTCAATTTCTTCGTTAACTTTTATCAAAGAAGTATTTTCTTTGTATTTTTCCACA
+AAGTCATCTATACAATCTGACTCTTCCTGACTTTGTGGAATTAATTCTTCTCTTAGCTCT
+GTTGGTCTCATATGATTACTAGCTTCAATATTATTCTTTAACTTAGTATCTTCTACAGGC
+ACAAACTTTAACTTAGGTGTAGTACAATCAACCGTTTTTTTATACTCATCATTCAATATA
+TTTTCCAATAAAAATTCTATTATCACTTCGTGATTACTTTTTTTATCAATCAGTCTTTTA
+TTTTCAATATATAAATCATATATTTTCTTTATAATTATTATACTTTCATTGGTATCATAA
+ATCATTAGTTCATATATTAAATCTTTTACATTTGATTTTATTTCTGGAATTATAAATCTA
+AAATCTTCACTTACTCGCTTAACCCCCCATGTATTACCTGCTTCAAAAATATAATAAAAA
+AAATCTTCCTTAACTGAATTAATATACTCTAATAACTCAGTATAAACTATAATATTAATT
+CTTCTTAGTTTTTCTTTTTGCTCAACATTTTTCTGATTTTTAGAATATTCAATTGAAATT
+AAGACAGCAATTATTGTTGCATATGCTCCTATTAAAGTAGTTACTACTGTAGCACAAAAT
+ATAATCCATTCAGCAACTTTAAAATGATTACCCCATACTTTCCAAATACTAAATAATGAA
+GCATATACCAATATTGATATTACCCCTAAACTTATTGATATATTTTTTATTATGGTTTTT
+TTATCCATTTAATCACCTCAATAACATATTATATATTATTGCAATATCAAGTTCAACAAC
+TTGCAAATAATACCCCATAATACATATTGTGTGGTTTAAATGAATTATCTTCAAAGCTTC
+ATAAAATCTAAGTTTAAAGGTAGTCTTAAAATTTAATGCCACCTCATTCTTTTATGTCCT
+ATTTAATAGATTTTAAAACCTTTAATCATTCTATTTATATGGCTCTGTTCAACCCCTATA
+TAATGTAAAGTTATTGAAGGGTCAGAATGATTGAATATCTTTTGGAGTGTAACAACGTCC
+TTATATTGCATATAAAAATGATATCCAAAAGTCTTTCTTAAAGTGTGAGTTCCTAAGTTA
+TAAAGTCCTAAAGTTTCTCCTGCATCTCTTAATATAGTGTAAGCTTGTTTTCTTCCAATA
+GGTCTGTTATAACCTTTCTTTGATTTTATAAGAAATTGGTCTAAATCTTTTTCATCACAA
+TATTTCTTTATTTCTCTTTTTAATATTGGTGTCATTGGAAATATCTTTTGCTTTCCAGTT
+TTCTTTTCTCTAATGGAAATATAATCTTTTCCTTTAACATCTCTAATTCTAAGACTTAAA
+ATATCACTTATCCTTAATCCTGAATTAATACCTAGTATGAACATAATATAATTTCTTTCA
+CTATACTTTCTTAAGTAATTAGCAATCTCATGTACCTTATTTGAATCTCTTATTGGTTCA
+ACATAGTTCATATACTACCTCACTTAACTAAAATTATTTCTTATTCTATGAAATACAAAT
+AAAAGAAAGAGTTTTTATTATAATTAAAACTCTTTCTTTTATTTATTATGGTACATAAAC
+TCTTACTATTTTATTAGAATCTGATGAATTTATCTCTAGAATTTTTTTTGTTTTTAGATA
+TTTCATCTTTGTATAATGACAATTATATGTTCCAAAGAGTTGAATATCTCTAAAATCATC
+AAAACCATCATCTTCCCACATGATACTTATCTTTTGCGAACTACTATCAAATGCTATAAC
+TATTGAAACATTTGCATTAAATGCAAGTTTCCTTCCTTTTTTTAATAAAACTTCTACCTT
+AGTATTAAATGGTCCATTTTGATGATTATTGGCAAAATAATATTTTTGTAATGCCTCAAC
+ACTCTGTAATTCTTGGTCTCTATCCAATTTTTTTCCCATTATTATCCCCTCCACAGATAA
+TTATAAGTTAAAGTTTTATAATTTTCAAAAAAATTTATTATTTTTGTCTTAATGCTCCAT
+TTACTCTTTTATAGCTACTATGTTTCATACATTCATCAATTCCTTGACAAGGATCATAAA
+TAACTACTTCTTCTTGACACTTTCCTTTTTGATATTTACTACATAATGGTGAGAAAAATG
+AACATGCACATTTAAGTCTGTTCCCTTCCCACAACATATACATAGGTAACTTTCTCTTTT
+CCATTTATCTCACCTCTTTTTTTACAAAGTAAAAAGAGCCAACTATAAAGTTAGCTCTTC
+TAAAGTTTAAGTGGTTATTCATTTGATACTATTATATTAACGCATATAAAGTTAGCTATT
+CAACCACATAATAGTTAGAGTTTAGTCAGAAATTAGTTAGACTTTTTAAATTCATCATAT
+CTAACTCTATTTTCTTAATTATTTTTGATTTTTTGCATATAAGATATTTAGGATTCATCC
+CTAATCTTTCAGCAATACTCTCCATATTCATTCCCCTAAAGTAATATGATGTGATTATCT
+CATACTCAACTTCATCTAAACATGATATTAGGTTTTCTATTTTCTTTATCCTCAACTCCT
+TATTTCTTTTCAAATATTTAAGAAACTGTATTCTCTTTTCCTTTGATAAAACTTCATTTA
+CTACTGGATCTGTTATTTTATAAGTTGTTCCAGTTCTTTCTGAATATTGTAATGCTCCAC
+ATCCTTGATATTCATTTTCTACAGTTGCAATTTCTAATTCCAAAGCTCTTATTTCTCTTA
+CTGTTTCTTTATAACTCTTTAATAATCCTTCTACATCATCCTTAAACTTAATCATATTAC
+CTATCATTTGAATACCTCACTTTAACTTTTTTTATTTAAACTAACTAAGTTGTACAATAT
+ATAGCTTTTGTAAAGGAACTTTCACATCCTTTCATAATAACTTATATCCTAGTTAGTAAA
+AATCTTTTTATTTACTTAGTCATTTAATATTTATTCTCTAAACACCTTCTAATTAACGAT
+ATACTTCTTATTCCTAGCATACCTTTTAATATTTTCAAAATTAAATTTTTCACTCCTGCA
+CCTACTATATTTTTATGAATAACTATCTTATTTTTGAATATAATATTAAATATAATATTA
+AATATAAAATTAACCATTGAGGTGATTAAATGCAAGGTGATTTAACATTACTGATAATCT
+TAGTATTAGCTTTATGCATATTAAAATGTCTTTAATTTTTAATTAAAGCTATAGAATAGA
+TATATATGTATCTATTCTGTTAGATCATATGTTAAAATAAATCAAATAAACACTTCATTA
+ATCACCTTTAAGATAGAGAGTTGTAAAACACAACTCTCTTTTTGATTACTCTTAGTCACT
+ACCTAGAATGGAATATCCCCATCATCAACTGGTATCATATCATCATTGAATTTATCATTA
+TTTACTTTACTATCACTTGAATCAATAAAATCAAATCCATCAACCGCTATATAAGTTATA
+TATCTTCTTGTCCCATCTTGTGCATCATAACTTCCAGTTCTAATGCTCCCTGATATACTA
+AATCTTTTACCTTTAGTTAAATACTTAGCTATGACTTCTGCTCTTTTTGAATAAGCTATG
+CAATTTATAAAATCAGCTTCTTGTGTTCCATCTTCTTTTTTAAAATCTCTATTAACTGCT
+AGTGTAAATCTTGTTACTGCTGTTCCTTTATTAGCAGTAAATCTTAATTCAGGATCTTTA
+GATAATCTCCCAACTAAAACAACTTTATTCATTTAAATCATCCTCTCTAGTCATAATACT
+TTCTATTATTTCTTCCTCTTGCTATGGCAATAGTAGTAAACTTGTATTTATCATATTCTA
+GTTCTTTTGCCTTACGCTTCTTTTTTAAGTCATTAACATATCTAGCAACAAATTCTTCTT
+TACTTAGTTTCATATTAATCACTCCTAAAATTCTGATAATCTTTGAGTTGGCAAATTATA
+ATTTAATTCAACTACTCCAGTTCTACCATTTCTACACTTAGCAAAGTTTATTTCTAAAAC
+ATCATCTACAATATCTTCCTTATCCTCTCTTGCTCTATAATAACCATCCCTATAAAGAAG
+TCCTATTACATCAGCATCTTCTTCAATGCTTCCAGTATCTCTTAAGTCTGATAGTATTGG
+TCTATGGTCTGCCCTTTGCTCTGATGCTCTTGAAAGTTGACATAATGCTACCATTGCTAC
+ATTTAACTCTTTAGCCATAGCCTTTAATGAATTTGATATATAGCTTGATTGTTCATATTT
+ACTTCCCTTTGTTGTCGGTCTTATTTTTCCTATATGATCTACTATGATTACATCTAACCC
+ATACTTTATTTGAATTTCTTTAGCTATTAATCTTATTTGATTTACTGTTATTGATGCAGG
+TTCATAAACAAATATGTTATTCTTCCTGCTTAACCTATCAAAAACATTTAATAAGCTATT
+CATCTCAGAATCATTGAATCTTCCTCTAGCAATCTTTCCATTTTCTATACATGTATTTGA
+AGCCAATAACCTTTGTCCCATTCCTTCGGTACTCATATCTAACTGAATATAAAGAACCTT
+GCCTTTTATATTTTCCATTATTGATAGTGATAAAGCTGTCTTTCCCATTGAAGGCCTTGC
+TCCAAATACAATAAAGTCTTTTTTCTCTAATCCATTTGTCGCATTATCTATTTTTTGAAT
+TCCTGTACTTATTCCAGTTAATCCACTTTTATTATTAAAAGCTTTTTCTATCTTATTTAA
+AGTTTTCTCCATTACCTCACTCATTGTATAAAATTTATCTTCTCTATCTGATGAATTAAG
+CTCAAGCAAAGTATTTTGTAATAAATCCACTTTTGATTCAATACTTCCACCATCAGTTAT
+TATACTTTTACAAGCAACAATTAACTTTCTTTCCTTACTCTTTTCTTTAACTAAGTTTAA
+ATGACTATCAAATGTACCTCTTGATGTGTGATATGATATTTCAGTTAAATCAGATAAGGT
+TATAGCTTGTGCCTTTATTTCTTTGGATAACTTCTCAGCGACTATTGTTAAATCAAAACT
+TATGTTATCCTTAAACAACTCTCTCATAGCTCTATATGTAATTTTATTTTTAGAGCTATA
+AAAATCATTATCTTCCAAAGAACCCATAGCTTTTATCATAAAATCATTATCTTGTATAAT
+AGTTCCTAAAATAGCTTTTTCACTATCAATAGCATAATTACTCTCCATACTCTCACCTTT
+AATAATCAAAATTACCTTTCTTTATATTAAGATTATCTTTACTTATTTCTTTTGTTCCTG
+CTCCAAGCTCTTGATTTAAATATCCTTCAAACTTATTACCAAATAAAGTTTCAGGCCTTA
+AATATTTCTCATACTCTGTACCTTTCCATTCAGAAACTTTATTATCTATAACCTTAAAAA
+ATTCTTCTTCATTGAATCCTTCATCTAATCTAGCTTTAATTAAAGATTGTGTCTTTCTAG
+TAGTAGCTTTATATGATTTTCCAGTCTTTGAATTGAGATACTCTATAACTCGACTATATA
+TAATATTATTTATATCTCTTATAGAAGAATCTTTGTTGGGATATATTGTCCTAACCCTTG
+GGACACTTTGTCCTAACCCTTGGGACATTTTGTCCCAAGGTATATATTCTGTTAAGTTAT
+CTAATTTTGAAGTAACATTTATATAAGAAAATTTTCCTCTTATCCCATCTTTACAAAATA
+AAACTTTTCTTTCTATTATCTTTAAATCATCAAACTTTTTTAATCTTCTCTTAAGACTTC
+TTTGAGTTCCTATTATCGGTATTTGTTCTAATAAATATCCCTGATCTATCCATATAAAAC
+GCTCTCCATCAATAATTTGAAACTGCATATTTTTACTTGAATACATATCTTTAATTACTG
+ATAATATAAGAGCATCATCATTATCTAATCCTGATTCTATTAATTTTTTCTGACTAAATC
+CATGAATTGTGTATTTCAATTTTATACACCTCTTTTCTTGCCTAAATTAATCTTGGATGC
+TAAAATTAAATTGTAAGTATTTTTGAGTGCATTGATTGCTTTGGTCGGTATCAATACACT
+TGTTTAGAGCTTCTTTACATGACATACCATTTAAAGAAAGCTCTATTATTTTTTCAATAA
+TTTTATTCATCTCAACTTTATCCATATTTAAACCCTTCTTACTAGCATTTCTGCTTCACT
+CAAAATCTCTAAGAATTTAATTTGTGATGTTTTCTTTCCAAAGCCAAGTCTATTAAATCT
+GATATCCTCTTCTGCAATACATAAAATAGTTTTAAAATCACAACTTGAATATTTGTTTTT
+TAATCTTTGAATTGCTTTTAATACCATAATTACCTCCTATAGCTTGTACAAATTATTTGC
+ATTGTATTATTTCTTTAGCCTTTTCACTTTCAATCTCTATAGCCTTTTTAGCTAAGAAAC
+TATTGAATTTTTCTATAGCCTCCATAGATGGTTGTTTTAATATTCTCACTTTAGTTGTTC
+CTATATATCCATCTGTTATAAATACATTTCCATCTTTTATAATTTTCTTTGGAAATAAAC
+TTCTATCCCAATCTTTAGGATCATCTTTTTTTCTTCTTGCCATACTACCTAATCCTCCCC
+TAAATATTTTTCTGCTATAAGTCTCATTTCTGCTGCTCTCTTTTCTAATTTTGAAAAGAA
+TTTTACTATAATTTCCAATTCTTTTCTTTCTGATACATCAATTACTCCATCTTCAACTAT
+TTTTAATAATGTCTTCTGAATATTAACACTATCATCTAATGTATTAGCTACTGAAATTGC
+AAACTTATACAAATTATCAATATTCTCTGATTCAATTATTGGAGTAATTCTCTTGCCAAT
+AGGACATTCATTACAACAATAATGATTTAAAAGTTCAGGAGCATTATATGCTTCTGCCAT
+AATAACAACCTTATCTACTGGAACTACTTTACAAAGGTCTAATTCATAATCAGTTAATGA
+ATCCTTTGAAATTCCTAAAAACTCTGAAGCTCCCTCCCTACTTGAAAATTTAGAATTAAA
+TTCAGCAGCCTTTTTTCTTGCAATACAATACACATTATTAGCTGCTTTAGTTGGTTGTTT
+TGCCATGTATTTTCTTCTCCTTTCATGTGATAATCAAACTACACAATAAGTGTAGTTAGT
+TTGCAAAAAAAATTTCATCTAAAGTACATCTAAATTTACTTTTAAATTTTTTCAAGAAAT
+TATAACTAGGATTTCTTATTCCCAATTCAATTTTAGTGTAGTACGATTCGGAAATTCCTA
+GTAATTTTGCTATTTCACTTCTGCTTAAATTCTTACTTAGCCTAAATCTTTGTAAACTAT
+TCATGTAAACCTCCTACACTTATCGTGTGATTTAAATATACTACACATTTTGTGTATAGT
+CAAGTTTTTTAACACTTTTTGTGTTTTAATCTTTTTATAGATGTTTTTAACTTCACATTT
+TGTGTAAAATATATATAAGGATGGTGAATATAATTGTTTGGAAATAGATTAAAGACTTTA
+AGAAAAGAGAAGGATTTAACCCAAGCTCAACTAGCTAATATATTAAAAACATCAGCTAGT
+GCTATTGGAATGTATGAGCAAAATAGAAGAACTCCTGATACAGAAACTCTACAAACTTTA
+TCAAACTATTTTAATGTATCTGTAGATTACTTAATTGGAAAGACAGAAATACGAGAATCT
+GCTGAACAATTATTAGAAGATAAATCAGTTACCATTGCTCTACACAATAAAAATGGTATT
+GATGATGAGCTTCCTGATGAAGCTAAAAAGGAAATTGAAAATTTTATTGAATATGTAAAA
+CATAAATATAAAAAATAGTTTTTATAAACTATAAAAATAACTGATATTTATTTGGAGGAG
+ACATTTTAATGAGTACTTTTTTTACAGATATTTCAATTGACAAACTTATCGTAAACCCTG
+AAAATTATAGATTTGATTCTGTTGACAATGAAACTTCAGCAATAAAAATAATGTTACAAA
+ATCATAATAAAGCAATCAAAGAATTATTAAAGGATATTTTAGAAAATGGACTTAATCCAC
+TAGAAAGATTATTAGTATTTAAAAAGAATGAATTTTATATTGTATTAGAAGGAAATCGAA
+GGGTAACTGCTCTTAAAATAATACATAATGTGAATCTTCTAAAAGATATTGAACAAAAAT
+ATTTTAATGAATATTCTAAAATACTTAATAACGCTAATTCTAAAATCAATATTGATAAGA
+TTTCTTGCGCTATAACAGATAATATTTCCGATTCCAATAAATGGATTGCACTTAAACATA
+CTGGATCTAATGGTGGAAAAGGTACTATTCCATGGGATACAACTCAAAAAAGACGATTTT
+TAAATAAAACAAATCCCAATAATTCATCTAATATAATAACTTCATTGTTCTCTTACATAA
+AATCAAGTAACATTTATGATGATACAATAACCCAAAATCTAACTAATATACCTATAACTA
+CACTTGAAAGAATATTAAGTGATCCATATGTAAGAGAAAATATTGGTATAGATATTAAAA
+AAAATACTATATATAAATTATATCCAGATAGCGAAATAAAGAAACCATTGTCAAAGATTC
+TACACGATTTGATAAATAAAACAATTGTAGTAACAGATGTTTATACTAAAAATGATAGAT
+TGGATTATATAGAAACTTTTAATAGCAACTCACTACCTAATTATGCAAATAAATTAAATA
+AACCAGTTGAAATATTATCTAATTTAAATCTTATCAATTTACCTTTACAAACAACTATTG
+ATAATAACTCTAATAATGATAATAGTGCTAATACCGATAATATTAACTCTAACAATATCA
+ATAATAGTGCTACTACTAATAATACTAGTAATAATACTAGTAATAATACTAGTAATACTA
+ATAATATCGCTAATATTGATAATAATAACTCTAGCAATATCAATAATAGCACTAATAATA
+ATAATAATAATAATAACAATACCGGTAATAGTAGCTCTATCAAATCTACTTCTCCAAAAA
+GAGATAATAAAGATATTAATAAAAGAAAAGCTCTAATTCCAAGTACATTTCATGTTAAAA
+TAACTGTACCAAGAATACAACAAATTTATAAAGAATTAAAAAAATTAGATGTATCTGATT
+TTCCTAATTCAACCTCAGTTCTTTTTAGAGTATTTTTAGAATTAGTTGTAGATGAATATA
+TAGAAAAGCTTAATTTAACTGGACTTTCAAATAACGATAAACTCAATAAGAAAGTACAAG
+CTTGCATTGATGATTTAAAAAGTAAAAATTTAATTGATAAAAACAAAGTAAAACCTATTA
+ATGTAGCAATATCTAATCATGATAGTCTATTTTCAATAAATACATTTAATAGTTATGTTC
+ATAATAAACATATGCTACCTGATGCAACTAATTTAAAAAACACTTGGAATCAATTTGAAT
+ATTTTATTTTAGTTTTATTAAATTCAATCACAAAATAATTTATGGCCAAAGTTTTATTTT
+TATGATAGACTTATATTGTAATTAAATGACTAAGGAGTTTACTTTATGAGCCTAAAAAAT
+TATTCACCTCTAAGATACCCAGGTGGAAAAAATAAGTTATCAAAATATGTAGGTAATTTA
+ATAAAATTAAATGATTTAAATGGTCATACATATGTTGAACCATTTGCTGGTGGAGCTGCT
+GTTGGTTTATATTTATTAATTAATGGTCATGTTGATAATATAATAATAAATGATTATGAT
+AGATCAATTTATGCATTTTGGCGTTGTGTATTGTCATACCCAAATAAATTTTGTGAATTG
+ATAAAAAATACTCCAATAACAATGGATGAATGGTACAAACAAAAAGAAATTCAAAACAAT
+AAAAAAAATGCTAGAATTTTAGAATTAGGTTTTTCAACCTTTTTTCTTAATAGAACTAAT
+CGTTCAGGTATTATAAAAGCAGGTGTTATAGGTGGCTATAATCAAAATGGAAACTACAAA
+ATGGATTGTAGATTTAATAAAGAAGATTTAATAGAACGTATAAAATTAATTTCTCGTTAT
+AAAAGACATATTAAACTTTATAATTATGATGCTATTGAATTAATTGATAAAATTATTAAA
+CCAAACTCTGATAAAACTTTTACATTTTTTGATCCACCTTATTATAATCAAGGTTCAAAT
+CTATATGTAAATTTTTACAAACATCAAGATCATGTGAATTTAGCAAATAAAATTAAAGAA
+TTAGATCATACTCACAAATGGATTGTTACATATGACAACACTCCTGAGATTTTTAATATC
+TATAATGATTTTTCTTTTATTCAATATCCATTAAAATATACTGTTGAAAGAAAATATTAT
+GGTGTTGAAGTTTTATTTTATTCAAAATCAACTATTATAAATGCATTTGATAAGAACTAG
+ACAACTTTAATCTAGTTCTTATTTTCACAGTTTATAAGAACATATGTTCGACCTTTAAGT
+AAATAGATGCTATAATTATCCTGTAAATAAATAAAATGGATGGTGGAACTAATGAAAAGT
+TTAAGTGATATTTATAGTGTAATTGAAGATGAAAACATAGAATTAGAAGAAGTTTATTTT
+AAGTCATCTAATATCGAAGGTATATATTTTAAAGTATCAGGAATGAATCCTATAATTGGA
+ATACATAAAAATTTACTTACTGATACTAGAAAATATATATCTGTGTTAGCTGAGGAACTT
+GGCCATCACTTTACCTCCTCAGGCAATTTAACATCTGAATGTATAACTTACTCTGATAAA
+ATTAATAGAAGTAAGCAAGAAAAGAAGGCTAGAATGTGGGCTGCTAACTATTTAGTTTCT
+GATGAAGAAATAATTGAAGCTTTATTACACATATCTGGTACTTTAAGTGGATTGGCTCTC
+CATTTTAATGTTACTGAAGAAATTATAAAATATAAGTTATTATCACTCTACCTAAAAGAA
+GATAAGTTTAGGATATCTAAATTAATGATTATGGAAGATGAAATAATTTATAATTCTTGT
+TCTGTTTAATGGAGGTCTATTATGAAAAAAGTTGCTATTTATTCAAGAAAATCTGTTTTA
+GTTGAAGGATCAGTATCAATAGAAACTCAGATTAATATGTGTAAAGATTATATAAATAAT
+AAATTTCCTAATGCTAAATTTAAAGTTTTTGAAGATGAAGGTTTTTCAGGTGGAAATACT
+AATAGACCTGCCTTTCAAAAAATGCTTAGAATGGCTCAACTAAATGAAATTGATATAGTT
+GTTTGTTACAAAGTAGATAGAATTGCTAGAAACACTTTAGACTTCTTAAAAATATTAGAA
+CTATTTAAAGAAAATAATGTTGAACTTATTTCTATAAGTGAAGGTTTTGACCCCAATACT
+CAAATGGGAAAAGTTATGTTGACACTATTAGCTAGTTTTGCTGAAATGGAGAGAACTAAT
+ATTCAACAAAGAGTAAAAGATAATTTATTATCTATAGCTAAAAAAGGCAAATGGACTGGT
+GGCTCCCCTCCTACTGGATTTAAAAATGGTTTAAATGGTGGACTTGAATGGAATAAACAA
+GATATGATTTTAGATGTTTTTAATATGAAATATGAGAAAGAAAAAAACTCTAATATTATT
+AAATATATAAAAGAAAAATATAATCATAATTTTCTTGGGGGAACTTTAGCTACCACATTA
+AGAAAACCTATATATGTTAAAAGCTCTCCCTCTGTATCTTTATACTTAAAGACTAAAGGA
+TATATAGTTCAAGGTGATGAAGATAATATACATTCCTATCTAACATATACAGATAAAGAA
+ACTAAATATGCTATTGTTAGTGATATAGTTGGATTAATAGAGCCTTCTATTTGGATTTCT
+ATAAATAAAGATATGGATAAAAATATATCAAGAGAAGGTAATAGATTTAGTGAGAAATTT
+TGGCTTACTAAAACAGTTAGATGTAAGTATTGTGGTCAAACATTTTGTGGACAAACCAAA
+ACAACTAAAACCAAACATTATAATAAACATGGTGAAGAAAAAATATATATTTCTACTTAT
+AGTTATTATTCTTGTAGGGATGCTGTTCGTGGTAAATTAAAAACTTGTACGAATACTAAA
+AGAGTTAAACAAGAAATATTAGAATTTAAGGTATCTGAACTTATACATTTGCTTAAAGAT
+AAAAAAACATTTAATTCTTCATATTTTTCTAATAAAATAGATAATTCTTCTAAAATAGAT
+ACTATAAAAAAACAAATAAAAAGTATTGATAAAACTATAAATAATCTTACTGACAAAATA
+GCTCTACTAAGTAATGAAGCTTCCCTTATTTTTATATCTAAATTAGAAGAATTAGTAAAA
+GAAAAATCTATATTAAAAGATAATTTGCTACAACTAGAATTACAAGAGCTTAATTCAAAT
+ACTAAAAAAGATAGCTCATTAGTCTATAATAATATACTTGCATTTAATGATGATCTTAGT
+GTAGATGACAAAAGAAAAATAGCTATGAGTTTATTTAAAGAAATTATATATGATCCTGAA
+ACTGATTCTTTAGATGTTACTTTCATGTAACATCTATTTTTGTCTAAATAAACATTGGAG
+AACATCCACCACGAATATATCCAGTATATTTCATTATATCCTTAACTGCTATCATTTCAA
+CTTTCTTTTCTCCAGCTATCTTAGCAGCATTTTTTAAATCTAATTCTTCTGCAACTGGTA
+TAACAAAAACATATAACTCTTTGCTTGTTCCTTGAGCTACTAAGGTTTTAAATACATTTT
+TCTCATCTACTCCAATTTTATGAGCTACAGATATTCCATCTATCTTTCCATCTTCGCTTT
+CATAACTTAACATTTCATATGAAACCTTTTTAGAATCTAATATTCTCATAGCATTTGTCT
+TAAGCTTCTTATCTTTTGCCATAATTTTCACCTCTTAAACTTAAATCATTTATAATTATA
+CAATAAAATTCTTTAAAAACTAAGCTTAACTTAATATTATCTCAGATGAAGTTAATATAA
+ATTAAGATATTTTGTGTCCATATTTTCAGTATATAATATCAAATCTTATTGAACCAAAAT
+TCTAGATTAATGGTAAAATACACTAATTATAAACTCTTAAATCTAGTAAGATTATAAAGA
+TTCTATATAAATAATTTAGAAGATAAAACACAAACTCATCTAGCCAAAGCTAAATTACTT
+AAGCTAAATAATTATCTAGATTTATTCTACTTATTTACTTCAAGGTGGTCATTTATGTCA
+TTCCTTTTCTACACATATATAATAAAAATGCTTTCATAATAAATTTATTATAAAAGCATT
+TCTTTTTATTTGTTTAAATCTTCAAATATAGCTTTATCATTATTTGAAAATTTGTTTAAA
+TCATTCGATTGTATAAGATTCCCATTGGCATAGTTTAATTTAGTATAACCTTTTTCTCCT
+ATAGTATAAACATATGGTTCTATTTCTTTATAATTTGATATAATATCAATAGCGTCCTGA
+TTTTTAGTATCATACAAATCTAATTTTTTATTGAAATTTTCATCAGAAAATTTATAGATG
+GCAAACTGTCCATCTACACCAAAGGATTCCATAGTATCTCTATCTCCTGTAGAAGAGTAT
+CTAGATGCTTCGTTATTATTTCCACAACCTAGAAATAAAAGAGCAAAGCTTAAAGCTATA
+AATATTAAAGAGACTTTTTTCAT
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_009012.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_009012.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3000 @@
+>NC_009012.1|provirus_1938476_1983993
+TTACGAGCAGGAATTATCGTAACATTCCTGGTTGTCATCTAAAATCACCTCGCTCTTGAT
+AAGACTATAAGCATACTCTGCCTGCTGAAATGGATCATCGTATAGATTATCTGGCATTGA
+AGCATGAAACCTAAAATTCAGGCATTTCTTTTCATTTCCTTTATGTTCATAAATCCTGCC
+AAGCGCCTCAGCTCGTCTGCGTCTTTCAAGTTGTGCTTTTTCGAATGTGTCCCTGCTGAT
+AATTGGCGGATAGAATTTATCCTCAACATACCGTTTATCTGAAAGCATTCTTGCAATAGA
+TGTGTGGTAACGCTTAATGCCCGCTTTTTGAGCCGCCTCGGCTAAAGAAAGCCCGGAAAG
+ATAAGCCTCAAATAGTTTCTTAATTTTAACTGCTTCCTCTTCATTAACGACAGCCCTGCC
+GTTTTGAATGGTATATCCAAAAGGTATATGGCTCATCATTTCATCAACCTTTCCCTCAAG
+TTCAACCCGCATTTCATTTTGAAACCTATTTCCTCCTGTGAAAACACAATGATTTCTTCA
+ATAAAGTTCTCAAATATATCGCTATCAAATGCATCAATCTGCTTTTCAGCCTTCGTTGCA
+AATTTAAAAAGCTTTTCTACCTCAACAAGAGTAGTCATGCCTCCATCGATTACGCGTTTT
+AATGCTTCTCTTTGTTCTTTTAATAAAGCCGCTTCTTTGAGCAGCTCATTTTTCTGTGTA
+TTAAAAAGAGCGGGTTCCAGGTATCCTTTGGCCATAAGTCCCATAATCACCTGAACTTGC
+TCTGTATTTTCTTTGATTTTAGTTTCCAGTTCCTGAATCTTAGTTATGTTATCTGAGTAA
+TTTGTTTTCTTTAAGCTTTGCAGCAATGGCCTTAGAATGAACTTATGTCCGAAAATAAGC
+TTATTGATCATTACAACGAAGGCCTGATGGATCGCATCCTCTCTGACAAACTTCATGGAA
+CAGCTTGATGCGTCCTTTATATGCTTTGTGCAGCACCAGGCAATGTATTTATGATTACCA
+CTGCCATGAATTCGACGCTTAAAACTGCTGCCACATTCTGCGCATTTGATTTTCCCCGAG
+AAAGGGTAGCGGTTTTGATATTTACTGCTTCCCTTGATTACGCCTTTTTCTTTACCTCTT
+TGCTTCAATATTTCTTTGACGGCTTCAAATTCCTCATGGGATATAATGGCTTCATGATGA
+TCTTTTATCATGTATTGATCTTTTTCCCCATGATTATAATGCCGTTTAAAATTCTCATCT
+GTATAGGTCTTTTGCAGAAGGACATCCCCAGTATATTTTTCATTGCTTAAAATGCCGCGG
+ATAGTTGTCGCTGTCCAGTGTGAACCTCTCTTTGTTGGGATTTTATCCGAATTTAGCCCA
+TCTGCAATTTTCTGTGTGCCTTTACCGTCCAAAGCCTCGGAAAAAATCCGCTTTACGATT
+TCAGCCTGTTCTTTATTGATAAATAGCTTTCCATCCACATAATCGTAACCATAGGGAGGA
+TACGAAATTTTGTATGTTCCGTTTTGGAACCTACGTCTGATAGACCACTTACTATTTTCT
+GCAATGGATAATGACTCGTTTTCTGCAAGACTGCTCAAAATTGTCAGCACCAATTCGCCT
+TCCATGCGCTGTGTGTTTATATTCTCTTTCTCGAAATAGATGAAAACACCGAGATCGGTA
+AGTTTTCTCACCATCTCAATACAGTCGGTTGTGTTTCTGGCAAATCTGCTGACCGACTTG
+GTTATAATAAAGTCAATTTTCTTGTTTTCACAATCTGCAAGCAGCCTTAAAAGTCCAGTC
+CGATTCTCCTTTTTTGTGCCTGATATGCCTTCATCATAGTAAATCCCTGCAAATTCCCAA
+TCAGGATTTGCTTTTATATAGGATTCATAATGGTCTTTTTGTGCTTCCAGGGTTGCCATT
+TGTTCATCACTGTCTGTTGAAACCCTGCAATAAGCCGCTACCCTCACCTTTGGCTTGAAA
+GCTTGGAGAGCATTGTTCCCATCAATCCTCGTTACCTTTCTCACTGTTTTCACCTCCTTT
+GGGTATGTGACATGTTACCTCTTTGTGCCGCTAATAGCAAGCCAATTAGGCCATAAGCTG
+TGCATACATCGGCGAGAAAGTTTTGCGGTTCAACTTGTCGATTTTGTTGAATTCTTCTTC
+TGAAATCAGTCCCGCCTTAAGCATCCTCTGCAGAATTTTGTACGCCCGCCAGTAATCAAC
+CTCTCTTTGAATTTCCTCCTGTGTTATCTTTGTATAGTTCGTTTCCTGCGGGTTATATGG
+TATATGATTAGCCGTCTCTATCATTCAAGAAAGCACCTCCTATAAAAACTTAGGACAGCC
+GCGATTGGCTGTCCTTTATCGTTATTCCGGCAATTTCAGAACTTGTCCGGGGTAAATAGT
+ATCTGAAGTCAGGCCATTGAGTTTCTTAATCTCCGGATATCTTGTTCCTCTACCAAGTTC
+TTTTTCCGCTATTCTCCATAAGGTATCGCCTTTTTGCACTGTATAGGTTCTATTGCCCTT
+GTTATCAGGAATGCTGTTTACAATTACAAGGTTTTCTTTTGCTACCCAAGTGTTTATGCC
+TGCGATTTCTTGACCGCCGGATTTCTTAACCTTTTTGCCAAGCAATACACATTCTTTGCC
+GCCTTTTATGACCGGCTTGCCTTTGTATAAAGTCTGTGTGACCCTGTGGTAATAGTCATT
+TTTGACCCACGTTGGAACTTCCACACTGCCGGGGTAGTAATTCTTTACACTGACCTTAAA
+CTCCACCATATCTCCAATTCCAATATCAGTATTGTTATCTGTACTGTTCTCCAGCGCTTT
+TTTCACTGCTTTTCGGAAAGTGTCCATATTCTCCCCATGCTTGGGGAACCAGTGCATCAC
+ATCAGCATGGTTGCTGGCAATACCGAGCTTGTATCCTTCGGAGTGGCAGATGATGTCATT
+CTCGTCAAGTCCGTACTCCCTGCAGAGCATAACGCAGAGTTCAACCGCATTCTGCCACGC
+TTTAAAGAAATAATCTTCCTGCTTTGCTGCATCATAACCCACCATCACCGACCCGGATTT
+ATACGAAAACCCAGCAGGCTCACAGATTTCAAAGCCAATATGGGTATTGTTTGCTGCTCC
+TCCCGCATGCCACCCGCGATGATCCCAAGGCAGGTATTGCCAAACCTCTTTATCGTCTAC
+AAAAGCGTGAACACATACCTGCCTATTTATTTCGCCGGCCTTGTAAGATTTGTTCCAACG
+GGAAAACCACTCAGCCGCCATTACACCCGGCACAGCCGTCGAATGTACCATGATTCCTTT
+AGGCGTGATTTTCCGACCTGCTGTATAGCAATCGTTTCGCGTCATGTATTTTGTAAAAAG
+CTTCATTTCTTTTCATCCTCCTCATTTGAGTGGCCATGCAGTTGTTCCAATGCGTTCTTC
+AGCTTTTCAGGAATGGGCAGTCCTATATGTGCTGCATTCTCAAGAATTGAAATTCCCTCG
+TTACTCAGGTAAAAGAAAATCACCGCTGTCCGGATTGCCCCTCCGTTGCCGAGAACCTGG
+CTGTCGATTATGTGTCCCACACCCACAAGTACAAATATAAGCACTTTCTTAAAGATGCCC
+TTGGCTCCGACTTCACTCGAAAGCTTTCTGTCTACAACGGCACACATCACTCCGGTCACA
+TAGTCAATGGCTACAAAAGCGATGAGTGCATATAAAAATCCATCCAGCCCTCCAAGAAAC
+CAGCCAAGAAATCCGCCAATAGCAGTAAAAACCGCCTGCGCCCAGTTCCATACTGTTTTC
+ATTGTCTTAAACCTCCGTTCAACTTGAGTTTTGCATATAAAAAAGCGCCCTGCCTTAAAG
+CAAAGCGCTGAAAATTAAAACTTCTAATCTATATTTGCTTCGGAAGCGCCTCCCACAACC
+GCATATCCTCCTGCCCAAGAGACCAGATGGCTATACCTCGCAGTTTCCATCGATAAGCCG
+CTTCGTTTGCCCAGTAAACAAGGCTGTCCACATCCTGATAATACAGAATAGAAAAACCAT
+CTGCATCTCCGAGGAAGAGACGGGATATCCAGATATTGATGTCTTTCAGTATAATCTTTA
+CTTCATAGTCATTACCGCAAGAAAGAGCCAAAAGTTGTGAGTGGAAGAAGTCATAGTCCA
+TCGAAATGTCCTCACTGCGAGTTATCGATTCCTCCACATCGTTATTTACTGAAAACACCT
+GAAATTCATCATCCCACGTGACACCAGTGCGAGCAAGCCTGCCAAAGCTGGTTATATTTC
+CATCCGGAAGTTCCACATCAAAACGCTCGTATGGTTCATATACCCATGCATCGCCCAGTC
+GCAGCAGCTCGCATACCGTCCGGTTGTCCGAGCAGTAACCTACATAACCACTACCACCGG
+TTACATTCACTGTGAAGCGCAGGGTTGAAGCTGCACCTGAATATACTCTTACCTTATTGC
+CGCGTTTTCGCATCTCTATAGTATACATATTCGGATTAGCACGAAGATCGGCATCTACAG
+TTTTTGAGAAACTGGTGGAATAGCTACCAAGCAAGGAATTACCTTGATAAAGCTCGACTC
+TTTGCGTGTCATAATTTAAGCAGCAGAAAATATCCCCAAGGAACACCCCAGCCCGTCCAC
+TGCTATTTTGAGGGAAAGCCAGCCTTGCCCGGATATGAATATCGGAAAACCCGTCGTATT
+TCCATGCAAGTTTGCCATATCCCTCGAGCTGGGAATATGGACGGTTTTCTGTGCTGTCTG
+GGTCTTGCCAAACATCCCATTCGCCATCCAGCACAGTCCAGTAGTTTTCAGGCAGGATGT
+TCCTGTCTCGAAAATCCTCATACCAAATAAGCGCCGAGTCGGGTTTTCTTCGCAACATTT
+CAAAGGTCAGTTTAAAACCTCGATCCGGCTCAACCATCACACCATTTACATCCTTGAACC
+GACGAGGAGAGAGCATAAAGCTGGCTTCACCGGCAAAGGGATACTCCGAAAATCCACTGC
+AAACCCTAAAACCGTAAAACTGGACTCCCGGCACACCACCGCTTATGCTGATAGCATGCG
+TTCCCTCTTGGAGAAATACACCTTTTGCAAGTGTCAACCAGCAAACTCTTCTCCAGTATG
+GCCACCATAAACGGTTCTCGCTGAAAGTCTTTGATATACCATCAAGGGAAACAATAATCG
+CATTTTTGTCCCAGTAAGGAAAGCAAAGCTGTACTGCAATATCGTAATATCCCGCTTCTC
+TTATCTCAAAACGGTACTCTGCTGACGCCTGGGCATCTCCCAGTGAGGTCATCTCATCAG
+TAATAATGACATTTCCTTCGTATTCATCCGGAACTCCGTTCCTGTCAATATAAATGGTTC
+CGAACTCCGCTTTCTGCTCCTTGCCATAGCTTGTCAAATATCTTCGCCTGTTGTAAACCC
+CTTTTAGCAGCGGATATTCCCAGGATACAGCATCCCATCCTTCCATATAGTCATATACAT
+GAGGAAGAGCCCAAGGTACTTTGTTATAGTCATCCCAGTAAGCCACAATTGGAATAAACG
+GCTGGGGCGGTGCATCACCTGTGAAATTGTAAACCCCAGTCATCCAGTATTTAGCCGCAT
+AGTAGGTATTAGACACTCCTCGATAGGTTATTCCGAGGTTTTCAGGCGTATCATGGATCC
+TCCAGTTCCAGCCATAAGCAGGCAAACCCATGAATATCTTGTCCGGCGACATAACGGAAA
+CAGCATAATCATATATGCCCTCAAGCCAGTCACGGGGAGATACCGGACCGGGAGCAGAAC
+CCGCCCATGCCATGCCGTAGCTCATGATGGCGGCGGTATCGCAATAGTCGTTAAGATCGG
+CATAAACACACCAGTTTTCACCGCCCACCGAGCCTTGAACACCGATCATACCCGGCAGGC
+AGATGTTGACAAGCTTTGTTGCATCATAAGACTTAACTGTATTGTATATATCCCTAAATA
+GTGCATTCGCCGCATCCTTGTTTTCATAACCGCCGCCGCGCTCCAGGTCAATATCTACCC
+CAGCGCACCATGGATACTTGTTCATTATTCGGATGATTTCAGTGAGAAACTTATCCTTTG
+CACCGTTTTCGTTGTTGCGAAGTGCAGTAAAAATATTGGCTATTCCATGATTCATAATAG
+TGAGCAGCCACTTAATGTGCGGCCATTTCTGAATATACGGAAGCATGCTGCTGATGCTGG
+TACCGGTTTCAGTGATTGTGCCTGTTTCGTCAACCTCAAAAGTAAAAATGCCTACCGTAT
+CAAAGCGGTCGCCGTAGTCTCTAAGTGCTTCATACATTCGGGCATTTCCCATAAAACTCC
+ACACCATGCACCGCTTACCTTTTAAATAATCCCTCACAACCGGTCACCGCCTTCTTGCAT
+CTCCTGAAATTCAAAGAGCACCCGCGCCGATTTTCTCTCTTCCAGCTTCACCATATGTTT
+GCTATCCCATGCCGCAGAGTATTGATAAAATCCATCCTTACGAGTAGGGCTTCCGTTTTT
+AAGGCATTGACGGGTGGAAGCCTTGAGCGCCAGCTCATCGCCTGCATTAACCGGGTCAAG
+AAACTTTACCTTATGCGCACCTACACCTTGGGATAGTTCAATACTCCCTGCGGCCATATA
+CTGTATAGGATAGATATAACAGTCAAGACCAGCAGAAGTTTTGCCAAGGTTGAATAAGAC
+TACAGTCTCCGCTGTTCGCACCACACCGTTATAATGCCGGGGCGGAACTGGCTGCCCGTT
+TTCCTGCATTTTCTTTAGCATTTTGCTCGTGTGGACGGTATAACCTGTTAATTGATCTCC
+TTCCTGAAACTGCAAGTCGGTGAAATAGATTGTTCCGGTGCAGTCGGAAATCTTGAGTGT
+CACAGTAACGCCCACCACATGTTTATTGCTTTTTGGTTGTATGGTTTCCGCAAACCTTGA
+AAACTGCATCCATTTCACCTACCCGTCCAATGTCCACTGTATTTCGCATACATGCCCGAT
+CCATCCGGTAGTAACCGCGCCACCTTGAAGCAATAAGTCTGTAAAGTACACTGTGCCGGT
+GCAGTCAGTGACACACAGCCTGATGGTGATAGATTTGACTCTGCTGATACTTTTGGGATA
+AATACTGTATGCAATCTGATTGAAATATGCCATATCATCACCCTCAAATCAGGTCTATAA
+ATCTTGTTTCTGTTGTACCGTCCTCGTATTCAATGACTATCTCAACACCAACTTGGCCGT
+TTTCACCCTTTTCGAGGCTTTCGGAAGCAATTTGTGCTGAAAAAGTGTAGCTTTTACGCG
+TTGCTGGATATACCGTCTGTGAAAGGCTCTTTTTCATACCAGGTACACCGACAGCCTTGA
+AGGAAGCAGTTCCCGAAACACCATTTTCAGTATCCACTTCAAAACCGGAATTGACCCAGT
+AGGCAAAACCATCATCCGCTCTGGAATTGCGCAGATGGTTGAATGGTACCATATCTTTAA
+TTTCCTGACGGTTTATCAACTCTGCTGAGGACAGCGCATCCGCTGCCTTGTCCCACTGTG
+CTGAAGAATCGCCAAGTTCCCGCAGTTTAGTTGAAAGCTCAATCACTGTTTTCCATGGTT
+CCTGCAAGTTATACTGCCTTCTCACAACACGAGTCTTTACCAAAAGGCCTAGTTCTTTAT
+CGTCCACTGTAACAATATCACCCAGTTTCCATGCTTCGTGCTCATAACCGGTTAGCGCAG
+ATAAATCCATTGCCGACAGCACATAAGAGACGCGAGGCTTCGAATATTCTGCAAGCCGCA
+TTTTTGCATATTCCAGCATCTGATACGGATTTGTAAACGACGAACAATCAAGCGTCGACA
+CCCTCACTTCACTGGAAAAAGTGTAATCTTCCACGTATTCCTTACCTCCATTAATTGAAG
+CGAAGGTCAATCCGTCCTTTCCATAAGCATAGAGCTTTGTCACTAATTCACGTGTATCGA
+CTACCCGCTGAATACTTTTCAAATTCTTTCTATATGAAAAAAGCGCTCCGCTATCAGTAC
+CACTAAAAGTCAAAAGGTGTACCTGGCGGTTGGCGCTGTCAAACACCAGATCGCCGCCAT
+AAATATTCTGTACGGTGCGAAGGATGGATAAGGCATTTTTTTCTGTACACTGCCATGTCC
+GTTTCGTAGTGACAGTAACATTTCCTACTGTCCAGCCTGTACCCAAAAGTGCATATTGCA
+TCGGAACATCTGCAGTATCTGCATTGAATTCTCTAGGTTCTTTTTCCGCACTGAAAGACA
+GATCGTAAAATACCGCTTCAGCATATACTTGCGTGATAACACGCCCATCTTCGCCTTTAT
+TGTCCGTTAAGGTTCGGATCCGGTAAATGTCATTTACGATTTGCACTTGTTTTTCATTTT
+CCAGTGTGCTTCTTTTTGGATCATGGAACGGAAGCTTGAATTCCAGCGTATCCGCGCCGT
+TCACCTCACCAGTGACAATGATATCAAAGGCATTTTCAAGAACAGCTTCCCATGCTCCGT
+TTTTGTCCAAAATCACAGGACGGGCAAAGCCTAATTTCTCATAGGGCGCTTTCGGTATAT
+CATGAAGCTGTATTTCCAGAAGTTTTGGCGTCTTCAACGGATCGCTGCTGGTAAGGGTAA
+CACGGAACCTTATATATTGCCGATTTGGCGATTGAAGTTCACCGCTGGTTCCCACAGCCT
+GCCATGCAGACCATTCTTCAAGATCATCGCTTGTGCTGGTCTCTACTAGAGACACTGAAG
+TAACACCTGCAGTATATTCGCTTGTCACAGCTACACGACCGCTGCCCGATAATGCACATG
+GAACCGCCCTTGTATAAAGTACGCCACTTGCAGGATACTCGCCATCTGTTGCTTTAAGGG
+TGACTGCGCCAGGCTCTGCCAAAGCATCTACATCCGAAGCCGCATCCCCACCGTTTGCTT
+GTAAAGACGACTTAAAATATAACAGCAAATCATCAGCTGTAAGCTGTGAGTCCGTTTCCA
+GAAACCAGTCGTCGAAGCCTCCGGCATAGTAGTAGGTATTTGCATGCATCCCCATAATAA
+TGTCTGCTATACATTCCCGATTCAGCTCTCCCGAAAAGGAACGCACAGGTGACACCCAGG
+TTGCCCCGTCGCTGCGATCGCATATGATGTTCTGCACCTTTTTGTTGTTTACTTCAATGA
+TGGAGGCGATAAAGTACCAGCCGCCGTTTTTTAAGGTAATGGTAGCTGTTTCACTCTGGT
+CGTAGATTAGTGTGCCGGAGGAGTTATACAACATCAGCCTAAGTCTTCCTTGATAAAGTG
+AAACATAAAGAATTGGCTGACCAGGTCCTTGGCGGGTATTGAATATGGATATATATGTCT
+GGCCGACCGAATAGGTGGTAGGATTAATCCAACCGCCTACAACAATCTTTTCGCCCAGAT
+TGCTAAAGAAACTCCCATCATTTTCTGCTATAAGATGGGTCTTTTCAGAAGTCGGATTAA
+CAATATTTTGCCTAAAGTATCTTCCGAATCTTCCAGCAATAAGGTTTGCCGATGTCCCTG
+ACCAGCCGGAGATGGTAAAATGTCTGCCATGTCCCGATGAATCCATAAGCAGAAGATTTT
+CGTCTGGTGTTTTTTCATTAAATCGCCATAAAGCAGACGTCCTTGATGTTACAGGAAACT
+CACCGGTAAAATCCTCTTGGCTCGTTAGAATTGATTTTATCGCCATGTTATCACCTCCAT
+CTGCTTTTTGCCTGTATTTTTAACTCAGTAAAGGTCGCGTTTTCTGCGGCAATCTCAATA
+TGATTAACACCTTTCCTGAGAATTGGAAAATTCAGATCCTGCAGGCTGGGAAGACCATTT
+CTCAAGGTTCGGCCTGTTTCATCAATAACCTTAGCTGTTACCATGCCGGAGTCGACAATC
+AGAGTTTCACCTTCAGATAATGAGCCAACAATTCTCAATTCCTCGCCGTTTGTAATAAGC
+GAAATATAGCTTGATGAGGACGTTGATATCAAACCCTTCAAGAGATAAACCGGATTGGAA
+TCCGCATTTCCTTTAACCCTCTCCAATTCATGCAGACCTGTTTCAGAAAGAACAAATATC
+TCATCTTCCAACGCGTAAACATACGGGTCGGGACAAACAAACCGAAGTTCAAAGCTGCCC
+GCTGTCCGCAATATCCGCTCACAGTCAACCGCTTCTGATAAGCGAGCCATGAAATATCGG
+TCGGGCAAATCATCTATAACAAGTTGCTTAAGCCCGTTTTCCGGATTTAACCATTCTGCA
+ACATTATCAAGAACCGATACAAGCTCAGCAAAACTGCGCTGGGGAAGCACACTACAGCTA
+ATTATTATGTTTCGTTCTGATATATCGCAGCCAAAATCTGCAATACCTGCTTTGCCCGGC
+ACAGTTTCAAAGGAATTGCGCAGGGCAGGGGAGACCTGCCATTTAGTAAGTCTTGCTCGT
+ATTTTCATACTTTGCGACGATATTCCATTGTAGATAAATCCCATATGCTTCCCTCCATTA
+CGCTGTTATAAAACGTCCCTGCGCCCTTGAACCTGTCTGCATCAGGTTATATAACTCCTG
+TGAAATCCTACGTATGTCTTCTTCACCACGAACAATCATCTGCTGCACCACAACAAGCGG
+CCCAGAAGCTAAACCGCTAAATTCACCTCTTCCACTTACATTAATATCAGGAGATATATT
+AAAATCTGTCGGCACTGCATTTTGCATATCGTCTGCCACTCTGGCCATAGCCTTGTCAAA
+TCCCTCACCAATACCCAGTGCCATATTGCCGCCAATGCCTTCAAAAACAGTGGACGGAGA
+TCTGATTCCAAGAAAATTCTTTACTCCATCAACAATACCGGAAAAGAAACCGGAAACCTT
+ATCCTTAATCCAGCTACCAAGGCTTTTAATACCTTCCCAGATGCCTTTTACAATGTTCTT
+ACCAATCTCAACTACTGAAACAACCGCCTTGCCCAAACCTTCAATAATTGCCGCAACAAT
+CTGAGGTAAAGACTTTACTAGTTCTGGAATGGCTTTCACAAGCCCGGCAGCAAGATGTAC
+GATAAGCGTAATTCCCAATTCTATGATCTTCGGCATATTGTTCGTCACAAAGTCAATGAT
+TGTTGTAATTATCCTCGGCAGTGCTTCAATTAGTTCTGGCAATGCATTTAAAAGTCCCTG
+CGCCAACCCCTGTATGATCTGAAACGCTGCGTCAAGAATTTTATCCATATTGTCAAGAAG
+TACCTCGGCAATGAGGATAATGGCTTCGACAACAGCGGGTATCAGCTCCGGAAGCGCCTC
+CCCGATACCGGACGCCAGTGTGGCAATCATTTGCACCGCGGCTTCCACCAAAGCGGGAAG
+GTTGTCAATAATTCCCTGCACCAGCGCCATAACAAGCTGCAAAGCACCGTCGGTTATCTG
+CGGCAGTGCATCGATTAAAGCCTGCAGCAGCGTCATGACAATCCGCACCGCCGCGTCGAT
+AATAACCGGCAGATTGTCCACAATAGCCCCGCCGATGGAGGTGACGATATCCAATCCTAC
+CTGGATAAGCTTCGGCAGGTTTTCCATCAGCATGTTTACAAGGCTTCCCACCGTATTGCC
+GATGACCCCGCTGATCTTCGTCCAGTCTCCGTTTGCTTCAGATAATCCACGAGTAAATTC
+CCCGAGAAGCACAACCCCGTCGTCGGCCAATATCTGAAGCTGGGGAAGCAGCACGGTGCC
+CAGCATGTTTTTGGCCGCCGCGCCGCCCGCCTTGAGCCGCTGGATGCTGTCGTCAAATTT
+CCCGAGAGCGTTCAATGAATCCTCGCTCATCACTGCGCCCATGCGCTTTGCTTCCTCGGT
+CAGCTCCGCTATCCCTGCCGAACCCTGCGCAATCAGGGGATTGAGTTCCTGTGCGGACTT
+TCCGAAAATCTGCATGGCCAGCGCGTCACGCTCAGTTTCGTTGGACACCTTGCCAAGTGC
+GTCTATGGTTTCCCAGTATACGGCTTCGCTGTCGCGCAGGTTGCCGTTGGCGTCCGTGAC
+CGAAACGCCGAGCTTCCGGTAAGCGTCCGCGATCTCACCGGTGCCTTTCCGTGCTGAAGA
+CATGGATCTGACGTTCCTTGCCATGCTGCCGGTTAAAGTATCTAAGGAGACATCCACAAG
+CTCCGCGGCGTATTTATACGCCTGCAGGCTGTCGGTGGACATGCCGGTTACGGTCGAGGC
+GGTAAGGATTTCATCGGCATAGGCCGCCGAATTTACCGACATATCCACAAGAGCTTTTCC
+CGCACCGACCGCTGCTGTACCAATAGCGGCCAGGGCTGCTCCCATGGCCACACCGATACC
+TTTCAATACACCTCCCAGTTTTTCAAAGCGCCCGCCTGCGTCATCCGCCTGATCCGCGGC
+CTTTTTAATTTCTCTGCCAAATTCGCCCGCCTGTTTTTCCGCTTCGTCAAACTCTTTTCC
+CGCATTGTCCAGCGCTTTGTTGTTCGCTTCCAGCTCGCGCTCCATTTTGTTCAGCTCTGC
+TTTGGCGTTGTTAAGCTGTATCTGCCAGGACTGCGTCCGCTTGTCGGTCTCCCCGAAAGA
+GGAGGCGGCGTTGGCAAGCGCTTTCTCCAAAGTAGCAATTTTTTCTTTCTGCAATTCGAT
+TTCTTTATTCAGCACCTTGTTTCTTGCAGTAACAGCTTCAACTGATTTATCTTGCTTATC
+AAACTGAGATGCAACCAGGTTCATCTCGCTGCCCAGTACCTTAAAACTTTGGTTGATCTC
+ACGAATGGCGTTCTTAAATTCCTTTTCGCCTTCAATCCCAATCTTCAAGCCAAAATTGTC
+TGCCACATAACCGCCTCCTTTCGAGTAAAAATTAAAAAATTATAAAAGGCTATTGTATTT
+CAATGCGGTTTGGCATATACTAATAGTAGGGAAAGTAGGGAATTTCCTGCTTTTCAAATC
+CTAAAAAGGAGGACTTAGCATGAACGTTCCCATAGTTGATAATGCAAAGGTAATGGCAAA
+AGGCCAGATCACGCTGCCAAAAGATATCCGCTCCAAACTTCGCCTTTCCACCGGAGACCG
+CGTCACCCTCATTTGCGAGGAAGACCGGGTTATCCTTATGAACTCCGCTGTCTACGCCAT
+GAAAATGCTACAGAAAGAAATGGAGGGCGAAGCGGAAAAAGCCGGGATCCGCAATGATGA
+CGATGTTATGGATCTGGTGAAGGACGTCCGCGCGGAGATTGAAGGTCTATGAGAGTGTTA
+ATTGACACCAACATCCTGATCTCCGCTTCCTTGAGCTGCGAAGGAACGCCTTATCAGGCG
+TACATTAAAGCTGTAACACACCCCAACCATGGTATGGTTTGCGATCAAAACATCGATGAG
+CTTCGCCGGGTATACAACCGGAAATTCCCCCATAAGATCCAGGCGCTTGAACGCTTTTTG
+GCGATTGCGCTTACTGTTCTTGAAGTTGTTCCAACTCCCGCAGTTGACGTGTCGGATGAG
+GCGCTTGTCCGGGACGCATCCGACAGGCCAATACTCAGGGCGGCCATTGCGGCAAAAGCT
+GACGTGCTTGTAACCGGAGACAGGGATTTCCTTGAATCCGGCATAACAAACCCAAAGATC
+GTAACAGCGGCAGAGTTTCTGCAAATGGAATAAAAGCAGCTTTTTAAAGCAGGGATTACA
+GCCACCCTGCTTTTTTGCTGCTTATATTCCATAAGGTATCACATCATCAATGGTCAGCAT
+ACGCTTTGGTTTCGCCAGCCCTAAAAACTGCTTATGGCACTCCCATAAATCCAGCAGGTA
+CCCAACAGGCATTAGCCATACTTCATCCTCTGAACGATTAAGCTGGACGGTGCCGTAATA
+TAAAAGCCGAGTGAACAATTCCTCATCGCTCACTCGGCCGGTGTGTTTTTTAAATCATCC
+TCACTTTCAACATTTCTTTTGGTGCCTTTGAACATCGCTTTCATGATAGCGTCTTTATAT
+GCTGCCAGTTCCAAAGGAGATGTGAGAAGTTCCACTGTCTCTTCGGTAAGGAGTTCACGC
+TTATCCTGATGTTTGAGATTGTGTATCAGAATGCTCTGGTTAGCCAGCAGTGTAATCAGC
+CATACCACTTCGTCAAGAGCCATTTCGAAGTTCTCGGTTTTCATCAGTTTCGTGCCGAGG
+TTTTCAAGACCGCCGTACCTTTTTGCAATCTCCTTTGTCGCTTTAGTGGTTAGAATAAGC
+TGGTATTCTTCGCCGCCGATGCTGATGTTTGCGCTTCTGTCCGTATCCTGCATTATTAGC
+TTCCTCCTCCCACAGCAAATACCGGCTCATAAACTTCCGTATACCAGCCAGCGATAGTTT
+CAGGCAATACACCGGGATCGTCTTCGCTGACCTCCGCCTTCCAAGGGTGCTTTCCCTGGC
+CATCTGGTTTGTTACGTCTCATGACTGTCCCTTCAATGGTGGGGGTCGAAAAGGTAATGC
+TGTCACCTTTCGTTTGCAGATTTGTCGCCGGGATTCCGAATTTCACCCTGTAAAGCCAAA
+AATACCTGTACTTGCCGTTAGCTTTCTTGGCTCTAAAGCCAATTGCAACAGGCGCGCCTC
+CATCCTCGCTGGTGGAAATCAGCACCTTGTTGTCATCAAGGGTGGCTCCCGTCAAAACCT
+CAGCAGCGTCTACTCCGATATCTGCAACACCAAGAGTCAGTGTGCCGCTTTGAAATTCCT
+TGACCACTTCTGCCGCCCCGTCATCGGCATAAAGCGTCGCCTCTGCCAGCTCCACAGAAA
+GCTCTGCCGTAATAGCCTTAGCCAGCGGAACAGGCGTGGCGTATGTCTCTTCTCCGTTTT
+CATTCTCAGTTATTTTGGCATAATATAACCTGTCCAGTCCGATTGTGGCCATGTTTTTCA
+TTCCTCCTTTACTTCATATTCTTTTGCCACATCAATGGCATAGTGGTGATAGCCGGTATC
+GTCCTCATGGCCTATATACCGCCTGTCGGTAATGGTAAAGCCTGCTTGAAGCAATGTGTT
+CACTATTTCGTTTTTACGGGCAGTGTAGTTTCCCTTTATAAATAAAGACAACCTTACCTC
+CTGGGTTTCTACCTGAGGCTGGTTGTCTGCAAAAACTTCAAATGTATCTGTCATCGGAGT
+AATGACAAGGTACTCATCTGGCGGTACACCGCTAAATACCCCGGTTTCAATGGGGATACC
+CAAACCATCCAATAACGAGTTTAATTCTGACAATATGCTCATATACGACCCAGCTCCTGT
+TCCAGTCTTGACTTCATTACTTCGATGCAGGACTTCCTTGTAGCTGATTTTGCCGGTTTC
+AAAAAGGGCCTTGGAGGCTGCCCGGACTTGCCATACTCAATAATATTAGCAATCTTCGCA
+TTGCTTTCCCCATCCTTCCTTGGTTCAGTAAAGCCGATTTTTATGTTGTGGTTTCCATCC
+CTGTCCTGCTTGGCAGGAGAAAGTCCCAAAGCATTTACCAATTCACCGGTTGCTCTGGAC
+GGATATTTAGTGCCGCTCCCGATAACTGACTGAAGATTGGACTTTACTTTTGAAAGAACC
+ACTTCCCCGCCTGCTTCCAGCACCTTAGGTATGATTTCGTCTGTTCTTTCTCCAAGTCTG
+GATAACTTGAGCAAGAACTGTTCCGGCATTTTAACTTCCACCTTAGCCACGTTGCAGCCC
+CTCCTTTTATGCTTTGCTTGATTTCACCTTTTCCGCAAGCACCTCAATATACATTCCACG
+TCCTTTTACATCCTCAACACTTATAATGTTGTACCTGCCATCGCTGCAAACGAGTACAAG
+ATCTGTGGTAATTTCAAGGTTAGGTATCTTACGGAAGCGGAACAGGGCAGACGCCTGCGA
+AAACGCCGCCCTGTTTGCCCATTTTTCACTGCCATGCCTATCTTCCTTGTATGCTCTTAC
+CGAAGCAAGAATGACATCACCTTTTTCAGTAAAACCCTCACTATCCTTAACCGGCTTGAC
+TGAGATAATGTCCACGAAAGTTTTCATTTTCCCAAGGCCCATATTTACACCTTCCAATCC
+CGGTCAAGCCGCAGCAATAGATTAACTGTATTCCATACCTGCTGTCCTGCCTGCACACTA
+TCCCCAAAAAAGCCAGCAGTCGAGCCATCCCTGCTTTCATAAAAATGGCTCGACAGCATA
+ATGACAGCCTGCTCAGTAGTAGGCGGCATGGGGTTTTCAGCATAATATCCTTCCGGCTTT
+TTCTGGTAACTTTCCGCATAGGCCACTGCGGCTTTGATATACTCTTGTAAAAGTGCGTCA
+TCTTCGCTGTGCTGCAATATGAGGTTTGCTTTAACCTTCTCCAAAAGTTCCATGCCGCAG
+CACCTCCGTTTTCATTAAGTTGATTTCTGCTGCAGTATCTTGACTGCTTCAGACAGTACC
+AGCTTGCCATCTACACGCTGGGTTGCCATGAATCCAACTTGTCCGGTCGCAGCATACAAC
+TCATTAAGCCGCTTAAAAACCCTGCCTTGACGGTCTGCCACCCAGTAATAAGAAAAATCG
+CCGAATACAATCGTTTTTGCTCCGGCGGCAATGGCTGGCATAAATGCAGAAGTTTTAACT
+GGACGATTGAGGATAGTATCCGGTGTTCCAGCAGTTACAGAAGGCTGCCAGAGATACTGA
+CCGTTGTTGTCTTTGAGCTTCCTTATAGCTTTAATTGTCGAATCATTCATAATGAATACA
+GCGTTCCTGCGGTACGGAGACTTTAGGCTGTAGAACAAGTCCATGATCTCGTCAAGGGTA
+ATGGCTGTTGCACTCGCCGCGGTTACTCCTATCTCGCCACCGCCGTTATCCGCCAAGATA
+CCGGTTGGCTTGCCAGATCCGTCGCCGATAAAAAATGCTTCCTCCTCTTTTGCTCCGATT
+CGGCGGGCGAATTCTTTGGCTATATACTGTTCAAGGTTAAATACACTGTCGTTTAACAAT
+TCCTCTGACACCTTGATCATAGTAGCCAGCTTATATGCGCCGATGGATACCTGTGCAAAG
+GAGTCATCGCTTTCGGGAATCTGGCCTTCCTCATCCACCCAGGATGCAGTACCCTTGCTT
+GCCACCACAGGAATTTTCTTGTCACCGCTGGACGTGGTAATAACATTGGCAATCTGCCTA
+AAGATATTCTCCTCCTCCAGTGCTTCCACAAGAGTACGCTCAAAGTCGTCGGGAACAAGA
+TATCCACCTTCGGTGTCCTCTCCAATCTGCAGCGCGTTGTGTACGTCATATTTGCGCCTG
+CCGCGCATCATGTTCCAGAAAGACTGCCTGTACTCATCGCTGGCACGTCCGGTTTTTTCA
+TTGTTGCCAGATATGGAAGTGGGTTTGTCTGTAATAGGAATATTCAACGGTTTTGACAGT
+TCCAAATCTATGGCAGCCTGACGCTCAAGACGCTCTATTTCTTTGCCCAGCGCAATAACG
+TCGGCTTCCATTTTTTCATAAGTTGCGGTATCCTCCGGTGAAAGCAGTCCGTCGTTCCCG
+CGTTTGCTGTCGAGGAAAGCTTTAGCAGCTTCCCCTACTTTCGCGCGTTTTTCACGCAGT
+TCCAGTATTTTGCTCATAATCAAATCCTCCTTAAGGTTTTATTTGGGGTCCCCGCTAAAT
+CGTAGATTTAGTGGGGTAAAAGTAGAAAAAGCCGCTTTTCAAGCGACTCAATTGGTGTTC
+CTTTTGGTTTTTCTTTTGGTTTAAGCTTTTGCAGGATGGAATTTGTTACTGCCTGCCTGC
+TGAAGATCATTCCTCCTGATACTTCAAACTCGGATGGGAATGATTCATCCTCCATAAACA
+AGATTCCATCAGCAAAGCCAAGTTCCACCGCTTTTCTTGCGTTAAACCAGCTTTCTGCAT
+CCATTAGGTGCGATATTTTTGCCCTGGAAAGTCCGGTTTTCAGCTCATAAGCGTTGATGA
+TGGATTCCTTTATTTCTTCCAGCATTGCGATAGCTTTCTCCATTTCTTCTGTATCACCGA
+TGGCTATTGTCATAGGGTTGTGAATCATCATCATGCTGACTGGTGACATAAAGACGTCAC
+CTCCGGCCATAGCTATGACCGAAGCGGCGCTGGCTGCAATACCGTCAATCTTTACCGTCA
+CTTTGCCTTTGTAATCCATAAGCATGTTGTAAATTTGATTAGCTGCAAATATATCTCCGC
+CAGGGCTGTTGATCCAGATCGTTATATCACCCTCTCCGGACAACAGCTCTGATTTGAACT
+GTTTGGGAGTTACTTCGTCTCCCAGCCAGCTTTCTTCAGCTATTGGGCCGTCAATATATA
+ATGTCCGGCTGCCATCATCGTTTTGTATCCAGTTCCAGAAGCGGCGAACCGGTTTTTGTT
+TTTGTGATTTGTTCAACTTTTGATCCCTCCGTTTCAGCATTGTTTTTGCCTGCAAATGTA
+CCTGCATCGGCAAGCCTGGTCATGTTACCGTTAACAAGATACAGATCTCCGCCCAACTCC
+GCCGGAATCCGGTTCATGTCCTCAAGCTCGCGGATATCGTTAGCAGACATCCAGCCGTTC
+TGGCGAGCTACAGCATAACCATTCATGCGGCTTGCATAATCACCGCGCAGAAGGCCATCT
+ACATTGAATTTGACAAAGTATGCCCGCTTCTCTGATGGTAAAAGCAGCGCTTTTTGGAGA
+GCCTGTTCCCAACGCACCACCCACGGGTCAAGCGTGTATTTAACAAATTCCAGAGATTGC
+TGTTCGATGTTTGAAAAGCTTGACTTTTCAAGATCTCCAACCATATGGGGAGGTACTCGG
+AATATCCGGGCAATTTCGTTTATCTGGAACTTTCTTGTCTCCAAAAACTGTGCCTGTTCG
+GGTGGAATGCCGATTGGCTGAAACTTCATTCCCTCTTCCAGGACTGCAATACGGTGAGCA
+TTGGCACTTCCTTGATAAACAGCGTTCCAGCTTTCACGCACCTTTGCCGGATCCTTTAAT
+ACGCCGGGATGTTCCAGAACGCCACCCGGATTTGCTCCGTTGGCAAAAAAGGATGCACCA
+TACTCCTCACAGGCAATAGCCATGCCTATGGCATTCTTGGCCATAGCAATAGGGGAGTAT
+CCGATCAGTCCGTCAAAACCGAGTCCCGGGATGTGAAGAACCTCATCACTTCGTAGGTAT
+ATAAGGCCTGCTTTTGGATTAACCCTGCTCTCATCGCTGTCGCGCCGATAAGTGTAATAC
+AGCTCTCCGTTTGGAGCCCTGTCTACCGTCATTTTGTTTGGCAAAAGGGGATAAAGCGCC
+AGCACTCGCCCGGAACCGTCCCTGACAATCTGGGCATAAGCATTTCCCCATAAAAGAAGA
+TGACTCATCAGTGTTTCTCGGAACACAAATGAAGTCATCTCAGGGTTTGGTTCGTCATGG
+AGCAAATAATAGAGCGGGTGGGTCAACGCTTTTTCTTTGCCACCGTCTTCCTTGTATCGG
+TATACATGAAGCGGAAGCCCGGCGATGGCTTCTGCAAGTATCCTTACACAGGCATACACT
+GCAGTTGTCTGCATAGCAGTCCGCTCATTGACAGCTTTTCCGCTGGATGTGCCGCCGAAG
+AAAAAGCTATATGCATTACCGAACAGGCTGTTTTTCGGCTTGTCCCTTGCTTTGAACAAG
+CGGGAAAATATTCTCATAAGCATCACTCCTAAAAATGGGCATGAAAAAAGCACCACATTT
+GTGGAGCTTCTTTACATTTTTATATTTTATTGATTAACTTCTTATTAACTTATCCTTATT
+TTGTAGTAAAATATCTGTTGTTTCTTTCCGTTCAAACAATTTACGATCCGTCAAATCTAA
+TTCTTTTTGTGTTTCAATGAATTCAATTATTCTTAAAAAATAATCGAGACATTTCCCTGA
+ATCATTCAAGATACGCAAAATTTGATTGCAAGCATTGATCATTTTTTTGGCACTATGATG
+TTTTGGTAAGTTGTTTGTTGCCATATACTTTAAAAGCATTATGGCATGATACTTTCCTTT
+ACGGTATTTTTTATCAATACATTTTGTTTTTATCAGGTTTTCGAAACGAAACATGGCCAA
+AGAACTTGTGTAATACAATATAGGCTGGTCGTCAGGTAGAAAAATACGGTTTCCAATATC
+TTTCAATAAGCTACTATAATGACCAGCAGCGTCGTGTGGTTTATCATTGAACATTGATGA
+TGCATTTTTTAACTGGGCACGAATAGTAACTATTCGATCTTTGGGAATCGATTCATTCCT
+ATATTGTCCTGAACGACGTTCATAATACAAGCGTTCATCCTCAGCAGTGTATGTGCGATA
+GTATTCCTCCAGTGTTTTTTGGAAAGTTGATAACGCTTCTAATTGTTCTTTGGTTATACC
+AGTTTGATTATTTGTAGCTTTTGTAATACGGTTTTTTAAGTCCTCATCCTTGGTTACAAT
+AATCTTAATCGGTATAAGTAAATCATGTATTCCAAGATTATCACGGTTAAGATACAAAAC
+ATGGCTGGTTTGGCATCCATTAACTATCTGATAGTTTGAAATTGTCATCTTATCGCTCAC
+AAGCACAGCAGAATGAGCGACAATTGTTATTCCATTATTTAGCATGCAAAAAGCGCTATT
+TCTGCCTTCAACAATAGTTTCTTCAATGTCCGCATTAACATAATTATTCACTCCAAGGAA
+GTCCCGAATATTATCTTCAAATACTTTTTTTAGTGAACCATTTTCATCGCATATAATTTT
+ATAAAATTCGCAGAATGGCAGTACCCCACTATATCCATAATCTCCATTATCATCAGAAAA
+CATCATCACATTTTTTGTAAAAACAAAAGTCGCTTCTATTTGCTCTTGTGATTTTCTATA
+CATACGCTGTATTTCTTGGGCACCGCAAGGTATAAATTCCACAGATGAAAAAAGTGCCAT
+GTTATTAAGCGTATCTATATGACTATTAATTACAGCTTTCAAATTGGAATCATCATCGTT
+CCACTTCCCCGGAGCAATATAATAAAGTCGTATTATCGGGTTTTTGACTTTCATATAGCG
+AGAATTACTATAAATAAAATCCTTCATTTCTATGAAGTCTGCCATTTCCTCTGTACTGAA
+TGTATTCTTAGCTTCATCAGAAAAAAAGACTTTAACAAAAGACAAAAAGTTACTTATCTC
+TGAATTATCAAAACTGTCAGATGTTTTTGCTTGTACAAATATAAATTTTACATCAAGTTT
+TTTATTTTGCTTAATTAACGTTTCTATCTCATCAATACTGCACACAATAGCTCCGTTTAC
+TTCTATCGCTATTCCATCAATACCTTGAGTAGCATTGCCAGTATGCATGTCTTGAATATC
+TATTTCAACCATGCCAGTTTCTGCAGATAAAGCACAGAAATTGGCAAAATGCTCGAATTG
+AACACTTGTTTCGTACATAGTAAAATTATGGCTAATAGAAAATTCATCTAAAAAAGCCTG
+AGTTATACGATCCAAAGTTACTCCTCCGATAATAATCTTATTTGGAGGAATTATAACACG
+TTTTGTCAAAAAATTCAATTACTTCACTCCTCGAGTGTTTTTTAATTAAGGACTTATATA
+AGATATTATGCTCACTTATGATATATTTTGTTTATAAAAATAAAATTCCCCTTTCATCAT
+AAATTGATCCGTTGCGTTCATCCCCGTCATGCCTTAACGCGCGGTCAAGCGCCATAATTA
+ACGCTACCGCGCCATCTATTCTCTCGGTGGATTTTTCTTTATCAGGCTTTATGTTTCCAG
+CTGGATCAGTTTTGACATAGATATTGTCCATCATCCAGCGCAGTACTGGATGGCCACCAT
+GGGCGATGCGTTCTTCCAATGTCAGCTTCATCAACTCTTTTGTAGGCGGCGACATATCTT
+TGAAACCCTGGCCGAACGGAACAACCGTAAAGCCCAAGGCCTCGAGGTTTTGCGTCATCT
+GAATTGCTCCCCAGCGGTCAAAGGCTATTTCCTTAATGTTATATTTCATCCCGAGCTCCT
+CAATAAAAGTCTCGATAAAACCGTAATGCACGACGTTACCCTCAGTGGTATATAAAAAGC
+CCTGCCGCTCCCAGACATCATAAGGTACGTGATCTCTCCGCACACGCTGATCGATATTCT
+CCTCCGGTATCCAGAAAAAAGTCAGTATCTGATATTTGTCCGATTCATCAAGCGGCGGAA
+ACACCAGTACAAATGCAGTAATATCGGTAGTAGATGACAGGTCAAGTCCTCCGTAACAGG
+TTCTGCCGCGCAATTTTTCCGCATCAACAGGAAACGCACACTTATCCCATTTATCCATTG
+GCATCCAGCGCACCGATTGTTTCACCCACTGATTTAAGCGGAGCTGACGGAATAAATTTT
+CCTCTGCGGGGTTTTGCTTGGCATTTTCACAAGCCACCCTCAGTTTTTCGATGTCGACTG
+TAATGCCTAGTGACGGATTAACCTTTCTCCATACCTTTTCACTTGTCCAGTCGTCGGTAT
+CGGATGCGCTGTAGATAACAGGGTAGAAAGTCGGATCTATCTTACGTCCCTGCAGAATAT
+CCTCTGCCTTTTGATGCACTTCCCAGCAGATGGAATTGCGGTCTGTGCCAGCAGTTGTGA
+TCAGGAAAAACAGCGGTTGTTTTCTTGCATCGCCAGATCCGTGAAGCATTACATCATAAA
+GATCCCTGTTTGGCTGAGCATGAAGTTCGTCAAATACCACACCATGGACGTTTAGGCCAT
+GTTTCGTATATGCCTCCGCTGAAAGCACCTGATAAAAACTGCCTAACGGTTTATAAACCA
+GCCGCTTCTGTGACAGCATTGGTTTAATTCGAGATTTTAATGCCGGACACTGTTCCACCA
+TATCTACTGCAACGTCGAAAACAATGGATGCCTGCTGACGATCAGACGCACATCCATAAA
+CCTCGCCACCATGCTCGAAATCACCACAGGTAAGATATAAAGCAATTGCCGCTGCAAGTT
+CGCTCTTACCCTGCTTTTTGGGATTTCTATATAGGCAGTGTTAAACTGCCGGTATCCGTT
+AGGTTTCAAGATTCCGAATATGTCCCGGACAATCTGTTCCTGCCAGTCAATTAATTCAAA
+AGGCATTCCATACCATTCACCCTTGGTATGCTTCAGGCAGTTTATAAAAGTAACAGCGGC
+ATCCGCCGCTTCCTTGTCATATCGAGAACCTTCCGCCATAAACTTGGTTGGTTTATATCG
+TTTTAACTTCCGCAGCTTTGCCGCCTCCTTTCCTAAAATTGAGCAAGAAAAAAGGAACCT
+CAGGGATGAAGTTCCTCTCGTTAGTGGATTTCTATGAAGCCTGTTACGTTATTACTGTTA
+TCGTTTGCCTGTCAGGATAAACTCGGCATATTCTTTTTTGTGTTCATTTAGAAAGACCAC
+CAATTCATAATAACCCTTTTTGTATGCCTCCTCCTGCACTCTTGGCAAATCAAACATATT
+GCAGACACCGCTGTCCCGTATGACAATTATCTGCCGGTAAATCTTATCAGTTATCAGATT
+TTCTATACCCATGTCCTACACCTCAGACTTCTCTGCCGCTGAAATTGAATCTCTTACCGC
+TTTATTGAGAACTGAAATATCAAAGCCCGCGTCTATATATCCGTGCCGAATCACCTCGTA
+ATAGTAACGACCCGGTGCTCCCAGTGGTCTGCCTTCATTCATGATATACACCATTGCGGG
+TACCCACTGCCCTTTGAAACGTACCTTAACTGTTTCTTTCCGGTATAGATGCGGATAACC
+TTCATATCTGTCCAGCGCTTTCTCATCATTAGGCATGATTCTCCAAAGCAGTACTGGTAC
+TCTTTCACCTTTTTGTTTTTCTATTGTCGCTACTGCGCCGCCATTCCCTCCTCTGAATAA
+CAGCCGGTATCCTGTGAGTTTTGCACTCCCCAGCACTTTTGCCGTCGGGCAGCGGTATGC
+CATCTGCCTTAAGTTCAGATTGCTTCCGTATGCTAAATATATGGTTCCTTTTTCTTTGCT
+CATCGTATCATCCTCCTTGTATTTACCAAGGCAGGGGCGGAGATCCGCCCCTGCGCTTGT
+CTATCTATGCCGCCCGAAACCGCCATGCCGCGTTGCCGCCCAAGTGTTTGCAAAGGTGCT
+CCCGACAATTTTTGAACTCATCACCAATAAGTCCTATGCGGTTGAGATATGTCCGCATGG
+CAAACTTCTCGTTCTCGACCTGCGGCTTTTTGCTGGAAGCGCATTTTTGCGTCAGCGCCT
+GATGGTTGAGCGCCAAGGCAAGGACGATGTAGCTCCTTATTATCCCGGCGTGGAGTTCGC
+TGTTGAAGCCGCGAAGCTCGATCGTACCGTTGCCGTTGAAAAAGCTGTGCAGATTGAGAA
+AATAGTACCGACTTCCATGATATCGCTGGCTGCGGCTTTCGCTGTAACCCTCATACCAGA
+TGCTCTCAATCGCCGCCATGGTTTTGGGCTTACGCCGATTCATCTTCTCAACCAGTGCCG
+CATCCATCTTTTTACAAAACCGCATCCTGTCCGGCTCAATCTGCAATGCTTTATAGAAAA
+GGTCATTCTTGCTGGCGATAATATTGATAAAATTGCGGATGCTTCGAGGCGTGTGGTCTG
+CCCCGTCTATATGGATATGGATCCCACAGCTTGTGTTTGCAAAACCTCCCGCCTTGCGAA
+GCCTCCTTACCAATTCCTGCAGGGTTTCAATGTCCTCGCGGTATGTCAGTATCGGACTTA
+CCAACTCGACGCTATATTCCCGGCCAGCCGCCGCAATCCGGCCGTTTTCCTTTTTCTGAG
+TCCGAATGCTCCCGTCGCTCATGAATTTCCATATCCGTCCATCCGGTGCAATAACCTTTT
+GGGTATCGTAATAATCTCCGCTGGATTCAATCCTCCCTCCAAGAAAAGCTGCTGCAGTTT
+TTGCCGCCTGTTTTCTTGTAATCCCCGTCAATTCTACCTCGATTCCAAATCTCGTTGTAA
+GCATTGCGCTTTCTCCTCGCTTTCTCTGTGTTTTTTGCCCTTTGGCAGTGTACATTAGGC
+CATTGAAAACACAGGATAGCAAGGCAATTCTGCATGAGTTTCCGCTGGATTTTGGACAAT
+TTTACATATCTTGATTTGTGTACATTTACAGCTTTCTGATCACATCTATACCATAGGCTG
+CACCCAGAGAAGAACCGCAGTCCCAGTTGATATGAACGGTTCCGATATCATCCACGAAAG
+ATACTGTTCCTTGGTCTCCCGGTTTCAGCTTAGAATACGGATCATCCATGCAGATAAGTT
+CAACGCGTGTTCCCGGTGGATACTGCTCTTTAAGGCGAAGGACTGTTTCTTTTGAAGGAA
+AGCCTCTTGCACTCATAGTCCGTCCTCCTCTCCAGGATAAATCATTCATTTTCGTCCACC
+GCCTTTGCTCTGCCTTTCCGATACGCCCCGTTACCGGACAGCCTTGAAAGTAACACCTTG
+CGTTCAGTTTTGAAGTTATCACCTATAAACCCCAACCTAAGCAGGAAACAGCGAAAAGCA
+TATTTTTCATTATCTGTTGGTTTTTCTTTTCGTAGTACTCGCTTCTGTAATTTTGCCTGT
+TCTGCCATCTGCTTTGCCAGCGTTATATAGGTCTGCACTTCATCAGCATTTAAAGTCGCG
+TTCCAGAAAGGAAAGGAAATCTCATCATTTTCAGCTAAGACTACAAGTTCCCCCTCAATC
+AACATTGCCTTCTTTATCAATGTCTCTTTGCTGGCCAGCATATTATTTAGGTTTTCAAGG
+CTAATCTCGCTAAAGCCCTCCAACGAAAGAGTAATTGTCATGGTTTCCTCTGCTGAAAAA
+CCCTCCACATTCAACGCGTCAATAACTGAACGGATGGTTTTTATTTCATTGAGACTGATT
+TTCGGTGAGTGAACCACACTGTCCCTGTCAATCGTCCAACTGCCAGCAGATTTTTCGTCT
+TTAATCTCATACAAAAACTCCGGTGCTCCGGCATAGCGCACCTGGCCTTCAAGGGCTTCA
+GCTATGACCGAGGCAATGGCTTTTCTCTCCTGACCGACAATCTTCTGTGAAAAGCGAAAG
+CTGTTATTGCTCATGCCATACACCTCCCCTCAAATAAGCTAAAACATTTTTGATTCCCAT
+AAAAAATCCCACCTTTCCTTTTTGGTGGGGTACATTAACGCTCTGTTTTGAGGGGAAAGC
+AAGGACATTTTTAATCAATCTGTGTTTCCGCGTAAGGTATTTTTTCACTACCTGTTACCA
+AGAATACTGAATCTGCGCCAAATTGTGAAACATAGCGCTTTACAATCACATCGCAGTATT
+TCGGGTCAAGCTCCATCATAAAACAAACCCGCCCGGTCTGCTGTGCCGCAATCATTGTCG
+TACCAGAACCACCGAACAGGTCAAGAGTTAAATCTCCAATATGGGAACTATTGAGCATTG
+CCTTTGCTACAAGCGATACCGGCTTCATGGTAGGGTGCTCCTCCGATACTTTAGGACGGG
+GTATCTCCCAAACATCTGACTGTTTACGGTCTTTAAGCGGGCAAAGGCGTGTTCCTTCAA
+GCCAACCGTACCAGATCGGCTCGTACTGGGTATGATAGTCCTTTCTTGACAGTACCAAGC
+TGTCTTTTTTCCATATAATTGTGCTCGACCAGTGATACCCTGCCTCCCGCATGACGTTCA
+TCAAACTGCCCCATTCCTGAGCACTCATTACTATATAGGTCATGCATCCGGCTTCAGAAA
+CCTCTTTCATGCATTTAAAAGCGCGCAATAAAAAAGCGCCGAATTCTTCGGTGCTCATAT
+TGTCATTTAGAATTTGTCTTGGCTTCCAGCTTGGATGCCTGGTATCTGAACCGTAATCAA
+CATTCCAGGGTGGGTCGGTGAAAACAAATCTCGCCTTTTGTCCGTTCATCAGCTTTTGCA
+CATCTGAAAGCATGGTGCTATCACCGCACATCAGACGGTGGCTGCCAAGCACCCATATGT
+CGCCCTTTTTAGTGACCGGAGTTTCAATCTCTGCAATTGCCTTTTCTGTATCGAAATTAT
+CCTCTTTGACATTAGCGGTTGTTTTATCACGGAACAACTCATCAATTTCCGCAGCATCAA
+ACCCGGTAAGAGAAACGTCAAAACCATCTTCATTTAAATCCATAAGCAGATCGGTCAAAA
+GCGGAATATCAAACTCGCCACTGATTTTATTCAGTGCAACATTGAGCGCCTTTTCCCGCT
+GTTCATCCAAATCAACTACAACACAGTCGATCTCCTTATACCCCAAAGCTGTAAGTACTT
+TATAACGCTGATGTCCGCCGACAATGTTCCCGGTGCGTTTATTCCATATAACCGGCTCTA
+CATATCCAAACTCTTCAATAGACCGACGTAATTTTTCATATTCAGGGTCACCAGGCTTTA
+AATCTTTCCGCGGATTATATTTAGATGGTTTTAGTTTTTCTGTTGGTATTTTCAGTATAT
+CCATAAATCTTAACCCTCCAGTTTGATGGCTTTTTCGCCGGTGAATTCCTCCCAGCGCTT
+AACAGCTAAATCACAGTAAACAGGGGATAACTCCATTGCGTAGCATTTACGCTCGGTCTG
+TTCAGCCGCAATTATAGTAGTTCCGCTACCAGAGAACGGCTCAAGCACAATACCGCCTTT
+GTCGCTGTGCATTTTGATGCACCGCCATGGAAGCTCCACAGGGAACATTGCAGGATGCTC
+CTTGTTTGCCCGTACAGTGGTCATCTCCCATATCCCAGCATAACCCCATTTCTTGCGTTC
+TTCCTTTGTAAGCCGTTTCACAAATTTATAACTGTGTCCCGCAAAGGCTGAAAGCCATAC
+ATATTCCTGATCGTTATATTCCTCAACTTCTCCTTTATTGCTGAAGGCCGAAATATACTC
+ATACTGCTGAACCGGCTTGTTTGAAACAAGATGATAGGGTCCTACACCAAAGTTCTGCCC
+CTGCTTCTTCCAAATACGGATCCAGATAGGTCGATAGCCATTGTCCAAAAACATATTCAC
+GCTGTACACGCTGGTTGGTTCAATAAACTGGGAGCCGGTTGCATATAAATCACCTAAGTT
+CCAGCAGACAATATCTGCATACCTGCATAAGTTTCTAATCACTGGGCGTACTGTCTCGAA
+CCATGGCTCAATCCCGGCTTTTTCATATTCTTTGCCTACCCCATAAGGCGGGGAAGTCAC
+TGCCATCTGTGCGTGACACCCTTCCATCAACTTCTCAAAATCCTCATTCTTCGTAGAGTC
+GCCGCACATCAAGCGATGATTCCCGAGAAGCCAGATATCGCCCCGCTTCGTTACCGGCTC
+GCGCTGCACGATTTCCTCATGCGCTTTATCTATGTCAAAGCTGTCTTGTACCGCCTCTTT
+GGAGTACCATCGGTTAAGTAGTTCGTCTATTTCAGAGGCGTCAAACCCTGTAAGCGAAAC
+ATCAAATGCACCTGCGTCCAACTCAGCCATCAGTTCGGCCAGTTTATTCTCGTCCCACTC
+TCCTTGAATCTTATTGAGAGCAAGATTAAGCGCTTTTTCTCTCTGCGGGTCAAGATCCAC
+TACAACGCAGTCTATCTCAGTCTGTCCCAAGTCCAGCAAAACCTTTAAGCGTTGATGCCC
+GCCTACCACATTACCTGTTTTTTGGTTCCAGATAACAGGCTCCACATAGCCAAATTCCTC
+TATTGACCGTTTTAGCTTTTCATATTCCTTATCGCCAGGTTTTAAATCCTTGCGCGGGTT
+GTATGCTGCTGGATTAAGTTTTTCAACAGATATTTTTTGTATGTTCATGCTGCATTCTCC
+TGTTCAATATTTTCTTAAGACCCTTTTTTGCGCCCTCACAATCTCCGTTTATTACTTGTC
+CCCGCAGAGTCTTAAACTGCTGCTTCGTTAAATGGTCTTTATATTTTCTTAGTTCCCTAA
+GAAAGATTGAATTTGTTTTATGCATCAGCCACCCCTCCTGGCTGTCAGTAGTTTTTCCAT
+CACATCGTCGTGGGGAGTGGCCCCCTTGTATTCGGTAGCACAGTTTTCCCGCACGACTTG
+ATAAATTTGATACCACAGGTTATTGGCCTGTTTCATAAAGCTTTGACTCATAGCCACATA
+AGGTGACGGGATGGCATTGCCAGTTGTCGGATGTTTAGCAAGAAAGCCAAATTCAGTGAT
+ACATTCCTCGCACTTGATCCACCGCGCCACACTCTGGGCATATTGCTCTATAAGCTGCGC
+AGGGATAAGGTGAACACACCTGCGTTCCTTAAGCCACTGCCATGTTTTTTCGTATATTTC
+CACCGCCAGTGTTGTTTTTCCGTTCTTCTGCTTTGCAGCAAGATAATCCCTCGGTGGCGG
+CATGCTCTCTCCTTCTAGTTCCGCAGCATCCGTAAACTCCATTACCATGAGCTTTCGTCT
+GCCGGGGTTTCCTTCCAAAATCTTATCCGCCAGAGGCTTTTTCTTCTGTCCTGCACCGAT
+ACGTGCCCCGCCGCGGTTGGTACCGTCCTTTGCCATACACATCACCTCGATTCATGTAAA
+AATAAACAGGGGATATACCCCGTTTGAAACTGCGATTTTTCGCGCGTGACCCCCCGCCCG
+TTGCACAAAACTGCTTCACCAGAGATTTTGACCCCCCTACCGTCTTGCCCATCGCTCTCC
+TTCGCGGGCAGTGATCGATGAGTGACATTGTTTGCATAGACTCATAAGGTTACTGTCTGC
+ATTGGTTCCGCCTTTGGATAAAGGGATAATATGATGTACCTCTTCGGCTGGTGTAAGCCT
+TCCGTACTTTTGGCACTCCTCGCAAAGCGGATGCTCTGAGATATATCTGTCCCTGATGCG
+TTTCCATCTCCGGTCATAGCGTTTTCTTGTTTGGGGATCTCGTTCGTATTTGTTGTAATA
+AGCATCCATTTGCCTTTGATGCATGTCGCAGTACCTTCCGTCCGTCAGTTCAGGACAGCC
+AGGAAAGGAGCAAGGCCTTTTTGGTTTTCTTGGCATCTGGCCACCTCCTTTACGCGTATA
+AAAAAGCCCTCACAGGTTCATCCCATGAAGGCTTATCTATAATTTTTCACAATACCATTA
+TATTTGGATTTATAATGAATTTCATCTCATAAAAATCTCATCTGGAATATTGAACAACAC
+ATTTGCTATTTGACCATGGCATCTTACCGTTATAATACTTATCGGAGATATACCGCTGCA
+TATCGGGTGGTAAAGCTGCAAGCAAAAGATAAGCCTTTTTCCTGTCTTCCTCTAACTCCT
+GGGTGCTTTTATAGAAGGAACATTTATCTTGCAAGCACTTGTGTACAGTCAGGATATTGC
+AGCCATTCCTTCCGTTACTGCCAAAACAATTATCGTACATCTTTCCTCACTCCTGTTTTA
+TGGCATAAAAAAAGCCCCGAAGGGCTTATGCGTTTTAATGTTATTTTTTCACGATATCAT
+TATATATGGGATACCTGTGTTTTACATCTCATAAAAATCTCACATAAAAGGAATGTAAAA
+ATATCAGTTTATTTGTTCAAAGATAGCTTTCGAGTATACTTCTATATCTCCAGGAGTGAG
+CATGTTGAATTTTTCTTTCACAGCGACAAAATATTCCCCGATCAATTCTTTGGGTATTAC
+ACGATTAGAATGCGCATCCACCGGCAAACCGTCTCTGGTATACCGCCATGGTTTCTCCAG
+ATGCGTAAACTTTTCTAGTATTTTTCCACTATAGCAGCAGAAGTTCTTAATAACGCTATC
+CAATATTGCTTTTTCAGCAGTTGTAAAAACTGATTCATCGAAAGCTTCAACGCTCTCAAT
+TGGGTCAAACCGATAAGATGAATACCTGTTATATACATCTCTGTAAACCGGTCCATGAAC
+CCATGCCTCACAGTCTTCTTCAAAAAGAAACCGTCCTTCAAAAGCGTAATAAAAGCCCTG
+GACATAATATAGTGCCTTTTGTAAAGCTAAAGGAGTTATGTCCTCGCACTTATAAAGCAG
+ATATTGGATAATTGAGTCCAGCTTCGAACCCGTTTTGTTTTCTTCCCCAAGCAGTTCCTG
+TACCTTCCGCTTACTTTTTTCATATGCCTGCAGAGATTTTAAATTGTCCTTATTTTTCTC
+CAGTAATTCTTTATAATACGCTGGATCATCATAAATCTTTTGAAGAATATCTGAATACTG
+TTTTGTAGGCATATCACCTTCACAATATCTCGAAAAAGTCATTTCCCCCCAACCTAAAAG
+CAATGATAGCGGACGTTTGCCAATATTGTATTTCTGAGGTATTTCTAATATCTTCTCCAG
+CGAAATAATGCCGTTTTTTTGACGGTACGTGTCATACAAAGCCTTTAGATTTTCGTCCTC
+TATATCCGCTACATAGACTTCGCTCCCACATTCCGTACAAATAGCCTTCTTTCCAGTATA
+CTCATATTCTTCGCCTTTAAGTTTACCCTTAATTGTTGCTGTTTCTACCATGTATTCGAC
+ATCTCTTCTGCATTCCTCGCAAAATGTCTTATTCCTATTCATAAGGCGGCCTCCTTTCAA
+ACTCTCTAATTTTCTGATTGATCATCGGAAAAGATAATCAATCGGCTTGTTTCGCTTATG
+AAACGATATAACAACCACTCGTTTTCCACTTTCACTATCAATTAGATTAAATTTCGTATA
+TATATCAACTAACTCCTCAATGCCATCAAAGTTAAATAACGTAACCTGGGGACAAAATAC
+ATATAAAACCTCATGTTCAAATCCTACTTTCGTATTTTGCAATGAATGGCAAAAATCTTC
+TGTTTTTATTTTCAGTAAAATCTCCTTTTGCCTTCTGCTGTTTAGATTATATTCATTTAT
+AAAATCTATGTTTTCTTGTCTATTCTCATTTTTTGATATAATGAATCTGCCCTCTCTAAT
+ACAGTCATGTATCATTGCCAAAATCTCATCAATCTGTTCCCAGGTATAATTCTGATTATA
+GTGCTGATTCATTGCATCACCTCTTTTGTGATACAATGATACTATATTATATGCCTTTTG
+TCAAGATTTATGCATCAATTAGTGCATTTTTATTTTGTTGATTTTTACATTAAAATATGT
+ATACTAAAGATAACAGCTCCTACAAGCTTATATTAAGCGCAATACAGTAGGCCATTAAAA
+ATACCCACTTAGGTAGTTCGTTCTATCTAAGTGGGTTTCCTATTTAACATGCTGCTAATG
+TTATCTTAAACTACTTCCCGTATAAAAGCAGTGCCAGATGATTAAGTGCCTTGTCCTTCC
+TACGGTACACCTGTGCTCTTTCAAGAAACAGCTTCTCTCCGATGTTTGCTACAGCTTCTG
+TCTTGCTCACATCATTAACAAAAAATTCTGTCAGTATAAACTGTTCTTCCTCCGACAGGG
+CTTCCCAAGCAGGCTTGAACCACTCCATATATTCTAATGCCCGTCTGTAACGTTCTTTCA
+ACACATCAATCTCGTCAAGGCAAGCAGCAAGGCGTTCTTCGCCGCTTTTGGGATTGTGTT
+TGCCCGGAACTCCGGTAATCTTTGCACTATGAGGGCTTGTCATACGGGTTTCAATTTCAT
+ATATATCCTCATCACTGTGTTCGATAATGTACTGCATGCTGCTGTAATCTTTCAAAGCTT
+CAACAGCAGCCGCTTTTTTATCTAAATACTGCCATGCAATCAGCATATCGCACCTCCAAA
+AAATCAAGATAAAAAACCTTGATCTTTGAAGCAGTGTGCTTTTTTTCGTTGCTTTGCAGT
+GCTTGTTTCCTTGTTCGTTATATCTTCGTTCTTTGCAGAAGGTCATGCTTTTCCAGAATA
+ACCTTCACCTCATCTACCGAATGGACAACCGCTGCCACGCCTCCGGCATTGAGGATTTTT
+TTGATGGTTGCTTCCTGCAGTTTTGTTGTCTTTCCCGATGGGGTTTTTACTTCAAAAGCT
+ATAAACCGCCCATTTACACAGGCAATAATGTCTGGTAGCCCGGCTGTGCCGTACATACCG
+CCATGTTCCTTCCAACAGAAACACCCCGGTACTGTCTTTAAGTACCGCAGGATTTTAGTC
+ACAATACTCTTTTCAGACATAACCGCTTATCCTCCAAAAATGTTACCTTTTCCCCTCTTG
+TTACCCCGGTATTTCTAAAAAGGTAACTTCTCAAACCCGCTTTACAAGCGCATTTGCGGA
+TTTTGTTACCTTGTTACCTTTTTTTGGGGTAGGTATAGACACAAATATTTATATTTTTTT
+ATTTTTTATTTTTCAAAAAATAATTTCATCTCTCGCGCGTATATATAAAGTTTAGGTAAC
+AAAGGTAACATCGGTAACAAGTGGCTATTCACCAGCGTTTCGGGCGTTACCTTTTTGTTA
+CCTTGTTACCTTTTTCAATACTAAAGAGGCTCAATATCTGTAATTTCAAAGCCGCTCACA
+TCGCATCGCTCTTTCAGTATCGAGAAATCAAGAGCCCACGCTTTTTTTGTTTCATTCCCG
+AAACGCATCGTTTTATTGCTCTCTATAAAAAAGTCACTTTGCCTCAATTGCTTCAGAAAC
+TGGTTATATGGAAGACATTCACCTGTGATTGCATAATCGCGTCTGTACTTGGTATAGCGG
+TCATATACATCACAGAAACGAATCCCGATAACCTTGCCATCTTTATCAAAAGTGTAGTCT
+TGATTCGGAGCCAGTTTCATCCGGGCCATGATTTCCAGGGTCTGTTCTACAATGGTCTTG
+TTATTGCTGCCGCCATCCAGCAAGTACTCCTGCACACCGTTTTGAAGATATCGAATACAT
+GCCCCTTTGTTAATGGGAAATACTTCAGCCCACGTTACATTAAGGAATTCACACAGTTTG
+TTTACTAGGCTCAATCCGGCATAGCAACAGGCGAGATTATTGACGATACGAGATGGAAAC
+TCATCAGATATCTCTGACTTTGCTTCCTCATACCACTTCTCTGCCTCAGCAACCGATACT
+CTGAGTGCTATATCCAGCAGGCTCCGACCGAAGCTGCCAAGCAGATCCGCTTTTGCACAC
+AGCTTATAAAATGCTTGTCTATGGCTGGCTGGTTTTAAGTCCTTCTTGCTGAATAGCAAT
+TCTATGCTCCGTTCTCTGATGGCCGCTTCATCCGGCGATTCCTCACCAGCTACAATAATA
+GGTGCCAACAGTTCATAAGTAACAGCACTTTGATCCGCCCTACCGCGGACACCTTCATGG
+CCGTCATATGCATCTCGAAGATGGTTGTATAAGGCATTTAGCCTTAACTTATCTATCTTT
+GAAGGCTTGAACTCATCCATCAACTGCGGTATAAGATTCGATGATGCAGATTCCTTCATC
+AGTGTAAATGCAGTAACCTGCGTAGACGCGCGGATTTTGCTGCACGAAAATACCGGCAGA
+ATAACCCGCTCCAATGTATTACTTTTTCCGCTGCCTTGTTCTCCGACAAGCAATAAATGA
+GGAAACTTGATGCCTGATTTTTTAAGATGCGGTTTAATGAAGCATCCGGCCACCCAGGCC
+ATTACTGATACCGTTTTTATGGGCTCGTTATAGCTGAGGAGCCATTCACCAAGCATAATA
+AGCTGTTTCTTTGTCAATGGCTCAAAGGTTAGGATATCGGTTGTTATGCTTTTATACTTA
+TCAAGCTGCACGATATCTTCAACAATGTTGCCTCCTGCTTCAATGGCACCATCCGTTGAA
+ACATATACCATCCGCCCGCCATGCTCATAAATCCCAAGAGCCTTGACCCCTGTTTTCCTT
+ACCCACTCCATTTCAGATATATAACCTTTCAGCAGTTCCAAATCTCCTTCTGAGCCAAAA
+TAGCCTAAGGATATTGTCCGGCGGTTCAAGATATTTTTAAATTTTTGGATGTTATTGAAG
+TCGGTAGTCATAAATGTCTGGCGGTATATTTCATCACGGATTGTAATAAGGTCAGCAGTC
+ATCTGCGTTTCATCTTCCGATACAATCATCTCCACCGGTTGAATGATAAAATTTGTTATA
+GGATACACACTTTCGCCTCTGGTGCGGTAATACCTGCCCTCATGTTCAAAGATAACTGAC
+TCGCTTTCGCGGCTGTATACATTCTCTGTGACTTCAATGGCCTTATCCAGTGTCTCCTGC
+CCATATGTTGCTCCACTTGCATGATGTACCGTATCCCACTTTTCCCGGAATAACCCGGAA
+TTTCTAAACAGCCTGTCCATCTGCTCTTTGTTTTTGCCTGACCAGAAAGCCAGCATACAG
+CAAAGAGCAAGGTCGGCTTCGGACTGGCTCGGATACCCTGCTTCCTGCCATTTTCCTTCC
+CATAGCAGTTCAAATTCCTTATGGTTTTCGGCTGTCTGGGCTTTCTCCAGAATTTCTTCA
+TCTGTAAGCGGCTCTAGCTTAAAATTCTTACGGTTTTTCTTGCTTTTCCCGCTCCGCTTC
+TTGCTTTTGATATAGTTCTCATGTATCCAGGCCAGTGCTCCGTTATCTTCGGCAATGCTA
+TCAGGAGTCCCGGGCAACGGGTCGCCGGTCATTGTGAAGTACCTGCTGTGGGCATACATT
+TCAACGCCGGTTTTAGTGTTTTTATTGCCCTTGGCAGGCATCTCCCCTTTATAGAAAATA
+TGAAGCCCAGTTCCTGAAGGGCTGATTTCCGTATAGGACGGAAACCGCTCAAGGATATCC
+TTGGCGGTATCGCTTAATTCCCCAGTGTTTTTGTCGCGGCAGTGATCTATGTCTATCCCT
+ACTAAACCTCCGCTTTTTGCGAATACAAAATCTAATCCGGTATAGAGGTATTGTTCTTTT
+GCCGCAATCGCATCGTCAAGGGTCGACCAGTCGTTTGGGTTAGTGCTTGAGGCTTTTCTG
+CCGGTTAAGGGATTGTAAGGGATTTTACTGTCTCTTCCGTCCTTTGTGTTTGGTTCCAGA
+CGCCAGCAGATCCATTGCTTCCGGTTTGCCAATTCTTTAGGGAATGAGATGCTCACTTAC
+ACTGCACCTCCTCGCATCGTTCATTAAAATACCGGATCGGAATGCTGCGCTGCTTTGCCT
+TTTCAATCTCAATGGACATCCCTTTAGTAATTTTTCTGCCAAATACCCACACTTCTGAGC
+ACTTTGACATCAATACCATGCCAAAGTACAAGCCCAGATTTCGCATTTGTTCATCATCGT
+CGTCCATAAACTGCGGAAACAAGAGGTGCGGAGCAATAGGTATGCAATTCCTGCTCACTG
+CAAAGCGGCAGTACCCCTGAGCCTTACGGATATTACGTTCTATATCACCAGCATATGGGC
+TGCAGATAAATACCATCGGTCTGTAGGGCGCTTTCCTGGCCTCTCGCTCAATCCTAAGCA
+GTGCTTCATAAGGTGTGGGGTCGTAATATCCTTCTGCGTTAAACTTGCTGATACTCATGG
+TATTACCCCCTGCCTATGCGCTTTTTTGTTCACGTTCGATTACAGGCAATATACCTTTCT
+TGTTTTTAAGAAGGTCATAGATAAATAGCCTTCCTTTTTGTGTCCAATATGTGTGCATTA
+CGCTTCTTTCTGCATCAATAGCATGAGTCTTGGACTGCGTGTATCCTTGATCGGCGTACT
+CCTGATATAAAAGCCAGCAGTTTCCCATTTTGTACTGTACTCCAAGCTCATGAAGCAGCT
+TATTGAAAGCGCGGCCAGACATTCCGTAATCCTTGGCAATCTTGCTGATCGGCACAAGGC
+TTTTATTTTGCAATATGAGATCATAATAGCTCGCTTTGGGCTTCAACTCACTGATAATCT
+GTTTATTCTTTGCATTTTCTATTTCTAAAGCTTTCCGCCTGTCGCGTTCTGCCTTTAGTT
+CAGAGAAAATCCTGATGCCATACTCCGGATTAGAAATCATCTCTTCGATAACTTTATCTG
+TAGCATAAACTCCATATTTTCTGATCGTGGGCAGCACTTCATCAAAGACCCATTTCTCAA
+AGCGTTCAGCTGCAGGAAGTTGGGATTTAACTATCAACCGGAACAAATCACCTTCGGGAA
+TATAATTTATGTTGATGGTTTTTTCAGGATTTTGCGGATGAGGTACCTCACGTTTTGTTA
+GGTACTTACAATGATCTATTACTGCCTTGTGTGGGTTACTGTATCCCAGCATCCTTGCAC
+AATCCGTTGCAGGAAAGTATTCCTTTCCATCAATAACGAGTACTTTAAGTTCTCCAAATT
+CTGTATTCTTAAAAACCTGTAAATTAGTCATAATATCAATCCTCCATTTCTTTCATTTCT
+CCAAAATTTCTTCCTACCGAAGCCTCTGCCACAATAGGTACATCAAATGCAGGGAAGGGT
+TGTGTTTCCATACACTCTTTTATAAAAACAACTGCTTCGTCCACCTTGTCTTCCGGTAAT
+TCAAAAACCAGCTCGTCATGTATCTGCAGCATAGGTTTCAGCCAAAGCCTTTCGGGAAGT
+CCACTGATGATGCGCCCACAGGCAAGCTTTAGAATATCTGCCGCTGTACCTTGAATAGGT
+GTATTTAATGCGCACCGCTCGGCAAACGACTTCTTGCCCCAATCTGATGACCGAATTCCC
+AGCAAGTATCTTCGCCTGCCCAGCCATGTTTCTGAATAGCAGCTTACAGCAGCCCGCTTT
+TTTACCTCATCCTGCCATTTGGCAAGACCGGGGTATCCGGATTTCAAGTTTTGAATGATG
+GTCTCACATTCAGCCAAAGTTGGGTTTATGCCAGCTTTAAATTTTAGTGTCCTCTGTAAG
+CCAGTGGGAAACAGGCCATAGAACACACCGAAATTGCAGTTCTTTGCGATGGTTCTTCGC
+TCTTTATAATGCGGAGCATTTTTGTCTGCTGCCTCCTCAAAAGGAATGCGGTAAATAACA
+GAAGTGGTCTGCGCATGGATGTCACCGCCTGTACGATAGGTTTCCAGCATACGTTTGTCC
+CTGCAATAAAACGCTCCGACGCGCAGTTCTATCTGTGAAAAGTCAAGGGATAAAAGAACC
+TTTCCGGCTGGCGCAATGATAAATTTTCGTACACCTATTGGGTCATTGTCTTTCTGCGGA
+CAATTCTGCATATTCGGGTTTCTTGAAGCAAACCGCCCTGTCTCTGTCCCCAGCGGCATA
+AGATCTGGATGAATCCTGCCGGTATCCTCATCAATAAATCGAAGATAACCGTCTATATAG
+GTGGATTTGAGTTTTCCCCATTTGCGGTACTCCTGTACCAGCTCAAATAAGCGAACTAGC
+TCGGGCCTGTTAGTTGCACACCATTCTTTTAACAGAATCATGGTTTCATCATCGGCAGCT
+TCCTGATGTTTTGCGGTTGTTTTCATAACCGGAAGGCCAAGATCCACAAAAAGATACTTC
+TTAAATGCTGAAGTTGAAGCATTTGCCCCAATCTCTACATTGCCGATAATTCCGGCAATC
+TCTTTTCTGATACTGACAATCTTTTCTGCAGCTTCCGCTTGTTTCTTCAGCATGGCTGAC
+TTATCCACCAATATGCCGTTATACTTCATTATCCCGACATATACTGATGTAGGCGATTCT
+ACCTCTTCCACAATCGTTCTGTGTTTGGGTAAAAATCTATCAAACCACTGATTGAAAACA
+TGATACAAGCGAAGAGTGTAGTCGCTGTCAGCACAAGCGTAGCGGACAGTCTTCTCATCC
+TGAGGGTTCAATTCATCGAAAAACCGACCTTCAGTAACCGTTGAGAATTCTGTCATTTCT
+GCTTTGCAGAGTGCAGGCGCAAGCGTTTTAAGTCCGCTGTCAGCAAGACTTCTGAACTCC
+CACTTGCTTTTTAATGTAAGCTGTGATGCTGCAATCGTGTCATAGCAAGGCTTTTGAAGG
+ACGATACCTCTTGCGTAAAGGAACATAGACTCAAAAGCCAGATTATGAGCAACTTTTATT
+ACATCTTTTGATTCGAATAGTAATTTCAGATAATCCCATATTGCCGCCTGGTTCTCTGCA
+TTTCGCCCGCTACGATGTTTAAGTGGAACATATATAGCAGTCCCTTCTGATACTGAAAAA
+CTGATCCCTGTAATATCTGCTTTATGAGCATCCAGAGCTGCACTTTTATCGTTCCTCCAT
+TTATCGCGGGGTGACGTTTCAAAGTCGAAAGCAAATAGGACAGTGTTTTTCAGATACTCT
+TTTATTTCAGACAGCATATAAACACATTTGTATCCCATGCGGTTCTCCTTTCCGCCCTAT
+CGGAGATGGAAGTTACTCTCCGATAGGGCCTTTGATCACTTAAGCGGCTCAGTAATTTCA
+CCTGATTCAGGGTCTACATTTATTACCTCTTCACCGGCAGGTTCAGTGTCATGGCCGACT
+CGGGTACTGAATGCTTTGACCTGCTCGGAAAGCTTGGATATCAACGCATATTCGTCAGCG
+GTCAGATCCCGATCTACAGCAAACTGGGCCTGTGAATAGGTGATACCGCTTGAATTGGTC
+GCCTTTTTCAATGAAAAGCGGGTAACTACGCTGTTCGACTTTTTACCTTTAGAAAGCAGC
+CTTTTGATGTAGCGGGAAAACTCTTTCAACGATCCTGTTGGCAATGAGAGTATCAACGGG
+AAAATCTCCCCTTCACGCAGTACATATATCCTGCGGCGGTTTTTGCAGGCTTTGCTGCCG
+TTTTCCCCCGAACCGAACTGATTATATGGGCATTTGGCACAGCTTCCTCCGGGGTCTCCT
+TCGCCGGTTATACCATCAAAGCTTCCGCAATCCGGTGGGTTACTGCCTCCGGTATACTTG
+TCCTTGTAGTATGCATAAAGTGGATGATGATAAAGGATTACCGCTGAGAATTCCTTGACA
+GTATCAGGTTCTCCGGGATTCTCACCAGGCACTTCAAATACTGTGCTGCCTGCGGACGGG
+ATTTTTATGCGTTCAAAAGTCATGTCAAGACCGTCAAGTTCTGATGCCATTGCCTCGTCA
+AGATTGAAATCAGCGAGCTGAAGAAAACCTGTATTTTCGTTAATAGTTACGAGTTCATTG
+TTTTTCATGCTTTTATACCTCCGTAATTATGAATTTGGAATGTAATCTATATCATTGTTC
+TTTGAAGCATTGTTCTTCGAACAGTTATTCCTTGAACATTGATATTGGAGCATTGCTTTC
+TGAAGCTATTTACCTTGCTGCTTTCCGCACAGTTACTGTTGTCTTTTCGAAGACATTCAC
+AAGGCCTTTCAGCCAGTCCGGAAGCTCGTCCCCATTCTCCGCAATCTGTTCTTTAACAAA
+TGCTGACAGGGAATTTGCATTTACTGTTTCATAGATGAGTTCTCCAAAGCCTTTACTGCG
+TAGTGCGTCAAACAGTTCCTCCTTCATGCCTGCGGCAGCACTGGCTCTTGTTGTCGTTGA
+AAGGCAGAACATTGTTCCTGCTCTTGTGAAGTTTTGCGTCTCACTGCTGATCATCAGCTC
+AGACAGACGGTATTCGACATCGTCAATCTCCGCATTTATGCTTTTCATTTCCTCTTCCGC
+GGCCTTTTTTGCATCGCGAAGCTCCTTAAGACGGTCAGCAAGTTCAAACATCGCATTATC
+GCTCATAGCTTTCACCTCCCTCTGGGGCAAAAGGATTTGCTCCTTTGCGGTAGTCGTCTA
+TCAGCATTTTTGCAAGATCTGCCTTATTGCGTAGGGCAGTCAGGATTTTTGAATCCACAG
+TACCCTTGGCAATAAGGTAGATATATGTGCAGCCATTCTTCTGTCCAACTCTATGGATGC
+GGGCCTTTGTCTGCTCGAAATTCGACATGGAATAATCAAGGGAGTAAAATACCATTGTGC
+TTGCAGCAGTCAGCGTAATACCGAGTCCAGCGGTTGCAATCTGGCCTACAAACACCATGC
+AGTCGGGATCATATTGAAACCGGTTTACTTGTTCTTGGCGATCCTTAGTCGCACCATAAA
+TACACGCATAGCCGATGTTCTTTTTCTCCAGCAACCTGCATATAGCATGAATTTCAGGGA
+TAAACCTTGCTATGACAACCAGCTTATGTCCTTCTTGAATACTGCTTTCAAGGATATCTT
+CAAGAGCTTTCAACTTGGCATCACTGACTTGCTCGATTTTCCCACCGTCATCGCTTCCGA
+TGAAGCCGCCGGTTAATTGCGAAAGACGAAGCAAGCGTGTCAGTATGTTTGTAGCTGTTA
+CTTCTCCTGCTGACAGCTCAGTATAGCTTTGTTTGACAAGCTCTTTATATTTCTTTAAAG
+TGACAGGCTCAAGCTCAATATGGCGAATAATATCGGTGGTTTCCGGCAAATCCAGACACT
+CCGCTTTGGTCGCCCGGAATGCAATGCTGTGAATCCTTTTCATCAAATCCTGTTCCATTG
+ATTTTTTCAGCACTGGCGTATGGTTGCCATAGCCAACCATATTGAAATACCGGTTTCTGA
+AGGCATAGAAGCTGTTACCAAAGATGCGTGGATCGAGAAACTTATATTGGCTGAATACAT
+CTATGGCTTTGTTGGTTATAACCGTTCCTGTCAGTAAGAGCCGATACCGGGCAAGCAAGC
+CTAACCGGTGCATTGCCTTTGAAACAGAAGTATTATGAGTTTTAATTTTGTGTCCTTCAT
+CAGCAATGATAAGGTCAGGATGCCAATTAGCCAGTTCCTTTTCCATTCTCCATGCAGATT
+CATAGTTGACTACCACCACATGGACACCTTCGCCAGTTAAAAATCTTAGCTGTTGGATTT
+TCTTTTGAATCGTGCCATTAAGGACTATAAGCTGATATGGGAAATCTGCGAACCGTTTAA
+ACTCGTCTTCCCACACTCCCAGAATGGAAAGTGGCGCAACAATCAGCACACGTTTTATTC
+TTCCTGCAGCAAGCAATGCTCCTATAATGGCGATTGAGACAAGAGTTTTCCCGGTACTTT
+TCAGCCCATTTCCATCAGGAGCGCTGCACCCCATCCGGAAATGGCAGAAACACCACCACC
+CTTCAAAAGCCCAAATAGACTGCAGATGAAATTGAAAGCACGAATCTGATGGTTGTATGG
+TCTGCCCTTTATGGGCATTGGAATTATTGACAGCGTTTTTGCATTGTTCATAGAGTCTTG
+CATCTTATATCCTCCATCCTTCAATTTTGAGGGTTGGCCAACTCTCTGACTCAATGCTAC
+CTAAAATGCAAAAGCATGTCTGGACATCTAAAGTCCATGTTTTGGGCAAAAAAATAGCCA
+TTATGCAGTAAGGTTTTTGCACCTTTTTTGCATAATGCCTTAAAATCTCATTATAATAGC
+CGGTTTAAAATATAAAAAGTTGGACTTCAGAAGTCCAACAATTTTTTTAACTTATCATTT
+CTTTATATGCCTTTGCACAAAGAGGGGAAAGTCCCAAGGCTTCCAAAACTTCATTGCATT
+CATATATTGAATGCCCTCTATACGAATGGATTAGCTTTTTATACGCCAATTGCTGTGGAG
+TGTTATTGAGAGTATATCCGGCAAGCCTTAATATTTCTTCACTGTATGTAGGGCTTAGCT
+CCAATCCGATGCAGATTGCAACAACGGTTTCTAAAGTTGGATTGTTAAGTTCATTGTTTT
+TTATTCTGTCATATGTTTTTCCTGAAAGCAAAGTCTTTTCTATAAAAACAACCTTATTGT
+AGCCTTTCCTTTTGATATGTCCGTATACCGCTTGGGAAAATGTCTGGGTTGTACGGCTCA
+AATGCTGACCTTCTTCGACGAATTCTTCGTGAAACTTCTTTAGCTCTTCTGAACGATTAA
+ATACTTCCATATTATGCTTGTCCGGATTAAATGTCGGCACTCTGTTATAATCCGGTGTAG
+CTTTACGGAACATTATAGAATCGAGGTATACTACAATGTCCATTTTTGAGGCTTTATTTA
+ATTTTAAATCAAACAGAAGGCAGCATTCATCTACATGCAGTTTTGCATAGTCTGTAAGAT
+CAATGCTTCCATTTTCTAACTTTTTAATGTATTTGGAGTCGTTAATAACGTAATGACCAT
+CAACATAAATAAAATTACCGCTGTCTATAATCTTTGCGAATTCCGGATTTGCATAGTATT
+CAAAAAAAGAATCACTTAGGCTAATACTGTATGTTTGATTCTTATGTAATGAGTCTGCCT
+TAAATGAATAATTGCTGATAAAATGGTCATCTACGTAGGTATATACACCTTCAACTTCCT
+TATATCCAAGGTCAAGCATCCTTATTTTGGCCGCTATCCTTGACACCTGGAAGAAGTCAG
+CTAATTCATACACGACATTTTCCATTATATTTAGCCTGTCGTAAGTACCAAAAAGGAGCT
+CATTCTTTTTAATTAGCTCCTCAATCTTTTTAATGGTCATTGATCTAGGCATAAGGATTC
+GTGGTGCAATTCCGTTAGCATGCCATTCCATCCAGTCTTCTGGCGTCCATTGCTGTTTGT
+ATTTAGTTGTTTCGTTTACCCTGCAGCTTATGAGCAAAGCATCGCTGTTATACGTCTTAA
+CTAACTCATGGTATTTTCTATGCTTATACCAGTGGACACACTCATGAATAATGGTATTGT
+TCATGCACCCTATGTTTCGCATGAAATACACATTAGGATCCACGAGAATTGTTCCTCTTG
+AAACTTCCAAAGGCTTATATGTTCTTTCATTTCTGTCGTAATACTCTATTGTGCAATCGC
+CAAAGACTATTTGACCAAATATAGTGAAATGCTTTGTAAGCTGGATTTCCTTAACCTTAA
+GCCCCATTCTTTTCACTACTTCATCTACTGGAATGGGCATAGGAGTACTTAATGCTTCTG
+GGCAAAACTCATTTAGAAATTCAGTAGCAACATTGTCAAACTGTTCCTTTTCTATAATTG
+GTACTAAATACTCAGACAGTCTGCCTAATTTGCTTTCTCTGTACTTGTTGTATATTGAAA
+CAGAGTTGATTTGAAAATTCTGAATTCCGTCATCAAGGTCAGCTCTGCAGGAGATACGGA
+ACCATTGTTCTATACCATCAGTCTCGCGATTCCTTCGTACTGTTTCTGCAATTTCAATTT
+CGGCAGAAACAATTACGTCAAATAAAATACTGTTACCTGGCGAGTCGGTTATATCTATCG
+TTATGATGTCAAAATCAGATAATGCTGCTTCATCCGGTGATTGCACATGGTATGAGTTGG
+ATTCAAGCTTATCCGGGTTGTCCTCTATATATTCAGACAATTCGTCAAAGAGATCATTGT
+AATACATATTTGCAATAACATCTCTGAACGAGCTGACGCTTGCCATACCGTACCTCCCTG
+ATTACCATCATTTCAGACCAAATATTTCCTTATGTAAATTATAGCATGAATTTCGCAAAA
+CACAATAATTAATTTGCGGGCTCAAATTTTTATTGTGTTTCAGCTTACTTTATGATATTC
+TTTATAGCGAGCGAGGTGACAATTATGGCCGTAAGCTATAAAAAACTATGGAAACTCTTA
+ATTGATAAAGATATGAAAAAGAAAGATTTAAGAGAAGCGGCTGGTATTAGTACATCTTCT
+ATGGCAAAACTGGGTAAAAACGAAAATGTTACGACCGATGTGCTTGTGAAGATTTGTAAG
+GCATTAAACTGCGATATTTCAGATATTATGGAGATTGAGCCAGATGAATAGGTATCAACA
+GCTTTTACTTAATAGTTAAGCAACAATGACGCTAATTGAATTATTATGAAAAAACTTAAA
+TTAATAAAATTTTAAAAGTGAGGTTATAAAGATGTATAATCAATTTTTTAATACTGTTCT
+TGAAGTACTAAAATAAAGATGATAAAATGTATTCTGATTACTAAGAAGGTAAGTAATTAT
+ATATAGATTTCTTTGCTTACTAAATTGGAAAGAGATTACAGCCCAGAGGTTGTATATAAT
+GCTCCCCATTGTCAAGACAGTTTTTTAGCTTTTCTAAGTTAGTTCTCCTTTCTTAATTTT
+GTATAATCTTTACAACTGTGCACTCTGTTGGAGGATGTCAAGGGCGAGCGTAAGCGAGTT
+CATCTTGACCCTTGACATCCTTTGGACATATATCCTTTTGCTTTCCGGTCTGTTATGACA
+GACCGGCTGCCTTCCGGTGAGGACGGGGTTTGGGGCGGAGCCCCATAATTCTATACAACT
+GCCAGTAGCTGGTCATATCCTCCAAAGTAATACTCTGCCGGTGTTTTGTAATCCAATGAC
+TGGTGCGGTCTCCTATGGTTATAGTGCTCCACATATTCCTTTGTGATTTGTCTAAGTTGT
+TGTACCGTTTCGCACTCTTCAAGATAAAGTTTCTCCCACTTGTAGGAACGGAAAAATCGT
+TCTATCCTTTGGTTGTCTAATGCTCTTCCTTTTCCATCCATAGATATTTTGATACCGTTA
+TTTTTTAATAGATTTATGTAATCATCACTGGTAAACTGTGAGCCTTGATCACTGTTCATG
+ATTTCAGGCTTGCCATATCGCTTTATGGCCTTTTGGATTGCTTCTATGACGAATGTCTTA
+TCAAGAGTGTTTGATAGTTCAAACCCAACAATATACCGAGAATACCAGTCTATTATTGCA
+ACCATATACATGAAACCGCGTTTCATTCGGCAATAGGTCACATCTATGGACCATACCTGA
+TTAGGATGATCAATTTTCAAGTTTCTCAACAGATATGGATACAAATTCTTACCATGTATT
+CGTTTGCTGAGGTTGGGGCCAGGACAGAATCCATGTATGCCCATTTCCCTCATATAACGC
+CGGGTCCGTTTTCGATTGATATGAATGTGATAATCCTTGTTCAATATACTTGTCATCCTG
+CGATAGCCATATTCCGGATAAGACGCGTAAATTTCATCAATGATACGCTTAATCAGGTAT
+TCCTCCTCATTTACCGGAGCAGGCTTGTAGTAAACGCTCGTACGGTTTAAGCTCAATAAT
+TCTGCTTGCCTTGTTATGCTGAGTTTCTTCTCATTTCTATCAATCATTTTCATGCGGTCT
+TCTCGGGATTTAGAGGAGGCCAGATTTTTTTTTAAGCCAGGCAACCTCATATGATAGTTG
+ACCAATTTGCTTAAGCAGTTCGTCCTTCTCCTTTTCAT
+>NC_009012.1|provirus_2022140_2067593
+TTAAATTGCAACTTCAATCTCCGTGCTATCAAGCAAACTCACTATTATCTTTTTTCCATC
+AAATACTGTCATTTTCTCTATTATTCTAAAATACATATCAACATCAAACTCCTCTACTAT
+CTTTGCATCCTTTAAAATTTCAATAAACTGCCTTGCCTTATATCTTTTAAGCAAGTTATC
+ACTTTTAAGTCCTTCCTTCCACTTCTCCATAAAGTATTCCTTATTCTCCACCATAGCATT
+AAATGTATTTACAAAGGCATGATATAAAACCTTGTCATCTATATGCTTATTCTCACAGCT
+CTTTTTTCCCTTTACTTCATATTTTTTATTACATCTCCAAACCACTCTTCTTAGCCTTTC
+ATCAGTAGAATTCCATACCTTTCTTCCAAAGGCACTGCCGCAGTGTCCGCAGATAACTCT
+TCCTGCAAAGGGATTATCTACTGTGGCATAATCAAGCTTACTGATGTTATATTTTTCAGC
+AAAAGCTCTTCTTCTCTCCATCTCTAGCTGTACCGCTTCCCAAATTTCTTTATCTATAAT
+TGCAGGATGGCTTTCTTCTACATAATACATTGGAACTTCGCCATTGTTTACTGCTCTTTT
+TTTGGTTAGAAAATCAACAGTATATGTCTTTTGGAGAAGTGCATCTCCTTTATATTTTTC
+ATTACTTAAAATCTTTCTTATACTGCTTTCATACCACTTAGGTTTTCCATTCCAGTTAGG
+AACACCTTCTTCTTCAAGTTCCCTTGCAATTCTGTTTGCACCTTTACCGTCAAGGTAATC
+CTTATATATTCTTCTTACAATTTTAGCCTGCTTTTCATTTATCACAAGATTTCCTTCTTC
+ATCTTTATCATAGCCTAAAAACTTTGTATGATTTATATGAAGCTTTCCCTGTTCAAACCT
+TCTCCTTATGCCCCATGTAGAATTTTCACTTATACTTCTTGATTCATCTTGGGCAAGGGA
+GCTGAGGATTGTAAGCAGTACTTCTCCCTTTGAATCTAAAGTATTAATATTTTCCTTTTC
+AAATATTACTCCAATACCTAATTCTTTAAGCTGTCTTACGTAGTTTAATGTATCAAGTGT
+ATTTCTTGCAAACCTTGATATAGACTTGGTTATTATCATATCTATTTTCCCTGCTTTGCA
+GTCTTCTATCATTTTATTGAACTGTTCTCTCTTTTTAGTGTTTGTCCCTGAAATCCCCTC
+ATCTGCGTAAATTCCTCCGAATTCATAATCTGGATGATTTGTTATATAAGATGTATAATA
+AGCTACCTGTGCTTCATAGCTTGATAACTGTTCTAATTGGTCTGTTGATACTCTGCAATA
+AGCTCCCATTCTCTTTTTCTGCGTCTGTATTTGCTCTGCCAGATTGTTTCTGTTTGCTCT
+TGCAGGTATAAGTGTAATATTTCTTGCCATCCTTAACTTCCTCCCTTACAATTATTGGTT
+CTTCTATATTAAGCCTGCTTATAACCTCATCATCAATTGATGTTCCACTGCAGGCGTCTT
+TTCCGTTTTTAATATAATTACTGCACTGCCATACAATCTTTCTGCAATTTAATTTGCTGT
+TCCAAGTTCTTCTCCTTAGAGTAGAGCCGCATTTACTGCAGAAAAGCATTCCTGTTAATG
+GATATCTGTTTGTATATTTTTTTGTATCTCCTGCTTTATTTCCTTTTGCCTTTGCTCTTC
+TTGCAATTTCTATCTGAACCTGCTCCCACATTTCTCTTGAAACTATGGGAGAGTGATTAT
+CTTCAATATAATAGCTGTCAATTACGCCTTCATTTCTAACACTTACTTTTCTCAGATGGT
+CTGGTGTGTAATACTTTTGAAGTATGGCATCTCCCTTGTATTTTTCATTCTTGAGGATAT
+TTAAAATTGTACTTTCCTGCCATCTGCCGCCTGCAACAGTAGGCACTTTATCTTCATTTA
+ATTCTTTGGCTATGGTAAATGTTCCTTTGCCTTTTAAATAATCTTCAAATATTCTTTTAA
+CTATTTCTGCTTCTTTTGGGTTTATAACTAAATCGCCGTATTCATCCTTGTCATAACCTA
+AAAATCTTGTGGTATTTATAATCAGCTCTCCTCGTTCAAACTTCTTTTTTACCCTCCACT
+TTAAGTTATCACTGATATTTTTACTTTCTTCCTGGGCAAAAGAAGAGAGGACGGTTAGCA
+TAAGCTCTCCATCCCCTGATAAAGTTCTGATATTCTCTTTTTCAAATATTATTTCTACAC
+CAATGTCCTTTAGTTCTCTTACTACTTGAAGCATTATTGCTGTATTCCTTGCAAATCTTG
+AGATAGATTTGGTGATGATTAAGTCTATTTTCCCTTCTTTTGCAAGATTAAGCATTCTTT
+GAAACTCTGGTCTATTATCTGTAGTGCCGGTAATTCCTCTATCAGCAAATACACCTGCAT
+ATTCGTAATCAGGATTATTTGAAATCAGATTTTCATAATACTGGATTTGATTTTCTAAAG
+ATTCACCTTGAGCATCACTGCCGGTTGAAACTCTTGCATAAGCACAAACTCTTTTCTTTT
+TATTTTCCTTCTTTTTTACAGGTTCAATAATCCTAACACGCATTCTATATCCTTCCTTCT
+ATCAATTTGGTACTACTATACATCACTCTAAAGGTGATAGAAGTCAAGCTAAACAAAAGA
+AAAGCCGCTACTTTAATTAACGGCTACTTATTAAATATCATAATTACAGCATCAAACCCT
+GCTGCCCTAAGCCTTTGCACCTGCTTTTCAGCATTTTCTCTTGACTTATATGAACCTGCC
+ATAACCCTGTAAAGAGTCTGCTCGTTTTCTACTTGAGCTTTTGCTGAAGGTTCAATATAA
+CCAATACCTAATTGTGCAAGAACTGCTTTAGTTATAGCCTTAACTATTTCATTTCTCTTT
+GAATCAAATAAAATATTATCTCCTGTGTTATCAATAAAACCTATCTCTATTAACACTGCT
+GGAGCCTTGGTTTCTCTTAATACATGATAGTTAGCTTCCTTAACTCCTCTATCTGTAAAT
+CCTAATGCTGCAAGTGATGTTTGTATCCTTTGTGCTAATGCTTTTGATTTTGCTCCTCCA
+TTTAAATATGTGTATGTTTCAACACCTTTTGCCTTTTCTGGATCATAAGCATTCCTATGA
+AAAGAAATGAAGTAATCATAGTTATTCCTATTTTCAAAAGCACTTCTCTCATTAAGGCTT
+ACTGTGGCATCTGAAGTTCTTGTTTCATCAACTGTAACTCCATGCCTTCTTACCTCTGCT
+GCTACAGCTCTGCCTATGCTTAGAACATCATTGCTTTCCTTTCTTCCCTTATATACTGCC
+CCTGAATCTTGGCCACCGTTAATGGCCAGGATCAATCATTATAATCCTTGGCATTTAAAC
+CACCCCCTCAATAAAACGACCCAAGGAATCTCTTCTCCTTGGGTGTAAAATATTGTTATG
+GCATCTAGCACATACAACTTGTAGATTATTTAAATTGTTATTATTTCTATTCTTATCTTT
+ATGATGAATGTGCAGACGTGTACCTTCTTCTTCTTTCCCACAAACTTCACATCTTTTAGG
+CTTATTTGCAAGTGCTATCCTACGCCAGACATCACCTGAGATGAAACTGCGTCCATCTAT
+ATAACTAGGTGCTAAAGAACCTTTCTTTCCATACATAGGATTATTTTTTCCTGATACATC
+TGCATGATTAACACTTATTTTTAATCTAACTTCTGATTGCCAAGCTGGATTATCTATTTT
+ATTTCTATATGACATCCTACACGACTTTGAACAAAATTTACCTCCATTATTTCGTATTTG
+GGACTTATATACATAGAACTCATCATCACACCATTGACAATATCTTTTTATCTTAGTCAA
+CCTTATCATCCTCCTTATTTAGCTGTTTTAAAACATCCTTTAGTTTCTCTGGTATTGGTA
+AGCCTATCTTAGCAGAGTTCTCTATAATGCTTATTCCTTCATTGGAAATGTAGAAAAAAA
+TAACAGCAGTACGAATCGCACTACCGTTTTTAATCAAATGAACATCTACTATATTTCCTA
+TGCCCACCATTACAAAAATTAAAACTTTCTTAAATATCCCTCTGAATCCTACCTCACTTG
+ACAGCTTTCTTTCCAGCACTGCTACCATGAGACCTGTTACATAATCAATTACAACAAAGG
+TAATCAGTGCATACATAAAGCCATCAACCCCTCCTAAAAGCCAGCCAATATAGCCGCCAA
+TGGCAGCAAATACTGCTTGAATAAAATTAATTGAATTTTTCACTGTAAATCCCTCCACTC
+TAATAAAAATCTTCTCCATAGTTAATTAAATCTACTTCAAACATATACTGAACTTTCATT
+GTATTTGCTTCAGTTTTTTCAACAGGCTGTGCAAGCTTGGTATGTGCTCCAATAGGTCTG
+CTTGTTAAAAGGGCTTGGATACATAATTGAACATAGTTGTTATAAGCATAAGTGTATCTG
+CTTATCCATCTGTCAGTACCAAGGATATTATGATAATAATAATTACCATAACCATTTGGA
+AAACTAAAATACATTTTATAGGCTTCCAGTAAATTCCCTTGAGGAGTTATAACTTGATAA
+AAGCTTGTACCCCCTTGAGTGCTTGTGTAATATAAATAAATTCTATTGGCACTTCTATAA
+AAATTATAAACATAGCATCTTCTCTCAATATTTCCACTATCCATACCCTTATTTCCAAAC
+CAAGTGCTATTACCAATCTTAGGTTTAATATTCATATCCTGAACCTTGTTTCCTGCGGCA
+TCTACTCTAATCCATCTGTTTGTATAAACAGTTTCATTAAATTGGCTGTCTGTTCTTGAG
+GTGTATCCAATAATATCAATGCAACCATCAAGATAAATTCCATCACTAGAAACTGTTCTA
+TATGTGAAAGGTACGTTATATGCTGTATCCTTAAAACTTTGGCTCATATTTATATCAACA
+TAGCTTAATTGAACTCCTACCTTTGTCCACTTATATATTCTCATATATCTTTCACTATTT
+ATGCTGTAAAGGTAATACCCAATAAAAATAAGCTCTCCATCTGGTTGAATATACGGGCAT
+ACATGACTAAGTCCATCGTATTTTCTTACTGCATGACTACTGTCAATATTTAAGGCATTT
+CCATCTGAATTTAAAAGTTTAACCACCTTATCCCAAAACACAACATCATTTGTATTTATA
+TCAAATGGAATCATAAGCCATTGTCCTTTTAAGCTGTCTGGAAATTGAATATAGCTTGAC
+TGTGTTATGTTTGTATCCCTTGAATCTGCTAATATCCATCCCTTTGTTGGACTTGTAAAT
+TTTATAGTTCTTGCATAAGAAAATAAAGTATTCACTGCCCAATACCTTTTAGGATTTGTA
+GTATTATATACAGCATAATCTGAATCTGCTGTTTCCCTTCCATAGATTGCGGTTCCCGCA
+TAAAAATAATCCTTATTATCAGGGTCACCCTCTGCCCAGTAAATACTTTCAATTTTACCG
+TTTGCCGCATGGGTTGGAAAGTCAAATACAAAATTCATCTTTATTTTAGAATCTGTAACT
+TCAAATTTTGATTCTGCTCTATTTATAGTTCCACGCCTTGTATCATTTCCAGAGTAAGTA
+TTATTTCTATGGGCAAACCCTATAATATTTCCCATAACCCTTTGCTCATTAACATTTTCC
+GGCTTATCATTATCAGTTAAGTATAAGTATTCAAACCAGCTGTAATTATCACATCTTCTT
+GTATTTCCTGCACCCATAATACCTTGAACAAAATGTCCTAAAAATGTATCTTTAAAATAT
+AAATCCGGTATTAAGTTTTCTGTGTATGCCTCTCTTATTTTCTCCTTAGTTTCTGCATTA
+AAAAGTTCTAATAAAACCTTTCCTTTAATGCCCCTCTGTCTTTTACTCTTTTTACTTTCA
+GAAATCTCACCTGTAAGCAAATCTTTATTGTAAGCAATACTTTCGTAAGGCTGTCCCTCA
+ATAAACATATCATCACCCCTCAGTTGTAAAGAATTTTCATCTTCCTTAATTTACACACAT
+CATTTAATGTAGGTTTTTCTAAAATATAAGCAAACCTCAGTTTCCTATTTTGAGCAATCA
+TTGTATTTAAAGCTGCATAATCTAAACTTGTAAGTATTGTAGGATTTATCCCATTTACAA
+GAAATGCAGCAGAATCTATAATATCAATACTTTCAAAGCTTGATGTATTGATATTATAGG
+TAAGCCAGCTTAATCCCGAATCAACACTTAAAGCTATTCTAATTCTGCCATTGGTTGTAA
+CATCATTTAAATTTGAATCTTTCTTAGTGTACTGAACAATTGCTTCAAGTTTATTTATGC
+TTTTCCCATCATGTATGTTAAAATCATAGTTTTGAATAATTACCTTTGGCTTACTTGTTA
+CTGTCTTTTCAATAAAGAATCTATTGCTATTTTTATTTGCCTTAACATCTGGATTATCAG
+TATAGATATAAAGAGCAGGTGAAGTGCCTGAAAGTCCTGCCATGGAAGCAGGAAGAGTAT
+CAACGCCGTAGGTTTTAAACATTTCTTCTGTAAGAGGTAAATCTCCAATTTTAACCCATG
+TACTACCTTGATAGTTTTTCACTCCTTCATTATCCACCATAAGAAATTTTGTTATACATG
+GAATATATGAACCTTCCTGCACTATGTAATTTTTACCCAGTGGGTCTGATGGAGTGAAAA
+TATATGATTTTCCCGCTGTTAATGCCAATGATTGAGTGCCTACATTTGGATTTACAAAAC
+TATTTGTGCCGTTATTAGGTATCTTCTCAACAACAAGCCTTATTACTCCAGTTTCAAAAA
+TAGAAAGTTCCCAAATAAGGTCATTGCTGCCCCAGTTGCTATAGGAACTGTTTCCTTCAA
+ACCTTATTCTGAAAAGCTTTGTGCTGTATTCTACTTCACTGGCATAATAAAGGTTATTAT
+AGCTGGCATCTCTTCTGTTAATACAAAGATGTTCTGATGCTCCCCCAAAGCCTACCCAGG
+TATTACCGCTTGTGTAAAGCTGTCTTATGGCTAAACCATTGTAATTAAAGTTAAAACCAA
+TGTCAGGAAGAGTTACTGTACTATCATCATTTCTTGTACCATAAAGTGTCATTCCTGCAT
+TTCCTTTTGGAAGGGACATTTGATTTATAACTGGCATTATCCTCTCCCCCTAACCTTGCT
+TAAGATATGCATTTATTGCAATCAAATCCTTATAAAGTGTTGTATCCCGCACATTTGCAG
+CATAAATTACGCCATTTCCTAAGTCCTCAATATATCCGCCTTCTCTTTTTAAAATGGGCT
+CCTTTATTGTTACCCTATTATAAAAGTCATAGGTTCCATCTTTGTTTTTATCGTAGTCAG
+AACTAAACTCAACCCAATCGGCGTCAAAAGCATAGCTGCTTGATTTACTGTTATTAAACT
+CTTCTATAATTCCCATTACATTTAAGGTTAACTTTGGGTTTCCATGAGATATAGCAGCAA
+TATTAAATCTTGTATTGAAATTCTCAAGACTATAGCTATCTACTCCACTCACATTGTTGT
+CTAAATAATACTTAAAACTGTGTCCTGTATTAAAACTGTATGTTCCAATCTTGATATTGA
+ACAAATTATAAAGGAAAGTATAAACAATCTCTGCCCTTGGTATACTTGCACTTAGTCCAC
+CCTCTAAGTCTCTTCCCTCAATACTTACCTGCAGATTATTCTTTTCAATTGTAAATGTTC
+CATTTGAAACCTTCATCTCTACCATAAAAGTATGGTCTCCTGCCGTTACCTGTGGCATTG
+GAAGGGGCAATCCTATAACATTATCTCCTGATGCTAACTTTTGAATTGGCTTAAAATCGT
+AGTATTTTCCATCTAAGGAAAACAGAATTGTTAATGTGCAGTCTGCACTAGCTTTCCCTG
+TCATGGTGATATTACAATTTAAGTTTGTATCTGCTTTTGTTGTTATTCCTATAATCATTG
+CTGGATAGCTGCTAGTGCTGATTGTTATAGTATCGCTGTTTTTCTTGATTATTACACTGC
+TTAAAGTACCGCTTATTGCACTGTTTATTTCCTCTAAAAGCTTACTGGTATCCAGCTTTT
+CAATAATTGTGTTTAAAGGATCACCAAGCTCTATCTTTGTATTTATAGGATTTATAAGGT
+CTGTCTTTTTCTTTATAACTCTTAAATCAGTAGTTACAGCTATCTTTTCATTTCTTACCT
+TTACAAAATCACCAACACTTACTTTAGTAAGATGACTATAATTTTTATACTCTTCTGTCT
+TACTTAGCTCCATAAAATCTATTGTTATAAATACCTTTGGACTTGCAGCCTTTTCAGCAT
+ATTCTTCTGCCCTTGCTCTAAGGCTTTCTACATCCTTGCATTCCTTAAACTCAACCCTTT
+TGGTTATGGGATAGGGAAGTAATTTTGCTCTTTCTCCCTCTACTTCTATATATCTTTCTG
+GCAACAATAAATTATTTGCTCCTACTGCATATATCCTTGTAGCAAGTTCACTGGTATCCT
+CAATAACCTTCATTCCATTTATGTTTTTACCGTATTTTATTAAAATTCCATTGTTTTCAC
+CAATGGACTCTTTTATCTCTATATTAAAGTTATCTCTAAAAAGTTCTCCACCATAAATTT
+CAATAAGTCTAAAAATAGCATCTACTGCATTAACCTCTTTAACAGCAAAAGGTGCTAAAT
+TCTCTTCTAATGCCTTGAATAAAAACAACCCTTGAAGTTCGGGCGGTATGCTTGCTTCAA
+GAGCTTCTTTCATATTTGCATTAAGCACCTTTGCTGATTCTATAAAATAAAAGGCAAGAT
+CATAGAATATATGTCTTGCCCATACCTTAACTTTACTTATTTTATCCTGTGTTCTCTCTA
+CTTTATATATTCTAAAAAGCTGTCCATCAGCTTTAATAATATTGAGTTCCTCTAAATACT
+GTGCTTTTTTAGATTGAGCAGGGTATTCAATTTCTAAACTATAATCTCCATTTAACTCTT
+CATTTATCTCAGCCATAAGGCATTCATCTAAAACAGCAAGCCCATTATTGTCAAAGTTTC
+CTCTAGTTGTCTTCTTATCATATACATAGATCATTATAACCACCGCCAATTTGGAACAAT
+TTCTATTTTTGAAACACTACCTGTCCAATCAAATTTATTAGAACCTGTTTTTAATGTTAT
+GAAATCACCATTTACTTTACTGTTTAAGTTATCTCCTGCATCATTATAGGCATCTTGAAT
+GACTGAATCTAATATGATTTTTCCTGTTATATCATTCAAGTTTACAGTAGTTTCATTAAC
+CTTAAGGCTTACCTTCCCAGAACCATAAACTGATATTATAGGTTCACTTTTAAGTGTTCC
+TGGATTTATTATTGAAGCTCCATTTTCAGTAATAGTAAATATGTTATTCTGCACAGCGTA
+TTTAAAGGGTCTGCAATTAAATATAATTGGAAAAACAGATGTGTATTTGAATACTTGTTT
+AAAATCTATAGCATTAACTACTTGTGCTTTATATTTTTTATCATCTTGAAAACTAAATAT
+TAAATCACTTTCTCCTGCTGAAAAAAGCCATGCCTTTATATTATCTAGCTTTTCAGCTAT
+GTTATTACCTTTAATACTGCATTCAACTGCAATTGTTATATCTTCATAAGTTCCTTCATC
+ATATCTTAAGCTTGAGTCTCGCCCTGGAATATCAATATATGATACTCTTCTTTTAGGAGA
+TGGCAGAGATGGTCTTTTAGAAATAATAATGCCATAATCACTATAACTATTTTTTCCACC
+AAAATTGAAACTAAGCATTAAGCACCACCCCTTCCCATTGAAACTCTCTGCCTGTAAAAT
+TCAAGCTCATAGGCAAGCTGCTCTATATCCTTATCTGAATTATTAATGAAATTTTCTATA
+TGAAGTGTTAATCCGCTTCCACTTCCTCCTTTTGCTTTTTCAATTGCCCTTGCCATAAGC
+TCATCTAACCTATCTATAGGAAGTACAGCTTCAGTTCCTGCTTCACCGACACCGATTATA
+CTAGGTCTATTAAATATACCACCCTTCGCATACCAATCTACACCTAGGTAAGGTACACTT
+GGAGGTTTCAAACTAAACTCTCCCTCAATACTAAAATGAGGAAGTTTTATTTTAGGTATT
+TTTATTTCTGGTAAATGTAGATTGCTGAAAAATCCTTTAATTGCATTTATAGCATTACCT
+ACAGCATTCTTTGCTGCATTTATTGGATTTTCAATAGCTGATTTTATCTCATTCCAAACT
+GCTGAAGTTATTCCTTTAATGCCATTCCATATTCCTAAGATTATGCCTTTGATAAATTCA
+AATTCTGTTTTTATAGTTCCTTTAACTAAATCAATGGCTGATTTTATCACATTCTTTATT
+CCATTCCATAAGTCAGAGGTAAGATTTTTTATTCCTTCCCATACACCCTTCCAATCACCT
+TTTATTGCACTGGTAACTATTTTTATAACATCTTGAATGGCTTTAAGTGTGGTATTTACA
+ATAGTTGCTACTAAATTAAAAGCAGTTGTTATTATCTTTACAAAATCATCACCATACTTT
+TTCCATATTTGATTTGCTAAGGTAATAAAGGCTTGAAACATAGCCTTTAAGCTTTCAATG
+ACACCACTTATTAAAGCTTTAACTCCATTCCATACTGTATTTACTGAATTCCTAAAGTCC
+TCATTATTTTTGTATAAGGCTACAAAAATAGCAATAAGACCTGTAATAGCCGCTACTGCA
+ATGCCAACTGGACCAGTTATTGCTGCAAAAGCAGCTCCTAAGGCTCCAGATGCACCACCT
+GCTGCTGCCATTGCTCCACTCACTGTTCCAATTACAGTAGAAAGAGTTCCTGCAATACTT
+ATTACCTTACCTATAATCATGATTACTGGACCTATTGCTGCAACTACTAATCCGATTTTA
+ATAATTGTTTCTTGCTGTTCCTTTGATAGCCCTTGGAACTTATCTAAAAGAGGTTTTATA
+GTGTTCATTAGTTTTTCAAGTATAGGAATTAAAAGTTGTCCAAACTGAATGCCAAGCTGC
+TGTGTTTGCTCTTTCATAACTCTAAGCTTATTGGTTGGTGAATCCATAGTTCTTGCAAGG
+TCACCTTGAGCATTTTTTGTAGCTTCCATTATAGCACCATACCTTGCTTGAACCTTTTGT
+GCTTCAGTAAGCTGTTCACCCTGCTTTGCAATTCCATGAGAATAAGCATAGGTTTTAATT
+GTATTATCATTAACTAATATACCTAAAGCTTTAAGTGGTTCTGCCTCTCCACTAATACCA
+GATTTTAATTTCTCAAATGCCTCTTCTGGTTTTAAGTTATAGAAAGAAGCCATATCATAG
+GAAAGCTGAGTTAATCCTTCTGACATCTTTAATGACTCTTGTGAAGTTAACCCCATAGAG
+GTAAGCATGGCATTATAAGTTGCTACATTTTTTCTTACATTGAAAGCATTGAGTCCTAGA
+GCTTTTGAGGTTTCTTCTGACCACTTTCTTGCATCGCCTGCCATTGAACCCATAGCTACT
+TCAAAGAGATTTTCAGATTCCACTGCATCCATAGCCATTTTTGTTGCAGCAGTTCCTATT
+CCAACTAAAGGAAGTGTTACAGCAGTAGAAAGCTTACTTCCTATAGAAGACATCTTATCT
+CCTACAGATTTCATCTTTTCTCCTGCACTATTCATGCTTTCAGACAGCTTATACCAAGCC
+GAGCTTTTTTCCTTAAGTTCTCTTGTTGCCTCTTTCAGCTCATTCTCCATTTTATTTAGT
+TCTGCTGTAGCATAATTAAGCTTAATTTTAAGATTTTCAGTAGCCTTTGCATCTTCACCC
+TTTGTTTCTACACTCTTTTGATATGCTTTTTCTAATGCCGCAACTTTATCCTTCTGAAGT
+TCTATCTGTTTATTTAAGGTATCTGATTTAAGTCTTAGTCCTTCTTCAGATTTGCCAAAA
+TCACCAAGCTTAGAAGAAGCTGCTGCAAATTCACTTTGAACAACCTTTAGACTTCTTTGA
+ATTTTTGCTACACCTTCTTGAAAACCTCTATCATCAAGTCCTACCCTTGCAACTACGGTA
+TTTGCATCTCTTGCCATCATCTCACCTCCCTGCTAGAAAATAATGTTATCTATATAATCA
+AGCTCCTCTTCTTCCTCAATTCCATTTACTCTCTTGTATACATTAAAAAGCGCTTGTAAC
+TTCTTAGGTGTACTGTGCCAAAATTGCTCCTCTGTCATTTTTAAAAGGTTTGTTCCTAAA
+TAGAAAAGCCACTCCCAATCCCAACCTTCGGAATCAGTGTGGCTTTCTATTCCCCCATGT
+TTTCAGTTACTTCTGGCATTGCTATTACCAATGCTTCATTAATTGCAGTGCCTAATTTCT
+CCATATCACTTAAAGTTAACATTTTTCCTACTTCTTTTAAGGTTACACTTTCATCTGCAG
+CCTTAATTGCTGAATAAATAAGTGCTCTTATTGCCTTTAGTTTTCTATTCTGTAAATCTT
+CAAAAGCTTCATTGATATCTCCATAGATCTCTTCTAATTCACAGAATGTATTCATATCAA
+ATTTAAGTTCATACTCTTTGTTTCCTATAGTAATTTTAATACCTTTATTTTTCAGTTCTG
+ATGCTTTCATATAATCAGCTCCTTTCTGGATTTTGGGTATAAAAAAACAGGGATGCTTAT
+TTCCCTGCTAATTAAAAATACTTTAATGTTGATACATTAGTATAAATATTGTTCTTAACT
+ATGTATCAAAATAATTACTTAAGCTTTTGTATCTCTATAACTAAAATAAGGACCGCACCA
+CCCAGTTTCGTGTGTTTTTACATAAGTCCAGTTAAATTCTTTGTCTACAACATAAACATC
+AAATTCATTCAACAAATCATTTGCATTCAAGTTAGCTGCCTCTTCAACAATAAAAACATC
+ATCTGTATGTTGGTAAAAAATATAACAGGAATTTTTCCGTTCATTATTAAAAGCCGTTTC
+TGCTTCTTGCTCTTTCAAACAAACTCTTTTTTCGAAGCTGAATACATGCCATAAATATCC
+ACAAAAACCATCGTCATCGTACATAAAAATTTCTTTCTTTTCATTATGACTCAAATGATT
+TGCAAAAACATTCTCCCATTGCTTTCGTAAAAAAGTCCCCCATTTAGGAACTTCAATCAC
+CTTAATACTTTTATTTTTAAGTATCTCATTTATACTCATATTAAGTTCCATCTCTTCACC
+AACCTTTAGATTAACTCAATAATAAAATTGTAAATTTATCAGCCTTTTTTATTGTATTTA
+GGACGATATGCTAAGATAAAAGAGGATTCAAGTGCTTGTCTAGCAATAATATCAATTTTT
+TCATCTAACTTTATAATATGAATTAAATTACCTTCTTTAAACCAAGGTTTGTCCGACTCT
+TTTGGAGTATGCTTATAACATCTATCGTTTAATGAAGTACCTGTTTCTCCAATATATAAA
+CATTCAGAATTATTATAAAATAAGTATATGATATTTGAAACCGAAATTTCTTCTTTAAAT
+TTTTGTTATAAATTGCAATATTAAATGCCGTGCAAAATTTGGTAAATCCATTGCTTACTG
+GAATAAATTCTATACATCATACCGCCATTTCTATGGCTGACCTATAACCAAACATTCTTC
+TTGGATATTCATTAATCCATCTCTCTATACTTTTTATTTTTGCTTTACTTACTTTTGATA
+TATCTGTTCCTTTTGGTATAAATCTTCTTATCAGTTTATTAATATTTTCGTTCGTTCCTC
+TTTCCCAAGAACTATAAGGATGAGCATAATACACTTTCGTCCTGTCCTTGCCTGGCTCTG
+TTTTTGATTTCTCTATCCCTCTATAGTCCAAAAACTCTGTCCCGTTATCTACTGTTATCG
+TTTTAAACTTCTCCCTAAATTTCCTTCTATACTTCCTTTCTAATTCATCTATTGCTTTGA
+TTACTGATTCCTGCGTTTTGTCTGGTAGTTTAAGAATTATTTCTTCTCTTGTCTTTCGTT
+CACTTAATACCAGTAATACTGCTGCGCTATTTTTTCTGCCTACTACACAGTCCATCTCCC
+AGTGTCCATATTCCTTCCTATCGTTAACTTCTTTCGGCCTTTCCTCTATGCTGCTTCCCT
+TAAGATTTTTCAGTGCTATCTTCTTTACCCTTTGATATATGCGTTTTTTACCATCCTTTT
+TCACTGGCAAATATTTATTCGTTAGTCTTAAAAATACATCCCCTCTATCAATGTAGTTAT
+ATAGTGTTTTCGTGCAGATACTCGTTTTAAACTTCAGTCCCTTTGCTTTTATTTGTCCAA
+TAACAGCATCAGGAGAATATTTTTCATTTATTATCTTTGATTCTATATACCTCACTAATT
+CATGGTCATTTCCTATCTTTAACCGTGGACCTTTATTCTTCCCGTTCTCTACATATCTCC
+TTTGGGCTACATCTGCACAATACTCTTTTCTGTATGTTAAATCACTATTTTGTAAATATA
+TTGTCCCACGGGTTATTTCTCTTTCTATTGTCCTTCTGTGCCTGCCCAACCTCTTTGCTA
+TTTCCGTTACTGTATACTTTTCTTTTAGGTACAACTCTATGGCGTATCTTTCTCTTTCAT
+TTAGGTGTTTGTTTTTTCTTGTTTCTGTGTTATTATTCATATATAACTCATGGTACTCCT
+TTGCTAATGTTTTTCTTTGGTTATTAAACATTTTACAATGGATTACCATGAGTTTTCTAT
+ATATTACGGCATTTTATTTTACAACTTCCCTCTTTAAATTTTTGTATATCTTGTTTATTA
+GAAACTAGATTACAATAATTATATTTTACAGTTTTTAATTCCATTTTATCCCCCTTTGAA
+TTATTATTTTATCTTTTAGTTAAGTAAATATCATTACTTCAAAACATTCTACAACGGTAT
+ACTAACTACATATTTTATTATAACAAACATTTCCTTACAGTTAAATTAGCTTCATGTAAT
+ATTTTATGCTGTTACTACAGGCTCTTCAGGAACAGCAGTAAACCACGAACTAATAATTGT
+TGCATCTACCCCTTCAGCATCCTCATCTGCAATAAATCTATAATTACCATCAAAGTCCCT
+TGAATAAAACTTGCCTTTAAGCTTAGCACTTTGTGCCTTTGGCTTTTCTGCTTCAGTATC
+ATATTCATCTGTTGCAAGTTCAAACTTTCCTTTTAAAAGCCATACATACCTGTACTTCCC
+GTTATTTTTCTTAGATTTAAAACCAAGTGCTATAGTTGGAGGCATATCATCCTTGTTTTC
+TACTAATATACCCTTTACAACCTTTGATCCCTGCAGTTTTGCCCTGCTTGTAATTGATAG
+CTGATTTACTTCAATTTCTACATCCACACCTTCAAAAGCAGTTATTATATCTTCTACAGT
+ATCATCTGAATAAATATTTTCTGAATTTGATTTTGGAGAAAGTTTAGCACTTATTGCTCT
+TTCTAACTTTTCCGGAGTGCTGTAAGTAACACCAGTACTGTCATCCTTTGTTAAAACAGC
+TATATGAATATCTCTAAGCCCTATCTGTCTTGCCATACTTATTCACCTTCCTCTAAATAA
+TAAAATTTAAAGCCTTTATGATAGATTTTTGTATCTTCTTCATAAAGGTCTATTTCATTT
+AATCTTTTGAACCCTGCTTTAAGCAAAAGTTCTTTTATATTTTTAACTATATCTGTATAA
+TCAGCCTTTGACCACACATCTACTTGGATATAATGTGCTGTCAAAGCTTCTTCATCATCC
+TCATACTCTTCACCTGCAGTTAAATACTCATGAAAAGTAATATAGGTTTCTGTTTTTCCA
+CTATACTTTTGAAAAGCTACTGGAATCTTAAGAGGTTTCAATGTATCCATAATCAACTTA
+TTTATCATTCCTCAAGTCCCCTTTGCAGTTCTTCCTTTATAATATTATTTATCTCTCTTT
+TATTCTCAAGGACAGAGTTCTCTGCCCAATGCTGTGCAGGAATTTTACTTGTACCAAATT
+CAGTAAATTTTGAATAAAAGAACTCTGAATTATCTCCTTTATTAGGACCTATCTCAATAA
+AATCTACGCCGTTTTCTTTTTCAATATCCGAAACCTTTATATTATCTGCCATATGTCTTT
+TTGTCTTGTTTGACCTTGGAGCATTTTTTTCCATGCTAGTTTTCACTAAATTCCCTGCTT
+TATCAAGTGCTCTTTTCTTTATTACATCTCCTCTTGCACCCAGCTTGTTTACCCTGTCTA
+TAAGCTCCTGCATTCCTTCAAGTTCTATTCTAGCCACTGATATCAACCTCCATAGCCTTG
+ATTTCTATGAATTTATTGGCATATTTTATGTTATCAATTGAAGTTATATTGTACTGCTTT
+CCTTTAAATAAAATCCTCATTGTTGTTTCAATATTTGGTACATACCGTATAGTAAATTTA
+ACAGTATTTTCGGCATGAACAGCTGCTGCTTCAAAGTATTCTCTGCCATGAAGATTTGTA
+ACAGCCGCCCATAACTCTTTAAAATCTGTCCAAGTTTCAGTTTCAAAGCCATTATCATCT
+GTTTGAACTGTATTTTTCTGCAATTTTATTCTATGTCTTAAATCTTCAGCCTTCATATTG
+GAATCACCCTGTTCATAGAAAGAAGAGCATTTCTTGCTTCCTCTAACTTTGTTTTTTCCT
+CTGGTCTGTAATCATCATATAAAAGCTTCATTTGAAGTATCATTGCCCACTTTATTGCTT
+CAGGCACTTTATCTCCACTATCTCCATAGCCTGCAATTAATCTTACTCTTACTGCATTTA
+CTGACTGAAGTTCTACTGTAGGCCAATGCTTTCCTCTATTTAAAACAACTCTATTTACAA
+AGCCATCTAAATCAAAAATATAATTACTTTCATCAAATAAATACTCCTGTCTATTCTCAT
+CATAATATTTTATACTTTCCACCTTTTGTATCGGTGAGCAGCTATCAAAAACTATAGCAT
+TACCATTAGGGAAAGTATCCAAAACAAACTCTAATGTCTGAGTTATATATTTTCTATTTT
+GAAAGTTTTCACACCATTCCCTTGCCTGCTTTATAAGACTTTGTATTAGCAAATCATCAT
+CATTACCATCTACTCTTAAATGCTGTTTTGCTTCTTCTAAAGTTATGGGTTCAACTATTG
+GTGGATTTATTATTTTGATTGCCATCTTATCACCCCAAAAGAAAAGGAGCACTAAGGCTC
+CTTGATTTAACTGCTGTATCTGCTGTCTATAATAACATCTGCACTTGCAAAATTAGCTGC
+TTGAGAACTTGCCCCGATTTTAATTCCGATACAAGTAAATCCTTCATTTATATCAAGCTT
+TGCAGGATCTATTTGAAAAACAATCTGCTTATTTCCTGCTGTTTCTTCTACTGTATATCC
+TGCTCCATCTGTTTTTAATAAAGTATCTGCAGTCGTATTCTCATTTGCCCATACTGGTAC
+ACTGCTGATTAATGCCTTTGAATCTGTTCCTTGTGTATCTTTTGCCTGATATATGGATAT
+TTGTGTTTCATGAGCTGCTGCTTGAGTAAGATTTACAATTACTACAGCATTTACTGCATT
+TTTTAAATTTACATATCTGCTTTCTATACCTTCATTTGTTGTCTTTGGTGAAATGATCTG
+TATTACTTTATATTTTTCAATAAACATAATTTTTACCTCCTACCTATCTGCTAAAGTTAC
+AAAAGGACTTAGTGGATTTGCACCCTTGTAAGGCATAATTGGCTTATTCTTATAAGGCAT
+TCCATTGAACTTATAGATGAATCTGAATACCTGCTCATCATATAAAAATCTTACATGGAT
+AGATACATCAGAAGTTAAACCTTTTTTATCTATTCCAATATACTGGGTTGGGTCAGCTAA
+AATAATATCTCCCTTTTTACCAAGAGGTGAACACTGCTCTATTGGAATTATTGGTCTATT
+AAGTAAGGTACTGTACTGTGATGCTGCAGCTCCACCGGAAGGCATAAACACAGGTGCTCC
+ACCAGCTCCAATATTAAGAGCCATAGTGTAAAGCTGTGGTTCTATCTCTTGATTTATATA
+CCATACTGCATTTGCTCTAAGTCTTGCAGGCATTGAACTCCACATTTTAAGTATATTTTC
+ATACTTAATTGTTCCTGCTCCTTGATCTTTTTCCTTGGGTACTGTAACTAATGCATCAGA
+GTTTAATATTCCAAGGGGCATTCCAACACCAGTACCATTAATGATTGCATCATCTATTTT
+AAAACTCATTTCATCTGCATAAGCTTGCCTTACTATAGCTTCAAGTGCTGTAGTATCTTG
+TAAAAGGTCATCGGTTACATAGCAAAGTGCTAAAAGCTTTTGAAGTGACATTTCAATTTC
+CCTAAACTTTGGCTTGCTTTGAGCTGCTGTTTCTGCTTCAGCTACCCAGTAAGCCTGTAC
+ACCTCCCCATCTTGAGCCATTGGCTCTGCTGTTTTCATCAATTCCAAGCGCCCTAAGTCT
+ATTGGTATTAGCCCCTATTGGTATCATTCTTATTCTGTTTGCCACCTGACTTTGTGCCAT
+CATGGATTCAAATAAGTCATTTATAAACTCATTTTCTAGTAAAAATCCTCCTTCTGAAGC
+TATGCTTTCATTAAGTCCTGTTGCTGAGTTCTGATAAGTTAATCTGTTGTCCATTCTTCC
+TCCGGGAGATGAAGCCTTTGCAACGGCACTTAAAAATTCTCCCATGCACTTCCACTTCTT
+TTCATTGTGATTCTTTGGCTGAGCATATATTGGTTCATTCACTGGCGTCTTAGCCTGTTT
+TTCTCTTTCTGCATTTAATGCATCAATTTCTTTTTGTGCCTCAATTTTAGCTTTTAAAGC
+CTTAATTTCAGAAAGCTTTGCATTAATTTCATCAGCTGTAGCCTCCTCTTTATTTATAAG
+GTTTTTAGATTCTGTTTCTAAATTTGATAACTGAGCTAATAATTCTTTCATTTTTTCTGA
+CATATACATTACCTTCCTTTCAAAATAATAAAAGCCCTAAAGTTCACACTCTAAGGCAAG
+TTTTGCTTTTAATAATTTTATTTTTTCTTCATCTTTATAGGTTTCTTTAAACCTTTGATT
+ATACTGTTTTATAAAATCTCTAGTCCTGTTATTAACACTATTTTGAATAGCAAACCTGCT
+GAACATAAAAGAATTTTCCAATGGCTCTTCTTTATTCTTTTCATAAAGCATTCCATCTGC
+AAATCCTTCAGCTACAGCTTTTTTTGCACTCATCCAAGTTTCCTCATCCATCATCTGAGA
+TATTTTTGCTCTTGATTTGCCTGTTTTAAGCTGATAGGCATTAATTATAGTTTCCTTTAC
+TTCATCTAGCACATCAGCTCCATGCCTTAAATCCTTAGCTTCACCTTGAAAAGTTCCCCA
+GGGGTTGTGTAGCATTATTATTGATGTTGGAGACATAAGTATTTCATCTCCTGCCATAGC
+TATAACTGAAGCTGCTGAAATTGCCACACCATCAATTTTTACTTTAACCTTTCCCTTGTG
+TTCCTTTAAACCTGTGTAAATTCTTGAAGCTGCATAGACATCCCCTCCATAGGAATTGAT
+CCAAACATTTATGTCTTTGCCTTTATATTTATTTAGTTCTGACATAAAACCCTTTGGAGT
+TACATTGTCATTTCCAAATAGCATCGACCAAAAATCATCGTCCATGACAATGTCACCATC
+AATTCTAAGCTCTATCTCCTCCTCATTTTCTTCGCTGTTTTTAAAATTCCAAAACGGCAT
+TTTATCACTTCCTTTCATTAATCATATTAAATATTTCTTCCCTTAGTGCTTTAAGCTGCT
+CTTCCTGTTTTCCTGCTTCGCTCATATTGAGAGGTTCGAGATATCTGTCACCGTTATCAA
+TAGGATTCATATTTTCAAGCCTTCTAATATCATTAACAGAAAGCCATCCCCACTGTCTTC
+CTTGTGCATAGGCTTCATATCTTGATTTAATATCTCCACGGAGTAGTCCACTGATATTAA
+ATTCAAAATATCTGTTTTTTCTTCTTGATTCTTTTGATAAAAGCTGAAGATTTAAATTTT
+CTTCCCATTTTTTAAACCACGGCAGCATAGTGTAAACAATAAACTCTAAGCTCTGATGTT
+CAATATTGTTATTTGTGGATCTTGTTAAATCCTGCACCAGATGAAGTGGTACTCTGAAAA
+TTCTGCACACATCTTCAATTCTGAATCTCTTGGATTCTAAAAACTGTGCATCTGTAAGCT
+TCATGGTTATTTCCTTAAACTGACCGCCGCCTTCAAGAATCATTGGAACTCCTGCATTAG
+AAAGTCCTGTGTAGTTCTTCTTAATATCCTTTTTAAGCCTTTGAAATGCTTCATCTGAAA
+GCTCGTTAGGATACTGAAAAATACCGCTGGTTGAAGCCCTGTTATGATAAAAATTTCTTT
+CAAAGGTGTCCTGAGATAATCCAATATCAATAGTAAGTGCCGCATAACTAAGAGGTGTTA
+TTCCTATATACCCGTCTAAAGTGAGTCCCGGAATATGAAATATTTCATCTCTTGTTTTAG
+GTTCTTGCTTTCCATCAATATAATAAAGAAGCCTTCCTGTAGATTTATCTATATCAATTC
+TTACTCTGTCCCATGCTATTGGTCTAAGTTCTAAAAGCTCTCCATGCATATTAAAAACCT
+TTTGTGCTATAAAGTTTCCCCCAAGGTTTATATTTGTCATACCAAACTCTTTAAACTGCA
+CTGGTGTCATTTCTGCATTTGGTGCATAATGAAGTACACCATATTCAGCAGTATCTGTAA
+CCTGCCTTCTGTTTCCTTTATCATCTTTTTCATAAAGCATTATAGGACAGCTTGCCAAGG
+TTTCAGAAAGGACTCTATTGCAGGCAAAAACTGCAGAAAAACTCATAGCCGCTGCTGTAT
+CTATTTTAAAATTATCTTTTACAACTTCTTCACCATTTAAAAAATCCTCCGAATATTTCT
+GAAGGACTTCAAACAAGGCATTCTGGGGCGTTAAAAATAACTTCACTCTATCTTTTAGTT
+TCAAAGCACCACCTCCTAATCAAGAAAACTTCTCATTCCTCTTTTTTCATAGACACTTTC
+TTTATTTTCATGTCTTATGGATCTATCAAGTGCCATAATAAGTGCTACAGCACCATCTAT
+CTTTTCAGTAGACTTTTCTTTATCAGGCTTTATATTGCCTGCAGGATCAGTTTTTACATA
+AATATTATCCATCATCCACCTTAAAACAGGATGTCCTCCATGGGCTATTTTCTTTTCAAG
+AGTAATTTTCATAAGCTCCTTTGTAGGAGGAGACATATCCTTATACCCCTGCCCAAAAGG
+TACAACTGTAAAACCCATTCCCTCCAGGTTCTGTACCATCTGCACAGCACCCCATCTGTC
+AAAGGCAATTTCTTTTATGTTGTATTTTTTCCCAAGCTCTTCAATAAAGGTTTCTATATA
+GCCATAATGAACTACATTTCCTTCAGTAGTTTTTAAGTATCCCTGCTTTTTCCAAATATC
+ATAAGGTACATGATCTCGTCTTACTCTTAAATTTAAATTATCCTCTGGTATCCAAAAGTG
+AGGAAGAACAATATATTTTTCATCTGATGTTCTTGGAGGAAATACTAAAACAAAGGCTGT
+GATATCTGTGGTACTTGAAAGGTCAAGTCCCCCATAACACTCTCTTCCTTTTAAACTATC
+TATATCAACTTTAAAAGCACACTCATCCCACTTGTCCATCTGCATCCATCTTGTGGACTG
+CTTCACCCATTGATTTAATCTAAGCTGACGGAATATATTTTCTTCAGCAGGATTTTCTTT
+TGCACTGTTAAAGGCATTTCTCACTTTTTCTATATCTATGGTATGCCCAAGAGAAGGGTT
+TGCTTTATACCAGTTTTTCTCTAATGTCCAATCGTCATTGTCATCTATTCCATAAATAAC
+AGGATAAAATGTTGGATCGATTTTTCTTCCTTCTAATATATCTACTGCCTTTTGATGTAC
+TTCATAGCATATAGAATTTCTATCTGTTCCGGCTGTGGTTATAAGAAAAAACAGCGGCTG
+CAATCTTGCATCACCACTTCCTTTAGTCATAACATCATATAAATCCCTGTTAGGCTGAGC
+ATGAAGTTCATCCATTACAACTCCATGAACATTAAGTCCATGTTTTGAATAAGCTTCAGC
+AGATAATACCTGATAAAAGCTGTTTGTAGGCTTATATATCAATCTTTTTACAGAAAGAAC
+AGGTTTAATTCTTTTCTTAAGAGCAGGACACTGTTCTACCATTTCAACAGCTACATCAAA
+AACGATAGAAGCCTGTTGTCTGTCTGCAGCACAGCCGTAAACTTCAGCTCCCCATTCTCC
+ATCTCCGCAGGTCATATAAAGAGCAACTGCAGCAGCAAGCTCGCTATTATGTGTAGGAAT
+CATGGATTTACCTGCTAAATATAATCTTGATGGGCTGTCAACCTGAATACATCTCATTTT
+TGTCTTTCCTGTTTTTTCAATAGACTTTATATAATGAAAATGTGATCTTGTTTTAATATT
+TCTTTCTCTGCCTCTTTTAAGCTTTCTATCTAATCCTGATACTTCTAAGTCATTAAAAGC
+AGTAAACTTTATTAAATAACATATTTCACCTGTTTCAATTCCATATCTAGCTGATGGAGC
+TGTTTTTAACGTATTCTTTATTCCCAATGACCATAATAAATCCTGAACATCCTTGGCAAG
+TTCAAAAAGAATTGTCACATATATTGCCTGGCTTTTAGCAGTGCTTACACATCCATCAGA
+ATCTATTAACCCTTGTAATAATCTTTTTCTTTGCTGAGCTGATGCTCTTAAATATTCAAT
+AGGTATCCTTTTTTCCCTAAAGTTTTTAACTAATATACTTTTAAGTTCTTTATATACTAA
+AATATCGCTGTTACCCTCCTGCTTATATCTATTATGAAGTTTATATGGTATATTTTTAAT
+AACTTCGTCAACATCATCTCTCATTACAGTTATTTCAGGCTTTACAGCATTACCATTTCC
+TATCCAGTACCCAAATAGATACGGATCTATAGGAAGTTTATTTTCAGGCAAAATAAAAGC
+ATCCGCTATTGGGATGCGAAATAATGCTCTATTTTCTTTACTTTTAGTTTTAAACTGCTT
+TTGATACATTTCTCCTGTTGTTAATAGTTTTTCTCTTCTGCCATTATTAGTAACTTGAAC
+CTTCCATAGATGCCTTTCTCCAGCTACTATACTTGTTCCATCTCTAAAATTTATTTTATA
+TGCCTGCTCCGTATCATCAATTTCACTTATTGCAACAACATTACAAGGTCTTCCCTTTTC
+ATCAATTACCTTATCTCCTGCTTTTATTTCCCCCATTGTAGTCCATCCATCAGGTGTTGG
+AATCGGAGTATCAAGGGCTAACTGTTTTCCATTTTTCTTAGGAATTTCAACATAAGCAGT
+ATTATACTGCCTGTATCCATTTTCTTTTACTGTTCCGAATATATCCCTTATAATTTTATC
+CTGCCAAGGCAGAAGATCAAAAGGAACACCACGCCACTGACCCTTTGTATGCTTTAAGCA
+GTTAATAAAGTTTACGGCATGCTGTGCTTTTGCTTCATCATACACTCTTACTGCCTCCTT
+TATAAAGTATAAGTTCCATTGGATCTTCTTCATCATTTATATTGTCAGTGACTATTCTGC
+TTCTTGCTGATGGAGTAAGTCCAAACTGTTCGCAGAATCTGTTCATGATTTTAAGGTAGG
+TTTGAGCGATAGATACCTGTGGCACCTGCTGCCAGTATCCCGATGGTGTTTTTACAATAG
+TTCCATGTTTAGTTATAAATTCTTCTGCTTCCTTCCACCTTGCATAGGCTTGACAATATC
+CTGCAAAGGCTGCCATATCTATTTCTGTAAGTATTCCCATTGCCTCAAGCTGCTTTGACA
+TTCTCCTCCACTCTTTTTTAGCTTCAGCATCAAGCCAGCCTGGACATTTAGGTGCTTTTT
+TCTCAGGTTTTGGTTCATCTTCATTAAGTGGTCTTTTCCCTGGATTTCCTTCAAGTATTT
+TTAATGCTGTTGGTTTTGGTTTTCTTCCCCTTTGAGCCATAGGTATCACCTCCTCTTTTG
+GCTAACTAAAAAGAGCCTACAATCGTAGACCCTTAAACTTATTTTCTTTTTCCTTTTATA
+CCCTTGTAGTTGTAATTCCCTTTCTTAACTTCTTCATATTCAGCTTCTACAGCTTCTTTA
+TAATCACTACGTTTCCTTTCCTTTTCCTTGCAGCTTAAGCAAATGCAATCCTCATTATAC
+ATTGACATTATTCTACCCTCTTTTAAGCTTTCTCCACAGCGATCACAGGTTTTCTGAGTA
+AAAAATTTATCCATTTATTTCAGCACTTCCTTCCTGTTGTAATTTTCTAAAAGCACAACT
+GCCTTCAAGATTTGAAAGAAGTGTTTTCCTTATATCTTTATACCTACTTCCATTCATGCC
+AAGGCGAATGAGCCAAGTTCTGAATGCATATTTAGGGTTATCCTCCTGAGCCTGCTTAAA
+AGAGGTGTGTTTTAATTTTTGTGCGTTCACATTTATTAAAGATGCAAGTTCTATAAATGC
+GGATATTTTTTCATGGCTTAAGGTTTCACCTAATAGCTTAAAGGTAAAAGTTCCTTTCTC
+AAAATCAAAGGATATGCCTTTGCAACCATCAGTTCCAACTTCAGTAATAGCATTTTGAAA
+TTCTTCTAAAGTTTCTGTTCTCTTTAAATTCAAATTCTTTATAAAGGTTTCCTCAATAAA
+AGGTTCTTTTAATTCGAAGGTTTTAACAATTAGCTGCTGTTTACTGTAAAGCATATTTAA
+AATATTTATTAGCGTTTTTCCCGTATGCTCTCCTAATGGAATTTCTAAATTAAAACTATC
+AATAGTTGTATCCTCTATTTTTTCTTCAGAATCCTCTCCCTTTAAAATTTCGTTAAGTGT
+AACAACCCTACCTTGCGAAGTTATAATGGTTCCCTGCCTATCTATTGTGTAGATTTCCTT
+TTCCGTTTTAATTTCATAGGCAAAGCTTGGTGCTCCAAGATACTTTGCTTGAGAACCTAA
+GGCTTCACTTAAAATTTTAACTATTTCTTTTCTATCCATCTTCATTCCTCCCTGTGTTTT
+GGTAGTTACATATATCACTCTAAACACAGTTAATAGCAAGTACTTTGTATAAATATTTTA
+AGAAGAAAACAGGCCCTTCAGTCTGCTTCTGTCTAATTTTCAATCGCTGTGTACCTTGGG
+TAGGTGTAGCCTTCTGAATCTACTAAAATGCTTTTCTTTGTTTTTGTGTTCCTAACCCTT
+ATGCATCTTAGCTCTCCTTTTTCGTTGCAACCACCATCTTCTTTGGTTATCCAAGGCTGG
+TCTTTGCAGAAGTCTTTTGCAAATTCTTTAAATTCCTCATCTCTTAGTTCAATTTCTTTT
+GTAACTTCGTAGGCTGTTCCTTTTACTCCATCCTTCTTAGCTTCTTTTGTAAGTTCTTTA
+AGTTCCTTTAAATTTAAAACCTTTCTTCCAAATAATGCTATCATTCTAAAACCTCCAAGT
+GTGTTTTTGTTATACTATATATCACTCTAAAACACACATATATCAAGCTAATTCTTAAAG
+TTTATATCTATTATTTTTGCTTATAGCTTCAGCACTTACTTTCAATGCTTCTTCAATAAA
+ACCTATATCAAAACCTGAAGATGTATATCCTTCTTTAACTATTCTTAGATACCTTTCACT
+TGGAAGGTTTAAGTTAATCCTATCTTTTATTTTATTGGTCATGATGTACACCATAGCAGT
+TACTATTTCTCCACTTTCAAGCTCCACCTCTAAATCTTTTTTATAATAAAAGTTTGGGAA
+ACCTTCGTAAATGTCTAAAGCTTTCTCATCTTTAGGTTTAACCTCCCAAACAAGTACTGG
+TACCTTTCCACCCTTAAAAGGTTCAATAGTAGCATAAGCATTATTAGGTACTCCTTTAAA
+AAGCAACCTAAAATCCTTTAACTCCCCCTTGCCATAAACCCTAGCCGTAGGACATCTTTT
+TTCCATCTGCTGAAGATTTAAGTTTGAACCATAAGCAATATACAATCTTTTCATCTATCA
+ATCCACCCTTTCTGAAAGCTTCTAATTGGGCCACAGTTCCCCTGTATTGCCTTAAGTTTA
+ATTCCTAGCCCATTAGTTCCTTCTACTACCCTAAGGGCGGTAATTCCGCCCTGTGGCTTT
+ATGAAGCCAGCCGCCTATCTATGCGGCTCTCTGAAATCTCCAAGCTGCTGAGCCTTGAAG
+GTGCTTTATAAGGTGTTCTCTGCAGTTTTTGAATTCTTCACCTATAAAGCCTATTCTGTT
+AAGCCAGGTCCTCATTGCAAACTTTGGATTTTCAACCTGTGGCTTTTTACTGCTTGCACT
+CTTTTGAGTAAGGGCTTGATGGTTAAGTGCCAAGGCTAAAACTATATTTGACCTAATAAC
+TCCTGCGTGCATGGTTCCATTAAAACCTCTAAGTTCAACTGTTCCTGTTCCGTTGAAAAA
+GCTGTGTAGGTTTAAGAAGTGGTATCTGCTTTCATGGTAATGCCTTTCTCTATTTGAACC
+GTATCCCTCGTACCAAATATCCTCAATCTGCTTCATGGTAGTAGGCTTTTTCTTGTTTAT
+CCTTTCCACCAAATCTGCATCCATCTTTTTGCAGTATCTCATTCTTTCTCTCTCAATCTG
+AAGGCTTTCATAAAGCAGGTCATTTCTTGAGTAGATTATGTTTATAAAGTTTCTAATACT
+TCTTGGTGTATGGTCAGCTCCATCAAGGTGTATGTGAATCCCTGTGCAGTTTTGCTTTTC
+TGAAAAGGCTCCTGCTTTTCTAAGCTTTCTTACTATCTCCTGCAAAGTTTCTATGTCTTC
+TTTGTAGGTAAGTATTGGACTTACTAGTTCTACACTATACTCTTTTGTAGCTGCTACCTT
+CTCGTCATTTACTTTCTTTTGGGTGTAAATACTTCCGTCATACATAAGCTTCCATACTCT
+TCCGTCTGCTGCTGTTACCTTATAGGTATCATAATAATCATTTTCTCTTTTTATACTTCC
+TCTTAAAACTTCTGCAACAACCTTTGCGGCCTTGTTTCTTGTAACTCCTGTCATTTCAAT
+TTCAATTCCAAATCTTGCTTTTAAAAAATCTGTGTTTTGCATTTTTGTTTCCCCTTTCTT
+AGTGTGTTTTTGGTCATGTACATATATCACTCTAAAGGGGAGTAATAGCAAGTATATTAT
+CAAAGATTATTAACACTATTTTTATTTAATAGATTGTGCTACTGCAAAAGCTACATTTAC
+AGTTACTGCATTACCTGCCTGCTTATATAGCTGAGCATCTGAATTTACAGCCCTTGCTTT
+TTCAAATAATTCATCTGGGAAGCCTTGAAGTCTGAAGCATTCCTTTGGTGTAAGCCTTCT
+AATACGGTAATTTTTGTCCAATGTAGCCATTTGGCATCCTGTATCTAAAGTATTTGATAT
+ACCTTTTCCAACCCTGCCTCTTCTTGTTTTTGAATTAGGTACTGAAATATTTATGCTGTC
+TCCAATCTCAGCTTCAGCATAGCCTTTTTTTGTGGCTTCTTTAACTGCAACTCCATGTCT
+GTCCTGACTTGTTAAAGTAAACATTGGTTCATCTGCATTTTTAAATCTCCTTCCATTCTG
+ACGTTTATTTTCTCTTTCAGGAGTTATAACAGCCCTTGCTTCAAGAACAGCATTTTGTGT
+TTGATTTCTGTTTAGTCCTCGCCAATCACTGGCACTGATTGTATGTGCTATTTTTATTTC
+ATCAAGAATACCATCATTTCTATTAAACTCAATTGGAACACTCTCTAAAACTCCGCTATT
+CATTGCAGTTCTATTAACCACTCCTGCTGTATAACGTGATGTAATACATCTTGATGTATC
+TGTGAGCTTTGGCTTTGTGTAAGACTGGTCTATAAAAATTTTGCTTCCTTCGCCCTTATT
+AGTTGTAACTGCTGGAGCAATTCCTTCTGATGAATAAACATTTCCATTCATACCTTTGCC
+GCTTGGATTTATATTTCCTACGCAGTAAAGACCAGTCTTTGCTCCTCCACCTCCACCACA
+ACCTGTAAGTGTGCAAGCTACTCCTTCTGCATCATAAACTCGCTCACCTTGACAGCCGCC
+TATAATCTGCTTAAGAGCTGCTGTGTTTTCTCCTCTGACAGGTAGTATTTCTCGTCTGCC
+TCTGCTTCTAAGATTTGCAGTAATGAACACACGCTCTCTGTTTTGGGGTACTCCGAAATC
+TTTAGAGTTAAGCACCTGCCAGAAAGCATCATACCCTGCTTCATCCAGCTCAGAGAGAAC
+GGCTGCAAAGTCCCATCCGTTATTAATTGACAGCAGGTTTTTAACGTTCTCAATAAGAAG
+GTATGAGGGTTTATCTTTTTCTTCTTTGCCTTTGATAAGGTCAATAATTCTAAAATATAA
+GCCGCTTCTTTTTCCTCTGATTCCTCGCTGTTTTCCTGCAACTGAGATGTCTTGACATGG
+GAATCCAAAACACCAGATGTCTGCATATGGGATATCTTCGCTTTTAAGTTTTGTAACGTC
+ATCTGCATACCACTCTCCTTCCGTATCAAACATTGCTCTATAGCTTTTAACTGCAAATTT
+ATCTTTTTCACAAAATCCTATACATTTATGTCCTGCAAGTTCTAACCCCAATCGAAAGCC
+GCCTATTCCTGCAAAGAAATCAAGGAAGGTCATATTAATCACAACCTTCCTTTTTTATAT
+CAGCATATTTAATTTTAACTCCATCTCTAACTAAAAATACTTCTTCATCTGTACCAACCT
+GCTCTATATATCTTTTTACAATAACATCCGCATACTTTTCATCAAGCTCTATGGTATAGC
+AGATTCTATTAGTCTGCTCACAGGCAATCAAAGTAGAACCACTGCCGCCAAAAGGGTCAA
+GAACAATACAATTGCTCATGCTGCTGTTTTGAATTGGATAAGCACAAAGAGCTACTGGCT
+TCATTGTTGGATGGAGAGCATTCTTAGATGGTCTGTCAAAGCTCCATATAGTACTTTGTT
+TTCTATCAGAGTACCAATTATGCCTGCCTTCCTTCTTCCAACCAAAGAGTACAGGTTCAT
+GTTTCCACTGATAAGGACTTCTGCCCAGTACCAAGCTTTGCTTTGCCCAGATACAAACTC
+CGGATAAATAAAATCCAACAGCTTTAAAAGCCTTTCTAAAGTTTAATCCTTCTGTATCTG
+CATGGAATACATAAATTGAAGCATCTTTCTCCATAGCATCATACATATTAGTGAACGCCT
+TATAAAGGAAATTATAAAACTCCTCATCTTTAAGGTTATCATTTTGAATCTTTCCGGCTT
+TTGCTTCATATGCAACATTGTAGGGAGGGTCTGTAACCACTAAATTAGCTTTTTTACCAT
+CCATTAAAGCCTCATATGTTTCAGCTTTAGTACTATCCCCGCAAATAAGCCTGTGCCTTC
+CAAGCAGCCACAAATCTCCCTGCTTTGAAATTACAGGTTCTTTTAAAGCATCTTCAACAT
+CAAAATCATCTTCTTTTATTTCCTTGTCATGAACATTGCTAAACAGTTCTTCTATCTCCG
+GCGGTTCAAAACCTGTAAAGGAAACATCATAATCTATACTCTGCAAATCCTTAATAAGCT
+CAGCAAGAAGTGCTTCATTCCACTCTCCGCTTATTTTATTAAGTGCCACATTCAAAGCCT
+TTTCTTTTGTTTTATCTATATCAATAACAACACAATCAACTTCTGTATAGCCTAAGCTTT
+TTAAAACCTTCCATCTTTGATGACCGCCAATAATTGTAAGGTCTGAATTTACAATAATGG
+GATCTACATATCCAAATTCAGTTAAACTGTTTTTTATCTTTTCATATTCCTTATCACCCG
+GCTTTAAATCTTTTCTCGGATTATATTTAGCAGGTATAAGGCTGTCTATTTTTAACTTCC
+TAAACTGCATCTTCTTAAACCTCCCCAAACCTTGATTTTATATAGCAGCTGTGACTGCAG
+TATTTTCTGTTTTTATTTCCATAAGAGCTGAACTCTTTCTGGCAATAGACACAGGTATAT
+TTATAAACAGCTGTATCCTTTTTGTTTCTTTTATCTTGATTGTTTTTCCACCAGATTCTC
+CTGCATTCTTCAGAGCAGAATTTCCTTGTTCTCCCTTTTCCCTTTTGTTTTAATTTCTTA
+CCACAGTGAAGGCATACAAGATTCTGCTTTTTCATCTCTTCAATGTTTAAACTTACTACA
+GAAACATCACCGCAAAGACCATTCCTTTTACAGTAGCTTTTTACTGAATCTCTTGATAAA
+CCAAGAACTACAGCTATCGCTTTATATCCCAGTCCTTTAAGTCTTAACTCATGAATCTGC
+TGTTTTTCAACTTCAGTCAATTCCTTTATGCCTCCTTTCCTTTTGCGATGAGATTAATGT
+AAAATCTTAAAAAAATGCCTTAAAAACACTTAAAAATCACTGTTTAAACTTGATTTTTGA
+ATAGTTTTTATATAAACATCAAAAGCCTATAAATCCTTGTATTTTTAAGGTTCACAGGCT
+TTTATCTTCTGATTTTTTATAGATACTTATCTGCAAAATATAAAATAGCTTGATTGCTGA
+TTTTCCAATGGTTACAGTTGATTTTTTATGAAATATATGCTACCCCCCTTATCAAATTCT
+GCGAAATTTCGTGCGAAGGGAGCCGCCCGACGTAGGGGGTTCAAGTGGTGAGGATAATGA
+TGCCCCCTACCCTTTGTTGAAGAATTATCAACAGATTGTCCACAGGTTATTAACATATCA
+TTGTTGATAACTTTAATAAGAATAGACTCGTCCTTTCCTTCCCCATCTGCCGTCTTCCTT
+AGCAGTCTTTCTATCATGACAGCTTTTGCATAAACTCTGCCAATTGCTCTCATCCCAGAA
+CAACCTTTCATCACCTTGATGTGGTTTAATATGATCCACTACAGTTGCAGCAGTAACAAT
+ACCTTTTCTTTTACACTCTTCACACAGTGGGTGTTTATGCAGAAACTGTTTCCTAAGTCT
+TCTCCACCTGCTACTGTTATAAAGGTATCCATAGGGTCTGCAGTTTTTATTGTAGGTTTT
+ATTTATTTCCTTTTGATGTTTCTCACAGTATCTGTCGCAGGTAAGTTCAGGACAGCCAGG
+ATAACTGCAGGGTCGTTTAGGTTTTACTGGCATATATATCAGTCCTCCCAAGTTATGTTT
+TTACATATGAAAACCACCACAGTTTTTCTGTGATGGCTTCATCTGTTTTTTCACTTCGTC
+TATTATAATACTACTGCGGATACAAGGGTGTCTTTCAATGTCTTTTAGTGTCCTCTTTAA
+TAGATATCTAAATTCTTTTTTCCTAATTATAATTTAATCAGATTTTAATACTCTCTTTCT
+ATCACATTTACTCTCATCTTTTGTTTTTATTCTAAAAATTTCCGTTTTTAAAATAGTTTT
+TTTAATTTTTTTACAATCAGAACAGATATAATTATAATTTGGTACATAGTTACATGACAT
+TACTTCTGTACCACAAAATATACATCTAGGGTAGTATCTAGCTTGTTTACCTTTTTGTTC
+AATCCTAATCCCGTCTAACAAAGCTTCTTTATAACTCATCTTTCTAATCCTCCAATTATA
+ATATAAACACATTTTGATACTCTCTTTCTATCACATTTACTCTCATCTTATGAAATATTT
+ATTTCTTTTAAAGCTTTATCATGAATACGAAATATATGCTGTAAACTGTATCCCATATCA
+ACAGCAATCTGTTCCCATGTCTTAAAACAGAGATATCTAAGTTCCAATAGAGTCTGATAT
+TCTGTATTATCTATTTTTCTAATAACTGAAACAAACTCCCTTTTTAAATCCACAAGAATA
+TCAATATCTCTATTTATTTCATTTTCTAAATCAACTATCTTAGCTATTATATCCTCCATA
+GAATGCACATTACGAGTTCCACTAGGTGGTGTATCGCTTAAAGTAGATGTTGCCTTTGTA
+GCTAATGCCCTTAAGGAAATAATCTGCTCTAACTTACTATTAATTCTTTGGTCTATATGA
+TAAGCCTGTGATAAATATTCTTTGGCTGTCATGCTAAATCTCCTCCTTTAGCCAAGGCAT
+TTTATTGTCATAATAGGACTCTGCAATATGCATTTGTGTACCTTTATCTAAGGATTTAAT
+CCTTTTAAAAGTTAGCTTCTTTTCCTGCTGAAGCTGCTGCTTAGTTTTATAAAAACTACA
+ACTTAGGTCATCACATTTTCTAACATTTAGCACACTGCACTTACCTTTTCTTAAGGCAAA
+ACAACTATTTATTGTTTTTTTCTTTTTTAATTCCTTTATTCCATTCCCAACAGCCTTTGC
+AGCTGTAGGATCTGAGTATGCTTGTCTATCGCTCATTTACAATTCCCCCTTACTTAGGGA
+GTACATGATACCTAGTTATATATATATATTTCTTTTTTATATAGTAATATTTTTATATAT
+ACTATATCTTATTATATAAAGGGTATATACATCTTGGACATCTTGTACCCCATTGATTTT
+ACTACGTTACAATCTTGTACTTATGTTGAACTCATATAGAACCCATCTTGTACTTACATT
+TTCACAAATATCCTATATTTCTTCCCATCAATTTTTTTATCTATAGTTTTATAACCGAAC
+CTCTTGGTAATCTGTCTTGAAAATTCTATATGACTAAGTGGCTGCAGATTATTATTTAAA
+CAAAACTCCAAATAATTCTTATAGACATTTTTCGTTGGCTCATTTTCTACTTTTGTTTCA
+TATTCTTCATAGAATTCAATAATTGGATTGTTGGTCTTCTCATATTCTTTAAGCTCATGC
+TCCACTTGTATGGATTTTGTGAACTTTTTATTTTGTAGGATTCTTTTAAGCCCCTTTAAA
+CCCAGTAAAATCAAATATTCCATGGACTCTTTTGTCCTTAATTCATATTTAATATCTGGT
+CTGAAATCAGGATCATCTGCTGTAAACTTTGCCTTAAACGGAATTATAAGAAGTCTTCTT
+TGGACAGCTCCTGTTTTATCCTTAACCCTTGGAACATTATTGGCTGAAAATAAAAGCTTG
+GAGTAATTATTAAAATCAAAAGGGTCTTTGCCTTTCCTCTCTGCATTAACTCTATCCCCT
+GTAACAAGCTTCTTAAACATTGAAGGCTCTGCAATAAATTCATCTCCAATATCGTCACCA
+ATATTTGCAAGCTTTCCAAATAATTCTGCTGTTTTAAATCGCTCTCCCAACTCCTTTAAA
+TCAAGAGCTGCAATATTAGAAATACCTATAAGTGTAGTTACCATATCCAAAAATGTTGAT
+TTCCCATTTTGTTTTTCACCAGTTAAAATGAAAGCTTTTCCAATTTCATTTCTTCTATAA
+AATGTGTATCCTATAAGTTCTTCAAGCACACTTCTAATTTCAGCATCATTGCAGCTGATT
+TTATCTAAGGTTTTATCTGCTAATTCAAAATAAGCATTTGGGTTATAATCCCACGGAATT
+CTGTTAGTGATGATAAAATCTGGAGAATGTTCTGTAAAAGAATCATCTATTATGTTATAA
+ATTCCATTGTTAAATGCTATGCGATTATAATCTTCAAAGCTTGGAATAACGTTATTAGTA
+ATAAGTTCTAGGTAATTTATAGTTTCATTCCTCTTTGCTTTATTAAGCTCTGGTAAATGT
+TTAATCATAACTGATTCAATTTCCAAAGTACTATTTTTATAAATTCCGTCCTTATAAACA
+TGGAGCTGGTTATTAATTTTAATAATGTGCTCTTCATCCCTTATAAATCTTGCAAACTGG
+TCATGTAAGAATTTTGACTTTTGATAAAACAAAGGTTTTAAAAATGCTTCATCTCGAAGT
+ATTGTATCTATTTCTCTTTGTTCTAATGGTTCTTTTAAAATATATTTGTTTATGATATTT
+ATAATGTTTTTAATACTATCCTTACTAAAACCTTCTGATTGAAGGGTTAATATATAATTG
+AATAATGCTTGATTTCTTCCATCTCCTTCTTTCATATTTAGAAAATCCGGTGCTGTTTTT
+AATGGTCTTAGCCATTCTGGAAGATAGTCAACTTCTTCTGTTTTGTTTAACCATCTTCTT
+GTTACCCCATTCACTCTCAATGGCACAATACAATTCTTTGAGCCAAGTCCTATGTCAATT
+GTTACTCCTAAAGGAGTCTTTGTCTTGATTTTTCTTGTTTTTAAATCTGTGTTTTTAAAA
+TAAAAATGCATCCCTCTATCTGTCTTTAATATGCAACATTTAATATCTAAATCTGTTATT
+ATGTTTTTTACAACATTTGCTTCTTCTATTGAATCAAAATCTATTTGAATAATATCATCT
+TGTAAAACTGCACCGTAATCTTTGCCTGTTTTTCTTATATAGTCATAACAATAAAATTTA
+TTTCTGTCCTTATATCCCTCTAAAGGTTTTTTTCCTTTTAAAGGAATGTATCCTTTGAAA
+ATATCCATGGTGTTTTCACCCGCCTTTTGGTAAGAATTATATAGTAAAAAGGATGTTTTT
+TTGCCCATTTTCATATACTTTTTGGGTTGTTTAATCATAAAATTTATATGTTTATTCCCA
+AAAGTCGCTTTAAAAATCTTAATATTACCCTTAAATTGCTTTGAAATTTAACCTTTTTGA
+TTAATATTTCCCAAATTCCTATAATTTTTTATCTGATTTCACCAACAAAATCTTCAATTC
+TTTTCTTTGCTAAATTTATATACCACTCTTTATCAAGGCGTCTTGGTACTCTTTTGCCTA
+TAACACTGTCATTTACTATAAAACATCTTTCCGGAGTATTTGCTATTTTTTCAACTCTGC
+CATTAGGCTTTACTTTAAATACACCTTTATCCTCCTCATTCTTTGATGCAAAAACTCTTA
+AAGTTTTTTCTGCTAATGGTTTGTCCCCATAAAGAGCATGAGAATATTTATAAGTAAGCT
+TTACAACCTTTTGAAACATTAAAAGCTCCTTACATTCCGTTATAGTTTTTTCAACTGGAA
+AACCTTCTATAAAATATTTCTTTAAAGCTAAGTTTATTATAGGCAGATCATTATCAATAC
+TATTTAGTTCCTTAACATAGGCCCCTTTAGATTTAAAACTGCCGTCTTCTTTAATAATGA
+TGTAGTTATTTACATCCTTTTGATATATTTTTTTAAAGATTTCAAAATCAAGCTTCATAT
+AAGTCCTATCTTCCCACTCTCTGCAGATTTCTTTAATTTTATCTAAATCTGATTTCCTAT
+TTATTTTTCCTATTAAACCATCAGTATTGGACTGAATTAAAGTCCAATGCGGTTCCAGCC
+TTTCTATTAAATCTAAAAGTAAAAGCTGTCCTGCTACACATACATTATTAGCCTGTCTTG
+GGTCATAGAGGTTATTGTATTTGTATTTCATAGCACCATAGGTACTATTTAGAACAATTT
+TATAAGGTTGCTGCATTGGGTTCTTTTCAGCTTTTAATCTTATACGTTCTTTATAAATCT
+CTTTATATAAATTAGAATCTTCCACATTCCTTGATAAATAGCCATACTCTATCATCAGTG
+TTGGATAAAATGAAATTACATCTACATTTAAAAGAATTCCTTCACCTATATATTTTTCTT
+TTGCACCATGAAGTCCACCCCATGCAAATACATGCGGGACACCACTTATATTTATTTCTA
+ATGATTTATCATAACTGTGATTACTTGAATTTTTGTACCAATCAAGAACCTCATTATATT
+TATTTATTTTTAAATTACTTGGTATGTCCAAATCAAACTCATCAGAGCGATTTATTTTAT
+TTGCTTTTAAAATAACTGCTGCAAGCTGAGCCTTTGTTTTACTTATATATTTAAGCGGCA
+GTTTAAAAGCTTTAAGTAAAGCTATATGACTATCAAATTCCTCTTTACGATGTAAAAATA
+TTTCTATAGTCTGCTCAACATCATGGGTACAGTATTTTACTACTTCCTCTAATTCTTCTT
+CTGTTAACTTTCTATCTATTGAAAAGCTTACAGTGCTTTCTCTTATGTCATTTCCCATAA
+ATCCTTCTAGTTCTTTTAAACCGTGAGTTGTTGTCATAATATCAAATTCATAAAGTTGAA
+TTTTTTGAAATAGCGAGCTGTACTGCCAGCCTTGATTTTTTTCTGCTATAATGAAACTGG
+AGATACTATATGGGTCAAAACCACAAAGGATACCTTTTAAAATATACTGATCATAATGAT
+GGCTGTTATAGCCAATCCAGATATGTTCTTTATGTTCTTCATAAAATGATGCTAATTTCT
+TAGCATCATTTATAAAGACATATTTTTGATGATTAATAGGGTCTATTACGACGAAGAGCC
+AATCTTGCAGGAAAACCTCTGCGTCAAAGAATAAAATCATACCTATTCAACCTCAAAAAC
+CTCAGTAATTTTAAAGGTCTTAAATCCTTTGTTGGTTTCCCCATACTCTACTGCATATTC
+TAAATTGCCGTCAATTGCTTCATGAATATCAAGTATTAAATCGTAGTATTGTGAAAAACT
+TTCAAACTCTACTTCTATTCCAGCTTCAAGAGATCTTAAAAATTCATTAGCGTTATGAAG
+CCCAAAAGCTGTGTTTATAACTTGGTTCATAAACAATATGGAATTTTGATATTCACCAGA
+TAAGATTTTCATCCAGCAGGATAACATAGGTTTACCTGTCTTTGATTCTACAAGTTCCAT
+TTTTTCAATTTTTACCTCATATGTTCCAAGGGGTACATCTTTGTATTGACCTTCTCCTGT
+TCCTACATTTTTTAAGTCTTCCTTTAAACCCTTAATATCAAATTCCTTATCAAACTTTGC
+AAATAAATTTTTTGTTGCCATAATTATCTCCTCCTATTTTTATTTTCTAGAGCGTCTGCT
+CTTTTTTACTGATTCTTCTTTAACTTCAGATGTTTCTAATACAGTTGTATTATCTACTGC
+TGCTGTATTATCAGAAGTATCTGTTTCTGATTTAGAATAAGTTTTTACACCTTCCTGAGC
+ATCTTCTAAAGCTTTCATAAACTCACCCTTATCAAGCTCTACTTTTGGAACTTTAAAATT
+GAATCTGCCACCGCCGAAGATATTTTCTTTCTTTTCAAGCTGCAAGTATCTTTCTTCTCC
+ATCCATAAAGGCTCTTACAGTTAAATCTACTGTTCCTGCTAAAACATTAGCTATTTTTTC
+ATTAATATTAGGTTTTATGGTTGTAAGCTTAGCTCCATTTTTTAGTGTTATTTCTGTAGT
+TACTTCCTTAGAAATATAAATTATTTGATATCCTAAATTCTTAAGTCTTTTTATGGCTGA
+TAAATATTCAGTTCTAACCATATCCCATCCTTTACCAAAACCTGCATCCTGCTCATGGTC
+TATTCCTAACTTGTTATACATATAAAGCCTGCAGTGTTCATATAAGTCCTCAACTAAATC
+AATGCACACTCTTTTGAAAGTGTTATCTTTCTTTTCAAGCTCTGTAATAACATCTAAAAA
+TACTTCCCAAGCCATTTTGACTTTTTTAAGTCTTCCTTCAAAAGTTACTTCATCAGCTAT
+TTTTATAACTGGACTTGTTGTGTTATCTGTGTTTCCATCAGTATTTAAGAATAATAAATC
+ATCGAACTGATCAACAAAAGTTGATTTTCCAACGTAACTGTCGGCATATATCCACATGTC
+CGGATACCTGTCTATTTGAAGTTCTCTCCTAACATTTTCTGGTAATAACATATCTGTTTG
+TCCTCCTTCACAATAATTTTGATATTCACACCAATCACAAAGTCTTGATGGTGTTTTTTC
+ATATTCTTTTTCATTAATAATTTCCCGGCATCTTAGCTTAAATTCTTGAACCTTAGTCTC
+ATCATATGGAATTTGAATCACCTTAACTTCCATAGCTTCTAAAGTTTTATGAAGCCTTTT
+TCTAAACTGATATAAATCCTCAGTTTTCCTTTGCCTTATAGCTGTTTTAGGAATAAAAAT
+AAATCCTATTTCTGATACCTTAAATCCAAGTTTTTCTAAGTAATACCTATATAAGTGCAG
+CTGTTTTGACTCCAGATAATGCTCTATATTATTGCTGTATTTAAAATCATAAATGCTAAG
+ACTTCCATCCTGTGTTTGGATAATAAAGTCTACAAATCCTATAAATTCTGGAAAATCAAT
+TTTAAACTCATATTTTTCTGTCGGCTCTTTATTATGAAGCATTGTATTTATTACAATCTG
+AGCCTTTTTCACTAATGATGTAAGCTTAATAACTTCATTTACATGAGCATCAGTAATAAC
+TGGATACTGATTATAATAATATTGCTCCATTGCCTCTATACCTTTCTCAATCCCAAGATG
+TAATGCTGAACCTGCAATTAAAGCATTATCTGCTGCCGGTGAAGGTATTGTCCTTACTTT
+GTCTTTATATCGCAGTTTGAATTGGTACTTGCACTTTTCAAAGCACTCAACTCTGCTGTG
+GGAAAATTGCACGCTAGCACCTCCTCTATGAGTTTTTTAAATTCTTCAAATCCTGAAGGA
+TATAAAATTATTCCAATGCCTCCTGCTTCATTTATATTTTTTATATTCATTTTTTGAAGT
+TCTGTTGGTTTTCCTTTTTCTGCTTTCAGCTCAATGGCTACAAAAACTCCATTTATACAA
+CAGATTAAATCTGGAATACCGCTTCTTTGAAATCCACCACCAAAAACTTTAAAATACCAT
+GTTTTTGAGAGTGTTTTTAAGTATTTTATAACTTTAGTTTGAAACTGTTTTTCTGTCATA
+ACATCTCCTTTTCAAACAGCTCCACAGTAAAATCCCGCCTTTGTTTTAATACTTCAAGTA
+TCTTTTCTTCTATGCTGTTTTCTGTAATAAGATAGTAGTAAAAGCAAGTCCTATTTTGCC
+CTATCCTGTGTATTCTCTTTTTTGACTGCATCCAAAATTCACTAGATAGTGGAAGGCTGA
+AATAAATAATTCTATTTGCCTTTTGCAAATTAACTCCAGATGCCCCTGCTTGGTACTGAA
+CCAATGTAATACTGTTTGACTTATTTTCATAATTTTCAAGGTCTGTTCCGTCTCCATTAA
+TATAGGAAATGGGTCTATCTATCTTAAAACAGATGTTTTTTATAATCTCAAACTCTCTTT
+TAAAATTGTAGAAGATAACAAATCTATCATTACTGGATTCAAAGATATCTTTTAGCACCT
+GATGTTTATTTGAGTTGTAAATAGATGTTAACTGCCTTAGATACAATAACTTTGTAAGTG
+CTGTATCTCCTGCTAAAGTTTCACCATCAATTGTAATAACTCTGTCTTTTTTAAACTTTT
+TATATTCCTTTGAGTTCTCGATTGTTACAACCTGTTCAATCTGCTCCGGCAGGTCAAATA
+CTTCTTCTGTTTTCATAAATACTGCACCATAGGATTTTAGTTTTTCCTTTAACCTATCAA
+CATTTTTATAGCCTTTTACAACTGGAATTTTAAATCCTCCAACATCAATCTTTTCTGTTA
+TTGTGTAGTGATTATAAAAGGAGCTTTTACTAATATTCCATCCAAGAAGTCTAAGCTGTG
+ACCACAGCTCCTCATATTTTCCACCTGTAGGAGTACCAGAGAGAAGAATTATATTTGCAG
+GATTAAGGCTTAAAATAAATTTTGCCCTGTTGGATGTTTCATTTTTAATATACTGCGATT
+CATCAAGTATTAATGTAAAATCCTTTAGCTTTTGTAATTGCTTCCTTCGCCATACCAAAT
+CATAATTAATAATAATTACACTATTTTGCGGTATGCTCTCTATAGATTGATTCTTGAAAA
+TTATAATTTGTAAGTTATAGTAATCTTTAAAATGTTCTTCCCAATCTTTAATTTTGGACT
+TTTGGCAGATTAGAAGATTATAAGGTGCATTTAATTGTTTCATTTTTTCTGAACCTAAAA
+ATGTCTTACCTAATCCCAATAGGTCACATGTCAAGATAATAGGCTACCTTTGACTTATCC
+ATTGTCTCCTCCAACACATGCTGCTGATGTTTAAATAGCTTTATCTCTGACATAAAAACC
+ACCTCCCTTCCAGTAACAGCTGCTAAATTTCAAATTTGTATCCATACTGATTCATGATTT
+GATCAATAAACTCTAATGATTCAGGAAGCCACACATTTGTCTTTATTTTCATTCCATTTT
+TCAAGGTATCAGTAATAACCTGACAGTATTTTGTATGACTGTATTCAGCTGTCATAACGT
+AGTATGGATTACGACCATAGAAGTTGTTATCAACTTTTTTAATTACACCTGCATCCTGCA
+TTATTCTGTTAAACTCCTGTGCCGTTATTCCATAATACATACCAATATCTGAAGCTCTAA
+GCATTTCATTTAAACGCTGAAGATTTCTAAATAATTCTAGTTTCTTATCCTGTTCTTCAA
+TCTTTTCTGTAAGCTTTTGTATCTTTTTTCTTTCTTCTTTTAGTGCCTGAAGTGTTTTTA
+TCATTGTATCTGGGTTATTTAGCATTTCTTCTATTACCTTATCCGTTGCATAAATTCCGT
+GTTTTCTTATAGAAGGTAAAACTTCATCAAAAACCCATCGTTCAAAACGTTCTGCTTTAG
+GTAATTTTGATTTAACAATTAATCTATAAAGATCTCCTTCTGGTATAAACTTTATTTCCT
+GTTCACCACCACTTGTAAGGACTCGGTGTTTCACCGACCCCTTTGTATGCCTATTAATTG
+CATCATAAGGATCTGAATATCCAAGTATCCTTGCACAATCAGTTGCTGGAAAATATTCTT
+TTCCGTCAATTACTAAAATGTTCAATTCACCAAATTCTGTGTTTTTAAAAACTTGTAATT
+CATTCATACCTTTTTCCCTCCCTTATATTTTTTTAGCATCTTCAAAAATATCAGCATAAT
+CTTCAAGTTTAACTTCAATTAGCTTTTCTGCACCATATTTTCTTAATAGTGCTTTAATTT
+CTGTTATCTTACCTTTTTTCATTTTCTCTGTTAGTACCATGCTTATATCTTGAATGCTTA
+TTTGATCATTCATTGTATGGTTCTTTGCTTTTGCTCGATATTCTGCTGCAAGTCTTTCTA
+GTTCTTCTGCAAGAACTAAATTTATATCAGTCATAAATTCCACCTCCTTCACCCTTATGC
+TTTTAGAGCAAAGTCTTTGATAATGCTATTCATTACTGCAAGGTCGTCACCTGACAGCAG
+GATACTTAATCTTTTTAATAATTCCAATTGTTCAGGTTTTAAATATTTTTGATTTAACTT
+ATAACCATCTGTAATCTTGATACCTCCACCATGTCGTCCTCGAATAGTTTCTATGGGGTA
+AGAAAGCGATAGGATATCAATATCATTTTTAATGGTTCTAATACTAACCCCAAACTCATT
+TGCTAAGTTAGCCATTGTGTCTTGCCTTCTATGACATAATCTTTCTATGATTTCTATGCG
+TCTTTCATTTGGTCCCATCGCTTTCTCACCCCCTTTCCTTTGCTCTGTGATTTAAGAATA
+AAAGTTAAATATGCAGACTTTTTGCTTATTTAAAAAAATTTTAGTTCCTGCAGCAATAAA
+AAATAGCCGGAGAAATGCTATGTGCTAAGGAACAATCCTTAAATGCACATTTACATTTCA
+ATCCGGCTATCTAAGCAGCTCACAAGGGATTGAATTTTATTTGATTTTTATATTATTTAA
+GATGCTTCTTCTCTTTTCTTTTTATAAATAGACTTACAGACTTCTTTAATTCGTACCATT
+GTCGTCTTATCTACATATGGACTTATAACAGAACTAATATCAATTAAAACAGGTTCCTTA
+TGCTCTCTGCATTTTATTGATATTAAGAAAGAATCTTCTTCAATAAGAATTTTAAATAAT
+AGCTTTTTATGTTTTCCTTTGTCTCTCACTTCTTCTAATACCATAGGCACCTCCATCTTT
+TTCTCTAATCGTGTCATGTCAGCTTTTAAGCGAACATATAGCTTAAAAAAATTTTGTCTT
+AGTTTTATAACTTGTATGCATTTAGTCATTAACATAATGCAAGAGTAAAATTGATACATT
+TGTTTTATGCACGCTTACATGTGAACATATTGTTTCAAAATAACAACACGAGCTATAGCT
+CCTGCTGTCATCTTTATATTGAAATTCCCAAAGTATTTAATCTTATTCCAGCAGCCTGTT
+TTGATACTTGAAACACAGATGCTAATTCATCAATTATTAATTCTCTAATAATTTCCGGAC
+TTAATCCTCTCCACAAAAAATCGTTTATTCTTTTTCCTGCTTTATATCTTCCTCTTAACT
+CTTCTGCCTTTATTCTAAACATTTCTGCTGGCATTAGGATTGCTGCTGCTATGTTATCAG
+CCTGCCACTCTATCCACTCATCTGCTGTTTTAGGCTTGTATGCTTTTTGTTTAGGACATC
+TACAGGCTTTTGCCATAGCTTTATCTTTATATGACAGGGTCATAAATCTTAATTGATGCT
+TGTCCCAATGAACCATTTCATGGGTAACAGTAAACCTTTCTCTGCCTCTATTTGCTATTT
+CAGAAAGATCGCTTTCAACTAGAAGAGTTCCTTTTTTATATTGTCTTACAATATTTTGCT
+GAGTATCCTTATCATAAAGTTCCACACATCCATCAGAAAATATCATCATCCCTAAAGTAT
+CACAGTTTCTATCGATATTTACATAGTCTATTTCAAGTCCCATTTTAAGCTCTGCAATAT
+CTTCTACTGGTATTGCCATTGGTTCTTTCAAACCTTGTGGATAGTATTTTTGCAAAAATT
+TAGCTGCTTCTTTATCTATATCCCCTTTTCTGATGATGGGAACTAAATCATTATTCAAAT
+TCATTATTACCCCATCCCCTTTATTTATTGTAAGCTTCTATGTCATTTATAACAAAATCA
+CTTAATGAAGCATTATCTAATACTGCACTGCAGCTTAATTTAAACCATTGGCGTATTGAC
+TCTGAAATATTTTCTTTAGCAAAATAATCCCCTATTTCTATATCGCAATTAACAAGTATA
+TCAAAACTTACTTCTTCATCATCTTGCTTGATGTTATTGACCCTTAGTATTTCTATATTA
+TCCAATGTAGCTTCTAAAACTTCTATTACATCTCTAGCTCTTAATGTTAAGTCATACTCA
+GAATAGTTATTCATTATTTCATCTTCTAAAGTATCAAAAATTTGTTGGTAAAATTGTTCT
+TCTATCATACCTTTAAAATAATCATTCATGAGTATCCCCCTCCCTACTCTTTCTCATCTA
+AGGCTTTAATAAATTCAATCCAAGCCTTTTCTGTAATATCACTTTTCCCCTCACTTTCGA
+TTTTACGTGCTTTTCTAAGGGCAGTTCTAGCCAAACCACTTTCTTTTATATAATCAGGTA
+AGTCCATAGGGATTTCATCCCTATCTTCAGATGCTATATCAATCATATAATCTGTTTCTT
+CTGGTGTTAGTCCTAATATTTTTGCTATTTCCTCAATCTTATTGATATTAGGTGGATTTC
+TTCTCCCTTTTTCAATATCACTCCAATAAGCTGGAGAGATATCTAACAGCTCTGCCATCT
+TTCTTAAACTTATTTCCTTTTGTTTTCTTTTTTCTGCAATAAAATCCCCAAACTTACTAC
+TCATAATATACACCTCCTTTCACTGTCAGCATTATTTATTTAAAATTGAGTTTTGAACAC
+TTAAATAATAGAAAACTGCTTATATTCCTGTTTTTCCTTAATGAAATTCAAATTTTTAAG
+TCTTATCCTTGCAGCTGTTAAAGATACGTCAAATATATCTGCAATTTCACGACTTAAGAC
+ATCTGCCCATAAATCTTTTTCAAAATCAGTTCCCATTTCATAACACATTCCCACCATACC
+TGCTGACTTAAATTTAGCTGTTACATATCTGGTAAAGATTTTCTTAGGCATTAATAATGC
+TGAAGCCATATAATCCGCCTGCCATTCAATCCAATCATCATCAGTTACAAGCTGCCTTTT
+CCCTGCACTTTCAATATCGATTGTACGGCATTTTATCACTGGCTCATTTGGGATAGCACT
+ATCAAATAATGTCATCTGCATTTTATTAATTGTGTAAATATGTCTGTGTAAAAGCCAATG
+TGCTATCTCGTGTGCATGAGTAAAGCGGCCTCTTCTTAATTGATCTTCATTCAGAAGACT
+ATTGTCTATTAATATAGTCCCTTCATTTACTGGTATTCTTTTCGCTTTATTATTATCTGC
+ATCATATACAGGAATATAACAATCATTAAATACTGTCATTCCTAATATGGATTGATTATG
+TGTCAAATCTTGATAATCCATTTCCAATCCAGCATAACATTCTGAAAAATGCTCTACATC
+TAAACTGCAAGGCTCTTGAAGGACCTTTGAGTTATAATCCTGTAAAACTCTTTCTGCTAA
+ATCATCTATCTCTACTCTTTTAAGAATAGGTGTACCATTATTTTTAGTTTTAAAATCTAA
+TTGAATCAATCTACCATCCCTCTCATAAATGCATGTATGCTTCATTGCTAACACTATTAT
+AATATGGCATATTATTCCTTGTCAAGAAATAAACATACAAAAACCGAAAAATAAGACAAT
+TTTATTGAGATATCTTACTTTTCGTACATAACTTTTTCAATTCTTCTCTAATATTTTTGC
+TAGTGCCATAACAATACCTTTCAATTGCTTCTTTAATATTAAGAAATATTCCTTGAACCT
+TGCCAAACTGTGATACATTTTCAAAGATAGCTTTACATTTTATTAAACAAAGGTAGACTC
+CAACAAAATTCTAACTTTTAGTATTCAGTACCTCTATTATTTTATTTACGCAGCCATCCA
+AATCTTTGATAATCTGCTTAGACCAGAACCTCAGTACAATCCATCCTTCTTCTTCAAGCT
+TCCTTGTTACTTCTAAATCTCTTTCCATATTTCTTTTTATCTTTTTATTCCAGTATTCTT
+TATTTGTACCTGCAACATCTGTATTCTCCTTATAATTGTATCCATGCCAAAACTCTCCAT
+CACAAAATACAGCAACTTTTTTAACCACAAATACAACATCAGGCTTTCCAATTAATTTCC
+TATAATTTTTTCTATAACGATAACCTCTGCTCCACAGTGCTTTTCTTAGAATACATTCAC
+TCTTACTGTCTTTATTTTTTATTGCTCTCATATTTTTTCTTCTTTGTTCTGGAGTTAAAT
+TATCCACTATTTTCACCTCAAATTTATTAGATAAAAACTGACTTGTTTAATTAATGCTAA
+TTTTAATTTACCATTTTTTGTACACTATGCTTACATTTAAATCTATTCTGCTTGTACTAA
+TACCATTTTTTTAATATAATGTATTATATGAGTAATAAAGGGGTTGATGCTAGTGGCCAT
+TGCTGGAAACAGTTATACAATACAATTAAAGCCTTCTCATCTTGGTTGGGGAGATTATCG
+GTATACAAATACGAGAGATATTATCTACGGAGAAGGATATATTCCTTTACCCAAACCATA
+TGCTAAAGCATTTAATATATTTAACTCGAATTATTCTGCTACAGGCCTGGGATATAATTT
+ATTTCGTGCTTCATCTGTTGATGGTTTTTTAAATAACGTAACGCTTCTGGCCCAAGGTTC
+TTCAACTGCTGGAGATATATATGCTAAACAATTTTCTGTACATGGTAATCTTAAGATGAT
+TGGGGCATGGTATGCGAGTCAAAATGCAACAACTAACAATTTAGTAAGAGTTACTTGGAC
+ATCCCCAACAGATATTCTTCTTGAAATAATTTAA
+>NC_009012.1|provirus_2931283_2970170
+CTATTTTGCAAACAACTCCTCTATTTTGGACACAGCTTCTTTTTGAATATTAGGTAACAC
+ATGGCTGTAAGTATCAAGGGTAACGGAAATTTGGCTGTGGCCAAGACGTTCGCTTACTAT
+CTTTGGATTTATGCCTTGCTGTAAAAGCATAGTGGCGTGGGTGTGCCTCAGGTCGTGGAA
+ACGTATTTTGGGGTAACCTAGCAGCTTGATCAGTTTTGTAAATTTCTGACCTAGGTAATG
+GGGGTCATACGGTCTTCCGTCGTCCCAAGCGCATACAAAGTCTTGGTCATTATAGGCAGA
+ACCCATTAATAGCTTAGTTTTATTCTGCTTTCTTTTGTGTTCTTTTAAAGCTTGGACGGT
+GTAATCCATTAAAGCTATAGTACGCATTGATTTAGCTGTTTTTGGTTCTTTAAGCGTAAG
+TACGCCGTTTATGCGCTGTAGGGCATATTTGACCATTAAAAAGCCCCGTGGAAGGTCAAT
+GTTCTCCCATTTTAAGCCGCATATCTCACCTGCCCTCATGCCGGTTTGCAGTGCTAACAA
+TACTGGTATATAAATCGGTGTCTCGGCAATGTCATCTAAAAATTTTTTGGCTGTTTCGAC
+GTCCCATACTCGCATTTCTACTTTATCAGGACGGGGTGGCGTAACGGCATCGGTGGGGTT
+TGATATTATAATCTGCCAGTTTACCGCATGTTTCAACGCCAGGTGCAGCATGCGGTGTAT
+TTTTAAGACGGTGCTTTTACTTAAGTTTTTCTCCAGCAGGGATGAGTAAAAGCTTTGAAT
+ATGGGCTGGCTTTAGCTTCGGCATCATGATGCCGCCTATATGAGTTTTTATATGGGCGGC
+AAATTCGGTATAACGCCTATAAGTGCTCGGTGCTACATTGTTTTTGGGGTAAGTATCCAG
+CCAGTAATTGAGGTATTCGGCTACAGTCATGTTTGCTGGTTCAAAATATTCACCCTTCTC
+TATTTTTGCGATTATGTCGGCCAGGGCCTTTTCGGCTTCCTTTTTTGTTTTGTAGCCGCT
+AAACCACTTTTGTTTGCGTTTGCCGTTTTCGTCACGGCCGATGTCAACTACTATGCTGTA
+GGTGGAACCTCTTTTGCGTATATGGCCGCGCATAGGCTATCCCTCCTTTTAAGGCATATA
+ACTTTAAAAGACCACCGCCTTGCCAAATTTTTACAACGAATGTTTTCTTATTGCTTCGAC
+AATAGCGTCTGTATTCCAGCCTACTATTTCAATAGCTACGTCAGATACTGCTTTTGGTAT
+TCTTTCTTGTCCCCATGGTTTTATTCCTATTATAGGTTTACCATAATCCACAGATATATC
+TATTTCTTTTTGAATCCAGAAACTGTAAGCTGCATACATTCCTGACAAAATAAGCACACA
+ATTTACAGGACGAATTTGTCCTTTTAGCTCTTCAATTAATGTTTTCTGATCGACTGGGTC
+GTCTGGATCAATTACTGGGTCATGCTGTGGGACAGAGTAATTTCTCCATTTAAAATTTGG
+AGCTTTATTTAGTAGGTCTACTAAACGGTAATAATCATCATTGTATTTCCATGCATGGCT
+AATGAACAAATCATATATTTTTAGGTTGGGCATTGTTTACACACTCCCCTTCATTTGTGA
+TATAATCATATTAGAATCATAAATTTTAGAATAAGGCAGGGCGGTGGTCCCATGCAGAAT
+ATAAGAAAGAGAAAGTTTCGGAAAAAGCCCATTATCATTGAAGCCTACCAGACTGACAAG
+GAAATCATTATAAACACGATGGAAGGTCCTCTTAAGGCTTCGCCGGGCGATTGGATAATT
+ACCGGGGTAAACGGCGAACAATACCCATGCAAGCCGGATATTTTTAAAAAAACTTATGAA
+CCAATTGAGGATGAGTGATTTGTGTTTCTCACGTTATGGAGAGGGTTTGTTTGCCTTTGA
+CTCCAGTCAATGTGTTCGGTTGACATTATGCGTTCGCATTGTTCAACGAGCAACTTAAAC
+GGATCATCTGTTTTGGAATATATGCCAGCTTTAGTAAAGTATAAAAATTTTTCTTGCTTT
+AGTGCTTCGCATGTATTCCTATATTTAATCCAGTTTTCTTGGAATTTGCAGATGCCGTGT
+ACAGCTGCAATGATTGATATAACTGCGCTTAATATTGCTATAAGCAGTTTTAGATAAAGA
+GGTCCTTCCATGAGTGAAATCATAACAGTAATAGATGCAGACAGGACTATTTCTGCTATT
+CTTAGTCCTTTGTATATGTATTGATTTTTAGTGCTTTTTTCATCATACCACATTATCTGG
+TCATCTAGCCTTTGAGAAAGGTATTCTTCTTCTTTCATAAAGATATCCCACCTCTTTTCT
+TGTCGATTTATTTCATATGCAAGATTTTATACTCCACCAATTCCTCATTAACCCCTAGTG
+TGCTGGCGATATAACTTATCGGTTGGTAGCGCATTTCCTTAATGTCGTAATCATCGATAA
+GTAGCTCTGCTGCAAACTTGTTGGCCTCACATTCATACGGCCCAATAGGGAACAAGGTAT
+ATTCTCTGATAAAATATATTGGCTCTGATGAGTGCAGGATGGCATGTCCAAGTTCATGGG
+CCAATACGATACGCTGGCTGTATTCATCCAATGTACTGTTAACGACTATAAATTTATTTC
+GCAGCGTTTTTATGTAGTATCCTTTTGTATGATGTGAGTATTCCTTATGTACGACGTGTA
+TGTTGAGGTATTTTGCAAGCCTTAAGGGGTCTCTAGTTTCATATTTCTGGACGAGGTGCT
+TTACACGGGCGTGAATATTCTTTTTCACTCCGGAAGCACCTCCTTATTGGTCGGTTTTTG
+CCTTTTTTCTGCCGTATTTCTTCTTGTTCATCTCCTTTGCCTTCCAGAAGAGCTCGGATA
+TATCTCGAAAGAGCTTTTCTTTGTCTTCTTCTGCGACCTCATCGTTCATGAAGAAGATGC
+CGGCCTGCTTGATGAAGTCTTCATACTGCATTAGGTCACGTTTGGTCACTTTATGTTTTT
+GGGTGTATTCTTCAGGGATGTAGGGGTTGCGGATGTCAGTGCGACCTAGAAGATAATCGA
+CTGATACCGAATAAAATTCAGCTAATTTCTGTATTGTGACAAAGTCAGGTTGGCTTTTGC
+CTGTTTCATATTTTGTATATGTGGTTCTATCTACGCCAATAGCATCGGCTACATCTTTTT
+GGCTTAAGTTTTTCTCTGTTCTTAACTGCCTGAGAATTTCATTAAAGGGCATGTTATTCA
+CCTCCATATTTTATTATATGTGAATCTACTTCACATAACAATTATAGTGCAAAAATTTCA
+CTTTGGCTATTGACAAAGTGAAGCAACTTCACTATAATTAATTTCGGGGGGTGAAGTTAA
+TGCACAACAAAAACGTGGCAAGTGAAGTAAGAGAACTTATAAAAGAAAAACGTGCTGCCT
+TGAACCTTACACAAAAACAGCTAGCGGATTTGGTAGGAGTTGACAGAACAACAATTTCAA
+AAATTGAAAATGGAATAAGACCATCTGTAAATAGTGCCAAAAAAATAGCTCAAATTTTAG
+GCTTAGACTGGACAATTTTTTTTGATAGCGATGAAGAGCATCAAACCGAGACTGCGTAAA
+GGAAGGGGGTGAGGGGGATGGCAGACTTGCCACAGGTATTTAATTACAAAGGCAAACAAG
+TAAGGACATTTATCATCGATGGTGAACCGTGGTGGGTTGCTAAGGATGTGTGCGATATTT
+TAGAGCTTGGCGACACTCACAAAGCTATGGAAAGGTTAGATGAAGATGAGCGGAATACAA
+TTCCGGTCACCGACTCACTTGGAAGATTACAAGAAACTTATGTAGTTAATGAGGCTGGTT
+TATATAATCTCATTTTAGGTAGCAGAAAGCAAGAAGCTAAAGAATTTAAACGATGGATTA
+CCCATGAAGTCATACCTCAAATACGCAAGACAGGGATATATGCATTAGAACCAAAACAAC
+TTTTAGCAGTAGCAATAATTGAAGCACAGAAAATCATAGAAGAGCAAGACAGGAAGATAA
+AAGAATTACAACCCAAAGCGGAATTCTTTGATGCGGTAGCAGGAAGCAAAGATGCAATTG
+ACATGAACAGAGCCGCAAAACTGATATACGAAGAAACTAGACTAGGCAGAAACAAGCTGT
+TTAAGTTACTGCGGGACAAAGGCATTTTAATGAAAGACAACATACCGTATCAAGAATACA
+TAGACAAAGGGTACTTTAGAACTATTGAGCAGAAATATACGAAGCCAGATGGAACAACAC
+ACATCTACATTAAGACTCTGGTTTATCAGAAGGGGCTGGATTTCATAAGAAAGATTGTTA
+AAGAGGATAACGTAATACATCTTAAAAGAGCAAAGGGGGTTTGACAATGCGATACGAGGA
+CTTGCCTGATGTTTTAACTATACCGGAGATGGCAAAGTTTCTCCAGATAGGCATCACCAA
+AGCATACGAGATGAGCCACTGGAGGGGCTTCCCGGCCATACGAATAGGGCGGGCAATACG
+GGTACCCAAGAAAGCATTGCTGGAGTGGCTTGAACAACAGAGCAAACAGGAAGAGCCCAG
+ACTAACTGCAATTAGGGTGAGGTGATAAAAGAAAAGCCGTTTTCAAACGGCACAAACAAA
+AACCACTACACCCTCATTATACCACAAGGTGTAATGAGGGGGCAATAAGGGGGAGCGAGA
+ATGTTGTATAAAGTGACCTCACCCATGTTAGAACAGGAGATAGTTGTGGAAGCACAAAAC
+TCAACGCAGGCTAAGAGAAAGGCTTGTAGGTTGTGGGGCGTTAGCCCCAGCGACGAATGG
+CATGGCATATCCACGATGCAGGCCAGAAAGTTAACAGAGAAAGAAAGACAAGAAGAGTTG
+AGAAAGTGGGGGATTGAGGATGCGAGTATTTAAGTGTGGCTGCTGTGGCTATAAAGCACC
+GGAATATATGTTTGCATACGGACGAGGGCGGGAGTACGGTGAGCATCCGGAACACCGCTA
+CTGCCCTCAGTGTCATCAATCAATTGATTGGTACGGATACGGGATATTTTGGGTAAGTGA
+ACAGGCATCTTAAGGGGATGAAATACAAATGAGAAAATGGATCGGGAAATATGGAATGTA
+TATCGTAGCAATTGCTGCTGGTGCGGTACTGACACCGGCAGCAATCCGAACAGCAACACT
+ACAAAGAGGGTATAAGGCGATAGGTGGGGAGTATTTGATTATACCTCTTGCAATATTGAT
+AGTGTTCTTTGTGCAGGAAGTAAAACAAACAATAATGGAATTGAGGGGAGGAATAAAGCG
+TGAATAACGCATTGCAAATGCTTGAGATAGAAGAAGTTTACAACATGCCTGAGGAAAAGA
+GGGAGCGGTTTAAAGTAACAGATAAGGATAGTGCAAATTGGTGCCTGAGAAAGATCAAGG
+CTCTAAAACAGGAGATAGAGGAGAACAAAAGGATAGCTGATGCGGAAATACAACGGATAC
+AGAGCTGGTTAAAAGAAGTAACTGAACCACTGGAGAGGTCAATACAGTTCTTTGAAAGTT
+TACTGATTGAGTACCATATGAACATATATGCTGAGGACCCAAGCAAAAAGACTATCAAAC
+TACCATATGGCACATTGAAGGCTAGGGCTCAGCAACCGGAATTTTGCAGAGACGACGAAA
+AGCTGGTTAACTGGCTTAAACAAAATGGTATGACAGAATTTGTAAAGGTCATAGAAAAAC
+CTGAATGGAACGAGCTCAAGAAAAAAGTAAAAGTGATAGGTAATAGCGTAGTGTACGAAG
+AAACTGGCGAGGTCATAGATGGTATAACTGTTCAGGAAAGACCGCCTAAATTCACAGTGG
+AGGTGGAATAGATGACAAAAAAGTTAATGGAACTAGAACAGAGAGAAAACATAAATGCGA
+GCATAAGTATATTGGGCAGCGTGGATATTGCGCAGGTCCAACAGATCCTAACGAGTATAG
+AAAAATTTCAAATGGTTGTTCAAAAAACGCTAAATGAAGGCCATGACTATGATATTATCC
+CAGGCACATCGAAGCCATCACTTTTGAAGCCAGGGGCAGAGAAAATTTTGGTGTTGCTCG
+GGCTCACGTCGGAATACGAGATTATTGAAAAAATAGAGAATTATGAGAAGGGCATATTTG
+CATATACGGTTCGATGCATTCTGTCTAAAAACGGGAAAAAGGTTACAGAAGGACTGGGCT
+CATGTAATTCCAAGGAGGATAAATACCGGTGGCGGTGGGTATCGGAAAAGGATCTCCCAC
+CGAATGTTGATAAAGATATGCTGAAGAGCAAAACCAATGAGTACGGCCAAAAGCTATACA
+GGATTGAGAATGACGAGATATTTACTCAAGCGAATACAATCCTTAAGATAGCCAAGAAGA
+GAGCACAGATAGATGCGGTACTTACAGTCGCTGCATTGAGCGAGATATTTACACAGGATG
+TGGAAGATATGCAGGAGTTTCTGCAGAACGAACAGCTTGAAACCATGAAAGCAGAGGAGG
+CTGTAAATGTTAAGGTCACGTTCGGCAAACACAAGGGTAAGACGCTTGGCGAAATATACA
+GCCAGGCACCGGACTATGTGCAGTGGCTTGCGCAGAATGCAAGGAATGATGTCTTAAGAA
+AAGCGGCTAATATGGTTATGAACGGCAAAGGTAATGAGAGTCAACAGGAAGCTCAACGTT
+CGGAGGATCTATCGAACAATCAAGGAGAAGACAATATACCTGGGTTTGAGCTGACGGAGG
+AAGAACTCCCGTTCTAAAAACGGGCGAAGCTAGTTCTGTAAATTTGATCGCAGGGGTCGC
+TAAGATAGCGGCCCCGCCTAAATGTGAAATAAAAGGAGGCTACACCATGAACCGATTCAA
+ATGCCCCGCATGTGGCGGGAATCAATATACAGCATGTTCTACGTCTGAGAAGTGTATCTA
+TTGCGGATACAAAGGGCAACTAATGAAGATGGAGACGCTAGAGCCGGAAAGTGAAGGAAA
+AATGATAGATTGCAAATATTACGTGCCAGCATGGGTAGGGAACAAAACTACAAACCCACA
+GTCGGACTGGTGCTTGAAATATGGTGTAACCTTGGGCGGGAAATGCCTGAAGGGTTGCAG
+TGAAAAGAAGGATGTGAGGAATAGTGAAGTATAAGGTGATGTTCACACATAGCGACAAAG
+GACAAAAAAGAGGCCATAAACTGCGTGAAGGCAAAGAAATATACCAGCATCCGGAGGGGT
+ACTTCGTAGTGCTGGAGTTTGAAGGCGAAAGCGGGAAGTTCAGGGAGGCTTTTTGGCCGG
+AGGATATTGTGAAAGATAAGTTGTTTTTGTGAAGGTGGAGGGGTCAGAATGCCAAACAGA
+ATCATTAAAGAATCAATATGTACAAGCGACACCATAGACCAATTATCTTGGTTTGAGGAA
+GTGTTTTTCTATCGCCTCCTGGTTAATTGCGATGATTATGGGAGGATGGATGCAAGGCCG
+GCGATTCTGAAGGCGAAGCTGTTTCCTCTTAAAAGTGTTACCGAAAAGCAGATTTCTGAT
+GCTTTAAATAAGTTATCGACGGTAGGTATTGTAGCCCTATATGAGTATGATGGGAGACCG
+TACCTGCAATTGGTAACTTGGGAAAAGCATCAGCAAATACGTTCCCGGAAGGCAAAGTAT
+CCATTGCCTCCAGAGGATATTCCTTGTAAGCGCGAACACATCATGCCCGAAGAAAAAGAC
+ATCGAGGACCTCTTGTATGATGTCATGAGCTCAACGAAACGATTTGAGGAACATACCTTG
+CTCTCGGTTGAAAGACAGGTAAGGGTCGGTGAAAGCTATCTTGATATCGTTGCTAAAACC
+GAGAGCTCCGAAACACTTGTATTTGAATTGAAACGCGGCCGGTTGAGTAATAAGGCTATT
+GACCAGATATCCAAGTATTTGACCCTCATAAATGGAAATGGCATCTTAATAGGCTGCGGC
+TTAAGCGCCAATTTCGACATTGAGCGGTGCAGGAGCAACGATATAGCTGTTGTCATTTAT
+GATGATGACCTGAATATGTCGCTTGTATTAGGTAACTCCACTGTAAACAGTATTGATTTA
+ACGTTAAATCACGTTAAATCACGTTATGCAAAGTTAGCGCCTAATCCAATCCAATCCAAT
+CCAATCCGAATCCAATCCGAATCCAATCCTAATCCGAATCCAATTAGTAATAATGGCGCG
+AACAAGTCGCGCGGATTCACTCCTCCTACTCTTGAGGAAGTGGCCGCATATTGCCAGGAG
+CGTAACAACGGTGTTGATCCACAGAAATGGTATGACTTTTACGCCGCCAAGGGTTGGATG
+ATTGGGAAAAACAAGATGAAGGATTGGAAAGCAGCGGTGCGCACTTGGGAGAAGCGGCAA
+CAAAAAGGGGGTTATACATACAACTATGAGGATGGAGGCGATAGTCTGTGAACTTTGACG
+GTATTATCGAAGATCTGGCGAAGAAGTGTGAACCGAGCGAAGAACACTTTGATTATTACA
+AAGACGGCCTGCTTATTTGTGGCAAATGCAATACTCCCAAAGAGTGCGTGGTTGAAGTAT
+TGGGGACACTCAGAAAATTTGGATGCATGTGTAAATGCCAGAGTGAAGAGTACCGTGCCA
+TGCAGGAGCAGATCAGGCAAAGGGAAGAGTTTGAGCGGATCGGTCGCCTCCGGACGCAGG
+GCATCCAGGACCGATGCTATTGTAACTGGACTTTTGAAAATGACGATGGACGGAACCCTC
+AGCAAATGGACAAGGCTATGCGGTACTGCCTGAGATGGGAGGAAATGTACCGTGACAATA
+TTGGACTCCTCCTTTGGGGCGATGTCGGAACCGGCAAGACGTTTTTTGCGGCCTGCATAG
+CAAATTACCTAATAGACCGGGGCGTGCCGGTGCTTATGACTAACTTTATTAGATTGTCGA
+ATGCACTAATGGCCCTTGACGAGGACAGAAACGAGTACATTAAATCCTTAGACAGCTACA
+AGCTGCTCATAATCGATGATCTGGGCGCCGAACGGCAGAGTGACTATATGCTTGAGCAGG
+TCTATAACATCATAGATAGCCGTTATAAGAACGGCCAACCTCTTATTGTCACAACTAACC
+TGCCGTTGTCGGAAATCAAGAATCCTTCTGATATCAAGTACAGCAGGATTTATAGCAGAA
+TCATTGAAATGTGCGTGCCCATCAAGTTTGAGGGACCAGACAGGAGGAAAGAAATATTTA
+ACTTAAAGTTGGAAAAAGCAAAAAAATTGTTCGAGGGTGATTAAAATGCCAGTAAACAGC
+AGAGAAAAAGGCAAGCGCGGCGAACGGGAATGGGCAAGCATATGTCGGGAAGAAGGCTAT
+AACGTTAGGCGCGGACAGCAATACAACGGCATTGAAGGAGCTGACTGTGTCGGCTTGCCG
+GGAATACATCAGGAAGTCAAACGTGAACAGAGATTGAATATCGAAAAGGCATTGCAGCAA
+GCAACCAGAGACGCAAAGGACAGCGAGATACCGATAGTTGCCCACAGGAAAAATGGAGAG
+AAATGGAAAGTGACCATGTGGGCAAGTGATTGGTTCAAGCTATATCGCGAGTGGGAGGCA
+AGCGAATGGTTAAAGAAAAAAGAAATCAAAGAATTTGAAGGACAGGAGTTGTGGGGTTAG
+GGAGGCAGATCACATGAGCCGAGGAAGACCAAATAGGGGGTGTGAATGTGGGAATCCTAG
+AAAGACGCATATACAAAAAGATTGAGTACTATTTATACCACTACCACCAAATTCGTAAAG
+AGATAGAACAAGAAAAGGAAATTATTATCCAGTCAGGTGGCCGTGACCTCACCGAATGGA
+GAGGCGGTATCAGCTACCATTCGGATCCGACTGCGAATAAGGCTATTAAACTCACTAGTC
+CAGAGTTGCTAGAAAAAGAGAAATGGCTGAAGGTGATAGAAGGTACTATTCAGCATTTCC
+AAGGTACAGAAAAGGGCCGCTTACTACAGAAAAAGTATTTTGACCAGCTGGGAGAGCGAC
+ATATATGCAAGGAATTACACATCGAAAGGACAACTTACTATCGATGGCGAGAAGAAATTG
+TGCTGTATACCGCCTTACTAGCGGCGCAATATGGTCTTATAAAGTTTTAAAAAATTCAGA
+ATTTTTGGCCAATGAATGTGTTACAATGATAGCGGGAATATTATGATATTTGGGTGTCAT
+AGCAGAACAGATGCAATACAGCATAACTCGGCTGATGAAATATTTGAGGGTTAGATTGAT
+GAGCTGTTGAGGAGTTGCATGGTTCATATATTAGTAGCCAGGGTAGATGGGGGGTCAGAG
+AAGTATATTAGTCGTTTGCTTATAAAATGGGATAACAAAGGCAGAATTGAAAGTAGAAAA
+AATATAGAAGAAGGAGTGGTTACGTGTATTCTCACCGGTTCTAAGGGGTTCATATGCAGG
+CTTGATGTGGGAAAAGTATGTTGTTACGTGAACTTAGATGGCGTAGCCTTGTATCTGATA
+AATTTTGTCATAGATGTATAATTAAGTCAAGCTTAAAGTTGTAAGCAAAATATGCTATAA
+TAGATTGAGGGAAGAACGAGGTGAGATTATGAAAAGAAATCCACTTGTTGCTCCTGTGTT
+GAAGTGGGCAGGAGGGAAGCGGCAATTACTAAAAGACATAAAGAAGCATATACCAGAGAA
+ATTTTCAACTTATTATGAGCCCTTTTTAGGTGGTGGGGCTGTTTTATTCGAACTACAACC
+TAGTAAGGCTGTAGTGAATGATATAAATGAGGAATTGATGAATGTTTATTTAGTAATTCG
+GGATCATGTTGAAGAACTCATTGAAGAATTAAAAAAGCACGAAAGAAAAAATAGTGAAGA
+ATATTATTATGAAATAAGAGAACTAGATAGAGACAAGAGAAAGTATGAGCAATTAAGTAA
+CATAGAAAAAGCTGCGAGAATAATTTATTTAAACAAAACATGTTATAACGGTTTGTTTCG
+TGTAAATTCACAAGGTCAGTTTAATGTTCCTTATGGGAGATATAAAAATCCAGATATTGT
+GAATGAAGTTACATTAAGAGCAGTAAGTAATTATTTTAATAAAGCTAAAATAACTTTTAA
+ATGCGGAGATTTTGAAGAAGCAGTTAAGGGGGCAAGAGAGGGTAGTTTTGTGTATTTTGA
+TCCGCCTTATGATCCCGTTAGTGATACAAGCAGTTTTACAGGTTATGATATAAATGGGTT
+TGACAAGGAGGAACAGATAAGGCTTAAGGAATTATGTGATAAATTAAATAAAAAAGGTGT
+AAAGTTTCTACTTTCAAACTCAGCAACAGATTTTATTTTGGACCTGTATAAAGATTATAA
+TATAACAATAGTCCAAGCTAATAGGGCAATTAATTCAAAAGCGGACAAAAGAGGAAAAGT
+TGATGAAGTGCTGGTGAAGAATTATGAGTGAGACAAAGAATGATATTGCATGGGAACGAA
+TTTTTAAGAAATATAGAATATTAGAGAAAATAAAGAAAAATGGGGCTTTTGAAATAACGT
+CAGGGCAAATAAATGAGTTTAGAGAAGCAAGGTTAATGACAAAATTTGATCACCGAAAAA
+ATTTACCGAAGATTTTTGAAGAAAATAATTTTTCTATTCTTCCTATTACTAGAGGTAGTT
+ATTTAATTGCGCAGTTTAAGGCTTATCATAGGCTTGAGGAAAAAGAAACAGAAATAATCA
+AGATTCCATTTCCTACTTATATTGAAAGTATTGATTATGAAAACATAACAAGCGAGGCTG
+CGGCTTTAAACTGTGCGTATGTTTCAGGTATATTGGCTGATTTTATTGAGGATGAAGAAA
+TGGTTCCAACAGTTACAGGTCGAATGAGTTCTGATGCGTTTTGTTTTTATATTAATACTT
+ATTCGGGGTCTAAGTTTAAAGTTAATGTTACTAATGCTCAAATTGAGATAGATGGTGGAT
+ATGAAGGGCTGGGAACCTTTTCTTTAATTGAAGCGAAAAACTCGTTATCAGATGATTTTA
+TAATACGACAAATATATTACCCTTATAGGTTATGGCATGATAAAATTAACAAAAAAGTTA
+AGCCAATATTTATGACTTACTCTAACGGTATTTTTACTTTTTATGAGTATGAGTTTCAAG
+ACCCTGAAGATTATAATTCTCTTACTTTAGTAAAACAAAAAAAATATAGCATAGAGGAAA
+CAGAGATTGGGCTTGATGACATAATAGAGATCTACAAAAGGACAAAAATTATAAATGAAC
+CAGAAGTTCCATTTCCACAAGCAGATTCATTTGAAAGGATAATTAATCTTTGCGAGCTTT
+TAAATGAATCAGAGTTGACTAGAGATGAAATAACAACAAACTATGATTTTGACTCTAGGC
+AAACGAATTATTATACAGATGCAGCTAGATACTTGGGATTAGTACATAAGCGTAAAGAAG
+GTAGAGAGGTAATATTTTCGTTGACAGAAGAGGGGGAAAAATTATTTAAACTGAAATATA
+AGCCAAGACAATTAAAATTTGTTGAATTAATTTTGTCCCACAAAGTTTTTAGAGAAGTTT
+TTGAATTGTGTCTGAAAAATGGAAAAATGCCAGATAAACATGAAGTAGTGAAGATTATGA
+GATACAGCAATTTGTATAAAATAGAATCCGAGAAAACATTTTATAGGCGTGCTCAAACTA
+TAATGAGTTGGATTAAATGGATATTAGAATTAACTAGATTGTAGTACATAGCCAAAGATT
+GTACAAAAGTTCGGTACTTTTTAAACGGATTTATATGGTAGTATAGTAGTATAGAATTGT
+ATACTTTCCTCTTCAGCCCGGTTGCTCAGCCGGGCTTTGTTGAAAAATATGGTGGTTTTA
+GTAGGATTTTCTTCCTTTCTTATAGAAAATTAATACGAGATAGGAGGAAAGTAATAATGG
+GGGATAAGAAAGACGCTATAAAAAGTTTTCTTACAGAAAATGTCTTAGGCGTCATAATTG
+AATATGGTAAAGAAGCGGCTAAAGCTCGGATAAAAGATGTTGTTACTAATGACGCTGCGA
+AGTTAGCTGCAGCGGTTGGTATTGATATGGCAGGCTCAATAATACCGGGAATAGGGAGTG
+CTATTTCTGCATATAGAACTCAAAGACAACTTAATAATTTAAATACTTTAGTATCAGAAC
+TTAACAAGAAGGTTGAAGAGATTAAATTAAATTTTGAGAGACAGACAGAAGAAAATAAAA
+AAACCTTGGACGCAATTTTTGAAATGGTTATTTATAAAGCGGTTAATACTAATCAAAGCG
+AAAAAATAAAGTATATGGTTAATGGATACGCAAATCTGACAGCTATTCAAAATGTATCTT
+ATGATATAAGCTATCTTTTTTATGATGTTTTAGATAGAATGACTATATTAGATATAGCTG
+TTTTGAAAGCTTCATATCCTTTTTGGGGTACTGAAGAAAATAGGAAAAGCTTTGTAGATG
+TCTTGAATGAATTTGGCATAGATTATTATCAGTATGAAGCGGTAAGGGATAATCTTTATC
+GAATGGGGTTGCTAGAGAATCAATATGATGATGCTTTAGAAAAAGATCTAGATTTACTAG
+TTAAAAATGTTAATAATCTAAATGAAGTAGTTATTTCAATACAAGAAAGTCTTGCAAATC
+CCAGGAAGAAAATGAAGAAGCTTAAAAATACAAAAGTTGAATTAAAAGCTAAAGATCGTT
+TAAAGATATCTAAATTTGGCAGGGAATTTGTTGAATTTTTTATTAAAAATTATAACGATT
+AAAAATTATAACGATAATGTTGGAACATAAAGCTACTTGTTGAAGATAGCTTTTTAATTG
+GAGGGAACGATATGGATATTGGAATGTTTATAAAGAAATGTTTTGAAATAGGGATTTCAT
+TATTGAATAAAGAAAAGCTAACAGAGGAGGAGAAAGAACTTTTAAACGCTCTAGATAGTT
+TAGAAAAATGGATCCAAGATAGAATCCTTTTTGAGAATTAAGACTTTGGATAAATTAAGC
+GGGGTGAGGTGATGTGAAGCTAACAGAGAAGCAAAAGGCATTTTGCGATTATTACATTGA
+GACATTAAATGCTACTGAAAGCTACAAAAAAGCAGGATATAAAGTCAAAACAGATGGTGC
+AGCTAGAGTTAATGCTTCAAGATTGCTAACAAATGCTAACGTTAGGAAATACATCGAAGA
+GAGAATGAAGCAAAAAGAATCCGAGCGCATTGCCTCACAAGATGAGGTTCTGGAGTTCCT
+CACGCGAGTTATGCGTGGGCAAGAAGTTGAGGAAGTGGTCGGGTTTACTGAGTATGGGGC
+AGTAAAAGAGAAGAAAACACCGAGTGCCAGGGACAGAGTAAAAGCAGCCGAACTTTTAGG
+CAAAAGGTATGCGTTATTCACTGAAAAAGTCAACGTCGAAGGGAACATGGGCGTTGCTAT
+TATAGATGATATAAAAGAAGATGATAGTGATGACGCAAGTTAGACTTAGCGAATTAGTCG
+CACCGAGTTTCTACGAGATCCACAATGACATAAAGCATAATAGATATACTCATTACTGGC
+TTAAAGGTGGCCGTGGCTCAACCAAATCCTCTTTCGTGAGCATTGAAATCATCCTCGGCG
+TAATGAAGGACCCTAACGCTAATGCAGTGGCCCTGAGAAAAGTTAAGGAGACTATCAAAG
+ATAGCGTATTCGAGCAGTTAGTGTGGGCAATTGAGAAGCTGAAAGTTACTGAATACTGGG
+AGATAAAGCACAACCCTATGGAATTGACATATCTACCTACGGGACAAAAAATATTGTTCC
+GTGGCGCTGATAAGCCAAGGAAGATTAAATCCATCAAAGTAAGCCGGGGATATGTAAAGT
+TTATCTGGTATGAAGAAGTTGACGAATTCCTCGGAATGGAAGAAATCCGAATCATTAATC
+AGTCCTTGATGCGTGGCGGAGAGCAGTTTGTCGTCTTTTATACTTACAATCCTCCAAACA
+GGGTTAACGCTTGGGTGAATGAAGAAATACTGATTGATAGACCGGACAGAAAGGTCCATC
+ATAGCACGTATTTGACTGTTCCTCGAGATTGGCTTGGGGAACAGTTTTTTATTGAGGCAG
+AACATCTTAAAAAAGTTAACGAGAAAGCGTATAGGCACGAGTATTTAGGTGAAGTCACCG
+GCACAGGCGGCGAGGTATTTACAAACGTGAAAGCAAGGAAGATAAATGACGAGGAAATAA
+AAGCATTTGACAGGATAAAAAGAGGACTGGACTTTGGCTATGCTGTTGACCCGGCAGCTT
+ACATTGTGTGCCACTTTGATAAAACAAGGCGGCGGCTTTATATATTTCACGAGATATTCC
+AGGTCGGCTTGAGCAATAGGAAATTGGCAGAGTTAATTAAGAAAGAAAACAAAAGCAATA
+AGTTAGTGGTTGCGGACAGCGCGGAGCCAAAGTCAATAGCCGAATTGCGTGGTTATGGAA
+TCAACATAAGGGGAGCGAAAAAAGGACCGGACAGCGTTGAATATGGAATAAAGTTTTTGC
+AAGACCTTGAAGAGATAATAATTGACCCTGAGCGATGTCCAAATACATTGCGAGAGTTCG
+TAAATTATGAACTTGAGAAAGACAAAGACGGCAATTTTAAAGCTGAATTCCCGGATAAAA
+ACAACCACACGATCGATGCTGTTAGGTATGCGCTTGAGGATGATATGAGGACGGGCGGCC
+TATCAATTTTAAAGTGAAGAAGGTGAGAAAGGTTGCTGCTTAATCTTTTTAATTTCAGGA
+ACTTTAAAGACTTATTCCGCAATGATATAAACATGATGACTGTAGAAGAAATTTTATATA
+ACGAAATCAAAGAGTTCCAGGCATCCGATAGAAGGGCCTGGATGGTTATTGGCGATAGAT
+ATTACCGGTGCGAAAATGACATCCTTAACAGGCGTATAGTACGCCATACAGAGAGCGGAG
+ACATTGAAGATAGGTCAAAAGCAAACAATAGGTTGGCCCATGGTTTTGTTAAAAACCTTG
+TGGATGAAAAAATAGGATATCTGCTTACAAAGGATTATTCGCTGAAGTGCGACAATAAAG
+AATATATTGAGAAAGTTAAAAACGTCTTGGGTAAATATTTTCAATACACCCTTACCAGGC
+TCGGATATGAAGCGTCGAATAAAGGCATAGCATGGTTACAAGTTTACATAAATGAGCAGG
+GCAAATTTGGAATGATGATAATTCCTGCTGAACAGTGCGTTCCACTCTGGAAAGATAACA
+CTCACACTGAACTTTATGGCATGATTAGATATTATGTGCAGACAGTTTATGAAGGCAAGG
+AAAAGAAGCAGATCACTCGCGTGGAATATTACACGGATAAAGAGGTTTATTTTTATGTTC
+TCGATAATGACCATCTTATCCCGGATATAGAGCAATATGAAGGAGGGCCCATACTACACT
+ATAAAAAAGGGGAAGAAGGCCGAAGTTGGGGGAAAGTGCCTTTTATTGCCTGGAAGAATA
+ACCATCTTGAATATCCGGATGTTAAATTCATTAAATCGCTTGTGGACGCTTACGATAAGT
+CACGGAGTGAAATAGATAATTTCATTGAAGAAACAAAAAATCTTATCTATGTTTTAAAAG
+GCTATGGCGGAGAAAATTTATCTGATTTCATGAAAGACCTTAATTACTACCGGGCTATAA
+AAATAGATGATCCAGAGCATGGTGGAGTTGATACACTAACACCGAAAATAGATATTCAGG
+CAGCAAAGGAACATTTCGAACAATTAAAGCGGGATATAAATGAGTTTGGCCAAGGTGTGC
+CCAAGGACCTTGACAAATATGGCAATTCTCCCAGTGGGACAGCATTGAAGTTTTTATATA
+GTGGGCTGGATTTAAAATGCAACCACTTGGAAGTAGAATTTAGACAGTCATTTAATCAGC
+TTTTGTATTTTGTAAACAGATATCTCGCAGAAAACGGTCAGGGAAATTATGAGAATGAAA
+ATGTAGAGCTAATTTTCAATAGAGATATACAGATTAATGAAACTGAAACTATCAATAATT
+GTGTTAACAGTAAAGGCATTATTAGCGATGAGACTATCCTTGCAAATCATCCATGGGTGT
+CTGATGTAGAAGAAGAATTAAAGCAGATTGAGAAAGAAAGAAAATCAGAGGAACCGCCAA
+TGTTTGGTGAGGGGGATGAAGAGTGAAAGTAAGAGAACTGGTTGAAATATTAAAGGAACT
+AGACCAGGAGCAAGAGATAAGGTATAGTTCATATGAATTTCTCGGGGATTTTAAGATTGA
+AGGAGTTGAAGAAGCAGAACATGAAGGAATTAAGTACTATAACATAAAGTAGGTGGTAGT
+TAGTGAATAAAAAGGACATAACCTACTGGGAAAAACGACAGGAACGGAAATATCTGGCCG
+GAGAGAAGAAGCTTGATGAATATTATAAAGGTTTGCAGAAAGCGTTTAGACAAGCAAAAC
+GAGAAATCCAGAGTGTTATAAATGATTTCTACATGCGATATGCAAAAGAAAACAAAGTAT
+CCTATGCTGAAGCCCAAAAACTACTTGATAAGGCAGAAATAGGCGAGCTGCAGGACTTTA
+TAGACCTTGTTAATAAGAATATGGGCAAGTATAATCGAAAGCTTAACAATATGTCTATAA
+AAGCCAGAATTACCCGCTATCAAGCGCTAGAAAAGCAGATAGATGCTATACTACAGCAAT
+TATATGCTATTGAGTATGAGTATAAAGGTAAAGAGCTACTGAAGGAAGTATATGAGGATT
+CTTATTATCGTACCTGGTTTAACATAGACCAGTACCACGGCTTTCATCAGGAGTTCGCAC
+AGATTAATCCTAGAACTATAGAAGAGTTGATAAAATATCCTTGGAATGGAGCAAGTTTTT
+CTGATAGGATATGGAAGCAAAAAGACCATATGCTGCAGGTATTAAAAGAAGACATTACTA
+CTATGTTAATACAAGGGAAAAATCCTCAAACATTAGCAAGAGATTTCGCAAGAAGGTTTA
+AAACAAAAGAATATGAAGCATATAGGCTGCTACATACAGAGAGCAGTTTTATTATCGAAC
+AGGGAACTTTAGCAGCATATAAAGAAGATGGGGTGGAGAAGTATCAGATTCTGGCTACTC
+TGGACATGAGGACATCGGATATATGCAGAAGTGAGGATGGGAAAATATATGATGTGGATG
+AGGCGACAGTGGGAGTAAATTATCCTCCATATCATCCATTTTGTAGGACCACAACAGTGC
+CATATTATGAGGATGCTGAGGTAGGTACAAGGGTTGCGCGTGATCCGGTAACAGGTAGAA
+GTTATGAAGTTCCAGCGAATATGACATATGAGCAATGGAAAAATAGATATATAGATCAAC
+CTGACAATATTATTCGCCAAGAGATACTGAGTAATCCTGAAAGACTTGATAATTATAGTA
+TCCAACATTATAATAAGCATAAAGAAGGAACCAAACAATATGAGCAGTATAAGCAATCAA
+GACTTAAAAAAGGTCAAACTGAACAAAGCAGTTTACTAATTTCTTACGATGAAGCTAAAG
+AAATAATAAAAAAATATGCTGGTACTGGAGTATTTAGTAGAGACAGGAAAGGGAAATGGA
+GAAATGAGGAATTTGTGGATGTAGATTCTATAATTGGTGTTGTGCATAATATTGATGGGA
+CAGTAACGCCTACTAATAGAATTCAAATAAAATATGGGAAGAACAGCGTGCACATTGTAC
+CTGTATTACCAAGAAAGGAGAGAAATAAATGAATCTTTGTGAATATCAAGGTAAAAATGT
+AAGAGTTATTACGACAGACGGGCAGAAGATTGAGGGGTATGTAATAGCTTTTACAGATGA
+AGAGGAATGGGACGAGACCGATCCCGAGGGCAATAGTATTTCAATTGAAAATGATGAAGG
+CATTATTGGGATTTATGAAAAAGAAATAAAATCAATTGAAGTAATGAAAGGCTAAACACC
+ATCTATCATGAATAACGATAGATGGTGTTTTTATATCTATGGAAGCACTTGGTGAAGGCC
+AAGTGCTTTTATTATGCCGTCTTTTCGGTACTGCAGACGTAAAAGAACAGGACACTCGTG
+GAAGCGACCACGAAAAAAAGCGTAGTGAAGATGAAAGGAGAATGGAAATGACAAAAGAAC
+AGTTAATGGAAATGGGGTTAACTGAAGAACAAGCTGAGAAGGTTCTAGTTATATATAAAG
+AAGATTTAAAAAGCTTTATCCCTAAAGCTAGATTTGATGAAGTAAATGAAGCCAAAAAGA
+ATTTAGAGGAACAACTTAAAGACAGAGATAAGCAGTTAAAGGATCTTGGTGAAAAAGTAA
+AAGATAATGAAGAATTAACTAAGCAAATAAAAGACCTTCAAGAAGCCAACAAAAAAGCTA
+AAGAAGAGTATGAAACAAAGATTAAGAATCTTACATTAGACAACGCTATAAAACTTGCTT
+TAAAAGAACATAAGGCAAAATATGAGGACCTTCTTGTAAATAAGTTTGACAGAGAAAAAC
+TCGTTATCAAAGATGATGGCACTATAGAAGGATTAAATGAACAAATAGCAGCTTTAAAAG
+AAAATTACAAAGACTTATTTGAGCAGCCTTTAAGTGGACATACCCCTAATAATACCGGAG
+ATAATCCTGAGGGAGGAGAGCTTCAACAAATAGCCAATACTATCAGACAAAATTTAGGAT
+TTTAAGAAAGGAGAGCGTAAAATATGGCTAATGTATTAGAATATGCAAAAATATTTATGC
+AAGAACTTGATAAGCAGGTAGTGGCACAAGCTACATCTGGATGGATGGAAGCTAATGCAG
+GCTTAGTTAAGTACAATGGTGGTAATGAGGTAAAAATACCAGTTATAGACATGGATGCAT
+TAGGAGATTATGACAGGGCTAATGGATTTGTTGACGGGTCAGTAAATTTAACATATGAAA
+CAAAAATTATGACTCAAGATAGAGGCAGAACTTTCATGCTTGACCGCATGGATGTAGATG
+AAACTAACTTTGTAGCAACTGCTGCTAATGTCATGGGAGAATTCCAGAGAACAAAGGTTA
+TTCCTGAAATCGATGCGTACAGGTATTCCAGCATTGCAAGCCAGGCTATTGAAAAAGGTG
+TAGCAGTTGGTGGCTATACTCCTTCAGAAACCGACATACTTAAGAAGCTGAAAGAAGATG
+TCTATGCAATATATGATGTGGCCGGAGAAATTCCTCTGGTCATTATCATGAACATGCAGG
+TCGCTGCAATACTGGAGAATTCCACAGAATTAAGTAAAACGTTATCGGTTATTGATTTCA
+CTCAGGGGGATATTAAAACCTCGGTGAGGGCTATTGATAACAACCCAATAATCAAAGTGC
+CTTCCGCACGAATGAAGACAAAATATGTATTCTATGATGGCAAAACCGCAGGCCAGGAAG
+CAGGTGGATTTACACCAGCTGAAGATGCTAAAAACATCAACTGGATTATTTGTCCAAGGA
+CTGCGCCTATAGCTGTATCTAAAACAGATAACATAAGGATATTTACTCCTGAACAAAACC
+AAAAGGCTGACGCATGGAAGATCGATTACAGAAAATATCACGACCTCTGGATAAAGGACA
+ATCAGTTTAAAGCAATTCGTGTAAACATCAAAGAGGCCATAGCATAGGAGTGATGCCGGA
+TGTATAAACTTGAAAAGCTCAATGTAGTCAAAATCGTACCGACGGAACATGAACGGGAAA
+AACTCTTGGCTAAAGGCTTTAAGGATGCGGAGAAAGAGGAAAAGAAAGAGGAAAAGAAAA
+AGGATGAGAAGAAGGCTGCTAAATAGCGGCCTTCTCCCTCTTTTCTACCCTAAAAGGGGT
+GAGTATATGTCCATTGAAGAAATGCTTACAAAAGTAAAGAGTAACCTCAAAATTGAGGAT
+GATAGCAAGGACCTAATCATAACTGACATTATTCAGGAGTGTCTGAACTACTGCAACCTC
+AAAGAGCCGCCGGCAGAACTGGAACCATTTATCCGCCGCAAGGTCAAAACCATCATTGAC
+TATGAGGCCGAGACCGGAGGTAGTTCAGTATTTGACGTGACCTCAATAAAAGAGGGTGAT
+ACCTCTATAACTTACAACACTGACGAGGTTTCCAGAGAAACTATCTACGGCCTGTCTGAA
+AAAGACAAGCAGGCCTTGATGCGATTCCGGAGGTTACGAAGATGAGCGTATTGCAAAGAC
+TTTGGAAAGACCGAATGGATATATATCGTTGGGTTGAGGTTGTAGAGGGCGGCTTCACAA
+AACAGAAAAAGGAGAAGATTTACGAAAACGTCAAATGCCATTACAGTAAAGGCCAACTGG
+TTAACACGGGAGAAGACAGTGTGCCCACATTGATAACTTCTCACACTTTGTTTTGTGGTC
+CAGATGTGGACCTTCAAGAAGGTGATGAGGTGGTTGTTACCCAGCGGAATGGCAAGCAGG
+TAACCCTGACAGTAGGTGAGGGTTTTCCGTACAGCACTCACCAGGAGTTTTCCGTGAAAC
+GGGTGGATACGGCATGAGCAACTATCGCACAAATAAGGCCGCAATAGATAAATTCCGGAG
+AGAATTGAAAGCCATGCTGGGTGACATTTCTGAAATTGACAAGAGGGTTTTGGATAAAGC
+TGTGAGTATAGGCCTTGCTGATGCCAAAAGAAATACGCCGGTGGATACCGGTTTCATGCG
+GCGAAGTTGGCATGTAATGCCTACGAAGAAAACTTCGCAAGGTGTTGAAAAGGAGTTGAT
+TAATTCTGCAGATTATAGTTCCTTTGTGAACTACGGTCATAGGGTGGTCAACAAGAAAGG
+TGAAACAGTTGGCTGGGTAAAAGGCCAGTTTATATTGGAGAAAGCAGTAAACACAGTAGA
+AAAGGCTTTAGCAAAAGAATTTGAAAAAGAAGTGGAGAGGGTGAACAGGAAACATGATAA
+GTGAAATTAAGCAGGCTATTGCTCAGAAAATCCATGAACAGTATCCTTCATCTACTATCT
+ACGATGAAGACATTCCTCAAAACTTCAAAACACCCTCTTTTTTGGTAACCGTCATTGAAC
+AAAGCTATGGCAAGAGGCTCGCCAACAAATACAACAGCACCGTTTCCTTTGATGTGGCCT
+ATTTCAGCGATAAGGGGAAAAACGAGGTCAAATCCGACTGCCAGGCGGTACAAGTGAACC
+TGCTACGGGCTTTCGACCTGGTGGGAACCTTCCGGGTTCAGAACCTGCAGGCAACTATCG
+TGGATAACGTGCTGCATATTACCTTTGATGTGAGGTATTCGGAGATAAAGACAGGCGAAG
+AGATTCCAAAAATGCAAGCTCAAGCAACAAATACAGATATAAAGACCAGCTAATTAAAGT
+CAAGAGTTTTTAAGAAAAAATTTTAAGAATTTTCTAAAACTCCTGACAGCGAAAAAAGGC
+ACAACGACAAGACCACCTAAGATTAGTAGACATAAAATAGCTGGCCTGAAATAGTAAATT
+GATTTTTGAAAACTAAACATCGAGTACAAGTACTACTAAGCTGCTGTGTGCTTCGCTGCA
+AGCATTTGCGCGTGCTCTTGGGGAGAACGTAATTCGTAAGGCTTTCTATCCCTAAGAACA
+GCAAAAATATAATTAACAAGCTTACGCATAACAGCCCCCAAAGCTACTTTCTTGGGCTTG
+CTCTGGCATTTGTTTTTGTAATATTCCATCAGTACAGGGTTGCAAGCTGTTTTGTCCCGC
+TTGGTGCGGATATTAGCAAGAGCAATTGTGAAAAGTACTCTGCGAAGCAGTCTTGACCCC
+CTTTTTGACATCTTGTTTTGTGTGCCGGTAAACTCTCCGGACTGCATTACAGAGGGGTCA
+ATACCGAAATAAGCAACTAGCTTGCCTGGCTTTGAAAAGGCTGAAAAGTCGCCAATTTCA
+GCCAGAATGGTAACAGCAGAGATAAGTCCTATACCTGGAATGCTTTGTAGAAGCTCGAGA
+GTCAGTGCCAGCATGGGCATGTCCTTTGCCATATCTTCAATAATCAATGAACGAATGGCT
+TTGAAGACTTTCTCAAGGTTTTCTTCCAAGGTTTTAATCATAGAGATATACACACCAAGC
+ATGGCAACATTTGAAGAGTTACTAATGCTTAAAGGTGCAAATTCTTTGGCCTTGGAATTC
+AAAAGCTCATACTTTGCAGTTGCCCATTTAAGGCTTCTGCGGGAATTCTTCTGTATCAGT
+GCAATCAACTTGTTTCTGTTCGCTTTAAGAATATGCGCAGGTGCAGGATATTTCTCCAAT
+ACTGCAAGAGCAGCCTTTGAAAAGATATTAGGGAATACATCCTTGAAGTTTAGCATGAGT
+TGGTCAACAATACCCATAAGCCTGTTTTTGTAAGCAGTAAGTTCGTCAGAGAGCTTGTAG
+TACTGGCGGCAAAGGCTTCGCAGACATTCAATATCCTCGTCGGGGATATTGGTAGTTTTA
+AGCTCCTGAAATCTGTATAGCAGAGCAATTTTCCGGGCATCCACTTTATCATTTTTCACT
+TTCCTTATTCCAATATTTTTGATAGAATCAGTTTGGATGGGGTTTATGACAGAAACCTCA
+AATCCAGCTTTATAAAGTGAATGGAAAAGGATTTTGTGATAGTGCCCAGTGGATTCCATG
+ACGACGAAAGGCCTAGAATCAAAGTCCTTTTCCGTTTTTTTCAGTAATTCAACGGCTCTT
+TCAACGTCAGTACTGGAATCATGGCGGATCTTCATGCGGGCAATTACTTCATTGGATGGA
+GAAAGAATTGCCATCTCACTGAAGAACTTGCCGACATCGATTCCGGCGATGGGTCTAAAA
+TTCATAAAAATGCCTCCTTTATAAGATTAATGGACTTAAAAGACTCCATTCCTTCTCATG
+TAAGTAAACAACCTTGCGTGTGACACGAGGAGCCAGCTGAAATGCTGGCCTCAACCAGCC
+AAATCATTTAGACTTACCGGAATGGATAAATACTCTTTCTTACGGGTAGTCGGCCCAATA
+AGGTCCGTCCCAGGAGTGATTACAAACACTCTCCAAGTCCGGAAAATATTATACATGATT
+GACAAGGTTCAGGCCAGACGAAAGCTAGCAAGCGGTCATAGATGGGGAACCGCAGGCGGC
+AGGATTTGAAAGCCACCGCCATCCCCTAGGGGATGGCACATAGAAGTGCTTGATGTTTAG
+AAAAGCAACAAATATGACATTATGTTAACAGGGTCGAACAGTGGCAAAAGTCACTGATGA
+AATAACAATATTAATTGTACAAGGAGTGATAAAGATATGGGTGGAACTTGGACGAACCAG
+AATAAGATCCTTCCTGGGGCATACCTTAACTTTCGGACAAATGCTCCACTTTCCATAACA
+TTAGGGGAAAGAGGTACAGTAGTAATACTACAGGAAGTAAGCAAGGGTGCTAGTGGGGAA
+ATGTATAAAATAACAGCACTTGACCAGAGTAAATGGCCGACAGGTGTAACAGCTGAAGAT
+AAATTACTTGCAAATGAGGCGCTTAAAGGTGCCAATACTGTAATCGTATATAATTTGGGT
+GCTGAACACACCTCTGAGGTGGTTGAACAGGCTTTGGCTAAATTGATGACAGAAGATTTC
+AACGTATTGGTGTATCCATATGATGGTGCAGCATATGACACAATTAAAACTACTATCAAA
+GCTTGGGTTGATATGATGCGTACCGAAGAGGGCAAGAAAATTCAGGCAGTTATGGCTAAC
+TTTGCAGCTGACGATGAAGCGATTATCAATGTTACCCAAGGTGTTAGACTTGTTGACGGA
+ACAGAACTTACAGCAGCACAAACTACAGCATGGGTTGGAGGTGTTACTGCTGGTGCGGCT
+ATTAATCAGTCTAATACTGGACGTAAATATATAGGTGCTATCGATGTGGTACCTAGAATG
+ACTAAAACTGAAATGGAGGCTGCTGTTCAAAATGGAGAATTCATATTCAAAGTAGATACT
+GCTCAGAATGTAACAGTGATATACGACATTAACAGCCTAACCACTGTTACCGCAGAAAAA
+GGTAAGCAGTTTACAAAGAACAGAGTGATTAGAACATTAGATGGTATTAATAACGATATT
+GTAGAAATATTTGAATCGAATTATGTTGGCAAGGTCAATAACAACGCAGATGGTAGATCG
+CTTCTAAGAGCAACATTAATTGAGTATTTCAACGAATTGCAAAGACTAAACGCAATTCAG
+AATTTTACTGCTGAAGATGTAACCGTATCTCCTGGTAATGATTCTGATGCGGTAGTAATT
+GACTGTTATATCCAGCCAGTTGATTCCGTAGAAAAAATCTACATTACGGTAAATTTGTCA
+TAGTTGAAGGAGGGTAATAAGGTATGGCAGATAATTATGTAAGATTATCAGATACGATAT
+CCTCTAAAGAAGGAAAAGCTTATATCACAATTAATGGACAGAACAGGGAATTGTTTGAAA
+TATCGAGCCTGACTGCTCAACTTGAGCTTCAAGTACAGTCCCGCCAGATGCTCGGTCATC
+GTATGGTCCAGCATAAAGTAGTTGGGGCCGAGGGTACCGGATCAATGACAATGTATTTCA
+TGAACTCTGATATGTTGAGATTGGCGATACAATACATCAAAGAGGGTAAATATGGAGGAC
+TGAAGCTCCAGATTAAAAACGAAGATGCACAAAGCACAATTGGAAAACAAGAAATTGTGC
+TGCTTGGTGTATTGCTTAACACTATACCTGTTGCTGCATTAGATGATCAATCAGATGATC
+CGATTACTGTTGACACGGATTTTACATTTGATGACATTGAGGGTTTGAGTTTCTTTGACT
+TGCCGGCAAATTATAGATAAAAGGGAGTGGTAAATAATGAGTTTAGGTTCTTTAGAGGCT
+TTTCTTAATCCTGTGAAAGTTGAAAATAAAAAGGTTATAGTGTCAAACAGATTCAAAGAT
+AAAGACGGGAACCTTGTACCGTTTGAAATCCGCCCTATCACACAGGAAGAAAATAAAATG
+CTAATCAAGAAATACACAAAAAGGGACAAGAAAGGTCAGGAATACTTTGATAGAGCAGAG
+TATATATCAGAGCTTACGGCATCCGCCGTAGTATTCCCAGACCTTACAAATGCAGAACTG
+CAAAAAGCATACGGTGTACTAGGTGCATCTGCATTACTTCAAAAAATGTTATATGTTGGC
+GAGTATGCAGAATTAGCCCAGGCAGTTCAGGAATTGAGCGGACTTGACACAGATATAAAT
+GAGGATATTGAAGAAGTAAAAAACGCATAATGCAAGGCGATCCTGAGTTCGTCTTAGCTC
+ACTTCGCCTTGCAAAAATTACACATATTACCTTCAACATTAGCCAATATGAGCGAAAGAG
+AAAAAGCTTTTATATATGCTAGTATACAGCTTCGTATTGAGCAAGAGAAAAAAGAGTCAG
+CTAAAATAAAGGCTGCAAAGGGAGGAGGTAGAAGGCGTTAATATGGCAACTTTAAAAGCA
+GTTATGGCTTTATTGACTGGAGGTTATACATCAGGAATCAATAAAGTCATTAAAAATACA
+GATAAAGCAACAGATAAAATTTTAAAAGCTAGCGGTGCCACAGATGAATTTAATAAAAAA
+TTAGAAGTCACTGGCGCAAGTGCTAATACTGCAAGTGGTGGATTGGGGAAATTACTTAAA
+ACTTTTATAAGTTTAGCAGCGATAAAAAAAGGAATAGATATTACAGACGAATATAGTAAT
+ATAGCTGCTAGACTCGCACTTATTAATGACGGCTTGCAAACACAAGAAGAATTGCAAAAT
+AAAATCTTTGCAGCTGCTAATCGGTCTCGCGGTGTATACTCAGATATGGCCAGTGCAGTG
+GCCAAAATGGGGCTGCTAGCCAAGGACGCTTTTACCTCCAATGATGAACTAATTGCCTTT
+ACAGAGCTTGTACAAAAATCATTTAAAATTAGCGGAGCTGACCCATCTGAACAGGCAGGA
+GCAATGAGACAATTAGCTCAAGCGATGGCTTCTGGTAGGCTTCAAGGTGATGAATTAGTA
+TCAATAATGGAAAATGCTCCAATGATATATGAGGCAATAGCAAAATATATGGGAAAGACA
+AAAGGAGAACTTAAAAAATTATCTTCTGAAGGAGCTATAACGGCCGACATAATCAAAAAT
+GCCGTATTTGCCGCAGCGAAAAACATCAACACCAAGTTTGCAGAGATGCCAATGACTTTC
+GGAGACATATGGAACAGGATTAAGAATGGTGCACTTAAGGCCTTTGATAAAGTTATTGTA
+AAGGTAAATCAGCTTATTAATGCTGACAAGTTCCAGCGATTTGTAGACAGAATGATTACT
+GGTTTTAGTCTTGCAGCATCTGCGGCAAGCTGGTTAATCGATGCTATAATTAGAGGTTGG
+GATACGATAGGGCCAATACTTGCAGTTATTGCTGGCATATGGCTTGTTTCTATAATTGGA
+AAACTGTGGGCAATGATACCACCACTGATTGCGCAAGCAGCAGCATGGTTAAGTGTATAT
+TGGCCTATACTACTGGTAATTGCTATTATAGGAATAGCAATATCTGCAGCAAGACAGCTG
+GGAGCAACATGGGATGAGATTATAGGATTTATTGGAGGGCTAATCGGTGTTTTTGCCACA
+ACTTTCTATAACTATTTCGTCATGATCTGGAATCACATAGCCGCTTTCGTGAATTTCTTC
+GGCAACGTATTCAAAAACCCAGTAGCTGCTGTACAAGCGCTGTTTTTTGATCTAGCATCT
+AACTTGCTTGGGTATATCGAAAAAGTGGCCCGGGGAATTGAAGATTTGCTGAACAAGATC
+CCGGGCGTGAACGTAAATATCGCCGGAGCCATCACAAAACTGAGAGACAAACTAAAAGCG
+GCATCAACGCAGATAAAAACCGAAGCCGACCTGAAAACCTATGTTCAATCCAAAGAATTC
+ATGGATTTCTCTGAAGGTTGGACGAAAGGCAGCACCATGGGGAAAAATCTTGTAGACAAG
+GTAAGCAACGCATTGTCAGGGCTGACTGATATAGGCAAAAGTTTTGACATGGGGCAATTC
+GGTACAAGTCAAAACCCGCTATATGTCACATCTAACGATAAGCTTAAGGTGGACATGTCG
+GATGAAGACTTGAAGTATTTGCGAGATATCGCAGAAAGAGAATACATTGCCAAATTCAGC
+ACCGCAACGCTTGCACCTAACATCAGTATATCCTTTGGAGATGTACACGAAACAGCGGAT
+GCCAATAAGATAGCGGGAAGAATTAGAAAAATACTCCAGGAAGAAATCGCTATGGCGGCA
+GAGGGGGCATATGCATGAGTTATGCAGTGTTTTTCGATAAAGATGGTGTGACATACCGTC
+TGCCTGTTAATCCGGAACAAATCGAAGTTATATCAAATCAAGCAATTGAAAAATATGAAA
+TATTAAAACTTGGACAAATTGCTGTGCCAACACATATGGAATTAACCGAATATAGTTTTG
+AGTGCGAACTCCCATTCAAACCTTTACATTATATAGAAACAGCTGGCGATTTCAAGAATG
+CGGATTTCTACCTTAACCTTTTTAAAGCATGGAGAGAAAAGAAAGAGCCGGTACGCTTCA
+TTGCTTCAAACGGTATCGGCGATGATATCAACTCGTTAGTACTTATTGAAGAATTAACTA
+TCACTGAAAAAGCAGGAGAAGAAGGAGATAAATATGTATCTTTTCGTTTAGTAGAATATC
+GGCCATACGGAAAGAAAACTGTTGTGATCCCGACACCAACCCAAACAATAGTCAAAAAAG
+ATGAACCGGTTCCAGCGGTGTCGCTAAAAGCGAATGATTACCATGTAGTACAACCTGGAG
+ATACCCTTTGGGGCATCGCAAAAAAGTACTATGGAAACGGTAATCAATATCAGAAAATTT
+ACGAGGCAAATAAAAATCAAATCAAAAATCCTAATCTCATATATCCCGGGCAGAAGTTGG
+TGATACCGAGATGAATATGGAATTTGCGGTTGAAACAGATGGGAAGATATATGAAATCAG
+CGAGCTTGTTACTTCCGTATCTTATACAGATAAACTTAACGATGGATGTAGCAAGCTCGA
+ATTCTCATATATTGATGACGATTTAAAAATACATAACGGCAGCGTAGTGCGGTTTAGATA
+TGATAATGAAAACGTGTTTTATGGGTATGTTTTTAAGCATGGTCAGAATAAAGCCAAAGA
+GATCAGCGTAACCGCATATGACCAACTCCGCTATTGCAAGGCCAAGGATACGATTGTGGT
+CAAAAATGACACTGTAGATAGCCTCGTAAAGAAAATGTGTAACTATTTTAACCTGAAAGC
+TGGTATACTCACCAATACTGGCTACAAACTGCCTGTAAGCGTTCAGGACGACAAGACCTG
+GCTGGATATAATTTATACCGCCATAAGCGACACACTGATGAATACAGGCAGATGGTACTG
+CCTGCGCGATGAGTTCGGCAACATAGCAGTCAGAGATCTCCAGGAGCTGCAGCTCGATCT
+TATTCTTGGCGATGAGAGCCTGGCTTATGATTATGAATACGAGAAATCCATTGATGATGA
+GTTCTACAATCAAATTAAAATTGTAAGCGACAATGAAAAAACAGGCAAAAGAGATGTATA
+TATAACCAAGGATAGCAGCTCAATACAAAAATATGGGCTGCTACAATATTTTGAGGTACT
+TGATAAAAACTACAATCCTTCACAGGCCAAGGCAAAAGCTGATGCACTCCTGCGGCTATA
+TAATAGGGAAGTTGAAACTTTGGAGTTAGAGTGCCTTGGTGACGTGAGAGTAAGAGCGGG
+GAGCAGTTTTTACGGGCGGATTGAAGATATACAGTTGAATAAACGGCTAATCGTAAAGTC
+AGTTGCTCATGAGTTTATCCCTGTGCACACAATGAAGTTGGAAGTGATGATATGATTAAC
+GAAATTAAAGCTATAATCCAAAACTACCTCAATAATGCTAAACTATGCCGGCTTGTGGTG
+GGCACAGTGACCAATGACGGCATCAAGGTAAGTGATAAACTCACTATTCCATATGAGCTC
+ATAGTGGGTAATCTCAAAAAGAATTTGATTGCTGGCCAGAAAGTGCGGCTGCTCCAAAAT
+CACGGTGGCCAGCAGTTCTATATCCTGGAGGTGATCTCCGAATGATACCCAACGCTTCTA
+TAAATATTGAATTAGGCTCTGCAGAAAGTATAGAAACAAGCCGGACATATAAACTATCCG
+GAGATAAAATCCAGGGCTATGTAGATGGGTTGGAGGCTCTCAAACAAGCTATATATAAGG
+TGCTCAACACAGAGCGATATGAGTACCCGATATATAGCTTTAATTATGGGATTGAACTTG
+AAAGTTTAATAGGCAAAGATCCCATATATGTTCAAATTGAGTTGAAACGCAGAATTCGAG
+AGTGCCTTCTAAGAGATGATAGGATTACCGATGTCGATAATTTCAAGTTTGAAGTAAACG
+GTGATGAAATAAAATGCACGTTTGATGTTCATAGCATATTCGGCAATTTCACAGCCTCCC
+GGGAGGTGATTTTTTAATGTTTGAAGATAAGACTTATGAAAATATATTGAACGATATGCT
+AAGCAGGGTATCAAATGATGTAGACAAAAGAGAAGGTTCTATTATTTATGATGCTCTAGC
+TCCAATTGCTTATAAATTAGCCGAAACATACTTCCAATTAAATAATTATGTTGATTTATT
+TTTTGCAGACACTGCAGTAGGAGAGTTTCTGGAGCGAAGGACTGCTGAATCAGGAGTGGA
+ACGGCGACCTGCTACAAAGGCAATAAGGAAAATTGTTACAACAAGGCCTGTAGATGTTGG
+CACAAGATGGGGATTAGAAGATACAACATATGTTATTATAGAAAAGATATCTGATACAGA
+GTATAGGGCCGAATGTGAGCAGTATGGCACTATAGGAAATTTATATTCGGGCGCTCTTGA
+TAACATAGATAATATATCTGATGTATCTGCTGAACTAACAGATGTTCTCATTCTCGGCGA
+AGACGAGGAAACAGATGAAGAACTGTATCAACGTTACTTAGAGGAAATCAATGCCATACG
+ATACGGTGGTAATGTGGACCAATATCGTGAGTGGATCAGTGCTATCCCTGGTGTTGGACG
+CTTTAAAATCCAACCGTTATGGAACGGCCGCGGTACTGTTCGAGCGATTATAACAGATGC
+AAATAATCAAGTGCCTAGCCAGGAGCTTATTGACCTTGTACAAAATACATTAGATCCATA
+TCAGGATGGTATGGGGACCGGCCTTGTACCGATTGGACATGTGTTTACGGCCATGGGGGC
+TATCCCGAAGGTCGTGAACGTCACCATGACTGTAGTGTTCGAGGAAGGTTATGGCCCGGC
+TGATATACAGCAAGATGCCGAACGGATTATCACCGAATACTTCTCCGAAATCAACTTCGA
+GGACCAGAAATTTGTGCCGACCACGGTCCGGCACGCCGTCCTCCTGAGCCGTCTGATCAA
+TATTCCGATGGTTCGGGATATCCTGGTGCTAACGCTGAACGGTATAGATGGTAATATCAC
+GCTTGCGCCTGATGAAGTTGCCAGCCTCGGGACGGTGACGATAAATGCTGATTAAGTGGC
+TTGAGGAAGAAGCTGATTACCTTGCATATTTGCCTCCTGTTCTACAAAACATTAGAGAAT
+TTCAGGAGTTAGCGAAAGCAGTTAATCCTGAAATTATCGCACTAAAAAAAGCTATAAACA
+AGGTCCTAAACGAACAGTTTATCCAGAGTGCAGAGGATACGCTACAATGGAGGGAAAAGG
+AATTCAATATCACGGCCAGCAGCGATGAAACGATAGAATTCCGACGTGAACGATTGATTG
+AACGTAAAAGTCGAAAGCCACCTATTACGTTGCGTTCGCTGCGCAATCGACTGAACGCCT
+ATATCGGCACAACACAGGCAGAAATTGAACTAGTACCAGGGGAATATGCTTTCTCTATCT
+CTATACCAGCAGTAGATGGGTACAAATTCCGTGATATACAGAGGCTTGTTGAAGAATTGA
+AGCCCGCCAACATGGAATATCTGCAATTCCCGTTTTCAGTTGAGAGGATTCGGATCAAAG
+AAGAAAGTAGAGAAATTAAGATATTTTACGCAAGAGCTGGTCTGGCTATAGCAGGGAGAA
+CAAGAATTGGGACTACATTATCCGAGCGTGTAGTCTATAGAAGGTAGGTGATTTGATTGG
+CAGTATCTACATTTTACAAAAGTCAGTTGGTAGAAACAACCGATGCACTACTGACTAAAG
+CGCTGGTGAACGAAACTATCGAAGTGACGCAATTAAACATCACGAAGTATGCAGACAGCA
+TTACGGTTGAGATGGCTCTTCCACCCGATCTAATCGTTACGAGAATTGATTTTTTGGACA
+GCGAAGACAATATCATTACTTCAATAACAGGCATTGAGATAGATACGGCAGTAACTACGA
+TATTCAGCCACAACATCCAGTTTGTACAAGGAGGTGCATAAAGGTGCCTTTTCAGAAAAA
+AGTCTGGCAGTTTAACGACATAATCACAGAAGGCGAATTGAATCGCATGGAACAAGGTAT
+TGAAGATTCTATAACTGCCGCGAATCAAGCTGAAGTAAATGCAAAGGCTTATACTGACCA
+AGAAGTAGGTGAAGTTGCCCAAGAACTTGCTGCACATAAGGCGGAAAGTACGCAGAACGC
+TCATTTGGCGAAAAACATCGGGATTGAAGACGCTGCGGGTAACTTCACAGCGACCGACGT
+GGAAGGGGCACTGGCCGAGCTTTTTACGTCTGTCAGTAATGGTAAGACTCTTATCGCTGG
+GGCCATTACTGACAAAGGAGTGCCGACCAATCCCAGCGATACATTCCAGCAAATGGCAAC
+AAATATTCAAGCAATTCCTGTTGGAGATTATGCTGTAGGGGGTACAATCCGTGATTCTGT
+CTTGCGTTTTTTGCCGGGCGGTATGGGTGTAGAAATCTGGTCGAAGACGGACGTGGCGAG
+AGGGCAGGGCATCGCCGTAGACAGTGCAGGAAACGTATATGTCGCTCACTCTGTGGGCAG
+CGGCGGAAAAGCCGTACGAAAGTTGGATTCAGCAGGAAACGAAATCTGGTCGAAGACGGA
+CGTGGCGTATGGGCAGGGCATCGCCGTAGACAGTGTAGGAAACGTATATGTCACTCATTT
+TGTGAGCAGCAGCGAAAAAGCCGTACGGAAGCTGGACCCGAACGGAAACGAGATCTGGTC
+GAAGACGGACGTGGCGTATGGGTGGGGCATTGCCGTAGACAGTGCAGGAAACGTATATGT
+CGCTCACTCTGTGGGCAGCGGCGGAAAAGCCGTACGAAAGTTGGATTCAGCAGGAAACGA
+AATCTGGTCGAAGACGGACGTGGCGAATGGGCGGTACATCGCCGTAGACAGTGCAGGAAA
+CGTATATGTCGCTCACAATGTGAGCAGCGGAAAAACCGTACGAAAGTTGGATTCAGCAGG
+AAACGAAATCTGGTCGAAGACGGACGTGGCGTATGGGTGGGGCATTGCCGTAGACAGTGC
+AGGAAACGTATATGTCGCTCACAATGTGAGCAGCGGAAAAACCGTACGAAAGTTGGATTC
+AGCAGGAAACGAAATCTGGTCGAAGACGGACGTGGCGTATGGGCAGGGCATCGCCGTAGA
+CAGTGTAGGAAACGTATATGTCACTCATTTTGTGAGCAGCAGCGAAAAAGCCGTACGGAA
+GCTGGACCCGAACGGAAACGAGATCTGGTCGAAGACGGACGTGGCGAGAGGGCAGGGCAT
+CGCCGTAGACAGTGTAGGAAACGTATATGTCACTCACGATGTGAGCAGCGGCGAAAAAGC
+CGTACGAAAGCTGGATGGGAACAGATATTTTCAAATAGTGGGGTGATATCATGATATTTG
+TAGGAAATTTTATACAAGATGAAAAAGGAAAAGGGTTAAGGATTGGCTTTGTGCATTATA
+GGCCCTTTGACGAAACGGTAGGGATGAATCTACCCGAAGAAACAATACGCCAAATGGGAG
+CTTTAGTCGATGAAATCCCCGAACCAGAGCAAAGAGAAGGCAAAATCCCAGTGATGTATT
+ACAATCCTGAAACGAACACTGTTTATTATGAATATGAGGACAAGCCATTGTCGCTCGAGG
+AGGAAATTAAATATCTCAAGGAATTGAATGCAGAGTTGATATATCAATTAATGATGAAAG
+GAGCGTTGTAAATGGATTGGTTCAAGACAATCAAATGGTTTTACGACAGCCAATTGTGGA
+CAAAAGAACAAGTTGCAGATGCAGTGCAGTACGGGAAAATTACAGCGGAACAGTATCAGA
+AAATCACGAGTGAGGAATATAACGAAATAGAAAGCACCAATTAAGGTGTATTTTTTATTG
+CCTTTTTTTGAGGACTTACCTTTTAAGGTAGGTCCTCTATTAATTGTTTTTTAGAAAGGC
+GGTTGGTTTATTATGAGTGAAGAGTTCAACAACAAAGAAATCATAAAAATGATGATGGAC
+TTTAAATCAGACATTAAAGGTCTGCAAGCTGAAATTCAGGAAACAAAAAACTTGCTGAGG
+AATTACAATGGTTTGCGTGAAAAAATGATGTCCTTTGAAATTGAGCTGGCAACTTTCAAA
+AAGGAAATTTTGACTCTCAATGAATGCAAAAAAGAGCAAAAATCCGACTGGAGATGGGTT
+GCTGGTTGGATTGTTGCTGTCGGAAGCCTGACCGTATCAATTATTGCTAATTTCTTCAAA
+TAAAGGGGGATGAGCACATTGGTACCGTACATAGTCGACCACATACCCAAAACAACACCT
+TACAACCGTCGCCCCGGATATTCCATGACGCCGGAATATATCACAATACATTCTACCGGC
+AATCCGACCAGCACGGCAAGGAACGAACGAGCGTGGTTAACTAACCCGAATAACAATGTC
+ACGGCCAGCTGGCATATTGTAGTGGACGAAAAAGAGGCAATTGAAGCCATACCTCTAAAC
+GAGGTCGCATGGCATGCCGGGGACGGGGGGAACGGGACGGGAAACAGAAAAAGCATTGGT
+ATTGAAATATGCGAAAGCGGAGACAGGCAAAAGACTTTGCAGAATGCTGCGGAACTGGTT
+GCAAAGCTGCTGAAAGAGCGCGGCTGGGGAGTGGACAAGCTCCGTAGGCACTATGACTGG
+AGTGGTAAAATATGCCCTCGGATTTTCCATGATAACGGCAAGTGGACAGGGTGGAAACAG
+TTTAAGGAAGCTGTTCAAAAGGAACTTTTCGGAGGTGATAACATGACACAGGATAAAAAT
+CAGCCTTCCGACTGGGCAAAGGAAGCGTGGGAATGGGCAAAGCAGCAAGGTCTATTGGAT
+GGTACAAGACCAAAAGACAATCTTACCAGGCAAGAATTAGCGGTTGTATTAAAAAGGTTG
+GCTGAGAAAAAATGAAATTTTCAAAGGTAATCGTATCATTATGCTAATACAAAAGTAATT
+ATTGCCGAAAGAGCGGCACAGGAAGCGGAGAACAAACTAAAACGGTATGAAGAATTTTTC
+AGAACATTCAGAGGGTTCTTGGGAGGTGTGTGAAATGAACGATTTTTTCACTCCTGAATT
+CCTGGCCACATTCGCTGGGCTAACAACCGCAGTTGCTCTTATCGTGCAGTTTACGAAGTC
+TATAGTAAAACGTCAATTTGGCGATGCAAGCGTGAGAATATATGCATTTGTGATAGCACT
+AATATTGACGTTCATATTCGCACCGGCAGGATGGGGAGTACAGGGAATAGTGCTCACAAT
+TATAAACGCAATATTGGTTACATTAGCCGCAGTAGGAGGGTATGAGATTATAGCGGATCC
+CAAAGCGACAAAGCAGTTCCCCGAGGGGCAGTGATGCCCCTCTTTTTTTGTCTCTGGAAT
+GTTTGATACTGTGTTTTATGCACAATCTGCTTACATAAAGCATATATTGTATGCATGTAC
+CTTACCTACCACTATATGTAGTGTGTTGATTTTGGAAATATAAAATGGGATAATAAAAAG
+GGGAAGAATGGAAAAGGGGGATAAAAGTTGGAGAGAACAAAAGAATTAATTTGTTATTTT
+CTGGCTAATTCGCTACATCCTTTAAACAAAACAGAAATAGTGAAAATGTTATATTTATTC
+GAATATTATCATGTTCAAACTTTTGGAGAGCAGTATGCTGAGTTAACATTTATTAGGTAT
+AATTATGGGCCTTACGCGCAGGCTATTGAGATAGCTCTTGATGATTTAATGAACGATGGT
+TTAATCAAGAGAGAGATTGTTGAATATACAGACAGATGTATATATTTGCATACACTTTGT
+GATACTGGGAAAACCTACACGGATTTATTGAATGAGGAAAAGAAATTAATAGCTGATAGA
+GTTATTGGAGAATTGTCTAATAAAAACTACGATGATATGATCAAACACGTATATTCTACA
+CCCCCGATGAGAAGAATTTTAATTAAGGAAGAAAGGTGCGGTTTTACGTTGGTCGGGGAG
+GTGTTAAACATGAAAGAAAGTAAACCGCTTAGAAAGTTCAGTAAGGCAAAAATAGAAGAA
+GCAAGGAAAAGACTTGATAAATCATCTCGAGGTTCAGATGAAGAATATTATGCACACCTG
+TTAGCAGTAAATGAAGAACTTAAGATATTAAGAAGGAGGGCCAATAGTTGTATTCTGAAG
+TAAAACCTCTTTCTAGAGAAGAGCTAATAGACGAAAGGTGTTTTGAAATTGGAGAGATAT
+ACTATATAAACGATTCGTTGATAAACATTCCTAACGTAGATAGACTAAAAGATGGTTCAC
+GAAAGATACATGAGGGGAGAATGGTTGTAATTGTTCATCATAACGAACAAAACTACAATA
+AATTTTGTCCAGTAGTTGCAGTTACACCTTTATCAAGTCGTGTAGATTTGAAAAGGCCAT
+TTGATTTAATATTAAAGAAAGATGATGTAGATGGTAATTTAAGATATGACAGCATAATAC
+AACTCCAATTAATTCAACCCGTGTTGAAAGTAGATTTAGAAAGGTGTATAGGCAGATTGA
+AAGAATATAAAATTGAAGAATTGATTGCAATGCAACTCGAAATGATTGGAATAGAGTAAT
+AAACGAAAAAAAGAGCGGCAACCCCACCCGAGCGGTTAGCCGCTCTTTTTTGCAAACATT
+TTGCTAACGTAGCAAACCAAAAATGATGTGAAAAGGTAAAAAAGAATAACAATATTAACA
+CTGAAAAACGTTGATTTTTCGGCATTTTTACGAAATGGGTATAAATGACTGATAGAGGGT
+AAAAATACTTTTATGGGTTTCCTAAACCGCAGGTCAGGGGTTCGAATCCCTTTGGGCACA
+CCAGAAAAGCCGTTAACCATTCAGGTTGATGGCTTTTCTAATTTTTAACTCTAATTTTTA
+ACGGCCTTTGCTAATAATGCTTCCGGACGGAATGTAGGAACAACGACTTATCAGATAATA
+AGGGAGAACAATGTTATCTGAATTGTGGATCGGTATTGAATGTTTTCGGAAAACAATGGG
+TTTGACAATGAGCATTTTATTGGTTATAATTTTATTCGCAATGTTTGGTAGTTGTTTTGC
+TTTATACCTGTTTTATTAATCGGAGGATTGGACGCAAGTTGGAATTTGAAGCAGGGTCAC
+ATCATTGGTTTATGAGAGAGGCCCTGAAAGAGGCCTACAAGGCATATGGCAAGAACGAGA
+CGCCCATAGGGGCGGTGATGGTTAAGGATGGTTCAATAATTGCCAGGGGACATAATCAAA
+AGGAACTTACGAATGACCCCACCAATCATGCTGAGATGGCTGTAATCAGGGAAGCATGTG
+CAAAACTCGGCACGTGGAGACTTAACGACTGTGATTTGTATGTTACATTGGAGCCTTGCA
+CAATGTGTGCCGGTGCAATTATTCAGGCCCGGGTTGGAAGGCTTTTTATAGGCTCTCTTG
+ATCCTAAAGCAGGAGCGGCCGGTTCGGTAATAGATGTGCTGAAGGTTGATGCTTTTAACC
+ATAGGGTTGAAGTGACATATGGAATATTGCAGGAAGAATGTTCTGAGATTTTGAAAAATT
+TTTTCAAGGAACTTAGAAAAAGAAAGTCAAATCGGAAGATATGATTTTTAAGTTGATTTG
+ATGAAGTTTTTTGGGGATTATTGAAATTTGAAGGAATAGGATTTTAATATTAAAATATAA
+GTATAAAATATTATATTTATTAAAATACGGAGACGTATCGAAGTGGTCATAACGAGCCTG
+ACTCGAAATCAGGTTGTCGCGCAAGCGGCACGTGAGTTCGAATCTCACCGTCTCCGCCAC
+GAACCTGTTTGCGGGAAATATCCGCAGACAGGTTCTTTATTTTATGTTAAAGATTGAAGA
+AACAGTCTGGCAGTATGTAAAAGTTCCGGAAGGACAGGAAATTGGACAGGTGGAAATCTT
+GTTTGAACGGATTGACAAAAAAGTTGTACAGGAAGAAGAGTCACACCTCCTTAATATGAA
+ACATAGAATGATACAAAACAAGAAATAATGCCATAAAAGCCGGAAAGGAATGGGGAAGAG
+TGTATAATACGAACAACAAATGGCCATATCCTTGTTTTTCAAACGCGCCATTATATACTT
+CACATAGTATGCCACACGGTATGTACGGTGATAAAGTGTACCAGTGCCCGTATTTTCTGA
+ATATTCCAATGTATAACTTCAGCCTTTGCAGCCCGTTTTTGCCTCAGTATGGTCCTTGTA
+CGGAGAAGGCGAAGCCTTGCGATGTGATTAAATTGAAGGACTATGGTCCAGAGCCTTTTG
+TAGTAAATATTGAAGAAGCTGCAAAGCAAAACGACAATTTTCGCACGGCTTTGTGGACAG
+GAGAGCATTTGCAGCTTACATTAATGAGTATAAATGTCGGGGAAGACATAGGCCTCGAAA
+TGCATCCTGACGTCGATCAATTCATACGTATAGAAGAAGGCCGCGGACTTGTTAAAATGG
+GCGACAGCAAAGATAATCTGGATTTTCAAAGAAATGTGCATGAAGACTGTATAATTATCA
+TTCCTGCGGGGAAATGGCATAATCTGATAAACACAGGTAACAAACCGATAAAATTGTATT
+CCATTTATGCGCCGCCGAACCATCCTCACGGTACGGTTCATGTTACTAAAAAGGATGCCG
+GTGAGTAA
+>NC_009012.1|provirus_3339258_3389049
+GTGAGCGACCATATCGCCAAGCGTGATGGAACAAAAATTTTAATTGAAATCAACACCGCA
+GATGCCACAGAAGAGGACATAAAGAATCTCTACGACCTTCTTTCCAAGCTGTTTGACGAA
+ACAAAAGAGAATTACTCACCAATGGTTCATTACATGGTTGGAGAGATATTAGAGCCTGTG
+ATGATGAAGATGGCAAGCCTCATGAAACCAAAGAAGCCGGGTGTGAAGGCAGGTGAGTAA
+GAAAAAGTATATTGTACGCTGCCCTCATTGCAATCATGGAATGTTTGATGCCGATTATGC
+TGATGTTGAAATCAAATGCCCGGTATGCAGAAAGGTTTTTGAAGTAAAGCTGGAGAAAAA
+GGCGGGGTAAAAAGTGAATAAATCTGGCCCAGAGCCACAAAGGGAGCGAATGACTCACCT
+ATAGAGCCTGGCAGATAGTCTTAAAAACTATTTGTCAGGCTCTATTTATGTTCTCGGAGG
+AGGTGAGAATTTGAAAGTGACAATGATGGACGCAGCATTAAAATACGCAGAAGCAAATAT
+CCCAGTCATACCATTGCATTGGATTTGTGAGGATGGCTCCTGCTCCTGCAAGGAAGGGAG
+TAATTGTGACAGCAAAGGAAAGCATCCGTTATATACCGGCTGGTACAAGAATTCCACTGC
+TTATGTTGAGCAAATAAGGAAATGGTGGACGAAAACCCCCAATGCCAATATAGGCATTCC
+TACAGGCGAGAAGTCTGACTGGCTGGTACTTGATGTGGATGATGGCGGTGATGAAACCAT
+ATCTGCACTTGAAGCAACACATGGAAAACTCCCGGATACGGTTACTGCTGTTACAGGAAG
+TGGAGGTTGGCACTATGTCTTTAAATACCCTAAAGGCCGGAGTATCCCAAATAAGACCAA
+GTTTGCATCGGGTCTTGATACGCGTTCAACAGGTGGACTGATTGTCGTGGCTCCAAGCAT
+TCATGTAAGCGGTAATCAGTACCAATGGTTAGAAGGACATTCTCCCTTTGACAGAACCCT
+GGCAGAAGCTCCGGAGTGGCTATTAAAGCTTATGGAAAGGGAGGAAGTATTGCTTACACC
+CTTTGAAGGTAGCAGTATTATAGTCGAGATTAAGGAAGGAAACCGCAACAGTACCCTGAC
+AAGCCTTGCAGGAACCATGAGAGCAAGAGGAATGACGGAGGAAGGCATCTATACGGCATT
+ACTTGCAGAAAACAACGCAAGGTGCAATCCTACGCTTGATGAAGCGGAAGTTAAGAAAAT
+ATATAGTTTAGATTTTCAAAGAGTTAGTAACTTGTAAAGAATTATAATATATACGCACAA
+AGCCGCTTGATTTTTGCAGAGGATCTTTGTACAGTCATAAAGTATTTACATATTGCCTGA
+ACAATTCAGCTTTCAGGAGATAAGGAATATACATGTTGGATTTTTCTGGCTGTGGGTTAT
+TGCAGCGGTGTCTGCAGTATTAATTGCGGCAATAGTTGCTGCTGTGATTCATAATATAAG
+AAAAAGGAGAAAAGAAGAGGAGGAAAACGAGCTGGCGGCGGCTTGATTTGTAAAATAGGT
+ACGTTCTACTTGCTTTTTCAGAATAGAAATAATATAATAATGCCAGGAAAAGGCAGAAAA
+GTTTCCTGGCATTATTATAATGCAACCACGGATTGCAAGCATTGGGATGATAATTTTGAG
+GTGATAAAATGGCAACTATAACGTTATATGCCGGAAAAATCAACCAAATGCCCGGATTGA
+TAAATGAAGTCAAGAAATCTGTGGTGGATTACAAGTCAGAATTATCCGCATTGAGAAAGA
+AAACTTTGAACATCAACAGAAGTGTATGCAATTTGGATGAAGTAATAAGTTCCATACAGG
+CATCTTCCCAGACTCAGGATAGAAAAATTGATTCACTTGAGAAATTCTGCAGTGAAAGTG
+AGAAGTTTATATCGGAAGTAATACGTATCGATGAAGAAGTTGCTGAGCTTATCAATAAAC
+GGAAAGAAAATTTTTACAAAGAATATTATTATTTAAAACCGGAAAGCGAGAAAAGCGGCT
+GGGAAAAAATCAAGGACGGCTTAAAGTCGGTTGCGGAGTGGTGTAAAGAGAATTGGAAAT
+CCATTGCCAAGATAGTGGCTGCCGCAGTAGTTATTACCGGGTTAGGGATAGCGGCGGCAT
+TGACAGGAGGGGTATTGGGAGTCATACTGGCAGGAGCATTCTGGGGAGCATTGGCCGGAG
+GATTGATAGGAGGAGCGGTTGGAGGAATAGCCGCGGCGATAAATGGAGGATCGTTTCTGG
+AAGGATTTGCGGACGGGGCATTAAGCGGAGCGATTTCCGGAGCGGTAACGGGAGCCGCAT
+GTGCCGGGCTGGGTGCTTTGGGAGCAGCGGCAGGAAAAGGAATCCAATGTATGAGCACAG
+TGGGAAAAGCGATAAATGTTACATCAAAGGTTACGGCAGCACTCTCGTTTGGTATGGATG
+GATTTGACATGCTGGCAATGGGAGTATCATTGTTTGATCCATCCAACGCATTGGTTGAAT
+TTAACCGGAAGCTGCATTCCAATGCACTTTATAACGGATTCCAGATTGCTGTAAACGCGC
+TGGCTGTTTTCAGTGCCGGGGCGGCATCGACAATGAAGTGCTTTGTTGCAGGTACAATGA
+TATTGACAGCGGCAGGTTTGGTTGCGATAGAGAATATCAAGGCAGGAGACAAGGTAATTG
+CGACGAATCCGGAGACTTTTGAAGTAGCGGAAAAGACGGTGCTTGAGACATATGTGAGAG
+AGACAACGGAGCTTTTGCATTTGACAATCAATGGAGAGGTAATCAAGACAACCTTTGAGC
+ATCCGTTTTATGTAAAAGATGTGGGTTTTGTTGAAGCGGGAAAACTGCAAGTAGGAGATA
+AGTTGGTTGATTCAAAAGGCAATGTTTTGGTGGTGGAAGAGAAAAAGCTTGAGATAACAG
+ATGAACCTGTTAAGGTTTATAACTTCAAAGTGGATGATTTTCATACTTATCATGTTGGGA
+AAAAAGGGATATTGGTACATAATGCAGACTATAACCCCAAAATGGGATTTGATGATTTGG
+ACCTTGAGAAAGCTACGAACAAACAAAAAGGCAATTATGGAGAGTATCTGGCAGATGATA
+ATCTTATTAATAATCCAAAATTGAAAGAAGCAGGGTATGATTTGGAGCGGATAGGAGGTA
+AGGTTCCGACCTCACCGGATGATAAAATTACAAAAGGGATAGATGGGATATATATAAATA
+AGAATCCTGACTCAAATGTTAAATATGTAATTGATGAGGCGAAATTTGGAAAAGCGGGAC
+TTAGTACAAAGACAAGAGATGGAAAACAAATGTCGGATTCTTGGCTGATAGGTGATAAAA
+CAGGTAATGATAGAATTTTAGAAGCAGTGAATAATGATAAACAATTAGCAGCTGGTATAC
+TCGATGCATTACAAAACAACCAAGTAGAAAGAGTGTTGTCAAAAGTGGATGCAAACGGAA
+ATGTAACGACATATAGACTGGATAGTGATGGTAATATAATTGGAGTTTGGCCATAAATAA
+TTGAAAGGAGGTAATGATATGAGAGATCCATTATGTGATAAAAAAGATTTGATAGAAACG
+ATAGAATTTAACCAAAAGGCTATTTTAAAAATGAAAGAAAAAATTATTAATCTGAAGGCC
+GACATAGAGAATGGTATACAAAGATATCCAAGAGATAATCAAAGTATAATTTATGGTACA
+TTTAAATTAATGTTTATGTATGGAATGAGTACACTGAGAGCAAAATATTCTTTGGGAAAT
+GAGCCGGATGCAATGATAAATGATTATTTAGATAATATAACGTATTTAGAGAATATGGGA
+GAAGAAGAAATAGGATATATTTTTCTTTTATGGATGGTGGGACTGGGTATCCTTTTGGAA
+GTGGATAAAGAAGAATTGAAGAAGTTGGCGAAAGTTATAGAGAGACGAAAAACAGAAGAT
+GCACTTATAGATTTTCTTTTGAAATCCTGTGATATAGGTTGGAACCACAGTACAACGAAA
+TATGAAAAAAAGAACCCGTATGAAAAGACAGCAGAGATTATAAAAATAGCATTGCACGAC
+AAAGACAAGGAAGCGGCATCTAAAAGGCTTGAAAAATATATGGAAAAAGAATGGTTCAAG
+GGGCACTATGACTTTGAATGGAGGAATGCGCACAAGAGGCCGGGGTATTATGGTTTTTGG
+AGTTTTGATACAGCGGCACTGGCCAAGATACTGGGACTGGATGACAGTGCACTGAAAAAC
+AACAACCATTATCCTTATGATTTGGCACACTATAAGAAGGGAATGACCTTTGATTTGAGT
+TGGTATAGTGTACCAAAGGAAGAGGAAGATAAGGAAGAAGAAACGGTGGTATATGGTATA
+CCGGGTAATCCTGAGTTGGAGAGGATAATACCTGGGAAGTTTCACAGTTTTGTAAATGAG
+ATAATAAATGATTATAAAACACTGCCGGACGAAGAATTTTGGAAGAAATACAATTTGAAA
+GAAATCTGGTTTGATGTGGAGGAGTATAAGGAGGATAATAAAGATAAGAATTTGCTAGGA
+ACGATTATAGTATTCATGCTTGTGGACAAAGATTATATTTTGCAGTTGGATTATAAAGAA
+GAGTTAATAGACTATATAGAGAATATACATAATTACTGGGCCAAGAAAGAAGTTAAGCTT
+ATAAGCTTTGAATTAGACAATGACCAGCAGTACTATGCATATGTGCCGAAGGATGCGGAG
+GTTGGTTCGTTGTATGAGGTAAAACTGACAGAAGTGGAGAAAATAGAGGAGGTTTAGTGT
+TTATTGTGTAATAGTGTGAAGAAGATGAGTTGTTTATGAAGAATCTGCTGTATAATTGGA
+TATATATAGTTTGATTTTGGGAATCTCCTTCCTGGCGAAACAAAAACTATAGGACAGTAT
+TTGGGAAGGAGTATTTTTTGTGTTATTTTTTTTGGGGAAGATAATATTGTATTGAGAATA
+ATAAGAAGTTTTATTAGGATTGTTTATGGTTGTCAATGTTAATATAATCAATGTTAATAT
+AATCAATGTTAAAAGGTATAGGAACAGAACCATAGCAGGGGAGAGTCAAAATGTACATTT
+GGCAGTGAAAGATAAGCTGAAAAAAAGAGGGGCGTTCATTTGAATTAATTCCTGAAGATC
+TTGATGTTTATAAAGAAGCATTGGATTTATGGTTGAGTCCAAATTTGGAAGAGGTTAAAA
+GCGTGATTGATAAAATGATATTGTATCATTCCGTATTAGTTTCGGACATTGATAACGAAC
+CGGAATTTGGTGATTACACGTATGGATTTTATCCATATGAGATATTGTTTTTAATGCATA
+TAAGGAGGAAATTAGGTTTGCCGGTACCGGATAAATTTGAAGACTTGCTGATGAACACAC
+CGGAAGCGAAGGTGGTGATTAATGAGCCGGAGCCATATCCGGAGTGGGATCCTTTGTTGA
+GAGCCATAGATGAGTTTTACCGAAAGAATTATCCAAATTACATTCCCAACAAGCATGGAA
+AACTGTTTGAATAGGAGGAAACTGTTATGGCAATGGAAGATATAGTTGGGATTATATTTG
+AAGACATTGAGGAAGTGAAACCAATTTTAAGTGATTCGGAAGGAAATGATTTGGAAGGAA
+ATGATTTGAGTGAGGCGATATTGGAATACGGGATATCGGAAGGGAAGTTTCTGTGTGTTG
+ATTATGGTGGAGAAGAGGGGAGCGAGATAATAAATTATATAATGGATTATGAATTCAGTC
+ATGGAATAGAGCTTGCAACACAGGAGGAGTTGGAAGAGCTGGACGAGATGGAGTATGATG
+ATTTGACAGATAAGATAAAAGAAGTGAACAAGATATTGGAGAAAGCAGGGTATGGACTGT
+TTTGCTTTCCAACAGGAAGTGATTTTTATGCGTTGTTTATAGCGAAGTTGGAGGATAAAG
+AGAAGTTATTGGAGGAAAAGATAGTTGATGATGAGGAGTTGCCATTGGAAGAGAGGTATA
+TTCAGTATTATGTGTAAGGGGATAATCTGCAGTATTTAGAGTTTTGGATAAGAATATGGC
+TTTTATAAAAATATTGGCAGTGTAAATATTTTTGTGTAAACTAATTTTCCTTCTATGTTA
+GTGTTTAAATATATTTTAAGACTCGAAAGTCTGCTTTGTCAAATTTTATAGATTCAAAAG
+AATTTCTGATAAGAAATTCTTACAAAAGAAAAATTTGACAAAGATGATGCGTATAAAATA
+TTACAGGGGGGGTTCAGGAAACCAGAGTTTCCCTGAACCCCTTGATTATACTATATACGC
+CCTTCGAACATAATCTGTAGCTGTCCCAGTATCAAACCCCAGTTTTTGTAACGCATCGTC
+CATTTTGAAGTAATCTTTACTGTAGCTAAATATATGCTCTTTAAAAGTGACTGGTCGCCA
+GGAAATACTGTCCTTGATTTGTTTATCCTTCTATAACTGCTATTCAGGCTCTCAATAGTA
+TTGGTCGTATACATGATTTTACGTAGTTCCTCCGAATACTTAAAAAATGGACAAATAACA
+TCCCAATTGCTCTTCCAGCTCTTCATAGCTGCCGGGTATTTCTTCTCCCATTTCTCTGAA
+ACCTCAAGCATCTGGTCGTACCCTGCCTTCTCATTCGGAGCCGTATATATCCGTTTCAAG
+TCCCTGGCAAATTCCTTTCGGCCTTTATCTGACACATACTTTAGCGTGTTTCTTATCTGG
+TGTGTTAATGTCAATCAAAATTTAGGCCACTTACCGGGGTAAAATTAGGCCACCATTTCA
+TAAAAAATCAGTCATTATTTGCCTGCTTGGAAAGAGCCTGCTTAAACCTGTAGCTTTCAC
+CATTGATGTTCAGAATGTGCGCATTATGGGTCAAGCGGTCAAGCAGGGCGGCTGTCATTT
+GCTCATCGCCTAACACCTCCGTCCATCTTGGAAATTCTAAGTTTGTAGTTATGATCAGGC
+TGCCCCTCTCATATCGGGAAGAGCAGAACTGGAACAACAATTCTGCTCCGATTTTACTGA
+AAGGCACATAGCCTAATTCATCAAGGATCACTAAATGCGGCGCCAGCCATTGCTTTTCAA
+GCTTATTAAGACGATATTCCTGCTGTGCTGCAAGCAATTCATTTATCAAACCAGCTGCCG
+TATAGAATTTGACCTTCATACCCTGCCGACAAGCCTCGTAACCGAGCGCAGTTGCAATAT
+GGGTTTTCCCTACTCCGGAGTTGCCTATCAAAATGACATTTTCTCTTCTTCGGATATATT
+CTCCCTGCATGAGTTTCAATACCCGCGGTTTGTTCAAAGAAGGTATGGCAAGGAAGTCAA
+AGCTTTCAATCGTTTTGATAACAGGAAAGCCTGCTTGCCGGATCCCTCTCTGGATCCGGT
+TATTCTCCCGCTGATGTACTTCCTGTTCCAGCACACACAGCAGGTATTCTTCATAATCCA
+GATTATTGTCTGCGGCTTCTCTTGCCAGGGATTCATAGGTTTTTGCCACCTGTGGCATCT
+TTAGCTTCTTCATGTAAGTTTCGATAAGCATTTTATTGACCGGCATTATTGTCCACCTCC
+TGACATGAGAGCGCTGTATTTGCTGAGATCAGGAGGTATTACAACAACCTCGGGGATGCC
+CTGAAGCTTGTCTTTGCTGACAGGAGCCGTCTTAGGACTGCCTGAGACCAGTAGCTGTCC
+TAATATGTTAAATACACCGTCATAACTGTATACATTGTATGCCATAGCTATTTCAATAGC
+TTCTGTCACCAGTGCCGTAGGGTAATCCCTGTGCAGCATGAGTATTTTTACGAATTCCCT
+GTTGCCTCTCGGACTTCTGGCATTTAAGCTTCGACGATACTGCTCATAAACGGGTGCCAG
+CATCTGAGGTTTATATACTTTTGTGTTGCCCAGGGCGCGTGATTTTTGCAGCAGCAATTC
+CAGATAGTGATCAAGCTTTATCTGCTCCTGGTAGCGTCCGTATATCCTTGGATGGCTTGC
+TATCATTGTTCCTTTGTTTAGTATTTTTACTTCATCCGCAGTAGCTTTAACAGTGACTTT
+CTCTCCCACATATATCGTGGGAACAGAGTATCGGTTAGTTTCAAACTGTACCATAGAATA
+GCGGTTGACCTTTGCCTCTTTATACCTCGCACCATCAAACCTTACCGCCGGTAATGGCCT
+CAAAGCTGCCCTTTCCGCTTCCCATTTCGGATTGCTTTCCAAAAGCTTTATGCATTCGTT
+GTGCAGATATTCATTCAACTCCTCAAATGAATCAACCTCGGGGTAGGGAACGAAGAACCT
+TCGCACAGCCTCTTTGCCCGCATTCTCTACACCACCTTTATCGCTCCCTTTTGCCGGCCG
+GCAGAATGAAGATTCATAAAGGTAATGGGTTCGTAAAGCGATAAACTGCTCCTGCTCTTC
+TCTGTTGCTGCCTTCGAGTATCTTCTTCACTGCCGTTTTCAGATTGTCGTATGCTATCTT
+GTATGGTACACCGTTCATGAACTCAAAGCATTTGATATGGCCATCAAAGAACGCCTCCTG
+TTTCTCAAAAGGGTATGCTCTTACGTAGAATCCGCCTGATCCTCTCAACTTCATTACAAA
+CAAATGTGCCTTGGTTTCTTTGCCTTTTAGATAAAAATATGCTTCTGTCCAATCTACTTC
+TGCATATGCTCCCAACTCGAACTCCAGTGGCAGGAAAGCTTCCCTTTGTTTTCGGTATTC
+CTTTCTCAGGTAATCCATTACAGTGTTGTAGCCGCCTGAAAAGCCTTCTTTTTTAAGTGT
+CTCAAATATTTTTGTCCCTGTATGGCGTTGTTTGCGGTGTCTGGTTTTATCATCTTCTAT
+TATCTGTTTGATCATTGGTATGTACGGCCCTAATACCGGATGCGTTCTTTCCTTTGTCAA
+CTTGTACTTAGGTGGTTTTGGTTCCTCCAGCGAAATATATTTTGAGATTGTATCCCTATG
+TATCCCAGTCCTCCTGTTAATTTCCCTGATACTTAAGCCTTCCATGAAGTACATTTTTCT
+GATATCCTCTAATTGAGCCATCTTAATCATATCCTTTCCTCCTGTACGATAGTGTCTGTT
+CAACAAAATCATACAGGAAATTTGATTAAGGTGGCCTATTTTTTTGCCGGTATATGGTAC
+ATTTTTAGAGTAGCATTAACACTGGTGTACTATACACCTCTGATATTCAGTATTCGGAAA
+AGCCGCATTGATTGCATCCTTTATCCCTGAAAGTGCATCAGCACAGAGAATCAGGATGTC
+TTTAACTCCTCTGTTTTTAAGGTCTTTTAAGACACTCAGCCAGAATTTTGAGCTCTCATT
+TTCTCCTACATAAATACCGATAACATCTTTCTGCCCTTCTATATCAATTGCCAGCACAAT
+ATATACGGCCTTCTTCGAAACAATGCCGTCATTTTTTACTGAAAAATGAATTGCGTCAAT
+AAATACTATCGGATAAACCTCTCCCAGAGGCCTTTTCTGCCACTCTTCTATCTGAGGTAG
+TATTTTATCAGTGATCTTACTTACCATCTCGGCAGATACTTCAAATCCGTAGATTTCCTG
+TATCTGCTCATTGATTTCTCTGGTAGACATCCCCCGCGCATACATTGCTATTATTTTATT
+TTCAATTTCTGAAATGTCCCTTTTATACTTGGGAACAATTTTCGGCTCGAATTCTGCATT
+CCGGTCCCGCGGGATATCTATTTCTACTTGCCCTACACTTGACTTTAATGTTTTTGATGT
+GTACCCGTTACGGTAATTTGATTTCGCTTCTTCAGTTGATTCGTACTTTTCATATCCGAG
+ATGTTCATCCAGCTCTGCTTCCAACATATTTTGTATCGTATCTCCGAGCAGATCCTTCAA
+TGCTTCCTGCAAATTCTTTGCTCAAGTGATGTTGTACTCAGAAATGAGATTTCTGATAAG
+CTCTTTCTTTTCTGGTGTTATTATTCTTTTTCTTGCCATAAAAAACTCCTCCTATACTTT
+AGTATTCTATCATAGAAGGAGTCAATTAGTTTACATAAATATTTTACAGTCTCTTAGCTT
+GTAAAGAATTATAATATAATATATATGTACAAAGTCGCTTAATTTTTGCAAAAGATCTTT
+GTATAATCATAAAGTATTTAGATATTGCCTGCACAATTTCAGCTATAGATTCAAACAAGT
+TGTTATGCGTTACATTCATTCGGATGTCTTTCAAAAGGTGATCGATTGAATTCAACTCGG
+AGCTATAAGGAGGCAAATACTTAAGGGTAATGTTCTTTATTGAATCCAATGGGAGTATAA
+ATAATTTCATGTATTAAAAATTTTTCAGTTCTTCCTGGCAAGAAATTTTAAGTTTTCAAA
+GTTTACAGAATGTAAATCCTAAATCACTTCAATATTATATATTATTGCCGGTTTTGCTAA
+GTTTTACACATAAATTTGATTTAATTCGTCTATAATTATTTATAATGGAGTGTTTTGCCC
+TTTTTCGCTCAATTATCAACGAATTGGTTGACGAAAACCGGTGCAAGGTATATGATAACG
+GCAGGGAAATAGATTTCAAATATTACAGTGATAACAATACATTAACTTTTACCCTCGGAA
+AGGGTTGGCACAACGTTGGAATTGTCCTTGTGGATATGGCGGGAAATGTAAACAATATTC
+AGGAGATAAGGAATATACATGTTGGATTTTTCTGGCTGTGGGTTATTGCAGCGGTGTCTG
+CAGTATTAATTGCGGCAATAGTTGCTGCTGTGATTCATAATATAAGAAAAAGGAGAAAAG
+AAGAGGAGGAAAACGAGCTGGCGGCGGCTTGATTTGTAAAATAGGTACGTTCTACTTGCT
+TTTTCAGAATAGAAATAATATAATAATGCCAGGAAAAGGCAGAAAAGTTTCCTGGCATTA
+TTATAATGCAACCACGGATTGCAAGCATTGGGATGATAATTTTGAGGTGATAAAATGGCA
+ACTATAACGTTATATGCCGGAAAAATCAACCAAATACCCGGATTGATAAATGAAGTCAAG
+AAATCTGTGGTGGATTACAAGTCAGAATTATCCGCATTGAGAAAGAAAACTTTGAACATC
+AACAGAAGTGTATGCAATTTGGATGAAGTAATAAGTTCCATACAGGCATCTTCCCAGACT
+CAGGATAGAAAAATTGATTCACTTGAGAAATTCTGCAGTGAAAGTGAGAAGTTTATATCG
+GAAGTAGTACGTATCGATGAAGAAGTTGCTGAGCTTATCAATAAACGGAAAGAAAATTTT
+TACAAAGAATATTATTATTTAAAACCGGAAAGCGAGAAAAGCGGCTGGGAAAAAATCAAG
+GACGGCTTAAAGTCGGTTGCGGAGTGGTGTAAAGAGAATTGGAAATCCATTGCCAAGATA
+GTGGCTGCCGCAGTAGTTATTACCGGGTTAGGGATAGCGGCGGCATTGACAGGAGGGGTA
+TTGGGAGTCATACTGGCAGGAGCATTCTGGGGAGCATTGGCCGGAGGATTGATAGGAGGA
+GCGGTTGGAGGAATAGCCGCGGCGATAAATGGAGGATCGTTTCTGGAAGGATTTGCGGAC
+GGCGCTTTAAGCGGAGCAATTTCCGGAGCGGTGACAGGAGCGGCATGTGCCGGGCTTGGT
+GCTTTAGGAGCTCTAGCAGGGAAAAGCATCCAATGTATGAGCACAGTGGGAAAAGCGATA
+AATGTTACGTCAAAGGTTACGGCAGCACTTTCTTTTGGTATGGATGGATTTGACATGCTG
+GCAATGGGAATATCATTGTTTGATCCATCCAATGCATTGGTTGAATTTAACCGGAAGCTG
+CATTCCAGTGCACTTTACAACGGATTCCAGATTGCTGTAAACGCGCTGGCTGTTTTCAGT
+GCCGGGGCGGCATCGACAATGAAGTGCTTTGTTGCAGGTACAATGATATTGACTGTGGCA
+GGCTTGGTTGCGATAGAGAATATCAAGGCAGGGGACAAGGTAATTGCGACGAATCCGGAG
+ACTTTTGAAGTAGCGGAAAAGACGGTGCTTGAGACATATGTGAGAGAAACAACGGAGCTT
+TTGCATTTGACAATCAATGGAGAGGTAATCAAGACAACCTTTGAGCATCCGTTTTATGTA
+AAAGATGTGGGTTTTGTTGAAGCGGGAAAACTGCAAGTAGGAGATAAGTTGGTTGATTCA
+AGAGGCAATCTTTTGGTGGTGGAAGAGAAAAAGCTTGAAATAACAGATAAGCCTGTAAAG
+GTTTACAATTTTAAGGTCGATAATTTTCATACGTATCATGTTGGCGAAAATAGGGTATTG
+GTTCATAATGCGAATAAGTATGTTAAGGGAACGCGTAGTACTCAGTTGACGTTTGATGAA
+GCACTGAAAAAGTTAGACAAGTCAGGCTTACGACCGGGTCAAACAGAAATTTCAAAGAGT
+AGGGTTATGGAAATCGTAGAGAATTATGATCCTATGAAAGCACAAAGCAGTGTGTATACT
+GATTCAACGGGTAGATATTTAGTTGAAGGCCATCATACAACTGTCGCAAATACAATGCTA
+GGAAAAGGATCTGGGGTGAATATGAATATACCTACACAGCAGATACCATCTGCTACAAAT
+GTCTATTGGACAAAAAAGTGGTATGAATTTTGGAAAACACAAATAAAAGTAACAAAATAA
+GAAGGTGATACTTTGGAGAAGTACTCTTTATTCGGAGAATTATTGTATTTAGGGTTTGTG
+TGTGAAAAAGGGAGGTGTAAAAGTTCAGGATTTTGGAAGTTGGGGTATAAGAGAATCCTT
+CATAAACATATTGTCTTACTAAGTAAGTTGATTCAATGTATATTGGTTAGTGAGGTATCC
+GATAACGATGCTTTAATATTGAAAGAGTTTATTGAGTCAATTCAGACAGAAAAAGACATT
+ATTAAATATTACCCAATAAATGAAGATACAATGAAGAAATTACAGGATAGTAATTATTCA
+ATTATTACATCAATTGATTCTGATAGGTGTAATAATAACATTAATCTACTCATGAATGAT
+ATAACAACCGAGATACTAGAATTATTAGATCATAAATTTTTTTTAAACAAGAAAAGGATA
+GCTATGTTAATAAGGGCAATACATAATTTGCCACGCGTATACTTAGGAAAGGGGTTGCAC
+ACTTTGTGCAATATAGAGCAGCCTGCTATTGATTATAAAGCTGCACTTGAATATTCCTTT
+AATAACATGGATGAAGATACTAGACAGAGGTATAGAAAATACTATCAGTAGACGGTAGAA
+GATGTTAAAATGGATTATACTCATATTACCTTTACCGTTTTAGATTGAAAAGTTTAACTA
+ATACCCGGCAAGCCAATATAACGGCAAGTCGGGTTTTCTTTTTATCCATACTTGACAATA
+TGTAATACATTGTGATACAATTAAACCAACAAGAAATACAGGAGGTGCAATAATGTCTAC
+AGAAAAGGATAGTATGCTACGGGTAAGGCTTACACAAAGGCAGTCGGATGAGTTGGATGC
+TATTATTGGTGAGCTTCAAGCACAAATGCCGGAAGCAAGTGTTACCACATCAAGCATAGC
+AAGATACGCTCTGGAGAAATATGTGAGCGACCATATTGCCAAGCGTGATGGAACAAAAAT
+TTTAATTGAAATCAACACCGCAGATGCCACAGAAGAGGACATAAAGAATCTCTACGACCT
+TATTTCTAAGCTGTTTGACGAAACAAAGGAGAATTATTCACCAATGGTTCATTACATGGT
+TGGAGAGATATTAGAGCCTGTGATGATGAAGATGGTAAGACTTATGAAGCTAAATAAGCC
+GGGGGTGAAGGCGGATGAGTAAGAAAAAGTACATTGTCCGCTGTCCTCACTGCAATCATA
+GAATGTTTGATGCCGATTATGCTGATGTTGAAATCAAATGTCCGGTGTGCAGAAAGGTTT
+TTGAAGTAAAGCTGGAGAAAAAGGCGGGGTAAAAAGTGAATAAATCTGGCACAGAGCCAC
+AAAGGGAGCGAATGACTCACCTATAGAGTCTGGCAGATAGTCTTAAAAAACTATTTGTCA
+GGCTCTATTTATATTCGGCGAGACAGGAGGTGGGAAGTTTGAAATTGACAATGATGGACG
+CAGCATTAAAATATGCAGAAGCCAATATCCCAGTCATACCATTGCCCTGGATTTGTGAGG
+ATGGCTTCTCTCCTGCAAGGCAGGGAAAAATTGCGACAGCAGGGAAAAGCGTCCGTTATA
+TACAGGCTGGTACAATGATTCCACTACTGATATTGAGCAAATAAAGAAATGGTGGAGAAA
+AACAACCAATGCCAATATAGGCATTCCTACAGGCGAAAAGTCCGGTTGGCTGGTGCTTGA
+TGTGGACGATGGTGGTGATGAAACTCTATCGGCTCTTGAATCAACACATGGAAAGCTTCC
+GGATACGGTTACTGCTGTTACCGGCAGAGGAGGTCGGCACTATGTCTTTAAATACCCTAG
+AGGCCGAAGTATTCCAAATAAGACCAAGTTTGCACCGGGTCTTGATAACCATTCAACAGG
+TGGACTGATTGTCGTAGCTCCAAGCATTCATGTAAGCGATAATCAGTACCAATGGTTGAA
+AGGACATTCTTCCTTTGACAAAACCCCGGCAGAAGCTCCGGAGTGGCTGTTAAAGCTTAT
+GGGAAGGGAGGAAACATTGCTTACACCCTTTGAAGGTAGCAGTATTGTAGCAGGGATTAA
+GGAAGGCAGCCGAAACAGCACCCTGACAAGCCTTGCAGGAACCATGAGGGTAAGAGGAAT
+GACAGAAGAGAGCATCTATGCAGCATTGCTTGCTGAAAACAACGCAAGGTGCAATCCTCC
+GCTTGATGAAGCGGAAGTTAAGAAAATATATAGTTTAGGTTTTCAAAGAGTTAGTAGCTT
+GTAAAGAATTAATATATACGATATACGCACAAAGCCGCTTGATTTTTGCAAAGGAGCTTT
+GTACAGTCATAAAGTATTTACATATTGCCTGAACAATTCAGCTTTCAGGAGATAAGGAAT
+ATACATGTTGGATTTTTCTGGCTGTGGGTTATTGCAGCGGTGTCTGCAGTATTAATCACG
+TCAATAGTTGTTGCTATGATTATAATATAAGAAAAAGGAGAAAAGAAGAGAAGGAAAACG
+AGCTGGCGGCGGCTTGATTTGTAAAATAGGTACGTTCTACTTGCTTTTTCAGAATAGAAA
+TAATATAATAATGCCAGGAAAAGGCAGAAAAGTTTCCTGGCATTATTATAAGGCAACCAC
+GGATTGCAAGCATTGGGATGATAATTTTGAGGTGATAAAATGGCAACTCTAACGTTATAT
+GCCGGAAAAATCAACCAAATGCCCGGATTGATAAATGAAGTCAAGAAATCTGTGGTGGAT
+TACAAGTCAGAATTATCCGCATTGAGAAAGAAAACTTTGAACATCAACAGAAGTGTATGC
+AATTTGGATGAAGTAATAAGTTCCATACAGGCATCTTCCCAGACTCAGGATAGAAAAATT
+GATTCACTTGAGAAATTCTGCAGTGAAAGTGAGAAGTTTATATCGGAAGTAATACGTATC
+GATGAAGAAGTGGCTGAGCTTATCAATAAACGGAAAGAAAATTTTTACAAAGAATATTAT
+TATTTAAAACCGGAAAGCGAGAAAAGCGGCTGGGAAAAAATCAAGGACGGCTTAAAGTCG
+GTTGCGGAGTGGTGTAAAGAGAATTGGAAATCCATTGCCAAGATAGTGGCTGCCGCAGTA
+GTTATTACCGGGTTAGGGATAGCGGCGGCATTGACAGGAGGGGTATTGGGAGTCATACTG
+GCAGGAGCATTCTGGGGAGCATTGGCCGGAGGATTGATAGGAGGAGCGGTTGGAGGAATA
+GCCGCGGCGATAAATGGAGGTTCGTTTCTGGAAGGATTTGCGGACGGAGCATTGAGCGGA
+GCGATTTCCGGAGCGGTAACAGGAGCGGCATGTGCCGGGCTTGGTGCTTTAGGAGCTCTA
+GCAGGGAAAAGCATCCAATGTATGAGCACAGTGGGAAAAGCGATAAATGTTACATCAAAG
+GTTACGGCAGCACTTTCTTTTGGTATGGATGGATTTGACATGCTGGCAATGGGAATATCA
+TTGTTTGATCCATCCAATGCATTGGTTGAATTTAACCGGAAGCTGCATTCCAATGCACTT
+TACAATGGATTCCAGATTGCAGTAAACGCGCTGGCTGTGTTTACTGCCGGAGCGGCATCC
+ACAATGAAGTGCTTCGTTGCAGGCACGCTGATATTGACTTCGGCAGGCTTGGTTGCGATA
+GAAAATATCAAGGCAGGAGACAAGGTAATTGCGACGAATCCTGAAACTTTTGAAGTAGCG
+GAAAAGACGGTGCTTGAGACATATGTGAGAGAGACAACGGAGCTTTTGCATTTGAGAATC
+GGAGGCGAAGTAATCAAAACAACCGTCGACCATCCATTTTATGTTAAAGATGTAGGTTTT
+GTTGAAGCGGTGAATCTGCAAGTCGGAGACAAATTGGTTGATTCAAGAGGCAACGTTTTG
+GTAGTGGAAGAGAAAAAGCTCGAAATAACTGGTGAACCTGTGAAAGTTTACAACTTTAAA
+GTTGATGACTTTCATACTTATCATGTTGGGAATAAAGGGATATTGGTACATAATGCGAAT
+TATAATCCTAAAACTACCTTTGAAAATCTGGATCTGGAAACCGCCAGTAACAAGCAAAAG
+GGTAATTATGGAGAATATCGTGCGAACGATAATTTAATTAACAATCAAAGTCTGAAAGAA
+GAAAGATATAATTTAAAACGAAAGGGGAGAAGTGCACCGACATCTCCGGATGATAAAATT
+GTAAAGGGGATAGATGGAATATATGTAAACGAGGATCCAAACTCAAATATTAAATATGTA
+ATTAATGAGTCAAAGTTTAATAGTGCACAATTGGGGAAAACGAAAAAAGGCATAAAACAA
+ATGTCGGATGAGTGGCTCCTTGAGAAACAAGGTAAAAGAATTTTAAAAGCAGTTAATGGC
+GATAGAAAGCTGCAAAAAGACATATTGCAAGCGTTAGATGATGGTCAAATAGAAAAAGTT
+TTATCACGAGTTGGCAAAGATGGAAAAGTGATAACATATAGACTGGGCAGCAATGGTGAA
+ATAATCGGACTTTGGCCATAAATAATGAATGAAAAGGAGATGAGGATATGAGAGATCCGT
+TATGCAGTGAAAGTTATTTGTTAGAAACAATAGAATTTGACAAGGAAGAAATTTGTGAAA
+GAAAAAAAAAGATTATTGTGCTGAAAGATGATATGGAAAAGGGCATACAAAGATATCCAA
+AAGACAATCAAAGCATAATTTATGCTACATATAGAGGAATGTTTATGTATAATACAGAAA
+TACTTATAGCTAAATACTCTTTAGGTAGTCATCCGGATGAAATGATTGAAGATTATTTAA
+ACGGTATAGAGTATTTGGAAAATGTCGGTGAAGAAAAAGTATGGTATATTGATCTTTTGT
+GGATGCTATCGTTAGGTATACTTTTAGAGGTAGACAAACAAGATTTAAAAAGGCTTGCTT
+GTGTGATAGAGAAGCAAAAAAAAGAAGACGCACTGATGGATTTTCTTTTAAAGGCTTGTG
+ATATAGGATGGAATCATAATACAAGTGAATATGAGAGAAAAAATCCATATGCAAAGACGG
+CTGAAATTATACAAATGGCATTGCATGATAAAGACAGGGAAAAAGCTTCGAAAAGGCTAC
+AACAATATATAGAGAAAGAGTGGGTTAAGGGACATAATGATCTGGACTTCAAAAATGCGC
+ATAAAGAACCCGGCTACGTTGGCTTGTGGAGTTTTGAGGCTGCAGCATTGGCAAAGATAC
+TGGGATTGGACGACAGCGCACTGAAAGATAACAACCATTACCCTTATGATTTGGCGCATT
+ATAAAAATGGAATGAGTTTTGATTTAAGCTGGTATGGTGTGCCAGTTGAAGAGGAAGCCA
+AGGAAGAAGAGGCAATAGTGTATGGAATACCGAACAAACCTGAGTTGGAGCAAATAATAC
+CTGCAAAATTCCACAGTTTTGTGAATGAAGTGATAGGAGACTACAATACATTGACTGATG
+AAGAGTTTTGGAAGAAGTATAATTTGAGAGAAATCTGGTTTGATGTTAAGGAGTACGAGG
+AAGATAATAAAGCCAAAAATATGTTGGGAACGATTATAGTATTTTTGCTTGTAGAGAAGG
+AGTATATTTTGCAGTTGGATTATAAGGAAGATTTGGTAGATTACATAGAAGATATAGATA
+ATTATTGGGGTAAAGAGGAAGTAAAGTTGATAAGCTTTGAAGTGGACAATGACCAGCAGT
+ATTATGCATACGTACCGAAAACCGCAGCAATAGATTCGTTGTATGAGGTGAAATTGACAG
+AAGTGGAGAAGATAGAGGAAGTTTAGTCTTATAGTGAAGGATTGAGATTATTAAAATGAG
+GATGGATTTTGATATTATTTCAGTGAACGATGTAAAAAACGTTAATTGAATTTTATATAA
+TGCGGGCGGTAATGGTAATTCTGCCCGTTTTAATTTAAACTGATTTATTGAAGATTTCTG
+AATTACGGAAATAACTGTGCTTGTGTCCTATAAAAAGACGGGTAATTTAATTTGTGATGT
+TTTGTATAAAAGATATAGGTTTCGTTAAAGAGATGAAGCTGCAACCAGGAAACAGGTTGG
+TTGATTCGGTAAAGATATTTTTGGTAATTAAGAAAAAAGCCTGAGATAACGGATGAACCT
+GTGAAGGTTTACAACTTTCTAAAACCACCTTTGAAAATTTGGATTTGGAAACTGCCAGTA
+ACAAGCAAAAGGGTAATTACAGAAAATATCGTGCGAATGATAATTTTATTAATAAATAAT
+CAAAATGTGAAAGACAAAGGATATGATTTAAAAGGGGGGAATGAGTGCTATGGCATCTCC
+GAATGATGAAATTGTAAAAGGAATAGATGGAATATATTCAAACAAGAATCCAAACTCAAA
+TATTAAATATGTAATTAACGAATCAAGATTTAATGCTTCCCAATTATGTAAAACGAAGAA
+AGGCATAAAACAAATGTCGGATGAGTGGCTTCGTGAGAAACAAGGTAGAAGAATTTTGAA
+AGCAGTTAATGGTGATAGAAAACTCCAAAAGGACATAATACAAGCGTTAAAGAAAGGTAA
+GGTAGAGAAAGTTTTATCACGAGTTGGCAAGGATGGAAAAGTAACGACGTATAGGCTGAA
+CAGCAATGGTGAAATAATTGGATTTTGGCCATAAATAACAAATGAAAAGGAGATGATGGT
+ATGAGGGATCCGTTATGCAGTGAAAGTTATTTATTAGAAACAATAGAATTTGACAAGGAA
+GCAATTGATGAAAATAAAAAAGACATTGTTGAATTAAAAGATGATATGGAAAAGGGCATA
+CAAAGATATCCAAGAGATAATCAAAGCATAATTTATGCTACGTTTTTGCATATGTTTATG
+TATAACACGGAAACGCTTATAGCCAAATACTCTTTAGGTAGTCATCCGGATGAAATGATT
+GAAGATTATTTAAACGGTATAGAGTATTTGGAAAATGTCGGTGAAGAAAAAGTATGGTAT
+ATTGACCTTTTGTGGATGCTATCGTTAGGTATACTTTTAGAAGTAGATAAACAAGATTTA
+AAAAGGCTTGCTTGTGTGATAGAGAAGCAAAAAAAAAGAAGACGCACTGATGGATTTTCT
+TTTAAAGGCTTGTGATATAGGATGGAATCATAATACAAGTGAATATGAGAGAAAAAATCC
+ATATGCAAAGACGGCTGAAATTATACAAATGGCATTGCATGATAAAAACAGGGAAAAAGC
+TTCGAAAAGGCTACAACAATATATAGAGAAAGAGTGGATTAAGGGACATAATGATCTGGA
+CTTCAAAAATGCGCATAAAGAACCCGGCTACGTTGGCTTGTGGAGTTTTGAGGCTGCAGC
+ATTGGCAAAGATACTGGGATTGGACGACAGCGCACTGAAAGATAACAACCATTACTGCTG
+TTACCGGCAGAGGAGGTCGGCACTATGTCTTTAAATACCCTAGAGGCCGGAGTATTCCAA
+ATAAGACCAAGTTTGCACCGGGTTTTGATAACCATTCAACAGGTGGACTGATTGTCGTAG
+CTCCAAGCATTCATGTAAGCGATAATCAGTACCAATGGTTGAAAGGACATTCTTCCTTTG
+ACAAAACCCTGGCAGAAGCTCCGGAGTGGCTGTTAAAGCTCATGGAAAGGGAGGAAGTAT
+TGCTTACACCCTTTGAAGGTAGAAGTATTGTAGCAGGGATTAAGGAAGGCAGCCGAAACA
+GCACCCTGACAAGCCTTGCAGGAACCATGAGAGCAAGAGGAATGACGGAGGAAGGCATCT
+ATACGGCATTACTTGCAGAAAACAACGCAAGGTGCAATCCTCCGCTTGATGAAGCGGAAA
+TTAAGAAAATATATAGTTTAGGTTTTCAAAGAGTTAGTAGCTTGTAAAGAATTAATATAT
+ACGATATACGCACAAAGCCGCTTGATTTTTGCAAAGGAGCTTTGTACAGTCATAAAGTAT
+TTACGTATTGCCTGAACAATTCAGCTTTCAGGAGATAAGGAATATACATGTTGGATTTTT
+CTGGCTGTAGGTTATTGCAGCGGTGTCTGCAGTATTAATCACGTCAATAGTTGTTGCTAT
+GATTATAATATAAGAAAAAGGAGAAAAGAAGAGAAGGAAAACGAGCTGGCGGCCGCTTGA
+TTTGTAAAATAGGTACGTTCTACTTGCTTTTTCAGAATAGAAATAATATAATAATGCCAG
+GAAAAGGCAGAAAAGTTTCCTGGCATTATTATAAGGCAACCACGGATTGCAAGCATTGGG
+ATGATAATTTTGAGGTGATAAAATGGCAACTATAACGTTATATGCCGGAAAAATCAACCA
+AATGCCCGGATTGATAAATGAAGTCAAGAAATCTGTGGTGGATTACAAGTCAGAATTATC
+CGCATTGAGAAAGAAAACTTTGAACATCAACAGAAGTGTATGCAATTTGGATGAAGTAAT
+AAGTTCCATACAGGCATCTTCCCAGACTTAGGATAGAAAAATTGATTCACTTGAGAAATT
+CTGCAGTGAAAGTGAGAAGTTTATATCGGAAGTAATACGTATCGATGAAGAAGTTGCTGA
+GCTTATCAATAAACGGAAAGAAAATTTTTACAAAGAATATTATTATTTAAAACCGGAAAG
+CGAGAAAAGCGGCTGGGAAAAAATCAAGGACGGCTTAAAGGCGGTTGCGGAGTGGTGTAA
+AGAGAATTGGAAATCCATTGCCAAGATAGTGGCTGCCGCAGTAGTTATTACCGGGTTGGG
+GATAGCGGCGGCATTGACAGGCGGTATATTGGGAGTCATACTGGCAGGAGCATTCTGGGG
+AGCATTGGCCGGAGGATTGATAGGGGGAGCGGTTGGAGGAATAGCCGCTGCGATAAATGG
+AGGATCGTTTCTGGAAGGATTTGCGGACGGCGCTTTAAGCGGAGCAATTTCCGGAGCGGT
+GACAGGAGCGGCATGTGCCGGGCTTGGTGCTTTAGGAGCTCTAGCAGGGAAAAGCATCCA
+ATGTATGAGCACAGTGGGAAAAGCGATAAATGTTACGTCAAAGGTTACGGCAGCACTTTC
+TTTTGGTATGGATGGATTTGACATGCTGGCAATGGGAATATCATTGTTTGATCCATCCAA
+TGCATTGGTTGAATTCAACCGGAAGCTGCATTCCAATGCACTTTATAACGGATTCCAGAT
+TGCTGTAAACGCGCTGGCTGTTTTCAGTGCCGGGGCGGCATCGACAATGAAGTGCTTTGT
+TGCAGGTACAATGATATTGACTGTGGCAGGCTTGGTTGCGATAGAGAATATCAAGGCAGG
+GGACAAGGTAATTGCGACGAATCCGGAGACTTTTGAAGTAGCCGAGAAGACGGTGCTTGA
+GACATATGTGAGAGAAACAACGGAGCTTTTGCATTTGACAATCAATGGAGAGGTAATCAA
+GACAACCTTTGAGCATCCGTTTTATGTTAAAGATGTGGGTTTTGTTGAAGCGGGAAAACT
+GCAAGTAGGAGATAAGTTGGTTGATTCAAGAGGCAATCTTTTGGTGGTGGAAGAGAAAAA
+GCTTGAAATAACAGATAAGCCTGTAAAGGTTTACAATTTTAAGGTCGATAATTTTCATAC
+GTATCATGTTGGCGAAAATAGGGTATTGGTTCATAATGCGAATAAGTATGTTAAGGGAAC
+GAGTAGTACTCTAAAAAGTTTGGGAAACAAGACTGAACAATATGTTACAAAACGAGGCTG
+GACATGGGATTCTATGGACGATGTTGTTAAAAAAACATATACTACTCGTGAAGCTATTAA
+CAAAGCAACTGGTAATCCAGCAACTGCTTACTACAATAAAGCTGGCGATTATGTAGTTGT
+GGATAATGTTACCGGTGAATTAGTACAAGTTAGTAAATTTGGTGATACTGGATGGATTCC
+TGACGCGACAATTAAAAATCCATACAAACCATGAGAGGGTGTTATTGATGACTGATATTA
+TTAAGGAGAATTATTCAAAAAAGGCCGTTATCTATGATAATATATGGATGTATTTTATTA
+AAACGGCAAAAGAAGTAATATGTGATTGCCAAAAAAATCAGATTAGAATAATGGCGCTGG
+AGGCGTTTAAATTAACAGGAGAAGGGATACAACCATCTCAAGAACATAGCATATATTTTA
+ATGTCAACGAAGATTGCTGGAGCAGAGCTATTGAATTTTTATCAAAAATTAAGGATAATG
+ACTATTTATATGAAATTTGGTATGAAGGATATTAAATCAGGAGTTAATAATTGCATAGTC
+GCATATTTTTAAATGATGCGCCCTTCCCTCCGAATTGCGATAAAGTACAGTCTTAATACA
+ATACCCGGCAAGCCAATACAACGGCAAGTCGGGTTTTCTTTTTATCCATACTTGACAATA
+TGTAATACATTGTGATACAATTAAACCAACAAGAAATACAGGAGGTGCAATGATGTCTAC
+AGAAAAGGATAGTATGTTACGGGTAAGGCTTACACAAAGGCAGTCGGATGAATTGGATGC
+GATTATTGGTGAGCTTCAAGCACAAATGCCGGAGGCAAGTGTTACCACATCAAGCATAGC
+AAGATACGCTCTGGAGAAGTATGTGAGCGACCATATCGCCAAGCGTGACGGTACCAAGAT
+TTTCATTGAAATCAACACTGCTGATGCCACAGAAGAGGACATAAAGAATCTCTACGACCT
+TCTTTCCAAGTTGTTTGACGAAACAAAGGAGAATTACTCACCAATGGTTCATTACATGGT
+TGGAGAGATTTTAGAGCCTGTGATGATGAAGATGGCAAGCCTCATGAAGCCTAAGAAACC
+GGAGGTGAGGGATGGTGAGTAAGAAACAGTACACAGTCCGCTGCCCCCATTGCAATCACA
+GAGTATTTGATGCCGATTATGCTGATGTTGAAATCAAATGCCCAGTATGCAGAATGGTTT
+TTGAAGTAAAGCTGGAGAAAAAGGCGGGGTGAAAAGTGAATAAATCTGGCACAGAGCCAC
+AAAGGGAGCACAAGACTCACCTATAGAGCCTGGCAGATAGTCTAAAAAACTATTTGTCAG
+GCTCTTTAAATTTTCTAGCACGACAGGAGGTGAGAAGTTTGGAAATGACAATGATGGACG
+CGGCATTAAAATACGCAGAAGCCAATATCCCAGTTATACCTCTGCACTGGATTTGTGAGG
+ATGGCTCCTGCTCCTGCAAGGCAGGGAGCGATTGCGACAGCAAGGGAAAGCATCCGTTAT
+ATACCGGCTGGTACAAGAACTCCACTACTGATGTTGAGCAAATAAAGAAATGGTGGACGA
+AAACCCCCAATGCCAATATCGGAATTCCTACAGGTGAGAAATCCGACTGGCTGGTGCTTG
+ATGTGGACGATGGTGGTGATGAAACCCTATCTGCACTTGAGGCAACACATGGAAAACTTC
+CGGATACGGTTACTGCTGTTACAGGAAGTGGAGGTCGGCACTATGTATTTATATACCCTA
+AAGGCCGGAGTATTCCTAATAAGACCAAGTTTGCACCGGGTCTTGATATGCGTTCAACAG
+GTGGATTGATTGCCGTAGCTCCAAGCATTCATATAAGCGGTAATCGGTATGAATGGTTAG
+AAGGACATTCTCCCTTTGAGAGAATCCCGGCAGAAGCTCCAGCATGGTTGTTGAAGCTCA
+TGGAAAGGGTGGAAGTATTGCTTACACCCTTTGAAGGTAGCAGTATTATTGCCGAGATTA
+AGGAAGGAAACCGCAACAGTACCCTGACAAGCCTTGCCGGAACCATGAGGGCAAGAGGAA
+TGACAGAAGAGAGCATCTATGCGGCATTGCTTGCAGAAAACAACGCAAGGTGCAATCCTC
+CGCTTGATGAAGCGGAAGTTAGAAAGATAGCGCACAGTGTCAGCCGATACCAGCCAAATC
+CTCCGATGAAGAAGCATTACCACAGGACAGACAGCGGGAATGCAGAAAGGCTGCGTGACA
+GGTTTGGTGAAATCATTAGGTATTGTCCGGCTTTCAAATACTGGTTGGTATATGACGGCT
+GTTGCTGGAGGAAAGAAACCGGAGAACTTATGCAGTTTGCTATAAAAACAGCAAGAGACA
+TGCTCGCAGAAGCAAGCCGGATAGAGGATGAGGCTGCAAGAAAAGAACTGGTGCGCCATG
+CCATGCAGTCTGAAAACGCAGGCAGGCTTAAAGCCATGATCGATGTGGCTTCAAACCTTG
+AAGGAATGGTAATTATGCCGGATGAGATTGATTCTGATATATGGAAGCTGAACTGTAGAA
+ATGGTGTGGTAGACCTAAAGACAGGCGAACTCCTTCCTCATAAGCGGGAGTACTATATGA
+GCAAAATCTGCCCTGTTGAATATAAACCAAGCAGCAAGGCTCCCAAATGGATGGAATTTC
+TGAATACCATTACGGGAGGAAGCAAGGAGCTTGTAAGATACCTTCAAAAAGCTGTAGGCT
+CGTCATTAAGCGGGGATATTTCAGAGCAGGCCCTATTCGTCCTTTATGGAACAGGAGCAA
+ACGGAAAGAGCACATTTCTAAACACCATCTCTGACCTGTTGGGAGACTATGCAAGAAATA
+CTCCGTCCGAAACTTTTATGGCTAAAAGAATAGAAGCGATAGGAAATGATATCGCAAGGC
+TTCAGGGAGCAAGGCTCGTTACTGCCATAGAAATAAATGAGGGACAAAGGCTCTCTGAGG
+CATTGATTAAGAGCTTTACAGGCGGAGACAGAATTACAGCAAGGTTTCTTTATGGAGAAT
+ACTTTGATTTCCAGCCACAGTTCACCCCGTTTCTCGTAGTAAACCACAGACCAGTCATAA
+GAGATACCAGCCACAGCATTTGGAGGCGCATTAAGCTGATTCCTTTCACCGTTACCATAC
+CCGAGGATAAAAAGGATAAGCAGCTACCGGCAAAGCTGAGAGAAGAGCTGCCTGGCATAT
+TGTCATGGGCAGTAGAGGGTTGCCTTCTTTGGCAGAAGGAAGGACTAAATATGCCTGATG
+AAGTCAAAAAAGCCACAGAAGGTTACCGGGAGGAAATGGATACCTTCTCAAGTTTTATAG
+AGGAATGCTGCATTGTGGAGGAGGGCAGGAAAGTCTCCAATAGAAGCATCAGGTACGCTT
+ACGAAACATGGTGCCGGGAAAATGGAGACTACCCTCTTGGACAAAAGCTATTCAATGCAA
+AAATGACGGAGCGCGGCTTTGCTGTCAAACGCAGCGGAGCCAATGGCAGCAGGGACTGGC
+ATGGTATTGGTCTTGCGGATGAGGGGATACTTTTGTGATTACTGACGACTGACGGCTTCT
+GACGTCAATTCCGTAAATTTTTATATATATTTTTTCTTATGTGAAATTTATGAAAAAAGA
+GTCAGTAAGAGTCAGTACGTCAGTAAAATCTCAGTACCTTGATGCAGAGGGGAGGGGAGG
+TCAAATCTCTACAGTAAAGCATAAGGGCAACGGGCTGGCAGCACCGCGTAAAAAAATGCA
+GATTCAAACGGGGTATTAACCCCAGACCATATTAACAAAAAAACAATTATGAAAATGGAG
+GATTTAAGCATGAGATTTATAGCAGATTTAGTACATGAGAAAAAGCAATTGGTGGAGAAA
+GCAGAAGCTATTTTAAACGAAGCGGAAAAAGCAGGTGGAAGTTTGACTAAGGAACAGGAG
+CAACAGTTTAACCGCTACAAAGACAGAATAACACGCATCAATGATAGCATTGATGAAGAA
+TTATCAAAAATCAGAACCTCTGAGCCAATATTGAATATGCCGCACAATCCCATGGCTCGT
+GAAGATGTGTCAAAAATTCCGGTAACAAAGGCTATATCAAAATCATTCAGAGGGATGTTC
+TATGGAAACGAAACTGTGAGCTTAAGCAACAATGGTTTTCATTCCATGGATGAATTCCTG
+AGAACACTTCACTCAGGCAGAGCCGACAACAGGCTAATAAATGCCAGTATGGTGGAAGGA
+ATACCCGAATTCGGCGGATATTCCGTACCGGAGGAATACGGAGCCTTCCTGATGGATAAA
+TCCCTGGAGAATGAGATCATTCGTCCCAGAGCAACAGTATGGGCAATGGGAAGTGAAACA
+AAGAAAGTATCAGCCTTTGATGGAGCAGACAGAACCAATCACCTATTCGGCGGTATCTCA
+GGAGAATGGCTGGAGGAAGGACAGACAGGCACACGAAAAACAGCCAAGTTAAGGCTGATT
+CAACTGAAAGCCAAGAAGCTGGCCTGCTTCTCACAGGCATCCAATGAACTTATTGCAGAT
+GGTATGTCCTTTGAGGAAATGTTAGCTGGAGCGCTTATTAAAGGCTTGGGCTGGTACATG
+GACTATGCCTTTATCAATGGAACCGGTGAAGGCCAGCCTCTTGGTATTATAAATGACCCG
+GCACTGATTACTGTAAATAAAGAGGCTTCTCAAGAACCAGCCACAATTACCTATCAAAAC
+GTGGTCAATATGTTCTCAAGGCTTGCTCCGTCATGTTTTACCAATGCGGTATGGCTTGCC
+AATCCATCGGTAATACCACAATTGCTCACCATGACCATTACCATTGGTACCGGTGGCGCT
+CAGATACCGGTATTCAGGGAAGAGAGCGGGAAATTCACACTTCTGGGTAAGGAGGTCTTA
+TTCACTGAGAAATGCCCCACATTGGGTGCTAAGGGAGATTTAATCCTTGCAGATCTTTCC
+CAGTATGCCATAGGCATGAGGAAAGAGATCGCTCTTGACCGCTCCAATGTCCCAGGCTGG
+ATGGAGGATATGACCGACTACAGGGTGATAGTGCGTGTAGATGGTCAGGGAACCTGGGAT
+AAACCTATAACACCGAAAAACGGAGCAACGCTCTCATGGGCAGTGGCTTTGGAAGCGAGA
+TGATTTGCTCAGATTTGAGCCAAGTCTGAGCCTAAGCAATACTTAGGGTAAAACCGCTCA
+AAAATGAGAAAATAGGAAGCTCTGCTCCTGCTTAACAGACTATTTAACAGTGGGTAGTTC
+TCCTACCCACTGGAATGCTTCGAACCCTCAAAAGCTTATAAATATTGCATTTAGAAGCAG
+AATTGACTTGCTATATCAGCGTTTCAGAGTGATGAATGTTAGTGCGGAATAAAGGCTTTA
+ACCGTAGGAAGGGGTGAAAGTGTGAGAGCAAAGATTACCACAACCATAGAGGAAGCCTTA
+TTGAACAAAGCCAAGGCACTTGCTAAACAAGAGGGTTTGTCTGGTGCCAATGCCATTATT
+GAAAGGGCTCTGGAGTTGTATTTTACCAGTATTCAATGTGAAGTGTGGGAAAAATCGTTG
+TCCAGCGGCTGGATAAAGAAGCTGGTTCTCAAAAGGGATTCTATTCTGTACGAAAACATC
+AAGTGCAGAAAAACCATGGAGAACTGCAGGCCGGATGATTACACACCTGAAAGCCTAAAA
+GCAAAAGGCTGGAAGAAGGTTTAGCAGCCGGGGAAAAGGCCTCTGTATTGCTCCTTGAAA
+CGTAAAAGCATAGGTTGCAGCCGTAAGCTTTGTTGAAACAGAAAGGGCAAATAAAGAGGA
+ATTTGAAAGGCTACTGCAGTTATCAATACAGAAATTTATTTGGTCAGTAGCATTAAGAAG
+TTTATGTCCAAGCGAAGCAGTAAAAGAACACTAAGAAATTTGAACTAAGGCTCGTGATGC
+CTGAAATCACGTAATTTGTCACACCAGGAATAGATAGGTTGGCGTTCCCTTGCGAGGTCA
+AAGAACTAAGGTTCTTAGACTAACGCTCTTAAATTGAGGTTGCCGGTATGAGTGGTGGAG
+ACATTGGAAAAGGAAAGGATAGATATTTATCATAAACGAAACACCTGCTTTGTTGGAATT
+GATATGCACAAGGACGCACATTGTGCAGTTGTAATTGATTGTTGGATGAATAAACTGGGT
+GAGGTTAACTTTGAAAACAGGCCATCCAGATTCCCTGCATTCGTTGAGGATGTAAGGAAG
+ATTTGCGGGATAAAGGAAATTGTATTCGGACTTGAAGATACCAGAGGCTTTGGCAGAAAC
+CTTGCTGCCTATCTGGTGGGCAGGAAGTTTGAAGTAAAGCACGTAAACCCTGCATATACA
+AGCGCTGTAAGGCTTGCAAACCCCATTATTTACAAGGATGACTCCTATGATGCCTATTGT
+GTGGCAAGGGTGCTCAGGGATATGGTGGACACTCTGCAGGATGCCAAGCATGAGGATATA
+TTCTGGACAATACGGCAAATGGTGAAAAGACGGGATTTGATTGTAAAAAGTAATGTGATG
+AACAAGAACCAGCTCCACAGCCAGCTTGCTTATAGCTACCCATCCTACAGGAAATTCTTT
+GCCATGATTGATTCCAAGAGTGCCTTATGCTTCTGGGAGAACTACCCGTCACCGGAGTAT
+ATATGGAAAACAACACCAGAAGAAATATATCAGACGATAAAGCCTGTGCATCAGGCGCTT
+AAAATACAGCGCATCCATGAGATTATATCCATGATTGAAAGGGATGGAGACACAAGAAAG
+GACTATCAGCCCGAAAGGGATTTTATTGTGAGAAACATCGTGAAGGATATCAGACACAAC
+AAGGAGTTGATTGCCGAAATTGACGATGAACTAAGAAAGCTGATACCTTTGACAGGCTAT
+AAGCTACATACAATGCCGGGAATCGACCTTGTTACAGAAGCACAGATAATATCTGAAATC
+GGAGATATTAACCGTTTCCCTGACTCAGACAAGCTGGCTCGGTTTATGGGCTTGGCACCG
+GTGCAATTCAGCTCTGCCGGAAAGGGTAAAGACCAAAGATGCAGGAATGGCAACAGGGCA
+CTAAATGCGATATTTCACTTTCTTGCAATCCAGATGGTAGCAGTATCGGCCTCAGGAAAG
+CCAAGACACCCGGTATTCAGGGAGTATTTTGAGCAGAAGGTCAAAGAGGGCAAGAACAAG
+CCACAGGCGCTTGTATGCGTGGCAAGGCGGCTTGTGAGGATAATCTACGGTATGATGAAA
+ACCAAGACTGAATACAGGCCATATGAGAAGACTGACGACAAGAACTGATTTCATATTCTG
+GAAGCAAAGCAATGGAAGATAATTCTTTTTTTCGTTGAGATATGGTAACAGGAATTATAT
+AATAGATATAGTCCTTGTAGTGAGGGAACGCGTAAGACTACACCGAAGACAACACTAGAC
+TATTTAAAAGACATTGAAGTAAAAAATGGAAACTACTATGCTTCAAAAGCAACTATTGAT
+GAAATTGGGAAAATTGAAGCAAAAGGCGTGGACTTTTCAAAGCTAGATAGTAAAGTAATG
+TCATTAAGAGCATCAACTGAAGGGGGAATGTCAAGAGTAATAAAATACTCGGATGGCAAT
+GGCATAAAGTTTATAATACATGAAGTAACTGATGCAAAAGGGAATATAATTCATAGAGAT
+TTTGATGCTGTAAGAATTGAATCTGGTCAGTTAATCAACAAAAAGTAGGGAGTGAGTTTA
+GTGACTAAAAGTGATATTGAAAAAGTATTGAGTGATATAGTTAATAATTTCTTAGAGAAA
+AAAATTGATGCTGACGAAACTATTGAGCAACTCATTACAAGAATTGATCCTTTAGAAGTC
+TATAAGTTAGACAATGAGCTTTTAATAACAGACTGTTATTTTGCAATCAAACATTTGACG
+GAAAATGGTTATGAGACAACTATAAGAGAGCTCCAATATTTTAGAGAGTGTTTTGCAGGG
+CAACGGCTTTATGACATCAATGAGAAAAATAAGTTTATTTTGGATTAATAGTTAATATAC
+TATGCAGGTCACACAGTTTCGGCTGGTGTGGCCTTTTTATTGTCCATGCTTGACATATCG
+TAATACAATGTGATACAATAAAATCAACAAGAAATACAGGAGGTGCAATAATGTCTACAG
+AAAAGGATAGTATGTTACGGGTAAGGCTTACACAAAGGCAGTCGGATGAATTGGACGCTA
+TCATCGATGAACTTTAAGCGCAAATGCCGGAAGCAAGCGTTACCACATCAAGCATAGCAA
+GATACGCTCTGGAGAAGTATGTAAGCGACCATATCGCCAAGCGTGATGGAACAAAAATTT
+TAATTGAAATCAACACCGCAGATGCCACAGAAGAGGACATAAAGAATCTCTACGACCTTC
+TTTCCAAGCTGTTTGACGAAACAAAAGAGAATTACTCACCAATGGTTCATTACATGGTTG
+GAGAGATATTAGAGCCTGTGATGATGAAGATGGCAAGCCTCATGAAACCAAAGAAGCCGG
+GTGTGAAGGCAGGTGAGTAAGAAAAAGTATATTGTACGCTGCCCTCATTGCAATCATGGA
+ATGTTTGATGCCGATTATGCTGATGTTGAAATCAAATGCCCGGTATGCAGAAAGGTTTTT
+GAAGTAAAGCTGGAGAAAAAGGCGGGGTAAAAAGTGAATAAATCTGGCCCAGAGCCACAA
+AGGGAGCGAATGACTCACCTATAGAGCCTGGCAGATAGTCTTAAAAACTATTTGTCAGGC
+TCTATTTATGTTCTCGGAGGAGGTGGAAATTTGAAAGTGACAATGATGGACGCGGCATTA
+AAATATGCAGAAGCCAATATCCCGGTTATACCTCTGCACTGGATTTGTGAGGGTGGCTTA
+TGCTCCTGCAAGGCAGGGAAAAATTGCGACAGCAAGGGAAAGCATCCGTTATATACCGGC
+TGGTACAATAATTCCACTACTGATGTTGAGCAAATAAAGAAATGGTGGACGAAAACACCC
+AATGCCAATATAGGCATTCCTACAGGTGCGAAATCCGGCTGGCTGGTGCTTGATGTGGAC
+GATGGCGGTGATGAAACTCTATCGGCTCTTGAAGCAACACATGGAAAACTTCCTGATACG
+GTTACCGCTGTTACCGGAGGTGGCGGTCTGCACTATATCTTCAAATACTCACAAGGCAGG
+AGTATTCCAAATAAGACCAAGTTTGCACCGGGTTTTGATAACCATTCAACAGGTGGACTG
+ATTGTCGTAGCTCCAAGCATTCATGTAAGCGATAATCAGTACCAATGGTTGAAAGGACAT
+TCTTCCTTTGACAAAACCCTGGCAGAAGCTCCGGAGTGGCTGTTAAAGCTCATGGAAAGG
+GAGGAAGTATTGCTTACACCCTTTGAAGGTAGAAGTATTGTAGCAGGGATTAAGGAAGGC
+AGCCGAAACAGCACCCTGACAAGCCTTGCAGGAACCATGAGAGCAAGAGGAATGACGGAG
+GAAGGCATCTATACGGCATTACTTGCAGAAAACAACGCAAGGTGCAATCCTCCGCTTGAT
+GAAGCGGAAATTAAGAAAATATATAGTTTAGGTTTTCAAAGAGTTAGTAGCTTGTAAAGA
+ATTAATATATACGATATACGCACAAAGCCGCTTGATTTTTGCAAAGGAGCTTTGTACAGT
+CATAAAGTATTTACGTATTGCCTGAACAATTCAGCTTTCAGGAGATAAGGAATATACATG
+TTGGATTTTTCTGGCTGTGGGTTATTGCAGCGGTGTCTGCAGTATTAATCACGTCAATAG
+TTGTTGCTATGATTATAATATAAGAAAAAGGAGAAAAGAAGAGAAGGAAAACGAGCTGGC
+GGCCGCTTGATTTGTAAAATAGGTACGTTCTACTTGCTTTTTCAGAATAGAAATAATATA
+ATAATGCTAGGAAAAGGCAGAAAAGTTTCCTGGCATTATTATAAGGCAACCACGGATTGC
+AAGCATTGGGATGATAATTTTGAGGTGATAAAATGGCAACTATAACGTTATATGCCGGAA
+AAATCAACCAAATGCCCGGATTGATAAATGAAGTCAAGAAATCTGTGGTGGATTACAAGT
+CAGAATTATCCGCATTGAGAAAGAAAACTTTGAACATCAACAGAAGTGTATGTAATTTGG
+ATGAAGTAATAAGTTCCATACAGGCATCTTCCCAGACTCAGGATAGAAAAATTGATTCAC
+TTGAGAAATTCTGCAGTGAAAGCGAGAAGTTTATATCGGAAGTAGTACGTATCGATGAAG
+AAGTGGCTGAGCTTATCAATAAACGGAAAGAAAATTTTTACAAAGAATATTATTATTTAA
+AACCGGAAAGCGAGAAAAGCGGCTGGGAAAAAATCAAGGACGGCTTAAAGTCGGTTGCGG
+AGTGGTGTAAAGAGAATTGGAAATCCATTGCCAAGATAGTGGCTGCCGCAGTAGTTATTA
+CCGGGTTGGGGATAGCGGCGGCATTGACAGGCGGTATATTGGGAGTCATACTGGCAGGAG
+CATTCTGGGGAGCATTGGCCGGAGGATTGATAGGGGGAGCGGTTGGAGGAATAGCCGCTG
+CGATAAATGGAGGATCGTTTCTGGAAGGATTTGCGGACGGCGCTTTAAGCGGAGCAATTT
+CCGGAGCGGTGACAGGAGCGGCATGTGCCGGGCTTGGTGCTTTAGGAGCTCTAGCAGGGA
+AAAGCATCCAATGTATGAGCACAGTGGGAAAAGCGATAAATGTTACATCAAAGGTTACGG
+CAACACTTTCTTTTGGTATGGATGGATTTGACATGCTGGCAATGGGAATATCATTGTTTG
+ATCCATCCAATGCATTGGTTGAATTTAACCGGAAGCTGCATTCCAATGCACTTTATAACG
+GATTCCAGATTGCTGTAAACGCGCTGGCTGTTTTCACTGCCGGGGCGGCATCGACAATGA
+AGTGCTTTGTTGCAGGTACAATGATATTGACTGTGGCAGGCTTGGTTGCGATAGAGAATA
+TCAAGGCAGGGGACAAGGTAATTGCGACGAATCCTGAAACTTTTGAAGTAGCGGAAAAGA
+CGGTGCTTGAGACATATGTGAGAGAGACAACGGAGCTTTTGCATTTGACAATCAATGGAG
+AGGTAATCAAGACAACCTTTGAGCATCCGTTTTATGTAAAAGATGTGGGTTTTGTTGAAG
+CGGGAAAACTGCAAGTAGGAGATAAGTTGGTTGATTCAAAAGGCAATCTTTTGGTGGTGG
+AAGAGAAAAAGCTTGAGATAACAGATGAACCTGTTAAGGTTTATAACTTCAAAGTGGATG
+ATTTTCATACTTATCATGTTGGGAAAAAAGGGATATTGGTACATAATGCAGACTATAACC
+CCAAAATGGGATTTGATGATTTGGACCTTGAGAAAGCTACGAACAAACAAAAAGGCAATT
+ATGGAGAGTATCTGGCAGATGATAATCTTATTAATAATCCAAAATTGAAAGAAGCAGGGT
+ATGATTTGGAGCGGATAGGAGGTAAGGTTCCGACCTCACCGGATGATAAAATTACAAAAG
+GGATAGACGGTATATATATAAACAAGAATCCTAATTCAAATATTAAATATGTGATTGATG
+AAGCCAAATTTGGAAAAGCAGGACTGAGTGCAAAGACAAGAGATGGAAAACAAATGTCAG
+ATTCTTGGTTAGTGGGTTCTCGCTCAAGAAATAATAGAATTTTAAAAGCAGTAAGTAATA
+ATGAAGATTTAGCATTTGACATAGTGAAAGCATTAAGAAATAACCAAGTAGAAAGAGTAT
+TATCAAAGATAGATGTAAATGGAAAAATAATAACATATAGACTGGATAGCAATGGTAATA
+TAATTGGACTTTGGCCTTAGATGATTGAAAAGGAGGTAACTATATGAGAGATCCGTTATG
+TGATAAAAATTATTTATTAAAAACAATAGAACTTAGAAAGAAATATATTTGTGAAATGAA
+AGGAGAAATTGTTCAATTAAAATCTGATATAGAAAAGGGGATTCAGAGATATCCTAGAGA
+TAATCAAAGTATAATTTTTGCTAGATTTGCAATAATGTTTATGTATGGTATGGACATGCT
+TTTAGCAAAATATTCCTTGGGCAATCACCCTGATACAATGATAGATGACTATTTAGACAA
+CATAACATATTTAGAGAATTGCGGTGAAGAAGAGGCCGGCTACATTAACCTTTTATGGAT
+GGTTGGACTGGGTATCCTTTTGGAAATGGATAAAGAAGTGTTAAAAAGACTGGCAAGAGT
+TATAGAAAGGCAAAGAATAGAAGACGCACTTATGGATTTTCTATTGAAATCCTGTGATAT
+AGGTTGGAATCACAGTACAACGAAATATGAAAAAAAGAACCCGTATGAAAAGACAGCAGA
+GATTATAAAAATAGCATTACACGACAAAGACAAGGAAGCGGCATCAAAAAGGCTTGAAAA
+ATACATGGGAAAAGAATGGTTCAAGGGACATTACGACTTTGGGTGGAGGAATGCCCATAA
+GGAACCTGGCTATTATGGTTTTTGGAGTTTTGATACAGCGGCACTGGCCAAGATACTGGG
+ACTGGATGACAGTGCGTTAAAAGACAACAACCATTATCCTTATGATTTGGCACACTATAA
+AAATGGAATGACCTTTGATTTGAGTTGGTATAGTGTACCAAAGGAAGAGGAAGATAAGGA
+AGAAGAAACGGTGGTATATGGTATACCGGGTAATCCTGAGTTGGAGAGAATAATACCTGG
+GAGATTCCACAGTTTTGTAAATGAGATAATAAATGATTATAAAACACTGCCGGACGAAGA
+ATTTTGGAAGAAATACAATTTGAAAGAAATCTGGTTTGATGTGGAGGAGTATAAGGAGGA
+TAATAAAGATAAGAATTTGCTAGGAACGATTATAGTATTCATGCTTGTGGACAAAGATTA
+TATTTTGCAGTTGGATTATAAAGAAGAGTTAATAGACTATATAGAGAATATACATAATTA
+CTGGGCCAAGAAAGAAGTTAAGCTTATAAGCTTTGAATTAGACAATGACCAGCAGTACTA
+TGCATATGTGCCGAAGGATGCGGAGGTTGGTTCGTTGTATGAGGTAAAACTGACAGAAGT
+GGAGAAAATAGAGGAGGTTTAGTGTTTATTGTGTAATAGTGTGAAGAAGATGAGTTGTTT
+ATGAAGAATCTGCTGTATAATTGGATATATATAGTTTGATTTTGGGAATCTCCTTCCTGG
+CGAAACAAAAACTATAGGACAGTATTTGGGAAGGAGTATTTTTTGTGTTATTTTTTTTGG
+GGAAGATAATATTGTATTGAGAATAATAAGAAGTTTTATTAGGATTGTTTATGGTTGTCA
+ATGTTAATATAATCAATGTTAATATAATCAATGTTAAAAGGTATAGGAACAGAACTATAG
+CAGGGGAGAGTCAAAATGTACATTTGGCAGTGAAAGATAAGCTGAAAAAAGAGGGGCGTT
+CATTTGAATTAATTCCTGAAGATCTTGATGTTTATAAAGAAGCATTGGATTTATGGTTGA
+GTCCAAATTTGGAAGAGGTTAAAAGCGTGATTGATAAAATGATATTGTATCATTCCGTAT
+TAGTTTCGGACATTGATAACGAACCGGAATTTGGTGATTACACGTATGGATTTTATCCAT
+ATGAGATATTGTTTTTAATGCATATAAGGAGGAAATTAGGTTTGCCGGTACCGGATAAAT
+TTGAAGACTTGCTGATGAACACACCGGAAGCGAAGGTGGTGATTAATGAGCCGGAGCCAT
+ATCCGGAGTGGGATCCTTTGTTGAGAGCCATAGATGAGTTTTACCGAAAGAATTATCCAA
+ATTACATTCCCAACAAGCATGGAAAACTGTTTGAATAGGAGGAAACTGTTATGGCAATGG
+AAGATATAGTTGGGATTATATTTGAAGACATTGAGGAAGTGAAACCAATTTTAAGTGATT
+CGGAAGGAAATGATTTGGAAGGAAATGATTTGAGTGAGGCGATATTGGAATACGGGATAT
+CGGAAGGGAAGTTTCTGTGTGTTGATTATGGTGGAGAAGAGGGGAGCGAGATAATAAATT
+ATATAATGGATTATGAATTCAGTCATGGAATAGAGCTTGCAACACAGGAGGAGTTGGAAG
+AGCTGGACGAGATGGAGTATGATGATTTGACAGATAAGATAAAAGAAGTGAACAAGATAT
+TGGAGAAAGCAGGGTATGGACTGTTTTGCTTTCCAACAGGAAGTGATTTTTATGAGTTGT
+TTATAGCGAAGTTGGAGGATAAAGAGAAGTTATTGGAGGAAAAGATAGTTGATGATGAGG
+AGTTGCCATTGGAAGAGAGGTATATTCAGTATTATGTGTAAGGGGATAATCTGCAGTATT
+TAGAGTTTTGGATAAGAATATGGCTTTTATAAAAATATTGGCAGTGTAAATATTTTTGTG
+TAAACTAATTTTCCTTCTATGTTAGTGTTTAAATATATTTTAAGACTCGAAAGTCTGCTT
+TGTCAAATTTTATAGATTCAAAAGAATTTCTGATAAGAAATTCTTACAAAAGAAAAATTT
+GACAAAGATGATGCGTATAAAATATTACAGAGGGGTTCAGGAAACCAGAGTTTCCCTGAA
+CCCCTTGATTATACTATATACGCCCTTCGAACATAATCTGTAGCTGTCCCAGTATCAACC
+TCCAGTTTTTGTAACGCATCGTCCATTTTGAAGTAATCTTCACTGTAGCTAAATATATGC
+TCTTTAAAAGTGACTGGTCGCCAGGAAATACTGTCCTTGATTTGTTTATCCTTCTATAAC
+TGCTATTCAGGCTCTCAATAGTATTGGTCGTATACATGATTTTACGTAGTTCCTCCGAAT
+ACTTAAAAAATGGACAAATAACATCCCAATTGCTCTTCCAGCTCTTCATAGCTGCCGGGT
+ATTTCTTCTCCCATTTCTCTGAAACCTCAAGCATCTGGTCGTACCCTGCCTTCTCATTCG
+GAGCCGTATATATCCGTTTCAAGTCCCTGGCAAATTCCTTTCGGTCTTTATCTGACACAT
+ACTTTAGCGTGTTTCTTATCTGGTGTACTATACACCTCTGATATTCAGTATTCGGAAAAG
+CCGCATTGATTGCATCCTTTATCCCTGAAAGTGCATCAGCACAGAGAATCAGGATGTCTT
+TAACTCCTCTGTTTTTAAGGTCATTTAAGACACTCAGCCAGAATTTTGAGCTCTCATTTT
+CTCCTACATAAATACCGATAACATCTTTCTGCCCTTCTATATCAATCGCCAGCACAATAT
+ATACGGCCTTCTTCCCAACAATGCCGTCATTTTTTACTGAAAAATGAATTGCGTCAATAA
+ATACTATCGGATAAACCTCTCCCAGAGGCCTTTTCTGCCACTCTTCTATCTCAGGTAGTA
+TTTTATCAGTGATCTTACTTACCATCTCGGCAGATACTTCAAATCCGTAGATTTCCTGTA
+TCTGCTCGTTGATTTCTCTGGTAGACATCCCCCGCGCATACATTGCTATTATTTTATTTT
+CAATTTCTGAAATGTCCCTTTTATACCTGGGAACAATTTTCGGCTCGAATTCTGCATTCC
+GGTCCCGCGGGATATCTATTTCCACTTGCCCTACACTTGACTTTAATGTTTTTGATGTGT
+ACCCGTTACGGTAATTTGATTTCGCTTCTTCAGTTGATTCGTACTTTTCATATCCGAGAT
+GTTCATCCAGCTCTGCTTCCAACATATTTTGTATCGTATCTCCGAGCAGATCCTTCAATG
+CTTCCTGCAAATTCTTTGCTCAAGTGATGTTGTACTCAGAAATGAGATTTCTGATAAGCT
+CTTTCTTTTCTGGTGTTATTATTCTTTTTCTTGCCATAAAAAACTCCTCCTATACTTTAG
+TATTCTATCATAGAAGGAGTCAATTAGTTTACATAAATATTTTACAGTCTCTTAGCTTGT
+AAAGAATTATAATATAATATATATGTACAAAGTCGCTTAATTTTTGCAAAAGATCTTTGT
+ATAATCATAAAGTATTTAGATATTGCCTGCACAATTTCAGCTATAGATTCAAACAAGTTG
+TTATGCGTTACATTCATTCGGATGTCTTTCAAAAGGTGATCGATTGAATTCAACTCGGAG
+CTATAAGGAGGCAAATACTTAAGGGTAATGTTCTTTATTGAATCCAATGGGAGTATAAAT
+AATTTCATGTATTAAAAATTTTTCAGTTCTTCCTGGCAAGAAATTTTAAGTTTTCAAAGT
+TTACAGAATGTAAATCCTAAATCACTTCAATATTATATATTATTGCCGGTTTTGCTAAGT
+TTTACACATAAATTTGATTTAATTCGTCTATAATTATTTATAATGGAGTGTTTTGCCCTT
+TTTCGCTCAATTATCAACGAATTGGTTGACGAAAACCGGTGCAAGGTATATGATAGCGGC
+AGGGAAATAGATTTCAAATATTACAGTGATAACAATACATTAACTTTTACCCTCGGAAAG
+GGTTGGCACAACGTTGGAATTGTCCTTGTGGATATGGCGGGAAATGTAAACAATATTCAG
+GAGATAAGGAATATACATGTTGGATTTTTCTGGCTGTGGGTTATTGCAGCGGTGTCTGCA
+GTATTAATTGCGGCAATAGTTGCTGCTGTGATTCATAATATAAGAAAAAGGAGAAAAGAA
+GAGGAGGAAAACGAGCTGGCGGCGGCTTGATTTGTAAAATAGGTACGTTCTACTTGCTTT
+TTCAGAATAGAAATAATATAATAATGCCAGGAAAAGGCAGAAAAGTTTCCTGGCATTATT
+ATAATGCAACCACGGATTGCAAGCATTGGGATGATAATTTTGAGTTAATAAAATGGCAAC
+TATAACGTTATATGCCGGGAAAATCAACCAAATACCCGGATTGATAAATGAAGTCAAGAA
+ATCTGTGGTGGATTACAAGTCAGAATTATCCGCATTGAGAAAGAAAACTTTGAACATCAA
+CAGAAGTGTATGCAATTTGGATGAAGTAATAAGTTCCATACAGGCATCTTCCCAGACTCA
+GGATAGAAAAATTGATTCACTTGAGAAATTCTGCAGTGAAAGCGAGAAGTTTATATCGGA
+AGTAATACGTATCGATGAAGAAGTTGCTGAGCTTATCAATAAACGGAAAGAAAATTTTTA
+CAAAGAATATTATTATTTAAAACCGGAAAGCGAGAAAAGCGGCTGGGAAAAAATCAAGGA
+CGGCTTAAAGGCGGTTGCGGAGTGGTGTAAAGAGAATTGGAAATCCATTGCCAAGATAGT
+GGCTGCCGCAGTAGTTATTACCGGGTTAGGGATAGCGGCGGCATTGACAGGCGGTATATT
+GGGAGTCATACTGGCAGGAGCATTCTGGGGAGCATTGGCCGGAGGATTGATAGGGGGGAG
+CGGTTGGAGGAATAGCCGCTGCGATAAATGGAGGATCGTTTCTGGAAGGATTTGCGGACG
+GCGCTTTAAGCGGAGCAATTTCCGGAGCGGTGACAGGAGCGGCATGTGCCGGGCTTGGTG
+CTTTAGGAGCTCTAGCAGGGAAAAGCATCCAATGTATGAGCACAGTGGGAAAAGCGATAA
+ATGTTACGTCAAAGGTTACGGCAGCACTTTCTTTTGGTATGGATGGATTTGACATGCTGG
+CAATGGGAATATCATTGTTTGATCCATCCAATGCATTGGTTGAATTTAACCGGAAGCTGC
+ATTCCAATGCACTTTATAACGGATTCCAGATTGCTGTAAACGCGCTGGCTGTTTTCAGTG
+CCGGGGCGGCATCGACAATGAAGTGCTTTGTTGCAGGTACAATGATATTGACTGTGGCAG
+GCTTGGTTGCGATAGAGAATATCAAGGCAGGGGACAAGGTAATTGCGACGAATCCGGAGA
+CTTTTGAAGTAGCCGAGAAGACGGTGCTTGAGACATATGTGAGAGAGACAACGGAGCTTT
+TACATTTGACAATCAATGGAGATGTAATCAAGACAACCTTTGAACATCTGTTTTATGCAA
+AAGATGTAGGTTTTGTTGAAGCTAAAGAATTGCAAGTAGGAGATAAGCTGCTAGATTCAA
+AAGGCAATGTTTTGGTGGTGGAAGACAAAAAAATTAAAATTACAGATGAACCTGTCAAAG
+TTTACAACTTTCAAGTTGATGATTTTCACACTTATCATGTTGGCTGTAATGGTGTACTGG
+TTCATAATGTAAAATATAATGATGGTTCGAATAAGATTAATAAATGGGTTGATGAAGAAG
+GAAATATAATATGGCCTCCAAATAGAGGCTTCGACGGTGAACCGGTGAAAGTAACGTTGG
+AGCCGGGAACGCGAATCGATAGGTATGGCTATGAAGGAGGTACATTTGCTTCGCCTGTGG
+GAACGCCGTATGACTGTCGTTCTTTAGCACCGGGAACGGAAACTAAACCATATAATGTCT
+ATGAAGTTGTCAAGCCGGTTGAAGCACTAAGCGGCAAAATAGCACCATGGTTTGACAAGC
+CCGGTGGAGGAATACAATATGAATTTAGTCAGTCAATTAAGGAAATGTTGGAAGCAGGAA
+TACTAAAAAGGGTGGGATCATAAGATGAATAAAAATGATTTAAGGAAAATGTTGACCGAT
+AGCAATATACCTAAAGATACATACTCTTTGGACGGCGGTTTGCCGAATGAAGCATATTGC
+CTCAATCAAAATGGGGATAGATGGGAAGTTTATTACAGTGAACGGGCTCAGAAGACCGGA
+TTAAAAATATTTGAAACGGAAAGTGAAGCATGCGAGTATTTCTATAATTCATTAGTTCAG
+ATGTTAAAGGACATGGGCGTATTATAATTACAAGTTATCTGTATAGGTCATACAAGTTTT
+AACCGGTATGACCTATACATGATTCGGTTTACGGAGCTCATCCGATTATGCCTGAGGGAA
+GCTGATAAAATATGCATTTAATTGACTTGGAGATTTCCAAAATACAATCCATAAGAATAT
+ATTTGCCATGTAAAAAAGAGGATATAAAGCCATTTGATATTGTGTCAATAGAATATATAA
+AAGAACAAATAGAATATGATTTATATGTTGATGATTTTGCAACAGAAGCGATAACATCGT
+TGAAAAATCAGCTGAAAAAAGCGTTGAATTTTGAGTTGCATATTCAAAACGAATATATAA
+ATAAAGGGATTGGGTATTACTATAATATTTATGTAAATAAATTGTGGACAACTGATGCTC
+AAAGCCTTGTTGATCCATCACAAAATTTTAGCCTTTGGTCAACTCCAACTCATATAGGTA
+TTGAAACTTTTATGTATAATATTGATGATAAAATATATATTGAAATAAGTCCAATTTACA
+AGTGGAACTGCGATTATCCTGAGAATGAAAGTGAATATGAAACTTTTGACAATTTTCTAA
+ATAATTACAAACCAATTGATATTGTTTCAATTGACAGAAGTGTTGCTGAGAGATGGCTAG
+ACTTTTGTTGTGATATGATAAAGATATTTAAAGAAAACGATAAAAAGTACTTAAAAGAAG
+ATAACACAAATTAGCTTTTTATATGGCAATTTTTTATTTGTACAAAGCTACTAACGAATC
+ATAAAAAACTTAAGCTTAAGGGATAGGGAGAATTTGCAGGTCACGTAATTTCAACTAATG
+TGACCTTTTTGTTTAATATATATTATATTTATATATTAATTCAATTATATTCAGAGACAG
+GAAACACATTACAAGTTGTACAAAGGTAGTGGAATGTTTTATGTTATATGACCACAGCAC
+TTTCTTTTAGTATGGATGGATTTGACATGCTGGCAATGGGAATATCGTTGTTTGAACCAT
+CCAATGCATTGGTTGAATTTAACCGGAAGCTGCATTCCAATGCACTTTATAACGGATTCC
+AGATTGCTGTAAACGCGCTGGCTGTTTTCAGTGCCGGGGCGGCATCGACAATGAAGTGCT
+TTGTTGCAGGTACAATGATATTGACTGCGACAGGCTTGGTTGCGATAGAGAATATCAAGG
+CAGGGGACAAGGTAATTGCGACGAATCCTGAAACTTTTGAAGTAGCCGAGAAGACAGTGC
+TTGAGACATATGTGAGAGATACGACGGAGCTTTTGCATTTGACAATCAATGGAGAGGTAA
+TCAAGACAACCTTTGAGCATCCGTTTTATGTAAAAGATGTGGGTTTTGTTGAAGCGGGAA
+AACTGCAGATAGGAGACAGGTTGGTTGATTCAAGAGGTAATGTTTTAGTATTGGAAGGTA
+AAAAGCTTGAAATAACAGATAAGCCTGTAAAGGTTTACAATTTTAAGGTTGATAATTTTC
+ATACGTATCATGTTGGCGAAAATAGGGTATTGGTTCATAATGCGAATAAGTATGTTAAGG
+GAACGCGTAGTACTGTAGGTAAACTTACAGGTTCATTGGATGGGTTAACATCAGCAGAAA
+GAAAGGTTGTAAATGATTTGCTTTCACAGGGTAAGAATGTTGAAATAATTCCGCGTTCCA
+ATGTTCAAGGGGTTAGCACACCTGATTTTATAATAAATGGGGTAAAAACAGAATTAAAAA
+CATTAAATGGAACAAGTCTAAATACTCCGGTTACTAGGATTACAGATGCGTTTAAACAAG
+GTGCAGATGCAGTTATTATTGATGCAAGAAATGTTGGAATAACTGCTGAACAGGCAAACC
+AAATACTCAATCGAGCTGCAGGCACTTATCAAAATAAAGTATTACCAGGTCAAGTTGAGA
+TTTGGACTGTTGACGGTATTATTAGGAGGTAATAATTTATGAGAATGCAATGTAAGTGTG
+GAGAAATATTATCCAATAGTATGGCTCCTAATGACATCCAATTAAGAGTATATACTGATA
+GGGAATGGGATGATATAATTAATATGGGTGAAATTGATTCAATTAATATACCACACCCTA
+AAATCGATGTATGGCGTTGTCCTAAATGTGAAAGAGTTTATGTCTTTGAATATGGTAATC
+ATAAAGCAATAAAAGTCTATAAGTTAGAAGAATAGGTGTCTTTTTAAGGTCACACAGTTT
+CGTCTGATGTGGCCTTTTTTCTTATCTATGCTTGACAATATGTATTACAATGTGATACAA
+TAAAACCAACAAGAAATACAGGAGGTGCAATAATGTCTACAGAAAAGGATAGTATGTTAC
+GGGTAAGGCTTACAAAAATGCAGTCGGATGAATTGGATGCGATTATTGGTGAGCTTCAAG
+CACAGATGCCGGAAGCAAGCGTTACCACATCAAGCATAGCAAGATACGCTCTGGAGAAAT
+ATGTGAGCGACCATATTGCTAAGCGTGACGGAACCAAGATTTTTATTGAAATCAACACTG
+CTGATGCCACAGAAGAGGAGATAAAGAATCTCTATGACCTTCTTTCGAAGCTGTTTGACG
+AAGCAAAGGAGAATTACTCACCAATGGTTCATTACATGGTTGGGGAGATTTTAGAGCCTC
+TGATGATGAAAATGGCAAGACTCATGAAGCTAAAGAAGCCGGAGGTGAAGGCAGGTGAGT
+AAGAAAAAGTACATTGTCCGCTGTCCTCACTGTAATCACAGAGTATTTGATGCTGATTAT
+GCTGATGTTGAAATCAAATGCCCGGTATGCAAAAAGGTTTTTGAAGTAAAGCTGGAGAAA
+AAGGCGGGGTAAAAAGTGAATAAATCTGGCACAGAGCCACAAAGGGAGCGAATGACTCAC
+CTATAGAGCCTGGCAGATAGTCTTAAAAACTATTTGTCAGGCTCTATTTATGTTCTCGGA
+GGAGGTGAGAATTTGAAAATGACAATGATGGACGCAGCAATAAAATACGCAGAAGCCAAT
+ATCCCAGTTATGCCTTTGCACTGGATTTGTGAGGATGGCTCCTGCTCCTGCAAGGCAGGG
+AGTGATTGCGACAGCAAGGGAAAGCATCCGTTATATACCGGCTGGTACAAGAACTCAACT
+GCTGATATGGAGCAAATAAGGAAATGGTGGACAAAAACACCCAATGCCAATATAGGCATT
+CCTACAGGTGAGAAATCCGACTGGCTGGTACTTGATGTGGATGATGGCGGTGATGAAACC
+ATATCTGCACTTGAAGCAACATATGGAAAACTTCCGGATACGGTTACTGCTGTTACAGGA
+AGTGGAGGTTGGCACTATGTCTTTAAATACCCTAAAGGCCGGAGTATCCCAAATAAGACC
+AAGTTTGCATCGGGTCTTGATACGCGTTCAACAGGTGGACTGATTGTCGTGGCTCCAAGC
+ATTCATGTAAGCGGTAATCAGTACCAATGGTTAGAAGGACATTCTCCCTTTGACAGAACC
+CCGGCAGAAGCTCCAGCATGGTTATTAAAGCTCATGGAAAGGGTGGAAGTATTGCTTACA
+CCCTTTGAAGGTAGCAGTATTATAGCAGAGATTAAGGAAGGCAGCCGCAATAGCACCCTG
+ACGAGCCTTGCCGGGAGTATGAGAGCAAGAGGAATGACAGAAGAGAGCATCTATGCAGCA
+CTGCTTGCCGAAAACAAAGCCAGATGCAATCCTCCGCTTGATGAAGCGGAAGTTAAAAAG
+ATAGCGCACAGTGTCAGCCGATACCAGCCAAATCCTCCGATGAAGAAGCATTACCACAGG
+ACAGACAGCGGTAATGCAGAAAGGCTGCGTGACCGGTTTGGTTCAATCATAAGGTATTGT
+CCGGCTTTCAAATACTGGTTGGTATATGACGGCTGTTGCTGGAGGAAAGAAACCGGAGAA
+CTTATGCAGTTTGCTATAAAAACAGCAAGAGACATGCTCGCAGAAGCAAGCCGGATAGAG
+GATGAGGCTGCAAGAAAAGAACTGGTGCGCCATGCCATGCAGTCTGAAAACGCAGGCAGG
+CTTAAAGCCATGATCGATGTGGCTTCAAACCTTGAAGGAATGGTAATTATGCCGGATGAG
+CTTGATTCTGATATATGGAAGCTGAACTGCAAGAATGGTGTGGTAGACCTAAAGACAGGC
+GAACTCCTTTCTCATAAGCGGGAGTACTATATGAGCAAAATCTGTCCTGTTGAATATAAA
+CCAAGCAGCAAGGCTCCCAGATGGATGGATTTTCTGAATACCATTACGGGAGGAAGCAAC
+GAGCTTGTAAGATACCTTCAAAAAGCTGTAGGCTCATCTTTAAGCGGGGATATTTCAGAG
+CAGGCCCTATTCGTCCTTTATGGAACAGGAGCAAACGGCAAGAGCACATTTCTAAACACC
+GTCTCTGACCTGTTGGGAGACTATGCAAGAAATACTCCGTCCGAAACCTTTATGGCAAAA
+AGGATAGAAGCGATAGGAAATGATATTGCAAGGCTTCAGGGAGCAAGGCTCGTTACTGCC
+ATAGAAATAAATGAGGGACAAAGGCTCTCTGAGGCATTGATTAAAAGCTTCACAGGCGGA
+GACAGAATCACAGCAAGGTTCCTTTATGGAGAATACTTTGATTTCCAGCCGCAGTTTACC
+CCATTTCTCGTAGTAAACCACAGACCTGTCATAAGAGATACCAGTCACAGCATTTGGAGG
+CGCATTAAGCTGATTCCTTTCACCGTTACCATACCCGAGGATAAAAAGGATAAGCAGCTA
+CCGGCAAAGCTGAGAGAAGAGCTGCCTGGCATATTGTCATGGGCAGTTGAGGGCTGCCTT
+ATATGGCAGAAGGAAGGACTAAATATGCCTGATGAAGTCAAAGAAGCTACAGATGGGTAC
+CGGCAGGAAATGGATACTTTCTCATCGTTCATTGAGGAATGCTGCATTGTGGAGGAGGGC
+AGGAAAGTCTCCAATAGAAGCATCAGGTACGCTTACGAAACATGGTGCCGGGAGAACGGA
+GATTATCCTCTTGGTCAAAAGCTGTTCAATGCAAAAATGACGGAGCGCGGCTTTGCTGTC
+AAACGCAGCGGAGCCAATGGCAGCAGGGACTGGCATGGCATTGGTCTTGCTGAGGAGGCG
+ATACTTTTGTGATTACTGACGACTGACGGCTTCTGACGTCAATTCCGTAAATTTTTATAT
+ATATTTTTTCTTATGTGAAATTTATGAAAAAAGAGTCAGTAAGAGTCAGTACGTCAGTAA
+ACTCTCAGTACCCTGATGAGAGGGGAGGGGGAGGTCAAATCTCTACAGTAAAGCATAAGG
+GCAACGGGCTGGCAACATCGCGTAAAAAAACGCAGGTTCAAACGGGGTATTAACCCCAGA
+CCATATTTACAAAAAAATATTAAGAAAATGGAGGATTTAAGCATGAGATTTATAGCAGAT
+TTGGTACATGAGAAAAAGCAATTGGTGGAGAAAGCAGAAGCTATTTTAAACGAAGCTGAA
+AAAGCAGGTGGAAGTTTGACGAATGAACAGGAGCGACAGTTTAACCGCTACACAGACAAA
+ATTAAGAGCATTAATGAAAGCATTGACGAGGAATTATTAAATATCAGAACCTCTGAGCCA
+ATTCTAATTACACCACAAAAAGCTGTATCTCCTATTGAAGAATCAAAAACACCTGTAACA
+AAAGCCGTATCAAAATCATTCAGAGGGATGTTCTATGGAAACGAAACTGTGAGCTTAAGC
+AACAATGGTTTTCATTCCATGGATGAATTCCTGAGAACACTTCACTCAGGCAGAGCCGAC
+AACAGGCTAATAAATGCCAGTATGGTGGAAGGGATACCTGAATTCGGCGGATATTCCGTA
+CCGGAGGAATACGGAGCCTTCCTGATGGATAAATCCCTGGAGAATGAAATCATCCGTCCA
+AGAGCAACGGTATGGGCAATGGGAAGTGAAACAAAGAAAGTACCAGCCTTTGACGGAGCA
+GACAGAACCAACAACCTATTCGGCGGCATCTCGGGCGAATGGCTTGAAGAAGGACAGACA
+GGCACACGAAAAACAGCCAAGTTAAGGCTGATTCAACTGAAAGCCAAGAAGCTGGCTTGT
+TTCTCACAGGCATCCAATGAACTTATTGCAGATGGGATGTCCTTTGAAGAAATGTTAGCT
+GGAGCACTCATTAAAGGCTTGGGCTGGTACATGGACTATGCCTTTATCAATGGAACCGGT
+GAAGGCCAGCCTCTTGGTATTATAAATGACCCGGCGCTGATTACTGTAAATAAAGAGGAC
+TCTCAAGAACCAGCTACAATTACCTATCAGAATGTTGTCAATATGTTCTCAAGGCTTGCT
+CCATCCTGCTTTACCAATGCGGTATGGCTTGCCAATCCATCGGTAATACCACAATTACTT
+ACCATGACTATCACCATTGGTACCGGTGGCGCTCAGATACCGGTGTTCAGGGAAGAGAGC
+GGGAAATTCACGCTTCTGGGTAAGGAGGTCTTATTCACTGAGAAATGCCCCGCATTGGGT
+GCTAAGGGAGATTTAATCCTTGCAGATCTTTCCCAGTATGCCATAGGCATGAGGAAAGAG
+ATCGCTCTTGACCGCTCCAATGTCCCAGGCTGGATGGAGGATATGACCGACTACAGGGTG
+ATAGTGCGTGTAGATGGTCAGGGAACCTGGGATAAACCTATAACACCGAAAAACGGAGCA
+ACGCTCTCATGGGCAGTGGCTCTGGAGGCAAGATAGTCTGCTGAAATTTCAGCCAAAGCT
+ACCATTGAATCCAGTTTTAGGGTAAATGAGTGAATGCTTATTTCATTGCCACAGGACTCA
+ATTTGAGCCTAAACAATACTTAGGGTGAAACCGCCCAAAATGAGAAAATAGGAAGCTCTG
+CTCCTGTTTAACAGACTTTTTAAAAGTGGGTAGTTCTCCTGCCTGCTGGAATTGCTTTAA
+ACCCTCTGAAACCCATAGAAATACTGCTTTCTAAAGCATAATTGACTTGCTATATCAGCG
+GTTCAGAGTGATGAATGTTACTACGGAATAAAGGCTTTAACCGTAGGAAGGGGTGAAAGT
+GTGAGAGCAAAGATTACCACAACCATAGAGGAAGCCTTATTGAACAAAGCTAAGGCACTT
+GCCGGACAAGAGGGTTTGTCCGGTGCCAATGCCATTATTGAAAGGGCGCTGGAGTTGTAT
+TTTACCAGTATTCAATGTGAAGTATGGGAAAAATCGTTGCCCAGCGGCTGGATAAAGAAG
+CTGGTTCTAAAAGGGGATTTAATTCTGTACGAAAACATCAAGTGCAGAAAAACCTTGGAG
+AACTACAGGCCGGAAGATTACACACAGGAAAGCCTAAAAGCAAAAGGCTGGAAAAAGGTT
+TAGTAGCAAGTAAAAAGGCCTCTGTATTGCTCCCTGAAACGTAAAAGCGTAGGTTGCAGC
+CGTAAGCTTTGTTGAAACAAAAGGGGCAAGTAAAAAGGATTTTGTAAAGGTTGCAGCAGT
+TATCAATACAGAAATTTATTGGTCAGAAGCATTAAGAAATTAGTGTCCAAGAGAAGCAGT
+AAAAGAACATTAAGAAATTTGAACTAAGGCTCGTGATGCCTGAAATCACGTAATTTGTCA
+CATCAGGAATAGATAGGTTGGCGTTCCCTTGCGAGGATTAAGGTCAAGGGACACTTCTTT
+ACAAGAAATGTCCCTAATCGAATCTAACGCTCTTAAATTGAGGTTGCCGGTATGAGTGGT
+GGAGACATTGGAAAAGGAGAGGATAGATATTTATCATAAACGAAACACCTGCTTTGTTGG
+AATTGATATGCACAAGGACGCACATTGTGCAGTTGTAATTGATTGTTGGATGAATAAACT
+GGGTGAGGTTAACTTTGAAAACAGGCCATCCAGATTCCCTGCATTCGTTGAGGATGTAAG
+GAAGATTTGCGGCACAAAGGGAATTGTATTCGGACTTGAAGATACCAGAGGCTTTGGCAG
+AAACCTTGCTGCCTATCTGGTCGGCAGGAAGTTTGAAGTCAAGCACGTTAACCCTGCCTA
+TACAAGCGCTGTAAGGCTTGCAAACCCCATTATTTACAAGGATGACTCCTATGATGCCTA
+TTGTGTGGCAAGGGTGCTCAGGGATATGGTGGACACTTTGCAGGATGCCAAGCATGAGGA
+TATATTCTGGACAATACGGCAAATGGTGAAAAGACGGGATTTGATTGTAAAGAGCAATGT
+GATGAACAAGAACCAGCTCCACAGCCAGCTTGCTTATAGCTACCCATCCTACAGGAAATT
+CTTTGGCATGATTGATTCCAAGAGTGCCTTATGCTTCTGGGAGAACTACCCGTCACCGGA
+GTATATATGGAAAACAACACCGGAAGAAATATATCAGACGATAAAGCCTGTGCATCAGGC
+GCTTAAAATACAGCGCATCCATGAGATTATATCCATGATTGAAAGGGATGGAGACACAAG
+AAAGGACTATCAGCCCGAAAGGGATTTTATTGTCAGAAACATTGTAAAGGATATCAGGCA
+CAACAAGGAGTTGATTGCCGAAATTGACGATGAACTAAGAAAGCTGATACCTTTGACAGG
+CTATAAGCTACATACAATGCCGGGAATCGACCTTGTTACAGAAGCACAGATAATATCTGA
+AATCGGAGATATTAACCGCTTCCCAGACTCAGACAAGCTGGCTCGGTTTATGGGCTTGGC
+ACCGGTGCAATTCAGCTCTGCCGGAAAGGGTAAAGACCAAAGATGCAGGAATGGCAACAG
+GGCACTAAATGCGATATTTCACTTTCTCGCAATCCAGATGGTAGCAGTATCGGCCTCAGG
+AAAGCCAAGACACCCGGTATTCAGGGAGTATTTTGAGCAGAAGGTTAAAGAGGGCAAGAA
+CAAGCCACAGGCGCTTGTGTGCGTGGCAAGGCGGCTTGTGAGGATTATTTACGGCATGAT
+GAAAACCAGGACAGAATACAGGCCATTTGAGAAGGCTGACGACAAGAACTGA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_012982.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_014008.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_014168.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_014168.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1022 @@
+>NC_014168.1|provirus_27479_67296
+ATGACGCGCGCGGTTCCGGTTGCGGATGTTCGTGTGGAGGGCAGGCACCGCAGGGATTTG
+GGCGATGTGTCGGCGCTCGCTGCGAGCATTCGCGAGGTGGGGTTGATCCATCCGGTGGCG
+GTGACGGCGGATTTGCGGCTGGTGGCCGGTCAGCGGCGTTTGGAGGCAGCGCGGCTGTTG
+GGCTGGCAGACGGTGCCGGTCACGGTGGTGGCCTCCCTGGTGGAGGCTGCGGACTTGTTG
+CGCGCGGAGGCGGATGAGAACACGCAGCGCAAGCCGTTCACCCCGACCGAGGCAGAGGCG
+ATAGCCAGCGCGATAGAGGCGGCGCTGCGGCCCGTGGCTGCGGCGAGGCGTGCTGCTGCG
+ATCAAGGACCGAGACGAGAAGGGCAGGGCTCTGTCCACTTCCGCCGAATCGGCGGAAGTG
+GAGCGCCAACCCGAGACCAGGGACATAGCCGCGCAAGCGGTGGGCTACGGGCGCGACACG
+ATATCGAAGGTCCGCAAGGTCAAAGATCTGGCTGAGGACGAGGAAACCCCCGAGCCTGTT
+CGCGAGGCGGCGCGCTGGGCGTTGGGGGAGATGGACGCGACCGGCTCTGTGGCGGGTCCG
+CACCACAGGGTCATGTGCGCGGTGGAGGCCGAGGCGGCGCCCAAGCCGCATCCGGGGGTC
+ACGAAGTGGCTTGAGTCGAGCCAGGAGCTGAAGGACAAGGGCTACATGGTCGCGTTCTAC
+AAGGTGCTCAAGAAGTCGGGCGAGATGTTCCAGTTCGACCCCGAGCGCGTCGGGCGACTC
+GGGGACGAGCGCGACGTGGAGGTGGTCGAGCACCAGTTGAAGTCCACGCAGAAGTTCTTG
+GACAAGATGCGCGCCGCCCGGTCGGGGCTGCGCCTTATCAAAGGAGACCAGGGATGAGCA
+GACGGCGCGCGAAGAAGAGCGTGTGGAGCACCGCGCATTGGAGCCAGCGGGACCGCGACG
+AGCACGACGCTCTGGTGTACGAGGCGTGGGAGTCGTCCAAGCGCCAGGACGAGCGCACGG
+ACTTCTACCTCAACGGCCTGATCGACGCGGAACAGGCGCAACGGGGATGGGCCGTGGAGG
+TCTTGGCGCACTACCGGCGCAACGGCTGCGCGAACGGGTTGAAGAACCACATGAAGCGCT
+GCCGTGTGCCCATGTCGCACGATGGCCGGATTTTGAGCAAGCCCGCCGTGGTGGGAGCCC
+GCCGCACCGACGAGGACGGCACGCGGTACTACGAACAGGCGCTCATCTACTACGTGACCC
+TGCCCGAGCTGCGGGAGAAGCAGAAGGAGAGCATCGCGCTTTCGAAGACCTACGACGAGA
+CGACGGCGATGTTCGGCAAGCTCATCGCCCTGTGCGAGGCGGGCGGCGCGAACACGCCCG
+CCGAGGCTGCGGAGAACCTTGGCGTCACTGTCGAGGGCTGGCTGCTGGGAGCGGCGGCAT
+GACCGGCCAGAAGAAGGACGAGCGGTGCGCTTGGTGCGAGCGGGCGTTCCGCGCGCATGT
+GGCCGCTGGGGGTTCGTGGGCGAGCGCGCCGAGGGTGCGGGCGGCGCAGACGCGCACGCA
+TCCCGGCAAGGGCGGCGAGCCGGTGTGCATGGAGCACCGGGCCGAGTTCACAGGCGTGTT
+CGGAGTGCTCATATGAGCGGGCTTGTGCGGATCGAGAAGGGCCGCAACCACTTTTACGAG
+CTGGACGGCGAGCGTGTGGACGGTGTGACGACGATCCTCAGCGGCGGGATACCCAAGGCT
+GCGTTGATGCCGTGGGCGTTGAAGACGGCGGCGCAGTTTGCGGTGGAGAACTGGGACGAG
+CTGTGCGGGCTCGGGCAGTTCGAGCGCGTGGACCAGATCAAGAAGGCCCCTTGGCGCGAG
+CGGGACGAGGCGGCGAACCGGGGCTCTGAGGTGCATAGGCTCGCGGAGCGGCTGATGCGC
+GGCGAGGAGGTGACCGTTCCGGCCACGTTGTCGGGGCATGTGCGCTCGTGCGTGGACTTC
+CTGGACGAGTGGCAGCCGGTGCCGGTGTTGCTGGAATGCCCGGTTGCGTCCCGAGCGGAG
+CGGTACGCGGGCACGTTGGACGCAGTGGTGGACATTCCCGGCGAGGGGCGTTGCCTGATC
+GACTTCAAAACCTCCCGTTCGGGCGTCCACCCGGAGACGGGGTTGCAGCTCGCGGCCTAT
+AGGCACGCGGACTTCGCCCTGGCGGGCGGGGAAGAGGTCGCTATGGGCGGTCTTGGCGTC
+GAGAGGGCGTTCGGGGTGTGGCTGCGCCCGGACGGCTACAGCGTCCACGAGCTGAGGGCG
+GGAGCCGAGGAGTTCGCGGTGTTCCTCAGCGCCGCGCGCATCGCCCGCTGGGCGAAGACA
+TCGAAACAAGTTGTCGGTGAAGCTTTGGAAAGGCAGAAGCATTGAGCGAGTTAGAGAGAA
+CCGAGACCGAACCGGAGCAGCGGGCGCTCTCGAAAGTCGGGCAGTGGGCGCTCGACGCGC
+GCGAGGCGCACCAAGTGGCGCAGTCGTTGGCGAAGACGTCGTTCGTCCCGAAGTGCTATC
+AAGGAAAGCCGTCGGAGGCCACGGCGGCGATCCTCATGGGCTCGGAGATCGGGCTTTCCC
+CGATGACTGCGCTGCGCTCCATCGTCGTCATCCACGGCACCCCGGCGATGACTGCTGTCG
+CGTTGCGGGGCCTGGTGCAGTCGCAGGGCCATCGGGTGTGGATCGAGAAGGCGAGCGACC
+AGTCCGTCACCGCGAAAGGCGTTCGGCAGGGCGACGACATCGTGCATGAGTCCGTGTGGG
+ACATCAAGCGCGCGGAATCGCTCGGGTTGATGGACCGGGATCAGTGGCGCAAGCAGCCCA
+AGGCCATGCTGACCGCCCGCGCCACGAGCGAGGTGTGCCGCCTGGTTTCCGCTGACGTGC
+TGCTCGGTCTGCCGTACTCGGTCGAAGAGCTGGACGAGCCCGAACCAACGACGACCGTCA
+AACGCAAACGTCTTGAGCCGGTCGAGTCGCAAAGCTCAGAGAGAGCCGAAGCCGAGCCCG
+CCGCCGCTGAGGAGCCACAGGAAGAAGAGGCGGTCTGATGGCAGGCGACACTGTTATCAA
+TGTGGTTGGGAATCTCACGGCGGACCCGGAGTTGCGGTTCACGCCGACCGGGGCTGCGGT
+CGCGAACTTCACCGTCGCGTCGACCCCGCGTGTGTTCGACCGGCAGACGAATCAGTGGCA
+GGACGGGGAGGCGTTGTTCTTGCGCTGCAACATTTGGCGCGAGGCCGCGGAGAACGTCGC
+GGAGTCCCTTGTCAGAGGTCAGCGAGTGATCGTTGTGGGCAGGTTGAAGCAACGCAGCTT
+CGAGAAGGACGGGCAGAAGCGCACGGTGGTGGAGCTCGAGGTGGACGAGATCGGGCCTTC
+GCTGCGCTACAGCACGGCGAAGGTGAGCCGCGCGAACCGTGGCGGCGTCTCGCAGTCCGA
+CGAGCCGGATTGGCGGTGACGGCTATGGAGTCTTCCCCGGTGTCGTTGGAGCTTGAGCTT
+CGCGAGTTGATGAAGCAGCGGCGGCTGGCGTCGCTTGAGAAGCGGGATTTGCGGATCAAG
+GCGGACGACGAGCGCCGGGAGTGGAAGAGGGCGCACGCGGTGTGTCACGCCTTCTACAGG
+AGCAAGGGCTACGCGGTGGAGGACGCGAAGCAGGCCGCGACAGCGGATAAGGGGGTGATG
+GCGGCTCAGCAGCGCGCGGAGCATGCCGAGGCTCTTGCCGGGTACGCGGCGGACCAGTTG
+CAGGACTTGCGGCAAGAGGTCATTGCCGTGCAGTCCCTCATCAGTTTGTGGAAAACCCTT
+GTCGAGAACGGAGGGTGAGCGGTGAGCGACCAGATAAAGAAGGCCGATGAGGCGTTGCGG
+GCGCATGAGGAGGCGTGGGTGCGCCGTTACGTGCAGCTCGGGCATTCCCTGGAAGAGGCG
+AGGGCGGCGTACCGGGCGAAGTTCTGGGCGGGGGAGGTCGATCTGCGATGGTGAGGCCGA
+TATGCCGGTTCGAGGGCTGCCAGCGGGAAACCACAAGGAGCAGCTTGTGCCCCGCTCACG
+AGAGGCAGCTTCACAGGCGTGGCGAGGGCGGGTTGACCCCGCTGGGCGTGCCCTTGTGGA
+AAGGCTGCGTGGTGCCGGGGTGCGAGCGCAGGCGTTTCGGGAAGAACATGTGCGGGCTGC
+ATCTCAACCGTTCCCGCAAGGGCTTGCCCCTGGACCCTTGGACCCGGCATGACGAGAAGG
+TGTACCAGTCGGCGCTACGGGGTGTGGCGGGTGTTTTCGAACGCCGTGTTGCGGTGGAGA
+TTGAGGCCGGGGAGTGCCGCGCGGAGGCTGAGCGGAAGTTCCGCGTCGAGTTCCAGTTGC
+TCGCGTCCTTCCTGGATGACTTCGCGGGAGAGGGGGCGCTGCGATGACCGCCGAGTTCAG
+CAAGCGCGCCCGCGCTCTTGTGGAGTTGCGCTCCGAGGGGAGGTGCGAGGGCGAGTTCGA
+CCCGCGCGAGCGCTCGAAGAGGCCCCGGTGCCTTCGGGTGGCCGAGGAGATGCACCACCG
+CCGCACCAGGGGCTCGGGCGGCACGAGCGATCCCGCGTCCTCGCAGGTGAGCAATGCTTT
+GGCGTTATGCCGCAACTGTCATCACTGGGCGGGGCAGTGCTTCCGTCTCGCGGAGGCGCT
+GGGGATCTGCGTGTACCAGGCGCACCGCCCGGACGCGCGGCCCGTGTTGATTCGGGGCGA
+GTGGCGCCTGCTCTTGGACGATGGCGGATTGACCCCGCTTATCCGCGTGGGCGAGGACGA
+GTGGCGTTTCGACGCGCTCGGCGGCCACCGCTACCCGGCGTGGCTGGTGGACGGCGCTAC
+ACCGCTCGATGAGCGGTACGTGGACGTGAGCGGGCCGTTGGATGCGAACCGTTACGCGAC
+GAGATGGGCGGTGGCCTGATGTCGTGGTTCAAGGTGGATGACGGGTTCTACGCGCACCCG
+AAGGTTATGGGGCTCTCGGACGGCGCTCTGAGCTTGTGGACGCTCGCGGGCACCTGGTGC
+GCTCACCAGCTCACGGACGGCGTTGTCCCGCACGCGGCGCTGTCGATGCACAGGGGCACG
+CCTGAGCGGGCTCAAGAGCTCGTGGAGGCCGGTCTTTGGGAGCTGCACCCGAAGGGCCAC
+AAGTTCCACGACTGGGAGCAGTACCAGCCCACCAAAGAGCAGGTCGAAGCGGAGCGTGAG
+GCCGCGAAGGAGCGGATGAAGGCCGCTCGGGCCAAGCGCAAAGCCGCGAAGCCTGTTCGG
+GAGAACACTGAGGATGGTTCGCGCGATGTTCCGGAGAACACCGAAGACGGTTCGGAGGAT
+GTTCGGGCGAACACCGACCGAACTTCGGGCGAAGTTCGCCTAACCCCGACCCGACCCGAC
+CCGTCCTTATCTACTGACGTAGATAACTCAAGTACTTCGCCTTCGGCTCAGTGTTCACCC
+GCCGAGCTTCGCGCCGAGTTCGCGGCGTTCTGGACCGTCTACCCCCGCAAGTCGGGGAAG
+GCCAAAGCCGAGAAGGCGTTCGAGCGGGCCAGGCGCAAGACCACCGTCGAGGCGATGACC
+GAGGCCGCTGGGCGCTACCGGGACGACCCGAACCGTGAGGCGGGTTTCACGAAAGAGGCA
+GCGACCTGGCTCAACCAGGAGTGCTGGAACGACCCGCCGCTGCCGCCGAGGTTCGAGCGC
+ACCAGCGCCAAGCCTCCTCCCGGCCCGTTGGACGGCTACGGGGCCGGTGTGAAAAGCCAG
+ATCGGATGGGAGATGCTGAGCCCCACGCCTGACCCGCAGGCGGTCGCGATGGCCGAGGCT
+GCGGGCTACAAGCCGCCATCGAACGGGCACAGATTGCGGGAGGTGGGCGCGTGATAACCG
+AACAGGAAGTCGTGTTGGTGCTGCGGAAGATCAGCGCGAACGACAAGCGCAAACCGGATC
+AGTTCGAATTGGATGAGTTCGTTTCCGCCGCGCGCCGCCACAACTGGACGTACCGGGAGG
+CGTGCGCCCAGGTGGACGCGTTCTTCGACATCCCGCGCGGCGGGGAGAGGATCACCCACG
+GGCACATCACAGCCGGGATCAAAGCGGACCGCAGGCACCCGAAGCCGGTGGCGGACGTCC
+TGCAACTGGAAGGCCCGAAACCCGCGAGCGAGGACAACCCCGACCGGCAGCGCGTGCTGG
+CGATGGTGCGCGAGCTGAGCCGCAAGTTCTCGATGCCCGAGGAGACCGCCCGGTGAACCG
+CATGAAGCAGAAGGGGGACCGCGCCGAGCGGGAGGCGGGGCGGATCGCGGGGGCGTCTGG
+TTTCCCGTGGTGGGAGCGCATGAAAGCCGGGGCCGAGCGGGACCGGGGCGACTTGACGCT
+GTGCCCGTACGTGATCGCCCAGGTGAAGGACTGCAAGCGCATCTCGATCCCCGAATGGCT
+CAGGCAGCTCGCGCAGCAGAAGCGCAACGCCCGCGCCGACGTCGCCGTGCTGGTGGTGAA
+GCACTCCATCCCCGGCAAGGCCCCGGTCTGGTCGATGATCCTGCCCTACCAAGAGGGATT
+GCGCCTGCTCAGGCAAGCCGGATGGGGCGAACCCGTCACCGACGAACCACGCATCACCGA
+GGAAAGGACAGAGCTATGAGCGGAAACCCGATAGCGACCACACGCTACACCGTTCTCTCC
+GGGCCGGGGAGCGGCCCGACGCTGGGCGAGCTTCGCGAGCTGGTCGCGAAAACGCACGAC
+TGGGCCGCAGACTCGCGCGTGCTCATCGCCCGCTCGCGGATCGACCAGGACGACGAAAGC
+TGGCACATGGCGCTGCTAAGGGAGGCCGGGAAATGAGCGAGGACATGTGGCGGGACGCCG
+CCCAGGTCGCGGCGCGGAACAATGCGGGCAGCGGTGGGCGTGTGCCGCTTTTGGCGTTCG
+TGGACCGCAGTGACATGGCGCAGGTCGGTGTGCTCATCGCGGCCCTGGTGGCCATGGCGT
+GGATGAGCGCGGACGGGTTGGCGTGGGACATGGCGGGCGTGTTGAGCTTCGCGGGGGGAT
+TTTTGACCGCGACGTTGGTCAACGCGCTCGTGTTCACGCTGATGGTCGTGAACGGGCGGG
+CGGTCTTGCGTCGCCTTGCCGTTGAGAAAGGAGCCGGGGAATGAGCGCCCGCAAACTAAT
+GGCAGGAGCCGTGGCCGTCGTCGTGGTCATAGCCGCCGCTGGCTGCGGCGCTTCTAACGA
+GCAAATCAACCCGCCTGAACCGCAGGTGTGGCGGCTGCCCATAGCTGATGGCCGGAAAGT
+CGTGTGTGTCTCGATCAGCAATTCGAGCAACACGGCGATGTCCCTTTCCTGTGATTGGGG
+GAATGCGAAATGAGCGATGAGCTACCGATCGGTGTTGTGGGACGGCGCATCGTCTCGATT
+GCAGAAGGGGCTCGCAGAATTGTCGAGCCTTCCGCTTACGACTCGTCGCCGTTCGTCCAC
+GACGGCTTGGTGATCGGTCTGGACGACGGATCTGAACTGTTCATTCAGGACAACGGCGAG
+TACTACCCAGGGTTCTTCACACACTGGCTCGGGCAGAGCATCACCGAGGAAAGGACACAG
+CAGTGAGCAGGGCGAGCATCAGGAGGATCACCATGTGGAGTGACGTCGCGTTCACTGCCC
+TCCCTCCGGGGTGGGTGAACGTCTACAGGATGGACGACGGCACCTATGAGACCGAGCCCT
+GCCCCGGTGTGCTGCTGCAAGAGGCGACCCAATATAAAGAATGCTGGGACGAGGAAGTGG
+GCGGCAGTAACGTGCTTCGGACCCGTCGGTGCGAGATGGACCGTGAGACAAGGACCGTGC
+CCGCCGAAATCTGTGTTGGAAACTTGTCGCCAGCCTGCGATGTCTCCAACTATGTGACAA
+CCGCCACGGCTGAGGAATGGGAGGGCCAAGAGGCCGGGGAGGCCGGGGAATGAACGCTCA
+AGAGTTGAAAGAGTTCATCGATGAGCACATGGCGCAAGACTGGCTGATCTTGGTGAACGA
+GATGACCGGGGCCGCGCTCGTGGCGGACTTGGCCATCACGAGCGCCGAGGGCTTTATCAG
+GCTCTCGGGCAGGATCACGCCTGACTTTTACAGGTTCGACCCTGAGACTGGTCGGCTCGC
+GCATGAGCGGTACTCGCTTGAACTCATGAGAGGTTGGCGCGCGGTGAAGCCTGGCAGCCC
+GGAGTACGAGGCGGCGATGCGCTTGAACACTGCACGGATCAAAGCGCGGGCGGTGTTCGA
+CCAGTTGGGCGCGGGCGACATGACCATGATCGAGACACGTTGGCCGGTGATCAGGGCCGC
+GATGTCCAACGTTTCGGAGGCTGCGGCGCATATTGCGGCGGCGGATGAGTACGGGGAGCT
+TCTACGGCGGCAGGAGACCATCAAGGAGGCCGGGGCATGACGGACGGTGGTTTGGATTTC
+GGGGATGGCGTGACCACAGCCCCTACACAGAGGTGGGCCGAGGCAACGACGAACGTCTCC
+GAGCTGCGGGACGTGTGGGGCGAGCTGGCGAACCATAACGGGCGCGTCACCGACCTTGAG
+GCGGAAGTGGAGAGCGTCAAAGCCGAGGTGCGGGCGCGCATGCTGGAAGCGGCGTATCCG
+TCCCGTAAATCGCTCCTCGCCTACATGCGGCCCGCGCGTTGGGCGCAGCTCGCGGCGCTG
+TTCGCGAACCTCGCGCTTGTCTTGTGGTGGGCTGTTGTCAGCTGCGGCATGGGGATGTCC
+CCTTATCCCGGTGCGATTGTCTGCGGGATCGCGATCTGCGCTGCCTGGATCTTTTCGGTG
+GAGGCGTTATTCGAGGCGCTGGACCGCAAGGGGGCCGGGGAATGAGCGATGAGACCAAGC
+CGTTCAGGTTGCAGGATCAAATTTTAGTCCTGATGCTGATGCACCTGGACCGGATCGATG
+AAGCCTACTGCGCCACGCTCGACGGCTATAAGGTGACCGAGGCGCGGGCCGAAGATGTCG
+ATCTTCTCCGCATGTCGGCGTACTTGGCCGAGCACGCCGACGCGTTCCGCGACGACTCGG
+AGGCTGAGTCCGGTGAGATCCGTGTGGTGGAGGTCGCGAAGGGTTTGCGGATGCTCAAAG
+CCGGTGACATGTGGGTCACCGAGAGCATGGTCGAACAGCTTGGCAGGGTCGCGTTCGATG
+ACATCAAGCCCTTGGGCAAGGTCAGAATCCCCGTCGCGAAGCACTTCGGACTGGCGAACA
+CCTACGCCATCGGCCTTTCCAAGAGCACCGGATGCCTCTCTTTGGCCTCATCGGCTGGAA
+CCGAAAAACTGTCACGCAACTTGTGTTTCTTCGGAGATGAAAAGTTGGACGAGACGCAAT
+CCGAAGAGGCCCACATCTATGCCGCGCAGGAACGAGCTATAGCCGCCCTTCCCTTGATGG
+TGTTGGCGGACCAGGCATGAGCCGCGATGAGTTCTGGACCGGCCCAGTGTCGTTCTGGAC
+GATGACCGGGGCGGGGTTCGTGTGCGCCGCGCTCGCTGGGTTTTTCGCCGCGCAAGGGAA
+ATGGCCGCTGGCCCTGTATTTCGCGTTCGCGGCCATCGTCTACCTGTGCTGGGTCAAATA
+CCGGCGTGTGGACGACTCGCGCCGCGCGTTCGAGGACGGCAGGCGTTACACGGTCGATGA
+GGTCGCCCGGATGCGGCGAGTGCTTTGGGAGTCCCGACCACAGGTGTCTTACACATACGC
+GCCGGGTGAAAGCGAGGAGTCCGCATGAGCGTCACAACCTTCTGTTCTGTCCCGCATTCG
+CGTGAGGCGACCGAGGACGACCCTGCCGACGCGCTCAGGGAGCACGGCGGGCGCCTGGTG
+GTGTACGACTTGAACCGTCCCGCCGCGTTCGACGGGGCGTATTTGTGCGCGGGTCACCTC
+GCGCGCCTGGCGGACTTGATCGCCCAAACCCCGCATATTGTGGCGTTGCTGTTGTCGGAT
+CGGGAGAAGTCTTGCGCTTGGGGCGATCAGGAGGGCACTCGCCGCAAGACCGACCCCCCG
+GCTCCGTTGAGCCTCGCAGCCCTCGATGAGGCCGACAAGGAGTTCGCCGTGTTGCAGTCG
+TGGGCTGAGAACCATCGTGACTCCACGGGGCTTGTGCCGCCCCGTATACAGCATTTGTGG
+AAGCGCGGCGGCGCGGGGGAGGTGATCGGCGCGAAGTCCGGGCATGTGCGTCTCTGCCAC
+GCCCTTGTCGGGTACCTGTTGACCGACCCCAATGTGCTCGCAAGCCAGGAATGGGCCGGC
+GAGATGCTGCAAGAGCTGGCGGACATGCGCGCCCGCCGCCGTCCGCGTTGGCGGCTCGTG
+GACGAGCCGACGCCGACCGGGTACCCGTGCTTGAAATGCGGGGGCCGCACGATGCTGTTC
+CGCCCTCCGATAGACCAGTTCGACCCGTGCCTGGTGCAATGCCCCGGTTGCGGTTTCACT
+TTGGAGCGCGAGCAGTTCGACCGGATCACCACGGTCATCGAGGACGGGAAAACACCGCGC
+GGGAGGGTAGGATCGGATGCGTGAACGCGCTGCTGGACGTGGATGTTCCCGAGTTCGTGA
+CGGTGGAGCGGGCGGTGCGCGCCACGGGCCGATCCCGCCGCACTATCTACCGTTGGAAAG
+AGTCCGGGGCGGTGCGGTGGCGGATGTTCGAGGGGAAGTTGATGGTCGAGGTCAACGACG
+CCGACGAGGCCAAACTGCGGTGCTCGGACGCGCGACGGGCGAACCTGCGCCGCAAACGGT
+AGATGATCCCCGTAAGTATTGCCAAACATGGCGAGGCGTCGTAGGCTGCCCAAGCGATGC
+GGGTGTTAAACCTGTTCGGTGTTGGGGTGCTTGGCGGCGCTGGGTGAAAGAGAATGCTCG
+TTGAATCTTGGTGATGTGCGGAGTGTGGATGTGGCCGCGCTCGGGGACTTGGCGACGAGT
+CTCGCGTCCCGAGCGTCGTCGTTGGAGGAGGCGCGGGCGCAGTTCGCGAAGATCACGCAG
+TTCCCCGGCTGGTCGGGGACGGCGAAGGACGCGGCGGCGGGGAGCTTCCAGCGCGCGGAC
+GCGAGCTTGTTGGACGATGTGGCGCGGGTGTCGGCGGTGCATCAGGCGGTGTTGGAGCTG
+TCGGCGGACTTCGCCCAGTTGCAGGCCCGTGTGCGGGAGTTGGAGCGGGAGGCGGCGAGC
+ATCGGGGCGGTGTTGGGCGACGACGGCAAAGTCACGTTCCCGGAGGGGGCTCCGTGGCCG
+GATGCGACCCAGCAGCACCGCGCCCTCGTCATCGGCGGCGAGGCGTACGAGTTGATGACA
+GACGCGGACCGGCTCGATGAGAAGGCGGGCGAGGTTCTGCGCAAAGCTGTGGGCGGGGAG
+ATCAACGCCGCTGGCACGGGGAACGAGACACAGGCGGCGCTGGCCGGGGCGGCGCAAGGC
+ACGTTGGGCATGCCGGAGCCTCCGAAGGCCCCTGGGGGGCATGCGGACCCTTCGTACAAC
+GCGGGATGGTGGAAAGACTTGACCCCGGAGCAGCGGCGTCGGGTGCTGGACTTGCACCCG
+GAGTGGGTCGGCAACCTGGACGGGGTGCCCGCGTCCGTGCACGACGAGGCGAACCGCAAA
+ATGCTGCCGGGGGACATCGCCCGGTTGCAGGCGGAGGTGGACCGTTTGCAGAAGCAACTG
+GACAGCGAGTTCGGGCACGGCGCCTTCAGCAACACAGACTCGGACCTGTGGTACGCGCAG
+CGCCGGTTGGAGGGTTTGCAAGCGACCGAGAAGGCGCTGCGGGACAATCCCGGCACGAAG
+CTCCTGGTCCTCGACCCCGACTACGGGACCAGGGGCCGTGTCGCCATCGGCACGGGCGAC
+CCGGACACCGCCAACCACATCTCCATCTCGACCCCCGGGGTGAACTCCTCCCCCGGGCAG
+AGCATTGGGGAGATGACCAAAGAAGCAGTAGCTCTAAAGACTGAGACCGAGAACGTGCTT
+AAGGCCAATGGGCATGGGAACGAGACGGTCTCGACCATCTCGTGGATCGGGTACGAGCCG
+CCGCAGGCGCAGCTCGACCCGCAGCACCTCGACAAGACGGGCGACGTCGGACCTGGCGGG
+TTGCGGGACGAGCCGGGGGGCTTGTCCGACGTGGCCAGCGATGCGAAGGCGAAGGCCGGC
+GCGGCGAGCCTTTCGCAGTTCTACGAGGGCATCAGCGCCGCCTGGCATCCTGCGGACGGA
+GACTCCGCCACGAGCCCGCACATCACCGCCCTCGGGCACTCCTACGGCTCGCTCACCACC
+AGCCTCGCGTTGCAGCAGACACAGACGGGAGTCGTGGACAACGCCGTGTTCTACGGCTCC
+CCCGGTCTGGAGCTTCCTTCCCTTGACCGATTGCCGGTCGCTACGGGGCACGCCTACTCC
+ATGCAAGCGCCGAGCGACCCGATCAACTACGTCCCCAACCTCACCGAGCACTACGGCCCC
+AACCCCGTCGAAATCCCCGGCATCACGAGGCTGTCCACCGAAGCCGGGGACACCACCGGC
+GACGCTGCACCCGGCACGACGGTGCACCACGACGGCGCGCACGGTCACTCGGAATACCCG
+CGCAAAGGCGACAACGGGCAGTTGCGGATGCCTGGATACAATATGTCTGTGATCGTCGCG
+GGGATGACCGGGCAGGACGGTCGCCCCGACCTCACCAAGAGGGGAGAATAACCCTTAAAT
+GACGTACCCGGTGGAGAAGAGGAGTTGGTTGCGACGGCGTGCGGCGTGGTTGTGGGCTGC
+TGGTGTGGTGGTGCTTGTCGGGGTGGTGTTGGTGTGCGGGGTGGGGGTGTTTCGGTTTGT
+GGAGGTGTTGAAGGGCATGGATGACGCGCCGCGGCACATGGCACAAGAAAAGGTTCCGGC
+GTTCGAGGAGCGGTATCGGGACAAGGGCAGTGTGCAGCAGGCTGCGGAAGACTTGGAGGC
+GGTGATCGCTCGGGCCGCCGACAAGATCGCCGCGCTCGTCCCCGGCCTGACCTGGAAATG
+GCAGTACGATCCTGGAAACATCGGCTGTCCGGCCGATGCTGCCAGCGACACGAGGGTCAC
+ACGATTCGCGACTCGCCTAGCGGGTTTCGACGGCGCCATTCCGGAGGACGTGTGGCCCCG
+TGCGGTGGCCATCGTGCGCAGCGAGGCGGAATTCCTCGGGATGACGGCCCAGTTCAAGTA
+CCAGGACGCGGCCAAGCAGCACGACCTGGTGTTCTCCTCTCAAGACGGCGGGGAGATAAG
+AATCGCCACAGCCGTAGAAGCGTTCATCAGGGGCAAGACCCCGTGCCGGTTGATGGAGGA
+CTGGTACACCGACCGCAATATTCCTATTCCGGGCACGGGCAAGGAGCCGCGATGACAGCC
+GATGGGGCTCCCGCAGGAGCAGGCCAGAGGATCGAGGTTGCGCTCGAAGAGCTTCACGCA
+GGCGCGAGCCAGCTTCACGACCTCGCGCAGGAGGCGACGAGCAAGCTCGCCTCAAGCGAT
+CTGATGTTGGAAACCTCCTCGCGAGCGTTGAAAGGCTTGAAATCCGCAATCGAGTTCGCC
+GCCTACGCCGAATTCGAGACCGCGCGGGGCAAATCCGCTATCGAGACGATCACCGCTGCG
+GCAGAAAACGTCGGGTATGCCGCCGAGCACTACCACGGCACGGACGAGTCGAACGCCGCC
+AGCCTCGGTTGACCAACCCTCCTCGTTTTTCGAACACGTCAGCGTGTCGTGTTGACGTGG
+GTAATCTTCGAATGGCACACTAATGCCAGTAGCACCCCTATGCCTACTGTCGCCAGATCC
+TTTCGTTACATGAGCGTTGATCCTGGTAGGGCCGCTTCCCGCCTGGTGTTGGCGCACCAG
+GGCGACGGGGAGCGGTTCTTTGTTTCCGGGGTTCTTTGGAGGCCGCATGCCCAGTCTTGA
+CGCTCTGCGCGACGAGATCGACCGGGCCGTGACCGCGTATGTGGCGCAGTCCCGCGCGGA
+GGACGGCGACAGCCCCGGTTTGCCCGGTCCTTGGGTGGTGGCGGTGGGCTCCCAGTCGAT
+AGACGACGACGGCGAGACCATCCACACTATCGAGCCTGTGGGACAGCCCGGATGGGTCAC
+GAAAGGGCTTCTGCTGTCCACGCAGGAACTCTTGCGGGCCGAGTACCAGGAGCGCGAATG
+AGCGCCAGCCCGAACGGCATGGACGGGGATAGTGACGGCGGTAGGATCGGGGCATGAGCG
+ACACCACGGCCTTGCCGGTCAAGGGACGCACGCTGATCGTGGCAAATCTTCAAACCAAGA
+AGGCCCTGCAAATCGGGCTTGGACCGGAAGTGACTATCACCTCCACATTGAGAGTTCCCG
+ATGGTTTCGGGCCAAATGCTCCTGAACCGCGACAACTGCACATCGCCGTTGGGGGCGACT
+CTGAGGCGGTCAACTCCGCTCGGGCTGCTCTCTCGCCCGAAGAGGGCGACATGATCGCGG
+TGCAAGACAACACCGACGATTCCGTGCCAGCGTGGTTCGCGCTCTCTCGCGAGACGATCA
+CGCGGGCGGCGGACGGCCAAGCGCTTTGGAGCATTGAGGGCGTGAGCATGTACGACCTGC
+GGCGGGCAAGGGCATGAGCAAGCGGATAGCGCCGTCGAGGCCGGGGGTTGACTTCCTGAT
+CGACGGGGAGCTGCACAAGGTTCCCCGTTCTGCGATGCTTGAGCCTTATGGCGCAGCTCG
+GCTGCAAGACGGCTCGATGGTCTACAGGTTCATGGCCGAACGGCTCCCGCCAGGGCTCAC
+CGAAGCGGTGAAGAACTCGGCGCACGCGGTCAACATCCGAGAGCACGACGCCATCCGAGG
+GCACGGGACGCTCAGATACACCGAACCGCTGTGGGTGACAACTGTTGTCGAAGAACGCGG
+GGTCACCACGTTCAAGGCGGTGTTCACGCAGATTGAACGTCACATCCTCGGGTGGCCGAC
+CCGTGATTTGTGGGTTAGCGCCCAGGCGGCGCCTGTCAGTTGCAGACCGAGAGGCGGATG
+TAGCAGTCGGCGCGGCTTGTGGCCTCGCAGCCTTGTCGGGCCATTTCGCGCGCTCGGGAC
+GCGGAGCTGCTAGCCGCAAGCTCGTAGCCGCGCCTCCCGTTGACGCTGTCCCTGGTGAAC
+GCGATTGCGGCGCAACCCCTGAACGGGTATGTCCCGCACCGTGGCCCGCACTTGTCCTTG
+GCTGCGAGCATGGCGTAGTTTCCGCTGGAAGCGCCGGTGGCCGCAGTTGCGTTCCCCTGC
+CTGTCGTAGGCGATGGCGCCCCAACGCGCATGGTACGCGAAGGCCGGACTGGCGAAGCTG
+AATGAAGCGGCGAGGGCCACGAGGGCGGCGGTAAAGCGCATCATTGGGTTCTCCTAGGGT
+AAAGCCGAAGCTGAGATTTGTGTCCTCAATCACTTAGACGCACGGGATGCCCCCCAGGTT
+CCATTCGTCGGAAAATTTCAAGAACGGCGGCATGATCTCAACCTTATCGACGCGCTATCT
+CCCTGAGGGCTTAGCCGAGGAGTGACCGATGGGCGTCCCGCGCAGCACGACCAAGCGGGA
+TGCCGACCGCAAGACCATCGCCAGGGGCAAACCGCCGTGCGGTATCTGCGGCGGGGAGAT
+CGACTATGCCCTGCCGCACACCGACCCCGCCTCGTTCGTCGCCGACCACATCGTGCCCTT
+GAACAAGGGCGGCGCTGATGTGCTCGCGAACAAGCAGCCCGCGCACCGGGACTGCAACAG
+GGCCAAGAGCGACACCGCTGTCACCGACCTCAGACGGCGGTACGTCACAGAGAGAGCGTG
+GGCATGAACGAAACAGAGCCAAGGGCGACACTCACCGGACCCCCGACGACAAGCACCATC
+TTCTACCCCGCGAACAGCGAGCACCCCGCGTTCAAGATCGTCCTCGTAGAGCAAGCAGGG
+GCTTGGGAAGCCGAGAGCGTCGAAATCCTCGACAGGCATCCAGTCCAGGAGCCAGACTCA
+GGTACGTGACCGAGAGGGCATGGGCGTAGAGCGTCCGAGTGCCCACACGCCCACGACGAC
+AATAACAACCCGTCATCCCGGCGCAACGCCCTGACCTGGGGAAACAGAAAAATCCCTGGT
+GGAAACACCCACGGGGGATACCCCCCACGGTAGCCCTTCCGCACCTCGGCGGCATAGGCG
+GGTGCCCCCCCTTGGATTTTTCCCTTTGAAGGGAATAGAGCTTTGGCCCTTGGAAGGAGT
+CCGTCATGTCTCGTGGGAGCAGCCGGCATCAGGTGCTCGGGCCGGTCGCTCGGGCGGTGG
+AGACTGGCAGCGAGATCGACCGTTTGAACGCTTTGCAGGCGCGCTTGGCGGGGGCTATTG
+ATGACGAGGGGACGCCGCCTCGGGATTTGGCGGCGTTGACGCGCCGTTTGCAGGACGTGT
+CGGAGCGGTTGGACTCGTTGATGAGCGAGAAGGCCGAGCAGGTCGCGGCGATTGTGGAGG
+ATGAGCGGTGGGATGGCTCGGCTATCTGAGGTCGCGCGTCATCTGGTGGTCCCGGAGGGG
+ATCGTTTCGACGGAGTGGCCTCGGGTGCGGGCGAAGTGCTCGGAGCTGGGGTTGGGTTTC
+GATGAGTGGCAGGACGGGCTTGGCCGGTTGATGTTCTCGAAGCGCGAGGACGGTTTGTAC
+GCGTGCGACACGGTGGTGGTGTCGATTCCCCGGCAGGTCGGCAAGACGCATGTGATGATG
+TCGGCTTTGTTCGCGCTGTGTTTGCTGCGGGCGGGGTTGACGGTGTTGTGGACGGCGCAC
+CGGGTGAAGACGGCGAAGGAGACGTTCGGGTCGATGGCGGCTCTGGCGGCGCGGGATTCG
+GTGCGTCCGCTGGTGGCCCAGGTTGTTCGTGGCCGTGGCGACGAGGCCGTGTTGTTTGTG
+AACGGCTCAAGGATTTTGTTCGGTGCTCGTGAGGCGGGGTTCGGGCGCGGGTTCGCGGAT
+GTGGGCGTGTTGGCGTTCGATGAGGCGCAAATCCTCGGTGAGTCGGCGTTGGACGACATG
+TTGGCGTCGCAGAACGTGGCTGAGAACCCGTTGACGTTGTTCATGGGCACGCCGCCGCGT
+CCGAAAGATCCCGGCGAGGCGTTCACGATGTTCCGGCAGGAGGCGTTGGACGGGGAGTCC
+GAGGGCACGTTGTACGTGGAGCTGTCGGCGGATCGTGGTTGCGACGTGGAGGACCGGGAG
+CAGTGGCGCAAGGCGAATCCGAGCTATCCGCACCGCACATCGGAGCGGGCGATGCTCCGG
+TTGCGCAAAAACCTCTTGGAGGATTCGTTCCGGCGCGAGGCGCTTGGGGTGTGGGACGAG
+GTTTCCACGCATCAGGCGGTGGTGAAGGATTCTGTGTGGCGGGCTCTTCGGGCTGATGGC
+CCGGAGTCGTCGGTCAGGCCGCACGCCTTGGTGGTGGACATGTCCCATTCGCGGGAGGTC
+TCTGTGGGGGCGTGCTGGTTGGACGGGGATTGCGCGCATGTCGAGGAGGTGTGGGCGGGG
+GTGTCGGGCTCTGAGTGCGTGGAGTGGGTCGCGGCGAACGTGGGCCGGCGTGTGCCTGTG
+GGGGTGGATTCGGCTTCGCCGGCGTCGTCGCTCGTGCCCGAGCTTCGCCGTCGCGGCGTT
+CGGGTGGTGGTCACGAACGCGTCGGACATGGCCAAGGCGTTCGGGATGCTCATGGACCGG
+GTTGCGGCGGGTTCGCTCTCGCACGCGAACCAGGAGTCGGTGAATCAGGCGGTGGCGGGG
+GCGAGGCGTAGGCCGATCCGCGACGCGGGTGGCTACGGGCTGGACCGCAGGGACGAGACG
+GCGAACATCGCGCCGCTTGTCGCGGTGATGTTGTCGGTGCTGGTCGCGGTGACGCATGGC
+AGACGGAAGAGTGTTGTTTCGAGCGGTCGAGGGGGGTTCGTGCTGTGACTGTGTTCGCGG
+AGGCTCCTCGGGTGCGGGGTTTGACGGACGACGAGCAGCGGCTGTTGGGCCGCTTGTTCG
+ATGAGTTGACGCGGCGCGCTGGGCGCAACCAGTCCCGCTCGCGGCTGTACGAGGGCAAGT
+ACGCGGTGAAGCGGACGAGCACGATCCCACCGGAGTATTTCCGCATGGGGATTGTGCTGG
+GTTGGGCCGCGAAGGCCGTGGACATCCTGGCGCGGCGTTGCAACCTGGACGGGTTCACAT
+GGGCGGACGGGGATCTTGAGTCGTTGGGGTCGCGCGAGGTGTGGTCGGAGAACCTGTTGG
+GCACCGAGTCGGACTCGGGCGTGGTGTCCTCGCTGATCCACGGCCCAGCGTTCCTTGTGA
+ACACCGCAGGGGAGGCGTGGGAGCCGAAGGCGTTGATCCATGTCAAGGACGCGCTCAACG
+CGGTGGGCGACTGGAACCCCCGCGCGAGGCGTTTGGAGAACCTGTTGTCGATCACGGATC
+GCGACGAAGAGGACCGGGTGACCGGGTTCGCGCTGTACATGGACGGGTTGACGGTTTCCG
+CCGCGCGGGACTCCTCGGGCTGGGCTGTGGAGCGCTCCGACCACAAGTTCGGGGTGCCCG
+CAGAGCCGCTGGTGTACAAGCCGCGCGCGGGTCGCCCGTTCGGCTCGTCGCGGATCAACC
+GGGCGGTGATCGCGCTTTTGGAGCAGGCCACGCGCGTGGCGATCCGCATGGAGGCGCACG
+CGGACACGTTCTCCTTCCCGGAGTTCTGGATGTTCGGGGCGACCCTCGCGGATCTGGCGG
+GGGGCGAGAAGAACCCGAACCCGTGGCGGGTTCGCATGGGCCGCATCAAAGGCTTGCCCG
+ACGACGAGGAGACCGGGGTGCGCGCGGAGGTGCATCAGTTCCCCGCCGCTTCGCCGCAGC
+CGCATGTGGACATGTTCGAGCACATCGCGGGGCAGTTCGCGGGGGAGACGTCGATCCCGG
+TGGAGTCGCTGGGGTTGGTGAACCGCGCGAACCCGACGTCCGCCGAGTCGTATATCGCCT
+CTCGTGAGGATTTGATCGCGGAGGCCGAGGGCGCCACCGACGATTGGTCCCCGGCGTTCC
+AACGCTCCTTCACCCGGGCGTTGGCGATCAGGAACGGCTTGGACTCGGTGCCCGCCGAGT
+GGGTCACGATAGCCCCGAAGTGGCGTTCGCCCATTCACTTGTCGCGGGCCGCGCAGGCGG
+ACGCGGGCTCCAAGCAGCTCGCGGCGGCGCCGTGGCTCGCTGACACCGAGGTCGGCCTCG
+GGCTGTTGGGGCTCGATGAGCAGCAGATCCGGTTGGCGCTCTCGCAGCGCCGCCGCGCGC
+AGGGCTCGCAGGCCCTCGCTGCGCTCACCGCTCGGGCCAGAGGGACCGCTGATGCCGCTG
+GCGAGTGACGCCGAGCAGATGCGCGCCTCCCTGGTGGGGTTGTCGGGCATGTTGGAGGAC
+GAGGCGCGCTCGCTCGCGGCGGATGACTCGGGATCTCTGGCGGGGTCGGCGGCGAAGGCG
+TGGATCGGCTCGCGTCTGGCTGTGGGGATCGGCGGCTTGATCGAGGAGTACGCGGGCGCG
+GCGCAGGCGGTCGCGGCTGACTTCTACGACCTCGCTCGGGGGGCGCTCGCTTTGCCGGGT
+CGGTTCACGGCGTTTGTGCCCGATCCGGGGACGTTCGGCCCGGACGCGCTGACAGGTTGG
+GCCGCGTCGGAGGCGACGAGCTTCACGGCGTTCGAGTCTCTGGTCGTCGGCGGGGCGAGC
+AGGCGCGTGATGAATGCCGCGCGGGACACGACGATGGCGAACGCTTTGGCGGACCCGCAG
+TGCCGGGGCTGGATGCGCATCGGGGCGGGGGAGTGCGATTTCTGCCGGATGCTCATCGCC
+CGTGGGGACGTGTACACGAGCGAGTCCGTGCGGTTCAAGTCGCACGACCACTGCAAATGC
+CAAGCGGCCCCTGTGTGGGACGAGAGCAATGTCGTGGAGCTGCGCGAGAAGTACGTGCCC
+AGCGCCCGGTTCAAGACCGAGGCAGCGCGGCGGCGCAACAACGAGGCCGTGAGGGCGTAC
+CTCTCGGCCCAGTAGAGACCATCCCTGCCGCAACGGCGGGGACCGACCCGGAACGGGGAA
+TGAATCATGTCCGAACCCATTGTCGAAGCGGCAGAGGCGCCCGAAACGGAAGCCGATGAG
+CCCAAGCCCAAGCAGACGGAGACGGTCGATTTCTGGAAGTCCAAGGCGCGTGATTGGGAG
+TCGAAAGCCAAGTCGAACAAGTCGGCGGCAGACGAACTCGCAGCGCTCAAGGACTCGCAG
+AAGACCGAGGCGGAACGAGCGGCAGAGAAGTTGGCGAACGCCGAGGCCGAGGCCGCGACG
+GTCCCGGTCAAGGTCGCCGGGGCGCTCAAGGCGCACCTGGTGGCGTTGCACGGGATCAGC
+GACGAGGACGCGGAGCTGTTTTTGACCGCGCAAGACCCGGAACTTTTGCTCAAGCAGGCC
+GCTCGTCTCGTCGGGAACCAGTCGGGCGTGAAAGGCAACAAGGTGCCCCATGAGGGCGCG
+AACCCCCGGCCCAAGCCGAACTCCACGAGCGAGTTCCTTGGCGCTTTGACCGGGGCCGGT
+TAACCACACAGATTAGGGAGAACAAAATCATGGCAGCATTGCAGAGCACGGACCTGTTCC
+TGCCCACGCAGATCGCGGACGGCATCGTGGAGCGGGCGAAGACAGGTTCGACGGTCGCGG
+CTTTGTCCGCTCAGGAGCCGATGCGTTTCGGCAAGGTCGAGATCATCACTTTCGATGACG
+ATTTGACCGCCGAGTTCGTTGAGGAGTCCGCCCCGAAGGGCGCGGATTCCGCGAAGCCGT
+CGCATGTGACGGCTGTTCCGCACAAAGCGGTCGTGCAGATGCGGACCTCCGACGAGTTCA
+AGTGGGCGGACGAGGACTACCAGCTGGGCGTCCTCGGCAAGTACCAGGAGAAATGCGCGC
+GGGCTCTGGCCCGAGGCTTGGACCTCGGTTTGTACTACCGGACCAACCCGCGCACCGGCA
+ACGCGCTCACGGCGTGGACGAACTATTTGAACGCGACGACCAAGCGCGTGGAGATCACCG
+CTTCCTCGCAGCCGGACATCGACTTCGAGACCGCCGCTGGTCTGGTGATCGGGGACGGTC
+ACAGCGTCAACGGCGTGGCGTTCGACCCCAAGCACGCTTGGAAGCTCTCCACGGCGCGTT
+ACGCGGACGGGCGCAAGAAGTACCCGGAGCTGGGGCTTGGCGCGAACCTCTCCTCGTTCG
+AGGGCGTGACCGCCGCTGTGTCTTCGACGGTCTCGGGCAAGGCGAAGGACGGGGACGCGA
+CGGACAACAAGGTTCGGGCGATCCTCGGGAACTTCCAGTCGGGCATTCGTTGGGGCGTGC
+AGCGCAATTTCCCGTTCAAGATGCTTGAGTACGGCGACCCGGACAACACCGGGAAGGATT
+TGGCGGGCAACAACGAGATCTTGTTCCGAACGGAGATCGTGTACGGCTGGTACGTCTTCA
+CCGACCAGTTCGCCGTGATCGAGGACGCGGCTGCCTGATGCCGCGTCTTAGGAATCGGGC
+GAGCGGGGCGGTCGTCAACGTCGATGACCGTCTCGCCTCCCGGCTCGGCCCGGACTGGGA
+GCCAGCCGGCGACGGCGGGGCCGACACCACGTCGCGCCCTCGGCGCAGAACGCGAGGGGC
+GCATGCCAGCGGTGACGATAACCCCAGCTGATCTCGCGCCGTTCGCGGTGATCGAGGAGC
+CGAAGGCTTTGGCGATGATCGCGGACGCGCTGGCGATGGCGCGGTTGGTCGCTCCCTGTG
+TTGACAAGGACGATTTCCCGTTCGCGGACGCCGCCAAGGCGGTGATCCGTGGCGCGATCC
+TGCGGTGGGAGGAGTCCGGCTCCGGTGCGATCTCGCAGCAGACGGCGGGGCCGTTCGGGC
+AGACGCTCGACACCCGATCCCCGCGCCGGGGCATGTTCTTGCCCAGCGAGATCGAGCAGT
+TGCAGAAGATGTGCCGCAACGCTTCAAGCTCGGGGGCTTTCTCCATCGACACGGCCCCGA
+ACGGGGGCGGGGTGTGGCACGACGACGCGTGCAACCTCGCGTTCGGCGCTTCGTGGTGCT
+CGTGCGGGGCGAACCTCACCGGCGACGGCCCGCTGTGGGGCACGGCGTGAGCCTCCCGCA
+GCCGCACACGGTCCAGCACCGCCGCAAGACCAAGGGCGGGTACGACGATCAGGGGTACCA
+GATCGAGCCGGGTTTCTCGGAGCCGGTGGAGCGCCGCGTGATCGCGGTGTATTGGGAGCG
+GCCCGCCGAGGCGGTGGTGGGGGACTCCCCGGAGCGGGACCGCGACGAGCTGGTGGTTCT
+CACCGGCGAACCGGAGGCGTATGGGGACGGGGATCTCATCGAGGCCGCTGGTTTGCAGTA
+CAGGGTGATCGGGCCGCGCGATTGGCGTATGGGGCCGTTCGGGTTCAAACCGGGCGGGGA
+GGTGCGGTGCGTGCGGAGGGACGGGTGAATGGGGCGCATCGACTGGAACCGGGAAGGGTT
+TCGGGAGCTGCGCAAAGACCCCGCTCTCGTCGCCCATTTGAAGACGATTGCCGAGGACGC
+GAAGCGCGACCTTGACGCGGAGCTGCATGGGGCGCAAACCAATCGCGGGCAGCGGGAAGC
+GTCCGGTTACCGCGCCGACGTGGCCGTGGGCCGCACGCGCGCACGGGGGTATGTCGGCAC
+GGAGACGGCTCGGGCGATGGCCCACGAGCAGGCCCACGACTCGCTTTTGAAGTGGGCGTT
+CCGCAACGGCGGTCAGTCTCCGAAGAGGAAGGGTTGAGCTGTGGCGGTCTATCGGCCTCC
+GGTGGCGGGCGAGGTCCGCGCCCATCTCGCGCGGGGGCTCTCGGCTCGCGGCGCCTCGTT
+CGGGTGGTTCTCATCGAACCCGAATCCGAGGCCGACCGATGGGCGGTGGGGCGTGTGCTC
+GCAGATCGAGTTGCGGGACGTGCAGCGCGTGGAGTCCGAGTCGCTGTTGCGGCTGGTGGT
+GATCGACCCGGACGAGCGGCGCGGGGAGCGCTCGGCGTCGTTGGCGCTGGCGCTCATCGA
+GGCGGCGCACCGCACGGCGGCGTTCAGCTTCCACGAGCTTTACAGCGGGCCGGCCCGCTA
+CCAAGACCCTGACGACCCGAGGGTGTTCGGGCACGTCATGAGGCTTTCCGTCACCAGGGC
+GGGCGAGCCGTTCGCGTGAGACGCGCGGGCGGGTGCAACACAGGAAGGAAATCGAGATGA
+CCAACCCAACGACCCCGGCGACGGGGAAGGATTATTTCGGGTACGGGGACGTGCGGAACA
+TTTTCAAGCCGCAACCGGACTCGGAGAAGACCGTGGGCGGCCTGTTCGTCGGCCCCAAGT
+TCATCGACGTCGCGGAGGCGCTGGACTTGGACGCCCCGGTGCTCGAATCGCTCAAGCAGG
+CCGGGTATTTGACCGTGGAGGGCATCCGCGTCAAGCAGGACCGGCCCGGCAAGGCCATCA
+ACGCGTTCGGCGGCGACGAGCTGGACTACGGGCAGACCTCGTTCTCCCTGACGGTGGCGT
+TCGACGTGTTGGAGTACTTCAACGACGACGCGCAGCGCCTCGCGTACGGCAAGAACAACG
+TGACGGTGACCCCGGCGACCACGAGCCACGGCAAGCGCACCCTCACGAAGATCACCGCGA
+AGCAGTTGGACGAGGTGTCTTTGTTCATCCTCTTGGTGCAGGGCGACAAGCAGGCCCGCT
+ACCTCGCCCCGTTCGCGCGGGTGACGGAGGTGGGCGAGGAGAAGCACGTCCACGACGAGC
+TGGTGTCCACGCCGCTCACCGCGCGCTGCTTCCCGTACCAGGGGGCGGTGTTGCACCGCA
+ACGTGGACGACGGCATGAAGCTGCCCGCAGGGTTGGCCGCGTGAGCGCCGCGAAGGGCAG
+GGGCGCCAAGGCCGAGAAGCCCGCCCCTGTCCCCGGCGACCTGGATTTCGACTGGTCGAA
+GGTGTACCCGGAGGGCGAGCTGTTCGAGTACGAGTCGGGCGGGGTCAAGGTGGTGATCCC
+GGTCTTCGAGAAGTTCAGCGCCGACTGGTACCGCCGCAACCGGCGCCTGTCGAACGAGGA
+GAGGTTCTACCTGCATTTGGAGCGCTCCGCGAAACCGGAGACGTTCGAGGCGGCGGACCG
+GCTCAGCCACGACGGGTACGCCGCGTGGTTGACCGCCTGGGGCGAAGAAATGATGTCCCA
+ACTGGGAAAATAGCGTGGGCGGTGGAAACGCTGCACCGGCATCCCTTCGCGGCCCGACGC
+GACCTGCTCGCGCTCGGGCTGCGATGGGAGAACCTGTGGGACGGCACTCTCGACGTCCTC
+GACGTCGCCGCGCTCGCCGTCGCCGCCCCGCCTCATTCCGCTTTGTTCCACGCGCTCACG
+GAGGGCTGGGACGTGAACGCGCATTTGACGGCGGATCTCGTCTACCTCTCCGAGCTGGGG
+CTGTGGGCGCGCACCAAGGACGCGCAATCCGATTTCCCGCGCCACAAGCCCCAACCCGTC
+CCGCGCCCCGGCGCGGCGCGCGAGCACGGCCCGACGCAGGCCGATTTCGAGAATTTCCAC
+GACGCTGTAGACAGGAGGGCTCGCGGTGGCGACCAATCTCTCTGACGTCTATGTGACCAT
+CATCCCGGAGACCCGCCGCGTCGGGGAAGCGATCCGGGCGGCGTTTCGGGACGCGGAGCG
+CGAGGCCAAGCTCTCCTCCGAGCGCATGGGCCGCGACTTGGACCGCGAACTCGGGGACGT
+GCATGTCACGGTGAAGGTCGGCGCGGACACAAAGCGCGCCAGGCGCGAGGTGGACGAGCT
+CAAGACGCACGGGCAGCGCGCCGGGGAGGCGATGGGCACCGCCACCGGGCTCGCGTTCGG
+GAAAATGTTCTCGGCGCAACTGGGCTTGGTGAAGTTCGCGTCCCTCGGCGCGGCAGGGGG
+CCTCGCTTTGTCGGGCCTCGGCGGCTCCCTCGCCTCTATCGTCGGGGTCGCCTCCCGCGC
+ATCGGGGGCGTTGGCGCTGGTGCCCGCCGCCGCGATGGGCGCCGCGGCCTCGGTGTCGGC
+GCTCAAGCTGGGGGTGTCGGGGCTGTCGGACGCGTTCAAGGCGATGGAAGACCCGCAGAA
+GTTCGCGAACGCCTTGCAGAAGCTCTCCCCGGCCGCGCAAGAGTCCGCCAAGGCCGTGTA
+CGCCCTCAAACCGGCGTTCGACAGCATGAAGAACACGGTGCAGGACTCGCTGTTCGCCGG
+TCTCGCCCCGCAAATCACCCAACTCGGGCGGACGTATCTGCCAGTGGTGCAGCAGGGGTT
+CGCGGGCGTGGCGGGGGCGGCGAACCAGGCGGGCAAGTCCGTGGCGGCGTGGGCGCAGAC
+CCCTGAGGCGGTGGGGCAGGTCAACAAGCTTTTGGGCAACACCACGGCGGGCATGAACAT
+CCTCGCGACCGCCGCGCGCCCAGCGGTTCAGGCGGTGCTGGGGCTCGGGGCCGCTGGCTC
+GGACTCCCTCCCGCGCCTCTCCCAGGCCGTCGCGGACGTGTCGAACAGGTTCGCGGGGTT
+CGTGAAAAACGCCTCGGAGTCGGGCCGGATCACCGAGTGGATCGACGCCGGGCTGACCTC
+GCTCACCCAATTGGGGCACGCCATCGGCGCGGTCGGCTCGGTGTTCGCCACCGTGTTCAA
+AGCGGGCTCGGCTGTGGGCGGCGGCATGCTCGGGACGATCACGCAGGTTGCCGACAAGTT
+CAACGACTTCCTCAAGAGCGCGGACGGGCAAGCAGCCCTGTCGGGGTTCTTCACCGGCAT
+CAGCCAAGCCGCAGCGGCGCTCGCCCCGATCCTCGGCACGCTCGCGCAGATCGTCGGCAC
+GACCATCGTCCCGGCCCTGTCGAATTTGGGCACCGCTGTGGCGCCCGCCCTGAACGGCAT
+GCTGCAAGGCCTCGGGGCGGGGTTGAACGCGATCAAACCGGTGTTCGAGCAACTGTCGGG
+GCCGCTCTCGCAGATCGGGCAGGTCATCGGGGACGTGCTGGCGAAGACCCTCCCGATCCT
+CGCCCCGGCGCTGGTGCCGCTCGCGCAGGCGTTCGCGGACCTGCTCTCCGCTATCGCGCC
+GCTGATCCCGCCGATAGCGCAGCTCGCGTCCATGTTCGTCCAGGCCGTCGCGCCCGCGCT
+CTCTGTAGTCTTCCAAGCCCTCGCCCCGGTCATACAGCAGCTCATGGACGCGCTCAAGCC
+GGTCCTCGACCAGCTCGGCCCCGTCCTCGCGCAGGTGGCGCAGACGCTCGCGGGACTTTT
+GGTGCAGGCGATCCAGGAGCTTCTGCCGCCGCTGATGCCGTTGGTGAAGTCGTTCGCGGA
+CTTCTTGGCGGCGGTCCTGCCGCTGCTGCCCGCCGTGGTGAAGGTCGCCGCCGTCATCGC
+GGGCGCGCTGGTCAAGGCGATGGCCGCGACCCTGCCGCTCGCGGTTTCGGTGGTCAAGGC
+GATGGTGGACTTCTCCACGAAGATCGCGAACTTCGTGGTGCCGTGGGTGAGCAAGCTCGC
+GGACGGCTTCGGGTGGCTCGGGGACAAGGTCAAATCCCTCATCGGCTGGTTCAGCGGCGT
+GAAGGACGCGGCGGGCGAGGCCTCGGGCTCGGTGAGCTCGTTCGCGTCCGCCACGCCCGC
+GCCTTTCGCGTTCCCGCAGACAAGCGGCGGGGTTCCGGGAGGCGGGGAGCCTTCCGCGCT
+CGCGAACCGCCTGCGCCGTTCGGCCGGAACGCCGGAGGGCATGGACCGCGCGGAGGCGGG
+GCGGTTGGGCCAGTCGCTCGCGGCATCGGCCACACCCGACGCCAACGGGTCGCTGCTGGC
+CGACGCTTCGCGCCTGCTGGCGGACTACGCGACAGGGAAGGGCGATCAGGACGCGGTGGC
+GCGGGCTGCGGAACTCATCGACCAGGCGTCCAAGGGCGGGGCGTATGTACCCGACTCGGA
+CCCGCCGCCTCCTGCCGTCCCGCTGCCGCCTGTTCCGGCGCCGCTGCCGGTCCCTGCCGC
+CCCGGTCCTGCCTGCGCCGTCAGCGGGCAAGGGCGGCAAAGCGCCCGCGCTGGCGCCGAT
+CACGATGGCGGATTTGGACAAGTACGACACGCCGGGGTTGGAGACCGGCGCCCCTGTGAC
+CGTGGCGCCGGGTTCCCCGGCCCGCGCGGAACAGAGCGTGCCCGCGACGATGGGCGTGGA
+CGTGTACACCGGCATGGGGCAGACCGGGGGCGGCTCGGGCGCTCAGCAGGGAATCGACTT
+CGCGCACTCCATGACCGGCACCGCGTACTCGCAGCAGGTGTTCGGGCGGATCGGCATCGA
+CTGCTCGGGGATGGTGTCCGCGACGGTGAACGCCGCAGAAGGCAAAGACCCGTTCTCCTC
+GCGCATGTCCACCGTCAACGAGGGCGAATGGCTCAAGGCGCACGGCGCGGTGGAGGGGAT
+GGGCGGTCCTGGGGATCTGAGCATCGGATGGTGGAACAAAGGCTCCTCTGGCGGCAACAA
+CGGGCACACGGCGTTGACGCTCCCGAACGGGGAGAACGTGGAGTCCGGGGGCAGCCACGG
+CGTCGTTGCCGTGGGGGCGGGCGCGGCCGGTGCGGGCGACAAGCAGTTCGACCATCACAT
+GCACATCCCGAAGGAGCTGTTGGGCTCCGTGCCCACCGCTGCGGGCTACGCGCCCGCGCT
+CTCGGGCGCTTCGGGGGATTGGCGCTCGCGCACCGCCGACCGCGCGGTGCAGAACGCGCA
+GGACTCGGTGAAAGACCACCAGTGGCGCGTGGACCAGGCCAAGCGGCGCATGATCGAGGC
+GAAGACGCAGCAGCAGCGCGACATGGCGGAGCACGCCCTGATCGTCGCGGAGCGCGAGCT
+GGCGAAGTCGCACGAGAAGCTGCGGGACGCGCAGGACAAGCGCGCGGAGACGATGGCGAA
+GGCGCGGCAGAAGGGGCAGCGGGGCGGTTCGGACGGCGCGGAGGACTTCGGGCACTCCCT
+GGTCTCGGGGGCGCTCTCCGGGCTCGGTTTGGACGGCTCGCTCTTGGACAACCCGTTGGA
+GTGGTCCGGGGTGAAGTGGCTCACGTCGATGGTGAACGGTTTCACCAAGCCCGCGCAGGG
+CCAGCAGGGCCGCTACGGCTCGGACGGGGCCGCTCTGCCCGGTTTCGGGCCCCCCGCGTC
+CGACCCCGCCCAACTCGCCTCGCTCGGCGCGCAGGGCCTCTCGCAAGGCTTCGGCGCCGA
+TTCCGGCTCGCAGCCCTCCCCGGCCCAGGTGGACCAGTCGATCAACCTCACGGGCCAGTT
+CGGCAACCCGAACGACACGGCGCGGGCGATGCGCGCGGAGATGGACAACCGCAACCGGGC
+GTTCTCCATGAACGCGGGGAGGATGTGATGGCCTACCAGCGCACGGACATGACGCAGTAC
+CCGAGCCAGCACCCGGACCTGCGGACCCCGCAAGGGGACTACCCGCCGTTCGGGCGCCCG
+CTCACCGAGTACTTCCAAAGCTGGGAGAACGTCCCGCCCGTGCTGCGCTCGGACCAGCTC
+ACCGTGATCTACGTCGGTGTGCCCGACGAGCGCGGGGTGCGGGCGATGTGGCATTTGGCG
+GGGCCGCGCCGGGGCTTGGAGGGCGTCGCTTTGGCGACGGACCTCTCCGGGCTGGTCATG
+CCCGAGTTCGAGCGCGCGTGGCACGAGTCGGCGTGGATGACCGGCGCCGTGCCGGGGCAT
+TTGTCGTGGCCCAAGCGGCTCTTGAACCTCGGCGTGCATATCAGCGCGCCGCGCCTGCCG
+AGGACGATTCTGGCGGCGGACGGGCGCCTGGAGCGGCTGGTGGCGTCGAGCAGCGCTGAC
+CGCTACCGGTTGACGCACCAGTTGTGGTGGAACTCGTTCTCGATGGACGCGGACGGCGAC
+CTTTTGTGCTTCACCCGCACGACGGGCTTCCGCAATCTCAAGGTCCGTCTCGCGAAAGCC
+CCTGCCGGGACGTTGGAGACGGACCCCGCCGCGTTCGGCAACAACCGGATCACCGTGGAT
+CTGCCCTTGGTCGCCTCGGACCCGTTCTTCGCTTCGCCCGCCTCGATGGGGACGTGGCGC
+AACAACGAGGACACCGCCACGCCGCTGGACGCGTTGGAAGAATTGGTGCGAAAGGTGATC
+CCGGACGCGGACTTCACGTTCGCGAAGACCGCGCTGGCTCTGGTCGCGGAGGCGCTGGGC
+AACCTGATACCGGGCATCGACGTGGGGCAGGGGCATATCGCGGTTCGCAACGACGGCGAC
+GTGCCGGCGTGGCCCGAATACGTGATCCACTCCGGGTCCGGGGGGTTCTGCTGGCTCCCG
+GACGGGGACCGGATGGTGATGCTGCCGAGGCTGTTGCCCACGGACGGGAAAGTGCTCGTG
+TCCACCGACCCCTCCAAGAAGACCTTCACCGCTGAGAACGAGCCGGTGGACATCGGGTTC
+TTGGGCGTGGTGGCCCGCTCGCAGTTGTTGGACCTGGTGCTCAAACCGTTCTTGGAGGCC
+ACGGAGCCGTTGTGGCGGCGCGGCGCGGAAGTGTTTTTCACCAAACCGATCCCCCCGAAG
+ACCACCGTGCAATTGCCGGTGCGGCACTCCAACGAGAACGCCGTCATCACCGCCCGCGTC
+CCGCAACGCCACTACGGGCCGGGGATCTGATGCCGTCCTGGGCCGTCTCCCCGGAGTCTC
+TGGCCTCCACGGCGCTCTCCGTGATGACCACGCTGGTGGTGGGACCGGAGGACGACGGGG
+CTCCCCGCTGCGATTATTTGAAGCTCTCGGCGCGCAGGGACGCGCGCCTGGCGCAGCTCT
+CGCAGGCGCCGATGGTGCGGATTTGGGACCACCAAATGCGTCTTGTGGGGCAGGTGCAGG
+TGGAGTCCTTGAGCGCGGACGAGCTGCTGCGCGACACCGGGACGTGCCAGTTCCGGTTCC
+CGTTGGACTCGCATGTGGCGCGGTGGCTTCGCAACGGTCGCCGCCCGGACTCGGACGTGC
+ATGTGACCATCGACCCGATTCCCACGGAGCGGACGTGGCGGGACCGTTGGGGCGGCAAGG
+CGTCCTTGGTGTCGTTCATTCGCGCCGAGGACGGGCGGGAGTGGTGCGAGGTGAAAGCCG
+CGCACCACTTCGAACATTTGAAACATATTATCTATAGGAATAATCCAATTACCCCACCGG
+AGGCGCAGGGGGTCAGGTTTTGGCTTCTGCCTGGGCCGACCCGGAGCGTCGTGTACTGGA
+CGACGCTGCTGGCATTGGCGCAACAGTTTTTTCCGCCCCTGACCTTGGTGGACTCGTTCG
+CGGACCCGCTGCGGTGGGCGACGATCAACCCCCTGGATCTCTCCCCGTTGAACTGGCCGG
+TGCAGCCGCAGTTCGTCAACCCCTTGCTGGATCAGTCGATGTTCACGGTGCTGACCGCCT
+CGTTCCAGAACGCGCACGCCGCCACCGCCGATGTGCTCAAGGCGTCGGGCTGCCACATCC
+GCGCCTACACCTGGCTCCCCGAGGACAAGGACTCCCCGCACCCGGAGCTGGAGGCGCTGA
+TCGGACCCTTGGCGCGCCCGTCCCGCGCGTGCGTGGTGCTGGCCTGCGAGGATTTGTCCG
+GGGTGACGGGGCCGACCGGGACGATATTTGACTCGGTGCTCTCCTTCGGCGCGAAGCTCT
+TGGACGACTCGTTGACCGAGGTGCTGCTGCCGCTGGATCTGGACGGGGACGGGCGCACGG
+ACCCGTTCTTCCGCGCGCTCACCCTCACCGCGCCCGCTCGCCCGAAGGTGGTGTTCCGCG
+ACGGCGACCAGACGGGGGTGATCGAGTCCAGCTATTCGCACGCCCCCGCGACCGCGCACA
+CCGTCTCGACTGGGAAGGGCTCGCCGCCGCTGCTGAACGACGGGATTTCGTTCGGGGTCA
+AATATGGCTTGAGCCGTTTGCAGGATCTTTTGCAGGGCGGGCAGCTCGGCGGCACCTGGC
+AGGTGCCCGGCACACCGGGTTTGGACGAGCTGTACCAGGGCCAGCTGAGCAACCGTTTTT
+TGACGCACAAGGCGTGGACGGACGCTCTGCGGGCGTTGCGCTCGGGGGACTACGCCTACA
+TCGCCGCGCACGAGCAGTCCGCGGTCGGGTACAGCGTGGCGGGGGCCTTGGCGATCCAGT
+CCGGTCTGCACAAGAACCGGCCCCGCACCACCAAGCACGTCCGCGTCCGCAACGGCGCCC
+CGCACTGGGTGGGCCGGGACTACACGCTGGGCACGCGCGTGCTGCACGAGCACGGCGGGG
+TGCTGTTCGCGGACCAGACCGGCGCGTTGGGCATCCGCATGGACCCGGACGGGCTGGTGA
+CCAGGCCGGTGCAGATCGGGGAGGACGACGACGAGGAGAACCCCGTGGCGTCGGCGTTGC
+GGGCGGTGCAAGGGATTTGGGGCGCCATCGGGGCGTTCGGCGGCGCGGACGGGGGCATTT
+AGTGGACGACGAGGAAGAGGTCAAGGCGCTTGAGGCCGCGTGCCGCGCGGTGCCGCTGGC
+GTCGGGGGCGGTGCTGGATCTGCGGCTGTTCGCGAAAGAGATAGCCGAGCATCTGTTCGC
+GGAGGGCTGCCGCAAGAGAGCCGAGCGGGTGGAGCGGGAGTTCCCGGAACGGTTCCTCGC
+GGTCCCGGACAAGTTGTTGGGCGGCTGGTCGCAGCCGTGCGAAGTGGTGGACAAGAGATC
+GGAGGAACGCTGATGGCCGATGTGCCGCAGCCGGGGGACAAGGTGTATATGTTCTCGGCG
+GACGCGAGGATGGACTTCCAGGGGATCGTGCTCGACCCGGACGTGCCGTTGAACATGGCC
+GCGACCATGCAGATGGTCGGCATGAACGGGGTGGTGACCTTCCCGGTGCTGGTGGGGCGG
+CAAGGCCCGCCCGGGGTGGACCGCCCGATCATCAAATTGATCTACGACCCGCAGATAGAC
+GACGCCTCGAAGCTGCCGCAGCTGACGAACACCCCCGAGGACGTGCAGAAGGGGTATGTC
+ATCGGTTCGCTCTGCCACTGGTGGGACGGGCGGCAGTGGCGGGGAATCCAACTGGGCGTG
+CCGGGGCCAAGTGGCCCGGTGCCGATCATCTCGTGGTCGGTGGTCTTGTTGGACCCGGAC
+GGCTCCGAGGAGTCGAACGTGAAGGTCACGGGCTCGGACGCGGCTCCGGGGGTCCAGTTG
+CGCCTCAAGGTGCCCAAGGGTCCGAAAGGCGATTCGGGGAGCATCCGCCTTGCGAGCGAC
+TACGACGACGCGACGCCGCCCGCTGTCGGGGACCTGCTCACGTGGACCCCGGAGAAGAAA
+TGGGCGCCGCGATCTTTGGGCAAGGAGGACGTGGCCTATTACACGGTGCCGCAGAGCCAG
+TTCAAGGCGCAATCGCTGGTGGTGGGCGCGAACGTCCCGGTCGGGTCGTTCACGATCCCC
+AAGCAGTCCTTCGACTGGAAGCCGTGGGTGTCGGGGTGCGTGAAGATCACCGGGGCGGAA
+CTGGACTTGGACCCGTTCTCCTCGCGCATCGAGGTCCGCAAGGACTCGATGGACGGCCCG
+TTGTGCGCGGTGGGGTTCGGGACGCCCACGACGATGACCGTGGTGTCGCCGCATTTCTCC
+TCGCCGGGCAACAAGACGGCGGCGGTGAACGCGAACAACGACGCGATGCGCTGCGAGGCG
+GGCAAAGACGCGGTGTTCCACGTCGTGATCGCGATGGATCAGGGCATCGGCGGGGTGTAC
+TCGTACAACCCGGACTGGACGGAGTTCCATGTCGAGTGCAAGCGGGTGAACTAGGGTGCC
+GCGCGCGCATCAGACGGCCCCGGTGGAGATCGACAAGAACCCGGAGCACCGGCTGGGGGT
+GAACGCCCACAAAGACCCTGTCGATTTGCAGAAGATCGCGCAAATGCAAGTCCAAGGCTT
+GCTGAACGCGATCAAGCTGTTCACCGGGCTCGACCTCGCGGACCCCGGCAAGCTGTTGGA
+GTCCGTCGTCAGCGGCGCGGCGGGGTTCGCGGGCGCGGTCCTGAACGCTTTGACTTCGGC
+GCTCGGCTTCGATTTGTCGGCCAAGCTCCGCGAGTTCGAGCAGGCGCTTGAGGAAGTGCC
+GGTGCTCGGGGACATCGTGAAGGCCCTCACGGGCAAGGCCGGGGGCGCGGGGGATTTGGA
+GGCGTGGGCGCAGTCGTTGCCCGCGCAAGCGGAGCAGGCCGCGCACGACGCGATAGCGCA
+GGTGAACACGCTCGTGGGGGAGTTGGCGCACGGCGCGGAGACGGTCGGGCAGACCCTCGC
+GGACACCATCGGGTCGGTGGTGGACCTGCTCGCGGGCACGCACCAGCAGACCCAGGACAA
+CACGGCCGCGATCACGGCTTTGTCAACTATCGCCCCGACGAACGTGGTCACCAGTTTGGC
+GTCTTCGACGGACCCGAACGACATCCCCGCCTTCGACCGGATCCTGATGGTCCCCATCGC
+GGCGACGGCCTCGGCGGGGGCGCACACCCACACGTACAGCAGCGGCGGCACGGGCCAAGG
+CACCACCTCCACGGCGGGGGCGCACACGCACGCCATCGGCTCCGACGCGTGGGGGTACGC
+CCCGGAGGACAAGGAGCTGGTGCTGGTCTTCATCCGCTCCGACCGCAAACAATCGGTGAA
+CGCGGTCAAGGTCATCACCGCCGTGACGGGCTGGTCCCTCGGCGGCGTGAGCACCGTGCA
+GTTGAGCCTGCACGCCTACAGCCAGCCCGACGCGGCCCTGAAACTGTTGGCGACCACCAG
+CAACCAGAAAGACGTCATCACCACCGCCGCGCAGGAGTACGCCATCGGGCTCGGCAGCAC
+CTTCGACGTGCTCCCCGGCCACGTCCTCGCGATCGGCGTGTGGCAGCAGGTCAACCTCTT
+CGGGGCCACGCGCAAGCTCGCCGGCATCCCGCAAGTGGGGGTCAAGCCCCGCACCGGGGC
+GCCGGTCAAAACGATCCTCGGCAAGATCACCGGGCAGTCGTCCATCCCGGCAACGATCAA
+GCTCTCCGACGTCGCGTGGAACTACAACGCCGCCGTGTGGGGGGCCTTGACGCTCGCCTG
+AGCGTGTGCGGCTCGCGCCGCAGACGGGCAATCGCCGCATCGCGGCGCGGAAGGAGAAAA
+AGATTATGACGGATCCGTATGGGCTGCCGGTCGGCTCGGACGTGCGCCAGGGCGCGCGGG
+GGTTCCCCGAATGGGTGTACGCGCTCGGCGCGGCGTTCGGTTTGGACGCCTCCACGTATC
+CGGGGCACCAGGAGCGCGCGGGCCTCAACCAGGGGATCGACTGGTGGCCGAAAGGCAGAG
+CGGACATGACGGGGGCCTCCTACACCCCGGCGCAGCGTTTGGCGTTGGGGCGGTTCGCCC
+TGTGGGCCGGGACTCAGCCGGGGGTGGAGCAGGTGATTTGGTGCGACCCGGTTTCCGGGG
+TGAAGACGGGGTTCTTCATGGGGGAGCGGGTGGGTCCGGGCACCGCGCAGCCGGGGTACT
+ACCGCGACGACTGGTCCGGGCACACCGGGCACGTGCACACCAGGATTGTGCGGGCGCTCG
+CAGCGCCCGACGACATCGGACAGGAAGGGAACAGCATGCCTTTGTGGGGCGTGGACATCA
+GCAACAACAACGGGGCCGTTGATCTGGCGCAGGTCAAAGCGGAAGGCTTCGATTTCGTCG
+CGGCGAAGGTCACCGAAGGCACGGGGTTCAAGGACTCGTATTGGCCGCGCAACCGGGACG
+CCGCGCGCGCCAACGACCTGATCCTGATCGGCTACCACTACGTGCGGGACGGGGACGCGG
+AGGGTCAGGCCGCGAACCTCGCCGCGCACATCGGGGACACGAGCGTGCCGGTCGCCCTGG
+ACTTCGAGTCCGGCTCCGGGGGGTACGCGAACTTCCAGGCGGTGAAATCAGCGGTGGAGC
+GGCGGGGGATGCGGGTCGCGCTCTCCTACATCCCGCGCTGGTACTGGCAGCGGATCGGCT
+CCCCGGACATCTCGGACGCGCCGGGGTTGTGGGCGTCGGCGTACGTGAACGGGACGGGCT
+ACGCCTCCGTGCTGTATCCGGGCGACGAATGGTCGGGCTGGCAGCCCTACGGCGGGGGTG
+AGCCGAAAATCTTGCAGTTCAGCTCAAGCGCCCACGTCGCCGGGAAGAGCGTGGACGTGA
+ACGCCTTCCGGGGCGCCCGTGAGGAGCTGCTGTCTTTGTTGGGCGCCACCGCTCCCGCGC
+AGCCCACAGCGAGCCTCGACCAGTTGGTGCTTGACCAGCTCGTCGGGCCGGGATTCCACG
+GTTGGCCGCAGCTCGACAACAAGTCCGTCGTGGACTTCCTCGCCTCGTGGCGCGAGGAGC
+AGCGCACAGCGAACAAAGCCATGGCGGACGCTTTGGCGCTTCTCCTGAAAGGAACAACCC
+AGTGAACGTGATATCCCTCCCCTACAAGTGGCGCGTCGCCCTCTACCAGGTGCTCAAACT
+CGCGAGCGCCGCTGTCGGCGCGTTGTTCGTGATCGCGCCCTTGTTCGGGTGGGAGCTGCC
+GAACACGAAACTCGACGCCCTCGACCAACTGGTATTCGCCGTCGTCAGCCTCTTGGGGCT
+CGGGGCGGGTTCGGTCGCTACAGAGCACGCGAAGATCTCCACGGACGGGCCGCTCCCGGA
+CCCCCGCGCCCAGGCGCCGCAACCGGACCCTATGGCGGTCGCCGCGCAAACCGTCGCAAT
+GACCATTGAGGGCGTGCTGGCACAGTTGGAGCGCTTGGCGAAGCCGCAGGGCGAGTGATG
+CTCAAACAGATCCTCGCGGACATCGCGCCTCTCGGGCCGACAGGGCTCCTCTCTGTCATG
+GTGGTGTTGATCATGACCGGGCGCATGCTGCCCTTGCGGGAGGTGCGGCGGATGGAGCAG
+ATGCTCAGCGAGCACATCGCGCGGCTTGAGCGGGCCAACGCGATTCAGGCCGAGACCATC
+GAGCAGCAGCACGAGACGGTGCGGGAGCTGATGGAGGGAGCGCGCCTGTCCACGGATCTG
+GTGTCCGCGATGAAGACCTCGGGGGGCGTGTGATGCGTTGGCCGTGGCAGTTGCGCGAGT
+CCGTGGAGTTCGACGGCGAGGATTTGGACCGCAGGGTGCGTGAGGCGCAGCACGCGAAAG
+ACCGCGCGGACAAGCTGCGCGAGGAGGCCGCGCCGCTGGTCGCGCTCGCGCGCCGCCAAC
+GGCGGGAGAACGGTTTCGGCGCGGCCGTGGAACGGACGATGAGGAGACGGCATGCGTAGC
+AGGGAATCAGCTGTCGGCGCGGCGTCGGCCGCAGCGGTCGCGGCGGCGTCTTGGCGCTGG
+CTGGGATGGGGCAGGGTGGACGACGCGCTTTTGACCGCAGCCGCCCTCGCGTCGGTGCTC
+TTCAGCCTCATGTACTGGCGGCAGGCCCGGGGATACATGAACCGCGCCGGGAGGGCCGTG
+CTGTGGGTGTTGGCCGCTCTGTCGGCGGTGTTGGCGCAAAACACCCTCAGCGTGTGGACC
+GAGCAGGACTACCCAGGCCGCGATCTCGTCCGCACAGTCCTCTACGGGGCGCTGCTGTTC
+ACCCTCGCCCGCCTGACCGCCACCGCCCTCGCGTACCGCAAGAAACACTAAGACCGTCTA
+CACTCTCATCCGGCCGCGCGCCCGTCCCTCATCCATAGGGCGCGCGGCCCTCACACACCA
+AGGGCTTTCCCGTGGCCGCTATGCGGTGATGTTGAACAGCCAAGGGCGCTTCTCGTCTCA
+GTGGTGGAGGATTGATAAGAACGCTGCGGGGATGCTGATGTAGAAGACCGGCCAGCCGAA
+GTAGAAGACCATACCGGCCAGCGAAGCCGCTATGACACCTCTTCCGGCGTTCCGCCATCG
+CTCATCGACCCTGAACAGATAGACGCCGACTCCGAGCGAGACAAGGAGGATGAACCCGAA
+TTTTGATTCCAGGGTGAACCCCAGGAGTATGAGTGTCCCGCTGGCGAGCAGGCACCAGAA
+AAAGCTAATGGGGCTGTCCGCTGGTGGTGTCTTCTCGGTTTTTGTCTTGTCGTTCAAAAT
+GTCACGTTCTCTCTCAGCACGGCAAGCGCGACTGGCACGATAAGGCATCCGATGGCCGCG
+CCACGCCATAGAGGGGTTCTCTTGATCAGGGGCAGCAGCAACCCCGCGCAAGCCATGATC
+AAGCATGTCATGATCAGCGCGGGTCGTTGGCTTGCCGCTTCATGCGGAAGGAAGTAACGG
+ATCAGCGAGTACAGGATCTCGCAGACTGCGGTCAGGATAGGAGCGCTCCATGTCGCGGCG
+TTCCATGACACAGCGGGGAATCTTATAGTCGGCATCAGTTCACCACTGAATATGTGTCGC
+GTCTTTGGTGGAGAAGAGGGCGAGGAACATTCCGGGGATCGTGTAGAGAAACAGCCAAAA
+AACATATCTGAGCAGCAAAGCGGAGACTGTCGCGGCCAACATGCCCATACCGATTTTTCT
+TTGCTTACCGGTTGTGAGCGACATAGCGAGTCCCGACAAAAACAGAATCAGCACTGTTGG
+CACGTACCAAGCCATATGCAGGGCGGCGACCGCCATAAGCGCTGCGGACGTCAAGACCAG
+GGCCGCGAAACTTTCCGGGCCGTGAAGCCGCTGGGCAGGTGCTGTGTCGTCGCTCTCGCG
+GTCTCGCTGGTTCATTGCGTCAACCACACGAACCAGGCCAACACGAAGGGCACCCCGAAT
+ATGCCCAACGCCACCCCGCGCGCGGTAGGGGTCCGAACGAAGACCCACAACAACAGGGAC
+AGCGTTGAGACGATGCCGCACAAGAGCGGGAATGTTAGGGACTTGCTCCCTGGCGGCTGC
+AAATTGACCAGGAAGGTTATCGCCGTCAAGCAAGCGCATACTGCCACGGGCGCGCTCCAC
+GTCGCAGCCGCCCACGACACAGCGGGGAGTTTTATGGATGGCATCAGATGTCTCCCCTCA
+TCGCTGGAGGTTGTTGCGGCGCTACCGGGTTGAGCTGTGGCGGCGAGTCCCCATCCTCTG
+GGGCGAGGGTCATGGACTCGTCGGGAACGGGAACCTGCGGTCGATTGCTCGGGATGCCGG
+GGCCATCCCACTGCAAGCCGGGTTGATACTCCTGTATGGAACCCGTCGGGCCATTGCCGA
+CAGGGTGCGATTTCGGCAGATTTTCCATAGGGCCGAACTCGCTTCCCGTCGCCTGATAGG
+CGTATGCGGTCGTTGTCGTGCCGTTCCTGTCTTGGTAGACCTCCATCGAAGGGTAGTCGC
+CCACTTGCCCGTCAATGTGGACCCCGTTCGCTGTCGGTGTCAAGGTGATCTCGCCGTTGA
+CCGACAGGCCAGCAGCATGCGAGAAGAAGGGCGCCAATGGGTTGGTCGCGTCGTAGTGGA
+TGCGCACACGTCCGTCCGTTGTTTGCTGCACGTCAATAACGGGGTCTTGCACTTCCGTTT
+TTCCTTGGATATCGACTGATGGGTTTTGTCTGGCGGCGACGACGCCGTTCTCGTAGTCGA
+TGTACAGGGACACTCGGGTCTGGCGCGGGTCGAATTGTTCTTTCGGGCCGCGCGCGTCCC
+CAAGGTCGTTGGGCATGTTGAACACGTCTGTGGCGGGGATGTACAGGCCGACCCGGACGA
+TTCCTTGGCCGGGGACGGCCTTGATGCGGCCGACGTCGACGCGGGCTGGCACGCCGTGGT
+TGCGTCCGACCATGCTGTGGGTGTCCATGATCGCGGCCATCTTCCAGTCGGCGTCGCTCT
+GCGGAAGCCTGCCGTACACATGCTGGAACTGGTCCGGGTCCACGCCGTGGTGTGATCCAC
+GATCCGGGATTTCGCCGGGGTCTTGCTTGAACGGCTCGAATTTGTCCGCTTCTTTCTTCA
+CGCTGTCGAGTTGGTCGCCCAGTTCCTCAGCGAGGTCTTTGTCTGCGGCGAGTTCTGCGG
+CGTTCAGTTCGTCGGTGGTCTCGTATTGGAGGGCGGATTCGCGGGTGGCTTGGGCGTGGG
+CGTGCAACGCCGCTGCGGCTTCTTGTGCGTTGATGTGCTGGTTGGTGATCGCGGCCATGA
+ACGCCGCGATGAACGGGGCTCCGATGGGGCCGAGGGCTGTTGTCATCATGCCCTGGAAGA
+CGCTGGGGTCGAACGCTATGGTTCCGTCGAGCATGAGCGCCATTTGTTCTGTCTGCTCGG
+CGTGCGCGAGCATGGTTTCTTGGCTCGCGTTCAAGGGTTGGCCCATGATGCTCCGATTCC
+TGTACAGGGGATTGTGAGTGGACTGTAGCATTCCGGTGGGATTCCAAAAACGCGAAGGCT
+GTGTCCGTTCAGCCCGCTAAGGCCACGGTGAGCTTGGTTTCTGCTCCTCTGAACGGATTT
+AGCCGACTCACGGCCTCGGAAGTTTTATGGGTCGGCACCTGTGTGTATTGCGCCGTTGTC
+GAGATCGAGGCGTGGCGCATGATCTCTTGCACGACCCGTATGTCAACGCCTTCGTCTAGG
+AGGGTTGTTCCTTGCCAGTGCCGCAACTGGTGCGGCGTGGCTCTGACCCCGGCTCTGCGC
+ATGGTGAGGCTTATCGTCTGAGACACCGATTTGCCGCTGATGTGCATTCCGGGCCAGCGG
+CTATCACGGGGGAACCACCAGCCGCGCTCGGGCATCGTGGGTGCGATTGCCTGCAAAATC
+GGGTGCAACGGGACGAGGCGTTCCTTGTTGCCTTTGCCCAAGACTCGGACGAAAACGCCG
+TCCACAATGTCTTCGCCGCGCAGTTTCGCGATCTCGAAGGCCCGTAGGCCCGCGAGACAG
+TACAGGAGCACCATGAGCCGGGTCCGTTTGCGGTTCACGGTCTCAAGGAGGCGTGCCAAG
+TCTCTGTCCGAGACGGGCCGGGGCGCGCGGTCGGGGTATCGCACGGTGCCGACCTTCACC
+ATGGGGTCGTCTGTCCGGTGCTCATGGACTTGTAGCCATTTGAACCAAGCTTTGAGGTAT
+TGGGAGTAGGTCGCAAGGCTGGATTGGCCGAGGCTGGACTGCTGAGCGAGCCACCGTGCC
+ACGTCTAGGGCGCTCGCTTGGCTTGGCTCGATCCCGATGGAGCTGGCGAATGACTTGATG
+ACACGTATCCTTTCCGTGATCGTCCGTTGCGAGAGCCTGCGGGCGAGCATGAAAAGTTCC
+CACTCTTGCACGAGCAGCATGGCTACGTTGTGTGCGTGGTGGGTTCCGGCGACGTTGACG
+GGGGACAGCACGGCGGGAATATTAGCGTCCGTTAAGGAGCTATTAACCTCTTGTTGACCT
+TGGTTATCTATCCGAGACGGACAGGGTGCGGATTTTTTATCGTCTTGCAGAGGGTGGGGG
+ACCGCTCGCAGTCGGCGCTCATTCTGTCGGGGTGCCAT
+>NC_014168.1|provirus_1141631_1162952
+TCATTTTGGGGTTGGGAGGCTCTCCCTCGCGAAGATCGCCGAGGCCCGTTTGAGGATCTC
+GACCTCCATCGCCAACACCCGGTTCTCCCGGCGCAGGCGGACCAGCTCGGCCCGCTCGTC
+GCCCGCGATCCCCTCGTGCCCTCCCTCGCGGACCACGCGCTTGCCCTCCACGCCGTCGGC
+CTGGGCCAGCCACTTGCGCAACGTCTTCGCGTCCACGCCCAGCTCCTTCGCTGCCCAGGC
+CACAGGCCGCCCGCCCTCGCGGGCGGCGCGGGCCGCCTCTGTCGCCCTGCGGCGGAACTC
+CTCCGGATGCGCGGCCATCCGCACTCCCTTCCCGAGGCCCGAGGCCCCGACTCAAAGTGT
+CCGGAAAAGCGTAACCAGATCATTCGGCGGTGAACACCGCGAGCCAGGCGTGGTTGTGCG
+GGTCGCGGGCGTCGAGGATCGCGGTGGGGAATCGGGAGACGTGCGCGATCCCGAGCACGT
+CTCGGCTGATGAGCGCGGCCTGCGCCTGGGCGGCGAGGAACCGGGCCTCGCTACGCCCTC
+GGGCGAAGGCGGCGACCCGCACGCGACAGGTGGTGGAGACGGGCCAGTTCACGCTGCCGC
+CGTCGTCGCCCACGAGCAGGAACGGCCGGCTGGTCTCGGGCTGCCAGTCCTCGGGCAACT
+GGCCCCCGGCGTCGGCGTGCGGGACCTCTCGGCGCAGGTGCTCCCAGATCGCTTTCGCGG
+GGTCCGCGGGGACCCTCACCGCTTGCGCCTGGGGTCTCTCACGGCGACTTGCAGCCCCGC
+GTCTTTCGCGGCCCTGGTGAGCACGCCGTGTTTGGCCTCCACGGCGAGCCCTGCGGGGTG
+GGCGAGCACCACCGCGGCGGCCTGACGGTCGGTGGTGTAGGCGTCGACCTGCACCAGCTC
+CTCGGCCTGCGCGCTGCCTTCTGTGATTGTGGCGGAGAGCGCGATGACGGCGGGGTCGGA
+GCGGACCTGGGATGCGATCCGTTCGGCGGCTTGGTCGACGAGCTTGCCGAACCGGGTTTT
+GAGGAGCTCGCCGACCGCCTGCTTGTCCAAGGTGACTTTGACGTTCATGGCCGTGCGCTC
+ACCCCCGTTCCGTCGTCGCCTCGACCACCAGCGCCGCCCGTCTCGTGAACGGGCTTCGCC
+ATTCCTTGACCCGCGCCCGGCACACCAAGCCCCGCACCGTGATCAGGTCGCCGCCCTTGA
+TCGGGCAGCCCAGCGGCAGGCCGACCTCGAACCCCTCGGACGCCTCGGCCCGGCCCGCCT
+CCTCTGGGGGGCGGCGCAGCGCGAGCGGCGCGATATAGAGGACGGGCTGCTCGTAGGGCA
+CCCCGCCCGGCTCGGGGTCCCCGTCCGCGCTCCACCCCGATTGCCGGGTGATGACGACCG
+TCTCGGGCATCGGCTGATTCCCTCCTCTGGGCGTATGATCTGGGCATGGGATCAGAACGC
+GACCTGCCGGTCGAGGAGGACTACAAAGATTTCGGGCAAGAAGGCATGATCCAGCCCGAG
+CTGTACCAGTCGAATGGACGGTCTCCGAGGATCCTGCCGTTACTGCCCCCGTCTCCTGCG
+GGGCAGTCGTCCTTGGTGGTCGATGACGACCCGCTGGGCAAAGACATGGCCCTAGAGGGG
+CCAGGCGGCCGCGCGGTCGTCCACTTCCCACAACACGGCTGATCGCGTCACGCGGCTGAT
+GGTAGGTAGTACCTGTTGAGGACCTCGTGCTGCTCCGGGCCGAGGCTGGAGGCTCCTGGG
+GCGGGGAAGTACTCGTAGGGCCCCATCTTCTCGTGGACGCCGCCGAGCGGCGAGGTGACT
+GCCCGGGCGGCTTGTTCGCAGATGAGGGCGGCGACGGCGGGGGCGTCGTCGTAGCCGTGC
+GTGAATTCGACTGTGACTGTGCCTTCAGGCCAGCCGGACTCGCGGACGAGCAGTCCGGCC
+GGATCGGCGCGGTAGCCTGTGATCTGCTCTCCGTCGACGGTGACGGATTGGACGGAGACC
+AGGCGCAGGGTGGGCAGCGCCAGGACCCTCCCGCCGTCGCAGGCGACGTTCTCGGTCTGG
+GCGACGACGGGGGCGATGTGCCAGCGGCAGTGGTCGCGCACGGCGGCGGTCGCCGCGCGG
+AGGGACTGCTCGGCCCGGCCGTGGTCCGCCAAGAGGCCCGCGAACACCTCGGGGTCCACC
+AGCGGCGGCAGCTCCACCGCGCTCACCCCTCTTGGGGCTTGGGCGGGGCCTGTTTCGCCG
+CCGGCTTCTCGGATTTCCCGGTGAACAGCGGCTTGTCGAGGAAATCGGCGTCGCCGAGCG
+CGTCCGATGCGGTCAAGCCTTGTTTGGCGGCGTCCTCGTCGGAGAGCTGCACGATGCGCT
+CGATACCGGCAATAGTTGTCTTATACAGCTTCATATCACTCACCAGTTCTATTAGTTGGC
+CAAAAAAATCTTCGCGAAGGCGAGGGGGCATCGCACGGCGAGCGCGAGGCGGGTCTCGGC
+GCGGATCTTGACCCGGTTGTAGACGAAGTCGTCCTGGTCCGAGTTGGTGGACTCGACCCT
+GATCCCGCCCTTGCGGTAGAGGGTGGCGCCTTGGGCGAAGTTGCCCACCAATGGCTTGCC
+CTGCGCGACGACGGGGGTGACGATGGTGCGCAGCCCCCACAGCGGCGGGTCGGTCAGGAC
+GGGGCCTTGCCCGTACTGCCCGGTGAAATACCCGCCTGCGAGGTATTGGCCGTTCCCGTC
+GCGGGAGAGGCGGAATTTCTGGTAGTCCAGGGGGTGGATGACCAGGCCGTCGGCCTTGTA
+GTTGGTGGCGGTGGCGATCTTGGTCATGGCCCGGAAGATGGAGTCCGCGTCGTCCCCGGC
+GTTCGCGCTCTGCTCGTTCTGCAGGCCCGAGCGGTTGAGGATGCCGGTCAGGTCGGTGCC
+TTGGCCGGTGCCGTAGAGCAGTTGGCGCTCCTCGAACACCGACAGCGTGTAGAGCAGCCT
+GTTGTCGATCTCCGACTGCACGAGCGGGAGGTCTTCGAGGGTCTCGTCGGTGAGGTGGAT
+GAACGCGGCGACCTTGGTGACGTGGTCGGTGACCGGGGTGGGCTCGGTGAGGTGCATCTG
+GGGCTTGCGCCCGCCCTCGGGGACGGTGGCGAAGTCGCCTTCGATCGATCCCTCCAGGTA
+GTAGCGGATCGCCTGCCCGGAGATGGAGCCCGAGCCGATCAAATCGGCGACGACGGGGCG
+CTCGCGCTTCTGGCGCTGCAGGGAGCGGTCCACATCGGTCAGCCAGTCCCGGTACGGGCC
+GTCCGGGCCCCCGGTGACCTGGACGTCGTCGGCGGCCTTGCGCCCTGCGGGGACCCATTC
+GGGCGCGGTGGCGGTCGCCCCGCTGACGCCTTTGATCTCTTGCAGCCGCTGGCCGGCGTG
+TTTGAGGAAGTGCTCCCCGAGGCTGCGCGCGGGGGCACGGCCCGGGTCGAGCTGCCAGCC
+CGGGTGTGCGAGGGCTTTGCTCGCGTCGGGGACGAGCTGGTCGATGGCGCGTTGCAGCTC
+GCTGGACTCGCGCTGGGATTTCAGCTTGACGTCGAAGCCTTTGACTTGCTCGATCAGCGA
+GCGGACGCGCTCGGCGTCCTCGGGGCTGAGGTCACCGCCGGCGGCCTTCGCGCCGTCCAG
+GATGGCTTTGGCCTGTTCGTGTGCTTCGGCGCGCTCTTTGAGCAGCGGGTTCTCGGCGAC
+AGTGGTGGTCAATTCGTCTCCTCGGGATGGATGTCGAGCAGGTGGAGCTCGGCGGCGTAG
+AGCCGGGCGGGCGGGGCGGACTTCGGTGGCGCTTGCGCTTCGGGTTCGGGCGGCGGCTCG
+TCTTCTGGCGGGTCGTCTGCGGGGAGGACCGCGAGCAGGGCCTCCCCGGCTGCGCGGACG
+GCGTCGAGCGCGTCCCGCAGGGCGGCCTCGTTGCGCGCGGAAATCGCGCGCCCGGCTTTC
+ACATCGAGGACCTCGGCGTCGGGGTTCGCGCCGATCGGCACGACGGACACCTCGTGCAGG
+CGCAGCTCTTTGAGGTCCCACCCGGCTTTGACGCGCTCGGAGTCGAGGACGTCGAAGGCG
+AAGCTCATCTGCGCGAGCCGCCCGTCCTTCATCAGGCGATGCACCTGTGCGGCCTTCGGG
+TTGTCCAAGTCGAGGGAGGCTGTCACCAAGAGGCCCGTGTCGTCCTCGCTCGCGGTGAGG
+ACCTTGCCCACGCACAGCTCGGGGTCGCTGAAATCGTGCCCGTAGAGCAGGGGGATCGGG
+CGGCCCTTCTCGGCCCATTGGGCGAGGGTCTTGGCGAACGCGCCTTTGACCACGACGTCG
+CCGTGCAGGTCGCGGTTGCCGAAGCAGGAGGCGTACGCGGTGAAGACGCCCTCCCGCTCA
+GGCAGCGGCCGGATAGTCGTGTCGAACGCTTTGCGCCGCATCGCCGGCTCCCTCCTCGTG
+CGGGCCGAGCGGCGGTGGCGGGCTCGGCTCGGTGGTCTGGTTGAGGTTCCTGAGCAGCTC
+GTCCCCGCCCTCGACGGCGGGGAGGTTGTCCTTGGCGCGGGCCTCGTTGACGGTGAGCCA
+CGGGCCTCCCACGGCGGTGGCGGTCGCCTGGGCCTCCTGCTCGAAGGAGCCTTTGAGCTT
+CTCGCGCAGGTCGAACTCCACGTAGCTCGCGGAGCCGGGGGCGATCCTCGGGACGAGGAA
+GGCGTTGAGGCGCCCTGCGACCATCGAGAGGGTGGGGCCGAGGGTGTCGGTGTAGAGCAT
+CCGGGAGAACGCCTCGACGTTGCTGTAGTTGGCGTTGTCCAACAGGCCGACCATCACCGG
+GGAGATGTGGTAGACCGAGGCGACGGTCGCCAGGGCGAGCTTCTGGGCCTCGATGTAGTC
+CTCGTCCTTCGCGGAGAACCCGATCCGGCGCAGCTCCATCCCGTCCTCGAGGACCGGGGT
+GCCGCCGGCGCGGGGGCCGTTGTTGCCCGAGTAGGCGCCCTGGTAGTCCGTGACGAAGCG
+GTGTTTGGCCTCCGGGGACCAGCGCGGCGCGTCGGCGGGGCGGTGGATGTAGGCGCCGAC
+CCGGCCGCCGTTGCGCCAGGTCTGCAAGCGGTAGGCTTGGGCGGCGATCTGCTCGGCGAG
+GACGGCTTTGAGCGTGGCCACGGGGGTGAGCCCGCCCGTGGGGTCCAGGGGGTTCCAGCC
+GTGGAAGACGAGCATCTTCTCGCCGGGGATCACCACCAGCCCGGTGGCGTGCGGCGGGGC
+GATCTGCCACTCGGCGACCGCGAACGGCGTTATCTGGCGGCGGCCGGTCACCCACGCGGG
+CGGGATCGGGCGCACCACCCAGCCGGACTCCGAGGCGGGGTCTTGGTCGACGTACCAGAA
+CGCCTGGTCGTACAGGCTCAAATCGGCGACGAGCGAGTACAGGAGCTCGTAGCAGGTCTG
+CTCCGGATTCGGGCGCTCCAACAGCCGCGCGAGCGCCGTGTTCCGCTCGCGCTCCCGCCC
+CCCGTTGGGCTGCCTGCTGTAGGCGTGCAGGCCGAGCTGGGCGACGTTCCTAGCGAGGAA
+GTCGATGACCGTTCGCAGGTTCGGCTGCTCGGCCCACAACTTCTCCACCGGCTGGGCTTG
+CAGGTCCGCGAGCACGACCCGCACCACCGGCTCGGCGGCGGTCCACACCGCAGGCGGCTG
+GGCTGGCGGCTTGAAACCGAGCCAGGAGAGCAGGCCCATACTTCTGGCCTCGCTCTCGTC
+AGGTCACAGCACGGTCAGCCCCGAGTCCTCGTAAGCGCTGACGGGCTCAGCAGCAGGTAG
+GTTCGCCAATCCCCATGTCGCGGCAATGGCGGCGACGAGCGGGGCTGGGTCGACGGGTGA
+GTGTTTGCGGTCGATAAGCCACGCGTCCCCGGCCGGGCGGACAGCTGCTGTGGCGGCTGC
+TTGGTCCAGGCCAGGGTGCGATAAGTGCCGTATCTTGCCGGTGGCGAGCAGGTCGTGGAA
+CGCTCCGGTCGCTTTGCCGAGGTCCGGGCCGCGCCACGCTATGACGGGCAGCCCGGCGGC
+CTCCAGATCGGCTACAAGGGATGAGGCGGGCGCGCCGTTGGCCTGCACGATCACGGCTGC
+GATCTTCTCGCGGCGCTCCGCGAGCCAGGGGGCGACCCAGTCCGAGCCGGCGCGTTGGGC
+GGTGATCTCCACATGCGCCATCCCGTCGTCGCGGCGACCGGCGAGGGCGAGCGTGACGGT
+GGAGCGGTTCCAGGCCATGTCCAGGCCGACCACTCGCGGCGAGTCGGTTGCGATCGTGCT
+GTTGTCGTCGCGGGTGGAGTCCCAGGAGCCGGGCGGGAACGGGCCGGGCGTGACGGTGAG
+GGGCCATTGGCAGAGGACTTCGGCGGCGAAAACCGGGGCGGGGTCGGTGGCGTACGCGCT
+GGCGATGGCGCGCTCGGTGATCGTCACCCCGAGGGCCGGGTTCGCTTGCGCCCAGGCGTG
+GCGGTCTTTGGGGTCGCAGCCGGGCGGGGCGGACCACTCGAAGATCCCCACCGAGTCGTC
+TTCGGCCTCATCGTCGGGGGCCTGGTCCTCGACGTGGTCGGGTTTGCCGTCCGGCCAGTC
+GAGCTGGCGGTGGGCGATGTTCCTGAGGTGGGCGAGGACGACGGAGAGGTGGTCCCCGGC
+GTTGGAGAGGCACCAGACCTGCGCGTCGGGGCGGGCCATCGTGGTCTTGGTGACCGCCGC
+CCAGGAGTCGAAGGACTGGTGCTCGCGCAGCTCGTCCAACAGGATCAGGTCGGCGGTGAA
+GCCGCGGGCTCCGCGCCGGGAGGCGGCCGCGATCCTGTATTGCGCGCCGGAGTGCAGGCG
+CAGGCTCTTCTTGCCGTTGGTCTTGTCGACGTGCAGGACCTCGGACGCGAGCTCCGGGGT
+GCCCTCCGCGAGCTCGACGGCCTCGCCCCATGCCTTCTCGCTGTTGGCGAGGTCTTGGGC
+GGTGCCGACGACGACGCCGCCTTTGACGTAGACGCGCCAGAGGGCGAGGACGATCATGAG
+CAGGCTTTTGCCGTTCTGGCGTGCGGCGAGGGCGATCACGGTGCGAAAGCGCGGCAGCCC
+GTCCGGGCGGACCTCCAAGGCGTGTGTGAGCAGCCATTCCTGCCAGGGGAGGAGCTGGAC
+GGCGAGGACGTCGCGGGCGAACTCGATCACCGAGTGGCCGAGGCTGGCGTCGGGGGTCAG
+CTCCCGCAGCGGCGGCGTCCACACGCGAGGGACAGTGGAGCCGAGCAGCTGTTCGGCCAC
+ATCCGCCCTCCAGGTGCTAAGTCTTCGTCTCTGCCGCCTTGCGCAGCTGCGCGAGCTTGC
+CCCCGGAAGCGGGCGGTTGCGGCAGGCCCTTGCGCCCGAACGGCGTCAGGCCCAAGTCGG
+AGAGGATCTTCCCGAGCGCGGGGGAGGCGTTGTGGCAGACGCGGGCGAACTCGTCCAGCC
+CGCGAGCCTCGGCCTCGTCGATCAAGCGCGCCAGGGCGCGGGCGTTCTCCACCGCGCCCG
+CGTCGAGCGGGGTCAGGTGCGAGGCTGCGGCGACGCTGGCCTCCACGGCGGCGAGGACAG
+AGGCCATGCGAGTGGCTCCCATCGAAAGTTGATCTGTTGGCCGGAGGGCGGCAGTCTCCT
+GGCTGGCTTCGCCATGGCCGACTTGCGCGGGCAGAGCCGAACCGGCTACCTGTGTGATCG
+AAATATCAATCCGCCGAAAAAGGCGTGATCAGGCAAGTGACGAGTGTAAAGTAAGGATGT
+CAGCGGATATCGCGCTTGGCCGTGTTGGCCGTTCCGTCGTTGGCATGTACCCGGCCATGT
+TGTGGCCGAGGCAGGAGGGCTCTCTTGAAGTGGGCGCCGAAAAAGAGGGATCGGCGGCAG
+GCGTTGCGCATGCTGCTGAAGCCGCAGGACCATGGATCGGGACCTGTCGACGGGTCGTGG
+TGGCCGCGGAGCCGGGACTTGCACGTCGAGCTGCCTCGGCTGCTCCCGGAGCTCGTGGGG
+CAGTTGGGGCTTGTCAATCTGGTGTTGTACGACTTTGGCGGTTGGTCGACCGCTCCGGGG
+CACGTCACCTCGCAGGAAAGGGCTGTGAAGACGACAGGGGAGGCTCGTCGGCCGTTGAAC
+GCGGTGCGTGTGGTCGGTTTGAGCCAGAAGCAGCTCTTGCTGCTCGTGATCCCGCACGAC
+CTGCACCCCGACGACGCTCGCTCGATCATGGCGAGGGCGGCGGGACGTCACAACACCGAC
+GCCCCCGAGAGGCTCTCCCAGATCCTCTCGCCCGACGGCGCCCAAGGCACAGACGTGGTC
+CCGAGGCAGCGGTCGTGGGCGGGCGACGGCGGCGGCGATCTGGGCGAATGACCCTGCCGG
+GCCGCCGCCGCGTCCAGGCTCCGGGGCGAGAGCGCCGCAGGTCGGGCTGGTTGGCGGCGC
+GAATCCCCCCACGGGCGTACAATGAACCGTATTCCCGCTGATTCGGACGGCCTCATTCGA
+AGGCGTCGTCGCGGGGGTCGAGAGGCTCGCTCCTGCGGGCCGGTCAGGAGCGTCCATCGT
+GTCGCGACAATTATCACTATCACACCAATCGGGCGCAGTCCTCGATCCGATGCCGCGCCA
+TGGCGTGACATTGCGTCTGCGGTTGAAGCCGAAAGCCGAGCCGACCGGACATGTGGACGG
+GGCGTGGTGGCCCCGCTCGCGAGACTTGGCCGAAGAGCTGCCCGAACTCCTGCGGGTGCT
+CGGGGTCCGCTTAGGCCACGTCCATCGGGTGATCTATCGCGCCAGGGAATGGGCGATCGC
+TCCGGCCCAAGCCCTGATTGCCGGGAAACGAGTGCTGCTGGACAAGTCCTACTACCAACC
+GCCAGGCACCATACGCCTAGAAGGGGAGCGGGGAAGACGGCACACGCTGTTCGTGGTCCC
+GCCCTGGGGCGTCCCGCATCTCGCGCACGACGCGATGATGACAGCGGCCGCACCGAACGA
+CAAGACGACCGTCGCGGACCTGCTGGAGATCTCCGACGCCACCCCCGCCGACCTCGTCGA
+GCAGCGAGAGGAAGAAGACCGATGGGGCACCGACGGAGGGGCGTTGCCACAACCTAGCCA
+GCGGCGGTAGCGCGGACGACGCCCTCCCCCCTCGCGCGCACGCGCGAGGGGGGCTGGTCG
+GGGAGGGATTCGACGCTACCGCCGCCATGGCTGTCATGATCGACTTCGCCGTGATCTTGA
+GCCCCTACCCCCTGGGGGTGGCGAGTGGGTTAGTCCTCGAAGGCCACGACGGTCTCGTCG
+CAGTAGTGGTCGCGCTCGTCGCAGTAGTTGTGCCGCACGAGCCCGTCGTCGTGCTTGATC
+GTCAGCCGCGTCCCTTTGTCTCCGATGACGGCGAGGATCAGTCCGCCCGCGCCGACCTCG
+TAGAGTCGCACGGTGAGGGTCTTGCCGTCTTCCGTTTTGGCGTCGACGGACTGGATGAGG
+CCGTAGTCGCCCGCGTCCTCCAGCTGGGTCTCGTAGCGCCAGTGCTTGAAGCTCTCCTCG
+GCAGATCCCATGCCCGCATCCTATCACATTCATCGAATACATGTTCGACTATGGCTAGAA
+GTCCTCGCTTCTCGCCCAGGCCGCGTGAGCGGGTTGGGCTGCGCCCCTGGTTTGGTTGCA
+GCGGGCGTGGCTGGCGCGCAGGTTCTGGTAGTCGAAGGCCAGATGCGGGTGGGTGGCCCT
+GGGGTAGGCGTGGTCGGCTTGGAAGCTGTCGGGGTGCTCGGGCGGCGCGTTGTAGTCGAT
+CGGCTGGCGGCAGATCCAGCACGGGCGGCGTTCTGCCCGCAGTCGTGCGCGGAGTTTGGC
+GGCCTTGTCGCCGGACCAGCTGGCGGCCATCTTGGTCAGGCCGCGAGGCCCTGCGCGGGC
+CGCTGTGCTGCGAGGTGGGCGGCGATGACGTTGCCGGCGACTTGCCCGAGCTGGACTGGG
+ACGGCGTTGCCGAGCTGCTTGAGCGCGCTCTGCCGCCCGGCGGCTATGATCTGCCAGGTG
+TCGGGGAAGGTCTGCGCCCTGAGCCTCTCGGGGATGGTGAGCTCGCGTGCCCGGCCTTCG
+GGGAGTTGCACCATGTTGAACCGCGCCGAGCCGGAGTGGCTGGCGAGGACGGTGTTGGCC
+GGCAGGTCCGGTCGGGTGGGGTGCATCTTCCACGGCGGGTTGACGATCGGCTCGCGCCAG
+AGCGCGTGGCGGGTGTGGTGGGAGCGGTCGACGGGGCCGATCTCGCCGAGGTCGCAGGTG
+GCGTCGCGGAAGGTGCGCCACGGCAGGAGCGCGCCGGGGCCGTTCTGCTTCACGAGCGCG
+AGCTTGCGGGCGTGGGGCTTGTTCAAGGGCAGCCGGTCGTCCTCGGGGACGGGGTGGCGA
+TGCCAGTATTCGCCGGTGACGTATTGGGAGTGCAGCAGGGCCTCGAAGGAGTGGGTGGGC
+TCGGGGAAGGCGAAGCCCTCGGGGTTCTGGTCTTCGCGGATGCCGATGACCAGGACGCGC
+CAGCGCTGCTGGGGGACGCCGTAGTCGGCGGCGCAGACGAGGTTCGGGGTGACGGTGTAG
+CGCAGGCCGAGGGCGGGCTCGGCGAGGCGTTCGAGGACGCGCCGGTAGTAGTCGGCGTGG
+CGTGGGGAGAGCAGGCCGCGCACGTTCTCCATGAGGAACGCCTTGGGGCGCAGCCCTTGG
+ACGGCGCGGACGAATTCGGGGATCATGTCGCGCTCGTCGGCCTCGCCCCGCTGCGAGCCG
+GCGAGGCTGAACGGCTGGCACGGCGGACCTCCGGCGACGAGGTCGGTCTCGCCGGGGGCT
+GCGATCTCGCTCCAGTCGACGCCTCGGACGTCGCCCTCGATGACGGGGGTGTCGGGGAAG
+TTGGCGCGCAGGGTCGCGCAGGCGTTCTTGTCGAATTCGACCAGGGCGGCGGCCTGGAAA
+CCGGCCCGCTCAAGGCCAAGGGCCAGGCCGCCCGCCCCGGCGAACAGCTCCACGCTCGTC
+AACAGTTCGGGCATGGGCTGTTTCCTCCCCTGGTCGTGGCTGCTCGCAGCAGGTCGTGGA
+ATCGGTAAAGGTGCACGCCCGAGTTGTCCAGGCCGGATGGCCGGAGCTTGCCCCGGCGGC
+TCCAGGCCCGGACGGTTTGGGCTTTGACGCCCAGGACCCGCGCGGCCTCGTCGGCGGCGA
+GGAGGGTGTCGGGGCCGTGGGCGAGGATGTTCGGCGGGAGCGGTCTGCCCACGATGGCCC
+CCTTGTCGACACAGCTCGCCGGTGGCGGCTCTCTAGGTGGGTGGTGGGGCTCGGGGCGCA
+CGTCTCCCGCTGACCTCTACGCTACGGAGTTAGCACACATGTTCGCAATGGAACGGCGCG
+GCGATGTGAAATCGCCTGGTCGGGGGGTTGTGCTCGGCGGCGTGCTTGTGGATGAGTCCA
+GGTCATGAAGCCTTGTGGCGGGCGATTTCTTCCCATTGGGCCTGGTATTGGTCGAGCCAG
+TCCGCGATCTCGCCCTCGTCGGGCTCCCAGTCGCACACCGAGCACACGATCCGGTCGTAG
+TGCTCCTCGACCTCGTCCCAGCAGCGCCAGACGGTGAGGTTCTCGCAGCCGGGGCATTTG
+CCGCCGAGCCAGACCATCGGGGCGGCGACGCCGTAGGGCTTGGTGCGCTCGCGCAGCTCG
+CCCCATTCGCTCGCGAGCTTGCCGGCGTGGTCGAGCTCGCAGATCGTCTCTAAGCGCTCG
+TCCAGCCACTGGCGGGACTGCGCGACGTGCGCGGCCTGGGAGAGGTTCTCGCTTGGTCCG
+AGGCCGCCCAGGACACAGGCGAGGAGCTGGTGGGCGCGGACGAGGGATTCGGCGATCTCG
+GCGCACAGCTCGCTGGCGCGTTCGGCGGGGTGCCCGAAGCCCTCGGGGGTGGCTTTGCGC
+CCGAGGGTGTCGGGGCCTTGCGGGCGGGGCAGGAGCGCGAGGCGTTCGTAGTCGGCGGCG
+ATGAGGCCGAGTGTGCGGCGCAGTTGATTCCGGCAGCCACGGCACATGCCGTCTGCGACA
+AGTCTGCGGTCGCCGAATTTGTCGCGGCAGCCGGGGTGGACGCAGGGCCGGGCGCTCATG
+CGGCTTGCTCCTGCTCTGGTTCGAGGGGGAGGTTGTAGGCGAATTCGGTTCCGGTCCAGG
+CGAGGCTGATGCGGCCCCTCTTCCACAGCTCCCAGGCGGCGTGTTGGAGCGCCCAGTGCC
+CGAACGCGAGGTGGGCCGCGCGCCACTCGGCGTTGGTGGGCCCGGACTCGCGAGAGTTGG
+CCCAGATCTCGCGCATGAAGCGCTCCAGGTCCTCCGGGTCGATCATCGAGGGCTCGTGCG
+TCACAGGTTCTCCTTCGCGGCGTCCGTGCTGGCGGTTGGCGTGGCGGGGCGTGCGGTGAG
+GGTTTCACCGTCCCAGGCGAAGGCCACCAGGCCGTCGCGCCACAGGGCGAGGACCTCGGC
+GAGGGTGATGAGCTGCTCGAACTCGGCGAGGGCCAGGGCGAGGTCTTCCTCGGAGAGGCG
+TCCTTCCGCGTGGCGCCGGACTTCGGCGATCATGCGTCTGGCTTCTGGGTCGTGCGCGAG
+GGCGATGTCGATGGTCATGGTTCAGTGCTCCTGTGTCGGCTGGTTGGTGTTGTCGATGGA
+CTTCTTGTCGGCGAGTTCGAGGATTTTGGCCTCTAGGCGGCGGTCGAGCCGGTTCTGGCG
+CTCAGAGCGCTCGCCGGGTTTCTCGCGTTCGGCCCGGTCGCGGCGGATCGCTCTGGCGTG
+TCGGATGACGTCGGCGGCGGCGATGTGCTCGCCGGTCTCGCTGTAGTGCAGGGTCACCGC
+GTCCAAGAGGTCCGGCAGTCGCAGGTCGAAACGGGCGAAGGCTTGGGCCCAGGCGCGGGC
+CATGCCGGGCTCGGGTTTGGCGAACCAGCGGTCGAAGAGCGCGGCTTTGCCGAGGGCTTT
+CGCGGCGTCGGCGACCTGCTGGTCGCTGGGGTTGATCATTAGTCGAGCTCCCTTCCGGTC
+AGGTCTTGGGCGTTGTGGGCTTTGGCCTCGTAGTCGGCGGCGATCGCGAGCCAGCCGAGG
+GCCTTCTCCGAGGGGCTGCCCCTGGCGGGCTGGGCCGGGTCAGCCCGGTTTTTGACGACT
+TCGGAGACCAGCGACGGCAACAGTCCCGCCCCTGCGCGGGGTTTGGCGAGCCACAGGCGC
+AGGGCGTCCGCGACGTCGGCTCTGGGGGTCCCGGCGCGCAGCAGTTCGGCGGCTTTGACG
+GCGAGGGCGGAGCGGATCTGCTGGGGGTGCTCGCCTGGGATCGTCTCGCGCACCAGTGCC
+CAGCCCTTGATCGGCACGCGACCGGGCAGCGGCCCCTCGCGCCCGCCCGCGTCGCTCAGG
+TGAGGTGCTTTAGGAACGTGACTAGTAGATGTCTTTTCTTCTCTATTCTTTTCTAGAGGC
+GTGACGTCACGGGACGTTTCCTGTGACCGCTCGCGCTGACGGCGTTTGCGCTCGCGGTCT
+TTCTCTCGTCGTTCGAGCAGTTCGTCGCCGGTTTTCTGCCACCTCTCCCAGTTGCGGAAC
+CGGTAGACGCCAGGACTGGTCTCGTCGACGATCTGTGCGCGGATCAGCTCCGATATGTAC
+GACGAAACGCGGACGATCCCGAGACACATCGCCTGCTTTTTGTCGAACACGCCTTTGGTC
+TCGGCGTTGCCGCAGAACGCGAGCGCGCGGGTGAACAGTCGCTCCGCGTTCGCCGACAGC
+CCGGCCACCTTCGCGTCGAGGTAGTAGGTCGAGGACAGCCACACCTTCTCCATCGCTCAC
+GCGCTCCTTTTGGGCGCTTCGCGCCGGTCGTGGAGCGCGACGACGGCGTCCACGGCCCTC
+GCGCCGAGAGCGTTGTCGGCGCGGTCCTGCGCCTCCACGCTCGCGTGCAGGTACAGGTCC
+GCCAGCACGGCGACCGGGGTCCGGACGGTCTGGGCCTGCCCGGAGCGCAGCCGGTGCAGC
+TCCGCGCTGCGGCGGTCCCGTTCCAGGCGGGCGTGGTTGCGCTCGCGCTTGTCCGGCGCC
+CACAGGAGGTCTTCTGCGACGACGGCGGTCATCTTCGGCGGTGAGGGGGAGCCGGGCGGG
+TCCAGGCTCACGAGGTAGCGCAGCTGGAGGACCTCGACTGTGACGCCTTTGGCGAACATG
+CCGTGTTTGGTGGCGAGGTCGCGGGCGAGCGGGATCGTCTCGCCCGGGCGCGGCGGGCTC
+ATTCGGACCTCCGCAAAAGGGCGCCGGCCTTGTGCAGGGCGTCGGCCTTCTCGGCCTGGG
+TGAGCGGTTCGAGGACGCGGGCCTTGCCCTCTTTTCCGAGGCGCCCGCCGATCCAGCCGC
+GCCCGCAGTGCTCTTCGAGGTTCTTCACCAGCCCCGCGCCGAAGACGAGGACGTCGGGGG
+CGCGCTCGGGTCCGGTGGGGTGCTCGACGTCGACGACGTTGGCGCGGATGGCGGGTTTGA
+CGCCGTACTGGCCGGTCTCGACGTCCTCTTTGGCGAGGGGCTCGATGAGCAGGACGTGGC
+CGTGGGCCTTGTCCCAGTCGAAGCGGTAGGGGGTGGGGTCGACGAGCTCGGGGTCGTCGG
+GCTCTGCGGTGTTCGCGGTCGTCATTTGGTTCCTCATTTCCTCTTAGGCGGCGTTGTGGG
+ACAGGACGGCGGTTTCGCCGGCGCACTGGACAGGCGAGCTGGGGCGTGGCGCGAAGAACG
+GGCAGTGCTCGCACTTGACGGGGGTGATGGGGATCTTGGCGAAATCGGGCTCGGTTCGCG
+TGATCGCGTTGTGTCGGCGGCGCCGGTTGGCTTGTTCGAATCGGCGCAGGTGCTCTTGGG
+CGAGCTCGGGGTCACAGGGCTCCTCGAAGCAGATCGCGTCCTCCAGGTTCCCCGAGCGCG
+GCAGGTAGACGACCGCGATCTTGCGCACCTTCACGCCGGTCTGGTTGAGGCCGTGCCCGT
+AGAGGCTGGTCTGGGCGCGGTGCTCGGGGTCCATCTCCCCTTGGCGCTTGACCGCCGCGA
+TCCTGGCGGCGGACCCGGTCTTCCAGTCGATCACCGTCCCCGAATCGGCGTCCACCAGGT
+CCGGGGTCCCCGCCAGGCCGGGGACGATCTCGATCTTGCGTTCGGCGGTCCACCGTTCCC
+GGCCGAGCCGGGCGTTGTCCGCTACAGCGGCGGCGCCCAGCCAGGCGTGGATCGCGGTGC
+CGACGATGGAGGCCCACGGGTCCCCGCCCTCGTTCGCCTTCGGGGCCCCGGCCAGGCGCA
+GCGCCAGGCGGCGCTCGCACGGGTGCGCCAGCTCCGAGGGCCCGAGCGCGGACTGCTTGG
+AGCGCGGGTTCGCCCCGTGCTGGGCCTTGATCATCTGTTTCAGGTCGGCGAGCAGCCCGA
+CAGGCCGGATGGGGTCGAGGATCTCGAATGCTCCGAGGGCGCTCATTGTTCGGACTCCTC
+CCGGGGTTCGACCAGCCGAAGCTGCGGGGGGCCGCCGCCGGGGGCGAGCTCTGGGTGGTG
+GGCGAGGTCGAGGAAGAATGAGTTCAGGTCGCTGAGCAGGCGCCAGAGCTGGCTGAAGAC
+GAAATCGCCCGCCGTCCACTGCCAGTGCCCGTCGCGCAGGTCGGTCCAGACCGGGGCGTG
+GCGTTTGTGCAGCGCGTCCAGCTCCTCCTGCAACCGCGCGATCCGCGCCGTCCGGGCGGT
+GATGGCCCAGTCTTGGGGCGTTATGGCGCTCATCTCTTCTTCTCCTCTTGGTCGTGGGCG
+AGCTTGCGCTCGGCGTAGCAGGGGCCGCACAGCTTGTGCCGCGCCTCGCCCGCTGTGAGC
+GACACCGAGGCACAGCGGACTTGCGGGCCGGGCAGCTGGCCGCCGGAGTCCAGGTGCGCG
+CCCCAGTTCGCGACGCAGTCCTCGCAGCGGATCGTCTTGGACGGGGTTTTCGTCCTCGTC
+GCCCTCCACGCGCTCATTCGTCGACCGCCCGGAACACGCGCACGCGTGTGGTGCGCTGGC
+AGTCGGCGAACGCGATGGGCCAGTCGCGTTTGAGCTTCGCCTGGTCCAGGCCCGTGCGCT
+GGTGGGATTCCCAGGTGACGACGGCGCGCCCGTCCAAGACCCCCACATCCGCGTCGCCGA
+GCGCGGCCTTGATCTGCGCCTCGTGCCGTTTGGCGAGCTCGGCGTGCTCGGCGGCCTTCT
+CGCGGTGGTGCAGCATGAGGTCGAGGTCCGTCCGGTGCTCGGCGAGGTGGCGGGCGGTGC
+GCTGGCGGGCCGGGGCGGGGTCGGCCAGGCGCAGCGTCGGCTTGCGCTCGGGCTCGTCGG
+GGAGCGCGGGCGCTGTCGCTGTGCTCATCGTGTTCTCCAATCTGGTGGGTTGTGGCCGGC
+TCCGGCCGGGAGCGGTGAACGCCTCCCGGCCGGAGGGCCGATGGGGTTAGTCGAGGGGGT
+TCTCCGCGAGGCGGGGCCACGGGTAGTGCTCGTTGGGGTCGACGCGGATCACTTGGGCGC
+TCTTGCCCGCGCCCCAGAGGTTGAAGGCTTTGAACACCGGGGCGAGCGTGTCGCGCAGCG
+CCTTGGGATTGTTCGCCGACGCGAGCCCGGAGCGCAGCTTGCGGCGCAGCGTGTAGGCGG
+GGTGCCCGTGGCCGATCATCTCTCCGGAGGCGAGCAGGTGCAGGAACATGTGGCCGTTGA
+CGTGGTCCACAGCGAGGATGCGCCACGCCGCCGCGGCCCAGGAGGAGGGGGAGCCGGCGA
+GGTCGCGGTAGACCTGGTACCCGAGTCGGGTCGCGCAGGCCAGCTGTTCTGCGTGCTCTC
+TGGCGAAGGCGACCGTCTCGGTGTGGGTGGGGACGTGCCGCTGGTCGAGCATGATCACGG
+CACGCGCGGCGGAGGCGACCTTGGTGGCGTCGGGGACGCCGTCGATGCGCAGCGCGTCGG
+CGACGGTGCGCTTGGCCCCGGAGTCCATGACGTGCTGTGAGTCTTTCGGCAGCCCGGTGA
+CGAGCAGCAGTTTCAGGCGGACGCCGGATTTGACGATCGCCGAGAGGCGGTGCTGCCCGT
+CGAGCAGCGTGCCGTCGGCGGCGACCTGGACCGGGGCGGCGTTCTCCTTCCAGCGCCCCT
+CGGTCATGTCTCTGGCGAGGGCGTCGCGGTGGGCGGGGCGCAGGTTTCTGTTGCGCGTGT
+TGTGCCCGAGGAGCTCTTCGGCCTCCTCGGGGCCGATCCACCACCAGGAGGCGTCGGGGC
+CTGAGGCGTCGGCGAACGCGGAGGCTGGAGTCGGGATAGTCGTGGTCATGGCGATCAGTT
+CCTCTCGGGGATGGGGATGGGCGGTTCTTCCTGTTGGGGGAAGTCTTCGGGGGCGAGCTC
+GTCGAGCAGCTCTCGCGCGGAGAAGATCGTCTGCTGCAAGGCGCGGCGGACTCTGGGCTC
+CAAGCTCTTGCGGTTCGAGCCCCAGCGGTCGTCTTTGAGCAGGCGGCGGTACCCGTCGAG
+GACGGCGTCCTGCTGCACGCTCAGCCGCAGCTCCACATCGGGCAGCGGTTTGCGCTTGCG
+GGCGGCCTTGGGCTCGGGCAGGGGCTCGTCCGGCGCCCGCTCCCGCTCAGGGGGCTGGGC
+GGCTTTGGCCTCGATCACGGACTTCCACGCGGCGTGGACGCTGCCGTCCTCGTCCATCGA
+GGCCAGTGCCCGCTCGGCGGCCTCGCGGACCGCCTCCGGGGCGTCGGGGTCCTCGGCGGC
+CTCGCGAACGCTGCGGACCTTCGCGATGGTGTCGCGGGAGTAGCCGACGGCTTCCGCCGC
+TATGTCCCTGGTCTTCGGAATCCGCGCGTCGGAAACTGGTGCAGAATCTGCACCAGTTTT
+CGGCCTGCCTTGGGTGGCCTGCCTGCGTGCTTCAGCAACAGGTTTGAGGATCTTCTCGAT
+CTCACCGGCGATGGCCTCGGCCTCCACGGGGGTGAAGGGCTTGCGGCAGGCGTTCTCGTC
+GGACTCGGCGCGCAGCAGCCGCGCCGCGTCGTCGAGGTCGGCCATGACGGTCACCGGGAC
+GCGCTGCCAGCCGAGCAGTTTGACGGCCTCGACGCGGCGCTGCCCGGCGACCAGCTGGCC
+GTCGGGGGTGACGACCACCGGGTGCAAGAGACCGACGGTCTTGATGCTGTCGGCGAGGGC
+TTGAAGGTCGCCGAGGTCTTTGCGGTGCCTGCCCTCGACGGTGATCGCGTCCAGCGGCAG
+GGACGGCGCGCTCACGCGGCGGCTCCCAGGCCCAGTTCGCGTGCCCAGGCGGGCAGGAGC
+TGCGCGACCGGGACGGCGAGCGCGTCGGCCACCTTCTGGAGCTCGTCGAGCCGCCAAGGG
+CGCTGGCCCTTCACGGCCCGGCACAGGACGGGGTACTCGACGCCGATCTTCTCGGCGAGC
+TGGGCGCGGGTCATGTCGCGTCTGGCGAGCAGGGCGCGCACCTCGGCTGCCACCGCGTCG
+GAGAGGGTGTGGTTTTCGATGGGCATGCCGAGAGCCTAATACCTAATCATGATGTTTGCA
+ACTTCATTAGGTATGTGTCATGGCTCATAGGTGTAGCGAAAGTCCGGAATATGTTGTTCA
+TCGTCATTCCCGTCCGATACGGTGGGCGCATGGTGAAGAAAACGGAGAGCATCCCCCTCA
+CTGCCCTGCAGCTGGCCATCGTGCGCGAGACCCGCGCCGAGCTGACCCGCCAGGGGCTGA
+GGGTCTCGGCGCTCCAGGGCCCCCCGTCGCTGGAGGGGGGCACGTTCGGCGCCGAGCGCT
+ACGTCCGCGCCCGGCTCGGCGAGAAGCCCGCGATCCCGCTCACCCTCCTGGAGCTAGAGA
+TCGTCTGCCGCCGCCTGGGCCTGAAAGTCTCCGATCTCGTCGAGCGCGCCGAGCTCTCCC
+TCGCCGCCGGGCGCATCCCCGCGCCGCTGTGGCCGGAGGAGCGCCCCGAGCGCCAGCCCC
+ACTGGGGCGGCCCGAACCGCCCCGAGCGCGCAGAAACGCCGACGAATCCAGAAAAGTGAT
+AGAGAACACATACATGTCCTGACATCGGAGGACGTCCGCGAATCAGGCGGAAAACCGAAA
+AAACATCAGTGTAATTCGAGGTCAGGGCCACTTTTTGTCAGTGGCCCGTCCGATGATCTC
+CAGCATGAGTAAACAACCGACCACGCGCACCGAACCGAACCAGGACCCAGCCGCCCGCCC
+GAACGAGACCTCGCCCGAGCGCAGAGCGGTCGAGGAGACCGCCGCCGCGCTCGCCCAACT
+CGGGCTCGAAGCCTCCCCGCTATCGGCGACACGCCGAGAAGCGGAAAACGGCGACACGCC
+GACAGCACTTTTATCCACAAGCGAGCGGTTCCCTGAGCTGGGGGAACGATCCGATGTTCG
+GCGAGTCTCCCCAGAACCCCTCGCCGTGTTCGCCGGATTTCAGACGATTTCGGCGAGTTC
+CACACAGCCCTGTGGACAACTGCGCTTGACGATCGCGCCGAAATGCCTAACGTTCAATCA
+CATGCATGTGATTCAGCACTCGGAGGACGACGACCAGGCACTGCGGGAGCGCCTCGCCCG
+CCGTCCCTTCCACCCGTGGCGGGCGCTCGGGGCCGGCTGGCCGGAGGTCGTCGTCGACGC
+CTTCGCCGAGCTGCCAGACGGGGTCGGCTGGGAGCGCGAGGGGAGCTTGATCCGGCTCGA
+CCGCCGCCTCGACGGCGTGGTCCGGCGCAGATGCGCCGCCGCCGCGGCGCTCGCCTCCCT
+GGAGCGCGAGCGCTGCGGCTTCGCGGCCCCGTGCCCAGCCGAGGAGCGCGCGGCGGCGGA
+GGCCGAGGCCGCGCGCTGGCTCTTCCATCTCGCGGACCTGCTGCAAGCCTACGGCGACGC
+GCACGACCCGACCGACCGCGTCGAGCTCGCCCGCCTCCTCGACGTCACCGAGGAAGTCGT
+CAAAGCCCGGCTCGACGGCCTCACCCGCGAGGAGGGCGCGTGGCTGCACATCACGTTCTG
+GAGCGCCGCGTGAAGCCCGACCCCGCCAGCCTCCTCGCGTTCGAGCGCGCGTGGTGGCGC
+AGGGCCGCGAACAAAGACGCCGCTGTCCGCGAAGCGTTCGGGCTCGGCCCGATCCGCTAC
+TACCAGCTCCTCAACCAAGCGCTCGACGACCCCGCCGCCGTCGCCGCGCACCCGCAGACC
+GCCAACCGCCTGCGTCGGCTGCGCGAGGCGCGACCGGCGGCCAGGGCGCTCGGCGCGGCC
+TAGAGGCCCTCGCCTCGAACCTGTTAACGAGGGAACAGATTCGAGCTATAGTATCGAACA
+TTAGTTCGAATAACCGGCGTCGAGCCGGCCATCCCGAGGAGCACAGATGCCCAGACCCGC
+CACCCCGCTCGGCTGCTACGGCAAGATCAACACGAAAGAGGCCCGGCCCGGCCACTGGAC
+CGCCTCGACCTGGTTCCGCGACTGGGACGGCGAGAGCAGGCTGGTCAAATCCAGCGGCCC
+GACCAAGGCCAAGGCCGAGAACGCCCTCAAGAAGAAACTCCAAGACCGCCAGACCCCCGC
+CTCGGGCGACCTGGTCACCCCGGACACCACCGTCGCGGTCCTGTGGGCCGAGTTCCGCAA
+CCAGCTCGTCGAACGGCAGAAGGAGGGCTCGATCTCGGAGGGGACCATCGACCAGTACGA
+CCGCGCGGCGAAGAAGATCCAGAAGGGCCTCGGACAGGTGCGGATCAAAGAGCTCAAAGT
+CCAGCTGCTGCACAACTTCCTGCGCGCGCTCCCGAAAGGCTCAGCCCACCACTGCCGCAC
+GATCCTCTCCGGGATGCTCGCCCTCGCCGTGCGCTACGAGGCCCTGCCCACCAACCCGAT
+GCGCGACGTCCCCAAGACGACCGCCGGCAAACGCGCGCGCGGCTCCGAGTCCGCCCAGCG
+GCCCAAGGGGATCGACGACGAGACGGTGGAGCGCATCCTCGACGCGATCATGACCTCGGA
+CGCCCCGTGCCCGCAGATCGGCCCCGGCGGCGTGCCGACCCCGCGCAGCGCCTACGCCCG
+CAAGCACTCGCCCGACCCGACTCTCAGCCAATACGCCCAAGACGCCGACCTCGTCGACGT
+GATCACCTTCCTGCTCGGCACCGGCATCCGCATCGGGGAGGCGCTCGGCGTCCTGTGGAC
+CGACGTCGACTTCGAGAAACGAATCCTGACGCTCTCCGGAAAAGCTGTCAGGGTCAAAGG
+CCGGGGCATGGTCCGCGAATCCCACACCAAGACCGAGGCGGGCGACGGGCGGCCCATCGA
+GCTGCCCGGCTTCGTCCTGGACATGCTTCAGCGCCGCAAGGCCCAGCGCCATCTGATCGG
+CGCGAGCGGGTTCCGCCACCCCGGCAAGATCCGGACCGACGAGGAGCAGCTGGACTTGGT
+CTTCCCGGCCGCCAACGGGGGAGTGCGCGACATGAACAACACCCAGCGCCAGTGGCGGCG
+CGTTCGGGCCGCGCTGGAACTGCACTGGGTCGTCCCGCACGCCTTCCGCAAGACCGTCTC
+CACCGCCATCGACGAGGGCGGGCTCTCCGCGCGCGTGGCCGCCGACCAGCTCGGCCACGC
+CAAAGTCAGCATGACCCAAGACGTCTACATGGCCCGCTGGAAGCCCCACCCCGAGGCCGC
+GCAGCTCCTCGACGAGCGCTTCGGCGCGATGGTGAAAACGATACGTAAACATGACTTCAA
+CGAGGAAGAGGCCGTGGCGTGA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_014211.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_014212.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_014212.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1309 @@
+>NC_014212.1|provirus_1170297_1209132
+TTAAGCGGTGGGTCTGTCTTCCCTGGGGCCAAGCAGCTCGCCAACGGCCAGGGCAGCTTT
+TTTGCGCTGCGCCCTGAACAGATGTTGGTACGTTTGCTGGGTAAAAGCTACGCTGGCGTG
+CCCTACCCGTTCTGAGACTACCTTGGGATCAACCCCGGCCAGGGCCAGCAGAGAGACGTG
+AGTATCCCGTAAATCATGGAAGCGAATTTCTTTGACTTTAGCCCGCTTGATGATGGCTAG
+AAACTCCCGACGCAGGTTGCTCGGCTCGATGGGGGTTCCCACAGAAGTTGTAAACACCCA
+GCCCTCGTCAGTCCAGGCGTCCCCTATCCCCAGGCGATCCTTTTCTTGCTGCTCCCGATG
+TTGCTGCAATACCTCGAGCACATCGCTTGAAACGTCTACTGGACGGCTCGAGCGGTAAGT
+TTTAGGGGATTGAACAACCCGCTTGCTGCCGGCTTTGGTAAGGTTTTGCCGCACCCAGAT
+CGCGCCTTCCTGCCAATCAATGTCCGCCCACTTCAGCCCTAGCAGTTCGCCTCGGCGCAT
+CCCGGTCATGAGGGCCAAGAAGAAAAGGGCATACAAGCGGGAGTGCTGTGCCTCAGCCAG
+GAAACGCCAGACTTCCTCGGGCGTCCACACCTCGCCGGTGTAGCGTGGCGCCTGAGGGGG
+CTTGACCCGGTCCGCCGGGTTCCAGGGCAACAATCCCCAACGCACGGCGTCCTCGAGCGC
+GGCGTGCAAGGTCCGGTGCACCAGCCGGACGGTCGTTGGGGAGAGGGTTTTGAGCCGCTT
+GGGGTCGTTGGGGTGAATGCGCTTCTTAAGCAGATCAGCGTAAAGGTGAGTCAAGTGCAG
+CGGCTGTAAGCGCTGCACCGCTATATCCCCCAATATAGGGATTGCGTGTTTCTCAAGGGC
+GACTTTGTACCCGTAATGGGTGGTGGGTTTGACTCGGTGTTCTACTGAAGTCAGCCAGCG
+CTCACAAAACTCTTTGAGGGTGATCCGGTCGGGGTCAGGGAGCAAATTGCGGCCATAGGC
+CACCAGCAGCTCAGCCAGCTTCTTGGCGGCTTCTTTGCGGGTCTTGGCGTACCCCCGGTG
+GCGCTTACCGCTGATCATCAACGAATACTCGTAGCGCCCGTCTGCGCGTTTGTAGATGGT
+GCCTTCATTGTTGGCGCGTTTCATAGGTGGTTGTGTGGCGGGGGATGGGGAGGGGGGAGG
+GCATGGGTCAGTTCGTGGGGTCAAGTACTATCGAATCTTGGTCAAGACCCACACGCGTAC
+TTGTTCCAAGTTTTGCGATCTGTGTACCGATATGTGCTTCCCCAAAATTCAGCTAGTTCA
+AGTTGGGCGGTGCGCATAGCCGGGTTATAAGTAGCAATTACGCTGAAAGGGCTGGTTTGA
+CCGTTAAGCACTGGCTGGTAATCTATAAGAGCATCTTGAGAAGTAATGAACTCGTCGTTT
+TTGGTGAAGAAAGAAACTTTAGCAACAACTTTATCCAAGCTTTGGCCTGACACGTTTGTC
+ACCCTACCCTCGGCCTTTACAAAACTGTCGCCAATCTGACTCCAATGCCAATCCTCAATG
+TTGACACTCCCACGGCTAAAGCACGTGGGATTCTTGGTTCGACGAGGACTGCCTACGTTG
+TGTAGGTCTTACACCCTCTCCCCAAGCGTTTAGCGTCTCCGGGTGCCCCACGGCGACGGG
+GATAGCTCGTATCCCTTCGGCCCGGATGTTCAGGGCCGCGTTCAGGTCTCGGTCGTGCAC
+CGCCCCGCACTCACAGGTCCAAACCCTGTCCGAGAGGGTGAGGGCGGTGTGGATTGTCCC
+GCACTCCCGACAAAGCTTGCTGCTGGGGAAGTATCGGTCAATCACGACGAGATGTTTGCG
+ATACCAGACCGCCTTGTACTCCAACTGCCGCCGAAACTCACCCGGGGCCGCATCTAGAAC
+CGACTTGGACAGCTTGGTTTTCGCCATCCCTTTCAGGTTCAGGTCCTCGATGCACAGCCC
+GTCGTACTTCTGGACGAGTCCGGTGGTCAGCTTGTGCAGCCAGTCCTGCCGCTGGTTGCG
+AACCTTGGCGTGGACCCTGTTCAGCCGATGCCTGGCCTTTTCCCGGTTCTTGCTACCCTT
+CTGCTTGCGGGAAAGCTCCCTTTGCGCCCTGCGAAGCTTGCGCTCTGCTTTGCGGTAGAA
+CTTGGGTGGAGCTATTCTTGTACCGTCGGAAAGCACTGCGAAGTCTTTCAAGCCGAGGTC
+AATCCCCACCACATGCTCAGGGTTTACGGGGGGCAGGGGTACGTCGGGCATCTCGAACTC
+GGCGGTCAGGGTGACGTGCCAGTGCCCTTCGGTGTCGCGTTTGAATGTTGCGCCTTTGAT
+GACGCAATCAATCGGCTGGCTCTGGCGAATCTTCACCCCACCGACCTTGGGGAGGTAAAC
+CTTGCCTTCCTCCACCCGGACGCGCTGGGGAATGCGGAAGCGGGGCGGGTCCTTCTTTCG
+GGTCTTGAACCGGGGGAACCCGGCCCGTCGCTCGAAAAACGCCTTGAACGCCCGGTCGAG
+GTCTTGGAGGGCTTGTTGCAAGAGTTGGCTATCCGCTTCTCTGAGCCAGGCCATCTCAGG
+CCGCTTCTTCAGGGCGGTGAGTTCGGTGGCCTGCCCGTTGTAGGTCAACCCCTTCCCGGT
+GGCGGCATACGCCTCCTTGCGCCGTGCAAGGCCCCAGTTCCACACGAACCGCCGAGCTCC
+GGCCATACGCAGCAAAGCCTCAGCTTGGGCTTGGGTGGGTTCCATGCGGAAGCGGTAGAC
+CTTGCGGAGCAGCATTCAGTCCCTCGTCTTCTGGGCGGCGATGTATTGCTCGATGGTTTT
+GCTACTGACCATGCCAGCCGTGGAAACGAAATAGCTCCGTGTCCACAGGGCGGGAAGGCG
+GATGAGTTGGGGAAACTCCCGGCGCAACACGTGCGAGGTGTAGCCCTTCAGGCGGTGGGC
+GACCTGGTTAGGGGCCACGTCGGGGTCTACCGAAATGAACAGGTGTACGTGGTCGGGCAT
+GATTTCCAGGGCGATGATTTCCCAGCCTAGTTTAGCGGTCTTCTCCCTAAGCAGAATATC
+CAAGCGCTCGGCCAACGGTCCTACCAGAATCTTGCGGCGGCGCTTGGGCACGAAAACGAA
+GTGGTAACGCAGCAGCGAGACGGAGGTGTTCTTGTGTTTGTAGGCCGTAGGCACTATCAC
+AGTATAGCACACCTGCCGCCCACCATGCGATGTGCCCCTGCGGGGCACATGGGGGAGTCC
+ATGTATCCCATCCCTGAAGGGAAGGGTTTTATAGCTCCCCCACACCCCCTCGCTTCTATA
+AGATTGCTCCTAGCACCCAGCCCCAACGTTTCCCCTTGGGTTTACGAAAAGCGAAAACCA
+ACAACCCTATGAAAACGATTGGCCATAAAAGGTATAGCATATCTCCCTCCAAAGCTTCAC
+CTAATCTATTTTGAATTTACATCAATGTTCGTCCAACTTAGGGTCATTTGCCATTCAGCG
+TTTCAATCCTCACTCGAGCTTTCGCCCGAGCGCAACTACATTTTCCGCACCAGGGTAGCT
+GCCACCCCAAGGACGCGGTCGTTATCGGTAAGAGGAACCGGCGGGTGGTCGGGGTTATCA
+GAGTAGAGGTACCAGGAACCGTTGTAGCGCTGTAACCGCTTGACGATGACCCCATCCCAG
+TGGACATGCACCGCCACGATGCGCCCCGGCTCGACTGCTCCCCCGGTCCAGAACACCACC
+ACGTCCCCGTCCTTGAGCGTGGGCTGCATGGAATCCCCACCGACCCGCACAGCGAACAGT
+TCAGACTCCGGCTTGCCTTTGAGGTCCGGGATGTGGAGAGTGATGTATTCGGCGTTTTCA
+TTCCACATCGGCGGCCCGGCTCCGGCATCTACGACGGGGATACGATACCGCGTCACCGGA
+ATGGTAGCAGTGATTTCCGACCCGGGGAGCTGGATGCCTGTCTCCTGGGAAAACTCCTCG
+GGAGTCCATTGGAGAACATCCAAAATGCGCTCGAGGGTTGTGGGCTCCTTATATGCTAAA
+TAACGAACCATTGTGTCTACACTAGGGAGAAAACGCGCTCCTGCCCACCCCGGGCTTTTA
+CCTACTCGCTTAGAAAATTCAGCTTGACTAATATCTAGTTGTTTCAAACGAGCCTTGATC
+GCTTCTGCGGCTTCTATTATTGCCACCATACCCCCTCCAGTCAAATACCTTTGGTATTAG
+GGTAGCAAATAAATAACTACTAGTGGTATTGACGCAGCGATTCGTATCGACTACAATGTG
+TAGCGATGATAGGTGAACGCCTAAAAGCTCTTCGAGAGGCACGGCAGATGTCACAGTACG
+ATCTGGCCCGTGCTGCGCATGTCAGCCAAGGGCTAATCTGGCAAATTGAGGCCAACCGTA
+AAAATCCTGGCTTGAAAACGCTATTGCGGCTAGCAAACGCCCTATCTGTATCTCCTGACC
+AACTACTACCTGTAGTATCTCATGTAGGACAGGAGGCCCCCCGATGACTGACCCCACCCT
+CATCTGGCAAGTAGCCGAATCCCTCGGCTTTGGCCGCCGTGTGACCTACACCCCGGATGA
+GGTAGCAGCCATTTTGCGCATGGGCCGCAGGCAAACCTACGAGCAGATTCGCTCGGGGCA
+TATCCGGGCTGTCCGCAACGGTAGCCGCTGGCTCGTACCAGTCAACGCCATTGCGGAATT
+CGTTGGGGCAGGGCGGGAGGCCATCTCCCGATGAAATGTCCCCCGCTAGCGGGCGGGGGA
+GGAAGGAGGAGAAAACAATGTACAGGGACAGTATAGCACAACTCGAACGGGCCAGGGCAG
+AGCTGGCCGAGATGGGCAACCCATACGCCTACCCCGTGCGGGATTGGATAGACGATCATC
+TGCGGCATCTGGCCCTGCAGCGTTATCAAGCGCTGCAGGAGGAGGTCGCGGCGATTGAGC
+GGCGGTTGGATAGGGAGGTGGCGTGATGCCTAGCCCTATGCGGCGCCTCGAGAAGGCCCT
+ACGGATCGCTTTGGGCCGGGCGCACGGCGGCGATGCTGCATACGCCGTGCAAGTAATCGA
+AACCCTCGAGACCGACGCCGAAGCCCCCGACTACGCCCCCCGCCCCTATCAGGGGTGGCG
+GGATGCCCGGCGGCTCATCAACGAGATTGAAGCCCTCGAGCGCTCAGAGGGGGTTGAGCA
+CGTCCGCATCAAGCGCCGGGTTCCATCGGCCTACCGAACCGGAGAGTTTTATGTCTAAGC
+GCAGATTCGACTGGCCTGCTTTCTTCGCGGCCTTCTTTCTGGCCCTCATCGCCTGGGGGA
+TCGCCTTCGGCATCCCCTGGGGCCTGGATTGGATGGATCGGAGGCTGCCCTGATGTGGTG
+GCCCGACGACCTCCGCGATTTCCGCCGTTTCCGCGCGGTGTATGGCGCGGGGCAGTTCCG
+CTGGGGTAGCCCCGCCACCACCCCGGCCAAACGACCAGGGGAGACCAACACCTGCCAGAC
+CTGGACCGAGCGGCAGGTGTTGCGGCTGGCGCGGCTGGGGGAGCTTGATTCTGATCGGCC
+AATCGCGGCGAGCGCCGCTGGCAATGTGTAGCCCCAAGGGGGCAAAAGGAGTGTGTGTAT
+GCCGTTTGTGATGGAAAAACCGCAACAAAATGACTTTGGCACTGAAAGCGTGGTCTTCCC
+CCCCAACACCCCACTCGAGTTCACCCTGGAGAAGATCGAGGCTGGGCTTTACGAGCCCTT
+CAAGCCCGACGGTAGCCGGGATCAGCCTTATCCCCATTTCCGCTTCACCTACAAGGACGC
+TGAAGGAGACATCTACCAGACTCAGCCGATGCGTTTTCCTCGAGCGTTCCAGTTCAACGA
+AAAGGCCGGCTTTTGGAGGCATATAGGGGCCCTTTTTGGCCGCCCACTCACCGAAGAGGA
+CGCTGGAGCTGTGGAGATCGATCTAGGGCCGGGCTTCGACACCTGGGAGGACGTGCTATC
+CCGAGATAAGATGCCTAACTTGTTTGCCAAAAAAGACGAGGTGCGCCCGCTCCAGGTTAG
+GAGCATCAAGGTCCACGGCAAGGAACTGATCAGCTCCGATAGCAAGGTGCTTTTGATGTT
+CTCCACACAAAAGAAAAAAGACAAAGACGGCAAGCCCAAGCGTGACAGCAACGGGGATGA
+GATCGAGTACAGCAAGCTCGAAAGCGTATTTCCGATTTCCAGTGGTGAGAGCGGCAAGAA
+GAAGCGCCCCGTTTAGGAATCCCGCAAGCCCCTACCCGGAATCCTGGGTAGGGGCTTCTT
+GACGCTCGAGGGGACAACTATGGACCACAGCAAACTCACCAAACTCACTGGGGTGGGACC
+CGCCTTGGCCGAGCGGATCGCCAATCACTTTGGGAGTGAAGCCGAAGCCCTGGCGGCCTT
+GTCTGAAAATCCCTATCGGCTGATGGAAGTAGAAGGCATCGGTTTTCGCCGGGCTGACTG
+CATTGCCCAGGCGCATTTTGGGATTTCCCCTGATGACCCTATCCGGCACGGCTACGGCAA
+CGACTGGGTTTTGCGGCAAGCCGGGGGGCGGATGCCCCTCGACCTCTACCAGGCCAGACG
+AATGGAGATCGGACTCTTTGATCGTCGGTACGAGCTATGGGGAGCTTTTTGTGACATCCT
+CCTAGAACCTGATTTGCAAGATTCCCCGGAGTTTGCGCAGTACGTTTGGCTAGAGCCCGA
+GCTTAGGGCCGAACAAAGTTTGGCCCGCTTTTTGGTAAAGGCGACGCGACCAACCACTAA
+CCCTTTTATCATGCCTAACGGCATTCCTACTTATCTAAACGAGGCTCAGGTAAATGCGGT
+ATTGAAGATGTCCTGCCCCGGATTTGTCCCCGCTCTTTGCGTCACGGGCGGGGCAGGGAC
+GGGTAAGACCACGGTGATCGCTGAGGCAGTGAGGCGGTTAGGGGCCGGGGCAGCAAGAAT
+CATGACGTTTACGGGAAAGGCCGCCCAGCGGGTTAGGCAGGCACTCGCTGGGCGTGGTTG
+TGAGGATTTTGCCGAAGTCAGCACGCTGCATCGCGGATTGGATTACAAACCCGGGGAGGG
+ATTCCGCAGGGAACGCTTTACGGAGTCCGTTGTAATCATCGACGAAGCCAGCATGGTGCC
+CAATTGGCTGCTGGCCCAGGTAGTGACGCGGCTAGAGCCCTTGGCAACGCTGGTGCTAGT
+CGGCGACGTGGCTCAGTTGCCGCCAATAGACGCCGGGTTCCCCTTCAAAGACTTTATCGA
+CGCTGGGGTTCACACCGTAACTCTGACCCAAAACTACCGCCAGGAAAACCAGCGGGAAAT
+TTTTGAGCTGGCCGAAGCAGTACGAACTCGAGCCCTCCAGCCCCCACCTTTGCATGCCTC
+GATCTGCGCCACCAATCTTTCCGCCTACGAGTTCAACTACTGGTGTGAAGCCTTGCTCGA
+CCCAGATCAGCTACCCCCTTTGCTGGACTGGCAAGCCATCACGTACAGAAACGCTGACCG
+CGAGCGGATCAACCTGGAGTTGCAAAAAATATTCAACCCCCACGGGGGGAAAGCTTTCGA
+GTACTGGCCCCGCGCCCTCCCCAAGGAAGAACGAAAGCCGATCACGGTAAAGACGGGGGA
+CAAAATCGCGGTGCGGGCAAATGTTTACTCCCTGGAGGTGATGAACGGTCAGACCGGGAT
+CGTCCGGGATGTTAAGCTCGACCGCGAAACCTACGAACCGGTTTCGGTAATTGTAGAAAT
+TGAAGGACGAAGTGTAGAAGTTCCGTTGGAACTGGCTCCAGATCTCCTCGAGTTGGGCTA
+TTGCATCACCACTCACAAGGCCCAGGGGTCGGGGTGGAAGGAGGTGTTTATCTTGCAGCC
+GGGGGCAGTTGGGTTTGACTCCCGGCGCTGGTGGTATACGGCGATCTCGCGAGCTGAGGA
+ACAGCTCGCAATCCTCACTCAAATGGGAACCAGGACCTGGTGGGCCAATGCCACCAAGCC
+TATGCCCTTCGAGCCGAGCAGCTTGCTCGCGCGGTTCCAGCGTTACGCCTCCCAGCCGGT
+GGGGGTTCGTTGATGCCTGGGGCCATGGATACCCACAGCTTCCGCCGTCGTCTGGCTGAG
+GCCATGAGCGAGGCGGAAATCCAGCAAGGGATTGTGAGGTACCTACGGGCTACGGGCTGG
+GTAGTACTGGAGATCAAAGGCAACGCCAAGCGGGGTGGGACGGTATTTCAGACTAAGGGG
+ATCCCTGACCTCTATGCCGCACGAAAGGGACGCAGCTTGTGGCTCGAGGTCAAACGGCCC
+GGCCAGAGGCCGCGCCCCGAGCAAGAAGCGCTCCATGAACGTTTGCGCCAGGAAGGGTGC
+GAGGTGCACGTCATAGACGGGATCGAAGCGCTGGAGAAGCTGTTATGACCGGAATTTTAA
+CTCCTCCTACCACCTACGCCTTTTTCCAACACCTCAGGCTTCCGGAGGAGCGCGGGTTTT
+TGGAGTTTCGCGCTTTGCCTTCTAAAAAGCAGAGTTGGCAAGAGTGGCCCCCGCCCGAGA
+ATTTTGATGGGCTTTATGAGTTTCCTCGCGAAGAGATCTACTTCGGAGTTCTCTTGCGCG
+ATACCCGCAAGGGCAACGCCGCCCACGTACGGCGAGGCAGTGTTGCCTGGCTCGAGCTGG
+ATTTAGCAGGGAGCCTTTACCTTCCCGATTGGGACAAGAAGAGCGTGAAACAGGCACCCC
+CCGAGATCCTTCGCCGGAGCGCGGAGCAGCTTTGGGCGGACCTGGAACTCGAAGCTCGAG
+AGCTGGGACTACCCCCGCTGGCCGCCGTGTATAGCGGGCAGGGGCTACATGTGTACTGGG
+GGCTGGACACTCCCCAGGAGGGGAAGTGGTTGGAGGGGCTCAACAAAAGCTTGATCAAGC
+TGTTTCGCTCCTATAACCCCGAGGAGTCCGCCTTCGACCGCGCCAGAATCCTGCGGGTTC
+CCGGTACGTGCCACAGTAAAAACCCTCAGCGCCCACTGCCGGTCGAGCTACTGTACCTAG
+GCGACGAGCGCCTCCCGCGAGAACGGCTAGAGGCGATTCTGCAGGTCGAGGATCCTCCAG
+CACTCCCCCCGTCGCTGGAACGGGCCATGCGAGCCGGGCTCTCCCCCTGGGAGCCCTCCG
+AGCACGATTTACGACTACTGGTGGAGCACTGGCATGTCGGTGAGCGTAACCAAAAGGCCA
+TGGCCTTTGGTGGATGGTGCGCCTCCCACGGGGTGCCGGAGAAGGTGGCGCTGGATTTGG
+TAGAGCGGATTTGCCGCGAGGCAGGGGATGAGGAGCCCGCCAACCGCCGCAGCGCGGTGG
+CCAACAGCTACCGCCGATATCAGCAGGGGCTGTCGATTCTGGGGTTTTCCAGTTTGCGTA
+AGCTGGTGCCTGGCCTGGAGGGGAAAGGCCGAGTGAGCCTGGGAATGCTTTCCGCCTCCG
+AAAGCGAGGCCCTGGAAGGCGCCGTCCCTGGCGAGAGCCTATCCCTCCCTCCCGAGTACC
+GCCTGGACGAGGCGGGGCGGCTGGTAAAGGTCGAAGTACGCAGCACCCGTTGGGGGATCG
+TGGAGGACATAGAGCTACTGGCCCCCCGCCCCATTGGGGTGCGCGAGGTGTACACCGACC
+TGGCCACCGGCGAAAAGCATTTGCGGCTGTTCTGGCCCGACCTGGATGGCACGGTGGTAG
+AGCGGCTGGTACCGATGGGGGAGGCCATGACCCGGCAAGGGCTGTTACGTTTGGCCGCCC
+AGGGGTTGCCGGTGGACGAACCCAATGCTGCCCAGCTATCGCGCTTTTTACAGATGTACC
+TCTCCCACAACCGCTGGGCACTACCGCACCGGCGAGTCACCTCGCACCTGGGCTGGCAGG
+GAAAAACGTTCATTTTACCCGGCGGCGATGTAGAGGTGCTGGAGGTAGATTCCGAGCCTT
+GGCGCCCAAGGGGCAATCTAGAAGGGTGGCTGGAGGGCCTGAGAGCCCTTCTAAGCTGGG
+GGGTGACCCCGGCCCTTATCGCAGCAGCCCTCAGTGCGACGGCGCCCCTGGTGCGAGGCG
+CGCGGCTGGTCAAGAACCCCATCCTGGCGCTATCCACCACCAGCCATTCGGGGAAGACCA
+CGGCGGTGTACTTCGCACTGAGCATCTGGGGGAGCCCAGAGTACAACGAAACGCTCTACC
+TCGAAGACGCCACGGTGAACGGATTGATGGGTCGAATGATGGCCCGCCAGGATCTGCCGC
+TAGGTTTAGACGACTTACAACGCTATGACGACCGCAAAGTAGGGGAACTGGTGCACTTGC
+TTTCTGGAGGCGCCGAAAAAGCCCGGCTTAAGCGCGATGGCAGCGAGCGCCCGGCCCGGC
+GATGGCGAGGGGTGGCCTTGCTCACTGGAGAGGTGAGCGCATTGCGGGAGACATTGGGTT
+CAGGGGCGGTGAACCGGATGGTGGAGCTCGATGACTACCCTCTGGGGGTGGGCAAAGGAC
+CGGAGGGGGCCGAACGTTCCCGAATCCTGCGCGAAGCGGCTCAGCATTGGGGGCAGGCAC
+GCACCCCGCTGGTCGAGTTGTACGCCGACCTCAACGTGCGGGAGGTAATCGATGCCTTAG
+GCCGATTGGCCTTGGAGGCCGGCGCCCCGGCAGATATGACCGACCTGTGCGGGTTGGTGG
+GGCTAGGGGTACAAATCCTTCAAGTACTTGGAGGGTGGGAGGGGGAGAGCCAGGATGAAG
+CGGCCGTGACCTACTTAGCCCGCAACCTGGTGGAGCTGCGCGAGCGGCACGGCAGCCTGG
+CAGGGCGGGCGATGGAGGCGCTGCGCGACTTCCTGCGCAGTTATGCCGGAGCGGGCGATC
+AGCCGACCGATGAGATCCGGGTACGGGAGGAGCTACAGGCGTTTTACAAGGGGGGGAGCT
+GGTTCATCAACCCTAACGGGCAGGAGGTGGAGCGGGTCATGCGGCGGTATGGAGGGTTGG
+AAGTGCATCTGCCGGAGTGGGCTCGAGCTGGGTGGATTGAGGTGGAGCAGGTAGAGGGGA
+AACGGCGCTATAAACCGTTGGTTCGGTACAAGGGAGAGCGATATCGTTGGGTGGCCGTTC
+CTTTACTTGATCACGCGGAGGATGCTGATGATTGCTAAAACGTCACCACGTGGTGACGTT
+GTGGTGACGCTAGTGGTGACGGTTGTTTTTTTGTGTAGGACGAATAAAACACAATGTGTC
+ACCACCGTCACCACTCTTTATTTCATTTCTATACGCGCGCGTTTTTTTGTACCAGGGGGA
+CCCCCCTACTTAATTAAGTACTTAAGTACCCGGTTAGTAGGGGGGGCAAAAATTTTTGCC
+AAATTTTCTTCTATAAACTGCTTGTTTTAGTGGTGACAGTGGTGACGTTGGGGGATTTCC
+CCGTACAGAACGATAAAAAAGCGTCACCACTAGCGTCACCACAGTGGCACCACCGCAGTG
+ACGGGGGGATGTATGACTGAACCCACCCTCCTCCTCCGCATTGCCCGGTTCTGGGGTGTC
+TCCCTTGCTGACCTATGCCGCCAGTTGCAACCAGAACCGCCGTTGCGCCGGATGGTTGGA
+ACGCTATGCCAGGACTGTTTGAACGGTTTGGAAAGCCACGGCCTCCGCCCTCCGATACAT
+TTGCTCAAAGAACTGCGGACCAATCCCCAGAAAAAGCGCTACGCGCTCTTGCTTGGCTGG
+TTAGAGCAGTATCGGCGTTGGTGTGAGCTGAGTAAGACTCCCTGGACAGAACGCGGGGCC
+GTCCATCAAGAAAACCAGGCAGCCCGGGAAGACCTGGGCTGGCAGATTTACCTGGTGGAG
+TCGCTAATTCAGGAAACTCCCTACCCAAACACTGTCTCTAACTGGATAGAAACGCTCATC
+GGCCTAGAAAAGGAGGAACCTATGCCCATTCAAGGAAAAGTCGCAAACACCAGCTCGCGC
+CTGCACGACCTGGCTGAGATCGAGCAGGCCATTCACGAACTGCCCGGCCAGGTAGAACCT
+TGGGACGCTGACCACAAAATGCTCTACACGTTGTTGCTGGACATCCGCTGCGCCCTGCAG
+ACCTACGGTCCCCGGCACGATCCCACCAGCCTTGAGCAAGATCCCGTCGAAGCGCTCCCT
+GATTATCTGGAGATGTACCGGGAGTATTTGAGTAACTTGAAAGATTCAGACGGAGCTCGA
+ACTGACGACGAGATGCGATATGGGGCTCGGCTGGCCTGGCGAATCTGGCAGATGCTCGAG
+CGCCAAGGGGCTACCTACGAAGATTTAGCAAAGCGAGTGGCACTATTATCTGACCCTTCC
+GCGGCCTAGCCGCGAGGTACCGCCATGCTGAAGGTCCGACCCCTGAAAGCGACAAAGGAC
+ACGGGAGTAGCTAGCCCCTGGGGAGCGGCGGGGGCGACTATGAGGAGGGATTGATTGCGC
+TATACTGAATCCATACACCCCGCTCGAGGGGAAACGGCAGGAGGAGCTGCCATCCCCGAG
+GGCGTGTTGCTCATCCCTGGTAGACCCCAATCCAAGCTCGGCACCCCCGAGTTCGAGCGC
+TGGCGTATGCACGCCAGCCGGGCTGTGCTCGACCAAATCGACAACCCGCCTCTAATCCCG
+TCAAGTTTTCTCGAGCTGGCCCTCGACTTCTACTACCCCTTTGAGCAGCCCAGCTACACT
+GCTGACGACCTGGCCGAGCACCGCATCCCCCGCATCACCGCGGCAGCTGAGCCGGTGCTG
+ATCGCCCTGGTCGGGCTATTGTTCCAGCGTCGAGGGCAGATCAGTAGCCTGAGCGTCACG
+CGGATTGTGCGTCCTGCTAGCGCCCTCGAGGCGGAGTGGGGCGAGGCTTGGCGTAGGGGT
+GGGGTGCGGGTGCGGTATTGCGCGGAGGATGAGGGGCCGTGAGCAAGGAACCGCACCGTC
+CGACTCTTAAAAACCCACGGAGCCGACGCGGGGTGCCTCCTAGCGAGGAACAATGGGAAG
+TTTTCCTGGAGGAGCTGCGCCAGCACGCCACTGTCAAACGGGCAGCCAAAGCGGCTAAGA
+TCCACCACTCCACGGTGTACGAACGTCTGGCTAAAGATGAGGTTTTCCGCCGTGTGGTTG
+AAGAGGCCCTCGAGGTCGGCGCGGTTGCGCTCGAGCAAGAGGCCATCCGCCGCGCGGTCG
+AGGGAGTCAAGGAGCCCGTTTTTTATCAAGGGCAAAAGGTTGACACGGTAACCCGCTACT
+CCGATACTTTATTGATTTTCCTGCTCAAGGGGCTCAAACCCGAGCGTTACAAAGATCGGC
+ACGAGCACACCGGCCCCGGTGGCGGCCCGATTCAGGTGATCAGCATCGAGGTGGTGCCCC
+CCGATGACGCTTGATCGCGATTTGACCACTGTGACCCCGCAGGGCAAGCTGCGCTTCAAC
+CTGCACCGCGGCCAGTGGAAAGCTTGGCAAAGCTCAAAGCGCTTTGTGCTGGTGCTAGCG
+GGTACCCAAGGCGGCAAAACCAGTTTTGGCCCGCTTTGGTTGTACCGCGAGATCCAGCGC
+AAGGGGCCGGGGGATTATATCGTGGCGACTCCGACTTTTCCCCTACTCGAGCTAAAGCTG
+CTGCCGGAGTTTCGCAAGCTTTTCGAGCAGCACCTATTGCTAGGTCGCTACGTCGGATCA
+CCCAGCAAAAAATTTGTCTTCAGCCCGGAGGGCTTCGAGCGCACGTTTGGGCGTAGGCCA
+GGGCCGGACGACGCGCCGGTGCAGGTGTTTTTTGGCCATGCCCAGGACCCTGACTCGCTC
+GAGTCTGCCACCGCCAAAGCCGCGTGGCTCGACGAGGCGGGGCAAAAAAAGTTTCGGCGC
+GACTCCTGGCAGGCCATTCTGCGCCGCCTTTCCATTCACCAAGGCCGGGTGCTCATCACC
+ACCACGCCCTACTATTTGGGCTGGCTTAAGGCCGATTTACACGACCCCGCCCGGCAAGGC
+CACCCTGACATCGAGCTGGTCAATTTCAAATCGGTGGACAATCCCAATTTTCCTCGAGCC
+GAGTACGAGCGCGCTCGGGCTACCTTGCCGCGCTGGAAGTTCGATATGTTCTATAACGGG
+CTCTTCACCCGGCCAGCAGGCCAGATCTATGACTGCTTCGACCCCGAGGTGCACGTTCGG
+CCAGCCTTCAATGTCCCCGAGGACTGGCCGCGCTTCATAGGCCTGGACTTTGGCGGGGTT
+AACACCGCGGCGGTCAAGCTCGCCAAAAACCCGGCGTCCGAAGAATATTTTGTTTATGCC
+GAGTACAAAGCCGGCGGGCGTACAGCCCGGGAGCACGCTGAGGTTTTGCTGAAGGGCGAG
+CCCCGGGCGCCCCACGCGGTGGGCGGGGCCAAGTCGGAGGGGAACTGGAGGCTCGAGTTT
+GCCGCGGCGGGCCTGGGTGTGGCCGCCCCGCCGGTGGCGGATGTCGAGGTGGGTATTAAC
+CGGGTATACGGGCTGCTCAAGAGTGGGCGGTTGTACGTCATGGATAGCTGCCCCGACCTC
+ATCGACGAGATCATCAGCTACAGCCGGGTACTCGACGAGAACGACGAGCCTACCGAGCAA
+ATCGAGGACAAAGAGACCTATCACCGCGCCGATGCCCTGCGCTACATCGCCACTTATCTC
+GCGCGCGGCATCAATGACTGGCAAGTGAAAGGAGAGCACGCCGGATGAGCCAACGTTTTG
+ACGTGACCGGTCAGAGTGTCGGGTGGGCCGAACCGCCCCCCCTCGAGCTGCGCCTATCCC
+CCGACGCGGCCACCAACCCCCGCATTGAGGAGAGCTTGGCCAGCCTCACTGCTTTTGAGG
+CCACCCCCATCCCCTGGCCGCTGGACCCCGCTACCCTGATCGACGTTTGGTACGGGAGCC
+CCTGGCTGGGGGCCATCGGGCGGCTATTAGGGGACGCTCTGGCATCGGCCAATTACGACC
+TCGAGCCCGCCCCTCGCCGCCCCGACGGTACCCGGTTGGGCCGGGGGTCAGGGCAGACCC
+CCCACGATGAACGGCAGTACGACCAGGGCATGGCTTGGCTGGAGCGCGAGGACCTGGGCC
+AGGACGGGCTCAGTCTCTACAGCCTGCCCGAGCTAGCGCGCACCCTAGCGCTGCACCTGG
+ACCAGACCGGCAACGCTTTCGTGGAGGTGGTGCGCGACCGGGCCGGTAGGGGCCCGATCC
+GGCTCGCGGTTTTGCTCCCGCAGTTCGTGAGCTACGTGATCCGCCGGGAAGACGGCATCG
+CTAAGCCGATGCTCTACCAGCTCGATCCCTACTGGGGCCAGCAGTGGTTCATTCCCTTTG
+GCACCCGCCTTCCGGGTGCGCCCGAGCGCGAGTACCTCCATCAACGCCTCCCCAACAGCG
+TGAGCAACGTCTACGGGCTGCCCCCCTGGATCGAGGCCCGGCAGAGCGTGGAGGTGGACA
+ACGCCCACCGCGCCTACTTGCGGGGGTTTTTCCGCTCTCACGCGGCCCCACGCTGGCTGG
+TCGAAATCACCCAGGACCCAAGCTGGACCGGCCCCCAACCGGCGCAAGAGCAGGTGGACC
+AGGTACGGGCCCTCATCGTCAACTACCTCTCGGCCAACGCCGGGGAGATGGCCGGGCGGA
+ACCTAGTGCTCTCCTACCCCGGGGGAATCCTGCTGCGGGCCACCCCGATGGATCAAAAGA
+TCGATGATCCCACCTTCGGGACCACCGCCAAAAACGCCCGCGACGAGATCATGGCGGTGC
+GCCACGTGAGCCTCATCAATCTGGGGCTTCCCGAGGGCGGCTACCGGGCTACCGCCGATC
+AGCAATCCGACAACTTCGACCGGCAGGTACTCGAGCCCTTCGCGGCCCCCCTGCTGGCGA
+TGTTCAACCGGGTGTTGCGCACCCCGCCGCCCTCTGGGCTGGGCATTACCGACTACCGGC
+TGGTGGCCGAGTTCCGCGATGTGGACATCCTTCAGCAGCGCATCGAGGCAGTGATTAAGG
+CTGCAGGGCGCCCCGTGCTCAGCGGCGACGAGGCCCGTGAGCTGCTGGGCTACGAGCCGC
+GCGGGGACGACGAGGTGCTAGTGCCCGCCGGGCTGGTCCCGGCGGGCAGTTTGGTCCCCC
+CACCCGGCCCCGATGATGGCAGCCCGGAATAGCCCCCGCACCAGCCGCCGCCACCTAGCT
+GAGGTCGAGGCGGCGGTGGCTGAGTACGCCGGGTTGCTATGGCAGCGGGCGGCTGCCTGG
+CGGCTACGCTGGTTGCGCTTGGTGCTGCGCCGGATTCGCCCCGCCCTGGAGCGCTTGATA
+ATCGTGCGCACCCCGCCCGAGGCGGTGCTGCTGGAGCAGCTCATCCGGCAGGCAGCCCTC
+GAGTTCCCCATCCCCGACCTCAGCGACACCCTGACCGAGCTGGGGCGGAAGATCGCTCTG
+CAGTATGGCTTCCTCCCCAACGACCCGCGCACGGCGACGCTCGAGCGGGAGTTCAAAGCC
+CTGCTTGAGTCCGACCTCTCGAGCTACTGGCGCACCCTCACTGACCCGGCTACCCTGGCT
+AAACGATTGGCCGAGCTGCGCGATCAGAATAAGAGCACTGCCCAGATCATCCAGGCCGTG
+CAGCGGGAATACGGCGCTGAGTATTTTTCCGCCGAGCGCCTGGTCCGAACGCTCTACAAC
+TCGGGGGCTAACCGGGCTCAGTACGAGGCGCTGCTGGCCCAGGGCTACACCCACCTGCGC
+TGGCTCACCGCGCGGGACAACCGGGTGCGCGTAGCCCACGGCTCGTCGAGGTTTGACCAC
+CGCCGCATGGACGGGGTGATCGTGCCCATTGGGGAATTTTTCATCACCCCATCGGGCTCG
+AGGCTGCGCTACCCGGGTGACCGCAGCCTGGGGGCTCCGGCGGGGGAGGTGGTGAACTGC
+CGGTGTACGGTGGTGGGGGTGGCACTTGGGAACGAGAATGCTCAACTATCGCGCAATGAC
+TTGGATCTTCCCGCACCTCCCGCCCAACCCCGCCGTCAGGATTAGGTTCCAGTAGGCTCC
+CCCTGGCGAAGCTTTCTGCGTCTGCCCCGCAAAAAACTCCTCGAGATCGACCAAGAGGTC
+TTCGAAGTAGTAGAGGAAGCCGCTGCTATCGCTTCGAAGGTTCATGGCTTGCAGGGGCTA
+CCTCGAGTACCGGTAGTGCAACGGTTGCTGGATCGTGATGAACTTGCCCGTTACGTCCCG
+GACCCGGAGACTGGAGATCCGGCATACATCGGAGTTCAGAAGGGCAAGACCACCTTGCTG
+GCAGTCCTGGAAGAGTTTGGCCACATGATCGATCATCAAGCATTTTTTCGGGGCCAGTAC
+GCCAGCCGCGCTGCGCAACAAGGCCAAGGGCCGCTGGTTAGGTGGTGGGAAATTGTCTGG
+GAAACTCAAGCGGTTAGAGAGTTGCGCTCGTTAAGGCGCGCGTTTTACACCTTCGACATT
+GAAGGGCGGAAAAAGGTAGATCGGGGGTTTGTAGCCTACTTGCTTCAGCCCGACGAAATT
+TTTGCCCGTAGCTATCGCCAATTCATCGCGGTCTATTCCGGTGATCCGCGTTTGTTGAAG
+GCCATTGGTTCACCAAAACCACCCCCGGAAGCCCCTGTCTTTAGACATGGGGAGGAAGGG
+GGTGGCGAGCGAAGCTCGCTGAATGGTCAAAAGCGTGATAAACTGAGTCAAGGTATGTCC
+CTCCTGTCCGTGCGTTGCAAACTGATACCCGACGCGAGTACGGCCGAGAAGCTGACCCGC
+ACGGTGAACCAGTTCGCGAATGCCTGTAACTACACCCTCCAAGTCGCAAGGCGGGACAAC
+CTGTGGAACAAGTTCGCCCTGCAACGTGCGGTCTACCGGGAGCTTCGGGAGCGGTTCGGC
+CTCAGCGCCAACCTCGCGGTGCGGGCCATCGCTCGGGTGGGCAAGCGCAAAGGCCACAAA
+GTGGGCGGCTTCAAGGCTACCAGCGTGGACTACGACCAGCGCATCCTCTCGGTCAACCTG
+GACACCGAAGTGGTCAGCCTCTCCACCGTGGACGGGCGGGTGAAAGTCCCCATGCAGATT
+GCGGGGTATCAGCGCCACCTTTTGCGAACCGCCAAAAGCATCCAGGGCGGTCAACTGGTC
+AGGGGGCGGGACTCCTGGTACGTCCACCTGTGGTGCGAGTACGACGACCCGCCCGCCATG
+ACCCCAAACGGCTTTCTCGGGGTTGACCTCGGCATCGTGAACATCGCCACCGATTCGGAC
+GGAGAGACCTACTCCGGCTCCCACCTCAACTCGGTTCGCCACCGCCACCGGAGGCTCAGG
+AGGAAGTTGCAGAAGAAAGGCACCAAGGGGGCCAAGCGCCGCCTGAAGAAGCTCTCGGGC
+AAGGAGGCCCGCTTTTCCAACCATACAAACCACGCGCTCAGCAAGCGCATTGTCGCCAAG
+GCCCAACGCACCGGGAGGGGTATCGCCATCGAGGATTTGGGTGGCATCCGCGACCGGGTA
+CGGCTCAGACGGCCTCAACGGGCGGCCTTGCATAGCTGGGCGTTCTTCGACCTGGGCCAG
+AAGCTTCGGTACAAGGCTGAACGGGCGGGAGTCGTTCTGGTCCAGGTTGACCCCCGCAAC
+ACTTCCCGCACCTGCCCGGCCTGCGGGCACTGCGAGAAGCTCAACCGCGTTTCGCAGGCA
+CAGTTCGTCTGTCGGTCGTGCGGCCTCGTTGGGCACGCAGACCACTTCGCAGCCGTGAAC
+ATTGCCGTTCGCGGCTGGGCCGCTGTAAACCGGCCATACCTGGGGGAAGCGGAGAGTGCT
+ATCCGGCATAATCCTGTCCCTGGAAGCCCCCGGCTTTAGCCGTGGGGTGGTTTACGGCAA
+AACAAACCGGGTTTCGAGATCGGCTATACTATACAGTGGGCAGATCAGGAGTTCGCAGAG
+ATCGCGATCGAACTTGAGGACGTTTTCAGGAGGCTAGGATGGCTGAGATAACCGAAAGGA
+AGCGCGAAAAGCAGACTGCCGCGGCTCGCCGTCTTGAGCGTTTCCGCAGCATGGGCATTG
+ACGGGGCGGAAGCACGCATCTATGCCGGGTTGGGGGGGGGTCAATACCGCAGCGCGTCGG
+AAGGCCCGCGCCGATTCGAGCCGCCTACCCCCGAAGAACTCGCCACATACGAAGATTGAG
+TGTGCTATAGTTAACTCATACATCCCCCTAGGGGAAGGCCCACCGGGCACCTCGAGGGGG
+ATTTTTCTTTGCCCATTCACTCTTTTACCCACCGCATCCCGCTACAACTGCGGCAACTAC
+GCCAGGGCGTCGTGCTGGTGCGGGCCAGCAACGACACGGTGGTGGATGAGTACGGTACCA
+CCATCACCGTCGAAGCGCTGATGCGGGACTGGGTGCCGGCGTTTTTACAGCACCGCACCA
+TCAGCCTGCAGCACAACCTGCCGGACCTGCGCGGCATCCAGGGCAAGCCCTTCGTGGGGC
+TGGCCCGTCGGGTGGACTTTGCTCCCCAGCTCGAGGTGGAGGTGGAGGTGCTCGACCCGG
+AGACCCAAGCCCTGATAGATGCGGGCCGGATCACCGGGGCCAGCCTGGAGTTCGTGCCCC
+TCGAGTCCCGCACCCAACGGGTAGGTGGCAAAGAGAGCGAGGTCTACTACCGGCTGGCGT
+CGGAACCGGAGCTCGCCGGGCTGACCCTCACCGACCTCCCGGCGGTGCCGGGGGCGGAGG
+TCCTCGAGATTCGGGCCGAAGTCCTGGCCCCCTGGCAATTCGCGGTGGTGGACCCCGCGG
+TCTTCGAGGCCCGCAGCCTAGCCGACGCGACGCGGCTGATGTGGTTCCCCCACCACGACG
+CCCCAGGCTTTTATCACAACCCTCGGATTAGCCTCAGCAGAACTTTGGGATCAGCCGAGA
+ACTTTCTAACCGAGCGCAACACCGGCCACCTTTTGAGATGCAGGAGGTTCAGGATCACAT
+CCCGTAGGTACATCAGCCCCGCCGCCCCCTTGCGGCTGCGGGAGGCATCTTCTCCCAACA
+CCGTGTCTCGTTTATGGTGTAAGCGATTCTCTACCTCCCAGTGTCCCCGCCACAGGGCAT
+ACAGCCGCTTGGCCGGGGCCTGTAGGCTGGTCAGGGCATAGGCGGTCTCCTCCCGTAGCT
+CCCCGCTATTCTTGCGCACCACCCGCCGTCGCATCCGCAAGGCCATCCGCGAGCCCCGCC
+AGCCGCTCACCCCCTCCGGCAGGGGGAGCCCTTCCAGGTGCCATATCCAGACCTCTCCAC
+CCCGAACCTGGTGCTGGATGTAGTGGTCGGTCGCCTGGTAGTTGGCAAAGGCCCACTGGA
+TCAGTTCCTTGAGCTCTGCCTGGTTCCCTTTGACGCTGAACAGATACCCCCCTTTTGCTC
+CACCACCACTGCCGCCAACTCCTGGGTGCACAAGGCCGCATCCCCCGTCAGTACCCAGTC
+CACCCCCAGCCCCTCCATGTGTACCACCAGTCCCTGCGCCGCCGCTGCCTCACCGTCGGC
+AATCGCCTGGCTCCCCAAGGAGAGCCCCAGCCCCTGAACCAACGCCGACAAAAAGACCAG
+CGCCTCTTCCCCTCGCCAAGCACACCGGGTGCCCCGGAGGTGTTTACCGTCCACGGCTAC
+GGGCAAGGGTTCATCGCCCTCCTTGCCCAGGGCCTTGAGTACCTCCCGAGCCCAGGATAG
+TAAGGCCTTTTGCAAGGGTTGTAGGTCCTTGCTCAAGGACCAAAAGAGGCGGTAGAGGGT
+GGCTTGCCCGGGTAGTTTGCGCTCACCCCGGCGGGTACGGATATGGACCTCGTCCAGCAA
+GAAGCGTCGCTGGTCTTGCACCCACTGGCTGACGGCCAGGATATTGTGCCGTCCCGAGCC
+CACCGCCATCAAGCAGATCAGCAGCAGGTCTTGCCAGCGATGCTGGGTCTTCAGGTACTC
+GCGGGGATCGGGTATCTGGGCTAGGTATGGCAACGGAGAGGGAATGGAAGCAGTTTTCAT
+ATGGCTTTATGATAAAAGCCTGACGACGCCCGCACGCACGCGGTGGACCCGGACCTGCTG
+AGGCAAGCCCTGGCTGATCTCGAGGCCGGGCGCTTCGAGGTATCCGCCGCCGCAACCCTA
+TCCCGCGAGGAGGTGGCACGCCGCGCTCGAGCCCACCTGGAACGGCACACGGCCCTAGGC
+ATCGGTATGCGTACTACGGAGGAAAACATGGAACAAACCCAATCCCAGGCTCCTACCCAG
+GAGCGCAGCCAGCAGGTTGACCTCAACATCAACCTGGACTTTCGCACCCCCGCCGAGCGC
+GCCGCCGGCGTGGCCGAGACCCCCGCCGAGCGCGCCGCCCGTGAGCAGCGCGAGCGCCAG
+CAGCCCACCGCCCCCAACCCCGCCGAGCGCTGGCTTCAGGCCCGCTCCGCCCAACTCGAG
+GCCGAGGGCACCCCGTCAGCCCAGGCCGAGGCCCAGGCCCGGCAGGAGCTCGAGCAAAAC
+CCCGAGCTGGCCCAGCGGCTGGCCGAGGCGGGCCGTGAGCCCACCGTCGAGGAGCGCGCC
+GCCCGCGCGGCCGCTCAGGCCGTGACCGAGGCCCTGTCCCGCCTGCCCGAGCCCCCGTTG
+GCGCTGGTTACCGACGGCGGCATCTCGGTGCGCTCGCGGCGCCCCACCAGCGATGAGCTG
+CTGTCCGAGATTTTCGCCCGTTCGGTAATCCCTCAACTGCAGCGTCGCCAGCCTACCCCC
+ACCGAGCGGCAGGAAATTGACAACATCCTGCGCCGCAACGGGCTCGACGTGCGCGCCATC
+ACCGTTGAGGCCAACGGCACCGTGATCTACAACGAGCTGGCCCGGCAGTTCGTGGTGCGC
+CCGGAGCCCGATATCATCGCGCGTAACCACTGGGCCAGTGTGCCGATGGGCGGGACCAAC
+AAGCGCACCTTCCCCCGCTTCGACCGCGGCGGCATCTCCCACACCTGGGGGCGCACCTCC
+ACCACCGCCATTACCGAGAGCGACCCCACCCTGGACACGTTCGAGGTCGAGGTCACCGAA
+CTCAACTCCAAGGTGCCCGTGCCCGATAGTTTTTCCTTGTTCAACGCCCAGGGGCCCAGC
+TTCATCCAGCGCGTGCTGCTCCCGGCCATGCGAGGAGCGGCCCAGTACGAGGAGGACCGC
+GCCTTTTTCCTCTCCAACGGGGTGAGCCCTAACCCCACCAAGATCATCGGCCTGCGCAAC
+AAGACCGGCGTGACCGTGGTGGCTTCCTCGGCCAACGGCGACGCCTTCACCCAAGACATC
+CTCACCAGCCTGCTGCGGGCCATGCCCGTGCGCTACCGCAATGACACCAGCCGCCTGGCC
+TACTACTTGCCGGTAGCCCTGGCCGATGACTACGGCGACATCCTGGCCGCCCGGCAGACC
+TCTGGAGGCGATACCTGGCTGCAGCGCTTCGCCAATCAGCCGGGGCCCATGCCTATCGGG
+GTCCACCGCGGCATCCCCATCTACTCCGTCTCCCATTTGCCCACCAACGAGACCCAGGGC
+ACCAGCAGCAACGCCGCTACCATCTACCTGGTGCACCGCGACATCCCGGTGATCGGGGAC
+GCGCTATCCATTCGCATCGAGCCCTATCGCCGGGAAAACTTCATCGACGTGCTGCAGCTG
+CAAGGGTTCGTGGGGCTGGGGTACCAGTGGCCGGACGCTATCGTGCGCCGCTCCGGTGTG
+CTGCCCAAGGTTTAGGAGGTAGCGCATGGCTAAAAAGAACGAGAGTGCCGCCGAAAACCT
+CGAGTCTACCCCAGCCCCCACTGGGCTGGTGCCGGTGCGGCTCAAGCCGGATTCGCCGTA
+TGGCCGGGTGGTGGTGGGTACCGTCGTGGTCGAGCGCTCTAAGTCGCCGGGCGCCGACTG
+GCCGCTGATTCCGGCGGAGGAACTCGAGCGCCTGGCCGAGGAGTACGGCCTCGAGGCCGT
+ACCCATAGACGAGGAGTAGCGTGGGCTGGCTCGCCCCATACGCCGACGACCTGCTACGCC
+TGGCAGGCTACCCTTCCCCCCACCCCCTGGCGGGGGATGCGCTGACCTATGCCGAGCAGG
+CCATCGAAAGCTACACCCGCCGGGTGTGGGGCTCGAGCCAGCCCTTTACCCAGCGTGTGT
+TTACCACGGCCAAATCCTACGCCCTGCCCCTGCCCCCAGATGCTACCAGCGTCGCCACCG
+TCAACGGCAGCCCAGCTCCGACTGGGGTCACCTGGAGCATTACCGCGCTGGGGCTCGAGG
+CCACCGACGCCGAGGGCCGACCGGTGGCCTGGGCTCCCGGCGTGTGGACGGTGGCCGGGC
+AGCGCGGCAGCGCAGCCATCCCCCAGGGAGTGCTCAAAGCCGCCAGCCTGCTGATCAATG
+CCTATTTGAGTCTTTCCGACGCCCAGCGCAGCCAGATGGCCAACGCCAGCCGGGGCGACC
+TGAGCTACTCGATGCGCTATGCCCAGCTGAGCGTGCCCGAGGCCGAGACCTATTTGGCTC
+CTTACGCCAACCGCATCGCCGGGGGGCTGTTGTGAACAACGTGATCGCCAAAATCTACAA
+CACCAAGCAGCGCCTCGAGGCGGGCTTCCTCACCGACGAGACGGGCAGCCTGCTGCTCGA
+GCAGCCCGCCCAGCTTTCGAGCCCCACCCGCCCCTGGGAGCGTGCAGCTGCGCTGGAGGG
+CGTTTTCTCGGCCACGCTCTACGTGCAAAGCGCCGAGGATCTGACCCAATCCGACCTCGC
+CGTCACCGAGGAGCCGATTAGCGGACAAACGCGGCAGTGGCGCGTGCTCAGCCACGCCAA
+CAGCGGCCCCGAGTGGCGCTTGGAGCTATCCAGCCGGGAGGTGCGCCGTGGCCCTTGATC
+CCAGCGTTCGGGCCAAGTTGCGCCGCAAGCTCACCGCAGGGCTGGCGGGCGTGGCCGTGG
+CGCTGACCAACGAGGCCAAGGTGCGGGCCACCCGCCACGTGGACACCGGGGAGCGCCGTA
+ACTCCATCGCCCACGCCGTGCTGCCCAACGGCTCGGTGATCTGGGGCCTGCCGGGCAACG
+CCAAGAACGCCGCGCTCGAGCTGGGCTTCCGCCCCCACTGGGTGCCAGCCGGATATATCG
+GAGTATGGATGCGGCGGCATGGATTGACGCGCGGCAAGCTAACCCGCCGAGCCGCAGGGC
+TCTACGTGGGCGGGCCGGGCTCGAGGCTCGACAGCGGACCCGGTGGGGCCAGCGGCACCC
+GCCGGATCGGCAACAAGAACGTCTTTGGGCGCTGGCGCACGCGGGGCGAGGTTAGCCGCT
+ACCTCGCGCCGGGGAAAGTAGGCCACAGCGTACTGCGCCACACCGTTGCTACTCGCCTGC
+GGGTGGTTGCGCCTGCTGCGTTTATCAGGGGGTACCAGCGTGGCTAGCTTGCAAGCCGCC
+GCGTTGCGGCAGTTCTACGCCGCCCTCGAGACCTACCCCCCGCTGGTGGCCCTCACCGGC
+CACGTCCCCGGCGCGACCAGTCTGGGGGCGGGCGCTCGGATTATTGGCGACTCGGTGCGG
+TTGCGGCCCCATCCCATCCCCGGCGTGGTGCTCGGGCTGGGGAACCGCAACCAGGGGGGC
+AAGGCCACGACACACGAGGCTCTGCGGGATTGGGAGATCAGCCTGCTCGTTTGGGCTGAG
+GACGTATTCCAGGCCGCGGAGATCGCCGAAGCGGTCGAGGACTTCTGCTCCCTGGCCCGT
+TGGGAGACTGGCCCGGTGCGCCAGGCGCAGTGGGTCTCGAGCCAGCAAATGGAGCTTTCT
+CAGGACCAGGAGTATATCAGCGTGCTGATCACGGTGCGCTTACGCATCGCATAGGAGGAC
+ACATGGGACGTTCGGCGGTAGACACCAACAAAATCGGCTTTTCGGCGGGGGCCCGTATGT
+TCGAGGGCCCGGTAGGGGCCACCGAGGCCTCCCTGCGCCCGTTGGGGCTACTGGGGGCGG
+ACGCCACGCTCAACATCGGCCAGACCACCAAGCAGAAGCAGGACCGGGCCCCGCTGGTAG
+TAGTCAAGCAGGCCATCAACCAGCAGTCGGCGCAGATTCAGGTAGTGCTCCACGAGATCA
+CCCAGGATAACCTGCGCCTGGCGTTCGGCCTGCAGGACTCGGACCTCACCGCCCTGGCCG
+GGGGCGACGTGGTGGTGACCGACGAGCAGGTGGTGCTCGATGCGAACGGGAACGGGGTGC
+TGGCCAATCCGGTCAAGACGGGCAACGTGCCGGTGGTGACCAACGTGGGCGGCACCACCA
+CCTACGTGGCCGGGACCGATTACATCTTTATCCCCCGCGACCAGTTCGGGCGCAGCGTGA
+TCTACCGGCTTTCGACCGGCGCGATCCCCAACGGGGCCACGCTCGAGGTGGATTACACCT
+GGACCCGCACCGCGCGGGTGGAGTTCCCCATCGGCTCGCGTACTACCGTAGTCGAGCGCA
+AAATCAAGCTCGAGGAGGAATACAGCGACGGGCGCAAGCTGGTGGCGGTCTTCTATCGCG
+CCGTCTTGAGCATCAACGGCAACATCACCGTCAACACTGACGGCGAGAACGGCATGAGCG
+TGCCGGTCACGGTGGATGGGCTCTACGACCCCACCCAGAACAAGATCGTCTCGATTTACC
+TGGAGGGCTAGTGGCTAGCCAAGCCAAGCTGATCGAGGAATTGCGCGCCCGCGTGGCCGA
+ACTGGAAGCCCGTCTGGCTGCGCTCGAGCCCGCCCCCGGCTCCACATCAGGGCAGCCGGG
+GGAGGTGCGCGTAGGCGGGCAGCCGGTGCGGCTCAGGCCGCTTTCCCCAGCCCAGTGGGT
+GCTGGCGTTGAAGGAGCTGCCCGGTTTCCTGCTGGCGTACGCCGTGCAGGAAGCGCGGGG
+CCAGGAACCCGAGGAGGCATTGCTCGAGCGGCTGGTGAACACCGCGCGGCAGTGGGTGGT
+GGCCTGCGCCATAGACCCCTGCGACCCGGCGATGCTCACCATCCCCGAAGCTCAGCAGGT
+GCTGGTGGAGGTGAGCCGCCAGAACGGGCTGGACGCGCAACTGGCGGAGTTTTTTCGCCA
+GCGACTCGGCCAAACTGCTGGATCAGGCAGCGCGGCGCTACGGAGTCCGCCCCAGCCAGA
+TGCTCGGGCTAACTGATTCGCGGCTAGCGCTAGCATTTGACCTGGGGCTGGCCGATCACT
+GCCTGCGCTGGGAGCTCGAGGAGGGATTAGGCGAGTTTTGGTGGATTAGCGTATTGCGCG
+CATTCACCGGCAAATAGGGGGGACTGTGGCCGAGCAGCTGAACCTGGGAGACCTCATCTA
+TCATCTGGGATTTGCCAACCAGGATGAGTTTCTGCAGGCTCTGCAACGAGTGCTTGAGCA
+GGCTGAGGCCAAGGCCAAATCGGGCGGAGGCGCCGGAGGCCGCGAGTTCGGGGAGGCGTT
+CGAAAACGAGGCCAAAAAAGCCCTCGCCGGAACCGGGTCGCAGCTGGTGCGCTCGCTGGG
+GCTGGACGCCGTTGGGGTGTTCCTCGGCAACGCCCTGTATAACGCATTCCAAAATGCGCT
+GGGCGCGACCAAACAGTTCATCGGGCAGTCCGTAAACGAGTTTGCCCGCTATGAACAGGG
+GTTAGTCCAGCTGAGGCTGGCTGGCGAGGAGAACCTGGGGGCCGCCGCCGCCAAGATCAA
+GGAGATTGCGGAAGCTTCGAAAGTCTTCAGCGAGACCGACGTAAGCCTCACCCTGGGTGA
+GCTGGTCAAAGCTGGATTCGACGCCAGCACCGCGATGGAGCTGACGGCTAAATCCACCAA
+CCTGGCCAGCGCGGAAATCGACACCGCCACCGGCAAATTCCTTGACCTCACCAGCTCGGC
+CAAGTCGGTCTCGGACATCCTCTCTGGCCTGGACTACAACGTCAGTCAGGCCGGGCGGGT
+CATTGACGTGCTGGGCAAAACCTCGCAGGACTCCAAACTGTCGCTCTCCGACCTGGTCCC
+GGCCATTGCCAGCGTCGCGGGGACGGCTAGAGGGGTGGGCCTCGAGGTCGAGGACCTGGG
+GGCGACCTTCGCCGCGCTCAAAGATCGGGGTATCCCCGCCGCCGAAGCGGCCACCGGGCT
+GCGTTCAGTCATCAACTCGCTGATTCAGCCCCCGGCTACAGCTAAAGACGCGTTTGAAAA
+GTTGGGGCTCGTCTTCATCAAAGCCGACGGGAGCACCCGCAGCTACGCCGAGGTGCTGCA
+AAACCTCAACCGGGTGGTAGCCGCCGGGCCCAGGGGGGTTCAGCTATTGGCCCAGGGGAT
+GGACACCTTCGCGCTCAACACCGCCGTGGCCCTGGGCAAATCCTCGAGCGCCATTGGCGA
+CTTCAAACAGAATCTGGAGAACGCCAGCGGGGCCACCGAGGAGCTGGGGAATACCCTGAA
+AAACACGGCCCTAGGGAAATTCCAACAACTCGAGGCCGAAATCGCTAACACCCGGCGAGA
+GATTGGGCAAAACCTGCAGCCCGCCATCGCCCTGTTCCTGGAGAACGTGGCAGGGCCGTT
+CGCCCGCTGGGTGGGGAATATCGCCGCCGGATTCCGCGCCGCTTCCGTATCGGTGCGGGA
+CTACCGCCAGGAGATCGAGGCTGTTCGGAACGGCACCGCGCCGATTAACACCCAAACTCG
+CCTACTGCGCGAGGCCGTGCAGCAGCTCGAAAAAACCACCAGTAAAGAAGGGCAGCCGCT
+AAAGGTTGGACCGATCACGGTAGGGCGCTTTTTCGTGACTGGCTCGCTCGAGGGCGACCT
+AAAGCTGCTCGAGGAACAGCGCAAAAGACTGCAGGAAGCCGAAGCGAAACTGCAAGCGGC
+TAACGCCAAAACGCCGCCCCCGCGTAAGGAGCCCCCGCCGTCCCCAAAACCGCTCGCCAT
+TCCCGACGAAGACCCGGTGATCAGGCAGGCCAGAGAGCTGCAGGACCAGCTAAAGATTCT
+CCAGTATCGCTACACCCTGGGCCGACTTTCCGCTGAGCAATACCGCGCCGAGTTAGAGAA
+GCTGCAACGCCAGCTGCAGGCTCTGGAGAAGGCGGCCACCACCACCGAGCGCAAATCTGC
+GGTGCTGGGCGGGCTAACTGACATTAGGAAGACCCTTGAGGATATTTCCAGGTCAGATTT
+TGAAACTCGCATAAAGGCCCTCAGCGACGAACTCGAGCGGCAGAAAAGGCTTTTTGCCGA
+TACCCGTGATATCAACCAGTATGCGGGCGCGTTGGCGAGCGTGGAGAAAAAAGCTCAAAC
+TCTGGGCAAAACCGCCACCACGGAGCAGGCCAAAAAAAGCGTCCGCGAACTGCTCGACCA
+GATCGCCACAGGCCGGAAGGAGTTGCAAAAAACCCTCGAGGAAGGCGGCACCCAAGCGGC
+AGAAGTTCTCTCGGAGCAGGCCCGAGCTCGCCTGCAAGCCATCTATGGCGATGGGATACA
+AGCCACCATCGCCGCCGTGCGCCGCAGCTATCCCGACTTCAAGAGCGCGTTTGAAGACCT
+GCTCAAAGACGGCTTGAAGTTTGACGATGCCCAAATGCTGGCCGCCCTGGCATTCCCCTC
+TAGCTTTTTGGAAGGGCTGGCAGAGACCTGGGGGGAGGGGCTCAGCACCGCCGCCCAGCG
+GGCCGGGGAACGGGCCCTGGATGAGTTTTACCAGATCCCTGAGCGGCTGCAGAAACAGAC
+CGATGCGGTGCTGCTCCGGCTGCGGGTGAGCGAGATGAGCCCTGAGGAGCTGTTGGGGCT
+CTCGCCGCAACTGCTGGAAAAGTATGTCAAGGAACTCGAGCAGTACGGGATAGACGCGGA
+AAACGAGATCGACCGGCTCAGGACGGCCATCGCCACCCTCACCGCTGATCCCGCCGTAAT
+TGAGCGGGCCATACGGGAGAGTGCTGAGTACGGCGACGAGATTGTAAAAACCGGGCGCAA
+GGTGGCCGACGGCACCGACTACGCCCGCACCGGGCTGGATGAGTTCAGGAAGTCTCTGGA
+GGCCCTGGCCGCCGCGGCGGGCACCCCGCTAGCGGCCATCCAGCAGCTAGCCGTGCTCGA
+GGGGAACCTCAAGGACGCGCTGGCCCTGGGATTCAGCTCTCCCCAGGAAGCCGAGCGGGC
+TCAAGCCCAGCTCGAGGTCCTCTCCGGCTTGCTCGACAAGCTTAGCAATTCTCTGCGAGT
+CACCGAGGCTCCCCTCGACCGCTTCGTTCGCAAGCAGGGGGAGGTACGGGACGGCTTGCA
+GGTGACCATCGAGGGATTCACCTACTACCTCGACACCCTCGAGCAGTTCGCGGCCCTCGC
+AAGCAATCTCCCCGATGATGCGCTCATCGGGCTATTTAGCGGCCTCGAGGCTGAGGCCGA
+GCGGGGCAACGAGCAAGCTAGGGCGCTACTCGAAACGCTGCGGCAGATCATCCTGGCTAG
+GGGCCAGGCGTTTGGCGAGGCCCCCAACCTGGGGGCCACCGATTATCGCAAGCTCGAGCG
+CGAGGGTTACGGCATGGATCAGGGCCGTGAGGCGTTCGAGAAAGACCGCCAGAAACGAGA
+AGATGATGCTCAAAAACAGCTTGAGCAATTCGAGGCCCAGCTCACCGATATCGCGCTATC
+CTTTCCCAAAGCCCTGGTAAGCGGGATTCTCTCCGGGGACGTGGCGGGGGCCCTAAAGCA
+AGCGCTGGGCTCGGCCACCGACTTCTTCCTCAACAAGATGCTGGAAGCCATCCTGGGGCC
+CATAGCCGAAGAGTTCTCCAAAGTCATCGCCAAGCAGGGACTAGGGGCGGCGCTGGGCGG
+CTCATCCATTCTAGGGGCATTAGGGCCCATCGGGCTGGCGGTGGGGGCCGGGCTGCTGCT
+CTTCGACTTCCTCTTCAACAAACCCCAGCCCGCATCAGAAAAAGCCGCCGCTGAACGCTC
+GAGCTTGCAATCCTCAACCCCCTCCATCACCTACAACGTCGAGGCCGTCCTGAACGCCAC
+GCTGCAGGGGGATCTCAAAGACCCGGCGACTCGGGCCGAGTTGCGCGGCCTGATGCGCCA
+GGTGGCGCTAGATGTGCTCAAGGAGGTGCAACTCGTCAAATGAGCAGCTACACGCCGATT
+ACCATTACCCCGCTCAATCCAGCAGGCCCTGCCGTGATTCTGCCCATGCCGGAGTCGGTG
+GAGAGCACTGCCAACACTGTTACCTTCGAGTTTCTCGATCCTATGGACGCGTCGGGGCAG
+CCGGTAGATCTGCCAACACTGGCGGCGCCGGCGCTCACTGGATCACCTGAGCGCATACAG
+CACGACATCCGCCGGGACGGCAAACGTCAGGTGCAATCTGATCCTCCCGCTCGATTGGTT
+GGAGTGCAATGGGCGGAAATTGAGCATTACAGCGCTGTTCAGCGCAGTTATACAGCGATT
+GGCGCGCTTGTGCTGGCGGCCAAACGCTACAACAAAAGCGCCAGCGAGGGCGCCAGTATC
+AGCCTAATCCTCTACCGGGCGGACGCTATCTGGACGGCTGAGGGGGTGCTGGAGCTATGA
+ATCTCGGAACTTCGCCGCTCTTGCCGCCTCGAGTACGCCGCTACCCGATGGACATGAGCA
+ATTTCGAACTTCCCAACGTCAAACGCTGGTGGACGCTGGAGGATTACGCTAAGGTGGGGC
+TGTTTGGGGCATATTTTCACTCTGGCGCGGGGGAGATTCGCGCACAGGCGTTTTGGGGGT
+TGTTCCGCTCCGACCCCAAACCTTATGCTTTTCATCTCACCGATCCGGTCACTCTTTTCC
+CGTATACCTTGGGATCAAACCCGGACATCCGTGTTACCAAGGGCCAGGTTCCCAGCCCTT
+TGGGGGGGAACGAAAGCTATTTTGCTGTACTGGCAACCCCGCCGTTTGGCGGCAGCGGTT
+ATGTGGTCGGGCTGGTGAGAGAACCGGTGAGCTATGTTCCGACGGAGAACTACCGGATAG
+GGCCGAACATCGCGCGAACCAGCCCGCCCAAAACCGGAGTTATTACCCCTATCGGGTTCA
+ACGATGCCCAGACTCATTTGCTGGTTGCTGTGCCGATAGATGACCGAATCCTCGTAGAGC
+GCCTAGAGTTGATACGGGATCCGAATACTCAAGAGCTAACGGGGATGCAGGCTGTGGGAT
+ATACCGAGTGGATACACGGGTATACGGCAGGGTCGGTTTACCTGCGCCAAAACTACGCTG
+CTGGCCTGGGAGGAATCATGACGACGCTTGCCGGGGAATTGGTGGCGTTTGTAATCAACC
+TCGACAGCGACGGCAACGTTATTAGCGGGCTTTCTGGTTTGGTCAATGTAAAATCCCCGT
+TCAATAACAATGCCGTTCATAGCTGGAACGCGGATGACGGCACGCTGATATTTTCCCAGG
+CGGGTTCTACATATGTAGGGCGGGCGTTCCAAACCGCTGTTTACGACGTCATTGACGTTT
+TGCAGCCTTACGATCCCCACAACAATCGTTATTTGTTGGAATCCGCCTCCATACCGTGGC
+TGCCATTGGTAGGGGCCGGGCCACAAACCCTGGCTCAGCGCTATTACTTTGATAAAAATA
+GCTGGGCGTATTTTGGCATGCTCAGCATGTTGCCGCCTGCCAGCTTGGGGTGAGTATGCC
+ACTGCCCCGCAACGATCCAAATCACACTAGCGACAAAGCGCTGTACATCCTGGACGGTAT
+TCTCCTTCCAGGAAACGGATTACTGCCCATCTGGCGGGGGAACCGGCTGGATCTCTACAA
+CGGCTCGCTGTTCGGGGTAGACAACCAAGCGCTGCTGGGGGGCCCGAACTACTGTCTTGC
+GTTCGACCTGCACCGCTCTGAGCTACGATTGTACGAGTTTGACCTCAACCTGCCGCCTGA
+CCTGATCGCTGATCCGGTGCGCCTGCAGCTCGAGGAATCCCTCACCGGTCCGGTGGTGGA
+CGCCAGCATCAGCTTTACCCTGTTCAACCGCGGCCAGCTCAACGTGGATGCGACGTATAG
+CATCGGGTCGCGGCTCGAGCCCTACACCTCGCTGTACCGGTTTTTTATCAACACCATAGA
+CCCCAACCGGGGCCTGGTGGACTATACCGGGGAGACCTATCTGCGCCGCCTGGACCGCAT
+TCCCGCAACCCGCCAGGTCCTGCTGCCGCCCAATGGAGGGCCATACACGCCCAAACAATG
+CTTGCAAGCCATTCTCGACACCTACGGCGTAAACTATGCCCCACTGCCGGAATTGCGGCT
+GCTTGGAGCCGAGGGGCCATTCGTCATCGACACCCCCGGATATGCGTACTTCCCCCCCAA
+AGCGGAGGATAAAACTGAGCCCCCGTCGCTCCTCGAGTTGATCCAGCGGGCCGTCGCTCC
+GTTTGAGGGTTACTATTTACGGATCAACCCGTTCACCAATAGTTTGATGCTGGTGCCACC
+CCCCTGGGCTCCCGAAGCCACCGCGGGGCCTACGCTGGCGAACGCCGATGTTTTGGAAAT
+AGACCCCGGCGAGATTGACCCCTCGACGGTGGTGAACCGCTGCACAGTTAAGAGCCAGGG
+ATTCAGCTTTACGGCCAGCCCGGTAGCGGTGATGGAGCCCGCCTCGTTTGGATTCCGCGG
+GTCGCTCGATCCGAGCAAAGGGGCCGATCCGCTGTTTACCGTCCTTTATCCAACCCCCGC
+AGAGCTAACCGGGAAGAAACTGAATGACGCTCCCATCGTCTACGGCAAAGAGACCCGGCG
+CGGGACGCTGGCCATCTGGCCCCTGCAAGCGCAAACCGTCCTGGGGGATCAAACCCTGCA
+AGTGAACTGGGTACTAACTACCTGGATTTACGAAGCGGGAACCGGCCAGTACGGGGGGAC
+TACCGGCTACCCCAAGAGCGGCAGCAAAACCATCCCCCTGGACGGCTCGAGCGTCGAGCT
+ATTCAAAGAGAGTGTGCAACTAGGGGCCCCGCTTTCCTACGGCCACGTTTGGGTTTACGC
+GGCGTGGGATGCCCAAGCCCAGGGGGTGCGCCTGGACTATGACCTTTACTTGTATTCTCA
+GAGCATCGGGTTTGGCGGGTCGGGGATTATAGTCTATGGCGTGCGGGTGGAGCTGAACGG
+CCTGGCGCGGAAGCTGGACAAGGGCGATGTTGTTGTGGCCACCTTTGGCGAGGTTTACGA
+CTCGGCTCCAGGATTGTCTCTTAGCCAGTCGCGGTACGGGCTACGACAAAAAACTCTGGA
+CATCGATTATCAGCTCACCCCCGATCAGGCTATGGCTATAGCGCAAAATCAGGTAGAAAA
+AGGACTCAACCCCAAACAGATTTATCGGGTGCGCCAGGCGGCGAACATGCGGGTGCGACC
+TGAGCACCTGGGAAGGCGCGTGTATATCCCCCGACCGGACGGGGCTCCGGGGTTGCTGGA
+AGGGACGGTACGGGCCTGGCGCTACCTCGAGGCCCACAGCACGGGCGGGGTACAGGCGGA
+TAGCGAGTTCGAGCTGGAGGTCACCCGCAACGTCTTTGGCGACGTGACCAATTTCACCCA
+ATACGGCGAGGCCATTTACGGTCTGAGCGCGTATTTGTAAGGAGGAATCATGCCGACCTA
+TAAACCCTACACCGAGATCAGCAGCCTGCTGGGATCGGGAGGCGTCAGGCGCATCAAGGA
+GTACCACCTGGACCGCCATGCCGAGGCGCTGGCCAACCAGCTCGAGGCGCTTTGCCGCTT
+TCTGTTCTCCGCGGGCGGGATAGCCGAGGCGGGCAGCGTGACCCTTAGCGGGTTTGACCT
+CCGGGTGCAGAATCGGCTGGGCCTCACTCTGGATGCGCTAGCCCCAGTACGGGTACTCGA
+CGAGATCCTGACTCTGCCCTCCACCCCGGCGACCGGCACCAAATGCCGGGTGGTGATGGC
+AGCCATCCCTCAACTGGCGAGCCCCGCTGACAGCTACACCGACCCCACTACCGCAGAGGT
+GGTTTCCCAGCCCATGAGTGTGGGGCTGGGGGCGCTCTTGTTTGTCGAGGGGGATACCAC
+CAACTACCCGGCTATCCCCAACGGGGCCGCCCCGGTGGCGCAGTTAACCCGCACCTCTAC
+GGACTACACTCTCGATTTAATCGAGAACACCCCGCCCACCTTCCGCTGGTGAGGATTGAA
+ATCGCTGGAGCGTGCTAAACTGAACGTAGACACCCCTTTCAGGGGAAGCGGCCCCTAAGC
+CGCACCTGAAAGGGGGTTTTGTTTGCGGATCGTTTTGGACCCCGGACACGGCAATTTCCC
+TGGGCCCGGCTACGACCCTGGGGTGGTAGGCCCCCCGCCGTTACGGCGCCACGAAGCGGC
+AGCGGCGCTCGAGCAGGCCCTCTCCTGCCGGATGCTGCTCGAGCAGGCGGGGCACGACGT
+GTATCTCACCCGCAACGGGCAGGGTATCTCGGGCAAGCCGGACTTGGCCTGGCGGGTGCG
+CTTTGCGGCCAATCTGCGGGCCGATCTATTCGTGAGTATCCACTTCAACATGATCGGCGG
+GGGTGGGCTGGTCTACCACGCGCCGGGGGCTGCTTCGGAGCGCTTCGCCAGGGGGCTGGC
+CCGGAGGGCCGGGCTCTCGAGGGTGTGGCCCTCGAGCGATTCGCGCTTTGGCGGGCTCTA
+CATAGACGCCTTCCCGGACGCCCGCCCGGCCGTGCTGTGGGAAGTGGACGGCATCGAGCG
+CGCGCCGCTGCCGGGGGCGCTAGGGCGGGGCGCCAGACTCCGGCTGGCAGCGGTGCTAGT
+CCAGGCAGTGAAGGACTTATAAGGGGGAAACCATGCAGTTTAGCGGAATCTTTTTAGAGT
+TAATCAAAATCGCAGCGGAGCTGGCCGACCTCGACGAGCCGGGGGAAAAGAAGCTGGCCG
+ATCTAACCGAGCGGTGCGTGAGCTTGCTCGAGGTGGCCGATGACGCGGCAGTGTCGTTGT
+TGCCGCCTGGATTTCGGGACATCGCGCGATGGCTCATTGACAATCCCGGAGTGGACTCGT
+GGGAGCGGGAAATATCCAAATCCATCGCAGAAGCTGCCTACCAAGCCTGGAAAGCGCTGC
+GGGAGCTATTGGGCAAGGATCAGGCCAAAGCGGTGCTGGGGTAGGTATGCGCGCAAAGTT
+AGCGTTGGCGGCGCTGTTAGCAGTGGGGCTGACCCAATCCGCCAATCCCCCTAAGTCTGT
+ACAGCTTGAATGCCCGGCGGAAGTGAACGGCCCCATCGTAGAGTGCAAACTCACAGTGAC
+GGGGCTGCCGCTGGGATCCAGCGCCGTCAAGGCGATTTTGTACCCGGCGGACAAGACCTC
+GACGGTGAGCCGCCAGGTGCGGGTCAACCGGGTGGCCGCCAATGTTGCCGCACAACCGAC
+GCTGCTTAGTAGCTACTGGCACCGCAAGATCCTGAGTTCTGGCACTGAAGGAGCTCCTGG
+AGTAGATCAGACTGAGATCCGCGACATGCGCTACCTGCCGCGTCAGCTAGTGGCGGGGAC
+ACTGGCCGAGTGGGAAAACGGATTGCCGCAGAACTTCTACGTCAGCCAGGTACCTCCCGA
+ATACCAGGGAGCCGACTTGCTGGTAACCCGCAACTATGGCACCTATGGCAGCGCTGGGTA
+TGCCAACACCTGCTGGACCCGCTTCACCCTGAACCGTTCGGCAAAGGTGATCTTGTTGAT
+GTTCTCAGAGCGTCCAGCTTGGGTGGACGATACCTGGACCGTTGGCCCTGCGGTGGGATA
+CGGCAGGAAAGGGAGCGACAATGTGCTTTCCACCACCGAAACGGCAGACAGCTATTTCAA
+AGTATTTCGGGAGGGGAGTCACTGCCTGCCGGGTCAGGGCGCACCGGGACGCATTTATCA
+AATCGCTTTCATGGAAGCGGATGGCTCGCCCAGCAAGCCCCCAGCGGTTCCGGCAGGATT
+GCCTGTTCCCCAGCCCAACACCTACTGCCCGCAATGGGTGCATGACCAGTACAAAGACTG
+GCATCCCCAGATTGATCCGGTCTACTGGTGTTATTTCGGCCACGAACACGGCTCTGATCC
+TGCACAATTCCCAAAAATCAAGGCGCTCCTAGATTCGGGAGCGATCAATTTGACCTTCGG
+GCGCGTGGAACAAGCCGGCAACGCCACCCCGATGTGCGTCTCCTGCCATCAACAAAAGCT
+CGGGCGAAGCAGGGTTGAGGCCCCCCGGGAATCCTACAAGCTGTTCGCCCTAGACGACCG
+GCAGGGTCATTTGTGGCTGATAAAGTTCGAGCTCTCCTCGCACAACCGAGCCCGGCTCTG
+CCAGCGTCATCACGAGTATGGAATCTGGGCAGTAGATTCCAATACCGGAGAGCTATTGGC
+GGCGCTGCAGTTCGCGAGCGACTTTGGCCCGGCCCTCAACGCCAGCGTGGGCAACAACAC
+TCGTTATAAACCTGATCTCTGCCCAGAAAACGTAGACATACCCATGAACAACGATCAAGG
+CCGTCACCGCATCCCCTTGATCAGCGCTGCTGGGTACGAAAACTGGACTCCCCACTTTCC
+GCCCCAGCTAGGGTTCTATGGTTACGGACGGAGCTACAACCTGGATAACCCCATGACCCG
+TTGCTCGGACGAAGTGGATGCAGATGGATTCTACACCTGCAACCAGGCGGTGCGGGCGCT
+GGATCCCAACAACTACAACTGGGGCGACAACCGCTGGTTCATCATCCCCGGCGGGGATCA
+ACCGGACGGGGGGTTCGGTATCCGGGCTTCCACGGCCATCGCCAGCGGTACTTTCTGCAC
+CGACGTGCTGGGAACCACCCTACGGGACTGCACTGCTCCCGATGCCGTGCAACAGTACAT
+CAAACCCGGACTGGACATTCTGCACAAGGATCAGTTCCGCTGGATTCCCTACGACCCCTG
+GTGGGTGGAGTACAAACCCGTACCCAGCGGATTCGTGAACTTCGACACGCACAACCTCGA
+GGGAGCCCTGAGAGCGCCTAACTAAGGGAGACATGTTCGCAGACACGAGCACCTACGATT
+TTCGAGTCATCCGGGGCGATACCTGGGAGTCCCCCATTTGGCTTGAGGACCCACACGGAT
+TGGAGGACCTCTCCGGGGCAACGGCCCGCCTGCAAGTGCGGGATGCGGCCAAAGCGCTCA
+TCCTGGAGGCCAGCACGGCCAACGGGCGGATTCAGCTACCCGGCCCGGTGGTGCTCGCCC
+AGGACGCTCCGGCGGGGAGCCGGACTCTTCAGGTGCTCCCGCTGCCCGGCCCCCTGCTGG
+GGAACTACCAGGCTCGGCAGACGCTGCGCTTTGCGGGGCTGCCGGTGCGGCTCGCTGCGG
+ACGCGCAAGAGGGGGATACCGCGCTACAGATCGAGCCGTTGGCGGCTCCCCTCAACGCCG
+GGAGCCAAGCGCCGATGGGACTGGTGCTAATCCGAATAGAGGCCAGCGCGATGGACCTCC
+CTCCGGGAGAGTACGCATACGACCTCGAGATTTCCTGGCCGGGTCCCCCAACCACGGTCG
+AAACCCCCTTGCGGGGCAGGCTACTGGTCATAGAGGACATCAGCCATGTCTAGGGTGGTC
+GCGATCGAACCCCAACGGCGGGTGTACGCGGTTGAGCAGGGAGTGCGGATGGTGGCAGTG
+GGGGTGCGCCCGCCCCGAATTGCAGTCTCAGGCGGGAGCGGCGGGGCCACCTACGAGCAC
+TTGCAAAGCAGCCCGGCCAGCGTGTGGACGGTCAACCACAACCTGGGGTTTTACCCCGAC
+GTGCACGTCTACACCCTGGGAAACCTGGAGATCCTGGCCGAAGTGCAGCACGTCTCAGTC
+AACCAAACGCTGGTTTACTTCGTCGCGCCTACCGCAGGGCGGGCGCGCTGTAGCTAGGGA
+GGGAATATGTCAAAGATCGTCGGCAGCAACCTGGACTTCAACAACGTCGCCAAAATCGTC
+AATCTGCCCAATCCCACGGCGCCCCAGGACGCAGCTACCAAAGCCTATGTGGATAGCGCG
+GTGGAGGGGCTGGCCTGGAAGGACTCGTGCCGCGTCGCAACGCAGGGCAACATCAACCTT
+GCGTCTCCAGGATCGACCATCGACGGCATCACGATGGCCGCCGGAGATCGCGTACTGGTG
+CGCGCCCAGACGACTGCCGCCGAAAACGGCATCTACATCTGGAACGGCGCGGCTGTCGCG
+ATGACGCGCGCCCCTGACGCCAACACCGCCGCCGAACTCGAGCAGGCCGTGACCACCGTC
+GAAGAAGGCACCAGCGCGGGGGCCACCTTCCGCCAAACCTCGGTGAATTTTGTTCTGGAT
+ACTGACCCGGTAAGCTGGACCCTCTTCGGTACCGCCGCTCCCAGCGCGTCGGAAACCCAG
+CAGGGCATCATCCAGATCGCCACCCAGGCCCAGACCGACGCGGGTACCGATGATTCGAAG
+GCCATCACGCCGCTCAAGCTGGCCAACTGGGCCGGGCGTAAACGTAAACTCTCCCAAGCG
+ATAGGGGACGGCAGCGCCACCCAGTACAACGTGACCCACAACTTTGGCACCCGTGATGTG
+CTGGTCACGGTGTACCGCAATGCGACCCCGTGGGACGATGTGCTCTGTGACGTCGAGCGC
+CCCGATGCTAACACGGTGCGGGTGCGATTCGCCGCTGCCCCCAGCGCGAACCAGTTTGTG
+GTGGTGGTGATCGGCTAGTGGAGCAGTACAGCCCGCTCAAAATCTTGTCTCTATCCGCGC
+TCCCTGCCGCCTCGGACTACGCCGGTGCGCTGGTTCGGGTGGGGGGCAGCCTCTACTGGT
+CGGACGGCGCCAACTGGCAGCAGCTAGCCCCGGCGGGCGGGGGGGGATTCAGCGGCGTGC
+GCCTTACTGCAGCTAATTTCAGCGTGGCGAATGATACCTGGACCCTGGTTTCGTGGGCCA
+CCCAGGTTTTCGACCTCGGAAACTACTGGGCCTCCACTCAACCCACCCGGCTCACCATCC
+CTAGTACCGGCTACTACCTGATCATCGCTTCCGCCGAGTGGGACCCTGACAGCGGTTCCC
+GCGGCATTCGACTCAAGATCAATGGTGCGACTGTCTATGACTTGGTGATAGACGATACCG
+GGCGGGCGCAACCCAGACGAAACAACGGCAGCATCTTGCTGGCTTTGACAGGGAGCGATT
+ATTTGGAGGTGGAACTCTATCACAACAGCGGCGACCCCACTGAAAACGTCATCCAAGCCG
+AAGTCGGCGCAGTCAGGATGGGATAGCGACTGGAGGCAATGTGGGCAACTGGCAAATCGG
+GCTCGTCGTGTTGGCATCGGTAGTAATCGCGTTCGTGCTGCTGTGGGACTCGTTGTCCAA
+ATCCCGCGATATCCCCCAGGGCTGGCTGTGGCTCATCGCGTTGGTGTGGGGGTCGGTGCT
+GGGGGTGAGCGACTTAATACGGCGGTTCTCGGAGCAGAAGAAAAACAAGGGAAAGGAGGA
+CAACAGCGATGATTGA
+>NC_014212.1|provirus_1746722_1764354
+TCATATGGCTTTATGATAAAAGCCTGAAGTATAGGAGTGGCGGAGGCCGTGCAAGCCGAT
+ACGGGGCAGCCCTGCCCGCTCGATCAACCGCCGAAATGCCCGCATGACGTTTCGGTAGGA
+CAGGGGGGTTCCCCGCTCTGATGGGAAGATCAAGCCGTGATCCTTCCACCTCCGGGCGGT
+GGTGCGCTCCTCGAGCTGGTAGCCCTGGTGCTGGTGTAGCAGCTCTTGCGTCGCAGGGTC
+AAGGTAGATGGGGGCGCTTGACCCCGGCGTTTTGGTAGGCCCCAGGCTGCCATCCTTTCC
+AAGAGTATGTCGGATGTATAGCCGCTCGCCCTGCCAGTCTTCCCAACGCAGGGCCATTGC
+CTCCCCTATGCGGATGCCGGTAGTGAGCATCAGATAGAACATGGGGTAAAGCCGGTGAGC
+CCTTGCGGCCTCGAGGAATGCCGCCGCCTGCTCTCGGTTCCAGGCTCGAGCGGGCCGGAC
+GACTCCCCCCGCCGGGGGGTCTACCGCCTCGATGGGGTTGGCCTCGAGCAATCCTAACCG
+CACTGCATCCCGTAGCGCCGCCCGCAAAAATTGATACAGATGGCGACGGCTCGAGGGCGA
+CAGGTCCGCTAGCTCGGCAAAGCGAGCACGGATAGCCAGCGCGGACAGCCGGGCCATAGG
+GATATTTGCCAGCGGGGCTAACATGCGCTGATACTCGGCATATTTGCGCTGCGTTGAGAG
+GCGAATATTGCGGCTTCGAACGCGCTCATCCGTCCACCGCTCGAGCCATTCTCCCAAGCG
+CAACCGGCTAGCCTGGATCACGCCATATCCCGCTTTGGGCAATAGCCGGGCAAGCCGCTC
+AGCTACCTCGCGCCGAGTTCTGCCGTACACCCAACGCTTTTGCTGCTTGCCATCCAGGCC
+ATAGCCCACCGTGACGAAGGCCGCCCAGCGCCCGTCCTTGCGCTGGAAGATGGAGCCTTC
+GCCTTTGCCACGCCGGGGCATGTTATCCTTTAGTTCAATGGCGATTGAAAATAAAAATCA
+TAATAATAACCAGCAAAATCCACAAATGCACTGGAACTTTTTTCATTACACTCAAGACCG
+GTTTACTTAACTGCCAATATCGTTTTGCAAGCAAAACAAAAGAAGGTGCGACGGAATACT
+CTAAACTAAGTTGACTTAACAAATCGGACTGACCCAAAGACGCTTTATATAAAATGGCAA
+GTTCTCTTTTCCCCCACAACTTCACTTTCGCATGCTGCGCTTGAATCTTTGCGCTCTGCG
+TAAAACCCGGACCTGTTGTGATTACAATTGCGTATTTAGCCTTCCAAACAGGCATAGCCC
+CAAGAACTGCCTGAACAGCATCATTTCCAACTTTACCCTTCCAATGCTTAACCTGAATAG
+CATAAATGCCAATCGGCGATTGAGCTATTATATCGGCTCCAAAATCATTACTTGGTGGCG
+TAGTTTTCGCCTTCCAACCAGGAATTCGATTAAACATTTCCGTTATTAAACGTTCTACAT
+CAACAGCGGAAGCATTTAAAATGCGTTGAGCATAAAACTGCTCAAAATCATTTGGGTCAT
+ACATCCGGTTTTTCACAGCTTGCCCCCAAGCGGATCATGGTAGTAGACACGGCCAATCAC
+CCGCATCTCGGATGGCCGCCACGGCCTGTACTTGGGATTGTCCGACACTAGCCACAACTC
+GCCATCGTCTAGCCGCCGCACGCGCTTTATGGTGTGTCCATCGCCGGGAATTTCGAGGAC
+ATACACCCTCCCCTCGCGCAAATCGAGGTCTGAGGGATCCACATACACCCTGTCCCCATC
+GTTGAGCGTGGGGGCCATACTATCTCCTTCAACCTGGTATAGCAAACTACCCCTGCGCCA
+CACATCCGCCAAAACCGGCATACCATCAGCATCAACGGGCCGCCCGGCGCTGGCAAGGCC
+CCGTACCAGCTCGATAAAAAAGCGCACCTTGCTGACGCGCTCGCCGGGTTGCAAGGACGT
+GGGAGATTCCAAATCTAAAAGAGGTTCTAGCCCGGTTTGTTCTTGCCAATCCGAAGCCCG
+CCAACCCAGCGCTTTCAACAAAAGAGAAAACTGCCTAACCGTAAGTGTAGAAGGGTCTTT
+TTTGCCGTTCTCGAGCCTATATATGAGAGCTTGATACAACTCTCCCCCTGTTTCGTTCTC
+GATATCCACCAAAGATTTCCCTAGCATAGCCCGCCTGGCAGCAATAGCCCGCCCCCACGC
+GGGCTTTTCTTTTTTCGTGACTTTGGGCATACAGCCAATGCTATGGTTAGCGACTAACAT
+AAGTCATTCACCCCCTGTCAACACTATGAACGCTATGACTTGACAAGTCATGAACTTTGT
+GTTCATACTTGGCATTAGCCATGAACGAAAAGTTCATAACCTCAGGGAAGGCGGCAAAGA
+TTTTAGGGGTAGCGACAAGCACGGTCACCGCTATGTGCGAGCGGGGCGAATTTTCCGGGG
+CATATAGACCCGGCAAGTGGTGGCGCATTCCGCTAGCCGAAGTGCAACGCAAGCGGCAGC
+CCCGTAAGCCGGAGGCCCCCCGTGAATAACCCCAAAATCGCCTACCGCGTGGACGAGGCG
+GCAAAGCTTTTGGACGTCCACCCCAGCACGGTTTACGAGCTGGTACGCGCCGGGTCTATC
+CCCCACAAGAGGCTAGGCCGTCGAATCATCATCCCCGCCCGGGCGCTCGAGGAGTGGATT
+AACTCCCCCGAGCCCTGGGCCAGCTACGACTACGCCCATAGGAGATAACCCCGGCTTTCG
+CCGGGGTCAGAAAGGAGTGTGTATGGATAGTGTAACACAGAAAGCACGGCTCGAAGAAGA
+GGCCATCTCCCTATATCGGGAGTACATAGAGAAACACGGTTATGATCCCGAGCGCGCTGC
+TGCGGCGGCGGCGCTGGAGGTGGCCGAGGGGCAGCAGGCCCTCGAGGCGCTGGAGGCCGG
+CAATGCTTCCTAGCCGCATCCAAATCCAACGCCTCGAGAGGGCCTTGCAAATATCGCTCC
+GCCGGGTTCATGGCGGAAATGCTGATTGCGCTGCGTTCCTTTGGGAGCTGCACGAAACGG
+ACTATTACGCCCCACAATACGCGCCCCGGCCCCATCGGGCCTGGCAGGACGCTAAACGCA
+TCATCAACGTCCTCGAGGCCCTCGAGGCCCTCGAGGCCGTCGAGCATGTGCGCATCAAAC
+CTGTTCGGGACGCCTACCGCACGGGGGAGTTCTATGCGTAACAAGCGCTTCAACTGGCTC
+GCCTTTTGGGGGGCCTTTTTCCTGGCCCTGGTGGCCTGGGGGCTGGCTTTTGGCATCCCC
+TGGGGCCTGGATTGGGCCGACCGGAGGCTGCCGTGATGATCCGCTGGCTAATTCGCGGCT
+TTGTGCTGGTGGTGGGGCGGATTGCCCTGCCCATCATCAGCCCGGAGCGGCTAGGAGGCA
+GACTATGAAATGGAGCGAACACGCACAGGAGCAAGCTAGAGCATCGCGTGATCCACGGGT
+CACCGAGGCTTTTCTGCGCATCCAGTCCCCCGGGCACCGCGCGAGGATGGTAGAGCGGCG
+CCTTGAAACGCTGGGCTATTCCGTGCTGCTCAATCAGCGCGGTCCCGAGCTGTGGATGGC
+GGAGTGCTACTACGTTCGGGGCCAGGGTAGCCGACTTTTTGCCCGCCCGGTAGCCCGACA
+GACTGGGAAAACGCGTCTGGGCGCATTATTGGCTATTTGCGGGGAGCTGGGGGTGGTGGT
+GTGACAGTATCCATTGAGGACATGATTACTGCTGTACGCCGTGAGCTGGCGCTGCGGAAA
+AACGTCTACCGCCGCCGGGTAACCGAGGGCCGCATGAAGCCCGAAGAGGCTGCCCGCGAG
+TATGCAACCATGCTGGCGGTCATGCTCACGCTCCGGGACGTGCTCGAGGGCGGGGTAGTC
+GTCGCCAAAGATGTCAAAGATGTTGAAGACTTCAGTGCGAACGCGAACCTACCCACCGAC
+CCCCGCCCCACCGACCGCCTGACCCAACTCGAGCACAAACTAGAGCTGCTCGAGCGGACC
+GTGTCCGCCCTCATCAAGGATTACGCGGAAAAAGTTCTACAGTGATGGACCTTTACCCAT
+TTGCGGGCTTAGCCGCCTGCAACCCTGGCCGCACCGCCCGATTCCGCCGGGCGGGGCTGC
+TAATCGCCCTTACCTGGACTCCCTCGAGGGAGTGGGAGGCCAAAATATGGGGACCTAACG
+GAGTAACGGCTAATCAGCTCGAGGGCATTGCTAAGGCCCTCGAGCTGGACTTTTACGCCA
+TTGAAAGCTATCTATCGGCAGACTTTCAAAGCTACGTGTACGTCATCACTGGGGGCCGCC
+ACATCGCCCCCGAGTTACAGCGTCAATATGATGAACTCATCTCCCAACGCCGCGACACCT
+TCGCGCCCATATCCTGAGTTTAGCCCCAAGCTCGAGGGCTTCCCCCGCCCAATCAGCGAC
+CGGCTGGCGTATCATCTGAGCTACGGAAACCTTAGCCTGCCCCCGGATGATCCCCGCTGG
+GGGCTTATTGATTCGTACTTATCAAGTGAGGCCTTGGCCGTCGGTTGCCAAATAGCGAAA
+TCCGCTAACGCGATATGGCATCGGCGTATTGAGGCTAGCTGGGTGGGGCCGGGCTTGTCA
+AATGCTCCATATCTCGACGCTACGTCCAGCACGCAATTTTTGGGCCTTCGGGCACGACTG
+CTGATTAACCCGGGAACCCTCAAGCTCCGCATAGGGGGGCTATTGCAATCCGGGCTAGGG
+GGGGAGAGCGTGCGGGGAATTATCCGGCGATTGAGTAAAAAAAGCCGGAGTAGGCTACTC
+GAGCTAACCCGCGAGCTGGAAGCGAGCGATATTTACCCCGAGCTAATGATTACGCTGACG
+TACCCGCGCGATTGGGAGGGGGCCATATCGCCCGAGCACGCCGAGGCTCTTTGGCAATTC
+CGCCGCGCCTGGGGCAGGATGAACGCCCACCGCTACCGACCCAAGGGGCCAGGCTGGGCC
+GAGCGCTGGGCCGAGCTGCGGGCTGAAGTCCGTGCGCGGCTTTTGCGGCTGCGCGAGGTC
+GGGCCGGATGGCAAAAAAGTAAAGGCGCACCTCGAGGCCTTCCGCAAAAGATTTGAACGC
+AAATTTGGAACATCGTGGGGGTTGATTTGGAAGTTGGAGTTCCAGCGGAGAGGGGCTCCA
+CACATCCATCTCTTTTTGTGGAACTGCAACGACATCGACCCTACGGAACTCCGGGCCTGG
+ATAGGCCGGGCCTGGGCAGAGATAGTTGCCGGATCAGACCTGAGCGCATATTTCGATCCA
+CAGAAACTAGCGCTATATGACGCCTACCGCGAGCAGGGGGGAAGAGAATTTGCCGAAGCT
+ATGCTCGAAGGCATGGGGCTAAACGCGGGCACTTGGAATCACATTAGGGCGGGAACTGGC
+GTGGAAGTAATTCGGGAAAAACATTGGGGGTATTTGGCTAAGGAGGTGCAGGGTGGGATG
+AATAAAGCGTATCAACACGATGTGCCACGCAGGTATCGCAACGTGGGCCGTTGGTGGGGA
+TACTGGCGTTATAACCGTGCCGGCTGGATTGAGCTATTTTACGATCTCGCCAGCGCTTCT
+ATGCAGGAAATCAAAGAGGCTATTGTAAAGCCGTTTGAGGCCGCCATAAAAACCCTGCCT
+AAGGCGTGTACGGATTTCAAAAAAAGAGCAAAGGCCGCACTTACCCGTTTTCTCAAAACA
+GGATCATTAGCCGCGCAAAAAGTCGATTCTGACGGCGTAGTTACCGAGGGGGCCTACGGC
+TATCTCACTGTATGGGGCCGAGCCGGAGTACAGGCCGCTATAGGGGCGCTATGAGCAGCT
+ACCGCAAACCAAAACACAAATGTCCAGCCACCGGCAAGCGCTCCTACCCCTCCCAACTCG
+CCGCCGAGAACGCCGCCATCCTCTACCGAATGCGGCTAGGCAGCGGGGGCCGTCCCTACG
+TGTGCCCGCATTGTGGATGCTGGCATCTGACCACTCAGCCCCGCCACAGCAAAGATAGGA
+TGGCAACATGCAACAAATAAGAATCCTCTTGCTGATAGCCATAGCGGCTTACTTCGCTTT
+CCAGTTTCGGGGGGCTTCCCCCACCTCGAGCCCCGCCAAAACCCCAGCCCCGACGGATAC
+CCCGCCCTGCACCAGCCACATCCTTGAAGCCGCCGCCAGCACCCGCGAGCTGCGCCTGAA
+GGTGAGCGGAACCGCCCAAACCCTCCAGGTCGGATACGACGGCGGCATGATGGTGAAAGC
+TACCGAAGAGGTGTGCAGCGGGGGAGAGTGCCGCGTCTTTACCCCCGCTGCCCCTAAAAC
+CGTTCAACTCGATGGTTGCCCGGCCATAAACCTGCCCTAATCGCAATACTATTGATGTAT
+ACTGTTACTAATGGAAAGCGAACTAACTAGACGTCCAGGAAGACAACTCACTATGGGCCT
+CTTACGCAAGCGGGACCGGCTGGATATCCGCCAACTTCCGCTTTCTGACCTGCTCTATAC
+CCTCTGGGGCGACCGCACCGCCGCTATCAGCGTTGCCGAATATGCCGGGGGCGACCTGCG
+CAACCTGCAAGGCAAAAGCGCCATGGAACTGCTCGAGCTGCCCGGAGTGGGGGAGGGGAG
+GGTTGCCAAAGTCATCGCCCTGTTTGAAATCATCCGGCGGGTGGTACAGCGGTGAAACTA
+CGCTCCAGCCTGGCAATTCAAGACAAAATCCGACAAAAACACCAAGTCCGGCTTTACGAA
+GTCGCAGAAGCGATCCGTGATCCTCGCCGGTATACCCGCAGGGTCGAGATCGAAGCCGAG
+GGAACGGTTTACATCATTGTGGGGAAAACCAAATCGGGGCGATTGCTGCGGGTAGTATAC
+ATTGCCAAAAAAAATGGCAACTGGTTGAAAACCGCCCTGGATGCCTACCCACGCGACCGA
+AAGATGTACAATAGAAAGTAGCCATGGCGAAGCTCAAGGTACCCAAGTTCAAAAGCCTGG
+ATGAAGAAATGAACTTCTACGCCAACATTGACCTATACGCCGAGGCCCGCGAATTGAGCC
+CCGATGAGGAAAAAGCCTTGGATAAAAGCCTTGGCATCCGGCGTAAACCTCACCCCGCCG
+CTCGAAAGCTCGCGTTGCACCTAAGCAAAACCTCGGGCGGGGATTGACGCCCACCGCTAC
+GTAAACCTGGCAGGGCTCACCTTAGCCCTGCCATAGCTTTTTTGCGCCGGGGCTGAAACG
+CTATCGGTATGGCGGAATTCCGGCGTATCCAGATAAATGCAAACACGCCGCTAACCCCAG
+GCTTTTACGAGTTCGTGGGTGAGGTAGAAGGTAGCCCAGAGCGGGCCACCAAAAGCGACA
+TCCAAAGCTACCTGCGCGGGGCTACCCGGCTGCCCGACCTGGAAGTTCTGGACTGGGCCA
+GGGTCAGCGGGAACACCTGGCGGGTGCTGGTGCAGGTCAAGACCATCCCTAAAACTCAAG
+CTCAAAACGACGGCATGGTGCATACCGCCGTAGCTCCGGTGGTGGTGTGGGTGGTGGGGA
+TCATCGTCACCGCGTTGCTGGTCGGCTACGGCATCTTCAAGTTCAACCAAACCAAGCTCG
+AGATGTTCCAGCTCATCCCCGAGCCCGATCGGAAAAGCGTCGCCATCGCCCAGTCGCTTA
+ACTTCGGCCTGATTGCGGTGGCAGGGCTGGCAGTACTGTTTTTGGTGCTGCGCAAATGAA
+ACGTAAAGAATTGCGGCTCGAGCTGCCCAGCCTGGATTTACCCCCGGCAGAACCCCCCGC
+TGCCGAACCCACCCCCATCCCGCCCGGCGAGCTGGACCCCTTGCTAAAAACGGCGGTGGA
+CTCGCAGCCGGAGGTTAAACCGGCCCCCCAGCCCACCCCCGAACCCCAACCCACGCCCAA
+ACCCAACCCTGCGCCCCAACCTCCATTGCCCCGCAAAGGCTACGGCCCCCTCATCGTAGG
+AGGGGTGGCTTTGTTGATCGGTTTGAGCGCCGCATTGCTCGGAGGCAAACCCAGTGGAAA
+CGGAACCCCTCAACCCCGACCCAACCCCCCCCAACCCCCCAGCCGAAACGATTGGGCCTG
+ACCTCGAGCCCCCCTCGCCGGAAATTCCCGAAGTGGAAAACCTGGAGGGGCTCGAGGCCG
+AACCCGACTCCTCGCCCCCGCCTCCCGCCCGCATCCCCTTCCGAGGAGCCGAGCTGGCCG
+CCTTCGCAGGCATCCTCGGTATGGCGCTGGCCCGGCCCAAAAGCATGGGAGAAGTCAGCG
+TCTTTGGCGAAGCATTCCATGGGCCTATTCGGCTTTCGCTGCCCGCCATGGGCCTGGACT
+TTTCCACCTCGGTAGCCGAAGCCCTGGACTCGCTGCGGGTAGGGGAGGCCCTGGCCGCCT
+TCGGCATCTACAAGCCGGGCGGTTGGGGCGGGGATTTAGGCGAACTGCCGCCGCTCTTAC
+GGCTAGCCCTGGGCGTCGCAGTAGTCGGGTACGCCGGATTTGGAGGGATTCGTGCTGTTC
+AAGAATATCGAGCTGCGCAAGCTGCCCAAATGGGCACTCCCGGCAGCGGCCCTAATCGGG
+TTCCTAGTGCTGATGATGCGAACTAACCCCAAACCCAAAGGGGCCAGGCCATCGGGGCGT
+TACTTTTACCCCATGAATCCCTTTGTGCTGCCCCCCACCACCGGTTGGATGGATACCGAA
+TACCACGACTACGGAGTGCGCGACCACCGGGGAAGCGGCTACCTGGTGCGCCCTGGGTAC
+TGGCATCCGGCGGTAGACCTCAACAACCCCGGCGGGGGGGATAGCGACTGTGGGCAAAGC
+GTTCACGCCATCACCGACGGGGTGGTGATCGTAGCCGGGTGGGCTCCGGTGATCGGGGAA
+CGGGCGGTGATATGGCACGAAGGGCCGGGAGTGTGGTCGGTGTACTGGCATCTGCGCAAC
+CTCGAGGTCAAACCCGGTAGCGTGGTTATGGCCGGGCAAAAAATTGCCGAAGTGGGGCGA
+ATGGCATCCGGCGGGTTCTGCCACCTGCACTTCGGCGTGTACTACGCTCAACCCCCAAGC
+TGGGACTACTTTCCCAACGAACTGAACGTGCCCAAAGAAAAAAGCGTATGGCTCAAGTAC
+TCGGTGGACCCGCTGCAATTCCTGAACAAAAACAAAGCCCAGCTACCGCCTAAATGGGAG
+CGTGACTAATATGGAAAAAGCCCTCAAGCTGGTCAAAGAAAACCCCCTGGCTCTGGCCGC
+CCTGGCCTATGGCCTCTACTCGGGCCTGGGCCGCCTCAAGAACCTCCGCGAGCAGCAAGG
+CTGCCCCAAGTGCGAAACCGCCCAAATGTATTTGGGCTTCGGGCTGGCGGCTTTCGCGGC
+CTATACCCTGTGGCAGGACTACCGGGCATAGTGAACCGCTCCGCTTTGCGCATCATCATC
+TCTGGGAAAACCCGCTCCGGGAAGACCACTCGAGCCCGCGACCTGATCCGCGCCCTGCGC
+CGCAAAGCCCGGCGGGTGGTGGTGGTGAACTTCAAGCCCGAGCTATGGGAATACGCCCAA
+GGGCGCTATACCGTAGACGACGCGGGGAAGAGCGCCGCCCTGGTGGGAACCGCGCTGAAA
+AAACACCGCGATGTGTGGTTTTACCTGCGGGCTCCCCGCCGCCAAGAATTCATGGATGCC
+CTGGCCTGGCACATTTTGCAAGAAAACGACCTGCTACTGGTCTGCGATGAAGCCCACCTG
+GCCTGGCAACGGGGCCAGCTCAGCGAAAATCAGGTGCGCGTCTTTACCCAGGGGGCCGGG
+CAGGGGATCAATACCCTGCTCATCTCGCAAACCCTGGTGTCCCAGGCCGGAAACATTGAC
+CCTTTGCTGGTCAAACAATCCAGCCACCTGGTGTCTTTTCAGCTCACCGAAAAAAACGAA
+GTAGACCGGCTCAGCGAGTACATCCCCGAACTGGGCGAAAACGTCCGGCGGTTAGCCAAA
+GCGAACCTGCCCACCCCCGGCGCGCCCGGAGAGTACGTGGTTAAATCCTTCGACACCGGA
+GAGGCCGGAGTAGCCGCGCGTTCGCCCAGCGATCCAAAACGGCTGCTTTGGATTCCCCTT
+ACGCACGACAACAGCACCGGAGTTTATCGCTTTCTGCACGGCGACTAGGCAGGGCTCACC
+TGAGCCGCGCCGTTGACACCGAGGTAAAAACGCCTCCAAGCTCGAGCTATGGCAGATCGA
+GCCCTTCCGCAAATCGACACCAACCCCTTGCAGGTGGTGCAAGACCCACGGGTGGTTTCC
+GGGGCCATGGGAGTCCTGGGGGCCAACCTACTGCGAAAAGCCCTCTTTACCCAGCAGCGC
+AGCGTGTTTGGGTACGCCGCCAAAGGCAGCGATGGCCGCATTCGCTATTACGAGAACGCC
+GATGAAGCCAAAAAGGGCGACGCCGGGAAGCAGATAGCCAGCGCCTACCAAAGACGCATC
+TTTCTGCACCTCGGCTACGTACTCTTTGGAACGCTGGCTATGAGCTACGGAAAGGAAGCC
+CGCAAAGACGATGTGCTCTCGAGCACCGATGACACCACGCTGATGGTCAAATACGCCGGT
+TTGGGCTTCGCCGCCTCCGGCTTCGCCAACCTGGTAATGACCCTCTTCAACATCGAGTAA
+AGGAGTGATATGAACCCTAGCGCAGGACGCCCCACGGAAATCATCATCAACGACCCTAAC
+GCCTCTTTTTTTGCCGGCCCCCAACGGCTTCGGCTGTGGGAGTATCTCGTACCGGTAGGG
+GTAGAGTTGAAAATTCAAAACCCCTTCCGCCTCATCGCCAAGCTGTACGGGGCCGGAAAC
+GTGCAAATCCCGGCCTCATCCAAACTGTACCTGGCCCGCATCCGCCGGGGAGATTTCGAG
+ATTGAGGACCTGGCCGAGATTCCCTATGCCCCCTACTTCTCTCTCACCATTGACCAGCAG
+CTCGACGCCAACTTTGCCGAGCGGATCACCCACGTGATTGAAAACACCGGGCGCATGGGC
+TACGCCTTCGATGAAGGCGACCGGCTAGCCATCCTCATTGAAAGCACCCTCGCGGTGGAC
+ACCACCAACCCTAACAACCGCATCCAGTTCACCGGTCTGGTGAACAACTAAGGAACGCCA
+TGGGACTCATTGACTCGCTCACCAACCCCCTAGCCGCCGTCGGGGCCGGGGTGAGTAGAA
+TCGCCTCCGTTTTCCGCGACGCGCCCGAAGCAGGCCCTACCCCTACCCCGGCTGCCGCCC
+CCGCTGCCCCCGCGCCTGCCGCCCTGGCAACAACGCCTTGGCGGCAACAGTACATTGACG
+CAAACGACTTTCAAGCCGGGGAAACCTGGCGTAGCGGCGACTATATCCGTCTGGCCCAAT
+TTCTGCTACCAGAAGGCACCGAATGGCGCCTGGAACGAGGCCGCCCTTACGGCTTTTATG
+TGAAGGCGGTGCAGGACCTAGCCGGGCAAAACCTGGGAGCCCCCGCCGCGCGAAACGTGG
+TCATCAACGACTTACAAAAGAGCACCCAAGCCGGCCAGGCTACTCTACCCGCCACCTACC
+ACCCCGATGTAGCGGTGTGGGCTACCACCGGCAGCGGGCGGGTCAAATGCACCATCACCA
+ACGTTGACTACACCACCAAAACCATCACCTTCACCGAACCCGCGGGGGTCAACGGGGCCA
+GCGCCATCCAGGTGTACTACCTCTCCAACGACGGGGATTGGCGCATCCGGGTCGCCCGTG
+AGCTAGGGGTAGATACCAGCATCGTGGCGATCCTCAATGACTCCTTCGCCGTCGCCCACG
+CGGTGGACCAGCTCAACCGGCGCACCGCTCGCTACTGGCCGCAAGATACCGTGCTGGTGC
+AAAAACAACGGCTGGTGCTGGAAGTGCGCACCACGGTGAAAATGGTCTGGACCCCGGAAG
+CTGAAAACATCCTCAACTTCTATGCCTGGATGCGCCAACTCAAGGTGCTCGACGATCAAC
+GCCTGGGCCGGGTAGCGGAAGGTGTGCAGCGCAGGGGGTTCTGATGAATCCGCTCGACTC
+CATCATCAAAGGCGTCCTGGGGGTCTTTGATCAGGTCTACTACTCGGATGAGGAAAAAGC
+CCGCGACCAGCAGCAAAAAGAGCTTGCCGAGGAAAAACTGCGCCTCGAGGCCGAACTACG
+CAAACAGCGCGAACAAACAGCGCAAAACGTAGCTATCGGTGCAGGGGTGGTGGCCCTGGT
+AGGCATCATCACTTGGGGCGTGGTCGCATCTAAAAAAGCTGCGTAGGGTGGGTAGCCATG
+GCTGATAACGTCGGAACCACCATCGCCATCACCGCAGTCGGGCTAGCGGGGGTCGCCGCC
+GCTTTTGTGATCGTGGACCGGTTGACCAAGGCCCAGCAGCCCTTCCAGAATCCAGGCCAA
+CTGCCCGCGCAAAACCCCGGCAATACGCCCGCCCCAAACCCTGGCAATACGCCCGCCCCG
+AACCCCGGCGGCTCTGCTCCCCCTGCCAACCCCGGCACTCCGGGGACCGGCGGCAGCTAC
+ACCTATGGCGACCGCTGCAAGGAACTGCAAAACCAGCGCAACACCTACGAGGGGCTGCAA
+CAAACTGCCCAGCAAAAGATGGATGGCGTCATGGCCGAAGTGGAGGCGCACCGCCGCGAC
+ATCACCCACCACAGGTTATGGTGCATTACGGATTGCAATTGGCACCTGGAAGAGCGCTCC
+AAGCGCATAAACGCCTACGTGCGCGGCGAGCCAGTAAGCGGGTACTGGAACGAACAACAA
+CTGCTCGAGGCCGCTGACGGAGCTGGGGTAAACCTGCGCGAGTACCGCAAGCGCTACCTC
+AAAGCCAAATCGGAATACGACTCCTACGAGCAGCAAATCAAGGATATTGATGCCGAGCTG
+CTGAAACTCTCCAAGCAGGGGGTGCGCTGTTGAACCCCGTAGAAATCAAACAGTGGGCTG
+AGCTGGGGATTAGCGTGCTCGCCTTCCTGTCGTTCGTGGCGTTGGTGTTCAAAGTGGGCC
+TGCCCCTGGTGCAAGCGGTAGAGGCGATGAGTGGGGAATTTCGACTGTTGCGCCAAGCCC
+TAAGCGGCGAACAGATGGAAAATCTGGTACGCGAAATGCGATCCACCCGGCATAGCCTGG
+AGGGTATGAACCGGACCATGCGCCGCCTGGAAGGGGTTCTAGAGCGAAAAGGCTTTACCT
+TCCGCATGGAAGACGAGGTGATGCCGTGAACTACTTGGTGTTGGGCCTGGGATTGGGAGT
+ATTCGCCATTGGCGGGTATCTCTTCCTCGAGGCAAGAAAAACCAAACCCCAGCCCCCCGC
+CCCCGACCCGATCCTGAGCAATCCAGACAACCGCGATGCCTACGACGATTACCGCAAGGG
+GGAAAGGGACTCATGGGGATGAAATGGCTGTGGGGAATCCTGGTAGCGGGGGCAGCGGGA
+GCGGCCTTATGGATCTACGCTCGAGGCCGAAAACCCGCCGCGCCTGGGCTCAAGAACTGC
+GCCCAGGTGATTACCCCCTGCGCCGATGGCTTTATAGCCCCCACCCCCTGCGGCTGTGCC
+AGCCACGGCGGGGCAGCGAGAACTACCCCGCCCCCCTTGCCGCAGCCCCAAACCCCCACT
+CCCCAGCCGACCCCTCCGATCACCATCATGCCGGTGCCTAGCGAACCTCCGCCGGGGGTC
+GGCACCACCCTGCCCCACTGCAACCCCGATGAACTGTTTCAAAACGGGCGGTGTGTACCC
+AAATCCCCTCCGATGGATCAAGCGGCGCCGCCTCCGCCCGCGCCACCAGCGCCTATCCCC
+CCAAAGGTTATAGACGCGCTGAAAGGCATCACCCCACAACCGGCTACCGAAACCAAACCG
+CGAAACGTGACCCTACCCGTAATAGCCGATATCTACTGACGGAGGAACCATGGACACCAA
+ACCCTGGTACATGTCAAAAACCGTATGGGCCGCCCTGCTCACCGGGCTACTGGGAACCTA
+CCAAGGTTTAGATGCCGCGCTCAATGACGCCCTGCCGAACATCCCCCAGTGGGTGTTCTA
+CGTGCTGACCGGGCTGGGCCTGTACGGGCTGCGCACCGCCGATAAAAAGATCGGATAACC
+ATGGAACAACAACCCAGCACCGGCGAACTCATCAAGATGGGCTTCTGGCAGGCCAGCGGG
+CAAGCGCTTTTTTGGGGAATCGTCTTGCTGATACTGGGCATACTGGGCAGCTTCGTGAAA
+ACTCCCCAGCCCACCGCACCAGCAACCTCGGAGAAACCCAAATGTTCGGCCTAGATATAT
+CCAACATCCTGGCGCAGATTCGGGGGCAGCTAGCCCCCGAACTGGAGCGTTTAAAGGTTG
+AACTGGAATGTAAACTGGATGCCCTCATCTCTGCCGTGCTCTCCGGACCGCGCGGGCAGG
+AATACGAATTTGGCCGGGGGAAGCCGGAGGTGCGCGGCCACGATCCGGCTGTATTCCCGG
+CCATCGTCAAACTAGCAGGAAAGCAGCGGGCCAATCTGGCCGCGCTGCTCTCGAAAACCG
+TAACTCGAGGATTCGCCGCCAACATCGGGACCAATCCGGCCATTTTGCGCTTTTGGAAAG
+AGCAAAGCCCCGAACCATCCGCCCCTTTTACCCTACTGCCTGGGCAAACCGTGGACTTTA
+GCTGGTTCTTCGACGAAATCAGCGTGGAGGAAGCCACGCCGGGGCAACCCGTAGAGGTAG
+AGGTGTTAGCCCAATAATGAAGCGCACCGTCCTCACCACCCATCGCGGCAAATCCTATTT
+GCCGGAAATCGCCCTGTGCCTGGGGCCGCAAATCATGGGCCAACCAGGAAGCGGCACCTA
+TGCCGATCTATACGGGCGGGTGTGGGCCTCAACGATTGAGCCCGATGGGCTGGTACACCT
+CTGGCAGGCCACCGCCTCCGACTGGCAGGAAGTGCCCATCCCGCAACCCCCGCACGATCC
+CCGGACCATGCGGCATCACTCATTGGCGTTCGACCAGTCCGCCCGGCACGTGCTGGCCTA
+CGAGATAGCGGGGCAAATCTACATCCGGCAATGGGATGCATTGACCAACCAATACGTTAT
+GCGTGGCCCCTGGCCGGGAGTAGATCCGGTAGTTATAGCCGATGCGACGGTGAATTATTA
+TGTGCCGGATAGCGATGTTTTGCTGTTCTATTTGTCCTCGGATCGCTCCAAGTTGTATAT
+GCGGGTACAACGCGAGCTATATGGCACGGCCCATCTAATACAGAGCTTCCCCAACCCACA
+AATACTTGACCAAGCAGTGTCCATCCCCTATCAATTTGAACTACTGGGCTCAAGCGTGAG
+CGCCCCAAACGATTTAGGATTAGTGGTGCGCTCCGACTTGTACCCCGTGTATTTGCCCCT
+GGACGCCCTGACTACGGCATCCGTCGCAACCCCCAGCGCGGGCAACTATTACCCTGTGGT
+GGTGGTTCGTGACCTCGGTACCGATGCTCTGAGCACAGCATCCTTTGCCGTACCCAGCGC
+GGGCAACTATTACCCTGTGGTGGTGGTGGTTCGTGACCTCGGTACCGATGCTCTGAGCAC
+AGCATCCTTTGCCGTACCCAGCGCGGGCAACTATTACCCTGTGGTGGTGGTTCGTGACCT
+CGGTACCGATGCTCTGAGCACAGCATCCTTTGCCGTACCCAGCGCGGGCAACTATTACTT
+GGTGGTTGTGGGACACGATCTCACTCAACCCCGCTACAACTCCCCCGACACAATCACCGC
+AGCTAACATAGCGGTCCCAAGTCAAGGAGCCTATAATGTTGCCTAGAATAATCATCCGCG
+AGCTAAACGCCCCCAGGCCGCAAATTGGCGTATCCCTGCAACCGCAGGAGATGCACTGGC
+AAATATTGGGGCCGGATGGCCGCGTCATCCGGGAGAGCGAACAACCCCTGCATAATCTAG
+TACTAAACAATGCCAAGGAGCTAGCGGCGACCTATCGCTTCTCCACCCTCAACATGTACG
+CCAAAGTCGGCACGGGCTCGTCAATCCCGAGCGCTACACAAACAGCCCTGGACAATCAAG
+TAGCAGATACTAACTCCATCCCCAGCGGCGAGAGCGACAGCGTCACCTACGTTTCCCCCG
+GAGTCTATGACGTGCGCCGAGTGCGTGAGTTTACCGCAGCCCAGGTAAGGGGAAACAATC
+TGACTGAGTGGGGATGGGGGCCAGTTAGCGGCATTGGAAACCTGATGAGCCGGGAACTCT
+TCAGGGATGCCAACAGCACGCCCATTACGCTCACTTTGGGCACGGATCAAAACCTTCGCC
+TGATATACAAAACCCGCATTACCATATCCCCCGCGCCTAATACCGCTACCCCGGCATCAA
+TCACCATTGCCAATTTGGGAACCTACAATGGCAACTTTTGGACCAAGAGGGGGAACGAAG
+ATGCCGGAAACGGCGACTTATACCTAGCAGAGCTGGCCGCAATAGGGGCAGGAAGCCCTC
+TAAACACTGACACTGCCGGGCTATGTATAGCCGGGCTGTCGGCCAACCTGAACACGGCAG
+AGCCGTATATACATGTATATCGTGTAAATGATTTTGGCTTGTCCTACGCCCCTTACACCG
+CAGCCAGTAAAAAGCGCACTACCCAAACCGTCACGGCGGATATTTCGCAGTGGAACACTA
+CCTTATGGGGGCTGATGATCGGAGCAAACATAACCGGATTTGATAACGTCAGCCACGCCG
+GAGTCGTTTTCAACTTTGGTGCGAGTTTTGTAAAAGACAGCCTGCACAAACTAATTATCA
+ACCCTTGGGACATAGTGACCTGGACATGATTCCTAACGTTTCGACCCGCCCATTTATCGA
+GCCCCCCTTAATCCCCCTGCCCGCCCTGCGGGTGGACTGTGCGCCAACGCCCCGCGTGTT
+GTATTCGCATTTCCCGCAGCGGGTATCCCTGGGCTCGATCCTGTATCTCGATTTATACGC
+CTATGCGTGGTACGCGGGGGGCGGCTATCTAACCCTCAACCGGGGCCGTAAGGGGCTAAG
+GCGCACGTCCCACGGGGTAGAAGATGGCCTTGGCTCAACTCGCACGTAATCCCTGGGTGT
+GGCTGGGGGCCATCGGGGCGCTTATCCTGCTGCGGCCTAGAGGGGGCCTCGAGGCCAACG
+CCAAGCCTGCACCCACCCCCAGGGATGGGGCAGGGTGCGGCTATCCTCGCTCCGACCTGC
+CACCCGCCGTCGCAAAAACCAATGCCGAGCTGATCGAGCGGACCTGGGGGATAATCCTGG
+CCGATAATGGGCGGGTAAACGATTTGGCCCAGAGTTACGGCTACGAAGCCCCACCAGGGC
+AATACGCCCGCGACCTGGCCGCCGCGCTAGTGGGAGCGGCACAGAGCGCCGGAGTGCCGC
+TGGATTTGCTCGTGGCACAATCCAGACGGGAATCAAACCACGTGCCCACCGTTGTAACAA
+ACACGTATTTGAGCATCGGATGGGAGGATGCCGCCATTCGACGGGCAGTTGCAAATAACT
+GGGCCATTGGGCCACTCCAGGTCAAGCCGGGAGTATTCCCCGAGGTCGGCTTGCCGTCCC
+CGAGTCGCTGGCTGGGCGACCCGGTGAGGTGGAGTAGTCAAGCCCGGCTCAGGGATGCAG
+TATTAGCCGGAGCACGATATTTAGCCAAACAAAAAAGTCGCTACGGTACATGGTGCGCCG
+CACTACACGCCTATACCGTAGGGCCTACGGCATACGCCAATGGGGCCAGGGCAGACGGGT
+ATGTGAGCCAGATTATTGCTTGGGCCAACGGGTACACGGAGCTGCGCACATAA
+>NC_014212.1|provirus_1893193_1914973
+GTGACCAGCCTTGATCGCATCTATCAACGTAATCTGAGCCCAACCCAGGCCCGCCACTAC
+GCACGGCTGTGCGAGAGGAATCACAACACGTTTGGAGCGCAAATCTACCACGATGTGGCG
+GAAGCACTGGAAGCTGCCGAGCGTATCCGCGCCGCGATGAGGCTGCAAGGCTACCTCTGC
+CCCACCTGCGGTAACACCGGGAGGCTCGATGACATCCCCTGCTTCCACTGTGCTGCTTGA
+GCCAGCCATGATGACCCCGGATCAGATACTGGCCACCATTGAACGGGCGTCTCGGCCTGT
+ACTGCTTTTTTATACCCACGACACCGCCTTGCGGGTGCGCTTCCTGGGTCGCACCATGCT
+CCCTGACCTGACGGACCCCAGCGATCTGTGGGGATATCGGCCCGGCGAGCAAATAGAACT
+ATTTGGCTGTGGAAGAAAAACAATCAATACATCAAGACTTACGACATCGAGCCGCAGCTC
+GAGGCCACCTACCCCAGCGAAGACACCGTTTGGCGCTGGCTGAAGATGCACCTGGCCGGC
+CTACCCCTTCGGGGAATCGGTCTGGCTGGCCTCGAGCTGATTGAACGACGTATGGCAAAG
+GAGAACCCCCATGCCTAGTGCAAGAGCCCTGGCAATGGCCAAAGCCAGCCCTCAGCAGAA
+CCTGGACGAGCTCTTCGCGGCCCTCCAGGCCGCCCAGGGCCGCCCGCTGGATCTCCACAG
+CTCCGGCCTGGAAGTGCGGGCGTGCTTCCTGGGCCTGGAGGACGGTAAACCCCGCTACGG
+CCTGTACTGCTTGGCCCTGGGCGACTGGCTGAACGTGGCAGAAACCACGCTGCGCACATA
+CCTGAGCCAGTCCGGGCCCTATACGTGGGAAAAGGAAGATGAATAACCCGATCTACGAAG
+CTATCCAGCGAGAGCTGGCCTCCTGCCCGGGGATGAATTTCAGCATCTGGGAACTCCTGG
+CCGCGTTCGAGCTGGAGGCTACCCGCAACAACTACTACCGCCTCTATTACTTTCTGCGCC
+AGCTTGAACAGAAGGGGCTGGTGGGGCGCTGCCCCGGCTGGGCCCCCGGGGGCGGAAGCC
+CTATCTGTACGGATTAAAGGAGCCATATGGACGAGTTTGAACTGGCCCGCCAAGTGTTTC
+GAGTTCTTTGGGAGGCCGGCCCCCAGGGTCTGGATCGCGACGCCCTGGCCCACGCCCTGG
+GCGTGCCGGATCGGGAGATGCGGGAAGCGGTCGAGCTCTGCGCCAAACTGGCGGCAAGGC
+CCAGCGTGCCAGGGGCCAGGCCGGAGGTAGTGGGATTTGACCCCATGACCCGGCGCTACC
+ACATCGCCAACTCGGTGGAGCAGGCCGACCGAATCATCAGCTACGCCCTGAGTTACATCA
+ACAGCGGCCTCGAGCGCGTGCGGGCCTACTGCGAGGCCCGCACCTTGCGCTGGGGGGAGA
+TCGAGACGCCCCAGGCTACACAACAGGCCCTGTTCGAGGCCGAGCGGAGGCTAGAGAGGT
+AAACCCCCCACGCCCCGCCACGCCGTGGCGGGAAGCCGGGGGCTTTCCGAGGGAGGACGC
+TCTGCTGGGCAGGAGCAGGAGGTGGACATGGAACTCACAGAGATCGGATGGCTAGGCCTG
+GTCGCCCTGATCGTGGGCTGGGTGGCTGGTGGGCAGGTGGTTGGAGGCGGTATCAGCGTA
+AGTGCCAGCGTCCTCCTGACGGCGGCCCCGGTGCACATCTACGTCACCCCAATCACCGTC
+TGGAGGCTGACCCACAACCAGCTTGTGGAGCGGTTGTGGGGAACCGGCTTTACCCTGGGC
+GGCACGGTGGTTTACGTGGATCCCCGGCCGCCAGCGACCCAGATGCCCGAGCGCGACATC
+AACAGCCTGCGAACCATGATAGAGCAATACGAGCTGGGGCACATCCTGGGCTGGAGGCAC
+TACGGGCTAGAATACCTTCACCAGATAGCCCACGAAGCCTGCCGGTACGACCCCAAAGCC
+CTGTGGGCGGTGCACTGCCGTAACGACCACAGACCCCCACAAATCCTGCTGCCGCATACC
+GGCGCCATCCGGGTGGTGCTGCCATGAACGCGCATCTGCGAAACACACTGATTGCGTTGC
+TGGCGCTCGCCTACCTGGCGACCCTGGTGATGTCGGCCGGCCACCTGACCAAGTGGTTTG
+ACCTCAGCTTGGGCGAGCTGCCCCGGTTTTTCTCTATTGGCCTGGCGGTGGGCCTGGAGC
+TGCTGGCCTTTACCCTTAGCCTGGCCAGCACCCTCGAGCCCCGCCTGCGCTGGAGCCTGG
+CTGGTGGTCTGTTCTTCTTATTGCTGGTCTGGCTGGGCAACCTGCTGGCAATGGCCCGCG
+TGGCCAACGCCCCCGGCTGGGAGGTGTTCGCCCAGAGCCTGTTTGCCCTGGGGCCGCTGG
+TCGCGGGTAAAGCCATTGGAGAGCTGCTACGGCTGGAGCGGCCCGGACGGCCACCGTCCG
+CCGACCTTTCAACAAGCGGACAGAGGGTCCACGTCCAGACCCACGTTCACACCACTACGG
+TCCACCAGGCGCTCCAGGTCACGGACCGGATGAGTTCATCAACCCAGCCCGGAAAACCGG
+ACGAACGGGTGGAACAACTGCTGGCCGTTCTATCCGGCCAGCCCCTGGGACCTTCCGCCC
+TGGCCCGGCGGACCGGACTACCCAAGACCACGGTCTACCGGCTGACCGCCCGACTGCTCG
+AGGCCGGACTGATTGCGCAGACCCCGGGCGGATACGTCCGCACAGAGGTGGAGCGTGGCC
+GGTAACCTGGAACGCTGGCGGGCGGAGCACACCGCTAAATACCTCTGGTGGGTGGCGCAT
+GGCGTGCGGGGCTGGCAGTCCGACCGGATCAGCTACGCCCCAGAAACAGACCGTTTGGCC
+GCACGACCAAAACAGCCTGGATACCTGGTCATCCAGGTGATGGCGCTGCCCGAGATCGGT
+ATCGACCGCCATACGCTGCGGCTGTGGCGGTCGGACTACCAGGCCCTGCTGGATCGGACC
+GATCCGGCTATCAAAGATGAGTGGGCGGCGTTCCTTCACCGTGCCCGATGGTCTAGCCTG
+TGGTATTTCGACGCGAGGAACAGGCGGATTCGTCCCGGGAACGAGCACCGCGGACTGACC
+GCCTGGACCCTCGAGCTGGGTCGACTGGCCGAGGTACTGCCCGGCGGAAAACCAGCCACC
+CAGCAAAATATCTGATACCATTATTTGTAACGTAACCCGCCGCGTACTACGCGGCGGGTT
+TGGAGTCGCGCGTGGACGAAACCGAGAACCACCTCAACCGTTTGTTGGAACACCTGATCC
+GGGCCATGCGGGCCAACCGAAAAGCCGAGCGGGAGGCCGAACTGCGGGAGGCCGAGAACA
+TTCTGAATGCCCGCAAGGTGATTCTGCAGATTCCCAAGCCCAAAGCACCGGCCTGGTGGC
+AGAACGAGTGGGTTTTTCGCTTCATAGCCACCCTAGTGGGCGCGACCCTGGCAGCCCTGG
+GAATCAACTGGAAGTTTTAAAGGAGGCCTATGATCTTTGACAAGAAAAACCCGCGCCGGG
+CCGCTTTGATCCGGGGGCGGATCCTGGAAGTGATCTATTTCGCGGCGATGGGAGACGCGC
+TAAATCCTGACGACCCTTACAGTATGAGCCGCGGGGTGCTTCAGGCCGCGCTCGAGCAGC
+TCAACGAGCTGCCCGCCGAAACCGACCTGCACGCTGCCCTGCGCTACTGCGCTGAGAAGG
+GGTATCTGGAGGTGGCCTGGCGAAAAGACGGCTCGGGGAGCTTCGACAGCGTGCGCCTGA
+CCACGGCTGGCATCGACCTGTACGAAGGAAGCATCCACGACAAGGCCGTGTATTTTCACT
+CGAGGCGCTGAGATGGAGCGTCTGGATCGTATAGAGGCGCAGATAGGCGATCTGCGGGAG
+GAATTGCGTGGGCTGCGGTTGGCCCAGACACTCACCAATCGGGAGCTGCACGAAACCTTG
+GGTGTGTTGCGAACCGTGCTGGAGCAGGTCAGTCGACAATCCCGCCCACCCCGCCTGCAG
+ATCTGGGCGACCATTGCCATCGGCCTGGCGAGCTTTGGGCTGGGTTTTACCGCCCACTGG
+CGCATCTCAGAGATCGAGGAGGTGAGGCATGTCCAGTTTGTTCTACCCCCGCGAGCCCCG
+GTGCAAAATTTGCAACAGTCCGATTCGCGATGAGATTGACCAGATGCTGCTGGGCAATCA
+ACTGACCGAGCATGGCGAGCGCTGGTGCCTGGAGGCGATTGTGGAGTGGGCTCGGGAGAG
+AGGGTTGAACACCAGCATGGCGGCCCTTTCGCGGCATAAGAACAACCACCTCAATCCGGC
+CGTTCAGGCCGCCCTGGAGACCGAGCGGATGGTGGAGGCCATCAGCGCGGCCACCGGCCG
+TAAGCTCAGCGTGGCCAGGGCCTATGCCAACGCGGTGCTCGCCAAGACCCTGCGGATTCT
+CGACGACCTGGAGTGGGACAGGCTGGACACCGACCAGAAGTTACGCGCTGTAACACACGG
+CCTGCGGGCCGGCGAGGTTTTGTCCAGACTGGAGCGAGCCGACGTGCGGCAGGAGGTGGC
+GACCAAGGTCGAGAAAACTCTGTCGGAAGCTGGCATCAGCCAGGATCTGCTGCAAAAGGT
+GCGGGAGATTTATGGACTGGCCTAATACTGGCTTGTTGCTGCCGTATCAACGGGCCTGGA
+TCGAGGACCAGAGCCGCTTCAAAATCGGGCTGTGGTCGCGGCAGGTTGGTAAGAGCTTTG
+CAGCCTCCCTGGAGGCCGTGCTGGACTGTGTGGCGCACCCGCGCAGCCTGTGGGTTTTTC
+TCTCGCGGGGGGAACGCCAGAGTAAAGAGCTGGCCGAGAAGGCCCAGAGGCACCTGGAGG
+CCATCCAGGTGGTGGCTGAGATGTACGACGAGCCCTTCGACGCCGAGTCCACCCAGACGG
+TGATCCGGCTGCCCAACGGTTCTCGCATCATCAGCCTACCAGCTAACCCAGACACCGCCA
+GGGGCTACTCAGGCAACGTGCTTTTGGATGAATTTGCCCTGCACAAGGACTCCCGCGAGA
+TCTGGGGAGCCCTCTACCCCACCATCACCCGCTCCAAACGGTACCGGCTGCGGGTGCTCT
+CCACTCCCAAGGGCCAGCAAGGCAAATTTTACGAGATCTGGCAGCCCGAGCCCGGCGGAG
+ATCTGTGGAGCCGCCACCGGGTGGACATCTACGACGCGGTGCAGCAGGGCCTGGAGGTGG
+ATCCGGAGGAACTGCGCAAGGGCCTCAAGGACCCGGTTCTGTGGCAGCAGGAGTACCTAC
+TCGAGTTCGTGGACGAGGCCTCTGCCTGGCTGCCCTACGAACTAATTACAAGCTGCGAGA
+GCTCGCAGGCCCGTACCGATGGAGCACTGGAAGGAGATCTGTACCTGGGCATGGACATCG
+GCCGCCACCGCGACCTCAGCGTGATCTGGGTGGCTGAACGCGTGGGGGACGTGCTCTGGA
+CACGCCGGGTGATCTGGCTCGAGCGCACCCCCTTTGCCACCCAGCGAGAGGTTTTATACA
+GCCTCTTGCCACAGGTGCGCCGAGCCTGCATCGACGCCTCCGGCCTGGGCATGCAGCTGG
+CCGAGGAGGCGCAAAGCCGCTTTGGCAGCAGGGTGGAGCCGGTGATGTTTACCCGCGCGG
+TCAAAGAGGATCTGGCCGTTACGCTGCGACGGAAATTTGAGGATCGCCTGATCCGCATAC
+CCCCCGACGACCGCATCCGTGAGAGCCTGCACGCCGTGCGACGCATCACCACCAGCGCAG
+GCCACATCCGCTTCGATGCCGATCGCGATGATGCAGGCCACGCCGACGAGTTCTGGGCCG
+CAGCTTTGATGGCCCACGCGGCGGCCAGCCCCAGCGGGCCCATCACCTTCGAGCGGGTCG
+GCTGGGGCCGTATGAGCCAAAAAGGAGCCTGGTAATGTGGCTGACAGAGCAAATTGCTAA
+ACTGCTGGGCCGCAAACCCCCTGTTGCGCCGCTGCCACACCCTGTCAGCGGGCGCGTCAT
+CAGCGGGACTTCGCGGGGCCTGGAGCCGGAGGGCCTGGCTGCTATCCTGCGGCAGGCCGA
+ACAGGGCGATCTGACCCGGCAGATGGAACTTTTTGAGGAGATCGAGGAGAAAGATGCGTA
+TTTGGCGAGCCTTTTGCAAACGCGCAAGCAGGCGGTGCTGGCCCTGGACTACGCGGTGCT
+ACCCGCCGACGATTCGCCGGCGGCGAGGCAAATCTCGGACGAGGTGAGCGCGCTATTGCA
+GCATATCAACTTGCAGGACCTGCTGCTGGATCTGCTGGACGCGATTGCTAAAGGTCTGAG
+CGTGATTACCATGCGCTGGGAGTACGATCGGGACAGCCGGCGCCAGCTGCCCACCGAATT
+CACCTGGATTCATCCGCGAGACCTGCTCTATGATCCGCAAACCGGCGAACTGCGTCTGCG
+CACCCAGGATGGCCCGCAGAGCATTCCCTACGGCGCGGCCCTGGTGCATCACTACAAGGC
+CAAGTCGGGCGCGCCGTCCCGCGCCGGGCTGCTGCGCAGCCTGGCCTGGCTGTACCTGTT
+CAAGAACTACAGCATCAAGGACTGGATTACCTTCCTGGAACAATACGGCCAGCCCCTGGT
+GCTGGGCAAGTACGATCCCACCGCCAGTAAGGACGAGCTCAACGCCCTCAAAGAGGCGGT
+GGCGGCCATCGGGCCGGAGGGCCGCGGGGTCATCTCCAAAGCCACCGAGATCGAATTCAA
+GGAATCGCAACGCTACGGCACTGCCGACGCTTACAGCCGCTTCATCGAGCTAATGGAGCG
+GGAGATGGCGGTAGCCATCACCGGCTCTCCGCTCTCGAGCTTCGATGGCAGCGGCGGCTC
+CAATGCGATGGCGCTTACCCTGGATAAGATCTCCCAGCGGCTGACGCGTTCGGATGCCAA
+AGCGGTCTACAGCACCTTGCGCCGCGACCTGGTGGTGCCCTTCTGCCATTACAACTTTGA
+CCGGGCCGACCTGGCCCCCCGCCTCGAGCCCATCCTGCGTGAGCCGGAGGACCTGAAGGT
+GGCTGCCGAGACCATCAAAACCCTGGTGGATGCTGGCGCGCCCATACCGTTGCGCTACAT
+CCACGACCGCTTTCAGATCCCGGTGCCGCAAGCAGACGAGCCGGTTCTGGCCCCCTCCAG
+GGCGGGGGTGACCGGGCGGGGCGTCAGGCTGGCATCGGGGGATGCCCGCGGGGCGCGGGG
+ATTTATCAACGGGCAGCTGTACGTGGACGGGCTGGACGAGGTGGCCCGGGCCGAGGCGGC
+GCCGATTCTGAATGACCTCATCGAGCGCATCGCAGCTATGGCAAACCGGCACCACAGCTA
+TTCGGATTTGCGGGAGGCGCTGGTACGGGAGTACCCCAGCCTGGCCAAGCCGGTGCTGGC
+CGAGCTGATCGAGGGCAGCCTGGTGCTGGCCGAGCTGGCCGGGCGCGCTGCAGTAGACGA
+GGACATCTGATATGGCCTGGAATGTTGATGCTGATCCGCTCCAGCCAGCCGAGGCCACCG
+ACTGGTTCCGGCGCAAGCTCAATCTACGCAAGGACGAATACAGACAACTGACCGACCGCG
+CCCGACGGCGAGCCTTCACGGTGGCTGGCGTGGCCTCCCTGGACCTTCTGGCCGAGGTAC
+ACCGCAGCCTGCTGGAAGCCCTTGTGCAGGGAACCCCCTACCAGGCCTGGGCCCAGAACC
+TGGGGCCGACGCTGGCGGCAGCCTGGGGGACGACCAACGGCTACCGGCTCAAACTGGTCT
+TCCAGCAGAACATCCTCTCGGCCTATGCGGCCGGTCGTTACGCCCAGCTCACCGACCCGG
+AGGTGCTGCGGGCCCGGCCATACTGGATGTTCGACGCGGTGCTGGATAGTGCGACCACCG
+AGACCTGCCGGCAGCTCAACGGGGTCGTCCTGCCCCACGATCACCCGCTCTGGGCAAAAA
+ACTACCCCCCGCGCCACTTCGCTTGCAGGAGCGGGATACGCAGTCTAACCGTCCGGGAAG
+CCCAGGAAAGGGGGATAACGGAGAACCCGCCGGAGGTCCAGGCCGAGGCAGGATTTGGAT
+TGCGTTCCGACCCGTCGGAGTGGGGGCGCGACTGGGCCCGGGGGGTGGCCACCAGCGCCA
+GCAGCGCACGCTGGCAACCGGCGTTTGCCGGCACACCGCCAGACTGGCGCACATACGGCC
+GGCCCGAGGCCATTCCACGGGATCGGTTGCCCCCAGACCTCCTGGTACCCTCCATCAGCG
+AGGTGGGTGAAGCCGGCTTCCGCCGTGCGCTGGCGCGGGCCTGGGGCGGCCTGGAGGTGG
+TGGTGGCCGATCCCACCGGGGCGGGAACCATTCTCAACGCCCGGGTGCTGCTGGAGCACC
+TTAGCCGCGAACCGCCGGATGACCGGGAGCGCTACTACGGCCTCTTGCCGGATGTGGTGG
+CAAACCCCTACGAGATCTGGTTGGTACCGCTACAGTCGGATCGTGGGGCGGTAGCCTTTC
+GCAAGTATTACCTCAAGCTCTATGGAGACAAAGAGCGGGCCTTCCTTCTGGTGGTGGAGC
+AGCAGCGGGGAAGCACCTGGACCGCGTATACCCACATCTACAGCAGCAAGAAACGGTATA
+TCGCCGACCGGCGGATTGGTTTTCTGCTGTGGGGGAGGGATTGACACTCCCACGGCTAAA
+GCACGTGGGATTCTTGGTTCGACGAGGACTGCCTACGTTGTGTAGGTCTTACACCCTCTC
+CCCAAGCGTTTAGCGTCTCCGGGTGCCCCACGGCGACGGGGATAGCTCGTATCCCTTCGG
+CCCGGATGTTCAGGGCCGCGTTCAGGTCTCGGTCGTGCACCGCCCCGCACTCACAGGTCC
+AAACCCTGTCCGAGAGGGTGAGGGCGGTGTGGATTGTCCCGCACTCCCGACAAAGCTTGC
+TGCTGGGGAAGTATCGGTCAATCACGACGAGATGTTTGCGATACCAGACCGCCTTGTACT
+CCAACTGCCGCCGAAACTCACCCGGGGCCGCATCTAGAACCGACTTGGACAGCTTGGTTT
+TCGCCATCCCTTTCAGGTTCAGGTCCTCGATGCACAGCCCGTCGTACTTCTGGACGAGTC
+CGGTGGTCAGCTTGTGCAGCCAGTCCTGCCGCTGGTTGCGAACCTTGGCGTGGACCCTGT
+TCAGCCGATGCCTGGCCTTTTCCCGGTTCTTGCTACCCTTCTGCTTGCGGGAAAGCTCCC
+TTTGCGCCCTGCGAAGCTTGCGCTCTGCTTTGCGGTAGAACTTGGGTGGAGCTATTCTTG
+TACCGTCGGAAAGCACTGCGAAGTCTTTCAAGCCGAGGTCAATCCCCACCACATGCTCAG
+GGTTTACGGGGGGCAGGGGTACGTCGGGCATCTCGAACTCGGCGGTCAGGGTGACGTGCC
+AGTGCCCTTCGGTGTCGCGTTTGAATGTTGCGCCTTTGATGACGCAATCAATCGGCTGGC
+TCTGGCGAATCTTCACCCCACCGACCTTGGGGAGGTAAACCTTGCCTTCCTCCACCCGGA
+CGCGCTGGGGAATGCGGAAGCGGGGCGGGTCCTTCTTTCGGGTCTTGAACCGGGGGAACC
+CGGCCCGTCGCTCGAAAAACGCCTTGAACGCCCGGTCGAGGTCTTGGAGGGCTTGTTGCA
+AGAGTTGGCTATCCGCTTCTCTGAGCCAGGCCATCTCAGGCCGCTTCTTCAGGGCGGTGA
+GTTCGGTGGCCTGCCCGTTGTAGGTCAACCCCTTCCCGGTGGCGGCATACGCCTCCTTGC
+GCCGTGCAAGGCCCCAGTTCCACACGAACCGCCGAGCTCCGGCCATACGCAGCAAAGCCT
+CAGCTTGGGCTTGGGTGGGTTCCATGCGGAAGCGGTAGACCTTGCGGAGCAGCATTCAGT
+CCCTCGTCTTCTGGGCGGCGATGTATTGCTCGATGGTTTTGCTACTGACCATGCCAGCCG
+TGGAAACGAAATAGCTCCGTGTCCACAGGGCGGGAAGGCGGATGAGTTGGGGAAACTCCC
+GGCGCAACACGTGCGAGGTGTAGCCCTTCAGGCGGTGGGCGACCTGGTTAGGGGCCACGT
+CGGGGTCTACCGAAATGAACAGGTGTACGTGGTCGGGCATGATTTCCAGGGCGATGATTT
+CCCAGCCTAGTTTAGCGGTCTTCTCCCTAAGCAGAATATCCAAGCGCTCGGCCAACGGTC
+CTACCAGAATCTTGCGGCGGCGCTTGGGCACGAAAACGAAGTGGTAACGCAGCAGCGAGA
+CGGAGGTGTTCTTGTGTTTGTAGGCCGTAGGCACTATCACAGTATAGCACACCTGCCGCC
+CACCATGCGATGTGCCCCTGCGGGGCACATGGGGGAGTCCATGTATCCCATCCCTGAAGG
+GAAGGGTTTTATAGCTCCCCCACACCCCCTCGCTTCTATAAGCCGCTTGCGACCCCCAGC
+CTAGGGGGAAGTCGAGGAGGCCACTTGGAAGCCCGTAAAAACGATCGTAGAGGCAAGAAG
+GAAAATCTATCACAAAAAGAGGAGGTGGGACGTGCACAAGGTGGCACAGATCGCGCTGCT
+GGCGGTGCGGCGGGAACTCCCAGGATTCATAAGCAGCCCGGGCTGGTGCGTGGCGTTCGC
+CTTTGAGTGCATCGCCCGGGCATATGACACCAACCGCTGGCTGCTCTACAGCCGGATGCT
+CGATTCCGTGCAGGCCGACCCCGACCGCAGCCGCTGGGCCCACGACGTGGAGCTGGCCAT
+CGACCGCCTGGACTGGGATGTCACCAAAGCAGACCGGGACCCGGCCGGGGATGACCGCAA
+AGGCCTCTTGCGAATAATCAAGCCCGGTGACTTACTATTCAGTAGCCAGCTCCACGATGA
+GCCACCGAAATCCCGGCGCACCGCCACCGATCGGGAGGGCCACCTCGCCATCTTCGTCGG
+TGAGGTGGAGGGTATACCCAGCGTGGCGGAGAACACCCGCGCGGATCGGGGCAGATGGTT
+TGGGCGGAGGTCAGCCCTGCGCCTGACCCCACTGGCCCACTGGGATACCGTGACCACGGT
+GGGGCGGATCCCCAGCGGGTGGCGGCCGTGAGCGTCTCGGGCTCGTTTGGTGATCTCGAT
+GGCCTGATCCGCCGGCTGGGCCGAATGGCCCAGCCAGCCTTCGCTGCGGGCCTGGCCAAG
+AGCCTGGGGCAGGCCGCCCTGAACCAAATTGACGAATCTTTTGCGGGGCAGCGCGACCCC
+TGGGATCGGCCCTGGAAACCCTCCATCCGGGCCGAGACCACCGGTGGCCAGACCCTGCGC
+CAGAGCGCCCGGCTGCAGCGCAGCATGACCTCGCAGACCGCCCTGACCACCGGCCCTGCC
+GGATTCGAGGTGGGCACCAACGTCCAGTACGCTGCGGCCCACCAGTACGGAGCCACCATC
+AGACCCCGGAAGGCCAAGGCGCTCAGGTTCAAGCTGGGAAAGCGCTTCGTGCAAACCAAC
+CGGGTGGAGGTTCCTCCCCGGCCCTTCATTCCGGAGCCTGTGCTATCCCCCCGCTGGGAA
+CGGGCGCTCGAGGCGGCGGCGGGGGCGTACCTCGACCGAGGGTTGGCCTGATTCGAGCGA
+TCCAGGAAGGGGGTAAACCACCCCACGTCCCGCCACGCTGTGGCGGGACGTGGGGTGAGG
+AGGTGAGGCAATTGACCGAGACCTTGTTGGAGCGCCTTCGGGCTGAGCTGCCCCGCAGGG
+TAAAGCTTGAGCTGGGCCCCGATGCGCTCAATCAACACGAGGGGCCGCTCAAACTGGTGC
+TGGTGCCAGGGCAGGACACGTTTACACCACCGGATACCCGGGCCATCGCCCCTGAGGCGC
+TGGCCAGGGAGACCCTCCCGCAGCCCCGACCCCGGCCGCCCTACACCAGGCTGGCAGGCT
+ATACCCTGCACATCTGGGCGAAGAGCTACCAGGCTGTGGAGGACATCCTCTCCGAGTGCG
+TGGCGGCCTTGCGGCGCATCTGCGGTAGCAGCCTCGAGCTGCTCCCGAGCGGCTGGGACG
+AGGACGAGACCGGCCAGGCGGCGGCGCTACCAGCGGACAAGCGCCGCTATCAGCTGCGGT
+TCAGGGTACTGGTGGAGGTAGGGGCGGCAGAACCGGGCCTGTACGTCCGCCTCGAGCGGG
+CCCTGCTCGACCAGGCGGAAATTCTTCCCTGAGAGGAGCGTTATGGCAAAAGCAACCGAT
+AACAACAACGGCGGGCAAGCTGCACCTGCCCGAAAGACCGTCGAGGAGCTGGCTGCGGAG
+GCCGGTACCCCGGACTGGCTGCTGGCCGCGGCACGGGCCAAACACCGCTGGGTGATCGGG
+CAGGAACTGACCAAAGCGGCCTTCGAGCGGGGCATCCAGGAGGCGGCCAACGAACCCATA
+GGAGGTGAGGTATGACCGGCCTGCCGCGCGTGGAGGTGAGCCCCCAGGACTTCGGCATCG
+GCGCGGTGCCGGGCAACGGTGAGGGGGTGCACGTCAAAATTGGCATCGCCTCCATCCTGC
+CAGCAGGCGAGATCATAACCGTAACCAGCCCGCAGGGGGCCCGGGAGCGGGTCGGCGGCA
+AGCTAGGCGAGGCCGCCGCCCTGGCCTTTGGCGAGGGAACCCGGGCGGTGATCTGCCTGG
+CCGCCAACCCCAGCGTGCCCGGGACAGCGGGCGCTGTGACGCACACCGGCAGCGGCACGG
+CGGTACTGTCTCTGACCGGAACCCCCCGGGATGACTACCGCCTGCGCCTCAGAATCACCC
+GCGCGGCCCCGAACCTGGCTGCGGCCACGGCGGCGTTTCAATACTCGCTGGACAACGGTA
+ACACCTTCAGCGCCGAAATCGCCGTGCCGACCACCGGCCTGTACACCCTGCCCGATACCG
+GCCTGACCCTCAACTGGGCCGACGGCTCCTTTGTGGTCGGTGATGTGTACACCGCGGACT
+GCGTTGCGCCGAGCTACACCACCACCGATCTGGTCACCGCGCTCAACATTTTGTTTGCCC
+GCACCGAGCTATCCTACCGCTTCATTCACGTGGTGGGGGCGGGCAGCCCGACCACCGCTG
+CTACGCTGAACACCCTGCTGGAGGCCCGCGCCGCCGACCCGAACAACCCCCGCTTCATCC
+ACGCCCTGATGGACACGGCGGACCAGGCCGACGCTGCCCTGATCGCCGCGTATGCCGGCA
+CCACCAGCGTGCGAGTGGGTGCAGGAGCCCGCTATGCCGATGTGGTGAGCCCGATCACCG
+GCCTGGTGATGAAGCGGCCGGCCGCATGGGTGGTCGCTGGGCGGTACAGCGGCCGCCCGG
+TCGAGGAACACCCCGGCCGCTACGCCAGCGGAGCGCTGCGCACGGTTGTGAAACTCCACG
+GCGATGAGTCCATCACCCCCGGGCTGGACGCCGCCCGGTTCACCACGCTGCGCACCATCA
+GCGGGGGATTTTACATCACCCGGGGCCGCCTGTTTGCCCCGCCCGGTTCGGACTATGAAC
+AGGTGCAGAACCGCGAGGTGATGGATGTGGCCTGTGAGGTTGCCTACCGGGCCTGGCTGC
+GCTGGCTAAATGAGCAGATCCAGGTCTCCGCGCAGACCGGGCGCATCCTGGAGCGGGAGG
+CCCTGCGGATTGAGGCCTATGTGGAGGGGTTGGTGCGCACCGCGCTGCGGGGCAAAATTT
+CCATTGACGAGGTCATCGACCAGCCCGCTGCCTACGTCCGCATTGACCGCACCGAGAATA
+TCCTGTCCACCAGGACCATCCCCTACGACATCAGTCTGGTGCCACTGGGCTATGCTGAGC
+GGATCACCGGCAAGGTGCGCTTCTTCAACCCACAGCTCCAGCCAGTGGCCTAGGAGGTAG
+ACCATGAGCGTGACCGTGCGAAATGGCAAGGTGTACGACAACTCGAGCATCCAGCTTGAC
+CTGGATGGCGAACGGATTCCGGTCAACGTCGAGTTGGAGTACAACACCGGCGAGGTGTCG
+GAAGAGTATATCTACGCCGGGGGCAAGCCGGTGGGGCGCACCCCCGGACAAATGGCCCCC
+GCCGATGTGACCATCCGGATGCCGCTGGACCAGTGGCAGCAGTTTCGCAGCAAACTGGGG
+GCTAAATACAAGCGCAAGGAGTTCAATGCCGTTGTGACGTTTGTGGACGCCGACGATAAC
+GTGGTCAGTGACAAGCTGAATAGGTTGCGCATCCTCAACGACGCGCTCTCGGCCTCGCCA
+GGCGCCGAGGCGCTTATGCAGGAGCTAACCTGTAAGGCGCTGGATGTGGTGCCTGGCGAT
+CAAGCCACTTTCTGATTTCTGAACCTGCTAGCCCCACCCCGAACGGGGTGGGGCTAGCTC
+TTGAGGCATCAACATGGGAAAAACCATTCTTAGTGAAGACCTCGAGGGCCAGCTGCCCCC
+CACCACCCTGACCGCCCTCCGCGCCACACATGGCGACCGCTTGTTCGCCCTGGTTCGCCA
+GGGGCGGGTGCTGGTGTTCCGCCCGCTCACCAAGGCCGAGTACCGCATGATGCGGGCGGA
+TCTAGACAAGGCGTCTGCCAGCCCGAAGCTGGCACTGGACACCTACGCCATCGGCGAGAA
+GTACGCCAAGCTGGCCCTGTGCTACCCCGACCGGTCCGAGTTCGAGGCCATCCTGGACGA
+CTACCCAGGCCTGGCCGATGTGGTCAGCCAGGACTTAGCGGCAATTGCCCAGATGGCCGA
+AACGGAGTTTCTTCAACAAATCGATTGAACTGCTAAACGACGCCCTGCGGCACCGCGAAC
+AACCCTTGGTAGCGGCCCGACTCCTGCTGGCCTACCGCCGAGGTGAGGATTCCCCCGAGG
+CGCTGGCCGGTGCGGCGTTGGAGGCCGCGGTGCTGCTGGGCCATTTTGGGAGGATCCAAT
+GAGGCGGCTGACATGGTTTTTTGGGTTACGCAGCAATTTTGTAACCCAGTCGCGCGCCAT
+GTCTAGAGGGCTGACGGGGGTTCGGGCAGCCCTCCAAGAAGTGGGCGGTGCGGCCCCGGC
+GACCGCCCGAGCGGTCGCCCAGAGCCTGAGGCTGCCCATCGGCGCGGCGCGTCACCTGGT
+GGGGGCGCTGACCGCTGCGGGGGCTGCGAGCGCGCACCTGGGACGGATCAGTAGCGCGGC
+AGCCAGGGCCCATCAATCCCTGCAGGGCCTGGTCGGCCGGCTGACCAGCCTGCCTGGCCT
+ACTGGCCGCTGGGGCGGTTGGCATGGCCACCAAAAGCATATTTGACGCCATCGGCTTCAA
+AGAACAGCAGTTGATCAGCCTGCGGGTGATGCTACGGCCGCAGGTGGGGCTTGACGCCGG
+TCGGATGGCCCAGCAAACCTACGCCATGCTCGCCCGCTTCGCCGCCGAGACGCCCTTCGA
+GACCCAGGAGGTGATCGCCGGCGGCAAACAGCTGCTAGCCGCGGGTGTGGCGGTGAAAAA
+CCTCCAGGGGCTATTGAAGGATGCCGGCGACCTGGCGGCAGGGATGGGAGTGCGCCTCGA
+GGAGGCCATCGCCCCCATCACCCGGCTGCGTGCCGGCAATTTCGGCGAGGCCTTTGAGCG
+GCTTCGCGACTTCGGTATCAGCCGGGAGGCCCTGGAGGCCAGGGGCCTGAAGTTCGATAA
+AAGCGGCAGCTATGTGGGCTCGGTCAACAAGGCCATGCTGGCGGTGCGCCAGGCCATCAA
+GGAGCGCTTTGGCGGCCTGATGGCCGAGCAGAGCCAGAGCATCTTCGGCCTGATCTCGAC
+CCTGAAGAGCCGACCCTTTGAGCTATTCAGCCAGATGAGCGTGGACCCCCAGGGACCCCT
+CAAGCCCTTCAAGCAAGTGCTGGCCAACCTGGCGGTCCTCACCGACTTCAGCCGGGGGCC
+GGGGGCGGCCCTCTCCAAGCGCTTCCAGGCCAGCCTGGCCGGACTGATAAAAGCGGCCTT
+CGGCCCGCTGGCGGCTGCCAGCGAGCCCAAACAAGCCGGGCAGGCGATCCTGGCGTTCCT
+CGACCGGAGCACCGCGCTGGTTCGGCGGGCCCGGCAGATCTTCCCGACGGCCCTGGGCTA
+TGCCCGGCAGTTCTGGACCGGGATCCAGGCGGGCTTGGCGATTCTGCAAGGGGTCTGGCG
+CACCCTCGAGCCCGCCGCCAGCCTGCTGGGCCGGCTGGCCCAGGGGCTTAGCGCCAGCCA
+GGCGGGCATGGGCGCTGCCAGCGGTAGCGGCCTGGCCCTGGCCGGCACCCTGGTGCTGCT
+GGCGACCGGCCTAAGGCTGCTCAATGCCCTTACCTTCGGACTGGTCGGAACCGTGGCGCG
+GCTGGGACTGGTCTGGCTGGCCACCGGCCTCAAAATGTCTGCAGGCTGGCTGGTTGCCCT
+GGGGCCGGTGGGCCTCCTGATCGGCCTGATCGGCGGGGTGGTTGCGGCGGTGGGGCTGGC
+CTACCAACGGCTGGACTGGTTCCGCAACGGTGTCAACGGTGTCTGGAAAGCGGTCGTGGC
+TGGCGGCAGCGCATTCATCGCCTGGATCAGAGCGCTGCCCCAGACCATCGGCGAGACCCT
+GGCTGGCCTACCGGCGCTGATGCACGAGACCGGCGCCCGGGCAGTACAGGGGCTCTGGAA
+CGGGCTGAGAGCCGCCCCTGGCAGAGTCTGGGAGGCGGCCAAAAACCTGGCTCGGCAGGC
+GGTGGGTGGAAGCCGTGAAGCGTTGCAGGTGCGCAGCCCATCCCGGGTGTTTGCCTCGCT
+GGGCGAGCAGAGCGGGCTGGGTTTGCGGCAGGGCCTGTTGGCCATGCGCGGCGCGGTGGC
+GGGCGCTGGACTGGCCCTGGCCGCAGCAGCCATCCCGGCCACGCTGCAGATCCCGGCCCC
+GGCCGCAGCCCTGGGGGCGGCGAGCCCCCACCGCGAGGTGCATATCCACATTGGCCAGAT
+CGTGCTCGGTCAGGCGCAGACCCCCAGCGAGGCCAAAACCCTGGTGGTAGAGGCCATCCT
+GGAGGCGTTGGAACGGGCCCAGATGGAGGAGGGGGCCTGATGGAACGTGACCAGATCGTA
+TTCGTGGGCACCAGTGGGCAGCGCTTTGCCATCAAGCCCCAGCCCAAGGGGCCGAACGAA
+ATCCAGGGGGTTGTGGCGGTATCGGTGCGCCGGGCTCTGAAGGAGCAGAGCGCCGAGATT
+CCCCAGAGGGGCATTGAGTACACCTACCTCGGCTACGACTACGCGGAGGTCACGGTGGAG
+GTGCGGGTCTGGCGGGAAAGTGAATATGACAAACTACAGCGTCTGATCCAGTTATTCCGC
+CCCAAAGGAAAGGACCAACGGGCCCCCGAGGTTTATCAACCGGTTCACCCAATCCTGCGC
+CGGCACGGCATCACCCACCTCTACATGTTTGCTGTGGAGGAGCCGCCCTACGACCCGGTA
+AAAGGCTGGATGGCCACGCTGAGCCTGCGGGAGTGGAAGCCGGCGTACAAGCGGGTGCAG
+ACCAATGGCACGCGCATCGGAGGCGGCAGTGCCAGCAGCGCGGATACCGGAGGCGCCGAC
+GCCGACCGCGACGGCGTGCTTACCTCCCAGCAGCGTGCCCAGGCCAGCCCGCCCAGCAGC
+AGGGGGGTGCGGCCGTGAGCTTTGCCACAGTCGACGAGCTTCCGATTAGCAGCGGTACGC
+TCACCGTGCCCCGGATAGGTCGCCCCATCGCGGAGCTCCAGCTGGCCGCGAACCGCCTGC
+TGCTGGCGGGTGAATCCGTGCAGATGCGGTTCGCCGATGGCACCACCTACCGGATGGTGG
+TACGCCGCAGTGGCGTGCGCGGGGGCCTGGTGGAGGCGCTGCTGGTGGGCGGCGCGGATC
+GGCTGAACGCCTGGCTGCCCAGCCGCGATTACCAGGGCGTGCCGGCCGCACTGGTGGTGC
+AGGATCTGCTGCGGGAGGCCGGTGAGGCCGCTGGCCTCCTCGAGCTACCCACCGTGTTCA
+CCCGCTGGGTGCGCCGCGCCGGCCCCGCTCATGAGGCGCTACTCCATGTCATGGCCCGGC
+TACCCGACCGGGCCTGGCGCATCCGGGCCGACGGCCGGGTCTGGGCTGGGCTCGAAGCCT
+GGCCGGCTGGACCGGAAGGGGTGGTGGTTGAGGCTGCTCCGGCCCGGGGCTGGTACGACC
+TGCTGCCGCTGCCCAGCCTGGAGCCCGGGGTGCTGCTGACGGCCCAGCTAAACGGTGAAC
+AGCGGCTGCTGGGGAGGGTTGAGCGCGTCGTTCACCAGATTGGCCCCCGGCTGCGCACGG
+CCGTGTACACAGGAGGGTGACGTGCAGGAGCGACTCAAAAAAGCCATTCAGGGCCTGGCC
+CGGCCACCGCACCTGGACTTTCTAGCCCTGTACCCAGCCACGGTGCTTAAGGACCATGAG
+GACATGCACCTGGACTTGCAGGCCGACGACGAGCGCCTGGGTACCCTGACCCGGGTGCCC
+ATCTGGTTGGGCCTGCCGGGGGTTACGGTGCGGGTGGCGGCAGGGGCCCGGGTTCTGCTC
+GGATTCCATCAGGGCGATCCGGAGCGGCGCTACTGTGACCTCTGGGGGGGTGGGGGGCTG
+CGTGAAATCATCCTCACGGCCAGCGTGAAGGTGGTGGTGGACGCCCCCCTTGTCGAGCTG
+GGCGGGAGCGCGGGGGCCAGCGTGCTGCTACAGGGGCAGCCGCTCACGTTCGTGTTCAAT
+ACCACGCCGGTCGCAATGGTGCCGACCGTTGGCACCGTGCAGGCCGGGGGATCCACACGG
+GTAAAAGGGGTGCAGTAGTGGACGACTTTGGTACCGACCTGTCGGTTTTCCCGGACCTTT
+CCTGGACGCTCAAAAGCGGCTACGACAATCTGGCCGAAGCCGCCGTGCGCTGCCTTATGA
+CCGCCCCCGGAGCGCTCTTTTATGCCCCCGAGTACCGCCTGGATCTCAGGCGGTTCCTCA
+ATGAGGCCATCACGCCGGAGGCGCTGCTCGAGGTGGAGACGCTGGCGACGAACGCGCTCG
+AGGCCGATCCCCGTATTGTGTCGGCCGAGGTGCGGGCCAGCTGCCCCGGCCCGGGGGTGC
+TGAACCTCGAGCTGCTGCTAACGACCGAACGCGGCCCGTTTGCACTGGTGCTGCGCATTG
+ATCAGGTGACCGTGGAGGTGTTGCGTGCCTAACCTCAGCCAGCTGTTGCAGCCACGGAGC
+CGTGACGCAGTCCTGGCCGACCTGATCAGCATTTTGCAGACCAGGGGCTACCCTCCCACC
+GACTGGGTTGAGGGCAGTGTGCAGCGCACCCTGATCGAACTGGTTGCGGCAGGCTTGGCC
+GACCTGGAGGCTTTGCGATTGGAGATTGCCAAGGGCGGGTTTCTGGATCTAGCCAGCGGG
+GACTACCTCGACCTACTGGCCCGGAGCGCCTACGCCCTCGAGCGCAAGCAGGCCACCTTT
+GCCCGCCAGACCTTCCGCCTCACCGCCGCGCCAGGCTTTGGGCCCTACAGCATCCAGCCA
+GCCCAGCTTTGGGCGGGAAATGCCGCCGGCCTGCGCTTCAATAACACAGCCGGTGGTACG
+CTCCCGCTGGGGGGCACCCTCGACCTGGAGTTCAAGGCCGAGAGCCCGGGGGCGGCCTAC
+AACCTGCCACTGAACACCGGCACGCTGCTGTTCACGCCCTTACCGGGGGTCACGGTCAGC
+AACATCGGCGTTGTGGAAGCGGCCATCGATCGGGAAACCGACGCGGCCTTCCGGACCCGC
+TGCCGGCTGCGCTGGGCCGAGATCGGCCTAGGGGCAACCCGGGCCGCCTACGAAAGCTGG
+GCGCTGGCCAGCACCCCCAGCATTACCAAGGTGCGCATTCTAGATAACAACCCCCGCGGA
+CAGGGAACGGTGGATGTGGTGGTCTGGGGGGAAGGGGGCCTTGGGGCGGGCGCGGTGGCG
+CAAGTCAACAGCTATATCCAGCAACGCAAACCCCTGACCAGCAACGTCGAGGTGTATGCC
+GCCACCCAGGTCAGTATCGGGGTGACGGCCACCATTCGTCTGCGAGCCGGATTCCTGGCG
+GCCGTGCAGGCTGCGGTTGCCAGCCGCCTGGCGGACTTCCAGCGCGGCCTGGCGATCGGG
+GCCACGGTGTACCGGTCGGCGCTGATTGAAGCTTTGTTTGTTCCAAACGTCGTCGATGTG
+GCCCTGTCGGCTCCGGCTGCGGATACCAGCCTGGGTCCCACGCAGGTGGCCACCTTTACC
+CTGACCCCGACCTGGCTGGAGGTGTAGATGGCAGGAGAGGAGATTCCACTGGTGCCGGTC
+GCCCTGTACCAGGCCTGGCTGCCGGAGCTGGCCCCACCCTGGTTGCAGGGGCCTCGCGGG
+CATGCCCTACTGGCTGGCTGGGGCCAGGCGCTCGACCAGCACGCATCCCTGCTAACGACC
+GCGATACTGGCCCGCTTTGTCCAGCAGGCCCCCGAGGATGCCCTCAACCTGCTGGGGGCC
+GAACGCGGCCTGGGGCGGTATCCGGAAGAGGCCCTGGGCACCTGGCGGGATCGGGTGCTG
+GGGGCTTGGGAATTCTGGCGCTGGTCGGGGACTGAGTTCGGGATGCGCACCGCGCTCGCC
+CAGCTGGGCTACGACGCGGCGGTGGTGCCGGTGTGGACCTACGACGCGACCCGCTGGAGC
+GAATTCGACGTGTACATATACCCCATGACCCGTAGCTACGACGGCTCAACCGCAGAGCGA
+AACCGAATCCTGGGCGTGATCAACCAGGTCAAAGCGGCCCACACGCGGTTGGCAAAACTC
+ACCTATGTGAGCTTCGGTCCACTGACCTGGGATCCTCCAGGCCTCACCTGGGATGCCCCC
+GCAGTATGGGGCGATACCCCGGTGCAACTGTTTCCGTAGGAGGCGTATGCCAAAAACACT
+GAACCCGATTAGCGTCTTTCCGAGCAGCATTGTCAACTTCCCGCAGGCCGGAAACAACGA
+GCCGGTGGCCATCGGACCTTTAGAGGCGGCCATTCAGGCGGTGCTGAACCGCACCGAGCA
+CCTCCATCAGAGCCGCCTGGAGGTGGAAGGCCCCGGCGTCAAACGCCTCCGGCGGGTGGC
+CACCCTGGCGGCGCTGCAAAACCTGACCGGCATGGCCGATCTGGACGTGGTTGCTGTGGA
+CGGCTACGGCCTCTACCGCCTCTTCGACCCCAGCGCCCTCACCGCCGACGGGCTGTGGGT
+GTTGAGCGCGGCTGGCGGTGGCCGCTGGGTGCACAGCAGCTACCTGATGCGCGGCATCAA
+CAACGGCTGGGCCATGCTGGACAGCAGCGGTCGGCTGGCCCAGGACGTGCGCGATGGCTC
+CATCCTCACGCAACACATCGGCAACGGCCAAGTAACGGGGCCGAAGCTGGCCACGGGGGC
+CGCCGTTGCAAATCTCGGCTATACCCCGGTGAACAAAAATGGGGACACCATGACGGGGGC
+GCTGACGGTGACCGCCAACGTTGGCGAGGCGCTCAGCCTCAAGGGCGGGAGCAGCAACCA
+CGTATACCTCGGGTTTTACGCCCGCAGCGCTAACCAGAGCGAGCGTTCTGGTTTCATCGG
+GTACGGCAGCTTCGGGAGCAACAGCCTCGACATCGTCAATGAGATTGGTGGGCATGTGTA
+CATAGCTTCTGCTCAGATGGTTGTGAACAGCAACCTGAGTGTTTTTGGGCAGATCAACGG
+ACGTTACAACCACGCCGAGCGGTTTTCCGTGTGCGCTAACGCGGGCAGCGACATGGTCTT
+GTCCCCAAGCGTTAGTGGGATTATTGCCGAGCTCAACTTAACCTTACCGGCAGGCCGAAA
+GTTGTACTTGCGGCGGCTGCGCCATGCTGGCAACAACAACTTTCGCGCGCATATCTTCAC
+GACCGGGCCGGGCAGCAACCCCTACCTAGCCCCAAACACCTCGGAAGAGCTGAGTTTAGA
+TTATGAACTGAAGAATGTAGCAGAAACGTTTACGCTTATGCTAGCGGTATTCAATGCATC
+TACTAGCAATCAAACAGTTAGCCGAACCTGGTCTGTCTGGGCCGAGCTGGAGATCCGTTA
+A
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_014363.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_014364.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_014364.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2212 @@
+>NC_014364.1|provirus_2121424_2157334
+TTAAGAACTTTTTCTATATCTTCCTTCATTTAGTTTTATGCTTAAAAGGTCATCATATTT
+ACAATAATAATGATTGAAGAAATCTTTATATGTAATAAGTATTTTATCAGGAATAAGTGA
+GAGATCATAATTTTCAATGTAACCGATAATTTCAGGGTCTTCTTCCTTTATCTCCCTATA
+GAGGGACCTCCAATTATCAGTCAACCCTTCTTTTTCAGCAATATCACGTAATAAAATATA
+TGAATCTGGCATATGTAAAATCTCAAAGAATTCTGAAATATTTTTTCCAAAAGCTCTTTC
+AAAAAATGATCGATTTCTTCCGACCTTTCCCTTTGTGGAATTCAAAATTAGCTGTATAGC
+ACGTATGTATTTTCTATTCCAGTTCTTTCCGATATATTTTCTAGTCTGATATAATTTTTG
+TTCATCATTGATTGGAGAATAACGCATTGGAAAAGAATATATAATTAAATCAAATTCTTC
+ACATAATTTAATATTTAATTCTAATCGATTCCATAAATCTTCTGGTTTATCTTCAAAATT
+ATATAAAAGATAATTAGATAGATTACGTATTTTATATTTTGCAGATAACCTAATTGCATT
+GATATAAATATCTCGTAATGACCAATGATCAAAAGCAATTCGTAAGGGTTGGATAGCAAT
+TTTCGAAAGTAGTCTCATATTTTCTTCATTACATAATCTTGAATCAATACCTTGATTAAA
+GTCAACTGTCCTTTTTTTATAAGTTATTTTCCTAATATCAAAATTCCTATCGAGTTCTTC
+AAAGCATTGAATTAAAGAGAAAGAATTCGGAACGAAATTGTCGGTTTTAAAATATTTATC
+TAAGATATCCGAAGCAATTTTTTTATTTGAAAGATTTAATTGCTTTACGAAGTTTAATAT
+TTCTTTCCAGAGAGCAACTGAATATTCAAAACTGTTAGTCCCTTTTTTAAGCAACAAATA
+AAAACTATATAGTTTAGTCTTCTGCTTTAATTTAGCACCACGAAAGAATCCTACTTCAAT
+AATATCATTTATGATATCTTTAAAAAAAGGTGATGCTAGAACATTATTATCTAATAAAAG
+AAGCTTTCGACGAATATAATACTTACTATCTATCTCTTTGACAGTTTTTTTTATATCAAT
+ATATGAGACATAATCCGGTTCAATGATTGGTACAGCACAGAATTTGCATTTTCGTATACA
+ACCTCTAGTGGCATAGGTTATATAAGAGTCCCATTCAGGATAAGTATAAGATATTTGATG
+AAGAATGGAATAATCTGGAGTAACAAGGTCTATATTGTCATTAGTTGTTAAACCAATTCT
+TTTAGAATCAGTTAACAAACCATTTACTACCTGTACACCAGTTATATTTTCTATTTCTTC
+TGATAAAACAGAAGCCATTACACCACCAACAAACATATTGCTACTGTTCTTAATGTAAGG
+CTTTAATTCCTTTATAGAAGAAATAGTTATATCCCAGTAGAAAGTGAATAAAGTTGTAAC
+ATAAATTCTATCCCATTTCAGATCATCTATAATTTTATTTTTGCGAGCATCACGAAAAGC
+CTTTCTTAACCAACTTTCAATAGTTGGAAAGAAAAAACCAACATTATTTTCAATTGCCTC
+TAAGTATATCGTTCTACCAGTCTTTAGATAATAAAAGACATTATCCAATATTGTTTCCGG
+AATAATATCATTCTCAATTTTGGTAAATCTATCTACTAAATAGACAGAAAGTTGTTTTAA
+ATAAACCTCTTTAATGTTACCTTTGACAAAGATAACTTCATCACCTAAAGTTTTATGATA
+AGAAGATAATTTCATTAACCCAAGTGGTGGGTATTTGTTTTTATATCTAGGTTCGTATAG
+AAGTATTCTTTTCATTTTAGCTTCATTTTTATTGCAAAGATTAAATTTTCAGCCACATCG
+CTTGTCATCGTCTCATTTATTATAGCAAAAACTTTTGATAAAAGTTTCTTTTCTTTTCTA
+TCTAATTTGCTTAGATCAGAGACAGCATATTTTTTCTTTTCGTGATTATCCTGGCTTTCA
+TTAGTGATAATAGTATTAGTGCTAATTCGTGGCGGATAAACTTTCTTAATGCCGTCTTTT
+ACAATTTTTGAGCTAATTCGTTCTATTCTATGGTCAAGGTCATTTCTTTTCTTTTCTAAT
+TCCTCATGTGTTTTAACAAGAGCATCATATGATGACTCTTCATGCTTTTTGTTTATAAAA
+CTATTTGTTTGTTTATTTTCATCGTATTTGCTCTTTTGTGCATTATAGTCTTCACTTGCA
+TTATTCAGAGAATTAATGTCAGAAGCAAGTTTGCATAAGCTATTTAGGTCTTTAATGTAT
+TTTCGAGTTTCTCGCATTAAAAATCGAAATTCTGGAGAATCTTCAAAGTAATTACGTTGT
+GCGTTAGGTATAATCGTATTCTCAAAAATATGTAACTCACCAATAAAATAATTAACAAAC
+CTTTCTTGAGGCTCAAATAGTTCTCTTAAAACATCGCTCCTTCCGATCTGAAAATTATTT
+TGCCTAAATTTAATACCTGGATAATTTAGTTTAGGAATTAGTTGTAGTTTTCTTGTCAAC
+GCATACCAGCAGAAAGCAATAATTTTTGAATCGTTATATATGACAAAATGATTAATATCA
+ACTATCTCATCATGTTTCTTTTTTTTGTTTGAAGCTATTTTATATATGTCAGTACCATAA
+TTTTTTTTGACTTCTTTCTTATTTACTATAATATAATATTCTTTTAATTTTAGATTATAG
+TTATCAAGGAAATTTCGTATTTTAGTTTTAAATACAAATTTTGAATCAAATTCAACTGGA
+CAAACTTGAGAAATATATTCAATAACTTTTTGCTCTTCCAATAATTCCTGATTATTAACA
+TCACTCAAAATAACTTCGAAATAGTGTTTGTCCGTATCTTCTTTTTCTGTAAAAGACTCG
+GTAGTGTTATTTATAAGATCTATGGCCTCAATCATTTTATCAGCGCGTAAAGAATCACGT
+ATCTTTTGAGCATCCCATCGCAAAATGGAAGCAGTATTTTCTCCATAATATGAGCTTTTC
+ATAGTCAGGGTAGAACAATAGGCTATGCCGGCGAGTCTTCCTATTCCACGAAATCCAATA
+TTTGAATCAATCTTTTTAGTTGATGCAGCAATACTAGTCAGGGTCGAATAAAAAAGACTA
+CTTTTTAAACCAATTCCTGTATCATAAATTGAAATAGCTTTTTCTTGTTTTTTTATTTCT
+ATATATATAGGATTGTTGATGTAATTGTCAAATATTCCTTTTATTTTACAAGCCTCAATT
+GCATCAACCGAATTTTGAATGTATTCTCTATAGATTATTATTGGATCTTGATACATACCT
+ATCGTTAATACATCTAATAAATGCTTTCCTATTTTTATCTCGTCTTTATCCATTCTTTTG
+GTCCTCTATTTATCAAATTGGTAGAAAAGTGGTTTGGGGAATTTAATCATCAAAGGAGAA
+GGAAAAATCGGATTTGTAATAATGTACTCGCCTTGAACCAATCTTGTCATAATATTCTTA
+TATGTGGAATTGATAAAACTATAGTCTTTATTACTTATTTCAATACTATTTGTTCTACCA
+TAACAATTAGTTGAACAGTTTCCTTTTACACCAGCATTTATTGAACTTCGAAATTGCTCA
+GCACCGAATAATACTAAACCTAACGATCTTCCCCTCTCTGTAATATCAAGAATATAACGA
+AGCAAAGGAGAGTTTTTTGGTACATTACTTCCTGCATGCTTATTAAGTTCATCTACAAAG
+ATTATGATACGGTCAGGAAAATCTTCTTTTAAATCTACCCCTTCAAGTTTTGCTTCATAG
+ATGTTTTTCAGAACATCACCAAAAACAAAAGATTGCAAAGTTTCATCTAATTTTGCAATA
+TCAATTACATAAACATTATTTTTCTTTAATTCTCGTAAGGAATCACATAGATGAACCTCA
+TTTTTTTCTTTAATTGCTCTATCAGAGAATAAAGGATTTTTTAATGGCTTTGATATTAGT
+CTTTTGTATTTTTTCCAACTACTAACCGCAATTTCCTTGTTACTTCTATTCTGCTGGCTC
+GAGACACAAAAATCACTAATTCGATCACGAAAATTGTCCCATGTGGAAATATTTGAGAAT
+GGTCCATTATCATCAAGAATTAATTCATTAATTGATTCCATAGTCCTTGTTTGATCATCA
+AAATTCGCAAACAACAATTCTAAACTTTCTTTATCATCCTGAACTGTATATTTAAACGAA
+TTATAAATCCCCTCATTCTTTTGATCGTTTATCAATTCATCAGTTGCATATGTATTTCTT
+ATAATTGCGTTTGAATGGGGATAGAAATACTGAACATTTGAGAACGGTGTAGCATTGATA
+GAAAGATCAGAATATAGATTTTTGTCAAAAATATCTAATGTTTTGTTTTCTCTATCAATA
+CACAAGAGATCCTTTCCTTTTACATTAAAAACAATAAATGCTATTGATTCATTGTCGGTA
+TTAGTTCCTGATATATATTGGTCTTGCAATGACTTTAGTAGAAACATGCAATAGCTGGTT
+TTGGCAGCAAGCCCAGAAATTCCAGATATATTCAAATGAGCCCCTTCTGGTCCTATTAAA
+AACCTTCGGTCTAATTTAACTGGAATGAATTTTTTTTCTTTATCCATTTTTTCATACATT
+TCGATGTAGCCACAAGAAATTGGATACTTTATGTCATTAAGTCCTAATGCAAAAATAATA
+TCATCTTCACTTGCTAAGAAAACTTTTGAACCGTCTAGAACAGGAAGATATATTCCTTTT
+GTATTTCTTAATACTTTGCACTTGACATAATTCATACTGAGTCGCTTGGTCAATAATTTA
+GCATCAGTATTGCCAAAATCATTACTGACAAACGCGCCTAAATAATTAGGAGTGTCAGTA
+ATATGAAAGACATCTTCTACTATACCATATGTAATACTGTCTTTCTGATTATCCACTCTT
+ACAACATCAAAGGCTTGGAGCATAATATTTGTGTTCGTCCAAAACACAAATTCATCATTA
+GTACATGGTTGTTTCTCAGTGGCTGTAATTTTCCCAATAGCAGTAGAAGTGTCCATTATA
+ATACCTCTATTAAAAAATATTCATAAAATAATCATCAGAAATGAAAGTATTTTTAAGGAG
+CCTTTCTGTAAGATGGACTGGATATAAATGATTGGGCCATCGGTCCTCAATACCATATGT
+AGTAGGTAATCTTTCATTGATTATATTTGCTGAGATCATATCTATTTCTTCTGAATCCAT
+TAAATAATTCTCACCATCTTCTGGTACAACCTTCTCGATTTTTACAATACCGTCAAATGG
+ATTATGGTTATAAGTCTTTTCACGGATTCTAATATACCAAGTGATAAAGAAAACAGGCCC
+TTTAGCCCCTTTGGACCTTTTACTTTCGTATTTATATGAAGGCGTTCTATGATATAGTGG
+GAGGTCCGCAATTAAAGATGCTTGTGTTTTTTTCCTGTTATCTTTTAAGAAATCGGGATT
+AAATGTTTTTGATACACCAATAACTCTTTTGTAATTATTTAATAGCAATGAGAAATCATT
+AAAGTCTCCATTTTTCGAATCGATATATTCTATTGAGCCATCTTTTATTAAGTAATTATC
+AACATAACGAAGTCCATCATCATTTACTAATATGTTAATCATTCTTTTTTCTTCATCAAG
+CATAAATTCATGTATTTTTGATATCCCTAAATTCTCGTATGGAATATCTTTTTGCAGATG
+CAAATCTTGATTATAAAGGAGTACTTTATTGATAACGATATTTTGTTTTTTTAGCGTTGA
+AGAATTATTTATTTGAGTTCTTAGATATTCTATCGCCGTTCTTTTATCTTTACAATCATC
+GATCAAAGACACAATTGCAATATTAGGTAGTGCAATTACATTGTATCTATTTAACCTTTT
+ACATTTTAAAATTCTTTTATTTCTTTCACAACAAGCAACACCAACTTGTCCAGCAATTAT
+TGGATAGATACTCTTTTCATATTCTATGCTTGTCAACTTGTAAGTCTTTCTAGAGCCATC
+AACAAAATATTTGAATAATGATTCACCATCCCGGAGAAATTCTTTTTTCATTCTTGATCT
+TAAATCAATGGGATTTGTATAATCAATTTCTTCACCTAAGTTTCTTGTTGAGAATGGAAT
+TTGCTCTTCTGATGAACTATGAAAAGCTATTGAATGTTCATCATTATAGCAGAATTTGTT
+TATATTATAGATTTTACCAATCGTCAGCTTTGCTATAATAGAAAGCGCTCTATCTATCAT
+TTTTAAAAGTCCTAATACTAATTTAGGGAGAATAATTTAAAACCATCCCTCCCAAAGTTC
+TTAATTTCTACACTACCGCTTACTATTTAAGTTCTAATAAGTTTTTACACTTACATTTGT
+TTATTTTAAGTGTCATAAGTATATAAATCAATATCTAATAGCTGCTAATCTGGAAAATAC
+AAGATTTTACATCTTTGGGACCCTACGCCTCCCTCTTAATACTCTGTATAGATCGATCTG
+CTAGGCTGGAAGTCAATGCCTTCACCGTTTCTAAGTCCTTCTCGTCCAACATTTCCAAGT
+CAGCCACGATATTTGCATATCGCTTTGGCGGCTGCCAGTTATCCGGATTTTTGCCGGTTA
+CCAGGTATTCTACGGTAGTATCCAACGATTGGGCAATTCTTACCCCATCATCAACACGCG
+GTAATCGTTTTCTTGCTATCCACCCTCGGAAAGTTTCAAAGCTAATATTCGAGTGATTAG
+AAACCCATTCTTGAGTAGTATTTTGCCGCTTTATTTCTTTTTTGACTATGTCCCAAAATC
+CCATACATCTATTATCGTCTAAAAATGTTGTCAAATGACGCATGTTTTTCTTGACAAAGT
+TGTTAAACGGCCATAATATGCAGTTATGAAAGTTGCTAAACGACAACAAGATAGTCGTTA
+CAAGGTGTCTATTCCATTCAGCGAAGATGAGAGAAACAGATTTGTTACCTTCCTCGAATC
+TACCGGCCGAAAGGCTGGACCCTATCTAAAAATAGAAATGATGAACCGTGTAAGGGAATG
+GGAAGCTATCCAGTCCGGCAAAACACAACTCAATACAAAGCCATTTGAGAAAGTAGGGGA
+GTAGTCATGGGCATAAAAGATGCCGCTGGCCAGTTAAAAAAGTCAGAGGCCGTGAGATGA
+ACATTGACGGCCGCCTTGAAGCGATGCTTGAGATTATCGAGCAGACACTATCCGAGATCA
+AAGAGAGAGAAGAGCACCTGGCTGGCGTATCCCATGAGATCGAACTTGCGACCAGAGATA
+TCGAAGAGTTACGAGGGATCACCGGCAGCTTAGCCGAGATTGTCGAATCAGGGAAACGGA
+TCGAGTGGATGACAACAACCGAAGTGGCTGACGAGCTTCATGTGAATAAACAGACCGTAA
+GAAGGTGGGCAGATACCGGGCTGCTTAGATGCTACCGGATCGTTAAAGAAGGGCATCGGC
+GCTTTGACCGCCGGGAGATATACGAGGACGTGAAGCGGATGGGAGATGAAGGTAACAAAC
+AATGAGATCAGAGCAGAAACAAGGAGAACAGAAATGGCGTTAAACGAAGACAATCAGCAG
+CTTATAACGCTCATTAACGAGCTTGATAGCAGTGGGTACCTAATCAGAAAGATTTCTGAG
+CGGCCTTCATTGTGTCCTGTAAGAGAATTCGAGCTTCTTATTGAAGAAAAGTCCAAGAAA
+GATGATCTCCGCGGTTTGAGTGCTGCCGCGATAGAAGGATAGCGTTCGTTTACGAGGGGT
+GAGTGAGGTTCGGTCTTTACTGGCCTGAACCTCAGATCAAGGATCTTTGAAAATCAATGA
+CTTGTGGATAGGACCTTATCTGCAAATCACGGGGTAGAGAAGGGAAAAAGAGCAGGTGAG
+GGCGTTGGTAGCACCCTCACTAATCCGCGTTCACACACAACGCAAATCACAGACAAAGCT
+GCTGCTCAATACATCATATCGGCAGCTTTATAGAGGAGATAAATCGTTGAATAGTCCTAT
+TTCGTACATCGGAGGAAAAAGCAAACTTGCGGATACTATCATCAACTTTATCCCGGAACA
+TCAAACCTATGTCGAGGTATTTGCCGGTGGTGCGTGGATATTCTTTAGAAAGAAGTATTC
+GAATGGGGAAGTGCTCAACGATAAAGATGGCGATCTGGTATCTCTCTATCGGGTGATTCA
+GAACCACCTCGAGGAGTTTTTACGGCAGTTCAAATGGATATTGACCAGCCGCGAAGTCTT
+CGATGACTTCAAGGGCCAGATGGAAAAAACCGGCCTTACAGATATCCAGAGGGCCGCACG
+GTACTACTACTTACAGCGTTTGTGCTTTGGGGGGAGGGTACTAAACCGAGCTTTTGGCGT
+GGATTCCACCTAAGCGGGCGAGCAACGAAACCGGCGGAAGCGGTTAGAGAGACATTTCTG
+CATCAAGGCAGCTATGCCAGCCTGGCAAAAATAGCAACCAGTGAGTCTGCCGGAAGGCAG
+ATGAGAGGATACGCAGTGAGCAACGTTACGTTGGGAGAGCCTGAAAAGGTCATAGGTTCG
+TCCGGTTGTCAAATCTCCAGATCGCTCACCTCCGGGCCAAACCGGACACTGGTTAAAGGC
+TGGATGGTTTCGCATCCCGTTCAAGACGGCCTTAATAAATGTCTACCAACGGGAAGAGTC
+TACGTCAGTAGCTACCGAGCGCCGGGGAATCGTGGCGCACCTTGGGACTGTGGCGGAGAG
+GTTTATCGCACGTCGGATTAAGTTCCGGTCGAGTCAACGGTGCGAGAGTGGAGACTCGTA
+ACGCAGGTTCGAATCCTGCCGGTCCCAATACGGCGCCAACCACACGCCGAAACCACGAGG
+ATGTGGGGGAAACATGTTTCACAAACGGCTCTCTCCGGAGAATGACCTCCGGGGAGAGGA
+TTTCATCAAAGATCAATGCGAGGTGCAAAACATGAGCAGTACAGACATGAAAACCGCTAC
+CGAACCGGTAGCGGTTAGAAAAAATAAAAGAAAGGTTGTGATGAATCACCCGAAAAGTAG
+CACTATCCGATTCAAAAATCAGGAAATACAGGCAATTGATGAACACCTTGAGTCTATGGA
+CCATCTCATCCAGGACCTCTTTAAGAACGGTAACCGGGCAAACCGGGACCTCTTTGCCAT
+GAGGCTTGCAACCCTGGTGCGGGTGATCCGGGAGACCCTCAACGAAGGGGTGCTTGAGTG
+AACGATCTGCAGAGCCAGGACGTGGTTTCCGAGAACAAGATCATCCAATACATGGAAGCT
+TCGGGAGTCGCCTCTAACCTCAACGATCATGAAAAACGGCAGTTTATCGAGGTGGCCAAG
+GCCTACCAGCTGAACCCCTTCAAGCGTGAAATATACTGCGTGGCCTACGGGCAGGGAGAT
+AACCGGAGGCTGTCGATCATAACAGGCTATGAGGTCTATCTCAAACGGGCGGAGCGAACC
+CAAAAGCTTGACGGGTGGGGTGTTGAAACGGCCGGATCGATCAGAACTCGCTCTCTCAGA
+GCCATTGTCACCATTCACCGGAAGGACTGGCAGAATCCCTTTGTACATGAAGCGTGGTGG
+ATTGAGTACAGGCAGAACAACCGGATGTGGAACGAGAAGCCGGTAACCATGATCAAGAAG
+GTGGCCATTGCCCAGGCCTTCCGGTTTTGTTTTCCCGATGAGTTTGGAGGCATGCCGTAT
+ACCGCAGATGAGCTTTCCGACGAAGAGACCGGATACCGGGATGTTACCGAGGAACATAGT
+GAAATACAGAAAACTCCGCCGCCGGTGCAGGAAGAAGCTACCAAGGTTCCGGAGCACTCC
+GAGGCTATCCCTGAGGATCCGGATGCAAAGGTCAGGGAGGATTTCAAACACAGGCTTGAC
+GGGGCGTTTCTCGGGAAACTGATTACCAGGGACGAGCGGAACACGATGGTTGCAAACAGC
+AAGAAACACTCGGGGAAGACGCTCGACTCTTACATTCGGATGGTAGAGAAGAGGCTCTAT
+GGTCAGCAGCAGAGGGCAGGGCAGGGGCCTTCTGGATCGGGCTCCGGGGATCCGCAGACG
+TCGGTGCCTGAAGCGCCGGAAATCTATTGAGGAAAGGTGCATGGAATCATGAAAGAACAC
+GGAATCATCTTCAACGCCGATATGGTCCGTGCTGATCTTGCCGGAAAGAAATGGCAGACA
+AGACGGCCTGTTAAACACCAGTTTTGTCGATCAGAATACGAGCCGGAGCTCATATCGTGG
+TGGGAACAGAGAAAGCATGAAACGATAGAGTGTTGTGGTAGTTTCAGTGAACTTCAAAAG
+CATGGCCCGTATGGAGGCGTCGGTGATGTGCTTTGGATCAGAGAGACATGGAGAATAGGT
+GCATGGAAATTTCAACCTCATTCTTTTGCGATTGATTACAAAGCAGATAATTATCCTCGT
+CAGGAATGGTTAAGCTGTAATGACGAGCTTATGTTTCTACGGTTATTTGCACAGACGGAG
+AATGATGCTTACAAAAGAGAAATATATCCTAATGGAAATGGTATCTATGATTGGAAACCT
+GGACATTCTCCTGCAGTATGGCGCCCGTCAATCCACATGCCGAAATGGGCCTGCCGGACT
+AAACGCCGAATCACCGGCGTGCGATTACAAAGAGTACAGGATATAAGCGCCGAGGACCAG
+GAAGCCGAAGGATGCGGCCATGAGTTTGCGTTTGTCTGGGATGCTATCTACAAAGAGCGA
+GGCCTCGGCTGGGATGCAAACCCCTGGGTTTGGGTTTACGAATATGACAATACGATCAAT
+CGGGCGAAAACGTCATGAGTAGTCCCCGGACAATCATCATCCCCGCGGCCGAGCGTATCA
+AAACCGGCGAGCGGGGAGTCGTTTCTTTTCGTGCCGGTGAGACTTTCGAACAATACCTTG
+TGCACCTGTTCCGCTACCAGGAAATCGAAAGACGCTCTCCGGCCCCTTACTACTGGCTGG
+CGATCGATGTACCCCACCGTCCCCGGACAACCGGGCACGGCAGCCAGAACCACCATATCA
+ACGGTCATTGTCAACAAATCTCAGTGGAAACCGGCCAGCCCTTCGGGGATGTAAAGCGGC
+TTGCAAAGCAGTTCGCCGTTACCATGGGCTACCCGATCCTTGAGGACGAGTCCGGGGAGC
+CCATACTCGACCTGTGGGGAGATATCCAGGGGATCAGCGAGAGGAACTGCAGTACAGAGG
+ATGCAGCTATTTTGATTGAGGCGATCCACCAGATAGCGGCGGAAATGGATGTGGAGCTGA
+TCGAAGTATGACAGAGCGGCAGGAGGCTATAACGTCAGCTGATATGTGGTTTAGCCGGTA
+TATCCGGGCCCGTGACAGGTGGCGGTCGGTGACAAGCGGATGTAAACGTAATCTGACCTG
+TTCGCACCTGTTCTCACGAAGATTCTACGCTACCCGCTGGGATGAGATGAATGCTTATTG
+TCAGAGCGCAGGGGAGAATGAAGAGCATGACCGGAATCCGGGGAAGCTTATCTGCTACTT
+CATTACGCTTCACGGAGAAGATGCGTACAAAGCGCTTTACCTGAAATCGAGGTCCGGCGT
+GAAGATTACAACGGAAGAGATTCGGACGATTGCACAGTACTACCGGAAGAAGTACGAGGC
+GATCACACAACAGAACCATGACTTTTTTGGCGTTCTTTAGGGAGGAACCATGGCAAACGA
+TATTACCAGTTTCACGGCGGTCGGAAGGCTTACCCGTGATGCAGAGTTGCGATATACGAA
+CAGCGGAATACCGTTGTGTAAGTTCAGCATAGCATCGAATTACAGCAGGAAGGTGCATGA
+TAACTGGCAGGAGGAAGTCAGCTATTTCGATTTCACCCTATTCGGGAAACGTGCTGAGGC
+GCTTGCTCAGTATCTCACCAAAGGTCAGCAGGTGGTGGTTTCAGGACAGCTGAGACAAGA
+CCGGTGGGAGGACAATGGGGAGAAGCGAAGCAGGGTAGCGTTCTTTGCCCAGGATGTACA
+GCTGATTGGGGGAAAACCTGCCGGCCAGAGCAACCAGCAGGGGCAGTATGGAGAGGCCCC
+CTATCAGGGACCGCCGCAGAACCAGCGGGGCGGCTATTCCCAGCAGCCTCCACAGCAAAG
+GCAACAGCAGAATTCCCGGCAGGGTCAGCAACGTCGACAGGGGCCTCCGCCTAACTCCGG
+GTATCAGAAGCCGACAGGCGGCTATGATCAGTGGGGCTACCCGATAAACCCCGGACCGAA
+TAATCAGGGCCCGGATCAGGAAATGGACTTCGAGGACGACATACCCTTTTAAGGACAGGA
+CATTATGGGCGCAAAAAAAAGGATGATAGATCCGGGGATCTGGACGGACCCCAAGATCAT
+GAAACTTTCCTCGGTGTCGGTACTCATCTTCATCGGGATGATCTCGAATGCAGACGATGA
+GGGAATCATCGAGGCTGAACCGGATAGCCTGTACTTCAGGCTGGCACGAAAGGACATCAC
+CATCGATATGATCAAAGAGGCCCTGGAAGACTTCGGGGCCTATGGTCTTGTCCGCCTGTA
+TGGCGGATACGCCTTTTTCCCGAACTGGTTCAAGTATCAGAACCTGAAAGGACGAAAGCC
+GCAGGAGACGAAATTCCGCCGGCCGCCGAAAGAGTATCTGACAGACGAATACCGGAATGA
+ATGGCTTGAGACCTTCAGGAGGGGAAGTGAAGCCCCGTATCCCTTTGAGACCTGTTTTTC
+CAGCGGTGAGTCACCGGTGAGCAACCGGGAAATGGAGGACAAAGAGCCTGCGACAACCAG
+TGAGTCACCGGTGTGCTACCGGTGTGCTACCGGTAGTGCACCAGTGACCACAGAAGTGAA
+GGGAAGTGAAGTGAAGGGAAGTGAGACTAGTATGCCTGCGGCAGCTTCGGCCGAGCCTCA
+GCCTGAGCGGGACGGGGAGGTTTCACCATCGGAGGAGCCGGAACCCGATTCCCCGGAGCC
+TGTTTTCAAGCTCGAATGCCCGGAGCCGAAGAAGCGCAAGGGGAAACCTCCTACCGCCGG
+GAAAGAGCCGACAGACCCGCTGTACCACTCGATCAAGGATTCCTTCCTCGCTGTTGTCGG
+GGACTTCTCGAACTGGGGCAAGGAAGGCAAGGCGATCCACGGGATCATCGAGAAATGCTC
+ACGCGCCTCACCGGAAGACCCTTCGGGCTGTGCCGAGCGGATGATAGGCGAGTTATGGCG
+GCTAAAGAATTCGGGGGATCGGTTCTACCGAGATCAGCCCTTTGTGCCGTCCACCCTCAA
+CGCCTCGGGAATCTGGGACCGGGTTGCCGAGCAGCTGAAGGTCACGGCCGACGAGCTGGA
+AGGTGTGAGGATGTGGGAAGCGCTTGATCCCTACGGGGTGAGAGGCAAGGCAAAGCAGGC
+GGTGGGAGGATAGGCGTATGCAGTGGAACAGCAAAACGTTTATGGCGATGTTGCAGCAGT
+ACTACGGCAAGCTTTCGCCGATCCACGCGGGAGCGCTTGTCGACTGGCTCGATAGCAAGC
+AGTTTTCGGGGGAGTATCTCAAGCGGCTGTACCAGGAGATAACCGAAAGCTACTCAACGA
+AGTACGGGCGGCCTTGTGATCTGGCAGTTGTGAAGGAAACGCACATGGCCCTTGCGCCTT
+CGTATGTGCCCCCTGCCCGGCAGCTTGAGAGTGATCAGCGGATGATTGGGGAGCGGATCG
+TTGAGCGGGAGGAAGGAGCAAAGCTGTTTGCGAGCATCATCGAGAATCTGACGAAGAAAA
+AACGGAAGGTGAAACCGGAGAATAAGTCGAGGAGAGTGCGGAATGACATTCACAGATAAG
+TACCTGAAAGAAAGGATTCCGGCGGTAAAGACGGTTTTCAAAGGGGATGATCCTATTGAA
+AAAGAAATGGTACTTGAGATAACGGACTATGACCGAGGGATCATTGAAATGAAAGCCGGT
+AATGCGTATTACCGGTTTCGGCATGTTGATCTTGAGCGAGCCGTTACATCGATACAGGTG
+CGGCAAGAGGTAAATGCATGAGCGAGTATGGTGTAAGAAAAGTTTGTGGGAATTGTAGGT
+CCTTCGAAAAGTGCTTTGCCGAATCAGAGGAGCTTATCGGAATCTTTTCCTCCGGTTGTC
+TTGCGGCTGATAAGGAGGAGACGCGGCAGATGCCTGCGTGTGGAGACTTTGAGCCGATGA
+TGAAGCCGGTACCGCTGTCCGGGGAGTAAGGGTGCTGGTGTTGGGAGGGGCAATGAGCAC
+GATGATATCGGCGGATTGTAAAGATCAGCGGGTGGCTGACTCTATCCGCTGGCTCTTGTA
+TGAGCTTGAGAAGGCGAAAGACGGCGAGGTGGTGGTGTCGTTCTTCGTGAAAAGCGGGAA
+GGTCCGCGGTGTGGAGAAAGTGGTCAGGGATAAGAGTATAAAACAGGAGTAAGAGCATAC
+ACGGAACATGTTGTGTGAGAATTGGGAAAAAAGCTACCTGTATATTATTTTTACAGGTTT
+CCGCTATTACATTATGGCTGTATTATGTGTATAAATTTTTTAAAAAAAACCAAATTAAAA
+GGATGGATAGAAGAATGAAGAAAATCTGGATTATTCCTGTGTTGCTCCTGTCGATAGGCC
+TCGCCGGATGTAGTATGTTCGGAAACGACGGAGATGATGACGACGATTCCTTCATTGTTG
+GTTACTGGGTTCAAGAGTCGTTCTCTCTCCCCGATACTGATGTCTATGAATTTGCCTCAG
+GTGGGACTTGTGCTGTTTATGCAGACTATGCAATGAGAACCGTAGATCTTGAAACGAACT
+GGTCTTTATCTGGCGATACATTGACCATCATGGGAATTACAGGAACAATAACGAAGGTCA
+GTGAAAATGAGTTTCAATGGAATACTGAACTTGGTAGTCATGCTGTTTACTATCGCAAGG
+GCTACGAGCCTGGTGGGTTTGCATTGGATGGACCATTTACCGAGCTCACTTTAGGAACCG
+CCTATGAAGGGGAGTTTACCGAAGAAACTGATTTCGATGTGTTTACTGTGGCGGTAGAAG
+ATGGGGCAAGCTATGAGATTTTCTGGGAGGATAAATATGATCATGGTGCTTCCTCCTATA
+GTGGAGCCATAGTGGTTTCTGCATATGAGGCAGATAAATCAACCGATTATTTTACGGGTG
+AAAGTACTGGATATCCTATGCCAATGGCTGTTACCGCTAGTGGGACTACCATTTATATCA
+TTACCCGTCGTCCGGTTTCTTTAAAGCTGTCAGGAACCTACAGCTTGAAAGTAAGAAAGG
+TGACACCATAGTAGGCATATTTCCTAAGGCTCTGTGACAAAGAGTAGATATCGGGCATAG
+ATTCCTCTATGCCCGTTTTTTTATAGTTTCCCCCTTGATGCAAAAATTCTTCCGTGATAG
+AATTTTTTTTGTTAGATAACCCAAGGTAAGGATGCTTACCCTGGCCGTTCCGGACGGATT
+CCGGTCGCTCTAATGGTGCAAGAAGCAATCAGGCGGCGAAGTATCTTACGTTAAACACTG
+TGACAGGTGTCTTTCGTGAGCTACTTCGTCGCCTTTTTTTGTGCCCTTTGGCTTTGACAG
+AGGAGAGGACGAGAGACTATGGGAAGGCAGGATAGACGGAAGAGTTCAACACAGCGCGGG
+TATGGAGCAGCCTGGCGGAAGATCCGTATCGAGGTCCTCCAGGCCTGGGGCATCCCGAAG
+CGGCTATGGCCGAAGTATGATGTGGACCACAATCCCGCCTATGACCGGAGAATCGAACCA
+GATCACCGAAAGTACCAGCTCATCCCTCGGCTTCATGCAGATCACAGCAGAAAGACTGCG
+AAGTTTGACAACGGCTTTGGTAACCGGAAGAAGAGAGAACCTCGTCCTGTCTCCCCTATC
+ATCAATCAGAGCACAGCCCGCCTTACGGAGGGGGGATGTAAATCTCTGAGGGAAAAATGC
+CCAAACCACGCGCCTATACAAGAAAACACTCTGTCAGCAAAGGCAAAGGGGGTATAGGCC
+ATGAGTCGAGGCGGACACAACAAAAAGCCGACTATTTTAAAGCTCACCCATGGCACCTTT
+CGGGAGGACCGGGCCAACGAGAAGGAGCCGGAAGTCAAGGCACTTGATGAGACGCCCAAG
+GCGCCGAGCCACCTTAACAATTTTGCAAAGAACAAGTGGAAGGAGCTTGCCCCGGTGCTT
+GCACAAACGAAGGTTCTATCGGAAGCGGACCTCACCATGCTGGAAGCCTTATGCGAGGCA
+TACGGACAGTACCGGGAAGCGCAGTATGCGGTCTACCACTACAAAGATGAGGAGTCCGGG
+AAAACCAAAAAGCGCAGTTTAGCCCAGTACATGAGTGGGAAAAACTCTCAAACCATGCCT
+GAGTACACGGCCATGCGGCAGGCGTTGTCCATGGTCAAAACCATATCCGCAGAGTTCGGG
+CTCTCGCCTGCAACCCGCTCCCGTGTGAATGCAATCGACACACCTGAAGAAAAGGACCCT
+ATGGAAGCTCTTTTAGAAGGGGCCGGATGATGTGGAAACGACTGGTACTTGTGGGGCTTT
+TGATGAGTAGCCTTTTTACCTACCGGCAGTATGCCCAGGATGTTGCAAGCGGGAAGATCG
+TTACCTGCAGGTGGGTGAAGCTTGCTGTAGCCAGGTGGGAAAATGACCTCTTACGGCAGA
+ACTCTCCGGAGTTCCCCTACTACTTTGACGAAGAATGCGCCAACAGGTATATCAGCTTTG
+CCCAGCAGCTTGAGCACACCCAAGGCTTCAGCGGGAAGATCGTGCTTGAACCCTGGCAGC
+AGTTTGCCTGGGCGAATATCTTCGGGTGGAAAAGTACGGCCACGGGCCTGCGGCGGTTTC
+GAAAGGCATACCGGGAGGTAGCACGGAAGAACGGGAAGACGGTCGAAGGGGCTGCAATGA
+TGAACGCCTGCTTCCACCTCGATAAAGAGATCGGGGCGGAAGAGTTCTTTCTGGCGGTGG
+ACCGGAACCAGGCGAAGAAAGGCTATGACGAGGCGGTACGCCAGAACCTTCGAAACCCTA
+CGCTATCGCGGCTTACCAAGGAGTATAGATCCTCAAAGCGCCTTGTGAAGGTCAATGATC
+CTGCGGCCTTCATGACTCCGGTCTCAAGAGATCACAAGAGTCAGGACTCATGGAACCCTC
+ACGCGATCTTAGTGGATGAGTACCATGCCCACGCGACCAATGAGCTGATCAACGTGTATG
+AGTCGGGCATGGGAGCCAGGCGCCAGCCCTTAACGATCATCATCACCACGGCCGGGACGA
+ACATCAACGGGCCTGCCTATCAGGAAGAGCGCACGCTCGTTACCAAGATCCTTGAAGGAA
+GTATCGAGCCGGTTCCGGAACACATCTGGGGGATCATCTACAGCCTGGATGAGGGGGACA
+GGTGGGAGAATCCTGCGGTGTGGATCAAAAGCAACCCGAACATGGGAGTGAGCTTTTACC
+GCGACTACCTTGAAAAGCGTATTGCAGAGGCCAAGGGCTCGCCCCGGAAAGCCAGCGATG
+TTTTGACCAAGAACTTCAATATCTGGCTGTCCTCTCCCACCCGGTGGATGGACCACTCGG
+TATGGATGCGGGGAAGTGCTCCTGTTGTCGAAGAGGAGCTTGTAGGCTCTGGTGCAAGGG
+GCGGGCTTGACCTATCGATGACAACCGACATCACGGCCCTGTGTTGGGCATTCGGTGAGA
+AGGACGGACGGTATCCGCTACTCTGGCGGTTTTTCATACCGGAAGAAGGATTACTTGATC
+GCTGTCACCGTGACCAGGTCGACTACCGCTCGTGGATCGATGAGGGGTGGATGATTGCAA
+CACCGGGGCAGACGGTCAACTACGAGATCGTGTTAGAGGTCTTGCGGCAGGATGCGAACA
+CCTTTGGCGGCCGGTCAATCGGCTATGACCCGTGGCATGCCGGAGAGTTTGAGCGGGAGC
+TTGAGGGAGAGATCGAGCTTGTCAAATATCCTCAACGGTATTCGGGGATGACGGTTCCTA
+CTCAGCTGTTTGAGCGGATGGTGATCGACGGGAAGATCGCCCACGGAGACAACCCGGTTG
+CCTCCTGGATGATGAGCAATGTGGAGCTGAAGGACGACCGGCAGGGGAACATCATGCCCA
+TGAAGCCGAAGCGGGATTCCTACGGCAAGAGGATCGACGGGATCGTGGCGGCCATCATGG
+CGCTTCACCAGGTGACCGGAGGCCAGGTGGAAAGTGCGTATGAAGCGCGGGGGCTTCGAA
+CCCTATGAAAGCGCATATCAAGTTTCGCAACAGAGTAAAGGCTTTTTTCTCACCGCTTTC
+CGGGTTGGATGAGTTTCTCGAGGCTCTAACTGCCGGAGGACGCTCATCATCGGGGATGAG
+TGTAAACGAGGCGACGGCAATGAGCGTGTCTGCCTTTTTCTCGGCGGTCCGGGTCATTAC
+CGAGAGTATTGCCTCCCTTCCGTTGGAGCTTTACGAACGGCTGCCGGAAGGGGGCAAGAG
+GAAGGATGAAGGGACGAAACTCTATCACCTCCTTCACACCCAGCCGAACAGCTGGCAAAC
+CTCCTTCGAGTTTCGGGAGATGCTCACCTATCACATCATCATGCGGGGAAACGGGTATGC
+CTACCTTTCGAGGGGACGGGACGGGCGTATCTACGAGCTGATTCCCATGCATCCGGATAA
+CGTTACAGTCCGGCAGGATGATACCTACCGGCTGCATTACACCTTCCAGTCAAAGCGCGG
+TTCTGTTGCCTTAGAGCAGGGAGAGGTGTTGCACCTGCGGGGCCTGTCTCTTAACGGCTA
+TACGGGCGTGAGCCTTTTGACCTGGGCCCGGGAAGTACTCGGCGGAGCCCTTGGCCAGCA
+GGAGCATGGAAACCGGCTATGGAAGAACGGGGCGAACCCGGGTGTGGTCCTGCGCCATCC
+GAAGACCTTATCTGATATCGCCTACGAGCGGCTGAAAACGGACTGGGAGGACAAGTATGC
+CGGGGCCCGTAATGCGGCCAAGACGGTGATTCTCGAGGAAGGTATGGAGATCGAGCGGCT
+TTCGATGACAAGCGAGGATGCCCAGTACATCGAAAGCAGGAAGTTCACGCGAAGTGAGAT
+CGCCGGGATCACACGGGTGCCGCCGCACATGATCGGAGACCTTGACCGGGCCACGTTCTC
+GAACATCGAGCACCAGGACCTTGCCTTTGTCAAACACACCCTGCGTCCCTGGCTGGTGCG
+GTGGGAACAGGCCTTATCCCGTGATGTGATCAGAGCACCTCGGCGTTTTGCCGAGTTCAA
+CGTGGACGGGCTTGCACGGGGAGATTTGAAAAGCCGGTATGAGTCCTATGCCATCGGCCG
+GAACTGGGGATGGCTGAGCGTGAACGACATCCGGGCAAGGGAGAACATGAACCCGATCGA
+GGACGGGGATGAGTATCTGCGGCCGCTTAACATGCAGCCGGTGGGAGACGAGGTGCCGAA
+GGCGCTACAGGAAAAACAGTCGGGAGAGAAGAGCGATGGAGCATAGAAGCTGGTATGAGA
+TGAAGGGAGAAGATGAAGGGCCTATCACCATCGACATCTTCGATGAGATCGGCGGATGGG
+GTGTGTATGCTGCGGACTTCAAGCGGGAGCTTGAGGCCCTGGCGGAAGGCAACAGTCGGG
+ATATCGTGGTGAACCTGAACTCTCCGGGAGGGGACGTGTTCGAGGGCATTGCCATCTATA
+ACACCATAAGCGCCTACCGGAGCCGGGTGAGCGTGAGGATCACCGGGGTGGCGGCGTCCA
+TAGCATCGGTGATCGCCTTATCGGGATCCCGGAGGATCATGGGGGAAGGGTCGTTTTTTA
+TGATCCACAACCCCTATGCCGTTGTCATGGGAGAGGCGGATGTACTTCGCTCCCGTGCCC
+AGACCCTGGATAAAATCGCCCTCCAGATGGTGGGCATTTACGAACGGCACAGCAGCCTTT
+CGAAAGACGAGATCGAAAAGGCAATGGATGAGGAGACGTGGTACGGACCTGATGAGGCGT
+ATGCCGCAGGCTTTGCCGACGCCATAGAGGATTACGGCGAGATTGCGGCCAAGGCCTTTA
+ACTGGAGGGCCTACCACTATCACAGCGTCCCACAGGCGTTGTGGGAGATGAGGAAACACA
+GACAGGCACCGAGGAGCAAGCGGGAACTTGAAGTACGGCTTGTTGCCCTTGGGTTTAGTA
+GAAATCAGGCGCAAGGGATTATCAGCCGGGGGTACGGGGCCCTGCAGGGGGATCCTGCAG
+ACGGCCATGAGCAGGGGGATCCTGCCGGGGAAGTGGCCAACGGGTTTTTGGAGCTTGCGC
+AGATGTTCCGGCAAGGAGGAAAAGCATAAATGGATCCGGAAATTAGAGCGGCAATTGAAG
+AGCAGAAAAAGGCCTGGAAAGCGTTCCAGGATGCGAACGACCAGCGGCTTTTGAAGATAG
+AAGCCGGGGATGTAAAGGGGCTTTCTGATATCAACGTGAAGATCGACAGGATCACTGCGG
+CGATGGAAGAGAATGCGAAGGTTATCGAGCGGGTCGGAGAGATCGAGAACAGCATCAACA
+AGCTGTCTCTGGGAACCGGCGGTGGCAAGGCCAAAGGGACCGGTGCCTTTAGCGCATACA
+TGAGAAGCGGAGATGAAAGCGGGTTTCGTGCGGATGCCACGGTACAGGTCGATCCCGACG
+GCGGGTGGCTGGTGCCTGAGAACATACGAAAGGAAATCGGACGGATTGCCCAGGGGATTA
+CCGCCATGCGGAACCTTGCCTCTGTGCAGGGAATTTCCGAAGGGGCAAGTTATACCGAGT
+TCGTCACCACCTCCGGAGCCGGGGCCGAATGGGTGGCGGAGACCGAGAAGCGGGAGGAGA
+CCGCCACGCCTTCCCTTGCCCGTATCGATACGGTAGTACATGAGATGTCGGCGAATCCCA
+AGGCGAGCCAGAGGCTCCTTGATGATGCCATGGTGGATATTGAGGCCTGGCTGTCTGGGG
+AAGTGGCCATCGCCTTTGCAGAGCTTGAGGCTGAGAGCTTTATCACCGGAAGCGGGGTCA
+AACAGCCCCGGGGGATCCTTTCCTACGATGCGGTGGAGGATAAGAACTATACGTGGGGAA
+AGCTCGGGTATCGTACAACTGGGGCGGCTGCCGGCTTTGCCTCTTCGAATCCTGAGGATG
+CCCTGGTCGACCTTGCTTATGCACTAAAGAGTAAGTACCGAAACGGGGCCACCTGGCTCA
+TGAGCCGGACAACCTTGGCTGCGGTACGAAAGTTCAAAACATCCATGGGCTACCTGTGGC
+AGCCCTCCTTTCAGGCTGGCGAGCCTTCCATGCTCTTAGGCTACCCGGTGGCTGAGGATG
+ATGCCATGCCTTCTCATACCACAAGCGGGGCCTTTCCCATCGCCTTCGGTGATTTCAAGG
+CAGGCTACCGAATCGTGGACCATATGGGCATTCGGGTACTTCGCGACCCCTACAGTGCAA
+AGCCTTTTATCAGTTTTTACACCACCAAGCAGGTAGGCGGCGGTGTGAAGAATTTCGAAG
+CGATCAAACTCTTGAAGGTCGCAGCCTAAGGAAGGAGGAAGGAGAATGCGGGATATACAC
+CATACCATCGCCATGGAGACTGCCATCGTGCCGGCGCTCTTGAGCGCGGATGGCACCCCT
+GTAGAGGTAGATCTGCAGGGGTATGACGCGGCCGAGGTGGTACTTTCCATCGGGCCCGGT
+GGCATTAGCTTCACCGAGGATAACAAGATCGAGTTTATCCTTTCCCACAGTCTTGACGGG
+GTGACCTACACCCCTGTTACCGCCGGGGATCTGGACGGACTGGAAGGGGACATAGAAGGC
+GGAGTGATCCTCTCGCTTACTGAGGAGAAACCGGAAGCAAGTATGCTGTGTCTCGGGTAT
+GTCGGAGCCCTTCGGTATCTGAAGCTCTCGGCTGTCTTTAGCGGCACCCACGCGGAAGGT
+ACTGCGGTGAGTGCCGTGGTGATAAAGGGCAGGCCGAACCTGGCATAGAAGGATGAAACT
+TTCTTTCCGGCGGGGGCCTTTAGGGGCCTTTTGCCGGGAGAAATAAAAGAAGGACGTAAG
+GTAAAGATGAGTGGAGAGCTAACCAGCTGGCAGGCGGTAAAGGCGCGTCTTGATCTTGAG
+GATAACCAAGAGGATAAGGCAACCGGTCTTATTGCCGTGGCGTCCCGTCGGGCTGAGAGG
+TACACCGGACGGCTTCTTGCAGGTCGGGACGGGACACTGGTGATGGACGGAAGGGCCTCA
+GATCATCTTGTCCTGCCTCAGTACCCGATTAACCGTATCGAGAGCGTGAAGGTCGACCCG
+TACCGTGTATTCGACGGTGAACCTGTCACCGACTATTTCGCAGACCTTGGGGCGGGGATC
+CTGATACGCACCGCCCCTCATCTATGGCCTTTGGGGGTGAAGAACATCCAGGTTACGGGC
+AACTTCGGCTATGGAGCGATCCCTGAGGACCTTGAAGAGTCGGTGATACAGCTGGTCGGC
+TACTGGCTTGGTTCCCAGGGTATCAGCTGGCTGGGTAAAGGGGATGCGGCAAGCGGAGAG
+TATCAAACCATGTATGTGGGGGTGATGGACCTGCCATTTCAGGTTCGTAATGTGTGGGAC
+TCCTACCGGGAGGTGTCAGTGTGAGCTGGGCGAAGAGGAGCAGCAGTGGCCAGAGAAGTA
+CGGTCAGACGCCGGAAGACCGTGCGCTCGTATGCAGGGCTTACCATCTCGGCGGCAGGGA
+ACACGATCGGGCCGCTGACCGAGAAGGCCTATGAGTATGCCCTCGAGTTTTTAGATAAAC
+GGGTGACGGACAGGACCGGGAACCTTCGAGCCGGCATGAGCTATGACGTTAAGGGTCATA
+CCGGAGCGGTGAAGAACGATGCTCCCCATGCCTTCATTGTTGAGTACGGCACAGAGGAAA
+GGGCGACAAAGACCGGTGAGAACCGTGGCCGTATGAAACCACATTCCTTCATGCGGGCCG
+GGAAGAACAAGGCCCTGAGGGAGATACGGAAGATATGGAAAGAAGGATTGAGGAAGGCGC
+TTGATGAGCAGAGCACCGGAAGTTGAGATCACAGAGCAGCTTCGAGCCGACACGGCCCTC
+ATGGAGCGGATCAAAGCAATCTATGACACCGAGAGCCGGGTTTTGCTAAAGATACCGTAC
+CTGGTGGTGAGCCTTGTAAGCGACACGAATGAGAAGGTGTATCTCTCATACTACGGGGGA
+TCAGCTGCCATACAGATCGATATCTATGCAAAGGATGAGAGAAGCTCTGACCTCAGGGCC
+CTTGTCAAAGATGCGGTTCGAAGGATTCGCGGGGTATCGGGGGCCTTGAAGTTCTCCTCG
+GTGGTTGTCACAGGAGATGCGTTTCTCGGTATTGCCCCCAATGGGCTCTACCGCTGGATG
+GTGGAGATCAGAGCGGATTACACGGAAGAAGGAGAGAGATGAGAGATGATGAAGAAAGAG
+CGACTGATTGGAAGTGACGGAAAGCTTGTCACCGTCAATCTTGCATCCGAGGTTACAGGG
+GACGGGATAAAGAGCCTTGATGAACTTGCAGGAGGCCTTGCGGATAACGGGAAAGGTTCC
+GGCTGGTGGAGTATCACGGCAAAGGGAGAAGAGAGCGGTTTTTCCTCGGCCCTTGATGTC
+GGGGAGCTGTTCTGGGATGACGGCACGCTTATCCCGAAAAGTGGGGACAAGTGTGCATTT
+TTAGAGGAAAGCGAGAAGGCCGACATCAACAGCTTTTCGATCGAGGTGAGTAGAAGCGAG
+ATCGATGTGACGACCTTGAGTGACAAGGTCAAACGCTACCGGTCGGGGAAAACGGATATG
+ACCGGCAGCCTTGAGGGGATCACCAACCTTGATATCACCGATGCGGCCGGCTACATCATC
+AACAACTTCATCAAGGTTATCAGGCAGTCGGTAAGCGGGACCATCATCAAAAACGATGTG
+GACGGCTCGCCGATCTACATCAAGGGCGTGATTCAGAAGTCAACGGATAAGGGAGAAAAG
+GAAGCCTTTATCTGGGCAAAGGTCATCATCCTTTCTTCCAGCCTCGGAGCATCGGGGGAA
+GATGCACAGAACTTTTCAAGTAGCTTCAGAATCGCTCCCGGAGATCCTGATCCCACCCTG
+TACATAAGAGAGGTGGGGTAAGGATGGCGGAACCTATCACCATAGCCCGGGACGGGGTGT
+ATGTCCCCTCCTGGGGCAATAAGGGACGGAAGAAGGATGAGAGAATAACGGTGCATTACC
+GGTTTCTCACCTTTGAAGAGGAAGAGAAGATCTACGGCCGGGCCAGGCGGGAAGCCGGGG
+AAGTACCGGAGAAGCAGGATAGCAGGGCCTATGATGCGTGGTATGTGGAGTACCTGTCAC
+AGGCTTGGCTGTTGCGGGTGAAGAAGATGATCACGGAGATCGAAAACCTGTCGGTGAGTA
+TCGACGGCCAGGTGATCGAGGTTAAGGATGGTGAAACGCTCTTCTCAGGTCTCCCCTTAG
+TCGAGCTTGCAAACGAGATTTTGCATGAGCTCAAGGGCCTGACTTCTGTTGATAAAAAAA
+AATAGCCCTTGGAATCGGGCTGTGGATGAGGGGACAGAGCACGCAGAAGGTACGCCGGGA
+GATTGGGGACGGAAAGCTCGGCGTGGTGGTGGACGGGAAGCTGGTAACGATCCTGCGAAG
+TGAAGTGAACGAGTACCTTGATGACTGGTTCTGGAGTGCATTCAGCCTGTGGTACCGCTA
+TAAGCTTTTCGGCGCTCTTCCCTTCTCAGGGGGATGGGCGGAATTACCGGCTTTCATCAT
+CGAGATCATAGAAACGGCAGAGGCCGCCTATAGGAACGGGTATGGGAACAGCACTCATTG
+ATGAGTTAAAGATACTCCTTCGCGCAGAGACACGGACCGCGGTAAAGGCCATGCGCGATG
+CACAGAAACAAACCGACTCACTTGAAGGCCAGCTCAAGAGCCTTGCAACAGGGGCTGTGA
+AAAGTTTCGGAACCTATGCGGCCGCTGCACTGTCGATCAAGAAAGTCATCGATATCTCGA
+GGGAATCGGGCCAGGCGGCAAGTGACGCTCAGGAGACCATGAGTAAGTATGCGGTGGTCT
+TCGATGATGTGAGACAGGCAAGCATGGCAACGGCCAGCCAGCTTGCAGAGGACTTTGACC
+TTGCCTCCTCCACGGCTCAAAAGCTCCTCGGTAATACCGGGGACTTACTCACCGGCTTCG
+GTTTGAGTTCAGATGCTGCCTTAAAGCTCTCCGATACAACAAACCGGCTTGCCATCGACC
+TTGCAAGCTTTTCGAATGCTCAAGGGGGGGCTGCGGCGGTCAGTCATGCCCTGGTATCGG
+CGTTCTCCGGAGAGCGGGAGGCCTTAAAGAGCTACGGGATTGTGATCAACGAGGCCATGG
+TCAAAGAAAAGATGGCAGAGAACACGGCCAAGGGCTTAACCTTTGCCACCGAACAGCAGG
+CGAAGATCCAGGCCACCTTAGACCTTGCAACCGAGCAGTCGAAGAATGCCATCGGGGACT
+ATGCGAGGACCTCAGACAGTGCGGCCAATGTGACGAGGGCCTTGGGGGAAGAGACCAAGC
+GGCTGAAAGAGAACTACGGAACTCTGGTCAATGAGGGGCTGACCCCGGCAAAGGCGTTCT
+TTCGTGACCTGCTTGATTCGATCAACGACAATATCGAGAAGAACCGAGAACTGTCGGCCG
+CCCTTGATGCGATCTACGGCAGAAGCGCGATAGGTGATTCCGTCGAAAGCCTGCAGCAGC
+TTGAGGCGGGCCTCCAGGACCTGAAAGAAAAAGAAGCTGCCCTGCAGGAGCTTGTCAAAA
+GCGGCAGGGGTGATGTGGCGGCCCAGGCGAAAGAGGCTCTATCCGGTATCCAGGGGCAGA
+TTGAAAGGACCGAGCAGCTGATCCTTGCCTCCTCACGGTTTTTGTCGGCTCAGGAAGCAA
+TCAGGCTCGAAGAAAAGCGATCCCTTGAGGCGGCGGCAAAGCTTGCAGCCGTTCGGGAGA
+AAGCTGCCAAAGACAACGAAACGGCGTTGAGTGAGCTTGCAAAGCGAGAGCTTGAAGCCA
+TGGAGCCGAACGAGAAGCAATTGAGGCTCCTGCAGGATGAGATCGACAAGTGGGCTGCCG
+TTCGTGACGCCGGGGTGGCCGCCGGTCAGGATATGGCTGAGGTCCAAAGGCTCCTCAATG
+ATCTTATCGATGAGCGAAACCGAAAGCTTTCGGAAGGCAAGACCAACTGGTCACAGCCGC
+TTGAAGGGCTCTCTGAGTGGGAACAAGAGTATAAGGACATTTTGAATGAAGCCTCCCTTG
+ACCGGCAGCAGATGGAACGGGACGAGGAAGCCCGTCTTGCTGAGATACGGGAGAGCTTTG
+GAAAGAGCCAGCTGCAGGCCCGCCTTGATGAGATACGCCTGCAGGTGGATGCGGCCAAAC
+AGGCCGGTGTGGATGAGGTGGATGTTGAGAAGTGGAAAACCGAGCAGATCATCCAGCTGT
+ATGCCACAAGGGCCCAAGAGGCTATGGCCATCTACAACCAGCTAAGCGGCATGCTCTCTG
+ATATCTACAGCCTCCAGGGGAATCTCTCGGATGCTGCGGCCGAGAAGGAAATTGCAAACC
+TCGACAACCAGATCGAGTTCAAGAAGGCGGCCGGGGAAACATACGAAGACCTTGAAGCCG
+AGAAGACGGAGAAAGAGGACAAGCTTGCGCGGAAGCAGTTCGAACGGGACAAGAAGAACA
+GGAAGAGTGAAACCATAGCATCGGGAGCACAGGCGGTTATCAATGCCTATGCATCCATGA
+ACCCGATTGCAGCCTCGGCTATGGCCGCCGTCATTGCAGGACTGACCGCCCGCAAGGTGG
+CGCTGATCAATCAGCAGCAATACACGGGCCTTGCAGACGGCGGTATTGTGCCGGCACAAG
+GAGATGCCGGAGGGCTGTACCGGCTGGGGGACAAGAACAAAGCTGAGACGGTCATCCCCT
+TTGACATCCGGAACCTCAAAAGCGGCGGGACGACGGTACAGGTGCATGTGGATAATGTGT
+ACGGTCCCGGAGGATCGGAGGCCTTTGCAAAGTACATCGTCCAGACGGTAAAGCGCGGCC
+AGTCATCCGGCCGTGTCGAGAAGTGGGGAGCCTGACGATGAGCTGGCAAATTCTCATTGA
+TTACGGGGACGGCTGGGTCGATATCACCGGCTACGGGGGAGATAACCTTGTCAGGGACTC
+CCTGAAACTCACCGAGAAGCTTCATGACGATGATTTTAAGCCTGCTTTAGGTTCAGCCAC
+GTTTTCTTGTACCCTCACCCCGGCCCTTAGTACCCGGCTTTTGCAGTGTACCGGTACCAT
+CCCGTGTGAGATCTATCATGACGGGGTGATCTGGTTTCGCGGCTTCTCCCGGCCGGTGAC
+CAAGTACAAGGTCACCGATAACGACCGAACCATCGACTTCGAGATCTATGACTATGGGTA
+TCTGCTTGAATCCACCCTGCAGGACGACGTAATGATAACGGACGGGAAGATCTGTGACCC
+GGAAGACCCCGATCATTCGATCGTCCACCTCCTATTGTCCTCTGCAGGCTACCCTCAGCA
+GTACATCGGTATAAGCGAAACCATAGACGAGGTTATCCCGAAGCTCACCTTTGCTTCCGG
+CGACAGCTATGCGGACGATCTTGCGGCGATCCTCTGGGATTACCATCACCTCTACAATGT
+ATCACCTAACGGGGTGATCGACATCTACGACTGGGCCGCCTCTTCCGTCGAAGCGGACGG
+GGCCTTCAGTGAACAGAATATCATAGGATCTCTGGAGGTTGAAAGAAAGGATTCTGAGGC
+CGACCAGGTACAGGTAACCTTCAATCAGTATGAGAAGCTTACCGGCCTTACCCTCTACTA
+TGAGAAGGTCAGTCGATACGAATCGATAGAATCGGATAGTGGTCAGGATGCAGAAGGGCC
+TGGCCTCTGGCCGGCAGAGGGTCCCTACCGTTGTGACTACAACCTTGCCGTCGACAGTTC
+GAATTATGAAGTAGCGGCTGCAGAGAACCAAAGCGTCGAGGTTCATGGATACGTCCCCTT
+TAGCACGGGGTGGAGAATAACGTTTTTCGACTCGCTGTATATAGCCGGGGACCACTATCT
+TGATGTGGCACTACAGGAGCATGCAACCACCTATTCCGACCTGCAGTACAATCTCTCTGG
+CGGCCAGGTTATCAATGAGATCAAGATAACCGGCGACCTTCATATCATCTATAAGGACCA
+AAAGAAAACCTCCGTCTTTTCAGGGCCGAACAGCACGGGCATACTGAAAAAGTATTCTGC
+CACCTACCTGTATGACGATGAGGCTGCCTCTTTCCTTGCAAACGCTCTGTTCTCGTCGAT
+TACGAACGGAAGACTTCATTACACGTTTAAAAGTCTTACCGAAAAGAGCCTTGGAAGCTA
+CGTTACGGTGAGTTCCCTTTCCCTCGGAATCTCGACCCTCATCCGTATCACCGCCCGAAG
+CTGGGATGTTGAGACGGAGATCTGGGAATACGAGGGTGTGAGCGTGGCCCCGCTTGAAAC
+CATCCTCGGGACGATTATTGCAGGGCAGATCGTGGTACCGACAAATCCGGATGAGGCGAA
+GAGTGTGGCCGAGCGGGTGGATGTGGGCCTTGAGTCGGACGGAAGCATCATACAGCCGGT
+CAACGGCAACCAGCTGGTGGATATCGACACCACGGTGGCAGGGCTCTATATGACGGCAAG
+CGCTCTGGGCTTCTTTGATGGAGAGGAGTGGACAGCAGTCATTAATAATGATGGTACCTG
+GTCCTTTCTCGGGGACGGGAATAACTACATCAAGTGGGACGGCTCACGTCTTGAGGTCCA
+CGGGGACCTCTTTCTCTCCGGTGACTCAGAGCTTCGGGGGAAGATTACCGCAGGCAACGG
+TATTGAAAGTGACGACTACGAGCAGGGTGTTTCCGGCTGGAAGATTGGAGGGGACGGGGA
+TGCCTTTTTTAACAACGTGTGGCTTCGTGGGGACCTGTACGGCATACTCCATGACCTGAC
+TATCGATGGAAACCTGATTCTCTCAGACGGGGCGATTAAGGCGGGGGATACCATCCTCGA
+TGCCTCGGGGATCAGAGCCAATGCGGGACGGGTCGGCAACTGGCTGCTCTCAGCTACCGC
+TATACGCTCGGATGAGGTGGGAAAAGCGAGGATAGAGCTTGATCCCGGGGACAACCGTAT
+CGAGGTGTGGGGTTCAAACACAGCCGAGCCTCGGGTTGCCATGGGATACCTTGGGGGCTT
+ATCCGATCCTTCGAACAGAGCAAAAAGCCTTGCCTCTACCATCTTCGGTTTCTGGACCGC
+CGACGGGGATTCGATTGAGATCAGGGGCGAGATGCGCCTTGTTAACGGTCAGTATGTGCT
+CCAGGATGATGCGGCTTTAGAGATCCAGGACAGTAGCACCGGTAAGGCTATCCTTCGGGT
+GGGATCAAACGCGGGGACTCAAGGGGTGCATTTCTTCGATGAGGCGGAAGCGCCTCTTCT
+GTCTCTGGTGGCCGATGGTATCAAGGCCGAAGCTTCAGACAGAACCCTTCATACTATCGT
+ATTCAGCAAAGCCAGCTCTTCGTTTACCTCATATCCTTCCGGTATGCCGAATAAACGTGG
+GGTGTCATTGGAATCAGATGGGCTGATCATTATTGCAAAAGCAAAAGAGAATGTAGTCCT
+TGGATACATAGATGTTAATAAAAAAGTTTTTGACTGGATCGGGGACATCAATTTCGACAT
+AGCAGGCAGCGGCGGAGTAAACCGGTATATCAAGGCCGACGGTCATATTGCGTTGACATT
+CCGTGTTGGCGACACCGAATCAGGGCTTGCGCTTGGGGAAGGGTTGAATCATATATCAGT
+CATACCTGCCATGATATGTAATTCAAATGTTATTGTTCGTCAATCAATGGATGTTTATCA
+GACGCTGACAGTTGGGAAGGATAAAGCAATCTTTCAGATCGACCCTGAGCATAATATTTT
+CACGTACAAGGGGGTATCGGTATTCGAGGCTTCTCACCCCATAGGCTCTCAGTACACACA
+ATACGCCTCAAGCGCAAGTAACGACTTATCGGTTGCCTTCCCGAATAGCGAGTCCCCCGC
+TTACCTGTTTGGAGGGACCTGGGAGAAACTGTGGGACGGCGAAGGCATAGACTTTCATAC
+CGAAGGTTACAACGGTTCAGGACGAACAAATGGGCTGATGCCCGATAATCTGCAATACCA
+CTGGCACGCTGCTTATCAAGTGTTCGCTACCGTCGATGGGGGAAAATACAATGTCGGTCA
+AGCGATCAGCCCCACTTCAGGAACACAGAGAAATGTGGGTGGCCCCATATCGGACGGCAC
+CCACGGAGCCCCACGGCTGGGCGAGCGGACCTCCGACCGCAACCGGCTCATGAGGATATG
+GAGGAGAATTGCATGAAAACCTATGCCGTAATAGATGGATCAATGATTACCACTGTGGTG
+CAAAGCGCCGATGAGGCGGCCAAGCTTGCAGAGCTGTTTCCGGAAAAAACCATCAAGGAG
+GTTCCTGCAGGGTTTACCGGAAACAAAGGCGATGATATCCGCTTCTTCGATGAGGATGGA
+AAGCGGCTTTCGATAGCAGCCGCAACAGAAGCCGGGCTTGTGCCTGAGGTCGGAGAACAT
+GAGGCCGCTATTTGGGAAGGCGGTAGGTATGTGCTTACCCCTGACTATACCGGTGTTCCC
+TACTGGAAAAAGGCCACAGGAGCGGCGGTACACCTGTCCCTCGGCCGAAAGCCCGATGAG
+AGTATGACCGATATAGAGCCTTCGGACCCGCAGGCCGTGTGGAACGAAACGGGCTGGACA
+GTTCCCGAGGAGGTGCTCTCCGAACGGGTTCGCTTAGAACGAGACAGGCTGCTTTCAGAA
+AGCGACTACATCATGATGGCCGACTATCCCCTTACCGACAAATCGGACTGGAAAGCCTAC
+CGGCAGGCTCTCAGGGACATTCCATTGCAGCCAGGCTTCCCTCAGGAGATTTCCTGGCCA
+CAGGCACCGGAAAAAAGGAGTTAAGCCAATGGGCGATAACGACAAAATCGATATGGTCTT
+AAGCATTGTGACGGAACAAGGCCGGGACATCAAAGAGATCAACAGTAAGCTCACCGACTT
+TTTCATCAACCGGGAAAGTACGTGCCCTGTTGAGAAACGCCATGAGAAGAAGATTGAGTA
+CCGAACAGTCATTGTCGGAATGGTGTGCGGTCTTGGTGGTTCGATTATCGGGGGATTACT
+CCCCGTTGTTTTGGGAGGGTGATATGTATTATCAAAACAGTATTGAGATGCCGGAGCGGG
+TACAGAAATGGGGATGCTACGCTACCGTAATTTCTGCGGCAGTAGCAGGAAGGACAAAAC
+GTTCTATCTCACAAGAGGATTTTGTTAATTGTGTGATTGAGTCGGAACGCCGTCGATACC
+TGACTGAGGACCCGGAGGCGCCTGGAACCTTTATGTATGTGGCAGACCCGACAGGGATCT
+TCCGCCTCTTCGGCCTGAATGTACGCTACCTCGGGAAAAAAGACGCGGACTATATATGCC
+AGCCGAACGAGATAGAAATACTCTTGTGGCGACGGTGGAATGAAAAAACGCGCAAGTACA
+TCTACCATTTCACCCTGGGTAACGGCCGTGGCATGACCGTCTATGATCCATGGGCTCCAT
+TCAGCAAGACTGCAAGCGAGGGGGAACTTCGGTCGAAGCGCATCTTTCTCGATCTTGGAG
+AAGTAGCGGCATGAAAAAGCTCATCGTAAAGCTGTGGAAGGCTCTGGGAGAGAAAGGAAA
+GGTGGCGACAATCATCGGTTTCCTTTTTGCCTTCCCGGTGAACATCAAGTTTGTCATCGA
+CTACTTCTCCGGGATCTTTTACTCAAGGGGACAGATGGAAATGGCCCTTGTTACCAATGT
+GCTGGCCATGGTGTGGCTGATCCTGCCGTCGGTTATTTCCATTCATAGCCCGAAGATCAG
+TATCGAGGTAAAGGATTGAGATGCGCAAAATTATTAGCATTATCCTTACTCTTTTTGTGT
+GTTTTTCCGCCGGCTTCCTCCTGGGCACTTACCGCTCAGGAGGCGGCGATAGTGGACGAG
+CTGCAGAGTACGATAGTCGAGGCAAAAAGCGAGATACAGAGTATCAAGCACTCAGCGATG
+AGTATGAGCGAGCAGTTGAGGCTTACGAGGGAGAGCTCGCAGAGCTTCGAAAAGAGGTGG
+CAGGCTACCAGCGAGAAGCTGGAGGACTTACAGAGCGAATCGGAGGAGCGCAAAACGAAA
+GTGTCGGCATTGCAGAGCGAGCGGGACGGGCTGAGGACGGACTATCAAGAGCTCTTGATC
+TATTGCGAAGGCTTAGAGAGGCGGAACCGGCGGCAGGGAATGGCCCTTAAAGCCGGGGGC
+TCTGCCCTGGCTCTCTCTATCATCGTCAATGTGCTGCAGACTGTGTTTTGATTGGTGTGT
+TTGGTGGAGTATAGGAGTTGAACCCTTCGCATGGCAGAATTATAATACTCCCAAGTCATT
+TCGTTGGTTATCTGCATGAATTTCATGTTGATAAAGGAAGTTATATGTAATGCTCTTTTT
+CTCAGATTTCCTTTAAAAAAAGGCATCATGATGTAAATAGTTACATAACGTATTGACTTC
+TTTATCGTGATGCATTATGTTACATCATGAAAGCGGTTTTAAAAAAACCTAAAGGAGTCA
+AATATGGAAACAGTAACAGTAACTTTCAGCATAGAAAAACCAGATTTAGCCGATTATAAT
+CAGCTATACCCGAAAATGCCTTGTAATACCGAAAAGAAGCAAAATCTTTTTGAAGTCATT
+ACAGATGCAAGGAACATTTGTGGTGCATTGCAATTCACAGAATCTACAGGTTCATCACCT
+GTTGCTTTTTATGAAAAACAAATTCAGTCAATGATTGATTCGGGAACTCTTTCTGAACTA
+GATTGGAATGAGAAACAGTTTGTAGGAACATCAACGAGTGTCGTTATGCAAAGCAATGGT
+TGGAATAAAACTGGCCGAAAACAAAGATTCTCAAAAGGGATCTTTAAAAGTGCAGAACTT
+TATTCGCGATAGGGCATTTACCAAGGGTATTTCTTAATTCTCTGGTTGTTTTTCTATACC
+GCGCGAAAAAGAACACTACATATAACAGCGAATATGCGGTTCCGCTTCGCTGCACCCAAA
+TGCGGCGTTGCCGCACTTCGCATATTTCTGAAACGTTAGATGTAATAAATGTTGGACATT
+ATTGAGGAACAAATGGGGCAAGCACTTACAGAAAAAGAAAATGAACTTTATAAAAGGATT
+GATGAAGTTACTCATTATATTTGGGATCCTATTGGCGTGAATGGCTGTCCTGGTGCAAGA
+GATGAGTATTATTCATATTTACCCAAGATTTTCGAGCTTGCCCAAAAAGAGAATTCAGAA
+TCTGAAATTGCAGAATATCTAAATTATGTACAATCTGAGAGAATGGGTCTTAAATCTGAC
+ATAAAAAGATGCAAGGAGATTGCTTCCATAATTATTGACTGGAGCGAAAATCTTGGAATA
+TTGGGGTCTTAACCAACCCCGACATTTACTACATCTAACAGCGAATATACGCTGCGGCTT
+CGCCTTGGCCTTCGCCATATTATGCTGCCAAAAACATCATATAAAACCAGAACGTTAAGC
+ATAGTATGTATTTATTCTCTATTCAAAAAGAACGTTATGGTATTGTTGCTTTCGATAAAT
+CTGATCCATTCGACTATATTATAACCTTACAAGTAAGGAAGAATCCTGATAGATTGAGGT
+CAATCACCATGAGAGGGGGAGCCCGTTTTGCCTAATAAAATAAACAGTTTCCTGGACGTC
+CTAAAGGCTGGTGCCTTAGTTTTGTTCTCCGGGATTATATATGCAGTTGCTATCAAGTAC
+TTCATCATGCCATCAAAAGTCATAATGACCGGATCAGAAGGAATTGCTTTAGCGACATCT
+TATTTTTATAGCTCAGAGCGACTATTTGTTCTCTTATACGCAATTTTCCAAACAGCGCTC
+ATCATTTTTTCTTTTGTAAAAATCGGATGGATATTCAGCACCAAGACTATACTGACAATA
+CTGACGATCATTGTGCTTCTCCTTATCTTACCGGATATCAAAGTGGCATCGCCAGAGCCA
+GAGAATGAGCGTCTCCTCCTTGTGCTCTTTGGTGCTATCATTGCTGGGATTGGGAAAGTC
+GTCTCGTTTCTTAATCGTGGCTCTACTGGAGATGAAGATATCGTCAGTGTTTACTTTTCA
+GAAAAACTGAGAAAACCAGTTGGTAAAATCAGTATTTTCGCCGGCGTTATTTCTACCGTT
+TATGGTTTGATTCTTAATTTTGTCAATTCCCACGATATTTCTATTGTGGCCAATACGCTG
+ATCTATACAGTTATCTACATTTTTGTTGGTGCATTTACGGTCAACACCATATACAAAAGG
+TACAGATACTCCAATATCATGATTAATTCGGAAAATCCTGAAGAGGTTATCAAAATTATC
+AAGTCCATATTGCCAGAGCGAACTTATACAAGGATCAGTGGGACTGGTGGGTATTCCAGC
+AAGGAGAGAACCTTGATATCGATTATTGTAACCCAGGAAGAACTTCCCCAGATAATCCGT
+TCCATAGAGCAGATGGAGGGGAACTACTTTCTTTATCACTCAGAAATAGATGGAATCAAA
+GGTCGTTTTACATATTCCAAAATACGATGAAAATTGGATTCTTGCTTCAGTAAGAGAATC
+GTAATATACCCATAATCATTTGACACGGGTACTAAGCTTAACAGCTGTTGATACGCTCCG
+GCGATACAAAATATACTCGCTTGACAAATGGCGATGCTTTGCCGGGGAGCTATGCCCCGG
+CTTTGCTTGTCAAAAAGTTTTTCTGAGCTTCCGCGATTTGCCGTAAATCCTCCGGCAAAT
+AATCGGTATAATGGTCGGTCATTTCCTGCGAGTCGTGTCCGGTGAATTTCCGTATCACAT
+CGTCAGATACTCCGTTATGACGTAGCAGGGTATTGAAAAATCGCCGAGCTGAATGGAAAG
+TTATATTCCTTCCTTCTCGCTCTATTCCCATCTCGTCCATTCTCTTGTACATCCACTCTC
+GCAGCCGGTTCGCCGTGAGCGGTGTTTCTTGCCGCGGGTGATGCGAGAATACGAAGCGCT
+CAGGGCCTGTCATATAGCAATTAAGCTCTTCTCTCAGCTCTGGCATAATTGGGATTTCCC
+TTATACCTTTATCTTTCACCGGAGTTCGCTTTTTAAGCTTGCTGTGGTACTGCTTTGAGA
+TTTGGAGATAAGAGAGTGTGACTGTTTTATCTCCCCGGACAATCTCAGAGTCAATCACAT
+CATCGGTGAAAAGTCCGCATACTTCGCCGATTCGCAAGCCAGCCATAAAAGCAACTTTCA
+TCGCTGTATAGTAGATTCGATCTTTGTCGCTTGATATTCCCGAGTCTTCGAGAAGCTTTT
+CCACTTCATCTATACTCAAGGCTCCGTATCTATTCTTGTCGACCGATAAAGGCCTGACCA
+TGCGCCAGGGATTGAAATATGCCGCTGTCGTGTCCCGCATCTTCTGGATCCGTTCGTACT
+CTCCAAGGATGGTTGAGTAGACGCTTTTCCAGTTGTTCGCTGTTTTATGACTCACCTGGT
+TAGCCCACTTGAACAGAAGGTCCTCGCAGTCCAGCGGGGTGATTTTCTCAATCGGTTTGT
+CTCCGTGGTATGGAAGGATATGGTCTCTGGTTATCTGGGTAGCTCCGTTGCAGTAGTTCT
+CTGTTATCCCTGGTTTTTCTTTCGAAGAGCGGGCGAGAATTGCCCGGACGTAGCTACTAC
+GCCTATAATCCCAGAAGTACCGACTCTCTACCCATTGGGCAAGAGTTACGACCTTTTCCT
+TTGAAAGGCGGTTTTTCTCAAGTAGCTCCTGACAGTAAGCAACTGCTTCTTTGCGGCTTT
+TGACTTCATCTTTCTTTCGTGTGTAGCCAATCCCGGTGCTTTTCGCCGGTAGACGCTTGC
+CGTCAGTTCCGTATGCTTGATAATACCAGACTGTCTTGTTCTTGAGTGTTCGTGGAAACA
+GGATGTATTCGTTGTCTCTAAATCTTGCCAT
+>NC_014364.1|provirus_2329685_2350621
+ATGGCAACTGATTTCTACCATCTTTTCAAGCGAAAATATCAAAACAAAGCAGGCAGAGAG
+TACTTCTACTGGTGGTATTGGTGGTACGACCCCGATACCGGCCGACAGCTCCAGAAGCCC
+GCAGGACGGGCCGAATCCGTCAGGAAACATGCTCAGGAATATATCAACAATCTCCCTATC
+CCAAGCGGTAAAGCGGATACCGTTCGCGCCGTTGCAGAGGGTATGTTTGAGGCGGGCTCC
+CCTTACCTACTCCGACGTGAAGCCAAGGGTTCGGGGATGAAAGAAGGTACCCTCAGAGCT
+TACTCAGGCTTCGTCAGGAACCACATTGTCAAAGACTGGGGAAATACACCACTTAACCAG
+ATAGAAGGCGCTGACATCGAAGATTGGCTCATGGAGAAGCCTTTTTCAAACTCCACACGG
+AACAGCATCATCGATTGTTGGAACCTCATCTTCCGGGAGGCAAAGAGGTCTAATCAGGTC
+CGCCGGATTCCCACAATAGAGCGCTTTGCCCGGAATTCAAGGCGGTATGACACCTTCCGG
+GATGATGAGCTGTTCGCCCTATTCCCTGAGAAGCGCGAAGACCTTATAGCTCTGTACAGT
+GATCCTGAGAACGACTATTACGAAGAGATTGAGTACTACGGGCTCATGTTTGCCGTGATG
+CTGCTTACGACGGTTTCCGGGGGCCTGCGATCCGGGGAGATACGGGCGCTCTGTAGGGAC
+CAGGTATTCATCAATCAGTCGGGTATCGTGGTTAGTAAGGCTCTGGACAGCAACAACAAG
+GTAACGCTTCCGAAGAAAGGGAAAGATGATAATCCGAAATGGCGGGCTGTACTGTTGCCG
+GAAAGAGCGATCCAGGCCCTCTCATGGTGGCTTGAAGTGGCCCCACCCTCCGGGATGCTG
+TTCAAGTACGCTGATAAGCCGGTTGACCGCAATCTGCTGCTTGATAGGCTCAAGCTGGGC
+ATGGAGCGTGTAGGGCTCAAGCTGGGCATGGAGCGTGTAGGGCTCAAGCTGGGCATGGAG
+CGTGTAGGGCTCAAGCTGGGCATGGAGCGTGTAGGGATCAAGCCGGAGGGGCGGAAGCTG
+AAGGTCCATTCTCTCAGGTACACGTACAACACGAGAATGGAGACTTTACTATCAGAGGAG
+CGGTTATTGCAGTTCATGGGGCATGAATCGAGGCAGATGACGCTCCACTACTCCCGGCCG
+TATTGGCAGGAGAGGCTTGTTGCGTATGGAGGTGACAAGGAGAAAGTCGAGCAGTTCTGG
+AAGTGAGAGATTTTAACGATAGAATCGCTTTAAGCAATTTACTTTAGTCTTTTGAAAGCC
+GAATCGCTCATTTGCTTTTCCATCTTTCTATTACAATTGGGACATAGATACTGTTTTTTC
+CCATCTATCTTCCATACATAATACTTTCTTTTAAATGGAGTTGAACAAATAGCACAACGC
+CTCGGCTTTCGGAAGACAATAGCCAAAATAATTACAATGACAATTATTACATATTCCATA
+TAATAATGTTAATCCGGTTTTTAAGTTCTGTAAATAATTTAGTGTATAAAAATAATTGGT
+AAGTGTTAAGCAACTCTAATCTATTGAGAAGATATTTACCAAATTTTTATATTTTTAAAT
+ATTGCTACTCCTACAGGAGGTGTAATTGAGATATTTGGAGTACAGTATTTATAGACCGTA
+ATAAAAGACGACGACTACTGCACTCAATTAGTTAGTATAAAATATTTCTAAATCGCAAGC
+CTTTCTTTTTTTAATTCTTTAATATAAATCTTAGGTCCAATTCCGAAAATCTCCAACTCT
+AAGTAATCATCAAGTATTTTCTTAATCTTAGCAGAAGTAATAAACTTACTATTTTCATCA
+ATATTAATATTCTTAAAATCATTATTCTTTAAGGCTACCATAACGTAATCACCAATCTCT
+AAATCATTCTTTATATCTCCCTTAGTTACTTCTTTTACAAGTTCTGCATTTAGATATAAT
+TTAGTAACTTCGTCATTATTCGTTAATGCCACAAAAGTATCATTCGTTATATATTTGTCA
+ATTTTTACTTTCAATTTTCTATATCCCATTTCTGGATGCAATAAATAAATTTTCATATAC
+ATGCCTTGCTTCTTAAAAAAAACCTTAATACCATTTTTTACAGTAAATGGTGGGAAATTT
+ATTTCTGAATCTTTATCAATCCATCCAGGATTTCTCTCTACTTTGATCCAAAACGTAATA
+GAAAAATTATATTTATTATTCATTTTTCATCTATTCCTATGTTTATCATTTCGTTCAATT
+TTTCTTGTGTCAAAATATCACCTGTATATTTCTCAGCAGAGGCTCCTTTGTTTTCTTGTT
+TTAACAAATTAGCAATAGCTGTCCAACCAATTAAACCTGAAGCAAAGGCATTGACAGCTG
+TATTGGGATTGATTAATAGCAGCCCTCCAATTGATGAGATCAATACAAATCCAAACCCTT
+TCCACCAAAATTTTACCTTAGTATCTCCTATGGAATAGAAAATATATTTAAAGAAATATG
+CAGCAAATGCTCCGAAAATTGAAGCAGCAATTTTAAAAAACACCCAAGCGTTTGGATCTT
+TACCTTCACATAGCCATTCAAAAACTATTTTCATTTGTTCCATGAATTATTAGCCTTTAT
+TATCACGAAATTATTCTTTTATAAGAATTACTATATCATTTACAAAGATCATGATATTTG
+CCACTCCTACTACAAAAAATTAAAGCATTGTAGATATTTTTACCTCTGTATCTATGTTTT
+GTCGTTTTTGGACAATCGCATTCTCTCCATATTGTTTCTTGAAATATTCTTTAAATTCCT
+CTGTTTTTCTTAGCTCTTTGAATAAGGGCCATTCAATCAGCTCATTTTTACCAATCACTT
+TTCTCTTATTATTATCCTCTTTTATCATTCGTATGGCTGTTCTAAAATCTCTTTCTATAA
+CAGCCTTTGCTATTAAATACTCTTCTGTACATAATGACCAATCAATTTCTGATAGTATTT
+TCTTTGATTCTTCATCTCGCTCTTGCCATAAATATGTCTGAGATAGATTTATTTTTAACA
+TTGTGTCTAATGCCAATATTCTAATTTTACCAAAACTATTTAATGCAAAATTTAAAATAT
+TTTCAGCAATGTTATAGTTTTCCTCTTGTATTTGTTCATATGCAATGGTATTTAAATTTT
+TCTTTATGCTATCGTCTGGATCAAGTATATTCCATACAATATGCCCGAGATATACAACAA
+TTAGAAATATAACATCACATGAATGCTGGAAATATTCAGGTGAAACAGATAATTTAGATC
+CAACAACTATAGTATCACTATTTCTTCCAACTTTTTCTAAATACGACTCATTAACAGAAC
+CATCACAATGGGTAAATAAATTACGCCTTTCAGTGATCTCAATAAACTCCTCTATTAGTT
+TTTTATCACTTCTCAGATTTATGTTAAGTTTTTTCTCAAACCACTTAAGATGATCATCAT
+GTGAACATCGAATAACTGAATCAACTTCTTTTTCAATTAAATATGTAATAGCCTTCTCTA
+TAGAATCAAATTTTTTAATATCTGCAAATGTTAACTTCCTATCTGAAGTATTTAATATTT
+CAGGCTGTTTATTCAGAACATAACGTATCAAGTTACCTATGTAGAAATCAAATTGACTTA
+TAAGAGATATAATATAATTCCGTGGTGCTATATTTAAAGATATTTCTAATTTACTTATTT
+TTTCTTTTATACGTATAAATCTTGTGAATTGGGATTCTGGAATTCTATATCCTTCACCTT
+TCTCTTTATCAGATATTTTCTCACATTTAGTTTCTAAGAATCTGTTATATTCAATCAAAA
+GGTTATTATGTAATTGTTCATACAAAGTAGCAGAAATTGGCAATGTATTCTTGATGGCAT
+CAATCGCACTTACGGTCTTGTTAAGGATATCAATAATTTCCATAAACTACCTTTTCTGTG
+TAATAAAGATTTGATCTTCCGTTCACCTCAAATATTCAAGATATTGACCTGATGCCAAAG
+TGTAGGAGAACAACGATTTTACTGCCGTTGTAACGTCTCCGCAGAAAACGTGACAATGGA
+CAAGCCAACTTTAACTAGTTGTTCTATAGAATTATTTTTACATGATATTCTCCAGGAAGC
+CAAGCAAATCATTACTCCACTTATTGTAAGTTTTTACTCTACTATACAAGGGTGTTGAGA
+ATAAGATATCCGTTGGCCATTTTATTTTAGCTATAGAATAGTAAGGTATAACTTTTTTGT
+ACATATCATTCATTGTCGCTCTATTTAAATGTATTGTACAATTTCTTGTAATCTGCAAAT
+GTTTAATACTATTACTATATGATCCTACAAGGGAACTAATCTTTACTTCATGTAATGCAA
+TTGCAATATTTAAAATTGAATCAAAGGATCCCCAAGTAGGCTCTTGGAACGAAGCACTTA
+TAGCTCCATAAGGATTTTTTCTCTTATTTATTTTATATAAAATATTATAGACTATCTCTT
+TTTCATTTTTTGTATTTAATATACTATTTCGATGTTGATAGCTATTATTAACATCGAAAT
+AACCTGTGTATTTTGATATCCAATATGATCTCCAATACGAATTCCATGCCTGCCAGAAGT
+AATTAATTATTCCATCTATTTCAAAGCGATTATTACATGATTCATTCTTGTTTAATAAAA
+AGGTACACTTTTCAAAAGAATTATATAAGGATAGATAGTTCTTTCTTAAATTCATACTTT
+CTGTAAAGCTTTAATAAAAAATTTTGTACGATTTATTCTATTGCTTACACTATGAGTTGT
+CTTTAAGCTTGATTTTACAAATTCTGAATATTCACCATCTTCAACTTTTTCATCTACCTC
+ACTTAGCATATTTATTATTTCACTAATTGATTCATTAGTATTATTACAGAATTTCCCTAT
+AGGTAATAATCCATCGATTATTTCTGAATTAATATTTTTTATGCCCCAATTATTATACAA
+TAATGCTGCAAATAAACTATAAAAATTAAAACCACTTAAAAGTTCTTTTTCTAAAAGATC
+TTTTAACTCTGTTTTGATGAAATCTAATGTTAGAAATAATTTACTTTTTATCTCATCTCC
+ATATATGAAATCTTTATCATTGATTTTGTAAAGATTATCAAGCTTTGAGACGCTCCTTGT
+GACAATGCCTTCTATAATCAATTGACATAATTCTGTGAAAAGATCTGCATCTATCATCCT
+AGAAATATCTCTTTGAGATAATATTTTATAATCTTCAAGTATTGGTGTGTATCGTTCAAT
+AACATCTTTAATAAACCATTTAAAATATCCTTGATAGGTAGCATGTCTTTGTTCCGGTTT
+ATTCAATGGCAAAGTATAAGAATTTATTCTTCTGAAAATTTCAATAACCTCATCTCTTGA
+AGCACCTACAGCTGTGTCTACTGAAATCTCATAAGATAAGAAATTTGATTTATCATCATC
+TGACAATTCTGAAAATATTATATTGGGATATTCAGAACTTATTTTTGATAGTTTAAATTT
+GTTATCTATAAAATCTATAATAGAAGTACATCTTTGTTGTCCATCAATAATTTCCCGTAT
+AGACCTTTTAGTTTTCAAATCTATCTTCTGTAATAAAGTAATTTTAGGAAAAGGAAATCC
+TTTTATGATAGTATCAATAAAGAAGGATCTTGAATTATTAGGCCATAAACCTCGTTCCCT
+TTGATACTCTTTGTTAATTATTAATTCCTCGTCTGTATAGTATTTATATAGATCAGCTAT
+ATTCATTGTATTTCGTATAATTTTCATTCTCGCTCCTTATAAAGGACTTCATTTACCATG
+ATATTAAAGTATGGTATTAAATCAATTTCTGTATACTGATCACATGAACTGTTTGATGAA
+GTGTCATAACGTTACCCACACAACACAAAACAGCAACGTAGCGATATGCACCCAATCTGC
+TCAATGTTATTGTTAAGTTTTTCCCTTTGATAATGTAAATAGAAAACCGCTCAAGGCACC
+TCCAATATCATTAAGCAGCCTAGCATGATCGCCATTTAATTCGTAACTTCCTGGAGCAGC
+ACCATGGGCGGAACCAAAATGTGTTCTTAGGCTGCCAATAGCACTGAAAATGCCCTTTAC
+ATTCCCCAATAGTCTTTTTAGATCATCATTTACTTGCTCATCTGGTGAAAGATTTAATAC
+TTTCATTGTTTCCGCAATTAAACTAGAAATATCTCTCCTAACAGGTTGTGGCTGCTCTAA
+ATCTGATAGTATCTTTTTACAAACTGCTTCAAGATAACTACATGTTCTTGTGATGGAATC
+GGCGGGATCAGTTTGAATGCAGTTTCGTGCTTTCAACCAACTTCCATACAAATTGTGATC
+ATCAGTCTCTTGAAGTACCTTCGTTGTATGTTTAAATATCAGATTAGATTCACTATTAAG
+CATCTTATCTATAACGGTATAATTATTAGCTGGCAGCTCCATATCATCCAACTGGGATGC
+GAGATCTTCCAGCAACGAATTTAATGACTCTTCGCTTGATAATGATTCAAGCCATTCGAT
+AGGCGCGGAAGATAGTTCCTGTATACTATAAGTACGCCAATCAACCGGGATATGTTCGAG
+TGAATCTTCTATATCCATATAAGTAGATCTATAGGCAATGGCAAGTTTTTCAGAATTACA
+AAATAAGTACCCGTATACCCAATCGTCTGGACCAATCATCCCCAGATGTTTTTCTTTTGA
+ATGACCAGAGATAGAGACATCCTGCAATGTCTCTTTTATTACAACCCCAAATTCCTGCAG
+TTTTGGATAGATCTTATCTCTTTTGGATTTTATTGCTAATACTCTTGATCTAATGTCATC
+TATCGTAGGCATTTTAATAATCCCCCAAGTAAACTTACCAGCGCATAGATTAAGTTTTTT
+GAGTAGAAAAGGATCCACAGTCTTTTCTGTATATAGACCCAATAAAAAGTTAATAATCTC
+CTTGTATTTGATAAAAGCATGAACGGGTAGTTTTGGGGCATAAGACCAATCACAATTCAT
+ACTTATATCTAAATCTTTATATGAATAATTGTAACCCCACTGTCTTCATAGAGCAACAAA
+AAAACTCAACTTTCTCTAACAGCTTGCTATCGTGAGAACTTTATAATCTTGCATTCGATA
+GCCTTTACGCCTCTCGCTTAGCTCTTTGAGCAGAACGATCAGCCAGGCTGGAAGTCAGTG
+CCCTAACTGTTTCCAGATCCTTCTCATCCAATGCTTCCAAGTCCTCTACGATATCTGCAT
+AGCGTTTCGGTACTTGCCAGTTGTCCGGATTCTTGCCAGTTACCAGATATTCTACGGTAG
+TATCAAGCACCTCAGCTATTTCTACGGCTTGATCCGCATTAGGCATTGTTTTTCTTGACA
+TCCACTTCCGAAAAGTTCCAAAACTCACGCCGGTTTTATTGGCGACCCATTCTTGAGTTG
+TCTTTTGCTCTTTAATTAAGGTCTTTAGCCTTTCCCAGAAATCCATACTTCATTATCGGC
+TATAAATAGAGCAAATTGTCACAAAAAACACTTGACAATGTTCCTTTATTGCTCGATTAT
+GAATGTATGAATAGAGCAAAAATGGAACATAAGAGTCCGCCAGCTGTGAAAGTTAATCTA
+ACTGAGGATGAAATTAAAAGAATTGATAAGGGTCCCTTAAAAGCAACTTCAGGGAGAGGT
+CGTGCAACTTGGGTTCGTAACCTCATTACCAAGGAACTTGACCGTTACGAATCCATCCAG
+TCCGGCAACACACAACTCGACTCAAAACCATTTAATCAAAACAAGGAGATGAAATGACGT
+ACATGAACCAGACCGAAGCGGCGAAGTACCTTCACGTATCGCCCAGCTATGTGAGCAACC
+TGACCAGACAAAAAATGATACCTCACAAGCGGATCGGCGGGAAAGTGATCTACACAAAAG
+AGCTTCTCGACCGGTGGATACTTGAAGATTCATTACGAAGCGTCGGGATAGACCCGAAGA
+AAAGCCGCCTGAGCGACACGGTTTTAGGAGAAGAGCCTTCAACTACGGGGGATGAGTAAC
+GGGCCTACCCGGCCGGAACCTCAGATCGGTGATCTTTGACAGATAAGAGAAGGGATTAAG
+AGATAAGGATTTAGTGCTGTCCTGTATAGGGAAACCATTTGGAATGCTGAGAAAGCAGCC
+TCTGACCAGGCCATTACCACTTGTGGGGTTCGAATCCCCGAGGGCAGCAAATCATAATCT
+GCTACCGGTCAGTAGACCGGCAATCTACTCCGTGAAAAGCGGGAAAGGAGGAAAGCGTGA
+CAGACAAAACGAAGCGCATTATAGCCTATGCGCTGACTGCGATAGCCGCCGCAGTTTTGG
+CGTTTGCCGAGCTGTTTGGCTGGGACCTGCCGGACTGGGGAACAATCATGAACGTAATAG
+TCATCATTGCATCTCAGGTCTTCGGCATTGAGTGGATTCCACCCAAGCGGGCAAGCAATG
+GAACCGGCGGAAACGGTTAAAAATTTCAGATGAGATAACGGCTAAAAACAGGCAAACGAG
+ACGCAATCGTTAACTGCGTTGGCGCCCGGGAAAATTAGATAGGGCTGACCGGGGGCAACC
+AGTGAGACCGCAAGTAGACGGGCATAATTGAGGCGAAAGCCGAGTGAATGATCAGGATGG
+CAACCTGATTGAAAAGCGTGTTATGTCGATAGCCTAAGCTCCGGGTCGCGCCGGACACTG
+GTTATTGTTGATCTTACGGTATAGATGTGTTGGCCACCAAGTACCAGCAATGGTGATTTA
+TATCGCACTATCAACTACCGAGCGCCGGGGAATCGTGGCGCTTTAAGTGACCGGATGACC
+AACCATATACCTTTTCGATATGGCGGTAAACAGCACCTCCCCAAGGCGTAACGGTCGTCC
+GGTTTCTTAACTCCCTCGTATGGGGGAGAAAAACAATCCGTGATGCCGGAGAAATAATAG
+CATCTATATTTTCGCGGCTGTATGCCGGGATTCAAACAGGTTGGATCGGTAAACACCAAT
+TTTCCTACCGGTCCAACAACTTTCAACCTTTTTCAAGGAGGACATGGTAATGGAATTGGA
+AGAAAAAGAAAGCTTGCAAGGTTTCATAGGAGTGAAAAGGATCAAAGCACGACCGATGAC
+CAGGCGTGGATACAACGGCTATCGTGGCTGGCAACTTCCTGCGGATGAAAATGGAGATGA
+TGAAGGGATGCTTGTCGAGTATGTCGATGGCGGTAAATCCAATCATCCCGCACATGAGGG
+CTATATCAGCTGGTCACCTATCGATGTTTTCAATCGTGCATATCGGCCATGTGATGCCCT
+TACGTTTGGCTTTGCAATCGAAGCGGCAAAGGCCGGAGAGAAGATTGCCCGAAAAGGCTG
+GAATGGAAAGGGCATGTTTGTCTTCTACCAGAAGGGCTACCCGGAAGGAATACCGATCAA
+CAAAAATACCGCAGAGGCAACAAGATTGCCGGAAGGAACCGTCTGCAAATTCCGGCCGTA
+TCTCATGATGAAGACAGCACAAAACGACTTCGTGCCATGGGTTGCATCGCAGACCGACAT
+CTTAGCGGAGGACTGGGAGATTATCGAGCAGGGAGAACAGAAATGAGTATTGAAACAAAA
+GAAAAGGCCGCTCCAGGCAAGGATACGGCCACAGAAAACAACCACACCAATACTACCATG
+ATTGGATTCAGGCAGCAAGAACTTCACGAGATCGAGGAAAGCCTTGAGGAGATGGACCAC
+AAGATACAGGAGCTTTTCCGTTTCGGAACCGCCCATAACCGGGACATCTTCGCCATGAAG
+CTATCTGGTGAGGTACGGAGAATCAGAGATCAGTTGAACGAAGGGAGGCTGATGTGACGA
+TCGAAAAGACAAGCCAGATCAAGGCAGGTGATAACCTTGTGATGGTGATCTACGGCAAAG
+GCGGTGTGGGAAAGACAAGCTTCACCGCCTCAGCTCCGAACGTGATCCTTCTCGACTTTG
+AGAACGGAACCAAATACCTGGGAGCCCGCGGCTTCAATGTAGATGTGATCAGGCTCAAGA
+GCTGGCCGGCAAACGCTGAGAAACAGAAGCTTGCGGCCTTGGTTGCACCCTACCACACCA
+TCGCTCTTGATCCCCTTGGGGAAGCGATGGAGAAGCTCCTCAATTCACCGGCGTTGAATG
+GCCGGAAGTTCCGACAGGCAGACGGATCGTTGACCATGGCAGGATGGGGCGAAGCTAAGG
+CACAGATGCGAAGCTTCATTAAGTGGCTCCGGGATTCCGGAAAGAACGTGATCATCGTCG
+CTCACGTTTCGGAAGAGAAAGACGGGGAGATGATCACCAACCGCATACAGGTTGCAACAA
+AGCTCAGGGAAGAGATACCGAACATCGTGGATGTTATCAGCTACATGGGAGTGAAGATGG
+TCGACGACAAACCTGTTCGCATCCTCTACACACCCCGGCAGGGAGACCAGTTTGACTCAA
+AGGATCGAACCGGCCGGATTCCCTTGACTGTACAGGTCAGCGAACATGATGGCTTTAACG
+ACCTGCTCAAGGCTATGGAGATCGGGCAGCAGAACATCCCTGAAAACAAGATGCCGGTAC
+CGGAGGCAACACCTACCACATCCCAGGGGCCGCAGGACGAGAAGCATACGGAAACCACAC
+CAAAAGACCCGGACGAGGAAGCGCGAACACAACTCAAGTACCAGCTTGACGGTGCCATTG
+TCGGGGAGCTGGTTACCAAGGCCGAGCGGGATGAGGTGCTTGCAAACAGCAAGAAGTACA
+AGGGCCAGGTGCTTGAGGCCTACATCAAGAGGATCAGCGATGAACTCTTCAATCTCCAGC
+AGAAGGCAGAAAGCGCAAACAGCACCGTTGCACCTGAGCGGAAAAATCAGCAGGCAGAGA
+AACCGGAAGAGGTTTTGGAAGAACAGCCGCAGGACGACGAAGAGTATGCGGCAGAAGAGG
+CCGGACAAGCAGAGCTCGAAATCTGGTAGGACAGGAGAAGGACATGAATATTACGGACAT
+AACCGTTGAGGATATCATCGAGGAACAGGAGACGGCAGAAGAAACGGGACTTGAGAAGCT
+CAAAGGCGATATTGATGAAGTGATCAGTCGGATGGAAGAGCTTTCCATCCAGAGTGACGA
+ACAGCTTGCAGAAGCAGGTCAGTGGCTTGTGAAGAACAAGCAGACACAGAAGATCGTCAA
+GGACCACTTCGAGCCTGAACGCAAAGAGACCTATGCGGCCTACAAGGCTGTGACCGATCA
+GATCAAGAAGTACACCGACATCCTGACCAAGGCTGAAAGAACCGTCAAAAAGAAGATGGG
+AGCATACCAGGCGGAACAGGAACAGCGACGCATCGAGGCAGCAGAGAAACAGCGTAAAGA
+AGCGGAGAAGGAACGGGAGCAGCCAAAGGAAAAGGGAAATTCTGCACCTTCTATTCCCCT
+TCCCCCTGAGAAGAAAGAAGAGCCGGTGAAGATTGACGGGGTTTCCTTTTCGGATAACTG
+GACCTTCATCATTGAAGAGACCGACAAAATCCCGAGGGAATACATGATCCCGGATGAGAA
+GAAAATCCGCCAGGTGGTGAAGGCGTTAAAGGCTGATACCAATATTCCCGGTATCAAGGT
+CTACGCGGAAAAGACCGTCAGTGCCAGGACATGAGACCATGACAATTGAGGCACGAATAA
+ACATTGACTTTGCCCCTGAGGAACACACCTACCGCGTTGACGGCAGGAAAGTTTCCAGTG
+TGACAAGCATCCTCAAAAGTGAAGGGTTCATTGATACCCGGTGGTACAAGCCATCGGGTA
+CTTCTCGCGGGGAAATGGTCCACCAGGGAACGGAGGCAATCGACCGGGGCCACCTTACCA
+TTGCACAGTTCCCACCATCGGAAATTATTCCCTACCTCAAAGCCTGGCAGGCCTTCAAGG
+CTGATATCGGGGTGAGCGAGTTTGTGATCATCGAGCTTCCGATCGGCAGCAAGGTTATGG
+AATACGGGGGAATCCCGGACCGGGTTGCAGTGATCAACGGGGAGTATTGGCTTCTTGATA
+TCAAGAGCGGAGCACATGAGCTATGGCACGGTCACCAGCTGGCCGCCTACAAGATAGCCC
+TTGAAGAGACCTTCGGACTGCCGATTGCAAAGCGTCGGGTGGTGCACCTGAAGAAAACCG
+GGAAGTACTCAATTTGTGGGGAGGACAAGAAGATCGGTTCCTTTGACCTTCCGGTCTGGG
+AACAGCAGTGGATTGCGATCGCGACCGCTCGGCTGATCAAACAGCGGTACGCAAAGATAA
+AACCGGAGACTGTATGAGCCAGAGAGCAATTGTCATTCCAGCGGCCGAACGGATGAAGAC
+CGGAGAGCCGGGAGTCGTTTCCTTCCGCGTCGGTGAGGTATTCCATGAGTACCTTGTACA
+CCTTTTCAGGTACCAGGAGATAGAACGCAAGTCACCATCACCCTATTACTCACTCAAGAT
+CGACACTCCAAAGCGGCCGAGGACAACAGGAGAGAACAGCCAGAACCATCATATCAACGG
+TCACTGTCAACAGATAGCCGTTGATACCGGCCAGCCATTTGAGGACGTGAAGAAGTACGC
+GAAACAATTCGCGCTCACCATGGGCTACCCCATCCTTGAGGACGAGAACGGCGAGCCTAT
+ACACGACCTATGGGGAAAACCGCAAGGGATCAGTGAGTCTGATTGCAGTACGGAAGATGC
+CGCGATCCTGATTGAAGCGATCCACCAGTTAGCGGCGGAAATGGGAATCAACCTCATCGA
+GGACTAAGGAAGCACCATGGGAAAAACAACAAAGCAGAGAGCAAAACCGGTACGAAGACA
+GAAGACACGACGGCAAAAGGCCGTAGATGCGGCAGACCGGTGGTTCAGTCTCTACATACG
+ACAACGGGATGGGAACCGTTCAGTGACAAGTAACTGTATAAGGAACCTGACCTGTTCACA
+CCTGTTCTCACGAAGATTCTACGCTACCCGCTGGGATGAGATGAATGCCTATTGCCAGAC
+GGCAGGAGAGAACCTTTACCACAACCGGGATGCAGGACCTTTGACCAGTTACTTTCTCGA
+TGTGCATGGAGAGGAAGCCTACCGGAAGCTGTATGAAAAGGCCCGCTCAGGGGCCAAGTT
+CAGAACAGACGAGATCGAGGATATCGCTGCTTACTACAAGAGCCGGTTTGAACGGCTTAC
+ACAGAAGCAGCGCGACTTTTTCAATGTTATTTAGGGAGGGACTATGGCAAACGATATTAC
+CAGTTTCACGGCAGTAGGACGAGTGACCCGTGATGCGGAATTCCGATACACGAACGGTGG
+AACACAACTGTGCAAGTTCAGCATTGCGTCGAATTACAGCAGGAAGGTACGGGATAACTG
+GCAGGATGAAGTCAGCTATTTCGATTTCACCCTATTCGGGAAACGGGCAGAAGCACTTGC
+TCAGTATCTCACCAAAGGTCAGCAGGTGGTGGTTTCAGGACAGCTCAGACAAGACCGGTG
+GGAGGACAATGGGGAGAAGCGAAGCAGGGTTGCGTTCTTCGCCCAGGATGTACAGCTGAT
+CGGGGGAAAGCCCGCCGGTCAGAGTAACGGGCAGTATGGAGAGGCCCCTTACCAGGGTCC
+GCCGCAGAACCGGCAGCAAGGCTACCAGCAGGGGCCTCCGCCTAACAGCGGCTACCAGAA
+GCCGACAAGCGGCTATGACCAGTGGGGACACCCCATAAACCCCGGACCTAATAATCAGGG
+CCCGGAACAGGAAATGAACTTCGACGACGACATACCGTTTTAAGGACGAATTACCATGGC
+ACGACGCAGAATGATCGACCCGTCAATTTGGAGCAATGAACAAGCGCAGTGTTTATCAAC
+ATCGGCGTTCAAGGTGTATGTGTTTCTCATTTCACAGTCCGATGATGAGGGGTACCTGAA
+GGTATCCCTCGTCATGTGGCCCTCATTGATTAACCCGGTTGACAGGAGCTACACGAAAGA
+ACAGCTGGTAAATGACCTCAATGAGATTCTTGCCGCGGGGCTGGTGGAAGCCTACAAGTC
+GGGTGATGAGGTCTATGTGAAACATCCTCATTGGACACTGTACCAGACCATACAGAAGCC
+TTCAGGAAGCAAATACCCGAAAGATGGCGAAAGAATCTACCGCATAGAGGAATATCGTAA
+TGATATCGGTACGGTACCACATGAATATGATACCGATACAATACCGGTAAACGACCACTC
+TCATTTCGTACCGCCTAAGTTAAGTAAAGAGAAGTTAAGTAAAGATAATACTAAGATACC
+TTCGGTAGCATCGGCAGAGCCTCAGCCTGAGCAGGGAGAAGCGACTAAACCGGCAGAAGA
+GCCGGAGCCGGAAAGCTCTCCACTTCCCCCACCCGATTCGCAACCCGATCCAGAACCTGA
+CATCGAACCGGTTCTTGAGCTTGAATGCCAGGCACCGAAGAAGCGCAAAGCCAGCAAGGG
+GAAAGCACCTACCGCCGGGAAAGAACCGGCAGACCCGCTGTACCACTCGATCAAGGATTC
+CTTCCTCGCTGTGGCCGGAGACTTCACGAACTGGGGCAAGGAAGGCAAGGCGATCCACGG
+GATCATCGAGAAATGCTCACGCGCCTCACCGGAAGACCCTGCCGGGTGTGCCGAGCGGAT
+GATCGGGGAGTTATGGCGGCTAAAAAATTCCCGAGATCGGTTCTACCGAGATCAGCCCTT
+TCTCCCCTCCACCCTCAACGCTTCGGGAATCTGGGACCGGGTGGCGGAGCAGCTGAAGAT
+CACGGCGGACGAGCTGGAAGGTGCGAGGATGTGGGAAGCGCTTGACCCCTACGGGGTGAG
+AGGTAAGGCAAAGCAGGCGGTGGGAGGCTAACAGGTATGCAGTGGAACAGCAACTGGAAC
+ACGAAAACGTTCATGGCGATGTTGCAGCAGTACTACGGCAAGCTTTCGCCGATCCACGCG
+GGAGCGCTTGTCGACTGGCTCGATAGCAAGCAGTTTTCGGGGGAGTATCTCAAGAGGCTG
+TACCAGGAGATAACCGAGAGCTACTCAACGAAGTTCGGCCGTCCCTGTGATCTTGCGATC
+GTGAAGGAAGCTGACGAGCGGCTGTACCCGCATTACTTTCCACCGGCGAACCTGCTTGAG
+GGGGACGGGAAGATGATTGAGGAGCGGGTGGCCGAGCGGGAAGAGGCGGCACAGTTTATG
+CATAACCTGATCGAGAACCTTGTGAAGAAAAAGCGGCGGGTGAAGCCAGTGAAGAAGCCG
+AGGAGAGTGCGGAATGACATTCACAGATAAGTACCTGAAAGAAAGGATTCCGGCGTTAAA
+GACCGTTTTCAAAGGCGATGATCCTATTGAAAAGGAAATGGTACTTGAGATAACGGACTA
+TGACCGAGGGATCATTGAAATGAAAGCTGGTAATGAGTACTACCGGTTCCGGCATGTTGA
+TCTTGAGCGAGCCGTTACATCGATACAGGTGCGGCAAGAGGTAAATGCATGAGCGAGTAT
+GGTGTAAGAAAAGTTTGTGGGAATTGTAGATCCTTCGAAAAGTGCTTTGCCGAATCAGAG
+GAGCTTATCGGAATCTTTTCCTCCGGTTGTCTTGCGGCTGATAAGGAGGAGACGCGGCAG
+ATGCCTGCGTGTGGAGACTTTGAGCCGATGATGAAGCCGGTACCGCTGTCCGGGGAATAA
+AGGTGCTGGTGTTGGGAGGGGCAATGAGCACGATGATATCGGCGGACTGTAAGGATCAGC
+GGGTGGCTGACTCTATCCGCTGGCTTTTGTATGAGCTTGAGAAGGCAAAAGACGGCGAGG
+TGGTGGTGTCGTTCTATGTGAAGGGCGGGAAGGTTCGGGGAGTGGAGAAAGTGGTCAGGG
+ATAAGAGTATTAAGCCGACATAGGACATACACGGAACATGTTGTGTGAGAATTGGAAAAA
+AAACTGGCTGTATATTGTTTTTATAAGTTTACGGTATATACATTATGGTGGTATAACGTG
+TATAAATTGTTTTTAAAAAACCAAACTAAAAGAAAGGATGGAAGGATGAAGAAAATCTGG
+ATTATTCCGGTGTTGCTCCTGTCGATAGGCCTCGCCGGTTGTAGTATGTTTGGAAACGAC
+GGGGATGACGACGATGATAACAATACCTCCGCTCCCTTTACTATTGTTGGTTCCTGGGTT
+AGGGAGTCGCCCTCTTATTCCGATACTGATGTCTATCTATTTGCCTCAGATGGTACGATG
+ACTCTCTATAGCGATTATGCAATGACAACCGTAGCTTCAGTATGGACCTGGGCATTATCT
+GGCGATACATTAGCCTTTGATGGTGACACACCCTTGCAAATGACAAATATCAGTGAAAAT
+GAGTTTATCATGGGTTCTTCTACCTATTATCGTAAGGGGTTCGAGCCTGATGGACATTCT
+GAATCATTGCCTGTTGGTTTCTGGGTTATGGCGTCTCCCTCTTATTCCGATAGTGAAGTC
+ACTCTATTTGCCTCAGATGGGACTTATACTCTTTATAAAGACTATGCAGTGGCAAATGTA
+AGTGAAAAAGGGACCTGGTCATTATCAGATGACAGTTTAACCGTCGACGCTTCTTTAACT
+AACGCAACAGAAACAATAACGGTTGTTAGTGAAAATGAATTTACATGGAATGGATGGACC
+TTCTATCGCAAAGGCACCGAGCCTGATGGACATAATGATCTAATAGGTACGTGGGTTCCA
+TCTTTTTACTCTATACCTGATACCGAAGTACATCAGTATAAAGCTGATGGAACCTTCACA
+TACTATAGTGATTACGCGATGCAGAAGATCTATCGTGAAGGTACCTGGACGTGGAACTCT
+GATCATACAGTCCTTACAATAGTCTTCACACGCTACGCCAATGGTTCTCAAGACTCTCAA
+GTTAAGTTTCTCAGTGGTAATAAAATCCAGTATGGTGCTGAGTACTTATATCGGAAAGGA
+TCTGAACCCTGTGGGAATGTCTTGTCCGGTTCTGCTACAACGCTGGCTGTCGATACAGCG
+TATACAGGTGAATTTACTGATCTAAGTGCTAAACTTTTTTGTGTAACGGTAGAGGATGGG
+GCAAGCTATGAGATTTCCTGGGATGATTCTGATGAGGGTAGCGGTTCCTATACTGGAGAT
+ATATCAGTCTCCGCATATAAAGCGGATAAGGCAAGCAAGTATTTTGCAGAAGAAGATCGT
+GGATATTCTGTTCCCCAGAGTCTTTCCGCTAATGGCACTGTCATGTATATCGTTGTGGTT
+CCTTACCTTGAGTTTTATTTTAGTGACTCCCTTGGTACCTACAGCCTAACCGTAACAAAG
+GTGACACCATAGTAGGCATATTTCCTAAGGCTCTGTGACAAAGAGTAGATATCGGGCATA
+GATTTCTCTATGCCCATTTTTTTTGTCTTCGTGAAGGGCGGGAAGGTTCGGGGTGTGGAG
+AAAGTGGTCAGGGATAAGAGTATTAAGCCAGCGTAGGACATACACGGAATATGTTGTGTG
+AGAATCCTGAAAAAGAGCTACCTGTATATTGTTTTTATTGGTTTACGATGTATACATAAC
+AAGTATAATGTGTATAGTGTAAACTATAAAACAAACCAAAAGGAAGGATGGAAGAATGAA
+AAAAATCTGGATTATTCCGGTGTTGCTCCTGTCGATAGGCCTCGCTGGTTGTAGTATGTT
+TGGAAACGACGGGGATGACGACGACGATGATACCGCTGCTCCCTTTACTATTGTTGGTTC
+CTGGGTTAAGGAGTCGCCCTCTTACCCTACTACTCATGTCTATGAATTTGCCTCAGACGG
+ATCTTGTAATATTTATGACAACTATGCAATGACAGGCGTACCGTATAAAACAACCTGGTC
+ATTATCTGGTGATACTTGGAGCCTTGATGACGACTACTCAGCTACAATAACAATTATCAG
+TGAGAATGAGTTTACCGTGAACGACAGCACTACCACCTATTATCGTAAGGGCTACGAGCC
+TGGTGGGCATGTTGATGAAACATTGCCTATTGGCTCCTGGGTTATCGACCGTTGCTCTTT
+CCCTAATACTAATGTCTATCTATTTGCCTCAGATGGGACTGTTATTCTTTATGCAGACTA
+TGCAATGACAACCGAAGATGCTGCAAGTACCTGGTCATTATCTGGTGATACTTTGACCCT
+TGATGGCGACTCAGCTACAATAACAATTATCAGTGGGAATGAGTTTACATGGGATGGATA
+TAGCTACTACCGCAAAGGCTACGAGCCTGATGGGTTTGCATTGGATGGACCTGCTGCCTC
+TCTGAGTTTAGGAACCGCCTATGACGGGAACTTTACCGATGGAGCTGATTTCGATGTGTT
+TACTGTGGCGGTAGAAGATGGGGCAAACTATGATATTACCTGGGATGACTCTTTTGACGG
+TAGTCACCACTATAGTGGAGACATAAAGGTTATTGCATATGCGGCAGATAGAGCAACCGC
+TTATTTTTTTGACAAAGATAATGGATATACTCACCCTGAGACTATAACCGCTAGTGGAAC
+AATCATCTATATCATTGCCCGTCCGTATGATTCAGACTCGGTAGGGACCTACAGCCTGAC
+GGTGACAAAGCAGTAGCATATTGTTGTTATCACCATGAACTAAAACACATGACGGGCATA
+GATTCCTCTATGCCCGTTTTTTTATGGTTTCCCCCTTGATGCAAAAATTCTTCCGTGATA
+GAATTTTTCTTGTTAGATAACCCAAGGTAAGCATACTTACCCTGGCCGTTCCGGACGGAT
+TCCGGTCGCTCTAATGGTGCAAGAAGCAATCAGGCGGCGAAGTACCTTACGTTAAACACT
+GTAACAGGTGTCTTTCGTGAGCTACTTCGCCGCCTTTTTTTGTGCCCTTTGGCTTTGACA
+GAGGAGAGGACGAGAGACTATGGGAAGGCAGGATAGACGAAAGAGTTCGACACAGCGCGG
+GTATGGAGCAGCCTGGCGGAAGATACGCATCGAGGTCCTCCAGGCCTGGGGCATCCCGAG
+GCTCCATGCAGATCACAGCAGAAAAACTGCGAAGTTTGACAACGGCTTTGGTAACCAGAA
+GAGGAAGGAACCTCGTCCCGTTTCCCCTATCATCAATCAGGGCACAGCCCGCCTTACGGA
+GGGGGGATGTAAATCTCTGGGGGAAAAATGCCCAAACCACGCGCCTATACAAACAAACAC
+TCTGTCAGCAAAGGCAAAGGGGGTATAGGCCATGAGTCGCGGCGGACACAACAAAAAGCC
+GACTATTTTAAAGCTTACCCATGGCACCTTCAGAGAGGACCGGGCCAATGAGAAGGAGCC
+GGAAGTCAAGGCACTTGATGAGGCGCCCAAGGCACCGAGCCACCTCAACACTTTTGCAAA
+GAACAAGTGGAAGGAACTTGCCCCGGTGCTTGCACAGACCCGTGTACTCTCTGCGACTGA
+TCTCACCATGCTGGAAGCCTTGTGCGAGGCATACGGACAGTACCGGGAAGCGCAGTATGC
+GGTCTACCACTACACAGATGATGACGGGAAGAAGAGGAAACGAAACCTTGCCCAGTACAT
+GAGTGGGAAAAACTCTCAAACCATGCCTGAGTACACGGCCATGCGGCAGGCGTTGTCCAT
+GGTCAAAACCATATCCGCAGAGTTCGGGCTCTCGCCTGCAACCCGCTCCCGCGTGAGTGC
+AATCGACACACCTGAAGCAAAGGACCCTATGGAAGCGCTTTTAGAAGGGGCCGGATGATG
+TGGAAGCGACTCGTACTTGTGGGGCTTTTGATGAGTAGCCTGTTTACCTACCGCCAGTAT
+GCCCAGGATGTTGCAAGCGGGAAGGTTGTCACCTGCAGGTGGGTGAAGCTTGCTGTAGCC
+AGGTGGGAAAATGACCTCTTACGGCAGAATACTCCGGATTTCCCCTACTACTTTGATGAG
+AAATGCGCCAACAGGTATATCAGCTTTGCTCAGCAGCTTGAGCACACGCAAGGCTTCAGC
+GGGAAGATCGTGCTTGAACCCTGGCAGCAGTTTGCCTGGGCGAATATCTTCGGGTGGAAA
+AGTACGGCCACGGGCCTGAGGCGGTTTCGAAAGGCATACCGGGAGGTTGCAAGGAAGAAC
+GGGAAGACGGTCGAAGGGGCAGCAATGATGAACGCCTGCTTTCACCTCGATAAAGAGATC
+GGGGCCGAAGAGTTCTTTCTGGCGGTGGACCGGAACCAGGCGAAGAAAGGCTATGACGAG
+GCGGTACGCCAGAACCTTCGTAACCCTACATTATCGCGGCTTACCAAGGAGTACCGATCC
+TCAAAACGCCTTGTAAAGGTCAATGACCCTGCGGCCTTCATGACCCCGGTCTCAAGAGAT
+CACAAGAGTCAGGACTCCTGGAACCCGCATGCGATCTTAGTGGATGAGTACCATGCCCAC
+GCGACCAATGAGCTGATCAACGTGTATGAGTCGGGCATGGGAGCACGGAAGCAGCCCTTA
+ACGATCATCATCACCACGGCCGGGACGAACATCAACGGGCCTGCCTATCAGGAAGAGCGC
+ACGCTCGTTACCAAGATCCTTGAGGGAAGCATCGAGCCGGTTCCGGAACACATCTGGGGG
+ATCATCTACACCCTTGATGAGGGGGACAGGTGGGAAGATCCTGCGGTGTGGATCAAAAGC
+AACCCTAATATGGGAGTGAGCTTTTACCGCGACTATCTTGAAAAGCGTATTGCAGAGGCC
+AAGGGCTCGCCCCGGAAAGCCAGCGATGTTTTGACGAAGAACTTCAACATATGGCTTTCC
+TCTCCCACCCGGTGGATGGATCACTCGGTGTGGATGCGGGGAAGCGCTCTGGTCATTGAA
+GAAGAGCTTGTCGGACGAGGGGCCCGTGGCGGGCTTGATCTATCGATGACAACCGATATC
+ACGGCCCTGTGCTGGGCATTCGGTGAGAAGGACGGGCTGAGGAGGGACTATCAAGAGCTC
+TTGATCAGATACGAAGGCTTAGAGAGGCAGAACCGGCAGCAGCAAACGGCCCTTAAAGCC
+GGGGGCTCTGTCCTGGCCGCCTCTATCATTGTGAATGTGCTGCAAGCTGTGTTTTGA
+>NC_014364.1|provirus_2666253_2703772
+ATGGGACGAGCAAGGAAGCCTTTCAAGTATTATTTCCGTCAGGTTAAAGGAAAGAATATC
+TGGTATTATTCGATTTCCCCGGTTTCTGGTGTGCCTTTCGAGTTATGCGAGGACCGGAAA
+AGTAGCCATATAGAGGCTGAACTTGACGGTTCAGGCAAGCCAAAGAGATCGAGTGAACAA
+AAGATAGTACGCTTTTGCCTTAACAGAATACGCGAGCTGAAAGACGGTTCAGAATCACAA
+TCGCCAACGCTCGCGGAATTCCTTCGTCCATACTTCACGCCAGAATGCCCGCACATTACC
+CGCGTTCTATCAGACGGCAGGCGTTATTCTGACACCTTTCGTAAAGACCAACGATCACGA
+ATAGACCGTCTGGTTCTTACGCACCGAATAGCCGAATTCAGAATGGACGAACTGACTCCG
+GGAGATATCGAGGACTTTAAAAAGGATCTTCGAAGGTCAGGAACAGGAACGAGAACAATC
+AACCTTACCGTCGGAGCGATAAGGACAGCTATCAATGAGGGGCTTCACAGAGGCGACATA
+AAAAACGATCCAACCGTCGGGGTACATAGTATTAAATCCGACGAAGAGGAAAGAGGAATT
+TTCTCAATCGAAGAAATTAGAAAGATGTTTTCCTTTCCTGGTGGATTAAGATTGTGGGGA
+TATGATACCGGATACCACGGATCTCCGTCTGGGGAGAAGGTATTGCCGATTATTCCTTAC
+ACTCTTGCACTCTTGATGTTTGCAACCGGTGAAAGGCCATCCGCCATATTGCGACTTAAT
+TGGGAAGATGTAGATAGTGATATGATCACGTTCAGGGTTACAAAGGCGGCAGGGGCCAGG
+AGTATACCCATTGTCACGATGGCAACAAAGGCGCTTCGTGAGCTCTCTGATTCAATGCTG
+CATGTGGCCCCTGCCGATCCTGTTTTCTGTCATGACGACACTGGCCAGCGTTTAACATAT
+GCGTTTTTCCCAAAACGTTTCGCCCACATGATGGCTACGCTTGACCTGCCGACTAATGAT
+GCTGACGGACGAAAGCGAACGCCCTACTCACTTAAAAGTTCTTTGATTACTCACCTCATT
+GACGGCGGAGCCGATCCTATCCTTGTACGGGAATATGTAGGACACTCACACGGGACGGGT
+GAAAAACGGCTCACTAAGGTACAAAGTAGGTATAAAAAAGCCCAACGAGAGAGGCTTAAG
+ATATTGCTGCCGGATATTGAGGTTCTTCTTTCTGCGGAATCTGTTGTAATAACAGAAAGT
+TAAGGAGTATCCTCTTTGGCCAAAAGAAGTAGTCTCCAAGCGGCTGTTGGTATCCCTCTC
+TCTCCCCCTACCCACTTTCTAATTGTGCGAGGGTTGACCCCTGCAATCTTGGCAGCCTGC
+GAACCAGTTAAGCCTTTTTCCTTGAGCAGTGCCCTGAGTTTTGCCGGTGACGGTGCTGTA
+TTTTCAGCAATTGCCCATTCTGAGTTGTCAGGGTAATTATAAGAGAGCTCACCCGGCTTG
+TCTTTATTGCCCTTTCCTATGTATCTATTTGCCAGGATATCAATTTTACCATTTTCAACT
+TTGTAGTATATTTCCTCCCCCTCTTCGTCGTGTACAAAAATCTGCAAGTCGCCACGTTGG
+AAGATGATGAAATCACTTTTCGGTCTTAATTTATCTTCTACCATATTCGCCTCCTCCCCA
+TTGAGGGAGAGGCGGGTCATAAAGACCCTGCCTCAGCGAAGCTATAATACCGGCCGTTAC
+CAATGATTATATGGTCAAGTACCGGTATCCCAAGTATTTCGCCTGCATCATGCAGCCTTT
+GTGTTATTTGCTCATCCTCTGGACTCGGCAAAATCTGTCCCGATGGGTGGTTGTGAGCAA
+CAATGATTGCCACAGCATTGTCAACAATCGCCGGATAAAATACCTCACGAGGATGCACAA
+GCGTCCTGTTTGCAAGCCCTATTGTGACAATATGCTGACCGTTTACCTGGTGCGCACCAT
+CAAGCGTCAGTACAATAAAATGATCCTGCCGCTCGCTGGCATAGCGGCTCAATAAGTCGT
+ATGCATCTACTGGATTGTTGATTTTGGTTTTCTCGTTCATCGGTAACTCCTTGGTTCCGG
+TATTTCAGCCTTCCCATACGGGCGGCCTTGGTTGATCTCTCAATCAACCTTACTTTTATA
+GTATAGGCCCATTGGGCCTATGTGTCAACTATTTTTATTATAAATTATTTAATTTTTTAG
+ATATAAATAGTATCAGTGTCGTCATCATACCCTATCAATAATTCATGATCATTTTTGACA
+AAACGATGCATATCAATTTCGCAATCTACAATTTTAGAGCCAGAAGAGTGATCAACCCCT
+CATACTTCTAATTATAAATATTGCACCGCTTTCCCGTATTCTGGACCGCCATTGATAGAT
+GTCGTCCAATCGTTATTGATACCGATCTCCTGCTCTATTCGTTGCAGAGTGTCTCTACTA
+TCTATGATCATGCCTTCATTCAATATTCTGGTAATCGTAGATTTGTTGACGCCGATCTTT
+CTTGCAAGATCAGCTCTTGATAATTCTTGTTGTTCCATGTAATCAATGATCTTCTTCTGT
+GCTATCGTCACCGCCAGCATCTCCCCGGAGCTCCTCAAGATAGTCAACAAGTGCAAACTG
+CTGACCAATATTGAGTGACCTGAGCTTTTTTATAATATCCCCGCGGTTAACCCCAAAATA
+TTCAAACTGTGCATCTATCTCGTCTTCCGTATCCGCAAGGACCGCTCCAGGAATAACAGC
+GCCAGGCTCATAAGCTGTTGACAATGCATTATTAAGCATCAGATTCACTTCTCCATCTGA
+AAATAGCTCACGAAGCGTTCGCTTCTCCCTCTTCATGAGTTCCTCGTACCTGTCGGCAAC
+TATAGTGATTGCTCTCGATGCTCCACCATGACGTTTGACAAGAGGATCAAGCTTCTTCTC
+AAGTACCGAATTCCAATAGATCGATGTTTTCCCGCTCATGCTCGTTTCTCCTTTTGCTTT
+ATAAATAGACAGCCCCGCCGAAGCGGGGCATGATTGGTTAAGCCTCTATGATATAATAAT
+CAGGTCTACCAGCTTCGTTGTGAGATAGGTAATATATACCATCTTCCTCTTCGTCAATCC
+ATTCTTGAGCCTGAGCCGCAGAATCAAATGTAATCTCTTCCCATCCTGATTCATCCCTTG
+CCCACTGGATTGGCTGATATCCATAGTAATTTCCGATAACCAAAACTTTACATTCCCCGG
+TATACTCAGGATCTGCTTTAATACTATCAGGATCTCTATGACCCCATGCAATAGATTCCA
+TAATCGGATCATCAGAATTGCTTATCCACTCGCTTACTTGTTCGCTGACAAAGGCCTCGT
+AATCTTTTTTAGTATTTCCAAGCAAATCATCTTCTTCAACTTCCCATAATGAGTATTCAT
+TGATCTGATCTTCATAATAGTAAATTCTACCAGTTTCAGGGTCTTTGTAAAGCGTGGAAG
+AATAGTTATCAAATTGATTAGTATTTTGATGTTCTTCGGCTAAGATTTCCCATCTTTCCC
+GAACTTCAGCCTGATCGATTTCGTCTGTGCTTAACTTCTCAACTCTTATTTCTGTCATTT
+CTTTCTCCTTCGCCTTCCCTTCCGGGTAGCGTTTTGGTTTTGTTAAGGTCTCAATCAACC
+TTACTCTTGCATTATACCTCTATATAGCGGTACAGTCAACAGAAAGTTTCAAAAAAAATG
+TTAATTTTCTTTGTTAATTTATTATGGTATTTTATTGCGAAATGAGGAAATTCAGAAGAT
+TGCCTGTAGGATGTTCACAATAATAGAGACAGCCAGGACAGAGCCACCGGCTTTAAGGGT
+CGTCTGCTGCCGCCGGTTCTGCCTCTCTAAGCCTTCGCAATAGATCAAGAGCTCTTGATA
+GTCCTTCCTCAGCCCGTCCCGCTCGCTCTGCAATGCTGCTACTTTCGCTTTGCGCTCCTC
+CGATTCGCTCTGTAAGCTTTCCAGCCTCTTTTCTGTATCCTGCCACCTCTTTTCGAAGTT
+CTGCGAGCTCTCCCTCGTACGTCTCAACTGCTCGCTCATACTCATCGCTGAGTGCTTGAT
+ACTCTGTATCTCGCTTTTTGCCTCGACTATCGTATTCTGCAGCTCGTCCACTATTGCCTC
+TTCCTGAGCGGTAAGTGCCCAGGAGGAAGCCAGCGGAAAAACACACGCCAAGAGCAAGGA
+TAATGCTAATAATTTTGCGCATCTCAATCCTTCACCTCGATACTGATCTTCGGTCCGTGG
+ATGGAAACAACCGACGGCAGGATCAGCCACACCATGGCCAGCACATTGGTAACCAGGGCC
+ATTTCCATCTGGCCCCGGGTGTAGAAGACTCCGGAGAAGTAGTCGATGATAAACTTGATG
+TTCACCGGGAAGGCAAAAAGGAAACCGATGATTGTCGCCACCTTTCCTTTCTCTCCCAGA
+GCCTTCCACAGCTTTACGATGAGCTTTTTCATGCCGCTACTTCTCCAAGATCGAGAAAGA
+TGCGCTTCGACCGAAGTTCCCCCTCGCTTGCAGTCTTGCTGAATGGAGCCCATGGATCAT
+AGACGGTCATGCCACGGCCGTTACCCAGGGTGAAATGGTAGATGTACTTGCGCGTTTTTC
+ATTCCACCGTCGCCACAAGAGTATTTCTATCTCGTTCGGCTGGCATATATAGTCCGCGTC
+TTTTTTCCCGAGGTAGCGTACATTCAGGCCGAAGAGGCGGAAGATCCCGGCGGGGTCCGC
+CACATACATAAAGGTTCCAGGCGCCTCCGGGTCCTCGGTCAGATAACGACGGTTTTCAGC
+CTCAACCACAGCGTTCACAAACTGCTCTTGTGAAATGACTCGTTTCGTTCTGCCTGCTGC
+TCCCGCAGCAATTGAAGTAGCGTAGCATCCCCACTGCTGCACCCGATCCGGCATCTCAAT
+ACTGTTTTGATAATACATACGTCTTCACCCTCCCAAAACGACGGGGAGTAGTCCCCCGAT
+AATCGAACCACCAAGACCGCACACCATTCCGACAATGACTGTTCGGTACTCAATCTTCTT
+CTCATGGCGTTTCTCAACAGGGCACGTACTTTCCCGGTTGATGAAAAAGTCGGTGAGCTT
+ACTGTTGATCTCTTTGATGTCCCGGCCTTGTTCCGTCACAATGCTTAAGACCATATCGAT
+TTTGTCGTTATCGCCCATTGGCTTAGCTCCTTTTCTCCGGTACCTGTGGCCAGGAAATCT
+CCTGCGGGAAGCCTGGCTGTAGGGGAATGTCCCTGAGAGCCTGCCGGTAGGCTTCCCAGT
+CCGACTTGTCGGTAAGGGGATAGTCGGCCATCATGATGTAGTCACTCTCAGATAACAGCC
+TGTCTCGTTCTAAGCGAACCCGTTCGGAGAGCACCTCCTCGGGAACCGTCCAGCCCGTTT
+CGTTCCACACGGCCTGCGGGTCCGAAGGCTCTATATCGGTCATACTCTCATCGGGCTTTC
+GGCCGAGGGACAGGTGTACCGCCGCTCCTGTGGCCTTGTTCCAGTAGGGAACACCGGTAT
+AGTCAGGGGTAAGCACATACCTACCGCCTTCCCAGGTGATAGCCTCATGTTCTCCGGCCT
+CAGGCACAAGCCCGGCTTCTGTTGCGGCTGCTATCGAAAGCCGATTTCCTTCCTCATCGA
+AGAAGCGGATATCATCGCCTTTGTTTCCGGTAAACCCTGCAGGAACCTCCTTGATGGTTT
+TTTCCGGAAACAGCTCTGCAAGCTTTGCCGTCTCATCGGCACTTTGCACCACAGCGGTGA
+TCATTGAGCCATCTACTACGGCGTAGGTTTTCATGCAATTCTCCTCCATATCCTCATGAG
+GCGGTTACGGTCGGATGTTCTTGCCCCAATGCGAGGAGTACCGTTCGTACCATCACTTTT
+GGGGCCCGATGTTTTGCCTTGAATTGTTGTATCAACATTGGCAGCCGCATTGATATCCTC
+AGCTTTTCCTGGTACGTCTTCAGTCGTGTATCCATAGACAAAAATTTTAGGATTACTTCC
+GCTTGTATTAGTTCCTACACCATTAAGTGTGATAAAGCCTTGGAGATTATCGGGCATTAG
+CCCATTTGTTCGGCCAGAACCGTTGTAACCTTCGGTATGAAAGTCTATGCCTTCACCGTC
+CCACAGTTTCTCCCAGGTCCCTCCAAACAGGTAAGCAGGGGACTCGTTAGTCGGAAAGGC
+AACCGATAGGTCGTTACTTGCGCTTGAGGCGTATTGTGTGTACTGGGAGCCTACAGGGTG
+GGAATTTTGTTCTACATCGAGATTCCCTTTGTGGTAAATATCATATCCTTTGTAACTCAG
+GTGCTCGTTATTGACGATAAAATCCTGTCCGCCTAACTCAACGATAAGTTCAAGTGAAGC
+AACTATCTTTCTGGTGGTTAATTTTTCACAGTAAAACCCACCGTTGCCAAATAACGACAA
+TCCATCGGGGTTAGCTTCTGTAACATAAAGCTGTACATAACCAACATCATTATCCGCGGG
+GAATTTCAGAACATCTCTAATCCACATGGTATTTGTATGTATTTCGCCGTCCCAGACAAA
+GTTTGCGAGATCTATATATCCGTACACTCTCTTGGACCCAAAACGTGTAAATGTAATCAA
+TCTTTGCGGCTCAATTGAAAGAGAAGGTTCATCCGGCATGCCGGCAGGATAGGAAGTGAA
+AGCAGAGCGGGCCTTACCGAAGATAACCTGTTCTCCGGCAGCCTTGATACCATCGGCCAC
+CAGAGACAGAAGAGGCGCTTCCGTCTCATCGAAGAAATGCACACCCTGTCGTCCGGCATT
+CGATCCCACCCGAAGGATCGCCTTACCGGTGGTACTGTCCTGGATCTCTAAGGCCGCATC
+ATCCTGGAGCACATACTGACCATCAACAAGGCGCATCTCGCCCCTGATCTCGATCGAATC
+CCCGTCGGCCGTCCAGAAACCGAAAATGGTAGAGGCAAGGCTTTTTGCTCTGTCCGAAGG
+GTCAGAAAGCCCCCCAAGGTATCCCATGGCAACCCGAGGCTCGGCCCCGGCAGCCCCCCA
+CACCTCGATACGGTTGTCTCCGGGATCAAGCTCTATCCTCGCTTTTCCCACCTCATCCGA
+GCGTATGGCGGTGGATGAAAGCAGCCAGTTGCCGACCCGTCCCGCATTGGCCCTGATCCC
+CGAAGCATCGAGGATCGTATCCCCCGCCTTGATGGCCCCGCCCGAGAGGGTCAGGTTTCC
+GTCAATGGTCAGGTCATGGAGTATGCCGTACAGGTCCCCACGAAGCCACACGTTGTTAAA
+AAAGGCATCCCCGTCCCCTCCAATCTTCCAGCCCGAAACACCACCCTGCTTGTAGTCGTC
+ACTTTCAATACCGTTGCCTGCGGTAATCTTTCCCCGAAGCTCTGAGTCACCGGAGAGAAA
+CAGGTCTCCATGAATCTGGAGGGTTCCGCCGTCCCACTTGATGTAGTTATTCCCGTCCCC
+GAGAAAGGACCAGGTACCATCATTATTAATGACTGCTGTCCACTCCTCTCCATCAAAGAA
+GCCCAGAGCGCTTGCCGTCATATAGAGCCCTGCCACCGTGGTGTCGATATCCACCAGCTG
+GTTGCCGTTGACCGGCTGTATGATGCTTCCGTCCGACTCAAGGCCCACATCCACCCGCTC
+GGCCACACTCTTCGCCTCATCCGGATTGGTCGGCACCACAATCTGCCCTGCAACAACCGT
+CCCGAGGATGGTTTCAAGCGGGGCCACACTTACGCCCTCGTATTCCCATATCTCCGTTTC
+AACATCCCAGCTTCGGGAAGTGATACGAACGGTATTTGATATGCCGAGGGAAAGGGAGCT
+CACCGTAACGTAGCTTCCAAGGCTCTTTTCGGTAAGACTTTTAAACGTGTAATGAAGTCT
+TCCTGTGGTAATCGAGGAATACAAAGCGTTTGCAAGCTCGGTTGCCGCGTCATCGTCATA
+CAGGTAGTTGGCTGAATACTTTTTCAGTTTGCCCGTGCTCTCCGGCCTTGAGAATACGGA
+GGTTTTCTTTTGATCCTTGTAAACAATATCGAGATCACCGGTTACCTTGATCTCATTGAT
+AAGCTGGCCGTCTGCAAGGTTAAATTGGAATTCCGAATAGGTTGTTGCATGGTTTTCCAT
+AACAAGGTCATAGACACCGAACAACTGTCCCATCCCTAAAATATCTATCCATGTGCTGTG
+TCCAGGCTCCGGACCGAAAGAAACCCACGTATACCCATGGAGTTCCAGTTTTTGGTTTTC
+AGCTCCGACTATCTCATAATTTGAACTACCAATATCGAGATTGTAGTCACAGCGATAGGG
+ACCATCTGCCGGCCAAAGCGCCGGACCTTCGGCATCCTGGCCGCTATTTGATGCTATCGA
+TTCCCATTTATCAACCTTCTCATAGTAGAGGGTAAGCCCGGTAAGCTTCTCATACTGATT
+GAAGGATACCTGTACCTGCTCAGCCTCAGAATCCTTTCTCTCAACCTCCAGAGATCCTAT
+GATATTCTGTTCACTGAAAGCCCCGTCCGCTTCGACAGAAGAGGATGCCCAGTCGTAGAT
+GTCGATCACCCCGTCGGGGAATACATTGTAGAGATGATGGTAATCCCAGAGGATTGCCTC
+AAGATCGTCTGCATAGCTGTCGCCGGAAGCAAAGGCAAGCTTCGGGATAACTTTGTTTAT
+CGTTTCCCGTATTCCGATGTACTGGGAAGGGTAGCCGGCCGATGCCAAGAGTATGTGAAC
+AATAGAATGGTCGGGATCATCAGGGTCACAGATCTTCCCGTCCGATATCATCACGTCGTC
+CTGCAGGGTGGATTCAAGCAGATACCCATAATCATAGATCTCGAAGTCGATCGTCCGGTC
+GTTATCGGTGACCTTGTACTTGGTCACCGGCCGGGAGAAGCCGCGAAACCAGATCACCCC
+GTCACGATAGATTTCACACGGAATATCTCCGGTACACTGCAAAAGCCGCATTGCAAGGGC
+CGGAGTGAGAGTAGCCGAGAACGTGGCCGAACCTAAAGCAGGTTTGAAATCATCGTCATG
+AAGCTTCTCGGTAAGCTTCAGAGAGTCTCTGACAAAGTTATCTCCACCGTAGCCGGTGAT
+ATCGACCCAGCCGTCCCCGTAATCAATGAGAATTTGCCAGCTCATCGTCAGGCTCCCCAC
+TTCTCGACACGGCCGGATGACTGGCCGCGCTTTACCGTCTGGACGATGTACTTTGCAAAG
+GCCTCCGATCCTCCGGGACCGTACACGCTGTCCACATGCACCTGTACCGTCGTCCCGCCG
+CTTTTGAGGTTCCGGATGTCAAAGGGGATGACCGTCTCAGCTTTGTTTTTATCTCCGAGC
+CGGTACAATCCTCCGGACTCTCCCTGCGCCGGCACAATACCGCCGTCTGCAAGGCCCGTG
+TACTGCTGCTGATTGATCAGCGCCACCTTGCGGGCGGTCAGCCCTGCAATGACGGCGGCC
+ATGGCCGAGGCCGCAATCGGGTTCATGGATGCATAGGCATTGATAACCGCCTGTGCTCCC
+GATGCTATGGTTTCACTCTTCCTGTTCTTCTTGTCCCGTTCGAACTGCTTCCGCGCAAGC
+TTGTCCTCTTTCTCCGTCTTCTCGGCTTCAAGGTCTTCGTATGTTTCCCCGGCCGCCTTC
+TTAAACTCGATCTGGTTGTCGAGGTTGGAAATTTCCTTCTCGGCCGCAGCATCCGAGAGA
+TCCCCCTGGAGGCTGTAGATATCAGAAAGCATGCCGTTTAGCTGGTTGTAGATGGCCATA
+GCCTCCTGGGCCCTTGAGGCATACAGCTGGATGATCTGCTCGGTTTTCCACTTCTCAACA
+TCCACCTCATCCACACCGGCCTGTTTGGCCGCATCCACCTGCAGGCGTATCTCATCAAGG
+CGGGCCTGCAGCTGGCTCTTTCCAAAGCTCTCCCGTATCTCGGCAAGACGGGCCTCCTCG
+TCCCGTTCCATCTGCTGCCGGTCAAGGGAGGCTTCATTTAGAATGTCTTTATACTCTTGT
+TCCCACTCAGAAAGCCCTTCAAGCGGCTGTGACCAGTCGGTCTTGCCTTCCGAAAGCTTT
+CGGTTTCTCTCATCGATAAGATCGTTAAGGAGCCTCTGGACCTCAGCCATATCCTGACCG
+GCGGCCACCCCGGCATTACGAACGGCAGCCCACTTGTCGATCTCATCCTGCAGGAGTTTC
+AGCTGCTTCTCGTTCGGCTCCATGGCATCGAGCCGGCGCTTTCTGTACAGCTCAAGGGCT
+TGTACATTGTTCTTTGCAGCCTCGGCGGCAATTCGGTTTTGTTCGGTTGAGATGCTCGCA
+AGTTCCTGTTCAGCCTGTTTCTGCTGACCTAATGCCCTGATCGTTGCAATGATCTCGGCG
+ATCTTCGCTTCCTGGTTTGCAATGATCGTACTGGAAGCCTCATTCTCCTGGCCGTAGTAC
+CGGTCCTGCAGATCCATGAGCTTTTCCTGTTCAAGGGCAAGCGCCTGCTGAGCCTGCAGG
+AGTGCTTTTGACCCCTTGGTATCGACCGTTCCTCCTGCCTTCTCATAGGCATCGAGGACC
+TCTTTGATATCAAGAAGACTGTTGCGGGCGTTTGCCGCCTCGGTGACGATATCGGTCAGC
+CATCTGACAAAGGGCTCCATACCGTCGGATATCGATCGGCCCAGACTCTCCTTGTAATCA
+CCGACGGCATTACTTAACTGGGTAACCGCAGCAACACCGTTTTGAGCTTTTGCCTTGGCA
+AGTTCGAAGCCGTCAGCCATGGCCTTCTGAACGATTGCATGCTTCTCTCCATCGCCGGTG
+GCGGTCCTCAACTGCGGGATGTATCGCTGGAGCATGGTGTAATCGTCATTCATCGCCAGA
+GCAACAGCCTTCATGGATGTTTGCAGGTTGATCCCGAAGGCGTTTGCAAGCCCGATCGCT
+CCCTTCGATGCTTCTTCAAGCTTATCGCTTGCAACTCCCTGGCTTTTTGCAAGCTGCATA
+ATACTCAGGATAGCCTCATCACCGTAGGTCGTGACACTTTGGATCCCCGAAGCTATCTCC
+TTGAGGCCGGGTAACAGATCATCGGCAGACTCTCCGGTCGCCCTGATTGCCGCGGCAAGA
+GCATCCTCGGCTTCTATCTGTACGCCGTACAGCTTGACCGATTCCTTCATCTGCTGCATC
+ACCGCCTTCACTGATACGGCCGCAGCAGCATAAGCGCCGAAACTCTTTGCAGCCCCCACT
+GCAAGGTTTTTGAGCTGGCCTTCCAGTGAGTCGGTTTGCTTCTCTGCATCGCGCATGGCC
+TTTACCGCGGCCCGTGTCTCTGCGCGAAGAAGTATTTTCAGCTCGTCAATTACTGTTGAT
+CCCATACCCGTTCCTATAGGCACCTTCCGCCGTTTCTATGATCTCGACGATGAAAGCCGG
+TAATTCCGCCCATCCCCCTGAGAAGGGAAGAGCGCCGAAAAGCTTATAGCGGTACCACAG
+ACCGAAGGCACTCCAAAACCAGTCATCAAGGTACTCGTTCACTTCACTTCGCAGGATCGT
+TACCAGCCTTCCGTCGACCACCACGCCGAGCCTTCCGTCTCCAATCTCCCGGCGCACCTT
+CTGCGAGCTCTGGCCCTTCATCCACAGCCCGATTCCAAGAGCTATTTTTTTTTATCAACG
+GAAGTCAGGCTCTTGAGCTCGTGCATGAGCTCACTTGCAAGTGCAACAAGGGGTAGATCG
+GAGAACAGCTGCTCTCCGCTGTCCACTTCAATACAGTTTCCCTCGACGCACACGACAAGA
+TTATCAATACCGGTAATCATCTTCTTTACCCGAAGTACCCACGCTATTGTCAGATAGTCG
+GCATACCACCCTTCGTACGCTGCCTCATTATCCTTATCCGGCACCGGCCCGGCTTCCCGA
+CGTGCCCGGCCGTAGATCTTCTCTTCCTCTTCAAAGGTGAGAAACCGGTAATGCACCGTT
+ATTCTCTCATCCTTCTTCCGTCCCTTATTGCCCCAGGAGGGGACATACACCCCGTCCCGG
+GCTATGGTGATAGGTTTCGCCATCTTTATGCCGCCTCTCTTATGTACAGGGTGGGATCAG
+GGTCTCCCGGTGCTATGCGAAAGCTACTTGAAAAGTTCTGTGCATCTTCTCCCGAGGCCC
+CAAGGCTGGAAGAAAGAATGATGACCTTTGCCCAGATAAAGGCTTCCTTTTCCCCTTTAT
+CCGTTGACTTCTGGATCACGCCCTTGATGTAGATCGGCGAGCCGTCCACATCGTTTTTGA
+TGATGGTGCCACTTGCCGACTGCCTTATAACCTTGATGAAGTTGTTGATGACGTAGCCGG
+CTGCATCGGTAACATCCAGGGTAGTAAGCCCTTCAAGGCCGCCTGTCATATCCGTTTTCC
+CTGATCGGTAGCGTTTGACCTTGTCACTCAAGGTGGTCACATCGATCTCATTTTTATTGA
+AATCAATCGAAAAGCTCTGGATATCAGCCTTCTCACTTTCCTCTAAAAAGGCACACGCAT
+CTCCTGACTCAGGCACAAGAGAACCGTCGTCCCAGAACAGCTCGCCATTTTCAAGGACCG
+AGGCAAAAGCGCTTGTCTCTCCCACTGCCGTGATACTCCACCAGCCGGCGCCTTCTCCGC
+TTGCCACTTCTCCTCCTACCAGTTCATCAAGACTCTTTGCCCCGTCGCCTGCAACCTCAG
+AGTCAAGTTTGACGGTGACAAGCTTCCCGTCACTTCCCACAAGTCTGTCTATTTCCATAT
+CATCCTTCTCCTTCTTCCGTGTAATCTGCCCTAATCTCCACCATCCAGCGGTAGAGCCCA
+TTGGGGGCAATGCCGAGAGACGCATCTCCTGTGACAACCACCGAGGAGAACTTCAAGGCC
+CCCGATACCCCGCGAATCCTTCGAACCGCATCTTTGACAAAGGCCCGAAGATCAGAGCTT
+CTCTCATCCTTTGCATAGATATCGATCTGTATGGCAGCTGATCCCCCGTAGTATGAGAGA
+TACACCTTTTCATTCGTGTCGCTTACAAGGCTCACCACCAGGTACGGTATCTTTAACAAA
+ACCCGGCTCTCGGTGTCATAGATCGCTTTGATCCTCTCCATGAGGGCCGTGTCGGCTCGA
+AGCTGCTCTGTGATCTCAACTTCCGGTGCTCTGCTCATCAAGCGCCTTCCTCAATCCTTC
+TTTCCAGATCTTCCGTATCTCCCTCATGGCCTTGTTCTTCCCGGCCCGCATGAAGGAATG
+CGGCTTCATACGGCCACGGTTCTCACCGGTCTTTGTCGCCCGTTCCTCTGTTCCATACTC
+AACAATGAAGGCATGGGGAGCATTGTTCTTCACCGCTCCGGTATGACCCTTCACGTCATA
+ACTCATGCCGGCTCTTAGGTTCCCGGTCCTGTCCGTCACCCGTTTATCTAAAAACTCGAG
+GGCATACTCATAGGCCTTCTCGGTCAACGGCCCGATCGTGTTCTCGGCCGCCGAGATGGT
+AAGGCCTGCATACGAGCGCACGGTCTTCCGGCGTCTGACCGTACTTCTCTGGCCACTGCT
+GCTCCTTTTCGCCCAGCTCATACCGAAACCTCACGGTAGGCGTCCCACACATTACGAACC
+TGAAAAGGCAGGTCCATGACCCCCACATACATGGTTTGATACTCCCCACTTAATGCATTC
+CCCTTATCCAGCCAGCTGATACCCTGGGAACCAAGCCAGTAGCCCACCAGCTGTATCACC
+GACTCCTCAAGGTCCTCAGGGATAGATCCTTCCTCATACCCAGCACGGTAGGACACCTTG
+ATATTGCGAAAGCCGCGTACCCAGCATGAGCGGCGAAACAGCCTGCCGGTCTCATCATCC
+CGTGTGTACTCAGTAAGCTCAGTACCGGTGTCAAAGACTCCATAGGTATCAAACCACACT
+CCCGTGACACTCAGGATCGGATATTGCGGTAATTGCAACGTCCGGCTGCCGGTTCCCGAT
+AAAATGACAACATGGTCGTCTGCTGAAAGCTTTCTGCTTGTGTAGGTTTCTGCCCGCCGG
+GATGCCACGGCGATAAGGCTTTCTGCCTCATTCTCCTGGCTCTCCTCAAGATCAAGCCGC
+TTCTTCACCGCCTCCCATGTTGTCAGGTTATTCATCTCTTACGCCTGGCCCTTTGCAGCT
+GCCTCGCTGATCGCAGCTTTCAGCCTGTCCTCTCCCCACCGTTCAAGGGTGGACGGAGCT
+CCCACCTTCAGCTGGGCGGCAAGGTCGACAAGACCACTCTTGTCAAGCTCATCAAGCTTC
+ACCGTCTCAATAGTTTCCTCGTTTGTTTCAACACCCTTTTCGTCAAGGAATTTCGCATGA
+CCTGCACGTACCAGGTCCTTTGCAACGTCATCCGGTGCCGAAACCTTCCCCGGTATGTAC
+GAGAAATCCTTCCCGACAACCGAAACCAATACTTCAATGTCTTTCAAATCTTCTCTCCTT
+TTCCTACCTTGCAAGCCGGATGCCTTCCGGCTTGCAAAAGGGGCTCTATGCCGCCGCCAT
+TGCAAGGTGTTTGATCGGATGCGTACCCGCATCAACCAACAGCGAACCGTGGCGGAAGAA
+CGCGATAAACCCAACCTGGGCATACTCGGCGTACCGCTCGGTCAAACGCAGAATGATGCC
+GCCTGTTACATCCCGAATCTTGAAGGCCGACATATCTCCGAACAGCACCGCTTTCTCTCC
+GGCTTCCATCCCCGCCATGTTCTGGTTGATGATGTACTTGTACCCGTTGATCGTATCGGG
+TTCTCTAAGCGCAACACCGGGAAGCCACAGGGGCCTGCCCTGGCTGTCCTTGAGTTTCTT
+GAAAGCCTTGAGCGTACCGTCGTTGAACATAAGTTCTGCATTCAACCGGTAGGAAGGATC
+GATCGAGTGAATGAGATCTATGACCTCATCGTAGGAAAGAGCTCCCGCCGCTGCTGCGGT
+CTTTCCGAGTACCGAGCCTGTGACAATGCCCTGAGGCTGCTCGCTTCCGGTTCCGGTGGT
+AAAGTAGGCGGATGTGGCCCTGCCGATACGCTCGGCAATCTTGGCCCGCAGGTACGCCTC
+GATATCAACACCGGAGTCCTGCAACAGCTGATAGCTCACCCGGATGATTTTCGATGAGAA
+CATGTAGGCATACAGGTTTTTCGATCCGAATGTCAGATCTTTCTCGCCAGCGGCCGTGTT
+CTCCGAGAGAATTTCCCCCACGTTCTCGGTATCGTTTCCCGTCGGAATCTGTATGTCACG
+GCCGTTGGTGGTGGTGATCACCTCGGCCCGGCTCTGACGGGGACCGTTGAACTGCTTCAT
+TGCATCCACAATCCCCGAGGCCATTTCATCGGGCACCGTATACCCTCCGGTGCTGTCGGT
+TCCCACACTCAAAGCACGGCCTTCAACCTCTTTGTGGTGCTCCATGAGAATGGAGCGGTG
+CTCAGCACTCACCCCGGAAAGGCCGTTACGAAGGTAGGAGTCAAAGGCAGATCGATAGGT
+ATCGTGTTCCTCTTCCTGCTGCCGTCCTTCATCCTTCTTACGGGCATCCTCTTCGAGCAT
+CCGCTCTTCAATGGCAAGCTCCCGTTCGGCTGCCTCAATGTCGCCGGTAAGCTTTTCAAC
+CCCGTCAAGCCGCTCGTTGTACGAGCGAAGCTCTTCTGAGGTGAGCTTTCCGTCTTCGTT
+CGCCGCTTCTTTTTCTTCGCGGTATTTCCTCGTCTCTTCCCACAGGGTTTTGCGTTTCTT
+CCTCATCTCAACAATCTTGTCGAATCTCTGTGCCATAATTCCTTATCTCCTTACATGAGC
+ATGCCGAGCATCTTCTCGCGCTCTGTATAGTTGCAATCAGCCTCAGACCGCTTGCGCTCT
+TCCGGGTGGCTCGTAGCCGGCGCGGTTAGCTCTTCGATCTTGCTGCCGATATGTTCAAGT
+TTCTGTCGCTCCTCTTCGCTGATATCCCCTGATACCGACCTCAAGGTCAGTTCCTGTAGC
+TCCTCCGGATCGAAATCAAGTCCCATTGACCTAAGGTCAACGGAGGTCTGCGGATAGGCC
+GGGAAGGTCACCGGTGATACTTCAATCAGCTGCACTTCCACCAGCTCCCGGACCAGCCGG
+TTGTTCTCGTCCTTGGTCCACTTGTCCCGTATGGTGCGGAACCTAAAGGACATCTGGTCC
+ACATCCCCACGCTCAACCGAAAGCATGAAGTCCCGTGCCCACTGGGTATCGGGAGGAGAT
+GCCTCAAAGGAAAGCCCGTCCGAGTCCTCGATAATGGACAGGGTCCCGGCCTTCCGTGAG
+CCCAGGACATAGTTGTTGTCATGGTTCCACAGGGCTTTCACGTTGCTCTCACTCAAGGTC
+TTGGTAAAAGCTCCGGGATTGATCTTCTCCCGAAAGCCCCCGAGGTCCTCCGAAAGCTGG
+TTGTAGACCGCAGGACGTCCTACGATCTTCCGACTCTCTTCTCCTTCCTGCCGGCTTCTC
+AGCTCAACGGGAAAGGTCAATACGTCATGCTTTATCATCCCTCATCTCCTAATGATCTGA
+TTTCGGCTTCAAGCCTCCGGGCCTCCCAATCCTCAAAGCCTCCTGAGTCAAACAGCCGTA
+TGGAGCGCTCCGTATAGCCTTCAGCATCAAAGCAAAGCCCTGCACGCCGTAATGAAGGCT
+CTAAGGCAGAGAGCTGTTCGACGAAGCTTTTTCCCTCATCCGCATAAAAGGCCCGTACCG
+CTTCCGCATCACCTACCACTTGCATTTCGCTTTTCTTCATCCAGGCCGAAAGGCTTCGCG
+CCTCACGCCGTGCAATCCGGCTCACTGTGGATCGCAGATACTCTAGGGCAATCTCCCTGG
+CCGCTTTCTGTCCTCCTCGCTCCTGACTTCCCGCAGAAGGGGCGGAGAGCGGAACAACGT
+CCCCTGCCTCGGTGATCATGGCGTTGTTCATCTGCACGACAAACGAGTCGCCGTATTCGG
+ATTCGATCGGATTCTTGTTCTCCATCTGCCGCCACTCGTTCGGTGTGATAATGCCGTTGC
+GCCTCTCTATCTCCAAAGCCTCGGCCCTGCTTTTCTTATCTCCACGAAGCAGGGAGTCAA
+AGTTGAACTCCACAAACACCTCAGGCTCTCCGGCGAAAAGCTTGTAGTTCATCTCCTGCT
+CAAAGCGCACAAGCCAGGGGCGAAGCGAGTGGACCAGAAAGGAAATGTTCAGGTGTTCGA
+TGTTCGAGAAGGTTGCATGCTCAAGGTCGTTGATGAAGTGGGCGGGAACTCGCAGGATTC
+CGGCGATTTCGCTTCGGGTGAACTTTCTCGCCTCGATCGCCTGTGCCTCTTCAGGGCTTA
+CCGAGGTCTTCTCCCACTTGATCCCTTCCTCAAGTACTGCGGTGCGGTGTGCATTCGAAA
+GCCCTCCATAGGCCATCTGCCATGCAGTTTTTAATCTGGTCTTTGCTTCCGGTGTGAGCT
+TTGACGGGTGACTCAAGAAGCCCGAAGGATGGGCACCGTTTGAGAAAAAGGTCCCTTCAT
+ACCGGTCAAGAGCTGCTGCATATCCCACCGTTTCTTTTGAGTAGTCAAGCAGTCCCCGGC
+CTTTGATGCCGTCCCCAAGGGCCGAGATGTGCAGGACCCGGTACGAAGGAAGGCCGATGC
+GCTGGTTTCCAATTGTGGTCACATACACGATTGACTGCCGCTCGGTGTAAACGACCGTGG
+TCTGTTCAGGGGCAAGGGGCCAGAGTGCAACAGGATACCCGTCCCGGTCAAACTCGATTT
+CCGCATAGTGGTTTCCCCGCATGACAAGCTGCTTCATGGCAAGCTCGCGGTAGTTGATCC
+CACTCATAAAGGGATTCGGCCGTACCTTGAGTATCCGGTAAGCCGGGTGATCTGTTGCCC
+GCATCTTCCCACCGTTTCCCGTCCTCCGGTAGGTCTCAAGGGAAAGGGAGCCCACCGATT
+CAGAGAGCACCCGCACACAGGCAAGCACCGAAGCAACGCCCATGGCGCTCTTCTCGTTGA
+CCGCCACGCCCGTGCTGGTCGGCTCCCCCTCAAAGTAGGAAACAACCTCAGGGGAGGATA
+AGGGAATTTCCGGATTCTCAAGGCTTCCCCGCATCTTGGCTATTGCCTTTAGTCCTCCGA
+TTGCACCGCGAAGGTCAGAGAACAAGCTCATAGGACAAGGACCTCCTGGCTGTCGTATAC
+CGATCCGTCCGATCCGTTTTCCACCACCTGGTGAAGCGCCATGATGGCAGCCACGATCCC
+GTCGATCCTCTTGCCGTAGGAATCACGCTTCGGCTTCATGGGCATGATGTTTCCCTGCCG
+GTCGTCTTTGAGCTCCACATTGCTCATCATCCAGGAGGCAACCGGGTTGTCCCCGTGAGC
+GATCTTCCCGTCGATCACCATCCGCTCAAACAGCTGAGTAGGAACCGTCATCCCCGAATA
+CCGTTGAGGATATTTGACAAGCTCGATCTCTCCCTCAAGTTCCCGCTCAAACTCTCCGGC
+ATGCCACGGATCGTATCCGATCGACCGGCCGCCGAAGGTGTTCGCATCCTGCCGCAAGAC
+CTCTAACACGATCTCGTAGTTGACCGTCTGTCCCGGTGTTGCGATCATCCACCCCTCATC
+GATCCACGACCGGTAGTCAACCTGGTCACGGTGACAGCGATCAAGTAATCCCTCTTCCGG
+TATGAAAAACCGCCATAACAGCGGATACCGTCCGTCCTTCTCACCGAATGCCCAACACAG
+GGCCGTGATATCTGTTGTCATCGACAGATCAAGCCCGCCACGGGCCCCTCGTCCGACAAG
+CTCTTCTTCGGCAACAGGAGCGCTTCCCCGCATCCATACCGAATGGTCCATCCACCGGGT
+GGGAGAGGACAGCCATATGTTGAAGTTCTTGGTCAAAACATCGCTGGCTTTCCGGGGCGA
+TCCCTTGGCCTCTGCAATACGCTTTTCAAGGTAGTCGCGGTAAAAGCTCACCCCCATGTT
+CGGGTTGCTTTTGATCCACACCGCAGGATCTTCCCACCTGTCCCCCTCATCCAGGCTGTA
+GATGATCCCCCAGATGTGTTCCGGAACCGGCTCGATACTTCCTTCAAGGATCTTTGTAAC
+GAGCGTGCGCTCTTCCTGATAGGCAGGCCCGTTGATGTTCGTCCCGGCCGTGGTAATGAT
+GATCGTTAAGGGCTGACGCCTGGCTCCCATGCCCGACTCATACACGTTGATCAGCTCATT
+GGTCGCGTGGGCATGGTACTCATCCACTAAGATCGCGTGAGGGTTCCATGAGTCCTGACT
+CTTGTGATCTCTTGAGACCGGAGTCATGAAGGCCGCAGGATCATTGATCTTTACAAGGCG
+TTTTGAGGATCGGTACTCCTTGGTAAGCCGCGATAGCGTAGGATTCCGAAGGTTCTGCCG
+TACCGCCTCGTCATAGCCTTTCTTCGCCTGGTTCCGGTCCACCGCCAGAAAGAACTCTTC
+GGCCCCGATCTCTTTATCGAGGTGGAAGCAGGCGTTCATCATTGCAGCCCCTTCGACCGT
+CTTCCCGTTCTTCCTTGCTACCTCCCGGTATGCCTTTCGAAACCTCCTCAGGCCCGTGGC
+CGTACTTTTCCATCCGAAGATGTTCGCCCAGGCAAACTGTTGCCAGGGTTCAAGTACGAT
+CTTCCCGCTGAAGCCTTGCGTGTGCTCAAGCTCCTGGGCAAAGCTGATATACCTGTTGGC
+ACATTTCTCATCAAAGTAGTAGGGGAACTCCGGAGTATTCTGCCGTAAGAGGTCCTTCTC
+CCACCTGGCCACGGCAAGCTTCACCCACCTGCAGGTAACGATCTTCCCGCTTGCAACATC
+CTGGGCATACTGGCGGTAGGTAAAAAGGCTACTCATCAAAAGCCCCACAAGTACGAGTCG
+TTTCCACATCATCCGGCCCCTTCCAGAAGGCACTCCATGGGGTCCTTCGCTTCAGGTGTG
+TCGATTGCATTTACGCGGGAGCGGGTTGCAGGCGAGAGCCCGAACTCTGCGGATATGGTT
+TTGACCATGGACAACGCCTGCCGCATGGCCGTGTACTCAGGCATGGTTTGAGAATTCTTA
+CCACTCATGTACTGGGCTAAACTGCGCTTTTTGGTTTTCCCGGACTCCTCATCTTTGTAG
+TGGTAGACCGCGTACTGTGCTTCCCGGTACTGTCCGTATGCCTCGCATAAGGCTTCCAGC
+ATCGTGAGGTCCGCTTCCGAGAGTACACGGGTCTGTGCAAGCACCTGGGCAAGCTCCTTC
+CACTTGTTCTTTGCAAAATTGTTGAGGTGGCTTGGCGCCTTGGGCGCCTCATCAAGTGCC
+TTGACCTCCGGCTCCTTCTCGTTGGCCCGGTCCTCCCGAAAGGTGCCATGGGTTAGCTTT
+AAAATAGTCGGCTTTTTGTTGTGTCCGCCGCGGCTCATGGCCTATACCCCCTTTGCCTTT
+GCTGACAGAGTGTTTTCTTGTATGGGCGCGTGGTTTGGGCATTTTTCCCCCAGAGATTTA
+CACCCCCCCTCCGTCACTCGGGCTGTGCTCTGATTGATGATAGGAGAGACAGGTCGGGGT
+TCCTTCCTCTTTCTGTTGCCAAACCCGTTGTCAAACTTCGCGGTCTTTCTGCTGTGTTCT
+CCATGGAGCCGGGGGATGAGCTGGTACTTTCGGTGATCTGGTTCAATAGCCGGGTCATAG
+GCGGGATTGTGGTCCACATCGTACTTCGGCCACAGTCGCTTTGGGATGCCCCAGGCCTGT
+AAGACCTCGATGCGTATCTTACGCCAGGTTGCTCCATACCCGCGCTGTGTTGATGTCTTC
+CGTCTATCCTGCCTTCCCATAGTCTCTCGTCCTCTCCTCTGTCAAAGCCAAAGGGCACAA
+AAAAAGGCGGCGAAGTAGCTCACGAAAGACACCTGTTACAGTGTTTAACGTAAGGTACTT
+CGCCGCCTGATTGCTTCTTGCACCATTAGAGCGACCGGAATCCGTCCGGAACGGCCAAGG
+TAAGCATCCTTACCTCGGGTTATCTGACAAGAAAAATCCTATCACGGAAAAATTTTTTTA
+TCAAGTTAAAATGTAAAAAATATATTAAACTTTTCTTAATCTATTCAAAACGTCATGATA
+ATATTCACGCTCCCAGTTTTCCCAATCATAGAAGTATTGATCAATTCCACCAATAGCATC
+TACACGTATATGATCTCTTTCATAACGTCCACCACCAAGCATTGCATATGCGGGGTGTGT
+CGGCAAATCGTGTTTCTTCAGATATGCGAATATCTCCCATGTTTTCCATAATGAAAGCGG
+TGCTGCCGTTTTTTTTGAAGTAATCCCATGAACAAAATACCGTATTTTTCTGGTGTTAGA
+TTCTTGCATCCTTATCCCAGTTATGCGTCGCCCAAATTCTTCAAATAAATAATCTCCTTT
+TTCTTTAAAAGGCTTCGGACTATACATATTATCTGGCGTGTATTCAATCTCATATTCGTA
+ATATCTAATGCTAAAACGTTTTAAGAATGCATCCCTAACCGGTAGGCAATCAGGATTAAA
+GAATGGCTTTTCTACAATCCAGATGAACGGTACATCTATGCCGGCACATACGCACAGATG
+TGCCAGAACAACTGAATCTTTACCCCACGACACAGAAACGTAACAGACTTCTTTAGCAAT
+TCCTTGAATATCAATGATTGCCTGATCTATTTTACTTTGTTTTAAATCAGCTGCCCGTAT
+ACCGTCCGCTTCCTCTAATTCTTTCCACAGCTTCAAATCATGCGATGTATTCCTTTCGCT
+TTTAATCAACATGTAAATACCCTTTTTCGTCTTCCCTGATCGGCACGACTACAGATAAAT
+CATTTACATTGCGGGTAATTGTAGATTTGTTCACGGAAAAGACTCGTGCAAGATCAGATC
+GTCTCATAGGCTTTTGTTTTAATAATTCTTCAATCTTCCGACAGCGTATATATTTTGTTT
+CAAACATCGAATATTTGCCACGATCAGACTGTTTTAATTCCCTAAGAAAATCTAACATGG
+TATTGCAATCTCCATAAATGTATCAGGATGCCAATATGGTGGGAATGCTCCTCCATACGA
+ATGGCGGAAACCATACCAGTCTTTAACGGCTTCAATCGGCATTGTTTTCATCAGAACTTT
+TTTACCTTGGTGCATTGCAAAGATAGAATTATCTTCCTCTTGTTCTTCATACTCCCATCC
+TCCGATAATTCCATAACCGACATTTCTTAAATGACCAAGCGAAGGAATTTTTTTCAACAA
+CTTATTGATTTCTTTCCTATCGCCGCGAACGAACCAGCATATTTTATCTATAAGCCGAAT
+ACGGAGCGGAACAAATCGTGATTTATATGGCCCTGACGATGTTAAGAGTTTTTTCCGATG
+TAATGGATGCAGCATAAGAGCGGACAAATCTGTGTCAAATCGCTTTGATTGATGATCGCT
+CCATTCTGCTTTGACCTCTCCAAGTATCGGATCAGAGCAACAATATACGTCGTGTCCACA
+AATTGTCCGCTGTGCAAGTGGTATAGGAGGCCTTTTGATTTCAGAAAGAGAAACATTACG
+TGTTAATTTTCGAGCATGTTTCATTCCTAACCGCATGGATAATTCGTATTCCAGAAGCGA
+GTCGATAAATGGCGCATCACCGCAGAGCGGTGATAACAGGTGCGCCGTAACTTTCCAGTT
+TTTTATCATAACAATTCAACCTTTGAAGGAAACGCTTTTGACAGCCATCTTTTGAATGCG
+TCTGTGTTTGCCTGCACGTGATCGATATATTCCTGTACCAATTCATCAGGGCCCCTTTCT
+GTTCCAAACCAGTCTGTCAGTCCATCAATCCAAATTGATGATTTTAATTTTCCATGGCCT
+ATACGTGCGCTTCCACCGATGATGCCATCGTTGTCTTGCCATAACTTAATGGCATGCAGG
+GCTGATCCAACCTCAAGCGGAGAGACATTGTAAAGCGTTATGTCGTGATAAAACAAAGCT
+CCAGGTATAATGTTCTCTCCAGAGTAAATCATAAGGTTAGATTTTTTTTCTGCTATCTCA
+CCGAGTATTTCGGTAGCATCTTTCATGCGAGACGCATCGCCACGGGTATATTGATATTTT
+GAAACAAAATGTTGTGCGGGCTTTAAAACACCATCAGGTAATTCGTAATCGCCAGAAAGT
+TTTTCAATTACCTCTTGATTTTCGGCACAGCACAGAAGTCCACGAGAGACAAATAGCGAG
+CCACCGACTACCTGATTTTTCAAGCTTCCTCCGAGCAGACGATACAACGGGGATACTTCT
+TGAAGCTCTGCAATAAGCGGAATATTATCGTTCGTTGATGACTCGGTAAGGCTTCCTCCG
+GTCAGCATATAATTCGCCTGATCGATGGTGAGCTTTCCGCGAAGTCCACATTGATCGATA
+AGATATAGCGCTCCAGGTTGTCTTATCATTTTGTGCCGGAGAGCGTTTCCGGAAAGAACA
+GGGATTTCAACAACGTCGTTGTCATAAAAAACCTTTTCGCGGTTAATGATAGACTCATTC
+CCGGAGACTCCCATCATGTGAGTAATAGGAGAAAGCGCTTCTGAGAGAAAATGTATTTTG
+CATATTCCAATCTGTTTCATTACTTCTCCACCTTCTTTGTATTCCATAAGTTCCGAGAAT
+AAACCAAAATAATATTGTATTTTTTCTCCATGATGTAGAGAAAGTGCTTTTTCCACTCTG
+TAGGCTTCGTTTCCATGCTTTCGAGAAAATAAGCCAACTCTTCACATGATGCAACTTTTC
+CCGGATCGGCCTTGATAAACTCAAGGATAAGATTAACAAATTCTTCGAAATCCCCTCCAC
+ATTTTTTCACTGATGAAACGATTCCGTTCCCGATTCGCTCCCATAGAGTTTTACGATCGA
+AATCATCAGAGAAGAGCTTAGGTAAACTCGAACAGAACTTGATCGCTTCCTCCTTGATTA
+CCTTCTCTTCCATTTCCGGTAGACTTTTCGACGTATCTACCAATCCCGCCAGCTTTTGAC
+GAAATTCTTGTGCTGATAACAAAGTCATTTTTTGCCTCTTCCTTTCCCGGGCATAACCAT
+GCCGCGAGCTCTCCCAATGGGGAGGAATAGATTTTAATCCACTCAACGAGTGGGCCTTCT
+GAACCATACAGATCGATAATGTTTTTATAATTGATAAACTCATCAGGATTTTTTAATGCA
+ATTTTCCCGATAGCAGCAGCGACAAGTTTTGCTTTTTGTAAATATTTTTTTAGCGTTGCT
+ATCTCAACGCTGATTTCCTTTTCTTCAAGAAGTACGGAAAAAATGTTCTGATCATAATTA
+ACCGGCGCGCGGAAAATAAGCTGCTTTTGTCCAGAATCGGCAAGTACGATAGAAAACGGC
+GGTTTCGGAGGAGATAAACATATCCGGCGCAAAACGCGCAGATGTTTTTTTGTCATGGCT
+AATTTTTTATTTTCAGTCAGTACCCACGAATACATTCGCGGTTGACCAGCGCGTCCTATT
+TTAGTTGTACCGTCTATCTGAGTAACTTCATAAATCCCTGATAAAGATTCAACGCAGCAT
+CCGCAAACATAGTCGGAACCAGGATATTTCACAATATCGCGATTTGTGAAAGTTTGTTTC
+ACATATTTTTTCTTGGTGTATGTTCCATCGCATGGCATTCCGCAATAAAAGCATCGATGT
+TCCCCTATATTATATTTATTTGGTGCAAATAGATATGATGCTGTTATCATATTTCAGAAC
+CTTTAACATTCTTATCCCTGACCACTTTCTCCACTCCCCTGATATTCCCGCCTTTCACAT
+AGAACGACACTACCACCTCGCCGTCTTTTATTTTCTCAAGTTCATATAAAAGCCAACGGA
+TAGAGTTAGCCACACGCTGATCCTTACAGTCTGCCGATATCATCATATTCATTGCCCCTC
+CCAAGGCTGAAGCCTTACTCCCCGGATAGCCCTACCAGCTTCATGATCGGCTCAAAGTCT
+CCACACGCTGGCATATGCCGTGTCTCTTCCTTATCAGCCGCAAGACAACCGGGGGAGTAG
+ATTCCAATAAGCTCCTCAGATTCGGCAAAGCACTTTTCGAAGTTTCGGCAATTTCCACAA
+ACTTTTCTTACACCATACTCGTTCATGCATTTACCTCTTGCCGCACCTGTATCGATGTAA
+CAGCTCGTTCAAGATCAACATGCCGGAACCGGTAATACGCATTACCAGCTTTCATTTCAA
+TGATCCCTCGGTCATAGTCCGTTATATCAAGGACTATTTCCTTTTCAATAGGATCATCCC
+CTTTGAAAACCGTCTTTACCGCCGGAATCCTTTCTTTCAGGTACTTATCTGTTAATGTCA
+TTCCGCACTCTCCTCGATTTCTTCACCGGCTTCACCCGCCGCTTTTTCTTCACAAGGTTC
+TCGATCAGGTTATGCATAAACTGTGCCGCCTCTTCCCGCTCGGCCACCCGCTCCTCAATC
+ATCTTCCCGTCCCCCTCAAGCAGGTTCGCCGGCGGAAAGTAATGCGGGTACAGCCGCTCG
+TCAGCTTCCTTCACGATCGCCAGATCACAGGGTCTCCCGTACTTCGTCGAGTAGCTTTCC
+GTGATCTCCTGGTACAGCCGCATGAGGTAATCCCCGGACAGCTGTTTGTCGGCAAGCCAG
+TCTCCAAGTGCTCCCGCGTGGATCGGCGAAAGACGCCCGTAGTACTGCTGCAACATCGCC
+ATGAATGTTTTGCTGTTCCACTGCATACGCCTATCCTCCCACCGCCTGCTTTGCCTTGCC
+TCTCACCCCGTAGGGGTCAAGCGCCTCCCACATCCTCGCACCTTCCAGCTCATCGGCCGT
+GATCTTCAGCTGCTCCGCCACCCGGTCCCAGATCCCCGAAGCGTTGAGGGTAGACGGGAC
+AAAGGGCTGATCTCGGTAGAACCGATCTCGGGAATTTTTTAACCGCCATAACTCCCCGAT
+CATCCGCTCGGCACACCCCGCAGGGTCCTCCGGTGACGCCCGTGAGCATTTCTCGATGAT
+CCCGTGGATCGCCTTGCCTTCCTTGCCCCAGTTCGAGAAGTCCCCGACAACGGCCAGGAA
+GGAATCCTTGATCGAGTGGTACAGCGGGTCTGTCGGTTCTTTCCCGCTTGAAGGCGGTTT
+TCCCTTTCGCGTTTTCGGTTCCGGGCATTCAAGCTTGAAAACAGGCTCCGGGGAATCGGG
+TTCCGGATCCTCCGGTGGTGAAACCTCCCTGTCCCGCTCAGGCTGAGGCTCGGCCGAAGC
+TGCCGCAGGCATACTAGTCTCACTTCCCTTCACTTCACTTCCCTTCACTTCTGTGGTCAC
+TGGTGCACTACCGGTAGCACACTGGTGAGTCACCGGTGACTCACTGGTTGTCGAAGGCGC
+TTTGTCCTCCATTTCCCGGTTGCTCACCGGTGACTCACCTCTGGAAAAACAGGTCTCAAA
+GGGATACGGGGCTTCACTTCCCCTCCTGAAGGTCTCAAGCCATTCATTCCGGTATTCGTC
+CGTCAGATACTCTTTCGGCGGCCGGCGGAATTTCGTCTCCTGCGGCTTTCGTCCTTTCAG
+GTTCTGATACTTGAACCAGTTCGGGAAAAAGGCGTATCCGCCATACAGGCGGACAAGACC
+ACAGGCCCCGAAGTCTTCCAGGGCCTCTTTGATCATATCGATGGTGATGTCCTTTCGTGC
+CAGCCTGAAGTACAGGCTATCCGGTTCAGCCTCGATGATTCCCTCATCGTCGGCATTCGA
+GATCATCCCGATGAAGATGAGTACCGACACCGAGGAAAGTTTCATGATCTTGGGGTCCGT
+CCAGATCCCCGGATCTATCATCCTTTTTTTTGCACCCATAATATCCTGTCCTTAAAAGGG
+TATGTCGTCCTCGAAGTCCATTTCCTGATCCGGGCCCTGATTATTCGGTCCGGGGTTGAT
+CGGGTAGCCCCACTGATCATAGCCGCCTGTCGGCTTCTGATACCCGGAGTTAGCCCCCTG
+TCGACGTTGCTGTCCCTGCCGGGAATTCTGCTGTTGCCTTTGCTGTGGAGGCTGCTGAGA
+ATAGCCGCCCCGCTGGTTCTGCGGCGGTCCCTGGTAGGGGGCTTCTCCATACTGCCCCTG
+CTGGTTACTCTGGCCGACAGGCTTTCCGCTGATCAGCTGTACATCCTGGGCAAAGAACGC
+TACCCTGCTTCGTTTCTGTCCGTTGTCTTCCCACCGGTCTTGTCTCAGCTGTCCTGAAAC
+CACCACCTGCTGACCTTTGGTGAGATACTTAGCAAGTGCCTCAGCGCGTTTCCCGAATAG
+GGTGAAATCAAAATAGCTGACTTCCTCCTGCCAGTTGTCATGCACCTTCCTGCTGTAATT
+CGATGCTATGCTGAACTTACACAACGGTGTCCCGCTGTTCGTATATCGCAACTCTGCATC
+ACGGGTAAGCCTTCCGACCGCCGTGAAACTGGTAATATCGTTTGCCATGGTTCCTCCCTA
+AAGAACGCCAAAAAAGTCATGGTTCTGTTGTGTGATCGCCTCGTACTTCTTCCGGTAGTA
+CTGTGCAATCGTCCGAATCTCTTCCGTTGTAATCTTTACGCCGGACCTCGATTTCAGGTA
+AAGCGCTTTGTATGCATCCTCTCCGTGAAGCGTAATGAAGTAGCAGATAAGCTTCCCCGG
+ATCCCGGTCATGCTCTTCGTTCTCTGCTGCACTCTGACAATAAGCATTCATCTCATCCCA
+GCGGGTAGCGTAGAATCTTCGTGAAAACAGGTGTGAACAGGTGAGGTTCTGTGTACAGTT
+ACTTGTCACTGACCGGTTACCGTCCCTCTGTCGTATGTAGAGACTGAACCACCGGTCAGC
+CGCATCTACAGCCTTCTGTCTTCGTACCGGTTTGCCTTTCGCCTTCGTCATGCTGTTATC
+CCTTCAAGATCAAAAAGTGTAGGCGTTGCCGCTTCAATATCAGCCGCCTTAAGATAGGAC
+AGCCCATCCTTGAAACTCTGCGGGTTTAGCTCGTACCCGATACCATATCGGCCCATTTTC
+ACCGCCATGTACGGAACGGTCATGAGCCCGCCGAAGGGATCAAGCACAACTTCTCCTTTG
+CTGCTGTACCTGTTTATGATCCGCTCCACGATGTCGAACTGCAAAGGGCAGATGTGAAAC
+TCAAGGTCCTTTCGGGCCTGCTCCCCGTTGAGCGTTCGCATACGGTTCACATCGTCCCAC
+ACATCAGGATGCCAGCTCCCAGGTGCTACGACCATGAACCCGGAGGGCAGTTTCTCACGC
+TGTTGGAGCTTTTCTGCCAGGTTGATATGGTCGTGATAGTCATAGACAGAAGCACGGGAG
+AACTCTCTATAGGTTTTCTGCATATCGCCTACCGATACCTTTTCAAGCTCTGCACTTGTA
+AGAAGTCTGTCACCGGATGACCGCCAGAATTGATGAGCATCGATCTGCCAACGGGATCGC
+GGGTATTCTTGTTTTGTTTTTTTGACGGTCTCATCTGCGTAGGCCCTGGATGTATCGGTC
+GGCAGCTTCCGAAATAATAGGATATACTCCGGGCAGCCGACGCCCATCTTCGTGCCGTCC
+TTACATTGTTCAGTCCATCCGAGACGGTAGGTCTGGTTATTCTCGCGGACCACATCGGTG
+ACAACAGTAATTCGGCCCATGTACATAAAGCCGTGCTTCATAAAGTGGGATACGGTAAGA
+TCGCTGAAAGGATCAACTGTCGGCATTCCGCTTCCGGTAGCATTACCGAAAAGGATCCTG
+TCTTTCACATGGATAGCAGCGACCCGACCGGGCTTGAGAACTCGCATAAGCTCCGGAGTA
+AGATAGTCCATCTGCTCAAAAAACTTGTCATTGTCCACGTTGTGGCCAAAGTCGTTATAG
+GTCGGAGTGTATTCATAATGATTTGAAAACGGGATCGACGTATGAATAAGATCGACTGAG
+TCGTCCGGCCGGTCTGCGATCGCTATGACATTGTCGGCATTTACAGCCGTCCAGTTTTTC
+CCCTTCTTGATGATCTTCTTTTCCCAGATCGACCGCTCAAGGCGGGTGACAGCATCGAAA
+GAGTTGAGCCCGTATTTCCGGACGATCTCAGTCATCATGTCTACAAGCCGCCGGTGCTGT
+TCCCATTTGTGCATGAGTGTTTCATATATTGACCGCTCGCTTTCGGTGTAGATGATATGG
+ATCTCCACCTGCTCGCTTTGGAGAAAGCGGTAAATACGGTGTACCGCCTGGATGAAATCG
+TTGAACTTGTATCCGATCCCGAGAAAAATAGCCTTGTGGCAATGGTACTGAAAGTTTGCT
+CCTGAGCCGCTGATTTCCGGCTTGGTAGAAAGGTACTTAAACTTTCCATCGGAAAAACCT
+ATGGCGTTCTCCGCCCGTTCTTCTTCTTTTTGGCTTCCGTAGATCCAGCGGGACTCCGGC
+AAAGCCTTCTTGATTGCATGTCTCTCTGCTTCCAGGTCGTGCCAGATGATGTAGTGACTA
+TCAGGATCCGCGTCGATGATCTCCCGCATTTTCGCTACTCTGACATAAATACTTTCTCTC
+TTTTCCCTGCTGGCATCTTTTAGGCCGGTGGTTGCATCGCGGAACATCTTTACCTGTCCG
+TCATCCTCAGTACCTGCGGTTGAGTGGTCCACCTTGAGTTCATGCTCTATTACTTTAAGT
+TGAGGCAGGTCATACCCGGTATCATCATAGCCAAGGTCTGAAGGTTTGGTGATGAAAAGA
+GCCCAGGTGGAAAGCCAAAGCCAGAATTCTTCCTCTTTATGAGGGTGAAGCTTAAGATTG
+TTTGCCTTGGTACTATCTCGTTTGAAAAAGCGGGTAAGTGCCTGGCCCGTGTCCATGATC
+TCCAGATACCCGGCGTAGTGGATCAACTCCTTGTATTTGTTCGGCGAAGGCGTGGCGGTT
+GCGACGTACTTATATTTTACCCCTTGAAAAAGGTTCAAGAAGGTCTGATAGGTCTTTGTG
+CCATACCCGCGAAGTACCGATGCCTCGTCAAGGCTGGTGACAGTGAAAAAGCGCGGATCA
+ATATCACCATCTCTCACCCGCTCATAATTTGTGATCAAAAGGCTTGCATCTGCGCCTTTT
+ACCTCATCCATGGTTCGCACATAGCAGAGTTTGACTCCGAGCTTTCGCTCTGCGTCCTTG
+GCAAACTCGTGACGGACTTCCAACGGAGCTACAATGAGCGATTTACCTCCTTCGTGTTCG
+ACAATCGTCTTGCAGATAATAAGCTGCTGAATGGTTTTGCCGAGTCCAAAGCTTTGAAAC
+AAGGCCCGGCGTCCTCCTCTCAACGCCCAGTTGATGGAATCCCTTTGATGTGGCTTGAGT
+TTCGTTCCGTCGAGAAACTCGATATTGCCAACTTGTGCATCAATACCAGAGTCCGGTGCA
+ATGCACATTTTATCTTTCAAGAAATCTATGTATGGTTTCATTCTTAGTCCTCGATGAGTT
+CAATTTCCATTTCCGCCGCTATCTGGTGGATAGCTTCGATGAGGATCGATGCATCCTCTG
+TACTGCACTGTGTTTCACTGATCCCCTGGATATCTCCCCACAGGTCGAGTATGGGCTCCC
+CGGATTCGTCCTCAAGGATCGGGTAGCCCATGGTGACGGCAAACTGTTTTGCAAGCCGCT
+TTACATCCCCGAAGGGCTGGCCGGTTTCCACTGATATCTGTTGACAATGGCCGTTGATAT
+GGTGGTTCTGGCTGCCATGCCCGGTTGTCCGGGGACGGTGGGGCACATCGATCGCCAGCC
+AGTAGTACGGGGCCGGGGACCGTCGTTCGATCTCCTGGTAGCGGAACAGGTGCACAAGGT
+ACTGTTCGAAAGCCTCACCCACCTTGAAGGAGACAAGGCCCCGCTCGCCGGTTTTGATAC
+GCTCGGCCGCGGGGATGATGATTGTCCGGGGACTACTCATGACGTTTTCGCCAGATTGAT
+CGTATTGTCATATTCGTAAACCCAAACCCAGGGGTTTGCATCCCAGCCGAGGCCTCGCTC
+TTTGTAGATAGCATCCCAGACAAACGCAAACTCATGGCCGCATCCTTCGGCTTCCTGGTC
+ATCGGCGCTTATATCCTGTACTCTCTGTAATCGAACACCGGTGATTCGGCGTTTAGTCCG
+ACAGGCCCATTTCGGCATGTGGATCGATGGATGCCATTTATTTTGTTTAATGTCGTCAAC
+CGAAAAATAAACAGTTCCGTAATGTTCAATAACATTGGAATCAGCCTTATATCTAATTGA
+TGTGCCAGAAGTTGAACCAGACCAGATAGATATAGGTTTCCATGTCTCTCTGATCCAAAG
+CACATCACCGACGCCTCCATACGGGCCATGCTTTTGCAATTCACTGAAACTACCACAACA
+CTCTATCGTTTCATGCTTTCTCTGTTCCCACCACGATATGAGCTCCGGCTCGTATTCTGA
+TCGACAAAACTGGTGTTTAACAGGCCGTCTTGTCTGCCATTTCTTTCCGGCAAGATCAGC
+ACGGACCATATCGGCGTTGAAGATGATTCCGTGTTCTTTCATGATTCCATGCACCTTTCC
+TTAAAAGATTTCCAACTCTTCAGGCTCCGGCGTCTGCGGATCCCCGGAGCCGTTACCCGA
+TATAGGAGGCCTCTGCCCTGCTCTCTGCTGCTGACCATAGAGCCTCTTCTCTACCATCCG
+AATGTAAGAGTCGAGCGTCTTCCCAGAGTGCTTCTTGCTGTTTGCAACCATCGTGTTTCT
+TTCTTCCCTGGTGATCAGTTTCCCGAGAAATGCCCCGTCAAGTCTGTGCTTGAAATCCTC
+CCGAACCTTTGCATCCGGATCCTGGGCGGCAGCCTCGGAGTGCTCCGGAACCTTGGTAGA
+TTCTTCTTCCTGTACCGGCGGAGTACCCTGTTCCTCGGTAACATCTCGGTATCCGGTTTC
+TTCGTCGGAAAGCTCATCTGCGGTATACGGCATGCCTCCAAACTCATCGGGAAAACAAAA
+CCGGAAGGCCTGGGCGATGGCCACCTTCTTGATCATGGTCACCGGCTTCTCGTTCCACAT
+ACGGTTGTTCTGCTTGTACTCAATCCACCACGCTTCATGTACAAAGGGATTCTGCCAGTC
+CTTCCGGTGAATGGTAACAATGGCTCTGAGAGAGCGAGTTCTGATCGATCCGGCCGTTTC
+GACACTCCACCCGTCAAGCTTTTGGGTTCGCTCCGCCCGTTTGAGATAGACCTCGTAGCC
+TGTTATGATCGACAGCCTCCGGTTATCTCCTTCCCCGTAGGCCACACAGTATATTTCACG
+TTTGAAGGGGTTTAGCTGGTAGGCCTTGGCCACCTCGATAAACTGCCGTTTTTCATGATC
+GTTGAGGTTGTTGCCGATTCCCGAAGCTTCCATGTATTGGATGATCTTGTTCTCGGAAAC
+CACGTCCTGACTCTGCAGATCGTTCACTCAAGTACCCCTTCGTTGAGGGTCTCCCGGATC
+ACCCGCACCAGGGTTGCAAGCCTCATGGCAAAGAGGTCACGATTTGCCCGGTTGCCGTTC
+TTAAAGAGGTCCTGGATGAGATGGTCCATAGACTCAAGGTGTTCATCAATTGCCTGTATT
+TCCTGATTTTTGAATCGGATAGTGCTACTTTTCGGGTGATTCATCACAACCTTTCTTTTA
+TTTTCTCTAACCGCTACCGGTTCGGTAGCGGTTTTCATGTCTGTACTGCTCATGTTTTGC
+ACCTCGCATTGATCTTTGATAAAATCCTCTCCCCGGAGACCATTCTCCGGAGAGAGCCGT
+TTGTGAAACATGTTTCCCCCACATCCTCGTGGTTTCGGCGTGTGGTTGGCGCCGTATTGG
+GACCAGCAGGATTCGAACCTGCAGAGGTTAGCGCTTTCATGGTTGCAACTCCATGCCCCA
+TTTTCTGCCTGAACGCTGCTGTCAGACACACTCATCGGAATAGGGTCCCGATACGATACC
+GTTTCGCTACAGTCCCAAGGTGCGCCACGATTCCCCGGCGCTCGGTAGCTACTGACGTAG
+CCTCTTCCCGTTGGTAGACATTTATTAAGGCCGTCTTGAACGGGATGCGAAACCATCCAG
+CCTTTAACCAGTGTCCGGTTTGGCCCGGAGGTGAGCGATCTGGAGATTTGACAACCGGAC
+GAACCTATGACCTTTTCAGGCTCTCCCAACGTAACGTTGCTCACTGCGTATCCTCTCATC
+TGCCTTCCGCAGACTCACTGGTTGCTATTTTTGCCAGGCCGGCATAGCTGCCTGTGAAAA
+GGGCATCTCTAACCGCTTCCGCCGGTGGTGTTGCTCGCCCGCTTGGGTGGTATCCACTCG
+ATGCCAAATACCTGAGATGCAATGATGACGATTACGTTCATAACCACTCCCCAGTCCGGC
+AGGTCCCAGCCAAACAGCTCGGCAAACGCTAAAACTGCGGCGGCAATCGCGGTCAACGCA
+TAGGCTATAATGCGCTTCGTTTTGTCCTTCACACTTCTCTCCTTTCCCGCTTTCGCGGTG
+TAAATTGCCGGTTCACTGACCGGCGGCAGTTCTATGAAACGACCTTGATACCGTCCAGGC
+GTTCAAGGAAATACTCTGCAACCCTCTGCACCGCTTCGATCTTCCACTTCCCCCCGTCTG
+CCTCGAACAATGCCAGGGTGGGAATCTTCCCTTCTTCTGCTTTCATGCGGAAAAGTAGCT
+GGCTCTCAGGCTGGTCGATCTCCCGGAAGGTCCGGTACGGTTTGAGTGATACAATCGGCT
+TAAATGACCCGGATTCTTTCAAAGCGCCACTCATTCCTCGCCTAAGCGATACTTCCTGAG
+TCATTCCGTCATCACCGGAGACAACTTCATCGGTTACCGTCAGGCGCGAAGTAAACTGCA
+AAAGCAATTCTTGGTCCTCAGTCGGAACCAATAAGGATCGGAGCTTGATTTGAAATTCTT
+CACTTACCATGAACCGGCTGAAAGGGAAGGTCTCAAAACCGTCACTCAGGTTGACCTCGG
+CATAGAGATCACGCTGACGTTTACGTCCGGCAAGTTCCCCGTAAAGGCGGACCTTTTTGT
+AGGACACAACGTGAATGAGTAGCTCTTCTCTGTTTTCCAGTTCCTTGTCGATCGGCTCAT
+CAAGTAAGTCGACAAGCCCCTGGAGCGTTTCGAGCTTCAAGCCCTCCGGGTGAGGTTCAA
+ATAGAATAGGTTCGAGATTCGGGGATGCATACTTGATCCCGTCTACTTCCAGCTCCAGGC
+TTTCCTCCCGGAGTTTTGCAATTTGCTGTACGGCTGTTCCGTCCATTTACTTTGCCCCCT
+GCATTTGTACGATGTTCTCTTCCATGGGAAGGTCCTGCTGTCGCGGATCGGTCGTGTAGG
+CTTCCATTGAGCCTCCGCTCTTTGAGAACAACACGAACGATTCCGTCGGTTTGATCGGTG
+CAAGTTTTGTTTTCACACCGCAGATTGTGTTTGCGCTGCTCCGGTCCTTTGACGGTTTCA
+CCTTCACGCTGACGGTGACTTCCCGGGTGATCTGGGCATCACAGTTATCGTCTGCAATGT
+TGTCCATGATCTGCTGCCAGGCTTCGTCAAAAAGATCGATGACAGCGCCTTTGTTGAGGG
+TCTCTATCGTGACCCGCTTGTAATCTTCTGCCATTGGTCCTCCTTCAATTTTTGATTTGT
+AGGATTGCAGGACTGGGATTTGAACCCAGGGCGACGGGGATATGAGCCCCGCATGTTCCC
+ACTACACCATCCTGCTTTGTGTCATTTACTCGAATGGTTTTATATCGAGTTGTGTCTTTC
+CTGATTGGATGGTTTCGTATCGGTCAAGTTCCTTGATGATGAGCTTGCGAACCCATGTCG
+CACGACCTCTTCCTGATGTTTCTTTTAATGGGCCATTATCGATTCTGTTGATTTCATTCT
+CAGTTAGAACGACTTTCACAGCTGGAGGGCTTTTATGTTCCAATTTTGCTCTATTCATAC
+ACTCATAATAGAGCAATAAAAGAACAATATCAAGTGTTTTTTGTGACATTTTGCTCTATT
+TATTGCCGATAATAGAGTATGGATTTCTGGGAACGGTTAAAGACCTTAATCAAAGAACAA
+AAGACAACTCAAGAATGGGTTGCAAATAAAACCGGCGTGAGTTTTGGAACTTTTCGAAAG
+TGGATGTCAAGAAAAACAATGCCCAATGCGGACCAAGCCGTAGAAATAGCTGATGTTCTT
+GATACTACCGTAGAATACCTGGTAAAAGGTAAGTCTTCAGATACCTGGCAGCCTCCGAGA
+CGTTACGCCGATATTGTAAAACTGCTCGAAGAGCTTGACGACTCGGAACTTGAGGCCGTA
+AAAGTCCTGGCCGAGGGGTACGCCTCCAGGAAGCGAAACAAACCCCAGAAAGAAACGTGA
+AGCCAGGTAGCTGAAAAACCCTTCTCTAATCTGTCAAAGATCACCGATCTGAGGTTCCGG
+CCGGGTAGGCCAAAACGTCACTCAACCCCTCGTAGTCGAACGCAAGATTTCTTTCGCGGT
+AGCGCCCAGGCCACAAGATTCAATGCCGACAAATATGGCCCTCAATAACAGACACAAGAT
+AATCGGGAAGAGTTCCAGCCGAATGCTGGGCCATGAGCTCAGCAAGCACACCGTCGCCTA
+CATCCGGACACGTTAACAATGCTTCCAGGTACAGCGCCCGCGTCTCCGATGTGATCTCAA
+GCCACTCCTCGATCTGCTCTTCTGTCCACATTCGCTTGCTACCCTCAGTGTGGTTAGAAA
+AACCAGCCATAGGCTGCATGTGACGAACAGAGGCAATGGTCTTGTAGCTAACTCCTTTCA
+GCGCACTTGCCGCCTTCATGTCATACAACCGTCTTCGATTGTTAATTGTGTTTGCGGTAA
+TATCTCCGAGCTCCTCTATGGCAGTAGCTAATGATCTGAATGCGGATTGGATTCTTTCGG
+TAATAACTTCATTCTCTTTCATGCTACTCCCCTACTTTCTCGAATGGCTTTGAGTCGAGT
+TGCGTTTTGCCGGACTGAATGGCTTCCCATTCCTTTACGCGGTTCATCATCTCTACTTTT
+AGATAGGGCCCAGCCTTCCGGCCAGTAGATTCGAGGAAGCTAACAAATCTGGCTCTCTCA
+TCTTCGCTGAATGGAATGGATACCTTATAACGACTATCTTGTTGTCGTTTAGCAACTTTC
+ATAACTGTATATTATGGTCGATCAACAACTTTGTCAAGAAAAATATGCGTCATTTGACAA
+CATTTTTAGACGATAATAGGTGTATGGAATTTTGGGATATAGTCAAAAAAGAAATAAAGC
+GGCAAAACACTACTCAAGAATGGGTTTCTAATCACTCGAATATTAGCTTTGAAACATTTC
+GAGGATGGATAGCAAGAAAACGATTACCTCGAGTTGATGATGGGGTAAAAATTGCCCAAT
+CATTGGATACTACCGTAGAATACCTGGTAACAGGAAAGAACCCCGACAACTGGCAACCTC
+CGAGACGCTATGCTGATATCGTTGCAGCCTTAGAAGTGCTTGATGATAAAGACATCGAGA
+CGGTTAAAACATTAGCGGTTAGCCTGGCAGAGAGAACAAACATTGAATATCGCAAAAAGA
+GAGACGCTTAACGTAAAAAGTTGTAACATTATTCCTTTTAGACGTTAACATTTTTTACAA
+AAAGTGAATCTCTCATTGATTTAATCGAGTAGTCGTTTTAACATATTCAAAAATAGAGTA
+TTGGGAGATATAAATGAGAAAGAAGTATGCAATACTAAGTGAAGACGAGCTACACGAAGA
+TATCAAAATCATACCACCGAATGATGACAAGATTATCGAAATAGCCGATAGAGATGGTAA
+TACGTATTCAGTCAACATGAAAGAGCTTTCATGTACCTGTGAAGATTGGGAAACTGATAG
+ACATAATTTCTGCATCGGCGATCCGAGAAGATGCTGTTTTCATATCAAGAAAGCGTTTAG
+AAGAAATAATGCTATAGAAGAGCAAAAACCTGTCATAAAGGCTATTTTAAACGAATATCA
+CACTGTAAGACTGAATATGCTATTCGGAATGCTTGGAAGCCAACCGGTAGCAATCTTCTA
+TGATGATGAATCACCATGGATGGATGTATTCACAGAAATTGATCAAAACAAACAAATTGG
+TAGATCTGGATTTAACTATAAAGAAAAACGCTGGGCATATAACGAAGAGCCTGTCAATGG
+CGATAAAATAGCTTCGTTTATTGTAAATAGTATATAATTCCAAACTCTTCAAGTAGAGGC
+TATTTAAACATCAGGAGGACATAAATGAGTTTTGTTGTTTTTATCATCTGGGTTGTGCTT
+GCTTTTCTTTTGGCTTCGAGTGCTAAAAGCAAAGGACGTTCTTACGCAGGGTTTCTGGTA
+TTAGGGTTGATCCTATCGCCAGTTATCGGATTCATTATTTTGCTTGTGATGGGAGAAAAT
+AAAGACATTGTGCAGCAGCAAAATATAGAATCCGGTATTACAAAAAAATGCCCTTATTGT
+GCAAATGAAATTAAGAAAGAAGCCATTGTCTGCCAATATTGCGGGAGAGACCTCCCCCAA
+AAACCGGAAGAATAATCATGAGCGATATAGATAATAATGCAAATGATAAAAAAGCCAACA
+AGTCTAAAAAAGTAACACTTGTTTTGATCCTAATAATCATTGTTGCAATTCCGATCTTTA
+CCGGTTTTATAGTAATTCAGCCAGTTGGGGCATTGCCTGACGGTATCACAATATGGTACT
+TCCGCGCTGGTCTAAACTTACCCTTTATCACCTCGCCAGACGGATTTTCTTTGAAACAGA
+CTGGCCAATTGTCTTTAATGAGTAGAATGGTATCTATGTCAGCAATAACAACGGCGATTA
+AAGATAGGATTATTATTCGTTTGCCATATAGTAGAACTCTATACAAGATTTCAACAGGCG
+GGCAGGAGTTTGGCCAATAA
+>NC_014364.1|provirus_2976748_3014759
+ATGCCAAGGAAAACTGAACAATTCTCCATTATTCTCCGTCCTCCATCAAAGGTGTATCAT
+TTCAAGTTGGCAGGGTGGTCCAACTATAAGAGCACTCAGGTGTTTTTCGATCAGCACCGG
+GAGCGTTTTCAGAAACACCTAAACTGCAAAACAAAAGCCGATGCCCAAGAAGTGGTCAGA
+ATGGCAATCACCATTCAGGAAGAATCAAAACGGCCTATGCCATTATCTTCCCAGGTGAGA
+CTAATAGACCTGCTGAAAGATGCCTACACTTGGGACCGATGTCCACATGTCCGGCGTCTA
+CGGGACGAGGGAAAGGCTATCACAAAGCGCCATGTCCAAGACAGTCGGAACATTATCAAA
+TCCCACATCCTCTGTTGTAAAGATTTTGTGAATAAGCCAATTGCCAAGATGAGAAGATCA
+GACGTTCTGGAGTTCCGGTCATTCATGTTGGATCGGGTAGGACCAAGAACTGTCAACAAA
+GCACTTTCGATTGTAAAGGCGGTTATTAGAGAAGCAATCTTCCAGGAGGTGATCGACCGA
+GATCCTACAATCGGAGTAAGCAAGGTGAAGCTTACCGAGAAAAAAGAACCTGGCGTTTTC
+ACTAAAGAGGAGCTTCTATTGATGTTTCCGGAAAAAGGGATTGGCCCATGGAAAAGCATC
+ACTGATCATACGGTCTTCCTTACCGCTGCAAGCACCGGGATGCGGAGGAGTGAGATACTG
+GCCCTACGGTGGGAGAACGTGAACCTGGAAAAGCAGTTTATCAATGTGGTCGAAGCTTTC
+AAAGACTACCGGATGATAGAGATCGGCAAACCGAAATGGGAGCGTTCCCGGGTGGTCCCG
+ATTCCCAAGAAACTGGTCACCAGGCTGAAGGATCTGAGAGATCAATCACCATACGCAAAA
+GATTCGGATTATGTGTTTTGTTACAAGGATGGTACTCACTTGGGTGGAACTTGGTGGAGT
+AAGCATTTCCGCTCCGCTTGCATTGCTATTGGAGTGATCAAAGCTAAAAAAAAGGTCAAA
+GAAAATGAAGATCCTAACCCACGGAACCTTACTCCACATTCCTTCCGGCATACACTAAAT
+ACACTGTTACTAAGCAACGGATACGATAGCGGAAAGATCAGAGCTACTCTGGGATGGACC
+AGTGAAAAAATCCAGGACAATTATACTCATTTTTCGATAGACCACCTGAACGGTCAGTCG
+GATATGGTAGAGAGCTTTTTTGAAAAGGATAAAAAAAATGGAACCAATTAAAAACGATAT
+CATTCCGGGAAAACATTTTTTATAGCCTCTTTCCAAATTTCGCTTAGATAAATATCAAAC
+CTTACTCAACCTTTCACTTCCTAAATTGCAAAATTTTACCCTGTGTCTTCCGCCCTTCCC
+TCTTCGTTTTCCCAGCGCCTAGCCATAACCAGAAGATCATCAACTCGATCCTCCGGGAGC
+CGCAGGGCCAACTTTGCCAACTTCAATGCCTTGGGATTTGCATTCAGTTGAGCCCCCAGA
+ATATCTTTCGACTCCTCCCCGCTTATCAGGTACTCCACGGAAACGCCCAGGGCTTTGGCT
+AGCAGAACAGCCCTATCTGACCGGGGGATAGAGGCCTTTGCACTCATCCAAATTTCTATT
+GTCCTGTAATTGATGCCAGTTTTCTTTCCAAGTTCTTTAGCAGTGAAGCCATGAGAGACC
+ATTAATAGTTTTAGTCGTTCAGTAAACTTAGAAGCAGTCATACCTCTTTCATCGGCAATA
+TTAGTATGTTTCTGGAAAAAAATACATATAAATGTGTGTTTTTGTTTGACAAACACATAT
+TTATATGTAAAATAATCTTCATAGCACATAAAAACATGTGTTAAGGAGATTGTATGAGAG
+ATATCAGGGTTCCTCTTGATGAAGAAATTATCGAAGAAATCAAAACAGGCCCCCTTTCTA
+TAACAGGAGGACAGGGAGCCGCTTCCTGGGTACGTCAGTTGATCCTGAAAGAACTGGAAC
+GATATCGGTCCATAAAGAATGGCAACTCTCAGCTCAATGTAGAGGCATTCCATAATTGAT
+CAAGGTTGAAGAACGCAATGGATATCGTAAATAGAAATGAGACTATCACCTTCGATGATT
+CTATCGAAGGTGTAACCAAAACTCTGGCAGAAGCTCTGGCTATGGTTGTTTCAAAAGGGA
+TCAAGCCGGTGGTGATCGAAAAGCAGGATACCATAGTTGATGTTAAAGGCGCTGCTGAGT
+ATCTGAAAGTATCTACTGCCACCATCCATCGGATGACTAAAGATCGGGAAATTCCCTATT
+TCAAGGTGAAAGGCAATAACCGGTTTTCGATCAAAGAACTGGAGAAATACATATCAAATC
+AAATGATCCATCCTAACAAAAGGAGGAAGTAGAGGGACTACAAGAAGGGCGCCATTGTAA
+ACCTGATTAATGTCTTGCGGCTTGAGCGCTACCGCGAAAGAAATCTTGCGTTCGACTACG
+AGGGAGTGAGTGAGGCTCCTGCCTTCACCGGGCGGAATCTCAGATCAGGGATCTTTGACA
+GATTAGAGAAGGATTTTGCAGCTACCTGGCTTCATGTTTCTTTCTGGGATTTGTTTTGCT
+TCCTGGCGGCGTACCCTTCAACGAGGATTCTTACGGCCTCAAGCTCCGAGTCGTCAAGCT
+CTTCGAGCCGGTTTACAATATCGGCATAACGTCTCGGACGGATATAACCAATAAATAAAC
+TACAATTAAAATATGTAATGCAATATAAGGTCTAATCTATCTTTCTACTAAGTATTCATC
+AAGCATTGAGTTAATCACCTTAGATACAGTCTTATTGGCACCATAAGGTGAATCACCCGA
+AGCAGTACCCTCTGCCAGAATAAGCCCGGAAGATATCTCCACCCATCTTATAGAAAGATC
+AGTTATAACATTATGGACAACATCAAAGTAATATCTATATTTAAAGTGGACAGCTATTCT
+CTGAATATCCTTACCTATAGCATCAGCACTATATGTTCCTTTTTCTACATAGTTAGGGTC
+AATTCTAAGTATTTCGATATTCCTTTTATCAAATTCTTGAGAGATTACCTTCCCGATATT
+TAATGGATCATCAAGTTCTGGGAGGAAGAAAACCACATCTTTTTGTATCTGTTGACGAAA
+AGATGTGTCATAGGTGGCACAGCCAAACAGTAAAAACGTTAAGGATATGAACAATAGATA
+TGCTCGTTTCAATTTTGTGCTCCATTTTTATTCTTATGACCAATTATAGATGAATTGAAG
+AGAAATTCAACTGTGCTTTTACGATTACATTTTTAAAGATCTTTGTTAATCTGGAAAATA
+CAGGATTTTTCGCTACCCTGACCTACGCCTCTCTCTGGGCCCTATTCTGTTTTCTGGCTA
+CATAGCCTTCAGCAAGTACTCTCATAGCCTCAAGTTCTGGCTCATCGAGCTCCTCAAGCA
+GATTGAAAAGATCGGCGTAACGGTGGGGAGGCTGCCAGGAGTCAGCTTCTTCACCCGTTA
+CAAGATATTCAACAGTGGTATTGAGTGCTTTTGCAATTGCAGTGGCTTGCTCTACATTCG
+GTAGACGTCCCTTTGCCGTCCACCCTTTGAGGGTGTTGTAGCTAATGCCAGCTTTCCATG
+CTAACCATTCTTGAGTCTTCTTTTGATTTCGTAACTCTTCTTTTACTCGGTCAATGAAAT
+CCATACTCTCTTTATCGGAAAAAATACTCCATTTGGATACCATTTTTCTTGACAAAGAAT
+CCGTTCGGAGTAATAATAGCAATATGAAAGAATCCAAACGGATACCTGATGATCGTTATA
+AAGCATCTATCCCATTCAATACAGAAGAGAAAAGTAGGTTCATCTTTTTTCTAAAGGCAA
+CCGGCAGGAAGGCTGGACCCTACCTAAAGGTAGAGATGATGAATCGCGTAAAGGAATGGG
+AAGCCATCCAGTCGGGAAAGACACAACTCGATATAAAACCATTCGAGTAAATGAGACAGA
+GCAGGATCGTGTAAGGAGAACATACGGGCTCATATACGAGGGAAGAGCGACGTTTCGGCC
+TACCCGGCCGGAACCTCAAATCGGTGATCTTTGACAGATAAGAGAAGGGATTTAGAGATA
+AGGATTTAGTGCTGTCCTGTATAGGGAAACCATTTGGAATGCTGATAAAGCAGCCTCTGA
+CCAGGCCATTACCACTTGTGGGGTTCGAATCCCCGAGGACAGCAATCGGAGCGAAGCCTT
+GTTTGCATGCCGAAGCGCAATAGTGCAAATGTCGGGATTTAACTCGCCGGAGACGTAACC
+GGCACAATCTACTCCGTGAAAACGGGAAAGGAGGAAGGCGTGACAGACAAGACGAAGCGC
+ATTATTGCCTATGCGCTGACTGCGATAGCCGCCGCAGTTTTGGCGTTTGCCGAGCTGTTT
+GGCTGGGACCTGCCGGACTGGGGAACAATCATGAACGTAATAGTCATCATTGCATCCCAG
+GTCTTCGGCATTGAGTGGATTCCACCCAAGCGGGCAAGCAATGGAACCGGCGGAAACGGT
+TAAAAATTTCAGATGAGATAACGGCTAAAAACAGGCAAACGAGACGCAATCGTTAACTGC
+GTTGGCGCCCGGGAAAATTAGATAGGGCTGACCGGGGGCAACCAGTGAGACCGCAAGTAG
+ACGGGCATAATTGAGGCGGAAGCCGAGTGAATGATCAGGATGGCAACCTGATTGAAAAGC
+GTGTTATGTCGATAGCCTAAGCTCCGGGTCGCGCCGGACACTGGTTTTACCTTATTTCCG
+CAAGGAAGCAGTCTGGTCGTTACTGTACAAGTGGTTTGCCTTATTGGTTTAGCAAAGTGG
+AAACGACAAACCAGGTCTATAGACTGCCTTAACGGGTTAAGGTACCGGGCGCCGGGGAAT
+CGTGGCGCTTTTAAGTGACCGGATGACCAACCATATACCTTTCCGATATGGCGGTAAACA
+GCACCTCCCCAAGGCGTAACGGTCGTCCGGTTTCTTAACTTCCCCGTATGGGGGAGAAAA
+ACAATCCGTGATGCCGGAGAAATAATAGCATCTATATTTTCGCGGCTGTATGTCGGGATT
+CAAACAGGTTGGATCGGTAAACACCAATTTTCCTACCGGTCCAACACCTTTCAACCTTTT
+TCAAGGAGGACATGGTAATGGAATTGGAAGAAAAAGAAAGCTTGCAAGGTTTCATAGGAG
+TGAAAAGGATCAAAGCGCGATCAATGACCAGGCGTGGATACAACGGCTATCGCGGCTGGC
+AACTTCCTGCGGATGAAAACGGAGATGATGAAGGAATGCTTGTCGAGTATGTCGATGGCG
+GTAAATCCAATCATCCCGCACATGAAGGCTATATCAGCTGGTCACCTATCGATGTTTTCA
+ATCATGCTTATCGGCCATGTGATGCCCTTACGTTTGGCTTTGCAATCGAAGCGGCAAAGG
+CCGGAGAGAAGATTGCCCGGAAAGGCTGGAATGGAAAAGGCATGTTTGTCTTCTACCAGA
+AGGGCTACCCGGAAGGAATACCGATCAACAAAAACACCGCGGAGGCAACAAGATTGCCGG
+AAGGAACCGTCTGCAAATTTCGGCCGTATCTCATGATGAAGACAGCACAAAACGACTTTG
+TGCCGTGGGTTGCATCGCAAACCGACATCTTAGCGGAGGACTGGGAGATTATCGAGCAGG
+GAGAACAGAAATGAGTATTGAAACAAAAGAAAAGGCCGCTCCAGGCAAGGATACGGCCAA
+GAATAACAACCACACCAATATTACCATGATTGGATTCAGGCAGCAAGAACTTCACGAGAT
+CGAAAAAAGCCTTGAGGAGATGGACCACAAGATACAGGAGCTTTTCCGTTTCGGAACAGC
+CCATAACCGGGACATCTTCGCCATGAAGCTGGCTAATGAGGTACGGAGAATCAGAGATCA
+GTTGAACTCAGGGAGGCTGATGTGACCATCGAAAAGACAAGCCAGATCAAGGCGGGCGAC
+AACCTTGTGATGGTGATCTACGGCAAAGGCGGTGTGGGAAAGACAACCTTCACCGCCACA
+GCTCCTAACGTGATCCTTCTCGACTTTGAGAACGGCACCAAGTACCTGGGAGCCCGCGGC
+TTCAATGTGGATGTGATCAGGCTCAAGAGCTGGCCGGCAAACGCGGAGAAACAGAAGCTT
+GCGGCCTTGGTGGCCCCCTACCACACCATTGCTCTTGATCCCCTTGGGGAGGCGATGGAG
+AAGCTCCTCAATTCATCGGCGTTAAACGGCCGGAAGTTCCGTCAGGCAGACGGGTCGTTG
+ACCATGGCAGGATGGGGAGAAGCGAAGGCGCAGATGCGCAGCTTCATCAAGTGGCTCCGG
+GATTCCGGTAAGAACGTGATCATCGTTGCCCATGTATCGGAAGAGAAAGACGGGGAGATG
+ATCACCAACCGCATACAGGTTGCAACAAAGCTCAGGGAAGAGATACCCAACATCGTGGAT
+GTTATCAGCTACATGGGCGTGAAGATGGTAGACGACAAGCCTGTTCGCATCCTCTACACA
+CCCCGGCAGGGAGACCAGTTTGACTCAAAGGATCGAACCGGGAGAGTTCCGCTTACGGTA
+CAGGTCAGCGAACACGACGGCTTTAATGACCTGCTCAAGGCTATGGGAATCGGGCAGCAG
+AACATCCCGGAAAACAAGATGCCGGTACCGGAGGCAACACCTACCACATTCCAGGGGCCG
+CAGGACGAGAAGCAAACGGAACCCACACAAAAGGACCCGGACGAGGAAGCGCGAACACAA
+CTCAAGTATCAGCTTGACGGTGCCATTGTCGGGGAACTGGTTACCAAGGCCGAACGGGAT
+GAGGTGCTTGCAAACAGCAAGAAGTACAAGGGCCAGGTGCTTGAGGCCTACATCCAGAGG
+ATCAGCGATGAACTCTTTAATCTCCAGCAGAAGGCAGAAAGCGCAAACAGCACGGTTGCA
+CCTGAGCGCCAGAAAGAGAAAGAGGATCAGCCGCAGGAAGAAGAAGAGTATGCGCCAGAA
+GAACCAGAGCCCGAAGAGCTCGAAATCTGGTAGGACAGGAGAAGGACATGAATATTACGG
+ACATAACCGTTGACGATATCATCGAGGAACAGGAGACGGCAGAAGAAACGGGACTTGAGA
+AGCTCAAAGGCGATATTGATGAAGTGATCAGTCGGATGGAAGCGCTTTCCATCCAGAGTG
+ATGAACAGCTTGCAGAAGCAGGCGAATGGCTTGTGAAGAACAAGCAGACACAGAAGATCG
+TCAAGGACCACTTCGAGCCTGAACGCAAAGAGACCTATGCGGCCTATAAGGCTGTGACCG
+ATCAGATTAAGAAGTACACCGACATTCTGACCAAGGCTGAAAGAACCGTCAAAAAGAAGA
+TGGGAGCATACCAGGCAGAACAGGACCGGCTACGCATCGAGGCAGCGGAAAAACAGCGTA
+AAGAAGCGGAGAAGGAACGGGAGCAGTCAAGGAAAGACGGAAATTCCGCCCCTGTTATTC
+CCCTTCCACCGGAGAAGAAAGAGGAGCCGGTGAAGATTGAAGGGGTGTCCTTTTCGGAAA
+ACTGGACATTCATCATTGAAGAGACCGACAAAATCCCGCGGGAATACATGGTTCCGGATG
+AGAAGAAAATCCGCCAGGTGGTGAAGGCGTTAAAGGCTGATACCAATATTCCCGGTATCA
+AGGTCTACGCGGAAAAGACCGTCAGTGCCAGGACATGAGACCATGACACTTGAGGCACAA
+ATAAACATAGACTTTGCCCCTGAGGAACACGCCTACCGCGTTGACGGCAGGAAAGTTTCC
+AGTGTGACAAGCATCCTCAAAAGTGAGGGGTTCATTGATACCCGGTGGTACAAGCCATCG
+GGTACCTCTCGCGGGGAGATGGTCCACCAGGGAACGGAGGCAATCGACCGGGGCCACCTT
+ACCATTGCACAGTTCCCACCATCGGAAATTATTCCCTACCTCAAAGCCTGGCAGTCGTTC
+AAGGCTGATATCGGGGTGAGTGAGTTTGTGATCATCGAGCTTCCGATCGGCAGCAAGGTG
+ATGGAATACGGGGGCATCCCGGATCGGGTTGCCGTGATCAACGGGGAGTATTGGCTTCTT
+GATATCAAGAGCGGAGCACATGAGCTCTGGCACGGTCACCAGCTGGCCGCCTACAAGATA
+GCCCTTGAAGAGACCTTCGGGCTGAAGGTTGCAAAGCGTCGGGTGGTGCACCTAAAGAAA
+ACCGGGAAGTACTCGATCTGTGGGGAGGACAAGAAGATCGGCTCCTTTGACCTTCCGGTC
+TGGGAACAGCAGTGGATTGCGATCGCGACCGCTCGGCTGATCAAACAGCGGTACGCAAAG
+ATAAAACCGGAGACTGTATGAGTCAGAGGGCAATTGTCATTCCAGCGGCCGAACGGGTGA
+AAACCGGAGAGCCGGGAGTCGTTTCCTTCCGCGTCGGAGAGGTATTCCATGAGTACCTTA
+TCCACCTTTTCCGGTACCAGGAAACAGAACGCAAGTCACCTGCCCCCTATTACTCACTCA
+AGATCGACACCCCGAAGCGGCCGAGGACAACCGGAGAGAACAGCCAGAACCATCATATCA
+ACGGCCACTGTCAACAGATTTCCGTTGATACCGGCCAGCCTTTCGAGGACGTGAAGAAGT
+ACGCGAAACAGTTCGCGCTCACCATGGGCTACCCCATCCTTGAGGACGAGAACGGGGAAC
+CCATACACGACCTATGGGGAAAACCGCAAGGGATCAGTGAGTCTGATTGCAGTACTGAGG
+ATGCGGCAATCCTCATTGAAGCGATCCACCAGATAGCGGCGGAAATGGATATCAACCTCA
+TCGAGGACTAAGGAAGCACCATGGGAAAAACAGCAACAGGGACAAAGCAGAGAGCAAAAC
+CGGTACGAAGACAGAAGACACGACGACAAAAGGCCGTAGATGCAGCAGATCGGTGGTTCA
+GTCTCTACATACGACAAAGGGATGGGAACCGTTCAGTGACAAGTAACTGTACAAGGAACC
+TGACCTGTTCACACCTGTTCTCACGAAGATTCTACGCTACCCGCTGGGATGAGACGAATG
+CCTATTGCCAGACGGCCGGAGAGAACCTCTACCACAACCGGGATGCAGGACCTTTGACCA
+GTTACTTTCTGGATGTGCATGGAGAGGAGGCCTACCGGAAGCTGTATGAAAAGGCCCGAT
+CAGGGGCCAAGTTCAGAACAGAAGAGATCGAGGATATCGCTGCTTACTACAAGAGCCGGT
+TTGAGCGGCTTACACAGAAGCAGCGCGACTTTTTCAATGTTATTTAGGGAGGGACTATGG
+CAAACGATATTACCAGTTTCACGGCAGTCGGACGAGTGACCCGTGATGCGGAATTCCGAT
+ACACGAACGGTGGAACGCAGCTGTGCAAGTTCAGCATTGCGTCGAATTATAGCAGGAAGG
+TACGGGATAACTGGCAGGATGAAGTCAGCTACTTTGACTTCACCCTATTCGGAAAACGGG
+CGGAAGCACTTGCTCAGTATCTCACCAAAGGTCAGCAGGTGGTCGTTTCGGGCCAGCTGC
+GGCAGGAGCGGTGGGAAGACAACGGACAGAAGCGAAGCAGGGTTGCGTTCTTCGCCCAGG
+ATGTACAGCTGATCGGGGGAAAGCCCACCGGTCAGAGTAACGGGCAACGGTATGGAGAGG
+CCCCTTACCAGGGTCCGCCGCAGAACCGGCAGCAAGGCTACCAGCAGGGGCCACCGCCTA
+ACAGCGGCTACCAGAAGCCGACGAGCGGCTATGACCAGTGGGGACATCCGATAAACCCCG
+GACCTAATAATCAGGGCCCGGAACAAGAAATGAACTTCGACGACGATATACCGTTTTAAG
+GACGAATTACCATGGCACGACGCAGAATGATCGACCCGTCAATTTGGAGCAATGAACAAG
+CGCAGTGTTTATCAACATCGGCGTTCAAGGTGTATGTGTTTCTGATTTCACAGTCCGATG
+ATGAGGGGTACCTGAAGGTATCCCTCGTCATGTGGCCCTCATTGATCAACCCTGTTGACA
+GGAGCTACACGAAGGACCAGCTGGTAAATGACCTCAATGAAATACTCTCTTGCGGCTTGG
+TAGAGGCCTACCGGTTGGGTGATGAGGTCTATGTGAAACATCCTCATTGGACACTTTACC
+AGACCATACAGAAGCCTTCAGGAAGCAAATACCCGAAAGATGGGGAAAGAATCTATCGCA
+TAGAGGAATATCGTAATGATATCGGTACGGTACCACATGAATATGATACCGATACCGTAC
+CGGTACGAGAGGAGTATGATACCGATACAATACCGGTAAACGACCACTCTCATTTCGTAC
+CGCCTAAGTTAAGTAAAGAGAAGTTAAGTAAAGATAATACTAAGATACCTTCGGTAGCAT
+CGGCAGAGCCTCAGCCGGAGCCTGGAGAGGCGACAAAACCGGCAGAAGAGCCGGAGCCGG
+AAAGCTCCCCACTTCCCCCACCCGATTCGGAACCCGATCCAGAACCTAAGCCGGAGCCCG
+AACATGAACCCGACATCGAACCGGTTCTTGAGCTTGAATGCCAGGCACCGAAGAAGCGCA
+AAGCCAGCAAGGGGAAAGCACCTACCGCCGGGAAAGAACCGGCAGACCCGCTGTACCACT
+CGATCAAGGATTCCTTCCTGGCTGTTGTCGGGGACTTCTCGAACTGGGGCAAGGAAGGCA
+AGGCGATCCACGGGATCATCGAGAAATGCTCTCGCGCCTCACCGGAAGACCCTGCCGGGT
+GTGCCGAGCGGATGATCGGGGAGTTATGGCGGCTAAAGAATTCGGCGGATCGGTTCTACC
+GAGATCAGCCCTTTGTTCCGTCGACCCTCAACGCTTCGGGAATCTGGGACCGGGTAGCCG
+AGCAGCTGAAGATCACGGCCGATGAGCTGGAAGGTGTGAGGATGTGGGAAGCGCTTGACC
+CCTACGGGGTGAGAGGAAAGAGCAAGCAGGCGGTGGGAGGTTAAGCGTATGCAGTGGAAC
+ACCAAGACATTCATGGCGATGTTGCAGCAGTACTACGGCAAGCTTTCGCCGATCCACGCG
+GGAGCGTTAGTCGACTGGCTCGATAGCAAGCAGTTTTCGGGTGAGTATCTCAAGCGGCTG
+TACCAGGAGATAACCGAGAGCTACTCAACGAAGTACGGGAGGCCCTGTGACCTTGCGATC
+GTGAAGGAAACGCACATGGCCCTTGCACCTTCGTATGTGCCCCCTGCCCGGCAGCTTGAA
+AGTGATCAGCGGATGATCGGGGAGCGGTTTGTTGAGCGGGAGGAAGGCGCAAAGCTGTTT
+GCGAGCATCATCGAGAATCTGACGAAGAAAAAGCGGCGGGTGAAACCGGAGAATAAGTCG
+AGGAGAGTGCGGAATGACATTCACAGATAAGTACCTGAAAGAAAGGATTCCGGCGGTAAA
+GACGGTTTTCAAAGGGGATGATCGTATTGAAAAGGAAATGGTACTTGAGATAACGGACTA
+TGACCGAGGGATCATTGAAATGAAAGCCGGTAATGCGTATTACCGGTTCCGGCATGTTGA
+TCTTGAGCGAGCCATTACATCGATGCAGGTGCGGCAAGAGGTAAATGCATGAGCGAGTAT
+GGTGTAAGAAAAGTTTGCGGGAATTGCAGAAGTTTCGAAAAGTGCTTTGCCGAATCAGAG
+GAGCTTATCGGAATCTACTCCCCGGGTTGTCTTGCGGCTGATAAGGAGGAGACGCGGTAT
+ATGCCTGCGTGTGGAGACTTTGAGCCGATGATGAAGCTGGTAGGGCTGTTAGGAACGGAA
+GATGAGGGCCGGTAATGGGACGTAAGCTTGCCATTGAAACACATCCACAGCGGCACGAAA
+TAGAGCAAATGCTCTTGAATAAAGTACCGGTGTCCCACATTAGCGAGCAATTCGGTGTCA
+GTCGCGGTGCAATTGCCCGGTTTCGAGACAGCTTTGAAGGCAGTTTCAAGGCAATTGCGA
+CGAAACGAAGTGAATTGCTTACAAAATCGGTTGATGATCTCGAGGAGTTCCAGGAGGACC
+TTCGGGGTGCGGAGAGTATCTGGAACACCTTAAAGCGGATCACCCAACGGGCATGGATGG
+TCCTTGACGCCTGCCATGCGTACCTGCAGGACCCGGACGATCCAGGCAAGTATGACCTCG
+GCCCTCGGGGAGAAGATATCACCGTTGTGCTGACCGAGTACGATGATGAGGGGAAGCTGC
+AAAAGGAAAAGCGAAAGCTCTCGGATGTGATCGCGGAGATTGAGGGGACGGGGAAGAACG
+TTGCCGAGATCAACTACAAGATCGCGGATCCCCGAAAGCTGATCCTTGATACGGCCAATA
+CCCTGAACAAGCAGCTTGAGCTTATCGCGAGGCTGCAAGGAGAGCTACAGGACGTGACGG
+TGAACATCACCCAGACATCTGAATGGAAAGAGATACAGACGACCATCCTGCAAGTGACAA
+AAGACTACCCAGAAGTGAGGGAGAAAATTGCCAGTGCCTTTACCGCCGGGGATGCTCCGG
+CAGACGTTAACTGAAAGCCTTCGGGCGACACTCGCTCCAAGGCAATACCTCCGGTCTCTC
+GGGTTTACGCCGTTCCTGTGGCAGGATTGGGCCCTTGACCAGTCGCTTCGCAGACTGCTT
+TTGAATTGCTGCCGACAGGCGGGCAAAAGCACGGTCATAGCTGCAAAGGCGGCACACAAG
+GCGAAGTTCTTTTCAGGCAGCCTCATCATTCTGGTGTCCCCTGCTCTGCGGCAGAGCAAG
+GAGCTGATGCGCAAGGTAGAGGACTTCATTGCACTGGACAAGAGCTTTCCTCCGGCAAGT
+GAGGAAGACAACCAGCTGACCAAGGAGTTTAAGAACCGTTCCAGGATCGTGGCGCTTCCG
+GGAAGTGAGAAGACGATCCGAGGCTTGAGCGGCCCGACCTTGATCATCATCGATGAGGCG
+AGCCGAATCCCGGATGAGCTGTACAAAGCAATCAGGCCCATGATGGCCGGAGCAGATACA
+GAGCTGGTACTCATGACCACGCCTTTTGGAAAACGTGGTGTGTTCTATGATGCGTGGTCA
+AGAAGTAAACGCTGGACAAAGATCGAGGTCGTCGGCCGGGACATTCTCGGACGGTTTCCC
+AACGAACAGGTTTACGCACAGCTGAGGCGGAAAGACGGGATTAAGGCCTGCTATTCGCCC
+CGCCATAGTGTTGAGTTTCTCGGGGAGGAGCTGGAAGAGATGGGCGAATGGTGGTACCGC
+CAGGAATACGGCGGAGAGTTCATGGACCCGATCGATTCGGTTTTCAATATGGAAGATGTA
+CGGGCGGCGATTATCAACGATACACCGGCCATAAGCTTTGCGCCGATTATCGAGGAAGAC
+GTACCGGCGCTTCACTTTTAGGGACATGGGAGGGGAATAATTGATCCGAAACATTGTATC
+TGTTGACCTTGGCCAGCAGTTTGACTTTACCGCAATCAGCGTGACGCAAACACGTGAACA
+GTGGACGACGGGGCCGAACATCCCGGCTGAGTGGAAGGCGACAAGCGGGGATAGGCTTCT
+GACCTATTACTACTATCTGCGGTACCTGGAACGCATGAAGATGAAATACCCGGACGTTGT
+CCGCGAGGTCAAGAAGATCGTTACCGCGCTTGAGAATGACCAAACAACGGCGCTTTTGGT
+GGATGCAACGGGCGTGGGCCTGCCGGTGGTTGAAATGATGCGGGAAGACCTGCTTTTGCC
+GATACCGATCATCATTACCGGCGGTAACAGTATCTCAGAGCAGAACGGAGGATTCCATAT
+TCCCAAGCGTTTCCTTGTTGCGGCATTGCAGGGACTCTTTGAGACCGGCCGACTGAAAAT
+CGCTTCCGGTATCGGTTGCCTTGCAGAGTTCATGCATGAGATCGAAAACTTCCGGGTGAA
+GATCACGCAGAGCGGGAACGACACGTATGAAGCATGGCGGGAGAGTGACCACGACGACCT
+TGTGATCAGCGTTGCGATGGGAGCCTGGTATGCGCAACGGGAAAGCATCAACAACATTCT
+CATACGAAAGAACGATAAGGAGGTGCTGGATGAGTACGATCCTCTCGATAGACTGTAAAG
+ACCCAAAGGTCAAACGATCGATCCAGTGGCTCCTGGCTGAGCTGGGAAGCCTCTCATACG
+GGGAGATCATGCTCTCGTTCACGCTCCACGACGGACAGGTGAAGTCGATCGACAAGGCGA
+CGAAAGAAAAGCAGAGGAATGCTTGATCCGGGAATTCCGGGAGGTATAAGATATGGATAT
+GCAAAAACCATTAGACAAAAAGATCAAATACGGATTGTGGATCGCATTCGGATATGTGTG
+CGGGGTGCTCCTCATCCTTGCGCCTATTCATGAGTTTGGCCATTGGGCCATCGGTAACCT
+CATAGGCTATCGGACCTATTTCTATGGCTGGACCTATGTAAGCCATGACGGATATCCGGA
+CACACCATGGCAGGGATACGTCGAAATGGGAGCAGGCCCAACCTTTGAGATTGTGGCCTA
+CCTTGTGATCTCGGCACTCCTGGCGTGGAAGCGAAAGTATGGTGGAGCCTTTTTCTTCTT
+GGGCCAACAGCTCTATTTTCCGATCAGGTTCTTTCACGATGATGAGTGGTACTTTCTGTA
+TGCGTATGGGAAGGCATTGATCCCGGCGAGCATTGTATTTGCCGTGATCATGTGCGTGGT
+GATCTGGGCAAACATGGAGCAGGACAAGGTACGGGCTGCGAAGCTTGCACGGGAGAAAGC
+GAGAAAACAGAAAACGAACGAGCGGCCCCTTGTCAAAGAAAGAGCTTTGAGATAGAATTT
+TTCATAACATAAGGGCGGGAAACCGTCGCGATCCGGCCGTATGCCGGTCGTCTACCTGAA
+TACCACAGGCGGCGAAGTATCTGAGTTGACATTGTAACAGGTGTCGGCGCAGGTACTTTG
+CCGCCTTTTTTTGTGCCCTTTTGGTGGCACTGGGAGGGATTATGCCGATTAATGCGCTTC
+GCAGGCGATGGAACGAGGGAGTTGTGGCAGACAACGCCTATGACAAACAGAGCGGTGATG
+CTGGCGGTGGTTACACCTGGCAGGAACGACGGCAGCTTAGAAATGATGGTGCTGAAGACG
+TCTCCAACGAGCAGATGGGAAGCATCCTGAAACAGGTATACGGTGACGCTTCGGAAGAGA
+CCTTCAAAAAGGCCGTGAAAGAGTATGACCTCTCCGATCTCAACCCTCAGCGGCAGAAAA
+ACTTTCTTTATGAAAAGCTTCAGGAAAAAATCAGGCAGGACCGGGAAAACAGCGCGGAGC
+GGGTGTGGTAAGAGGCTGGCATGGCTGAGGAAAAGAGCGCACAAGAGATCATCCAAACCT
+TCGAGCAGCTCAAGCAGGAACGATCCACGTGGGAAGATGAGTACCAGGAGATAACCGAAC
+AAATCTTTCCCCGTCGAAGCGTATGGACGGACAACAAGGGCCGCGCTTCCCGTTCAGGCG
+GGCTCATCTATGACGGCACCCCGATCTCCGCTCTCAACCTCCTTGCAAACGGGCTTGTCG
+GCTATCTCGTATCACCGGCAACTCGGTGGTTCAAACTCAGGCCGACACAAGATGAACTGC
+TCCAGATACGTGGGGCCAGACAGTGGCTTGAGATCGTTGAGAACCTCATCTATGACGAGT
+TTAACAGGTCCAACTTCTACGAGGAAATCGTGGAGTACTTCCGCGACGGCGGCAGCATAG
+GGATCGCAACCATTTATGTGCAGGAGGACATCGGCCGCCGAATGGCCAATTACTCATGCA
+GACACCCGAAGGAAATCTACATTGCCGAGGACCGCTTCGGGTACATCGACACCGTGTTCC
+GCCGATTCTTCCCAACGGCCAAGGAACTCGAAGAAGAGTTCGGCCGTGAGGCGTTATCGG
+ATGGCGTGCAAAACCTCTGTGAACGCAGTCCCTATGAGCGGGTGGAGATCATCCACGCGG
+TTTACCCTCGTAAGAAGCGCAATCCCAGAAAGAAAGGCAATCGTGACATGAAGTTTGCCT
+CTGCCTATGTGGAAGGCGGAAGCAACCATAAGATCAGGGAACGGGGGTACGAGCGGCTTC
+CGTATGTAGTGTGGCGCTGGTCGACAAACTCCGATGAGGTGTACGGCCGGGGACCCGGAT
+ATGATGCGCTTGTCGATGTGAAACGGCTGAACAGGCTGAGCCGGGACATGCTCAAACAAA
+GCCAGATGGCCGTTGATCCTCCCCTTGCTGTTCCTGAGAAGATGCGGGGAAAGGTCAACT
+GGGTTCCTCGGGGACTCAACTATTACCAGAACCCGAATGAGGTTCCTGTTGCCCTGAATC
+CCGGTATGCAGTTCCAGGTCGGCCTTGATCGGGAACAACACATGCAGCAGATCATCGAGA
+AGCACTTTATGACCGACTTTTTCCTCATGCTCGAACAGGCACCGAAGGAGATGACGGCAA
+CCGAGGTAATGGAGCGGCAGTCGGAGAAAGCGGCGGTACTCGGTACGGTGATCGGCCGAA
+TCAGCAGTGAGTTTCTCGACCCGATCATCGACATAACCTTTGATATTGCCATGAAAGGCA
+AACGGCTTCCCCCTCCACCGCCGGAGTTTGCCGAGGCCATGTACAAGACAAACGGCGGAA
+TCGAAATCGATTACCTGGGGCCGCTTGCACAGGCACAAAAGAAATTCCACGTTACGCAGG
+GAGCACAACAGAGTCTCAACGCCGTTGCTCCCATTATGCAGATCAACCCGCAAGTCGCGG
+ACCTCATCAACTGGGATCAGCTGACAATGGAAATACTCCACGCCTATGGCATGCCGCAGA
+AAGCCATTGTCGACCTTCGGGATGTGCAGAAGATCAGGCAGCAACGAGCGGTGCAACAGG
+CTGCGGCCATGCAACAGCAGCAGGCACAGCAGCTTATCGATAAGTACCCCATGGACAAAC
+AAGCCCCGCCGGACTCTCCCATGGAGGAAATCGGTAACCAACTCCGTGATGCCCTGAAAG
+GCGGAAATGGAGGTGCGGCGTGATCAGATGGGGAGAGCCGGTTTCACCGGAAGCAGAGCG
+TATCAGAGAGACCTACCGGAGGACCTTTTCCACCCCGGAAGGGAAAAAGGCACTGCTCTA
+CATCCTCACCGACCTGGGCTTTTTCGATGCGACGAAGGACGAAGCCGCACAGGCCCTTCG
+CAATTTTGCAGTCAGACTGCTTGAGCAGATGGGAATACTGCATGAGGCCAATGCAGAAAC
+ACTGGTGGCGCAACTTCTCAAGCTTGCGCCCTATGACTTACAGACTCACCGGAAGATCGG
+TGAACGGGAGGACTTTTCATGAGTGACATTATGGACCCTCAGACGACTGGGGACAATCCG
+AACAACGATAACGGTGCCGGTGCGAATGCTGGCGCCGAAGGGGCCGGAGAACAGCAGCAA
+GCGCAACAGACACAGCAGACAACGACTTCGGACCTTCCCAGGTGGATGTATCAGCTTTCA
+GGAGACCTGCAGAAAGACGATCGCCTGTCCGGTTTTACGAAACCCGATGAACTGGCGAAA
+GCGTATCTCGATTATGCGGGGAAAGCCGACAAGCTGATTGAGCTACCGGGAGAAAAGGAC
+GCGGAAGGATGGAAGAAGTTTTACGGCAAACTCGGCAGACCGGAGACACCGGAAGGATAC
+GACTTTTCCGGTGTGAGTATCCCGGAAACCATAGAAAAGAGTGAACTTGCCGACTTCCGC
+AACATGGCGCACGAGCTTGGACTATCGAAGGCCCAGGCAGCGAAGCTACTCGAACACTCC
+ATTGCCGACCTCAACAGCATCACCACCAAAGCCGACGAAAACGCGAAGGCTGAGGCACAA
+AAGAAGCTTGATGAGAAGAAGCAGAAGATCGGAGCCCTCGTGGAGAAATACGGGGACAAC
+TTCGAGGAGATTGTCACGAAGGCTCATCGTGCGTATGAGGCAGTCGGGAGCAAGGAACTC
+GGTGAGTACCTTGACTCAAGCGGACTTGGTGACGACCCGGTGATGGTCGGCGCGTTTCTT
+TCCATTGCGGAGAAGATCGGGGAAGACACGCTGTTCGGCTCATCCCATGGAGGTGGTCGT
+GACGAAGGCGCCGACTGGTATCCCAACACAAATTTTGACTCATAACGGGAGGGCATATGC
+CTACTATACCCCAGAAAAGTGAGCTTACGCTTGTCGAGCTTGCAAAGCGAATGGACCCCA
+AAGGCAAGCAGGCGGAGATCGCCGAGGTACTCGAAGAGACCAACGAAATTCTCGAAGACC
+TTCGGTTTGTTGAAGCCAACAACGTAACGACTCATGTGTCGTCTATTCGTAAGACCTTGC
+CGGAAGGTTCCTGGCGTTCGATCGGTGGATACACCAAGAGCACCTCCAGTGCTGTTCGTC
+AGATAACCGAGGACGTGGGAATGCTTGAAGCCTACTCCAAAGTAGACAAAAAGCTTGCCC
+ATCTTTCCGGCAATCCTGCGGCGTTCCGCAAGCAGGAGGACAAGGCCTTTATCCAGGGAC
+TTGGAATCCAGATGGCAACCGCATTCATCTACGGCGCCAGGGCGATCGATCCCGCATCGT
+TTAACGGTCTTGCTGTTCGGTTCAACGCTTACGGCATGCCGAACGTAACCAATGCAGGCG
+GCAACGGTGTAAACGAAGGTGTTACCAGCCTTTGGATGGCGCAGCACGATGTCGGCTCGT
+TTCACGGATTCTATCCCAGGGGCAGCAAGGCCGGTCTTGATGTAAAGGACCTCGGGGAGG
+ATACGGAAACCACGGCGGAAGGAGAACGGCAGATTTACCGGTCGCACTTCACCTGGGACA
+TGGGAATCATGATCCGCGATTATCGTGCGATACAGCGGGTTGCCAATATTCCGGTTTTCA
+ATGATTCGGAAAAGTTCGTGAAGTTCGACAACTTCATGATTGCCGCCCTCAACAGGATGC
+CCAAGCGCGGCCGTGGTGCTGTTATCTACGCGAATCTCGACATGTTCACCATGTTCGACA
+TTCTCGCAAAGGACAAGAGCAATGTCGCCTATGGCTCTGCGGAAGTGTTCGGCAAAACCG
+TTACGACCTTCCGTGGTGTTCCCATTCGACTCGTTGAGGCAATTTCTTCCGATGAAGACG
+TTGTCACCGAGACTGCGGCATAAGGAGGTTTACACAAATGATTCTTGATAAACGACTGAT
+GTTCAGCGAGAACCAGGCTATCACGGCCACTGCCGTGAGCACAAACTCGCTCACCTTCGA
+GGTCGATGATCTTGGCACGGGCGAGCCGGTTACCCTCTGGACGCAGGTAACCGAGGCCTT
+TACTGCTGCCGGAGATGCGAGTCTACATATTGATCTCCAGCATTCCGATGACGGGAGCAC
+CTGGAAAGACCTTGTGCCCTCCAGGGCCTTTGCGCTTTCCGATCTTGGCCTTGGGGCGAA
+TCCCTTGAAGATCAACGTACCTGCCGGGGCAAAGAAGCACATGCGGCTGAATTACCCGGT
+AGCAGATGGTCCCATGACCGCGGGGAAAATTACCGCCGGGCTGAAGCGATAGGAGGTGCA
+ATGATGAAAGTAAAATGCCTGGTATACACCTATCACCTGGGGCGTATCTGGCGCGAAGGG
+GTCGTCTATGATTATCCCGACGACAAGACTCCGCCGAAACGGCGTTTTAAGGTACTCGAA
+GCGCCGAAGGAAAAGGCGAAAGAGAAACCCGAAAACAGTGATCCGGAAAAAGAGAAGCTC
+ATCGCCCGTGCATCCGAACTGGGTATCGGGCCACCTTCCACCCTCTCCCGTTGGGGCGTG
+GATAAGCTGAAAGATGAGATCGGCAGGGCTGAGGCTGCCCTTGCTGCGGCAAGTGTCGGC
+GGCAGTGGAGCGTAAAGGGTCGCCATGACTGCGCTGGAACTCATCAACATTGCCTTGACT
+CGGATGAATGAATCGAAATTGACGAGCATCACGATCGACACCTATGTTGCCGACCTTTGC
+AGGCTCTTTCTCAAACCTGTTGCCGATGAGGTGACCCTTGAGGAAGACTGGCAGTTTGCG
+CGTAAGCGGGAAGCTTTGAGAACGGACGATGAGGGTGAGAACCAGACAGATTATGGATAC
+ATGTACCGGCTCCCTGCGGACTGTCTTTTTCCGAGGCAGCTCCGCAGTAAGGGGCAGTAC
+GAGATAGAGGACGGACGGCTTTACACCGGGGATGAAGCGGCAGTGCTCATCTACACAAGA
+TCAATGGTTGAGATAGCGCATGATGACGAGAATGGGCTCGATATTCCCGTACTTGTGACC
+TCGTTCCCGGTGACCTTTGCCCAGGCGGTTGCTTGCCGTCTGGGGAGCCAGATCGGCCCA
+AAGATATCGGACAATTTCAATCTCGCCTCCGCGCTCGGCCAGGAATACATGGTCATGCTT
+GAAAAGACCAAGGCCTTTGACGGCATGCTTTCTCCGGCCGAGGATGAGGCGGTAGAACTC
+TGGAGTGATATTCAATGAGCCGCCAGAGAATCCTTGTGACAGATTTTACCCGTGGGATTG
+TCTCTCCTCGGATGGTTCCCAGAATCGACCAGACAAAGGCGGTGTCAGAACTTACCGGCT
+TTGTCGTCCTTCCCGACGGTGGAATTCGGCGCCGGGAGGGGACCATCTATGCAAGGCGAG
+GGCTTGGGGTGCTTCCGACAGACTGTGAAGCGGTTCCGGCCTTTACCACCTTTGACAAGC
+GGATTACTGGAACAGAAACGCTACACCTTGCATGGATCAATGACGCACCACGCCAGCTCA
+ATGTACAGAACATGACCAATCGAACCATACAGAGTGTGGCAAGCGAGAGTCTTGAGGCTG
+GAAAGCCTCTTCTTGATTCGGGGAAATTCAACAACGATCTTGAATCCCTGTACGCGCAGA
+ATATTCACCTGTGGACACCTGGGGCCAGTCATGTACTGGACCTTGAGACCTGGGCCCTTG
+CAGAAAAGACCAGCCAGGAGATCAGCACGATCTATCAGGCACGAATGATCGCGGTAAACC
+GCACCTGGGGAACGGTCTACATGAGTGTCGCGTACATCTATCTTGATTTTGATTCGGACG
+GACACCTTGAGCTTATTCCCGATTTCTACGGATTCGAGCATCCCCGGTGGATCGTTGCCT
+TCGGTGGGGATGTGTATATCGGAACGGACAAAAGCGAGTGGATGCTTACCAGTGGGTATC
+CCTACTTCACCGATGACCTTGGCGGACTGATGATGCAGAAGATTAGCGGGATCGGGGCCG
+ACCTTGCCGTTGTGTTCGGTTCCTCGATCATCCTTGCAAAGGATAGACGGCTTGTCAGGA
+TCGTGTATTCATCGGCCGGGGAATTCCAATCCCAGAGCATGGCGGAGCTTATCGACAACA
+CGGATATCATTCAGATCGATGTGATTGAATACGGAAGCCATCGGTACCTGGTCTTTATTG
+ATCGGGATCGTCGGCTTTGGTGTTTGACCGAGTGCCAGAACACCGGCGTTGCTGCATGGC
+AAATCCTTGCCGAGCATGTCGGCTGGGTGAAAAGCTACGGCCAGGACCTCTATATCGCTA
+TTGAGCGGGACGGAGACTGGAACGTCGAAGTCATTCCCATGGACAACCTGAATTACCCAG
+GGAACCGGTCACAGGGGCTCAAAGACGTGCTATTTGAGCGGAGGGTATACGGCGATTGCG
+GGGGCTTTCTCCGCATTGATCATGATCCTTCGACCGGCTACTCGGTTACCGGCGACAGAT
+TACCGGAACGTCAAACCATGGAAGTCTACCTCCCGGAAGGCCAGTACATCGGCCAAAGAG
+ATACCGATGCAAACGGCCTCCTCATTGGATCGGCCGAAGAGATCGCAACCTGGGCAGGTT
+ACGACGGGAAACCGGTCTACCTCTATTGCTACCAGAGCGGGAAAACATTCACCTCCAGGG
+TGAAGACGCTCCCGCTTGAAATGGGAACAGCAATGGGGCCCGGCCTGGGCGCTCTTCGGA
+GAATCAACCGGGTGATTGTCAGAGTATTTGAATCAAAGGCACTCAGGGCCCGTGCCAATA
+CCGGGCGATGGGAAACATGGGAAAGTGAGGACTTGTTTTCCGGAAATGTAGAGCTTCCGA
+TCGACTGTGCTCACAGTGATCTCGTGCAGCTTGAGATCGAGGCAATCGGAGATAAACCGC
+TGCATATTCACTCAATCCAAATCGACGCAACCATGGGGGACGAATGATGATAGAGCCTGT
+CATAGTGCAGCACATGGTCGCCGAGGCAATGGGAATTGATTTCACAAACGTTGCCGTATG
+TATTCAGCAAGGATGGCTACAGGCCGTCATTGCCGGGGCGGCTCTCGTAGTAGGGGCCGT
+TGCCCAGTATCAAAGTAATAAAGCAGCAAAAAAGGCAGCGAAAGAACAAGCAGAACTTGC
+CAAAAAGCAGGCCGCCTTTAACAAAAAACAGGGCCTACAGCTTTACGGTGATGAAGGACT
+ATACAGGCAGCAAGCCAGCGAAGCCTTGGCTAATACCCAGGAAGAATACGATATAAACAA
+AGAGCAAATCGAATTTTCCTGGGATCAGGCGCAGCAATCCTACGACCTCAACCTCTCCAC
+CCTTGATCACAACAGATTGCGTGCGGATGAAAGCATTGATGATCAGAACTTGAAAAATCA
+GGCTGCTCTCGGTGCCTTTGGCGTCCGTGGCGGTTCCTCCAGAACAAAAGCCAACAAAAC
+GATCGCAGATGCAAGAGAAAATCTTTCCTTTGAATATGGCCAGAACAAAACACAACTCAA
+CATGAGCCTCGAAAGCGCTCAAAAGCAGACTGAACTTGCACAGGAGCAGCTTGACCTCGG
+GATGCAGAAGGCACAGCAGTCGTATGGGTACGCAATCGAACAGGCAGACATGGGCAAAGA
+GGCGGCCCTGAAAGGCTATGAGTTTGCCTCAGAGGGAATCAGCAACCAGTTGCAATCAGT
+ATATGACCAGGCAAATTCCTGGTCGGTTATAACCGCAGGTCTAAGCGGTCTACAATCCGG
+CTTTCAAATGGCATCGGCCGTTAACACTTTTGGACAACAGTATTTAAACGACGATGATAA
+AGTCAATTTTTGGAAAGATTGGTGGGCGTGATAATGGAGGACCATAATGCCTAATGCGTT
+TGATGCCATCTTAAAGGCAATGGAAACAACGGCTATGGGGCTTCAAACATACCAAAGAAT
+TGATGCTCCACGAGTCGAATATGAAGCGACGAAACTCCAGAGCCAGATAAAACTCGGCCT
+CGATTCTTTCTCTCGTGACGCGGAGAAACTGCCGTATGGACAGATACAACAGGCATGGAC
+CGAACGGCAGGAACAGATTACCGACATGATCGGGCAACAGCCCTCGGAAATCCAGTATGT
+CATGAAAAATTGGTGGCAGAACGCATCGACTAGCTACCAGTCAACCATGAACGGGCTTGT
+TGATCAGAAGTACCGGGCACAAGAACTGACTTCGCTTTCCGAGCAAATTGACGAACTTGC
+AAAGGACGGAAGCGATGAATCAATTGCAAAAATCAAGAAGCTTGTCGAATCTGCCAATGG
+AAGTGGGGTTATCGATCCTGGGACGGCGTACAAGCTGAGTTTTGAGTCAATCGCGAAGGT
+CAACTACAACGCCGCCAAAGCCAACGCTTTGCAGATCATGGATAAGGACGGTGTCAGTGC
+AGCCCTTGAGTATGCCATGAACGGAAACGAGAAGCTCTCAAACGACATGCGCATAGCGCT
+ACGAAACGAGATCAAGACCATTTACACCGACCGGGAGAATGGAAGGATTCAGCTTGATAC
+GCAGGCGAACGACGATGCCTCTTCCCTTGCTGAACAAATCCTTGATGGTGAGAAGCCCTT
+GTCTTCAATGGACCAGTTGATTGAAAGCGATACTCGCATGAGCGGCAGAAGTCGACTGAA
+TTGGCGTAATTGGATGATCGCCGTACAAACCCAAAGGGACAAAGAACCCGATCCCGAAAT
+GGCCGCTTATGCAAAGACTGCTCTTAACAAGGTTATGGAGGACTGGGAGAAGAATGGACC
+GAAAGCTGAACAGAAGAACATGCTTTTGCAGCTTTTGACAAATGGCTACATCAACAAAAA
+CACCTATGATGATTACCTCTCTACGATTTCCAAGGATCCCATAACAGAGCCGGAGTTTGA
+CGACGGAATCAAGCTCATCAAATCAGCCTTGAAAGATAACGACGAAGGCATGGAGCAGGC
+CCTTGCCGCCTTCAGGCAGAAAGTCTATGCAAATCGTTACATCGGCGATGAGCTCAACCA
+AAATCGGTGGACCGGCCAGGAGCTTGCCCAGGTTGCGCAGAACATCGCAGCTCCCACCGT
+CTTGAACGAAATGAAGATGGATCAGTTTCACGTCGGAGGATTTAACCTTGACGGTTCCTT
+CTTAAACTCCGTTGAAGAGAACATCCTGAACGCTCAGAACGGAAGGTTTCTCGGTTTGAC
+GGAGGAACATGCCCAGATGTTCAACCAGATTCAGGAAGGCCAGGAACAAATCATCTTGCA
+GCTCCTGCCGGACGGAACCACGATCAACAAGATCACCAGGAACAAAAACGGTCTTCCCGA
+ATTCCACACGACAGTCGGAACATTCATGTTTGCAATCCCAACAGATGAGAATGGGGAGCC
+AACGTCAAAAGACGAGGTCCTCATCTATCACCTTGGTGGCGATCAATGGGCGGAGTATGA
+CCGAAAAGCCGTCAAGCAAGAAGCCGACCAGCGCAATGTTTCCGATGCTACGGCCCTTGC
+CTCAGCAGAGAAAGCCTACCTTGATCAGGAAGATACTCCGAGGCAAGGCATCCCTCGGTT
+TACCGTCAATGACGATTACTCTCCCTTAGAGAAAGAGCTTGACCTCATGCGGCAAGAGCT
+CCTTGTCGGTGGCGGATTTAGTCAGTATGGGAGGCAGTGGGACTCTACCGCAACCCGAAG
+AATCAAAGAGATTGCAGAGCGTCGGGGGCTGCCGACTTCGACCGTCGTCCAGGCGGCAAA
+GAGCGTCGGATATGTTGATGAGGATTTCAAGATCGGCGTTTTTCGATTCTGGCCTTTTGG
+AGGTCGAGAGTGAACATCCTTTGGAAGAAACGGGAACCGGAAAACACACGGGGTGCTGCA
+ACCTCCCCCTGGAAAACCGACGGATTCAGAATCGTGTCGGGCACAATCAATTCTCTTGAT
+CAAATGAGTCAGGAAACCGAACCCACCCCAGGAGAGGCGGTCGAGAAGCTCAAATACAAG
+GATGCATTCCAGCAAATCCTTGAGGGAACGCTCGGCGATGGTTTCTCCGATGAAAGCCTT
+CAAAAGCAGTTCTACCAGGTAGCAATGGCCGCCAAGAATCCAGAGGAAGAGATGGCAAAG
+ATGGCAACATCCGCCTTTCTCTCCCAGCGTTTGAATGCTCCACCCGATGTTGTGTACAAG
+AACTTTGATTTCTACACCGAGAAGTACATGACCACAAAACAGGCGCCGCTCTCAGCTTGG
+GCCGCGATCAAGAATGAAGCGTACACCAGCCAGCTCATGATTGAGCGTGGAAAGATCGGC
+TATGAACTCATGTTTGACCCGGAGAACCAAGAGCTTTGGGACAAGCTGCTTGATATCAAT
+GAGAAGGTTCCGCCACAGGATAACCAGAAACGCTCTGTGCCCATTGAACTGGTAAAAGGT
+GCGGCGAAATTTCTTCCCTACGTGGCGACCGGAGCAATCGGCTCTGCCGATGAATCGATG
+TTCGGTGCAGGGCTTGGCGCTGTCGCAGCCGCTTCGCTGGCCTCTGCCGGGACACTTTCC
+GGGGTGCTGACCGTACCCTCTCTCATCCTCTCGGGCTACCAGATTGGGAAAAAGGTCGGG
+TCAATGGATGAGTATTTCAAGATAAGCGCCGGAAATACCTATGCGGACACCATGCAGAAG
+AAAAGCGCTGACGGGAAAACGGTTCCCGTGGGCATTGCCAGGGCCTTTGCCTTGGCCTCC
+GGGACACTTGCCGGAGCATTGGACACCATACAGCTTGATCGTTTTGTAGGCGGTTCCCAG
+TGGTTGCGTAAGGCCGTACCGCAAGCCGTCAAGAAGAGTCTGCAAGACAGCTGGTTTTCA
+GCAATCCTCGGGAACCCCGTTGCGAAGTTTGCCGGCCGATGGGGATCCTCTGTAGCGGAA
+AGCGTGGTTGAGGAGACCTTCCAGGAGACCATCGAAATGATGGGAACCGAGGTTGCCGTA
+ACCGTTGCGAATTGGGCAAAGAATACGAACATCCCACAGGCGACAATCGACGACTGGAAA
+GATATGTGGATGCAGACCATTCGCGATACGGCGAAGGGAACCACCCTTCTCGCCCTGCCC
+GGCGTTACGGCCGAGAGCTTTGCGGCCGAACACCAGAAGCGACAGTCGGCAAAGGATCGA
+GAGGCCGCCCTTGCCAGCGGAAACGCGGATATCGATCTCGGGAAGTTCAACGACTATGCG
+GCCATTTTTGAGGAAGAGGATCTTCAGAAGAGCACTGAGAAACTGGTCGCCTGGAAAAGC
+GCGGAGCTGAAAAAGGCGGAACAGCGGCTTGCCTCCGACCCCACTCAGGAAAACTTTGCG
+ATGCATGAACTACAGTCGCAGGAACTTGATAGAGCCGAGCTTGAGGCCTCCGTCGCAAAG
+AAAGTGAGCGAGCCAAGAGTTTGGGAGATGACGCAAGACCAGTGGATAGCGCAAAAGCAG
+AGGCTCTCAGACCAAGAGCTTGAAAGCCTCAAGACTTCCATTGCCGCAGGCTTTCCCGGA
+TTCACGGATCAAGAGCTTGAGGTTTCCGCAATCGCAATGGATACCATTGCAAGAAACTTC
+GGACAGACCGGGACCGCTTTACTCGATACCATGCTGACGATCGTACCGGCAGATGAAGGG
+CAAGCAGCGGTTGAAACACTTTTCCCGGGTAAGAGCGTATCGCAGACAAACAGTGCCGCT
+ACCTTTTTCCGAGATGCAGAGGGGAAGCTCCTTTCTCCGACAGAGGCCGCAAGGGGACAG
+GCTAAGGCCTTTATCGCTTCCCTCTCTTCTCCAGATTTGTCGACCTTTCTGCATGAGTAT
+TTTCACTTTGCCGATGTCATGCTCATCTCTCAAAGCCCGGAGCACCGACAGCTCTTTTCA
+AAAGCGCTTGGAAAGGATTACTCACAGTTTACCGATCAAGACCGCGAATACCTTGCGTAC
+ATGTTCGAGAAATATCATCGAGACGGTACGGCTCCCACTCCTGAACTCAAAAGCTTGTTT
+GCCAGGATCGCAACGTCACTCAAGCAGTTTGTAGAACGGATGGTCGGCCTCAAGCCGATG
+AATGAGGATCTACGCAAGGCCTATGATGCGCTCTACTCCCTGAGGTCGGAGGATATCAAG
+AACGACAATCCCGATCTCAAGGAAAAAGTGGTACCAATCAAAAGGTATGCACTTTTTCAA
+GCAGAACCAAACGAACGGGAAGGCTTTCAGAGGACACTAAGAGAGGCATTTGAATATAAA
+GGCCAAGGTGTTATTAAGCTTTCAAATCGAACGCCTGAAGCTTTAAAAGCATCTGGAGCA
+AAAGACCTTCCTATAGTCCTTACAAGAAAGAGTCTTGAGCATATCAGAAAGGACCATCCC
+AATATACCAAAATTGGTTTTGTTATCAATGCTTGATGATATTTCCGATCCGGTAATGGTA
+TTTGATAGTGCTTCGAATACTGAAAAAAGAAAAGGATTTGTCATTGTAACTAATCAGATA
+GTTGATGATGCGCCTGTAGTTATTGCTATGCATTTGGAGGTTGGGAAGCCTCAATGGCAA
+ATACATAAAATAGCTTCCGAGTATGAAAAAAACAGTTATAAAACTGTCTTTTCGAAATGG
+GTAGATCAAGGTCTGCTTCGGTATGTAGATAAAGAAAGAGCCCTGAATAATCCACACATC
+TCCGCCGGGCTCCGCTTGCCCCTGGAGGTAGATAATTCAAGACCCCTCTTAAATAAGGTA
+GTACTGAAAACTGACCTTGTCAACAATAAGCAAACAAAGCCACTTTTCCAGGCTCTTTCT
+CCCTTGCAAAAGCTCAAGCAGAAATGGGACCAAGAAATCGAAAAAGCGGAACAGGAGCTT
+GCAGAGGCAGAAGACCGGGTAAAGGCCGGAGAATCATTTTCCGTTGTCGACAAGGCCCTT
+GAGCATCTGCTTTCCCTCCAGGAAGAACGCGAGCTTGCAATCCGGGATTACGAAGCGAAC
+CGGATGACGGACCATGATGCGTATTCGGATGCCGTAGAAGCCTCGGTACAAAAGACGGTG
+GAAAACGGCGATTGGGTACCGGATTCCCAACTGAAAGATTATAGCTCGCAGAATTGGGCC
+CGTGATGAAATCGAATACCGGCAGCAGGCCATAGAGGATGCTGGAAAGTATGCCGACAAA
+GACGAGTATATCGCCTCTCAGGTTCTTTCCGACAACCTCGAAGACGGACACACGCCGGAG
+TACTACGGGAACATCTTTGATGCCTCCCGCGAGACAGAAGCGAATCTGACCGGCCGGGAA
+GCAAACTATCGCTTTATCAAATCACTTTCTGCAGATTACCTTTCCTCTGAACTCCTTGAG
+GCTCTGCACGTGTTTGGAAGCGATGGCCTTTCCGGCTGGCATCCTATAGTAAAGAACGCA
+GCCCTTAGCCTTAAAAAAGGCAAGAAGCTTTCACAGGCCCTGTACAAAAAGGTTATGGAT
+CAGATCAAGGCCGATCCCGAAGTCTACCGGATGAGTTTTGCCGAAGCAGCTCAGGACACC
+GAAGGAATGCGACAAATTCAGTGGGAAATCGAGCACTCAGAAGAAACAGAACTCGAGAAA
+CAGCTCAAGGCAAACCGTCAGCTGCGCAGACAAAACGAAAAGCTCAACAAGTCGGTTGAG
+GCCTTAAACCGCGAAATCGACCTAACAAATAGTGTCCTCGGCGATTACAAGCGAAAGCAA
+GAGGGATTGGAAGAGGCTTTCCGTTCTGCTCGGGAAGAAGCGCGAAAGGGTGACGTTGAA
+AGTCGAAAACAGTGGGTAAGCCTACTCTCTGATGCAAGAAAGGAAGCGTATCTGCAAACG
+CGCAGGGCCGTAGCTGATACGAAGCAGAAAATCCGAGATATGCGGGATGCAAAGGCCTTC
+TATGAACGAATGATAAAAGCCATCATGCGACCGGCCGGACGCTCAATTGCCTATGATCAG
+CAGGTCCAGATCAGGGAAATACAAGGCCGGTATGTGGCCAGGTTTACCCGACGAGAAAAG
+GAAATGCGGCAGGCATACCGGAAGCTCCTTTCCGACGCCGGTATCGATCCACGAATCAAG
+GAAGCCATACAAGAGAACCTGAGTAAGCAAAGCCTTCGCGATCTATCTCCGGAAGAAATA
+GAGAGCCTGCACGCTGAGATTGCGGCCCTGAGAACAAAAGGGCGTGAAATTCGGGAAGCG
+CAACTTGCCACTGAGCACATCACCAGGCAATCAGCCATCCAGAACGTGCTCGAAACACTG
+GGCTTTGAAAAGCCGGAAGAAGGGCTCGGGCTCAAGAAAACAGAACGTGGACGCAATAGC
+TCTATCTTGCAGAAAGAACGCCTGACCACCCTCCTTCCGTCTCATATCGCGGAGATGTTT
+GACGGAGGCAAGAAAGGCTCGTTTTACCGCTGGTTGATCGTTGAGGTTGAGAAAGCAAAA
+TCCGAAGCAATCAACAATAAAGACCGAAGGATGAACGCCGGGTATGAAGAAATGAAAAAG
+CTCGGCATCAAACCGAAGGACTTGATCAAAGAGCGGAGCATTGACGGGCTCACCTTCCAG
+GTTCAGGAAATCATGGGGCTATACGTCTATATGCAGAATGAATCCGAACGTGAACGACTT
+CTGTATGGGAATAGGATAAAACCGGAAACCATAGCAAAGGCAATCAAAACGCTTACACCG
+GAGCAGAAAGCGTTTGCCGATTGGATGATCGACTCTTTTGAAACCGACTATTCTCGTTTT
+GAGTCTGCATTCATCGCCGACCAAAATACAGCAATGGGGAAAGAGAAACGCTATTTTCCC
+ATGATGGTGAAAGACCTCCAATTCGATACGAAAGCACAGGAGATTGCCTCTGATTTACTC
+TCCCGCAGCCATGCCGTAAAAAGCTTTGTTTCAAGAGGATCAACACATAATCGAATCAAA
+ATAAGCAGAGAGCACCAGCCCTCCATGAGGCTTGATGCCTTCAATATCTGGGCAACAAAT
+GTGGATCGCCAGGAGGACTACATCAATAACGGTCTCCTTGTTAAGCGGCTGCATGCAATC
+TTCGGTAACCGGGAGGTCCAGGAAGCCATCATACAGCGCTATGGTAAGGATGCGGCAAAC
+TGGCTCAAGGATCAGATCAACGAGATTGCAAAGCCGCTTGCCGGAGTTAAGTATTACGAG
+CCGATCATGCAGCTTTCGCAAAAACTCCGTTCACATGTCGGCTTGGCCGCTCTTGCCTGG
+AACGCACTCACCCCCTTAAAGCAGTTTCCTTCCCTTTTCCTGGCCATGGGCCGGGTTCCT
+GCAGGAGAACTCCTTGCAGCAAGCGGAAGGCTTATCGCTTCGGGTACCGGGCTGGTTAAG
+AAAATGCACGAGCTTGATCCCTATATGCGGGCCATGGACTACGACCCGGTGCTTACGGAA
+ATGAGGGAAGCGGACAAAAACCGCTATGAAAGATTTGTCACCAAGACTGGAGAGCTTGGG
+ATGAAAGGAATCTTTGTCGTCGACAAAGCCGTTAAAAGCATTATCTGGGATGCTGTCTAC
+GAGCACAATCTGAAACAGGGGAAGACACAGGATGAAGCGATACACGAAGCACGCAGGGCC
+ATCATTGAAACGCAGCCAGGCGGATTTCGTGAGGACTTACCCGTTGTTGCCCGTCAGGGT
+GAGTTTTTCAAATGGATGACGCTTTTCAGCTCTCAGTTGCAGAAGCTATACAACATGACA
+ACCTATGATATTCCCCAAGCCGTCAAGCAGGGGGACATCGCCACGGCACTTCGTATGAGT
+ACCGGGTATATCATGGCTGCCGTTTTGATCGGGATGATTAACAAGAAAAGCACGCCGGAA
+GACGCCAAAGATGCCGGAAGCATGGTCCTTGAACAACTGGTCACATCGATCCCGATTCTT
+GGAAGCCTCTTTGTGCAGGGGGCAAAAGGCTGGTCGTCAAGCAATCCCGTGACGGAAACG
+GCCAACCAAGTCGGAAAGGTTATCAACGCAATCGGAAAAGATAAGTCGGATGAGCAGGTC
+ATGAAAACGGTCATGGATGCTCTGGAACAAGCTCTTTTCTTGGGAGGACTGCCGACGGTT
+CAGGCAAACCGGATGATCGATTTTGCCGAGACCGGGGATCCCTGGGAAATTGTGGGAGGA
+CGGAGCAATGAGTAACGTTGAGCTTGAACTTAAAGGCCTAAGAGCTGCATCACTTACCAA
+GAAGGAGTACGAACAGGGGTACGATCGGAGTGATGCAGACGGTAATAGCATAGTCACGAC
+AACACCACAGGCACCGGAGAACCTTATCGTTTCAGCACGAAATCGAGTGGTTTCGATTAC
+GTGGGACAGGCAGGAAAACCTCACTCCCCCTCACAGTTACATCATCGAATGGTCCCTTGA
+TGAGGAGACCTGGAATAAAGTCGGCGATACCACCTCCAATCTGTTTATTCATGAGGGATA
+CATAAAAACAGTCGATGATGCTGCGGTCGATACCCGGAATTTCTACCGAGTGAAAATACT
+GTTGGCCAGTGGTATATCGGGCCCCTATAGCGAGATTGCTTCTGTTCTGTGTGAACCGGT
+AAAACAGACCGACTTAATTGGTTCGCTTGCCGGGAAGATTGATGCCGGGGCCTCTGCAAA
+CGATATAGCTCAGATGCTACAGGGCTATGCAAAAGAAAAAGGCGTTACCCTTACGCAGGC
+GTTCGGCAACTGGGAGAACCTGAGCGATGCATCCGTGACCGTTGATGAAGGAGGACCGGG
+GGAAACAACAAAAAAACTGTCCTTCATTATGAAGAATGTAGTTATTGCCGATCTTATCCT
+CGGTTCCCTGATTAAAGGTGAACACATCGAAGCACATAGCATTGACGCAACACACCTGAA
+AGCCGACATCCTGAAAGTACTTTTCAGCCTGACCTCGCCGAATATCGAAGTCACCGATGA
+GGGACAAGCATACAACTTGAATAATTATGCAAGGCTCCTGATAACTCCCTATACCATCAC
+CTGGCAGACGAGAAGTTCCATTGACTCTCCCTGGACCAGCCGAAGAATGCTCGGCAATAA
+CGAAGGAGATGATCTACTTGCCGATATAGCGCGTTTCCGAGGCCTCTTTCCATTAGATAG
+GGGCTTTGACCGATCTATTGGTTTTGGAAGGCCGGTAGGTTCACTCACCTACTCGTTTGA
+CAACATACTAACAGATCAAAACGGTGAGAATGCTTTTAGTGGAAAACAGACCGCATATAC
+AACGGGGAAATTTGGAGAAACACAAGCGGGAGCTATTGCCGCATCTACTAGTGCCGATTA
+TGCGGGGATGGTAGAGAAAGTATTTTCCCGGTCAATTACTGATTATTGGACATTGGCATT
+CTGGCTAAAGGAAACAGCCGCTCCCGTCTGCACGACAAAAGTCATTGAGATCAAAGAATT
+AACGCAAACGATAATAAGAAATACACAGGCCATAGGCGACGTGTCTTTTTCCAAAAGTGG
+AAATTACCTTGCGATTGTTTGTGCAGGAAGCCAAGGCCAGGATAACGGAACCTTTATCTA
+CAAGAAAAACGCAGGGTCCTTTTTCCTTTTAACAAAACTTGTACCATCTGCATCAGAGAG
+CTACCAACCTACAAATATCGCTTGGAGTGCCAACGATCAGTACCTTGTGATCACCGGTAA
+CTATGCAGGGCACATGTACAAAAGGAACGAGGATACCTTCAACTTACTCGGCCGCCTTGA
+GGGGATAGACAATACATCACGATCGGTTTGTTTTTCGAGCGATGGGAATTATCTTGCTTG
+TTCTTCCGGGTCAGGAAACTTGCTAAAAGCATATAAAAGGTCCGGCGATGTTTTTTCCAG
+GTATTCTCTTTCCTACACCATAAACGCAAATGCAAAAGCCCTTAGCCTTTCAAGTGACGG
+CACGTATTTGATGGCGACGGTTTCAGGATATGGTGGTGAAATTGACGGTCTATACCTCTT
+TAAGAACAATGGCTCCGAATATCGGTTACTCACTATTATTCACCATTATGATATCGATAA
+TAGCTATTTTTACTCAGTAGAATTCTCTCACAACGACAATTACATTGCTTTCGGTACTCG
+TCACGGTGTCATGATTTATAAACGTGTTGGGGACAATCTCCAGAAAGTGACAGATGTAGA
+GGCTGAAAATGATAGTGTCATTTATTCGGTACACTGGAGCCCCAATGACAGATACCTATT
+TTTTACGGGAGCAACAAGACCGTCAATTTACCGTCGAGATGGAGATGTCTTTACAAAGAA
+ATCCGATTTAGGAATATTCTCAGAATTTTACCAGTCCCCTTGTGCTGGTCTATCGGCAAC
+ACATTTTGCCTATGCAGACAGAGTCGATAGTACTTCAACCACACATGAAAAGGTTTACAT
+CTATGCGTTTGAGGAGAATGACAACTGGTGGCTTGAACCTTCTTTGCAGAATGTACCGAA
+GCTACTCTCGTTTGAAACCGATGAGGATGTTTTATCCGTTTACCGGAAACCCCATTCCAT
+AGTCCTTGCAAAGGCCGTAACCAAAACATCTCAAACACTCACCATCGATGAGGTAAAGGT
+TTGGAACTTCATAGCTTTACGAAGCAATGGCGATGGGACAATCAGCTTCATGCTCAATTC
+GCAAAAGGTCACATTGACGGTATCGCTTAAAGATACAGAGAGCTTGAAAATCATCTTTTA
+CCTTCTGAAAGAAAATGGTCTCAAGATCGATGACATGATCTTCTTTACCGGTCTACTGAC
+TGACGACTTCCTTCAGACCTATCGAAATTCTGGCTATCCCTGGGCTGATGCGGAATTCGG
+CGACACCTTTATAGGAGCTTCCCCAGGAAAAAAAATCCGTGTTATCGACAAGGTCGTTTT
+TGAGAAAGAGATTGATGCGGCCATACCCACCCCCGTTGTGGATCACGAATGGAACGGTAC
+GCAGTTATCGATTACCGATGAAAGCGGTCAGGGGCCATATGTCGATCTCAAGGGACCCGA
+AGGCCCTCAGGGGCCCCAAGGTAAACAAGGAGTCCAGGGGCCTACCGGACCGACCGGTCC
+TAAAGGAGACAAGGGGCCGACTGGCCCTACTGGACCGAAAGGACCAACCGGTCCCAAGGG
+AGAACAAGGCCCCACGGGTCCCACAGGACCCCGCGGAGTACAGGGGCCGACAGGGAATAC
+CGGGCCCGCCGGACCAACAGGACCACGGGGGCCTCAAGGAAATCCCGGAATAACAATTCC
+CGATATATCAGGCCTTGCCGAAATTACATCGATCGACCCGTCAAAAGATAAGCTGATTGT
+CTATGACGCAAGTACGGGTACGCATAAATCAATGCGGATATCAGAACGTTTTCCCGTAGG
+CTCCCAGTACACACAATATGCCTCAAGCGCAAGCAATGACCTCTCGGTTGCCTTTCCGAA
+TAGCGAGTCCCCCGCTTACCTGTTTGGAGGGACCTGGGAGAAACTGTGGGACGGCGAAGG
+CATAGACTTTCATACCGAAGGTTATAACGGTTCAGGACGAACAAATGGGCTAATGCCCGA
+TAATCTCCAAGGCTTTATCACACTTAATGGTGTAGGAACTAATACAAGCGGAAGTAATCC
+TAAAATTTTTGTCTATGGATACACGACTGAAGACGTACCAGGAAAAGCTGAGGATATCAA
+TGCGGCTGCCAATATTAATACAACAATTCAAGGCAAAACATCGGGACCCAAAAGTGATGG
+TACGAACGGTACTCCTCGCATTGGGGCAAGAACATCCGACCGTAACCGCCTCATGAGGAT
+ATGGAGGAGAATTGCATGAAAACCTATGCCGTAACAGACGGCTCAATGATCACCGCTGTG
+GTGCAAAGCGCCGATGAGACGGCAAAGCTTGCAGAGCTGTTTCCGGAAAAGAGCATCAAG
+GAGATTCCTTCCTGCTTTAGCGGAAGCAAAGGAGATGATATCCGCTTTTACGATGAGGAT
+GGAAAGCGGCTTTCGGTAGCAGCCGCAACAGAAGCCGGGCTCGTGCTTGAAGCCGGAGAA
+CATGAGGCCTCTATCTGGGAAGGCGGTAAGTATGTGCTTGTCCCCGACTATACCGGTGTT
+CCCTACTGGGACAAGGCCACAGGAGAGGCGGTACACCTGTCCCTCGGCCGAAAGCCTGAT
+GAGAGTATGACCGACATTGCCCCGCCGGACCCTGGGGCCTTGTGGAGTGAAACGGGTTGG
+ATGGTCCCTGATGAGGTGCTCTCCGAACGGATTCGCATGGAACGTGATGCGCTGCTTTCA
+GGGAGTGACTACATCATGATGGCCGACTATCCCCTGGCCGATAAATCGAAGTGGAAAGCC
+TACCGACAGGCTCTCAGGGACATTCCCCTACAGCCAGGCTTCCCTCAGGAGATTTCCTGG
+CCACAGGTACCGGAGAAAAGGAGTTAAGCCAATGGGCGATAACGACAAAATCGATATGGT
+CTTAAGCATTGTGACGGAACAAGGCCGGGACATCAAAGAGATCAACAGTAAGCTCACCGA
+CTTTTTCATCAACCGGGAAAGTACGTGCCCTGTTGAGAAACGCCATGAGAAGAAGATTGA
+GTACCGAACAGTCATTGTCGGAATGGTGTGCGGTCTTGGTGGTTCGATTATCGGGGGACT
+ACTCCCCGTTGTTTTGGGAGGGTGAAAAATATGATTATGAGCTGGAATCGACGAGAGAAA
+AAACTCGTTTGTGGAAACAGAAAAATACCTTGTTCCTGCATTGTTCGCAACGAGCTTAAT
+GGATGGAGACCGCTGGCAAATAAACCGGCACAGGATGAGGTCGTAAGGTCTCTACCGGAG
+AATATTCCGTACATGCCACGACCGTTTCCGGTCGGACGTTGGAATGTTGGCAGACCAGTG
+CCTCGATCTCATCCGTATAAAGCCCCCTATTACATCCCGACTGATGCCTTCCAGATGCTG
+CCGAGATGGGAACTTGACGACGATGGTGGATATCTTCGGGAAACGGAGGATATGGTCCGT
+GACGAAGATTATGGACTTCATTGCTCATCATCAAACACAACACTCGGCTGTATCAGAATC
+ACCAAGGAAAAGGATTTGCTCTGGATGGTCGAGAAGATCAATAGAACGCTTGATACAGGA
+GAAAAGGTGTATCTGGAGGTAGCGGCATGAAGAAATTCTTCAAAAGTTTTTTCAATTCCA
+CGAATGACATAAACGAGAGTACGGTTATCGGGTTTGTCGTTGCCATTTTGTTTGTTGCGG
+CGACCTTCCTGAATATTGTGGATGCCGAAAAATACCAAACGATCGGCTGGGTATTGGTTG
+GATTGTTTACCGGATCAACGGCGCGAAATATCGTTGACACATTGAAAAGGTCAAAGGGCA
+ATCCCTAACGAGGTGAAGGATTGAGATGCGCAAAATTATTAGCATTATCCTTACTCTTTT
+TGTGTGTTTTTCCGCTGGTTTCCTCCTGGGCACTTACCGCTCAGGAAGAGGCGATAGTGG
+ACGAGCTGCAGAATACGATAGTAGAGGCAAAAAGCGAGATACAGAGTATCAAAAGCTCAG
+CAATGAGTATGAGCGAGCAGTTGAGACGTACGAGGGAGAGCTCGCAGAGCTTCGAGCGGA
+AGTGGCAGGATACGGAAAAGAAGCTGGAGGGCTTACAGAGCGAATCGGAGGAACGGAAAG
+CCAAAGTGTCGGCATTGCAGAGCGAGCGGGACGGGCTGAGGAAGGACTATCAAGAGCTCT
+TGATCTATTGCGAAGGCTTAGAGAGGCGGAATCAGCGGCAGCAGACGGCCCTTAAAGCCG
+GGGGCTCTCTCCTGGCCGCCTCAATCATCGTGAATGTACTGCAGGCTCTGTTTTGATCTT
+GCTAAGGGGGAAGAGTTGCATCCTTCTCATGGGAGGATTATAATACTCATGGGTCATTTC
+GTTGGTTATCTGCATGAAATTCATGTTGATAAAGGAAGTTATATGCAATTTCTTTTTTGG
+CTAAAGATATATGAGAAAGAGCCCGCCGTCCATGGGCTCCGTTAAGAAATTAGGAGGATT
+AGATGAAAGATATCTCAGAAATAAATATGAATCTTGATGAATATAATTTTTATACTTTTC
+AATTCGTTGATGAACTTAGATATTTTTTTACCCCTGAACAAGTTTTTAATAAAAATGACG
+CATTTAATAATTTCATTGAAAATTTAAAGGTAAAATTTAGAGACTGTGGATGGGAAGGAG
+ATGGAGAACTTAATATTGGTTGGCTTCCTCCATTTCTTGATGAATCTATTGATCCTAATT
+ATGGAAATATATATTGGCATATTAAACAGGATAATAACGGCTATTCTTTTATTGCATCAC
+CTTCTACTTTTTATTCTTCACGAATATTGGATCAAAATAAAAAACGTTTTATAGGTAGCA
+AGATTCTTGAAACTCAATCTATTACGGAAATTACAAGTAAAATACTTATAGGGAAAACCA
+AAGAGATTCAAGATATTATTAATGATTTAAAATTAGAAAGTTATCCAGATATCATTTTAA
+AAACTATACTCATTAGCATCCAAAGTGATCTCGTTTCATCCTTTATATCTTTTATTGAAG
+ATGTATATTTACAATTTATCATTCATTTTTTCGAGGAGAACAATAGAGACAATTTAAGAC
+TAAGTAAAATCGATGCTAAAATTGATATGAAAAGTATTAATTCAGACATTGATTATAGTG
+ATAGAGAGCAATCATTAACACTTCGATTAATTATGAAATCTATTTGGGAAAATTTTAAAT
+TTTGGCCATTTAAAGAAAAATATAATGAGATCACAAAAGCTATTGATTTCCAAATTGATC
+AATCATCTCGTGATATGCTTTTTAAGCATGTATATTTACGAAATTGTATCCATCACAAAA
+ATGGACAAGTTCAGAATGATTTACAAAAAATGTTAGGTAGAAATAATATAAAGGTGTTAA
+ACAATCAAAATAGAGAAATTGTGTTGAAAGAATGGGATTCTATAGATTTATCTATAAACG
+AAATATCAATTTTTAAAGAAAAATTAGAAGACTTCATAAGCAAATATGAGGTACATATTT
+TACAAAGAATGACAAGTAGATCAATACATCATAGTTTTAAAAACCCAATTGTCAGGAAAT
+TTGATTTATCAGCAAAGAAAGACACTGATTAA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_015761.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_015761.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1407 @@
+>NC_015761.1|provirus_847397_862760
+TTACTGATAGGGATGCTTCTGTTTTTCTTCCCCCTTCGTTCTTACAAAAGTAATTCGATA
+TTTGGTCACCTGTAAGCCGGTAAGATTTATTGCTTCTCGCCAGCGTGCGCCTGTGCTTAA
+GCATATCTTGACTACCAGTGCCAGAATTGAGTCCTGACGTTTGCAATCAGCCAGCAATTC
+AACAATCTGCTCATGGGTAAGCCATGCCATCTCTTTTTCTGCGATGATGAATTTTCGCAT
+GTTCTCCAGTGGGTTCGGATACGACTGTGACCGAAGTGGACCGGGAAAACTAGCTGTGCC
+GGGTGAGAGTGGGCGAGCTTGAAACCAACTGGATTAACTGGCTGACGCTGCGTGCCGGTG
+GTGCCCGTACATGGTGGTGTCCGTCGCCGGATGAGCAGGTGGTGGTGCTGAGCATGGGCG
+GCAATCTGGAAACCGCTTTTGTGCTGCCCGCCATCTACTCCAATCAGTTTGCGCCGCCGT
+CGGATTCTGTGGACGGCTGCGTGACGGAGTACCCGGACGGGGGCTGGTTTGAGTACGAAC
+CCGCCACCGGGCGGTGGCATGTCCGGGGTATCAAATCCATGGTGATCGAGGCGGCGGATA
+ATATCACCCTCAAAACCGGTGAGTTTGTGGTGGAGGCTGACACAACACGCATTAACAGCG
+AGGTGGTGATCAACGGCGGCGTCACCCAGGGCGGCGGCGCAATGAGTCTAACGGGGTCGT
+GATGGATAAACACGGTCACACTGGCGTTAAGTCAGGCGGGGATACATCGGGAGGTCCGGT
+ATGACGTTGTATATCGGTATGAGCAGGAATGACGGGCAGGTAATTGCAGATACCGACCAT
+CTGCGCCAGTCGGTGCGGGATATTCTGCTGACGCCGCAGGGCAGTCGTCTTGCTCGCCGG
+GAATATGGCTCCCTACTGTCTGCCCTGATTGACCAGCCGCAGAACCCGGCACTGCGCCTG
+CAGATTATGTCTGCAGTCTATGTGGCGCTGAACCGCTGGGAGCCGCGCCTTACGCTGGAC
+TCCATCACCATCAACGGCAATTTTGACGGCTCTATGGTGGTTGAGCTTACGGGACATAGT
+AATAACGGAGCACCGGTTTCCCTTTCCATATCAACAGGAGCAGACAATGGCAGTCATTGA
+CCTTTCCTGGTTACCGCCGCCGCAGATAGTGGACGTGCCGGATTTTGAGACGTTGCTGGC
+TGAGCGCAAGGCCTCTTTTGTGGCTCTTTATCCTGTGGATGAACAGGACGCGGTGCGGCG
+CACGCTGGCGCTGGAATCTGAACCCGTCACCAAGCTGCTGCAGGAAAGCACCTACCGCGA
+AATCCTGCTGCGCCAGCGTATTAACGAGGCTGCGCAGGCGGTGATGGTGGCCTATTCGAT
+GGGAAATGATCTTGAGCAGCTGGCAGCCAACTGCAACGTGAAACGTCTGACGGTAGTGCC
+TGCTGATAATGATGCAGTACCGCCGGTCGCCGCAGTGATGGAAGATGATGAGGCGCTGCG
+CCAGCGCATCCCTGCAGCATTTGAGGGACTGTCCGTTGCTGGCCCTACGGGAGCCTATGA
+ATTTCACGCCAGAAGTGCGGACGGACGTGTGGCAGATGCCAGCGCAACCAGTCCGGCCCC
+TGCCGAGGTGGTACTTACCGTGCTGAGCCGGGAGGGTGACGGTACAGCAGTAAAAGACCT
+GCTGGATGTGATTGAAAAAGCCCTGAACAGTGAAAGTGTACGCCCGGTGGCTGACCGTCT
+GACGGTTCGTAGTGCGGAGATCATCCCGTACCGGGTGAAGGCTACCATTTTTCTTTATCC
+AGGGCCGGAAGAGGAGCCTGTTATGGCGGCGGCAAAAGCCAGCCTGCAGAGGTACATCGC
+CAGTCAGACGAGGCTGGGACGTGATATCCGCCGCAGCGCCATTTATGCCGCGTTGCACGT
+GGAGGGCGTCCAGCGTGTGGAGCTGACGTCCCCTCTGGAGGATGTGGTGCTGGATAAGAC
+GCAGGCGGCATCCTGTACTGAATGGAGCGTTACCAACGGGGGCACGGATGAATAGTCTGT
+TGCCGCCGGGTTCGTCGCCGCTTGAGCGCCGACTGGCGCAGACCTGCAACGGGATTTCCG
+ATCTGCAGGTATCGCTGCGTGATTTGTGGAACCCGGCAACCTGCCCGATCAGATTTCTGC
+CTTATCTTGCCTGGGCGTTTTCTGTTGACCGCTGGGATGAGAGCTGGGCAGAAAGCGTCA
+AGCGCCGCGTTGTGCAGGACGCTTTTTATATCCATCAGCACAAGGGGACAACCAGCGCCG
+TGCGGCGCGTGGTGGAGCCGTTCGGCTTCCTGATCCGCATCATTGAGTGGTGGCAGACCG
+GCGAAACGCCGGGGACGTTCCGTCTGGATATTGGCGTGCAGGACCAGGGCATAACAGAAG
+GAACCTATCTGGAGCTGGAGCGCCTGATCGGTGATGCCAAACCATGCAGCCGTCATCTGG
+TTGGTATGTCCATCAACCTGCAGACAGGCGGCCCGTATTTTGTGGGTGCAGCCACCTACA
+CCGGCGAAGAAATCACGATCTACCCGTACATCAACGAAACCATTATTTCCGGCGGCACCG
+CCTATGAGGGCGGAGCGGTCCATGTTATTGACACGATGAGAGTGAACCCATGAGCGCAAA
+ATTTTACACCCTGCTGACGGATATCGGCGCGGCGAAACTGGCAAGCGCCACCGCGCTCGG
+TGTCCCGTTGAAAATTACCCATATGGAGGTGGGTAGCGGTGGCGGTGTGCTGCCCACACC
+CAATTCGCAACAGACCGCATTAGTGGCTGAGGAGCGCCGCGCGGCGCTGAATATGCTGTA
+TATCGATCCGCAGAATAGCAGCCAGATTATTGCTGAGCAGGTGATCCCGGAAAATAAGGG
+CGGTTGGTGGATTCGTGAAGTTGGTTTGTTTGATGAAACCGGTGCGTTGATCGCTGTGGG
+TAACTGCCCTGAGAGCTACGAGTCACAACTGGCAGAAGGGAGCGGACGTACGCAGACCGT
+GCGCATGGTACTGATTACCAGCAGCACCGATAACATCACCCTGAAAATTGGCCCTGCTGT
+GGTTCTGGCAACCCGCAAATATGTGGATAACAAGGTGCTGGAGCTTAAGGTGTATGTTGA
+TGACCTGATGGCAAAGCACCTTGAAGCTGTTGATCCTCATTCGCAGTATGCACCAAAAGA
+CAGTCCGACACTCACCGGCACGCCAAAAGCGCCGACTGCGGCGGCAGGCAATAATTCGAC
+GCAGCTTGCAAATACGGCCTTTGTGCAGGCTGCTATTCTTGCCATGATTGGTGGCGCACC
+GGCAACGCTGGATGCGCTGAAAGAAATTGCAGCAGCTATCAATAATGACCCGAATTTCAG
+TACCACCATGAACAATGCGCTGACACTGAAAGCACCGCTGGCAAATCCGGCCCTGACCGG
+AACGCCCACGGCTCCCACTGCAGTTCAGTCAACGAACAATACGCAGATTGCCACTACCGC
+GTTTGTGAAATCTGCCGTTGCCGGGCTGGTCGGTTCCGTCGCCGGAGGCGCTGGATACAC
+TGAATGAACTGGCGGCTGCGATGGGAAATGATCCTAACTTTACGACAACAGTGATGAACG
+CGTTGTCGGGAAAACAGCCACCTGATGCCACGCTGACAAATCTCAGCGGGAAAAGCATTT
+CAGGGCTTCTCGAATACCTCGGTTTTCAAAAACGTCAGAATAATGTGGGACATTGTTAAT
+TCAAACGATACATACAACATTTATTTCATTGGAAAATAATAGTTAAGATTGAATTAAAAA
+AATACCATTCACACATTTTTATTTATATAAAAATATCAAAAAAAATTAGTCACAACAAAC
+ATCATTTATTTTCATCCCTGCCATCAATCTTAGATTGAATTTTAGCATGTCAAATGATAT
+ATTATAAATCGTTCATTATATTTTAAAGGGTTAAACAAAGAATGAGTGATAGTCAGGGAT
+TTCAGATTATATTTATTTTTACATGTTTGATATTCGCAATAGTATTATTCTCTCATAGAA
+AATTTAGTTATATTGATCGTGTAACTGAGAATGACAGAAACACCAGGTTGGATAGTTTGA
+GATTTTTAATGTCATCATTTGTTGCATTTCATCATTTTATTTTTAGCTATCATCTTGTCA
+ATAGTGGGCAGTGGATAATCCCAAACCATCCAATTGAAGAATTTGCTGGAAAGTTCGGCG
+TTGCTATTTTTTTTATGATTTCAGGATATTTGTTTGTTAAGTGTATAGAAAAAAAAGTAA
+ATTGGCTAACTTTCTTTATAAAGCGGTTTTTTAGAATTTGGCCTGTATGTGCTTTGTCCT
+CGGTAATTTGTATACTAATTGTTATATATATTGAAATTAAAAATAATATCCCCCTCAATA
+CTGATGGCATAATGCAATGGTTTGATGGCGGTCTAATCATAGATACACGTCCCAACCTGG
+GCTACGAACATTCAACCTTAATAAATGCAGGTGTTACCTGGACATTATATTATGAGTGGG
+TGTTTTATTTCTCGTTGCCTTTTATTTCTTTATTTTCTTCTAAAAACAAAAGCTCTCAAA
+TTTTACTATCAATAGTCTTTTTATCTATATACATATTTAGTAAGTATGATTATTTATTGT
+CATGTTTTATACTGCTTTTTGCGCTTGGTGGTATGGCAAAAAAAATAAGAGAACAAATAT
+CAAATGTTAATCAACATACTGTAAACATACTGGCAGTCACTTCATTTATTTTATGCTTCT
+ACTTTGGTTATAAAGAAAATCCATTTACGATATCAATGATATTTCTGTATTTTGTTTTTT
+TCCTTTCAGTTTGTCTTGGCGCTGATATTTTTGGAGTGCTTAGATTAAAAGGAATCATTA
+GGCTTGGTGATGTCAGTTATAGCATATATTTGCTGCATGGGATATTTTGGTTCATCATGA
+ACAAGCTCATATTCAGCGCAGGGTTTGAGAATTCACAAGCCATATACTATACAGCTTCAT
+TTTTAACATGGATTTTCATATGCGTATTCTCCAGCATCGTGTATGCATTGTTAGAAGTGA
+AATTTATACATATTGGAAATATTATATGTAAAAAAATCACAAATAGTAACATTCAGTAAT
+CTAAAAGATATTATATATAAAAAATTAACACCAGACCTCCTAAGATCTGGTGTTAACACA
+TGATGTTATGAGCACTTAATTGAAAGACTGAAAACCATTAATTACTTCTTGCGGAAATAT
+AACTGTAAATGATGAATATTTAGTATTAAAAATAAACATTAAGCACATTGATTTTATCTT
+GGTTTTTGCCAAGTACTATAGCAGATGGATGAGATTGTAATTAACTGGTGGCGGTGGATA
+CTTCCAGCACACACCAGAAATTAACTAAACTGTTCCCCGGTAAGGCAGGCCATACAGGTT
+TTGAAGTATCTACACGCATCAACAAGACCCGGTATTTCCTCCACGCAATCAATGCAACGG
+ACTCATCCGCAGTCGCTATCTCCGCATCAACAGCATCCTGACGCCATTCAATCTCAGTAT
+CGGCTACTGTCTTTAAACGCAATTTTTCAGATTCTGCACGAGAGACTAATTCATCATGAG
+TCGGGGCAAGAATATCAACCCATGCAGGCATTCCATCGCAGTCCACTCCGAGAATTTTAC
+CCTCAGGCGCGGGGCCAGAATATTCAATGTGGATTGATGCAGTGACTTCAACTAAATCAT
+CAGGCCAATTTCCTGCCTGTTCATAGAAGAACTTCAATACTTCATCATAAAAACCGATAT
+TTGACGCGCTAAATAAAATGATCATATCAATATCCTATAGCGAACCAGAACCCACCACCG
+TTTGAGTTGAAATCAGAGTCATTAGCGACATAGAAGCCAAATCCTGTTCGCGATACCCCT
+GTCGACGAACAACCAACCCCTTTACCAGATTGTGACGTTGCGTCCAGACTACAAATAACG
+GAAGCCGCTATTGGCGGAAATGTAATGGTAAAGGTTACATTTGTGTTTTCCCAGCTTGAG
+TCGGCCCGACTTTACCCCATTGAAAAATAAGCCCTCCGGGCAAATACTGATATCCGGTCT
+CGTTTTTTGATACACCAAAAGCGTTCATATCCGGAACTTGATTTGCTCCAGTACCAATTA
+TTTTGAGAGCAGCGCTTCCCAGTTGAAGTAACGTTCTGACCTCATCAACAGTATTTTTGG
+CGATAATATCGCACCCAGTTTTGTCAGTGTGGTTATATCAGCAGAATTGTTACTGTTGAA
+AAATGGCAGTTTGTCCTTCGCTATTTCCAGCCCGGATAATGCAGTCAGCTGTTGTGAGTA
+ATTCTGTTTGTTTCCCAGTGCTTCTGTTAAACCGACGTTTAAGAAAATGCTGTTTTCCCG
+TCTGGCTGGCATTATTTGGGCTTTTGCATAAGGGAAAACAAATGTTAGTCGGCTATGTGC
+GCGTATCAACAAGTGAGCAAAACACAGCGCTGCAGCGTGATGCACTGGAACGCTCAGGAT
+GTGAGCTAATTTTTGAAGACAAAATGAGCGGAAAAACAGCAGACAGGCCCGGGCTAAAAA
+GGCTGCTCAGGACGTTATCAGAGGGAGACACGCCGGTTGTATGGAAACTCGACAGGCTGG
+GACGAAGCATGCAACACCTTGTGACCCTGATAGAAGAACTCCGACAGTGCGGAGTTTAAT
+TTCCGCAGTCTGACTGACAACATAGATACCAGTACGCCAATGGGGCGGTTTTTCTTTCAC
+GTTATGGGGGCACAGGCGGAGATGGAACGCGAGCTGATAGTGGAACGAACCCGTGCGGGA
+CTACAAGCTGCAAGAGCTAAAGGCAGGATTGGAGGGCGAAGACCAAAACTGACGCCAGAG
+CAATGGGCGCAGGCAGGTTACTTGCTGAAGGTGAAACACGGCAGCAGGTTGCTTTAATTT
+TTGATATGGGTATCTCAACGTTATACCGCAAATATCCTGCGACATTGTGTGATTAACAGG
+ACAACGCCGCGCAGCTGTCTGCGTGACGTAATCAATACAACACAGGGCGAAGCCTATTCC
+AATCAGGAGGTTCGCCGCTATGGCTCAGGATTACCACCACGGGGTGCGCGTTGTTGAAGT
+CAACGAGGGCACCCGCTCTATCACCACGGTGAGCACCGCTATCATGGGCATGGTCTGCAC
+CGGCGATGATGTTGATGCGTCCGTGTTTCCCCTCAATAAGCCGGTCCTGCTGACTGATGT
+GCTTACCGCCAGCGGTAACGGGTGAGTCAGGAACGCTGGCCCGTTAGCTGGATGCGATTG
+CCGACCAGTCAAAACCCGTGACGGTTGTTGTGCGCGGGCCGCCATAAAGAAGTGGATTCC
+GGCGAGTGGAAAACCGGCGAGAGCAGCAGCACCAAAGTCAGCAGTATCAACAGCTACGCG
+AAACTGACCATTAATGGTGAGGTGCTCTATGAGGTCGATCTGGTCAACATGGTAGAAATC
+GTTGGCGGCGTGGACCTGATGGAAGAACACCGTAATGCCCTTGGCCTCTGATTAACCTTA
+ACGGCGCGGGCAGCCGCGCCAGTATTTCATTAACAGGATACGAACATGAGCGACAAGCTG
+ACTGAAAAGACCGTAAAACTGGATACTCCCATCATGCGCGGTAAAGCTGAAATTACCGAA
+ATTGTGCTGCGCAAGCCTCAGTCCGGCGCACTGCGTGGCACCCGTCTGCAGGCCATTATG
+GATATGGACGTGGGCGCAATGATGACTGTGATTCCACGAATCTCCACCCCGACGCTGACC
+GCGCAGGAAATGGCAGAGCTGGACCCCGCCGATCTCACCGCGCTGTCGGTAGAGGTGGTG
+ACTTTTTTGTTGAAGAAGTCGGTGCTTGCCGGTTTACCGACAGCCTGACGATTGATGATC
+TTGTGGCGGACATCGCCACCATCTTTCACTGGTCGCCATCCATCACTGACGTTATGCCGC
+TGACTGAGGTGCTGGCGTGGCGGCATAAGGCAATTCAGCGAAGCGGGGCCAGCGATGAGT
+GACAATAACCTGCGTCTGCAGGTGATTCTTAATGCGGTTGACAAGCTCACCCGCCCATTT
+CGATCCGCGCAGGCCAGCTCAAAAGAGCTGGCTGCAGCCATTCAGCAAAGCCGCGCCCGT
+TTAAAAGAATTAGATGCTCAGGCGGGCCGCATTGACGGTTTCTGCAAGGCCAGCGCGCAG
+CTGGCAGTCACCGGTAACAGCCTGAAAGCCGCACGCGAAGAAGCTGCGAAACTTGCCACG
+CAATTCTCTGCCACCAACCGCCCGACGGCGGCGCAGGCACGGCTGCTTGAGCAGGCAAAG
+AACCGCGTTACGGAGTTACAGAGCAAATATAACGGTCTACGTCAGTCAGTGCAGCGCCAG
+CGTCTTGCGCTCAATGAAGCCGGACTGGACACGAAAAAGCTCAGTAGTGCGCAGCGGGAA
+CTGCGGCAGAATGCCGACGAAACCCGGCAGGCCCTGGACCGGCAGCAGAAATCCCTTAAA
+CGCCTGGGCGAACAGCAGGCGCGAATGAACGCCGTCCGCGATCAGTATTCGCGCCGTCTT
+GAGGTGCGGGATCGCATCGCCGGGGCAGGGGCTACCACTACGGCTGCAGGGGTGGCAATG
+GGCGCACCTGTTGTGGCGGCAGTTAAGAGCTACGCCAGCATGGAAGATGCCATCAAGGCC
+GCCAGCGAACAGCTGCCGATGGAGAACGGCGCTATAGACTATGCCGCGCTGGTTGAAGGT
+GGTGCTCGCATGGGTGTGACCAATCAGGACGATCCTTACGAAGAGCAGAAACGTGACCTG
+CTGGCTTTTGCATCCACGGCGGCAAAAGCGGCAACGGCCTTTGAGCTGCCCGCCGATGAG
+CTGGCGGAAGGATTGGGGAAAATCGCACAGCTCTATAAAGTGCCGACGCGCAATATTGAA
+CAACTGGGCGATGCGCTGAACTACCTGGACGATAACGCCATGTCAAAGGGTGGGGACATT
+ATCAACGTCCTGCAGCGTATGGGGGGCGTGGCTGACCGCCTTGACTTCGAAAGGCTGCTG
+CGCTGGGTTCAACATTCCTTTCTCTTGGGGCTGCCCCGGAAATTGCCGCCAGCGCCTCTA
+ATGCCATGGTGCGTGAACTGTCCATTGCCACCATGCAAAGTAAGCGCTTCTTTGAAGGCA
+TGAATCTGTTGCAACTCAATCCGGCGGAGATTGAAAAGCAGATGACCACCGATGCCATGG
+GCACCATTCAGCGGGTTCTGGAGAAGGTCAACAATCTGCCGCAGGATAAACGCCTGTCAG
+CCATGACAATGATTTTTGGCAAAGAGTTTGGCGATGATGCGGCAAAGCTGGCTAACAACC
+TGCCGGAGCTGCAGCGTCAGCTGAAACTCACATCAGGCAGTGGTGCTAATGGCTCGATGC
+AGAAAGAATCCGACATTAACAAGGATTCATTGTCTGCGCAGTGGTTGCTGGTTAAGACTG
+GCGCGCAGAACGCTTTCAGCAGTCTGGGGGAAACGTTGCGTCAGGCGCTGATGGATATTA
+TGGGCATGGTTAAGGGCGTGACCGGGGCGCTGCGTCGCTGGGTGGAGCAGAACCCCGTGC
+TGGCTGGCACGCTGATGAAAGTGGCGGCGGCTACGGCGGCTGTCACTGTAGGGCTGGGTA
+CACTTGCCGTGGCGGTAGCTGCCGTGCTGGGGCCGATTGCGGTGATTCGGTTTGGCCTGT
+CTGTGCTGGGTGTAAAAACATTACCTTCCGTTGCTGCAGCGGTAACACGTACTGGCGGTG
+CCCTGTCATGGCTGGCAGGTGCGCCACTTTCCCTGTTGCGTCGGGGTATGGCGTCATCCG
+GTGGCAGTGTCGGGTTACTGAGTGCCCCGCTTAATTCCCAGCATCGCTCAGCCGGAATAG
+CGGGTAATGCGCTGAAAACGGTAGCAGGTGTGCCGCTTGCCGTGTTCCGTGCCGGTATGT
+CAGGCATCCGTAATGTTATCGGTATGGTGATGAACCCGCTGGCGGCGTTGCGGGGTGGGC
+TGACAGCTGCCGGTGGCGTGTTGCGTTTTCTTGTTTCTGGTCCGCTGGCATTACTTCGCG
+GCGCGCTGTTTGGCATTTCTGGCCTGCTGGGCGCGCTGCTCAGTCCGATAGGGCTGGTTG
+TGGCTGCGCTGGCTGGTGTGGCGCTGGTTGTGTGGAAATACTGGCAGCCCATCGGTGCAT
+TTCTGGGGGGCGTGGTGGAAGGGTTCAAAGCCGCTGCTGCGCCCATCAGCGCCGCCTTTG
+AGCCGCTCAGACCCGTGTTTCAGTGGATTGGTGACAGGGTGCAGGCCTTGTGGGGCTGGT
+TCAGTGATTTACTTACCCCGGTTAAATCCACTTCCGAAGAACTGAACAGCGCAGCTGCAA
+TGGGGCGTCGGTTTGGTGAGGCGCTGGCGGAAGGTCTGAATAGGGTGATGCACCCGCTGG
+AGTCTCTTAAATCCGGTGTGTCATGGCTACTGGAAAAGCTCGGTATTGTCAGTAAGGAGG
+CGGCAAAGGCGAAACTGCCCGCGCAGGTTACGCAGCAGCAGTCCGCCACAGTGAACAGTG
+ACGGCAAAGAGGTGCTGCCGCCAGGCGGGTTCCCGGCTTACGCGGGGATGTACGACAATG
+GCGGGATCATTCCACGCGGGCAGTTTGGCGTTGTCGGAGAAAATGGCCCTGAAATTGTGA
+ACGGACCGGCAAATGTTACCAGCAGGCGGCGTACTGCTGAGCTGGCCTCTGTCGTTGCTG
+GCGTGATGGGGGTAGCTGCGACACCTGCAGAAGCGGCTCCGCTTCATCCGTTCAGTTTGC
+CTGCGAGGGCATACCAGCCCCCGCTTGCTAAGGCAGATAGCCCGCCGCCGGTTATTCGTT
+ATGAGATAAATGCGCCCATTCATATTGTCGCTCAGCCTGGGCAGAACGCGCAGGATATTG
+CCCGTGAAGTGGCACGCCAGCTTGACGAGCGGGAGCGCCGGGCCAGGGCAAAAGCGCGCA
+GCAATTTCAGCGATCAGGGGGGGATGAATCATGATGATGGTACTGGGTTTATATGTATTT
+ATGCTGCGCACTGTCCCTTATCAGGAACTGCAGTATCAGCGCAGCTGGCGACACGCCGCC
+AACAGCCGGGTGAACCGCCGTCCGTCAACGCAGTTTCTTGGCCCGGATAATGATTCACTG
+ACACTGTCCGGGGTTCTGCTGCCGGAAGTGACCGGCGGCAGACTGTCATTACTGGCGCTT
+GAACAGATGGCTGAACTGGGCAAGGCATGGCCTTTGATTGAAGGCTATGGAACCATTTAC
+GGCATGTTTGTTATTGAGAGTCTGAGCCAGACAAAGACGGAGTTTTTTGCCAGCGGAATG
+CCCAGGCGCATTGAGTTTACGATCACCCTCAAACGGGTTGATGAGTCGCTTTCTGACATG
+TTCGGGAGCCTGAGTGACCAGCTCAGCAACCTGCAGGACTCTGCTGTTTCTGCGATTGGG
+GGGATTAAAAACACGGCTGGAGGGTTGCTGCAGTGAACGTTAATTCTGATCTTCTGAATC
+TGAACAGCAAAAGCCCGGCTTTCAGTATCGTCATTGAAGGTAAGGACGTGACGACCGTGC
+TGGATACCCGCCTGATGAGTCTGACACTGACGGATAACCGGGGCTTTGAAGCGGACCAGC
+TTGATCTGGAGCTGGACGACGCCGACGGGCTGATCGCCCTGCCGCGACGTGGGGCTGTGA
+TTCAGCTGGCGCTGGGCTGGAAAGGCCAGCCGCTTTTCCCTAAAGGGGCTTTTACCGTAG
+ATGAAATTGAACACAGCGGAGCCCCTGATCGGCTGACCATCAGAGCGCGTAGCGCAGATT
+TCCGTGAAACCCTCAATACACGGCGCGAAAAATCATGGCATCAGACAACGGTGGGGGAGG
+TGGTAAAGGAAATAGCCGCACGGCATAACCTCAAAATGGCGCTGGGTAAAGACCTGACGG
+ATAAGGCGCTGGATCATCTGGACCAGACCAATGAAAGCGATGCAAGTTTTCTGATGAAAC
+TGGCGAGACAGTATGGGGCGATTGCTTCCGTTAAAGACGGGAACCTGCCAGTTATCACCA
+TCACGCGCAAAGTCGGTGACGGTCATCGGTTCACCCTTGCTGATCGTGGTGCCTATACCG
+GTGTTATTGCCAGCTGGTTGCATACGCGTGAACCCAGGAAAAAAGAAACAACCAGTGTTA
+AGCGTCGTCGAAAGAAAACCACCACACCCAAAGAGCCGGAAGCAAAACAGGGAGATAATC
+TGGTGGGAACGGATGAAAACGTGTTGGTTCTTAATCGTACCTACGCCAACCGGAGCAATG
+CAGAGCGCGCAGCAAAAATGCAGTGGGAACGCCTGCAGCGCGGCGTTGCGTCATTCTCGC
+TGCAACTGGCAGAAGGCCGGGCAGATCTATATACCGAAATGCCGGTGAAGGTGAGCGGCT
+TTAAGCAGCCGATTGATGATGCCGAATGGACCATTACCACCCTGACGCATTCTGTCAGCC
+CGGATAATGGATTTACGACCTGTCTGGAGCTTGAAGTGAGAATTGATGATTTCGAAATGG
+AATGATTATTCGCAATGGAGAACTTTTAAGTTTGCAAAATGGAATAATACGGTATTATTA
+TTGTGAATTTAGCAAAAATGGGGAGAGCTCGAAAAATGATGATTTGCCCACTGTGTGGAA
+GTGCCGCCCATACTCGCAGCAGTTTTCAGGTATCTTCATTGACCAAAGAGCGTTACAACC
+AGTGCCAGAACATTAACTGCAGCCATACTTTTGTTACCCATGAAACTTTTGTTCGTTCAA
+TTGCAACGCCAAAAGAGTCGAATCCGGTTCGGCCGCATCCAATGAAATCAGGACAGGTGA
+CGTTCTCTCTTTGACGCTGCCGCCATTTTGTCGCCATCTTTAAAAAACAGTGCTTCTAAC
+ATCATGATTTTAAACGGCATAAAATTCAAACAACAAAAAACCCATCAACCTTGAACCTAA
+ATGGCGGGGTTGATGGGCTCCACAAAATGGGGACATCAAAGAAAAGCAGTGGCAATAGGT
+ATGACTGAGGCTTTAACGGAAAGTTCTACTTATCTGCAAAATTTTTTCACTTAAAGGCAA
+ACTTCAGTTTTATCCTAATCCCGGCCAGATGATAACAATGAGCGTCCCCGCCAGTGTCAG
+CAGAACGTTGGCGATAGCATAAGTCCCGGCATAACCCAGCGCCGGAATATTGCTGCGCGC
+CGTATCGCTAATGATTTCCATCGCCGGGGCACAGGTACGGGCGCCCATCATGGCGCCGAA
+CAGCAGCGCCCGGTTCATACGCAGGACATAGGCACCGAACAGGAAGCAAATCACTACTGG
+CACCAGGCTAACGACAAGGCCTGCTATTAGCATTTGCCCGCCGACCGCGCCCAGACCATT
+ACTGATACCGCTGCCTGCGCTTAAACCGACGCCTGCCATAAATACCATTAAGCCGAACTC
+TTTTACCATGTTAAGCGCGCCCTGAGGAATATAACCAAAGGTAGGATGGTTAGCGCGCAG
+GAAACCGAGCATGATCCCGGCGAACAGCAACCCGGCCGCGTTACCGATGCCGAAACTAAA
+ATTGCTGAACTGGAAGGTAATCATCCCGATCATTAAGCCGATGATAAAAAAAGCGCAGAA
+GGCGAGCAGGTCCGTCACCTGGCTATGAATCGAAATAAAGCCGATGCGATCGGCGATGGT
+TTTTACGCGTCGGGCATCGCCGCTCACCTGTAACACGTCGCCTTTATTCAGCACCACGTT
+ATCATCGATAGGCATTTCGATCTGGCTGCGGATGACGCGGTTAAGGAAGCAGCCATGATC
+GGTCAGCTTGAGTTGAGCGAGACGACGACCGACGGCATTGTGGTTTTTCACTACAATTTC
+TTCCGTTACGATGCGCATATCAAGCAGATCGCGGTCAAACACTTCCTTACCATTACGGAA
+GCTGGGGTCGAGCCGGGCGTGCGCATCCGGATAGCCGACCAGTGCAATCTCGTCGCCCAT
+TTGCAACACCGCGTCGCCATCCGGGTTCGCCAGAATGCCGTTACGGCGAATACGTTCGAT
+ATAGCACCCTGTCTGGCGGTAAATACCCAGTTCGCGCAGGTTTTTACCGTCAGCCCAGGC
+CACCAGTTCCGGGCCCACCCGGTAAGCGCGGATAACCGGCAGATAAACTTTGCGATTGGC
+ATCGGTATCCAGGCCACGTTCACGGGCAATTTGCTGGGCGCTGGTTTGCAAATCCTGATG
+CTGTAGTTTAGGCAGGTAACGTGCGCCCACGATCAGGCTGACCAACCCGATGAGATAGGT
+CAGGGCATAGCCCAGACTGAGATTATCGAGAGCGGAGGAGAGCTGCGCGCTGGCGATGCC
+GGAATGTCGCAGGGTATCGCCTGCGCCCACCAGAACGGGCGTCGATGTCATTGAGCCCGC
+CAGCATACCGGCCGTCAGACCGATATCCCAGCCAAATACCTTACCCAGGCCTAAGGCAAT
+CAGCAGGGCGCTACCGACCATGACCAGGGCAAGCATCAGATAATTTTTACCGTCGCGAAA
+AAAAATCGAAAAAAAGTTGGGGCCCGCTTCAACGCCGACACAAAAAATAAATAGCATGAA
+TCCCAAATTTAGCGCGTCGGTGTTAATACTAAAGTGTTGCTGCCCTAATAAGAGAGAGAC
+CACCAAAACGCCAATGGAATTACCAAGTTGGACTGAACCCAGGCGTAACTTGCCAAGACA
+CAGGCCCAAAGCAAGGACCACAAATAATAACAGGATGTAATTCCCATTTAACAAATCTGC
+GACGTTTATATTCACGGAGACTAACTTCTTGTTTACGAGTAAGCTGTTGAAAGAAATGGT
+AATTTACGCTACTGTTTTTATCATGCGTTAAGGGTGTAATCGTATTGCATATAGCATCCA
+AATAAAACAACACAACAATATATCCTGCTAGTTTAATCTTATTGCGTACTAACGGCTATA
+AGAATCGTGCAGGTGTGTTTTTGGCATGGAATGCCACATGACTTTATCTGACTGGATGCC
+TCACGGCGGAAAGCGTGTTCGATAGAGAGAGTGTCAGGAGGAACGATTGAAACATAAACA
+GAGGTGGGCAGGCGTTGTCTGCTGCTTTGTACTCTTTATTGTGGTGTGTCTTTCATTAAC
+TATGCACGTGCAAGGCGCTTTTCGCGCGACCGGGCATCCTGAAATTGGGCTGTTATTTTT
+TACATTGCCAGGTGCAGTGGCGAGTTTTTGCTCTCATCGGCGCGAGGTGATCCGACCGTT
+GATCGGGGCGATGCTGGCGGCGCCGTTTTGTCTGGTGCTCATGCGCTTTGTATTTATGCC
+CACTCGTTCATTATGGCAAGAGCTTGCGTGGCTGTTTAGTGCGGTATTCTGGTGTGCTTT
+AGGCGCGCTCTGCTATCTGTTCATCAGTAGTCTGTTCAGTCAGAGGCGGAAAAAGCACCG
+ATAA
+>NC_015761.1|provirus_1007223_1045009
+TCACTTTTCCCCAATAACCGGACGATCCAGTGTCGGGCTGATTTGTACCTTCCTGTCGTA
+GATAAGCACCTGGCTTTCTGTTTTGTGGCCGCTGAAAATCTGCTTATCCCTGCTACTACC
+CTCAAAATCTGAAATAGCTTTTGCCTTGATATCATGGAATGTGTAATCCAGCTGTCGGCC
+CAGTTCACTTTGTGCGGCGCGTACAGCTTTTAACCAGCGATTATTGAACGTCTTGTGGAT
+GAACTGACCACGATTGTTGTTGTAGAGAACCAGCGCGTCAGGTGACAGTTTTGGACATTC
+TGTCTGTGCTGTTTTCAGCGCTTGCTGAAGGCGAGGTGTCCAGACCTTAATCTGTTTTTT
+TCCGGTCTTTCCTTGCTGGATAAAAATACCCTTATCAGAAACTTGCATCCAGCGCAGAGC
+GAGTACGTCAGCTTGCCGGGCGGCGCACAGGTAAGAAATTTCCATTGCAGCCCTGACAAC
+GTGATCAGCATGCTTATAAATAGCCAGGTAGTCTTCGTCAGTGATGTATTGCTCGCGAGC
+CTTGAGAGAGAATTTACTGACGCCAGCACACGGATTTCCCTTAACGTAACCGCGTTCATA
+TCCCCAGCGGTAAACACGTGACATACTGCTCATCTCCTGGTTGGCCTGGTTTTTACTTTG
+CAGTCCACGACGATCCATAAACTGACGCACATCTTCTGGCTTTATTACATCAGCTTTAAC
+TTTACCAAACACGGCAAGTAATTTTTTCTGATGTTGTAAATAATCCCGCTGGGTTCGTAT
+TGCAAGCTCGGTGTAGTAGGCGCTTTTAAGAAACATTCCCCAGAGCTTTTCAAACGTCAT
+TACATCTGAGTAATTGCGCCGTTCTTCCTCGTACCGTTTCCATAATGCCGACATAGTGAG
+TGTGATTGGCCCCAGTGTCACAGTTTCCCGCGACGTGGGTTTGTAGTAGTAACGCGTTTT
+TGTTTTGGATACGCGCGGCGGCAGTTTGTTATCTCCAGGATCCTTTCTTCTGCGCCCCAT
+TTAAATAGCTCCGAAATCGGGTTTTTCTTCTGTTCTGGTCTGTACGGTGATCTGTCCGTT
+CAATACAGCGTTAATGTGCGTCCAGGTCACCATCGGGCGACCTTCCCGGTCGGGTATGTA
+CGAGACGCCGCCGCGGTCAAGGATTTCCCTTTGTTTGGATGCCTTCTGATAACCGGTAAA
+CTCAATCAGTTCTGCGTCTGTTAGCAGATCGTTTTCTCTGGTCATGTTGGTCTTTCCTCA
+TCATCCGGTAACCGCATTGTTTAAGCATCCGGATCTCCTTTCTGCGCCAGCAGGTAGCAG
+AGGCGGCGGATTAAAACCTCAATCCGGTTGAGCGGGACGGCCTGCTGTCGAGCTGGTTTA
+CGTGCGAAATCAATCATTCTCACCCTCGTTTGCCTTATCGCCGGCCAGCGGAACGTTTAT
+CACCTTCTGCGCGTTAACTTTTCCACCTCATTCCGGTCTTCGTATGCCCCGGACGGCTAC
+TTCGTGGGCGTCCTGCCTCGGTGGTTCGTTGTTGCTATGGAATAAGTAAAGCATCATTTT
+ACTTCTTAGTCAACTTATACGGAATTAAAGCGTAAAGCAAAGCTGTACAACAAGCATGTT
+CATTTTTGGACTATGTTTAGCAGCTCAATATGTATATGATTAAAAAAACATCAGTAAGAG
+GTGGTTATGGAACGCGATGAGCTGGAAGAAGACCGTGCGACATTCATTGCGGGTGAGATT
+GGCGGCGCAGTGGTCGAATTGATAATCGACGGCGTAGTGATCAGCCGCGATGCAACAGTT
+AAACGTCTGAAGGAGAAGAGGAGGTGAGTCGGGAACGTTATTCACAAAGGTGTATTACGG
+GATGCAGCAGCTATGGTGAGGAAAGGGCAGTAAATACCCGGCGCGGTGGCCGGGTTGGAT
+TCATAAACTAAATTACTGAAGCATTGACGCAGCGTTTAACATCTTCTCATAATAAAAATT
+CATATCTTCTTTACTGTACGCGTTTATAAGGTTATCTGCATGTTTTTCAAGAAGATTTAT
+TTGCTGTTTTGCTGTTTTTTCTTGTGCTGTAGTTTCCGCTGCATAAATAACAAATGAGTC
+AATATTATATTTGTAAATTTCACATGCTTTTGAAATTGTTAAAGCACTCACAGCAGCCTC
+ACCCATTTGTTTTTTAAAATTTTCTGAACGGAAATCTAAAGTTTCAGTCAGATGGTATTT
+GCCGTTCTTAAGCAAGAAATCTGCAACTAAACCTTCGTCATCGCTTATAGGATAGTTAGC
+AACAATCTTGTGCTGATAAAGGTCTTCAGAGTATTTGCTAAAGATTCCGTGCTGCATGAA
+GGTTGACTTTATTTCAAAGAAAACTTTTCTTTTCAGTTGCTTGTGAGATTGTTTCTGTGG
+ATTTACTAACCTATTCATCAAATCAGTAATTTTTGTTTCGTAATTATCATTGCTTTGAAT
+GGTAAACATACCAAAAGAAGATAGTGATAACGATCCCTTAAAAAGGCAGGGAAGAAGTTC
+AACGTCATTTATTTTGTGTGACAAATCAAAAAGTGAGTTTGAAAGATCTTCCAAGTAATT
+TTGTGAAAGACCTTTATCAATTGCTTTAAGCTTTGAAACTGAATTAAGCATGCGTACGTC
+TATGTCGGAGTCGTGGTAAACGATCAAGCCAACGTTAATCGTTTCACCTTTCTCAAGATT
+AGGCGTAACTCTGATTAAGCTGTATTTGAAGGTTTTCAAGAGGTTATCTCCAGTCTTATA
+GCGTTTATTCGCTCAATTCTTTCCTCACTATCCCACCACTTCAGAAAATATTCTTTATGC
+ATTGGTGGCATCCATGCGACAGGCATGGACTCTAGTATATCAGAGATTGTAGCAACTCCA
+ATTTTCTCAATCTTGTCAAGTATTGACAATGCGCACATTCTTAATTCTGGTGTATCGCCG
+ACAAATTGCTTAGCTATAGACCAGTTTGTTGATGTGCTTGAGTCCGTAGGAAGTGTGTGC
+GGGGTGCTACGTGGCCAACCGATAACAAAAGAACTCAAGCTAAAATCGAACGTTTTTACT
+ATGATATGACCGCGCGTATTCTCCATGTAAAGATAATTATTGAGATGGCGATCAATGTTG
+TACACGAATTGGTCAAATGCATAAATTGCCCATAGCTGTTTTTTCAATGACTCAGAGGCG
+TTTGCCAGCAAATTGATCCATTGCGGGCCGTTAAGTCCTGACTTCCATGCAGAAAACTCA
+ATGCGAGAGCCAAATACATACTCGCCATCAGCAATACACTTAAGAACCTTACAAACAGGA
+GTTGCAATACCACACCTTTCAGCCAAATTTGTGCAAAACCACTCTGCAGCAGGTACTTGA
+GTTGGGTTTTGTACAGGAAAAGGAGGTGCAGTTTTCATACTTTTAACCGCATACTCCATC
+TCATCAGTGGCAATGGCAAAACCAGAAAGATGCACAGTACCCAAGTTCGATGGGGTATAT
+TCATTGAACTCTAATTCAAATAAACTTCCTTGTTCCGGGTCCGGTTCGCTATTGTTTGGA
+TCTTGTTCTTCTGTCATCTGCTTTTTACCCCACAAAGAAGACATGTAAACCTCATGAAAT
+TAAATTATCTCTATAATATTCTTAGCTTTTTTCTATTCCGGTCTCTCATGGCGAGCATAG
+CCAAGTTTTCTCCCCATGCTTCATGTTCGTAAGCGGGGCAGTTCTAGTTTGTTAGGCTTC
+GAAATGTGTGGTTGAGCAGAGCCTAACTAGGGTAGTTACTCCACATCGCCCTTAATCCGC
+CGCCCCATATACTTGGCGTACAGTTCATCGAGCTCCTTCAGGCGCAGGGATACGATTCGC
+AACATGTTCTGTTGTTCTTCTTCCGGTAACTGGCGATAGAGCTCAAGCAGGCGCTGTTCG
+TCAGGTTTAAGTCCGTCTTTCTCTCCGACATCCTCACCAAGCAGCCACGGAACTGATACG
+CCAGCAGCATCAGCAATAGCTAATGCGGAGCTTTTGCTAATTCTTCCTGTTTTGAACCAA
+CTGGAAACTGCTTGCTTGCTGACACCAGCTACCCTGGCCATCTCTGTTTTAGAGAAACCC
+TTCTTATTTAACTCTGCCAGCCTGGAGATCAGGCCATTCGTCAGTGTGTTATCGCTCATC
+GCCTCATTGTAAATGATTGCTTTACTTGTAGGTAGGCATGCTATGTTTGACTTGTTGGTA
+AAATGATGCTTTACTGTTGTCATCTAAGGAGGTCCTATGACTGGTATTGAAAAAGCAATT
+CAAAAATTTGGAACAGGGGCTGCTCTTGGAAGAGCGCTTGGATTTTCAAAAATGACAATT
+TCCAACTGGAAAAAGACCGGGATTCCACCCGATCACATTCGTTCAGTTTTCGAACTTACA
+GGTGTTACGCCACATGAGTTACGGCCTGACTTGTATCCAAATCCAACAGATGCATTACCA
+AGCCAAGAGGCATCAGCCAAATAACCATAGAGGATATTTACCCATGGAGAACGCAATTGC
+ACGAAAGTTAGACCCACCAGAAATCAACCCGATTGAGATAGAGAGTGTCCTGCTCAACCG
+GCTTGCATCAGTAGGGCAGAAATCATACGCCGAGCATATGGGCATCAGCGAGTCGACAGT
+CAGCAGGCGTAAAGCTGAGGGATATTTCTGCAACATGGCGAAAGAGCTGGCTTTTCTTGG
+GATTCAGGCCGCGCCACCGGAAGCGGTACTGGTATCCAGAAACTATCTCACAGCAGTAGA
+GATTCTCGCTGATGCCGGGCTAAAGGCTGAACGAGCCAGGCCGGATGCGCTGGGGTGGGA
+CTGAAAATGGCAGCAACCAAAAAGGCGAAAGCCGCGGTGAGGGGTCACCAACGGCTTTCA
+GGTGGAATTAACTGGATCAATTCACAGGAGTAATTATGGCAAACACTGCCGAAGTAATCA
+ATTTTCCTGTGCCTGACGTGGCACCTAAGGAGCCGCGCGTGGCAGATCTCGATGATGGCT
+ATACGCGCCTGGCAAATGAACTTCTGGATGCCGTGATGTGTTCTGGTTTGCCGGAGACTG
+AGCTGTGCATCCTGATGGCCGTATGGCGCAAAACGTATGGATACAACAAGAAAATGGACT
+GGATCAGCAACGAGCAGCTAGAGGAGATGATTCAGAAGCATCATACCCATTGCTCGACAG
+CAAAAAACAGTCTGATCAGGAAGAAGGTTCTGATTCAGGAAGGCCGCAGGGTTGGTATGA
+ATATCCATATTTCCGAATGGCAAACTAAAAATAACGGATTCTGCAAAACATTAGCCAAAC
+CTGCTAAGAAAACCTTAGCGGAAGTTGCTAACGCACCTAAGCAGAAGTTGCTAACCACAA
+AAGACAAACTAACAAAAGACAATATTAAAAGATCTACGTCCGAGAATTCTGACGAATCCT
+CTGACAATCCAGGAAAGAAACCTCATGTTCTAAAACCAGAAGCGGCGATTCAGAGAGGCA
+ACAAGTGGGGAACTGCTGAAGACCTAACTGCTGCCGAGTGGATGTTTGACCTGATAAAAA
+CCATTTCTCCATCAGCCAGAAAACCTAACCTGGCAGGATGGGCTAACGATATACGCCTGA
+TGCGTGAATGTGACGGACGAACACATCGCGACATGTGCGTGCTGTTTCGCTGGGCGTGCC
+ATGACAGCTTCTGGGCTGGCAATGTCATTAGTCCGGCAAAGCTCCGCGAAAAGTGGACTC
+AACTCGATATCAACCGCAACAAGCAACAGACTGGCACAACTGCCTCTAAGCCAAAACTTG
+ACCTAAATAACACTGACTGGATTTACGGAGTGGAGCTATGAAAAACATTGCTGCGCAGAT
+GGTTAATTTTGACCGTGAGCAGATGCGCCGTATTGCCAACAACATGCCGGAACAGCATGA
+CGATAAGCTGCAAGTTGAGCAGGTTGCTAAGGTCATCAATAACGTGTTTAGTCATCTTAT
+GGCCGCGTTCCCTGCTACCACGGCTAATCGCAGCCAGGCCGAGATGAACGAAATCCGGCG
+CCAGTGGGTTCTGGCTTTCCGTGAGAACGGCATCACCACCATGGAGCAAGTTGCGGCCGG
+AATGCGTGTCGCCCGCCGTCAGGAACGTCCGTTTCTGCCATCGCCGGGACAGTTTGTAGC
+GTGGTGCCGTGAGGGGAGTGGAGCACTCGGGGTCAGTGTTGACGACATCATGGGCGAATA
+CTGGCGCTGGAGAAAGCTGGTTTTCCGTTATCCGACAGGTGAGCAGTTCCCATGGAGAGA
+TAAAAATCCGCTGTATTACCACGTCTGCCTGGAGCTGCGCCGCCGTGGAACTGAGGGGCA
+ATTAAGTGAAATGGAACTTATCCGGGCCGCTGGCGACATCCTGCATGACTGGGAAAAGCG
+AGCTCTTGCAGGTAAACCCATACCGCCTATTCGTCGCGCTTTAGCCGCGCCGTCGCGGGA
+TCGCGGTCTAACGCCAGCCGAGATGCTAATGGCTAAATACAAACAACGCAAAGACGCCGG
+TCTGATTTAACAGGAGCAACCAATTGAGCATTCTCACCATTCTAGATGTCGGTCTTGCCT
+TAATGGGGTGGCTGTTCATCATGTTCAGAGCGGGTCAGTGGTTTATCTCCGTTGCGCTAA
+AGCAATGGGATAAGCGCAGAAAGCAATCTCGTCGGCAAAAAGCAGTAAACGAATTTTACG
+ATGCGTTTGACCTGTCCAGTATCGAACCTGGTACAACGGTTCGCCTAACGACTAAAGGCG
+ATCTGACAATCATGATGTTTCGCCGGGAGGCCGCCCAATGAGCAACATCGACAAACAGGC
+GCGGGAGCAACTGGAAGCCGCAGAACGCAGCATGGCAGAACAAAGCGCGATTGTAGCTGC
+TGCTGAAAAACTGGTCCGTTGCAAAGGTCGTTATCACAGCGAACTGAACTACCGGGCGCT
+TGCAAAACTGTTTGGTGTCATTACGCCGGATTTACCACCACTTGAGCATGAAAACGTTCA
+ATGCGCAGACGCTGCTGAAGGGTTTCGTATCGCGCTGGCATCGTTGGAATCCATGACACC
+AGAAAAGCGGGCGAAACATGACGCCAGTATAGAAGCATTCAAAGAGATGTTGCCGCAACC
+AGCACCGGTAGACAAAGAATTTATCCCTAAAAACCTGGACAAGGCGTTGGGTGTTGTTGG
+TGTTGCGTTACCTGAATCAAAGGAAGAGTTTAATTTCCAGATAGAGCGCTGGATACAGCG
+TCTCATTGATCGGGTTATTCGTTATGCCGATGAATTCAAAGAGCAGCCAGCGCCGGTAGT
+GCCGGATGAGTGCCCGGCTGAGTTATTGGCGTTCTGTGAGCAGGTGATTGATAGCCGTAT
+CACCGCAAACGCAAAAGCTGATGAGCTATGGAACGACTGCCGCGATGCCATGCTTAATGG
+CGATACTTTTCGGGGAAACTCAATTTCGTCAACCAATAATTTTCGGGGAATCGCGGAAAC
+GTCAACCAACTCTCAGGTAATTCCGGATGGCTGGATAAGCTGTAGTGAGCGGATGCCTGA
+GCAAGGTGCTTACATTTCAGCGGTGTCAAGGCATGGTGAATACGTAGCCGGGCAAGTTAT
+TGACGACTGGCTAGATCTGCATGATGGAACATCATTCGGACTTGATGAGGTGTATCTATG
+GATGATGTTGCCTCCACTGCCAGCAGCACCACAAAAGGAGGTTAAGTGATAGGCGTCAAG
+AGCAAGAGGGAGAGGTTAGCATAAACATTAATCAAGGCTCTTATGGGCTTTTTATTCTAT
+TATAAACGGACTTTTTTTGAGGGTGATACCATGAAGCCGAAGAAGCTAAATGCTGAGCAG
+CAATATCAAACAGACCTTGAATTGGTCAAGAAGAAGCCCGCAAATCGTACCGAGGCAAAA
+GCTCATTTGGCAGCGCAGTTACGGATTAGCAAGTACAAGGCGCAGAACTCTTCCAAAATT
+CGCGTTGGCAGTTTCAGGGGAAGAAAGAAGGTGCATTTCAGTAAGGCCGAAGAAGATGCC
+AGGGCGGCACTAAATAAAGCAAATGCCATTAGATTTTCTGAAGGGGAGGTTGAATCCGTT
+GATACAGATCGAATCTCTGAGAGTAATAAACGCTGGCGTGGGAGAACTGCTGACTAATGT
+CTGACTGGAATATTGCAGCACAATCAAAAGACAAGCAGGACAACGAGGCGCTCAGTTTTA
+CCTACGAATACGCGTTTGCCCCGGAAAACCGCTACAAATACTAACCCGTTGCGGCGGGTT
+GGCGGGAGGGTAGATTATAATTAAAGCCCACCCAGATGGGCTTTTTAGCAAGGTTTATCC
+GAGAGCGCCGTAAAACCCCGTTCTTTTAGGTCGGGGATATAAGGCGTGCGTGCCCTTGAT
+CTTCTAACTAACCAAGAATTCCCTTCTTTTAGGGAGGGGAGTGTCAATCAGGAATGTGTA
+TTATAAATCCACTTATGTCCCAGGTATCCATCGGGACGTGATACCCTAATTCTTTCAAGC
+GATTAAATGTTGGCTGGAAAACGGATAGATAATCATCTTCGTTTAGACCCTCAAGATCTA
+AATCGTCGAGCTCGACACTGAAACTAGAGTGTCCTAGCTTTATTTTTTTACTTATCTCGG
+CGAATGTTCTCTTAAAAATGATTCTGGAAACTTCTTCTTTTGCTTTTTGTATGATAGCGA
+CGGCCTCTTTGGCTGAAATCTGTTTATCAGCAGGGATTTCTCCTACAAAACTACCTTCTA
+ATCTTTGAACAATCTCTGCGTTCATTGATCGGCCATTTCCCTTAGCGGCAACTTCAATTT
+TCTCTTTTAATTCAATTGGAAGTCTAATACGCAACTGCGGATCTTCTCTGCTCATTTTTC
+ACGAACACCTTAGAAAGTTCACAATATGTAAATTATGCCCCACCGTGGGGTTGACAGCAA
+TGACGCACGGTGTGACAATCAAATTGCCCCACCGTGAGGCAATTTAAGGGGGTGGAGATG
+GAAAAAGCAAAAGACATGTATCAACGCAAGGTTCGTTTTCCAGAGGATGTAAGGAAGGCG
+ATTGAAAGAAATGGGGAAGAAGAGTGTCGGCAGTTCAACACGGAACTTATTTATCAATTG
+AGGAAAGTGTACGGACTGGTTAGAGAGAAGAATGCTAGGACATAAAAATGGCGAAGCCCA
+GCAGTGCGCTAACACTAACCGGGCCTCTATCGAAGATAACCGCAAAGGAAATATCGACAT
+GCCTAATTTAGCAATAAAACCTACTGAATGCACTATCAACGTCCCGTTTTACGGTTCTGA
+GCTTTATGTGGTTAACCATAACGACGAGCCGTACACCCCAATGAAACCGATCGTTGAGGG
+TATGGGCATGGATTGGAAAAGCCAATTCATCAAATTAAAACAGAGATTTAAAACCTGCGT
+GGTGGATATCACCATTCAGCTACCCGGGGATAACCAACGGCGTAGTGTTATCTGCCTCGC
+CTTGCGTAAGTTGTCCGCATGGCTAAACACAATCAGCCCAAACAAGGTTCGTCCAGAAAT
+CTGCGAGCGCGTTATTCGTTATCAGGAAGAGTGTGACGATGTGCTCTATGAATACTGGAC
+TAAGAGGCAGGTAATTAACCCGCGCAAATCGGAAACGAACGTTGACGATCGTACTCCATT
+GCGCGGCCTGGTAAACCGCATCATGGGTAAAACCGGTATTCACTATCAGACCCTTTACAA
+AATGATCCACCGAGAGTTTGGCGTGAATCATATTGATGAATTGACAGGGAAACTGATTGC
+TGAGGCGATGGAATACCTTGCGGGGAAAGTTCTGGAAGGTGAGTTATTACCAAAAGACCA
+AGGCAGATCCACGCTTTCATCCGCAATCCCCAAACATGGGCCTGGTAGGGTACTGCTTAA
+CCTGAATGAAAACGGTCAGGTTAAGGACACTTATCCGTTAACTGAGGATCAGGTAGTCAT
+GTCATTTGATGCATTTGTCAGCTATTTCAGGAAAAAGGGATGGGTAGTGGCCCCAAGGGA
+TGAGGTAGCAAAAGGAATAATGGGGGCAATACAGGTTTTATCGTAGCAAAAAAGAAAAAC
+CGCCAGTTGCTGCTGGCGGCCTATGTCACAAACCCTATCATCACATAAGGAATGTCGAAT
+GACTTGTAAGAATGTAGCAAAGCTCGGATCTGTTGTCACGGATAAAACCATTGATAGCCA
+GTACCTGCTTGAGATGGTAAATCACGCTCGTAAACAGTGCGGTGAAAAAGAAGTCCGCAA
+CAACGACTTTATTGGACGTATTAAGGATGAGCTTGAAGGTGAGCACTACGAAATTTTCGT
+AGTTCAAAAAGCAAACAAAACAACCTCTGAAAAAATTGTTATGTCAATTAAGCAAGCCCT
+TCGAGTGGCCGCTCGTGAATCAAAAGCGGTGCGTCGCTCCCTGGTCGATAAACTGGAAGA
+CATGCAATCCATCCAGATTCCTGCGCAAAGTAATTCCGGTCTTTCTGAATACCGTCTTGC
+AAAGGCCGAACAGTTGAAAGCGCTGGCGCTGGAGAAAAATATCGTATCCGCTCGTAAGTT
+GATGGTGATGCTGCCCCGTCTTGACCCTATGTCCCACCAGACGCTGGCGGCTTCGCTGAT
+TAATCCGATTATCGGTTATGACGCGATCCCCTTACCAGTGATTGAAGAGCATTACTACAC
+CGCAGCGGAAGTGGGTGAGAAAATCGGTGTCAGCGCCAATAAAATCGGTCGCATCGCTAA
+CGCAAACAACCTTAAAACTGAGCAGTACGGCAAGTTCTTCCTGGATAAATCCGCGTACTC
+CAGTAAGCAGGTCGAGGCGTTCCGCTACAACACAGAAGGGATCGAGGCGCTCCGCCATTT
+GATTCAAGGTGTTGATGTGGCATAAGAATCACAACTCAGAAAGTCTAACCCGCCCATTGC
+TGGGAATTCCTCGGCAATGGGCGGGTTTTCCGCTTAAAATCTGATATGAAACAACATGCT
+AGCTTTTGCAAAAAGTGCTATTCACCTCTTGAATATTCTTTCTAACATGTATACTGTGTT
+TATATACAGTAGTTAAATGTAGAGGGAATTATGAGAATTGAGCTTGTTATCAGCCGGACA
+AAACAGCTTCCGGAAGGTGCCGTTCCTGCACTTGAAAAAGAATTAATTACCCGTCTCCAG
+AATCAGTATGAAAACTGCAACTTAACCATCCGTCGAGGCAGTCAGGATGGTCTGAGTATC
+ATCGGCGCCGCTGATGGCGATAAAAAACGTATACAGAGCATTCTGCAGGAAACGTGGGAA
+AGCGCTGACGACTGGTTTTATTAACATTGCGCTTAATGCTGGCGCGCATTTTTCAGAATA
+CCGCAATTTGCGTATCCCTTTGATGCTGCTGCCGACAATTTTTAACCGCGTCTGTACATC
+GCCTGAAGGGAGAACAAAAATTGAGTAATTCAGCTTTGCAAAAGTCAGAAGATAGCTGGT
+ATGACATTGTAAGAAGATCTGATGGCTGCGTGGTGTTTAGCTTTCCATCATCAGGCAGGC
+ATCTTATCTATCGTGTAAATGGCATGGTATCTATGCGTCCTTTGCTGGATGATGAAGAAG
+TTTTTACTCCCAACGGTTTTGTGCATTTTATTCGCCGTCTCGGCTACCGGGTAACACCAC
+CTTCTGATAATATGAAATCAACGGCCTGAACAACCGTTAACCTTCTGCGCCACGGAGAAC
+ACCATGGCGCACGAATTACAACTCATCAAGCAGTCATCTGGAATTCTGATCCCCGCAACG
+CCGGAGACCAGTGATATTCTGCAATCAAAAATCAAACTCGGCGCCGTGCTGGTGGCTGAG
+TTCCGTCAGGTGAGGAATCCTGCATTCCATCGCCGCTTTTTCGCGTTGCTTAATCTTGGG
+TTTGAATACTGGGAACCCACCGGCGGCGCCATTTCTGCCAATGAGCGCAAACTGGTAAAC
+GGTTATGCAAAGTTTCTCGCTGCATATGGCGGGAATGAAAGCGCATTACTGGATGCGGCT
+GAACAGTATCTGGAACAGATTGCAAACCGCCGGGTAACAAACGGGATTAGCCTGTGTAAA
+TCATTCGATGCCTACCGCGCATGGGTGACGGTTGAGGCTGGTCACTATGACGCCATCCAG
+TTACCGGACGGCACCCTTCGCAAACATCCCCGCAGCATCGCTTTTTCCAGTATGGATGAG
+GTCGAATTTCAGCAGGTGTATAAATCTGCGCTTGATGTTCTCTGGCGCTGGATTTTATCA
+CGTACATTCCGTACTCAGCGCGAGGCCGAGAACGCTGCCGCCCAGCTCATGAGCTTTGCG
+GGGTGATGGCGATGAAATACTCCTGGTTCCATCATCACGACTGCACAACCGAGCAGGCCG
+ACACGCTGATATCGGATTATCAGAAGCGGGGCGTAAGGACAGAAAAGAGCCTGAACCCTG
+ACTTCATTACCTGGACTGTCAGCGCGAAATTACCTGAATATGCACACCGGGAGCGGACGC
+CAAAATCCTTACGCCAAAAGGTCTGGGGGTGAACATGGCTATTTATCGCAGTAAAAAGTG
+GCTTGCTGGTGGTGCCAGTTTGACTGCTCCCCGGCCTGAAGGCCGGGGTTTCCCGGAGGT
+ATTCTGATGAAGCCTGAAGTTATTGAGTCCCTTCGGTGGCGTACCGAATCCTTCACAATT
+ACATCCGTATTCAGCAAAATGTAGGGGAAAATAAGTGAAAAATTTATCCTGGATACGCCA
+GCAACTGATCACGGCGACGGCAGATCTAAGCGGTGCAACAAAAGGGCAGCTTATGGCCTG
+GCTGGAGAACGCACAATTTGACACGAAAACCTATCCCCGAAAAAAACAGCGCATCCGTGA
+TGAAGTGACCGGGAAAATAATAACGCTGAATAACCCTCCGATTCCGGGTAAGCAATCACT
+GGCGAAAGGAAGCGCAATTCCGCTTGTGCAGCCGGTAGAATACGCCACTTCCTCATGGCG
+TCGGGCGCTTTTGTCACTTGATGAACACTACAAGGCCTGGCTGCTGTGGAACTACAGTGC
+AAACACTTGCTGGGAGCATCAGGTTGATATAACCCGCTGGGGCTGGAGTGCGTTTGCGGC
+GCAACTCGACGGAAAGAAGATGGCCGGTAAAACACAGGAACGACTCCGGGCGTTAATCTG
+GCTGGCGGCACAGGATGTCAAATCTGAATTAGCCGGGCGTGAGGTTTATCAATATAAAGA
+GTTAGCGGGACTGGTAGGCGTTAGCGAAAAGAACTGGTCAGAAACCTTCACCAGACACTG
+GCTGACCATGCGTGCGGTATTTCTGCGTCTTGATCAGGCGTCTCTTTTGAGTGTATCGAA
+GACGCGATCGGAGCAGGTCGCATTCAATCAATACGCACTTAATTGACACAAACAGGCATC
+CGGGGCTATATTCCCGGAACGCCAGCAAAATCTGGCGTCGGGATTGGCGTCCCGGATGTT
+AAGAGGCGACACCAGACGCGCCAGCGTCTTTTTTATTGTCGTTTGCACAGTCACATCTTC
+GCATTATGGTGGGCTGTGTGGGGGCGGAGAAATCCGCGCCGGTTCCTCTTACCCGGTTAC
+GCCAACCCTGCACAGTTCACCACCCATCGATTGGCGTCGTTGGTGGTGATTATCTCAGTT
+AAGAGGGAATTACCATGACAACTCAAATTTCTGCCGAAACTCTTGCTCCGATTACCCATC
+ACCAAATCCCCGTCATTACCACTGAGCTGTTGGCGCAACTTTATGGAACTGAAACAAACA
+ATATCAAAGTAAATTTCAGTCGAAATTCAGATCGTTTTGTATGCGGGAAACATTACTTCA
+AGATTGAAGGAGATGAACTTCGCGCTATGAAGCACGAGGTTACTCAAAGTAACTCTGTGA
+AAATTGCCCGTAATGTTCGATCCCTCATTCTCTGGACAGAACGCGGCGCAGCCCGCCACG
+CGAAGATGCTCGAAACCGATCAGGCTTGGGAGGTATTCGAGAAACTGGAGGATTACTATT
+TCAGCCGGAAGCAACCTGTTCCAGCACGTCAGTCCCATCCCGCGATTCCATTTCCAAAAG
+AACGGCGTTTCATTGTAACAGTGTTCCCTGACGGAACTGCTGATACCCAACCTTTGCCTG
+ACGACGTATTTGTCGGCAAAATATCGAGCATATTAAGTGATCTTCGCCAGATGGGGTGGA
+TAGTGATTAAGCGTGACCGGCTGGTTGAAACGCTCGCGACATGGTGACTGCAAAACTGGA
+TTAAAACGGCTATATTTCGTGTAAATCTGATATTGTTGTTATAGTTTCAATCGTCGACCA
+AACAAATTCAAGCCTCGCCAACGTGCGGGGCTTTTGCGTTTTAGGGGGCTCTCATTCGCG
+GGCCTTTTCTATTCAACAGGCTTTGAATTGTGGCTTCTTGTGCACGTCGCCACAAGAGCC
+TGAATCGTATTGCCGCCAGTTGCGCATAACGTTCTGGAATCATACTCACGTGACCAGTGG
+CATAACCAATTTTCCAGGTCATCCACTGAGTAATCTTTACGGGCCAAACCCTCTGCGATG
+GTTACGACCTCATCACTCGGTGCTGTAAGCTCATATCCGTTCAGCAACAGGAATACGTAA
+CCTGCCATCATAGCGGTGCGTTTGTTTGCGTTTGCGAATGGATGATTCTGGATCAGGCTT
+TCAATTAGAACAGCAGACAGACGAAACATATCGTCTGTCTGCTCATAATATCGAATGGTA
+CTTGGCCGGGACTGGGAAGAACTGAGGTTGTTCGGATTCAGTACGCCTATCGGTTCATTG
+GGCGTCTGAATCTCAATCAGAGACCTGTTGATGTAAACGATATCTTCAATGGAAAGATAA
+TTGACTCCTTCAACATACTCTATCGTCATCCGTTTTTACTCAGACCTTTGAAAGTTCTTC
+CATCGCCTTCTCGTAACGAGCAAACCCAAACTCAAAGGCGTTTTTAACTTGAGCAGTATG
+TGAACATGCTTTGCTGATCGCTGCACGAGGTTTCGCCACCGTGGATTTGTCACGAGGCGG
+AATGTACAAGCGATCTGCCTTTTTTAATGCGTGACCCATGATTATCACCCTCATGCACGT
+TTGGCAGTGCTTTCTCAAATTGTAAATTTTAGGATGTAAACACATCCAAAGAATTTATGA
+CTACTTTAAGTGGTTGAGGACAATTTAATACCATTCGTCATATTTGAGCAATGGGCCTAT
+GTCTGAAGATAGAAGCAAGTTCGACGAAAATTGCATTGGACACTTTGCAAGTTAACGACA
+TTTTCGCAGAACTACCCCTCATGTAATAGTAAACTATTGTCACGTTCTCAGGAGATAGTC
+TGAGCCTATGACTCGACTAGAGTGAACACAATGCCGATAAATAGCACTTTTTGCACAAAA
+ATCATGTCCTGGTTGGAATGCACAACGCCCAACATTGCTGTGGTATTACGCCCCCAGTGA
+CTGCTCCCCGCCCTTCAGGGCGGGGAGCAGTCACGGAACATTGTTACAACGAAACGCCGT
+TCTTTTGGAAATGGAATCGCGGGATGGGACTGACGTGCTGGAACAGGTTGTTTCTGGGTG
+AAATAGTAATCCTCCAGTTTCTCGAATACCTCCCATGCCTGACGACGTATTTGTCGGCAA
+AATATCGAGCATATTAAGTGATCTTCGCCAGATGGGGTGGATAGTGATTAAGCGTGACCG
+GCTGGTTGAAATGCTCGCGACATGGTGATTGCAAAACTGGATTAAAACGGCTATATTTCG
+AGTAAATCTGATATCGTCGCCATAGCTTCAATCGTCGACCAAACAAATTCAAGCCTCGCC
+ATCGTGCGGGGCTTTTCTGTTTGTGCCGTCCGGAATAATCCCACTGAGTTTTGTCGTTAA
+TCCACCGGGTGGCCTTCCTGCTTCACACTGAGCCATTCGAGCTATCGAAAGAGAGGTTTT
+GACTGCTCCACGACCTTCAGGGCGGGAAGCAGTCGATTCTTTTTCTTAATTTAAATGAGA
+GGTTGAATATCATGAAGAAGATTTTTTTTGCTTTTGCATTGGTAATGATGGCTGGTGCGA
+GTAATGTCTATGCAACGGTTAATAACTGGTATCTGAAAGACACTACGAAATATGAGAATG
+TTAAAATTACGAATGTTTTTTATGCTCCTTATTTACACTCGCCAAGGATTTGTGCATATT
+TCACTGCATCATCAGGTGGTTCAAATGTTACTGGGTGCGCGGTGGCTGATAATGGCTATT
+ATCAGAAGAATGCAGGACAGACATCACCTTTCATGGAAATTTTTGATACTGTAAAATATT
+TTTATACAACAGGTGAGAAAATATCTGTTTATATAAGAATAAATGCATTTTCGCACTTTG
+ATTCAAGCGTGTCACAAAATGAAATCGTGGCTATCGGGACCTGTAATCAGTGGTGTTTTG
+GAGAGATAATTAAATAATTTTTATAATATACCATAAGGAAATATGATGACAGGTTATTCT
+CGTTTCTTAAGGCTGGGGGTATACCTTATGTTTGCGTATAGCCCTTTTTCATCTGCTGTC
+GATTTTGTTTATCGTGTGGACTCGAGACCTCCGGATGTTATTTTTCGGGATGGCTTTAGT
+TCTCACGGTAATAACAGAAATCTTCAGCAACATATCAGAGGTGACTCCTGTGCCGCCGGT
+AGTCGGGACAGTAACTATATTGCGACCACCTCAGATATTAATGAGACTTATAATATAGCC
+CGAGTATATTATTCTAGGGCAACATTTAGTGGCAGATTGTACAGATACAGAATCCGTGCA
+GACAATAGTTTCTATAGCCTTCCGCCGTCTGTCGCTTATATTGAGTCACGTGGTGTCCAG
+TTTAATCATTTTGAGCGAGTGATGATGCGGTTGCAAAGTGAGTATGTAGCCGTAAATTCT
+ATCCCAATTGAAAATATCCAGGAAGCAGTTGAGCTTGTTTACGACAGAAATACAAGCCAG
+GTAAGAGACGGGCCTGGAACATCAAATTCCCGTTATTTACGAGTGAGTACACAATCAAAT
+CCAGGGGTAATACCCAACTTACCAGTACCACAGGTCAGTACCCGGGAAAGGATTAGTGCA
+TTTGGTACTTTAATCAGTGCTTGTTTTTCAATGAGAGGAGTGCGCAGGGATGATACACGT
+ATTAATTCTAATTACTATGAAATGGAGTTTTACGACGCGCGGGGAGTTTTAACGGAATTA
+TTGAAGTGACTGCTCCCCGCCCTGAAGGCCGAGGTTTCCCGGAGGCATTCTGATGAATAG
+AGAATTTGACAAGTGACTTTCAGGAAAATGTCTCGCACTAGCGGGGCATTTTTACCCGGC
+TTTTCGCGGAAAGCCCCTTCCTTTTAGGTAGGGGATATAAGGCGCTCTCGGATAAATCAG
+CCCGTGAAGCCTGATCCTATTTCCCCTCAATTCTGAGAGGACTCACAGCAATTAAGAGGG
+GGATGAATGTCCGAACCTGTATCCAGTGCGACAGTGTTGGCTGGTGGAGTAATGGGGGCC
+AGTGTATTCGGCCTGGCAACCGGAACCGATTATGGTGTGGTATTCGGCGCTTTTGCCGGC
+GCGGTATTTTATGTCGCCACGGCAACCAACATTGGACGCATCAGGCTGGTCGCTTATTTT
+ATTACATCATTTATTGTGGGAGTGCTTGGCGCCGGGCTGATAGGTACTAAGCTTGCGGCA
+ATAACGCATTATGAAAAACCACTGGATGCTCTTGGCGCAGTGATTATTTCTGCAATGTGT
+ATAAAGTTTCTCACTTTTCTTAACAGTCAGGATCTGAACAGCCTGTTCAGTATTCTTTCT
+CGTATCAGGGGAGGGGGATCAAATGGTAGCAAATGACCCTTCTGCAGTTCTGAATGCCGT
+AATTTGTGGGGTAATAGTAATCGTTCTGATGTTTTACCGACGCGGTGATGCGGCACACCG
+CCCCCTGATTTCGTTACTGGCCTATGTCATGGTGCTGGTATATGCCAGCGTCCCTTTCCG
+GTTTGTTTTTGGTTTATATGAATCATCCCACTGGCTGGTGGTGATGGTGAATATCCTTAT
+CTGCGCCGCTGTGCTGTGGGCTCGCGGTAATGTGGCGCGTCTGGTCGATGCACTGAGGCA
+CTGATGGATCAACAACAATTTCAGCAGGCGGCTGGTATCAGCGCCGGGCTTTCTGCGCGC
+TGGTTTTCGCACATTGATGCGGCAATGAGCGAATTCGGTATTACTGCGCCACTGGATCAG
+GCCATGTTTATTGCACAAACAGGACATGAATCAGCAGGATTTACTGTTCTGAAGGAAAGC
+TTCAATTATTCGGTGGAGGCGCTGAAAAAGACGTTTGGTAAACGCCTTACGCCTTATCAG
+TGCGAAATGCTGGGGCGTATTGATGGTCGCCAGGTTGCCCACCAGCCACAAATAGCCAAT
+CTGGTTTACGGTGGTCGCATGGGGAACAAAGACACCGGAGATGGCTGGAAGTATCGCGGG
+CGTGGGCTTATCCAGATTACCGGGCTGGAGAATTACACCAGATGTGGCGTTGCCCTGAAA
+CTGGATCTGGTGGCGAATCCGGGACAGCTTGAGCTGGATCGTCATGCCGCCCGTTCCGCA
+GCGTGGTTTTTTGTGACTAGAGGGTGTCTGAAATACTCCGGCGACCTGGTACGCGTTACG
+CAGATCATTAACGGAGGGCAGAACGGCATCGGTGACAGGCGAGAGCGCTTTGAAAAAGCA
+AAATCGGTGCTGGTATGAATCTGTTACCTGTATTGCTTAAAAAATTCTGGAAGCCATTAG
+CAGAAATACTGCTGGTGGCTTTTTTGTTATGTGCTGGTGCGTACTGGTGTTATTCACGAG
+GTTATCAGAAGGCGGATACATCCTGGAAATACCAGTGGGCGCAACGAGACCTTACCGATG
+CGACCGCTGCATTGCAGCGTGAAGTAACCGAACGAGCGAAAGAACAGCGTCGCCAGCACG
+CCGCAGATGAAGAACGGAAAAGAGCCGATGAAGAACTGGCAAAAATACAGGCCAACGCTG
+ATGCTGCTGAGCGTGCTCGCGGTGGGCTGCAACAGCAGCTCGCAGCAGTACAACGGCAAC
+TTGCAGGAAGTGAAACCGGCAGGCTTTCCGCTCTTGCCGCAGCAAGCCAGGCAAAAGCCG
+AGACCGGAATACTGCTCGCCCAGTTGCTTGGCGAAGCTGACGATCTGGCGGGAAAGTTCG
+CAAAAGAGGCTGATGAGCGTTATGTCGCCGGAAGCACATGCGAACGTACCTGGGACAAAG
+TGACCGGGCAGAAGTGAAACCTGGTGACTGCTCCCCGGCTTGAAGGCCGAGGTTTCCCGG
+AGGCATTCTGATGAATAGAGATTTTGACAAGTGACTTTCAGGAAAATGCCTCGCACTAGC
+GGGGCATTTTTACGTCTGCAGTAAACGCGCTTCACACGCGCGACTTATGAACACAGAACC
+TTTCAGGATGACCCTTGAGGATGCCGGTTTGGTAATCGGTGCCTTTCTGTGGGCCGGAAT
+CCTGTGTGACAAGGTTCATCACTAAAAGGTAATCACTGATGAATTATCAAACAGTTATTG
+TCAATGGTGTGTCCGTTCGTGTTGATGAGGGGGGACGCTACAACTTAAACGATCTCCATG
+CAGCAGCAGTTGCAAATGGCGAGGCAACTGAATCTCAACGTCCCAGTAATTTTCTGAGGA
+GTGCACAGATTAAACGGTTCATTTCAGCACTAAAAGCCAAAGCTCAAAAAAGAGCTTTGA
+AAGAGATTCAACCACTTAAAGTAATAAAGGGTGGGGTTGATTCTGGTGTGTGGGGTGTTG
+AACTACTGGCAATCAGATATGCAGCATGGATTAAGCCGGAATTTGAAATCGAAGTTTATG
+AAGTTTTCAAAACGGTTGTCCGTCTCGGCGTTGGTGCTATGTCTCGCCTGAACAAAATTG
+ACCACATCATCAACACGGAAACCAAAGCGATAAGCCAGTGCGCAAGTCAAATGGCTAAGT
+GGGGCGTTGGTGGGCGGAAAAGATTGCTTCACGTTGCTCGTGAGCGAGTAGTGAATGAAG
+TGCAAATGTATTTACCCGGCATGGTGTGATTACAGCCGGTTAATCCAGTTTGTGCATTAC
+GACAGTACTGCTGGCCTGTCTGTCACTGTTAGCCAGCTGCGTGCCGAAGCAGAAAAACTT
+GCCACCCGCCTGGACGCCGCAAAGCACACCGCAAATCTTGCCGCTGCCGTCAGAAGCAAA
+ACAGCCGACGCCACCGCCGGAATGCTTGCCGACATGCTCGGAGATATTGCAGCAGAAGCT
+AAACGATATGCTGCAATCGCTGACGAACGTTACACCGCCAGGATAACGTGCGAATGGATA
+CATGGCTCTTTAAGAGAAGAAAAAAATATGTTGAGTCGGGGAAAGTCATATTGATTTTTG
+TTAACATTACTATTTTGGTAGGGTGGTAATTGATATAATGAAGAATTCATTACTACGAGA
+ATTTCATTATGAGAATAAATATTGATTACCTTAAGGGCCTAACTGGACTTTTTTTAGAAT
+CCAATCAGCACTTTTTAACCATATCTGAATTAATTGAATCGGGTTATGACATTACTACCG
+GAGAGGGGGCATTTCATGCACTGCTGCTTGCAGAACAGGGCTATATAAGTAATTTGAAAA
+ATGAAACTGGAACCCCTGAGTCCATCGGTTTGTTTGTCACCAGGAGTGGAGACTTTGATT
+ATACAAATTCAAAGCTTAGATTAACGACTGATGGTATGGAATTTGCATTGTCTCTAGATA
+AGGACGATGTTTTTGAGCGCTTGAAGAATCTTAGTAATGAACCTATTTCAGTAATAAAAG
+ATGTTGGTGTTGAATTATTGAAAGGATATGCAAAAAAGAAATTTGGTTTGAGTGTTTAAA
+TTTAGTTAAATTCCATGGTGATATTTACATTAACTATCCGTCATAATTTAACACTTAATT
+TCTGAATTATGGCAACACGAGGTGTAAATGGCTGAATTAAATTATGAGGCAATTGGGCGT
+TGCAAAGTACTTGGCGAAAGTATCAGACGACTTGATATAGACCGCAACAAGTACATCCAA
+GAGTTACGCGCTGAAGTATCTAGATTAAGCAAAGGTAACTCGAATGCTACTCCACCAGTG
+ATAGTTATCTTTGATATAAATCTGATTAATACATTATCGGAGAGAATTGCCATTGCTGAT
+AGTGATCTTATGTCAGCTGTTACAGAGTTTAACAACTGGTGCCAGGATGCAGGAGAGAAA
+CCTGTAGTTCTTAAAGAACCTTTCCGTACATAACTGCTAGATTATCACTACCACTTATTT
+ACATAGCCTCGCATATGCGAGGCTTTTTTATGTGCAGAACACGAGCACCACCATGGATTT
+TTGTAAGGATGAACCATGCCAGCACTAATTCCTCGAGCCTGTCGTAAGCGCGGCTGTCAC
+AGTACAACAACAGATCCATCCGGATATTGTGAAGGCCATAAAAGTGAAAGCTGGAAGCAA
+TACAAGCCAGGCCAGTCCCGACATCAGCGCGGCTACGGTTCGAAGTGGGACATTATCCGT
+GCGCGTATCCTGAAGCGTGATCAATACCTGTGTCAGAACCATCGACGGCAGAAGATAGCT
+AAGAAAGCGACCAGCGTTGATCACATCATTCCAAAAGCTCATGGCGGCACTGATGATGAT
+TCGAATCTGGAATCGTTATGCTGGGAATGCCATCGGGCCAAGACAGCCAGAGAGAGACTG
+AACTGATGGTGTATATCCACTGCACATATTGTGGTTCAAAACTGCATTCAGTCGCAGTCG
+CTAACTGCCCAAAAACATAAGGAGGTCAGTATGTTTATGTTACTGCTCAGCGGTAACCGA
+TATACCCCTGATACCTTCATTTCCGTCAGGCAGGTGTATGGCTCGGTGATGCAGAACGCA
+GGATTATCAGTGGTGGTCAGGTCTCTGCGGGGAGAGGCCGTCAGCAGAGGGCTTATGCTT
+AACGTGCCCGTCAGGATTGTCGGTGGAGCGGTCCTGAGTGGTGGGGACACACTGGTTAAA
+CCGGTGAAAAGTCTCCACGGTTTTCTTTTAGTGACAAAAGAGGTGTGAGTTGACGAATAC
+AGTTAATCCCCTGACAGTACTGGACATCAGAACGCTGGTCGGATTTAAACAGATAACGCC
+TGGTGAGATTACCGGGGAGCCGGTGGAGGCCCTGAAACGGTGCGGCATTACTGCTTTCAG
+GGACATTGTGCCAGGAAAGTCGGTTATCCGGACAGGCAGTATGATGGTGCAGGGCAATAC
+ATTTTATGGCCTGCAGGCGCAGACAGAGAAAAACATGTCTGCAGCAACATTCACGCTGGA
+ACTGCTCCCCCGAATGCTGGATCTGAAGGTGCAGGCCATACAGGTTGGTTTCCGCATGAG
+TCAGAAGCCGGTAGTACTCTCGCAGGTGAACACTACTATGTTATCGATACCAAGAAATGG
+GACTGCGCCCACAAGGGTGAATAGTGTCAGAACAGCAACGGAGGAAACCAGCGCGTACTA
+TGAGCTGGTAATAAGCACGGACAGTCAGGGGGTAAATGCAACTGTACAGGTGTATGTCAG
+CCGCCAGCCTGTGGAAAACCTTACTTTGACAATGGCTGGCAGTCACGGTGAATACCCTCT
+TGCACTGACGGTCGGGTCAGTATTCAGCCCGGTGAAAGAGGATGGTTTCAGCTTTATGGT
+CGGAGATATTTATATTGCTCAACTGGATTATAACAGCGACCACACGGTAACGCCGCATCT
+GCTGGGTAATCTTACGCTGGAGCCATTTAAAGTAGCCTCTTACGAGGGGGACCGGCACAG
+CAACACTCACGGTGAGGATATTGTCACTGCACTGAACACGCTGGACCCGAATAATGATAT
+GGGGGTGCTGGCGGTGAAGCCGGTGGCGCAACCGGCCAGCGTGACGTTTGAGCTGCCGGA
+CAGTACAGGGAAGGCGATACTGGGCGTGGCGCTGAATGTAGTTTATCGGGACTCTATAGC
+GCCGGAAAACCGGCTGCGTTATCAGATAACCGAAGGCACAACACAGCTGCCGGTGGAGAT
+TATCACCGAGCGAAGGGCGGATGTGACCGGGTTTACCACATTTAGTAAGTTCATGGCATC
+CCCTGTGGATGGTGGAGAATGGAATGCCGAAAATCTGGCGTTCAGTATGAACCTGTTAAA
+CAATCCTGGCGAGGGGCGTTAAACAGAAAGTTTCCTGCAGGCATCACGAAGTGAAACCCG
+GCTCCGGCAATCATCAAAATGCCTCCGGGAATCCCCGTCCTTCAGGGCGGGGAGCAGTCA
+ATGGGGAAATTACCGGGAAGTGAAATCTGCATGAAAATGGAATACCAGGAAGGAGGTGCT
+GAGTCCCGTCTGAAACTACGTGTGAATAATGAGCAGACTAAATGGAATGTGTCCTAAATA
+TGATTGAAAGCGTTGCATTAAAGATATTAAAACCTTGAGGATATTTAAGTATCAGTACTG
+GATGGATGATAGTGAGATGATGTGAGGTATATTTTCAAAAGAAATTAATAGCTGCTGTAT
+TTTTGATATTAATAATATAAAAGGAAATGAAATATGCCGTTAAGTTTTTCAAGTTTAAGT
+TTAAATACCTTTGATGGGAGCGGGAGCATAGATACATATACGTTGGATATGCTCGACAGT
+ATACGTAATGAAGCCAGACCTGCTGATGGCGGGACTGGGTCGACTGAAATTCAGGTGCAA
+CTATCTGATGTGCTATACCAGGTATGCCATCGGCCCGATAAAGGCTTATTTAACGTGGTT
+CCGTTGTGTGAGCCGGGGCTGGATCGTTTTTCTTGTCAGGTAAGGGAGGGCAATGCAAAA
+AAGCTGGCAAAAGAATTAAACATTTCATGGAAGATTGATTTATGTAATTTTCAGGTTGAA
+TCAGGAAGTTTTGCATGTTCTGAAGAATATTTAACATGTCCGATAACGATGGCTATTCCA
+ACAAACGGTATTTTTGTTAAAGCATCATCACGGTCAGATGTTTGTCACTTATTTGATAAA
+GAGGCATTCTTCAATGTACTGTCCCTGGAGTTAAGACACCCTTTGAGTCAGGAGCCTATC
+CGTAGTGATATGATAGTTAGAAAGAGCGAATGTTATTTTAATACCGAACGTGATTGTTTT
+ACCTTAAGATAGAATCTGATTAAACATTATCAGATGAACATGAACTTTGTACGGACAGGC
+GGAGGCGGCTGTCTTCACAGCTTACGAGTCTGAGGAGTAAGAGACCCGGCAGCGAGAAAT
+CCCCGCCACCTCTGATGTAACAGGTACTTCAATGCACCCGTACTTAACCCGCTGGGCGGG
+TTGGCGGGAGGGTAGATTATAATTAAAGCCCACTCAGATGGCTTTTTAGCAAGGCTTATC
+CGAGAGAGCCGTAAAACCCCGTCCTTTTGGGGCGGGGATATAAGGCGTGCCCTTGATCTT
+CTAACTAACCAAGAATCCCCTTCCTTTAGGGAGGGGAGTGTCAAATTACGCCCAGGCCAG
+TGGCAGGATGGATGACAGAACACCCGGGAAATGTTCTCTGGCATGACGTTGCATATCATA
+CGCCACAATGCTGGTACAGGTAAAGGCATTATGGAGGCCGTGAAAACGGTTGGACCAGTC
+GGTAAGCTTGTCTACGGACGGGAATATTTCCGGAGACAGTTCATACGCTTTCTGCATCAG
+CGCCTCCGCATAGCCTCTCAGGATAGTCGGAGAATCGTGTTCAGTGCCGAAAATAGCGCT
+GGAGGAATAGCGTGCGAATGCGGTACTGAGACAGAACAGGGTTTCCGCCTGTTTCTGTGG
+GGTGGCATCAGTCAGGTGATAAGCATTGAGGATATGCTGGTAGTGTGGCGGGCTGAGTTT
+ACCTTCAGGAAGCAGGGATTCAAAAACAGCGTTCAGACGTGACTGTGAAGGGGCATCAAC
+AAACTTCACGTCGGAATATTTCTGTTTCGTGGCGGCAATAAACTGCTGGTTAAGCTCCCT
+GTGTTCTTCAGAGCTTAGGATGGTATCAATCAGTTGCCCAAAGCGTCGCTGTTGGGCCTG
+CTGATTAAATGCGGTGTGAAACACCGGAAAGTCATGACGGAATAATTCTTCCGGAGAGAT
+TTGCGCGGTGGAGACGTTCTCTCCCCCTCTCAGCAGGTAAAAGCGGTCCCATGCAGTGTC
+AGGTTTGGGGTTTAACATCGTTGACAGTGTGTCAGCGGAGAGCATCATCGCCGTGTCAGA
+AGCTCGGGAGGAGAGCAGCAGGAAATTATCTGCAGCGCTGGTTGTCCAGTCCGGGCTGCC
+GTCATAATCGCCGAACAGCCCATTATTGATGTGTGGAGACACCAACGGGTGAGCAAGATA
+CCGCTCATAAAGTGCCGCGGCTTTCTGGCGGATGTCATCAGTGCAGTCCACGCCTGTCAT
+ACAGTGTACAATCACCTGATTAAAGAATCCGCTGTGAGTGGTCATGGCGGCGCTGTTCCT
+GTCAAACGAATCCAGCAGCACAGGCAGTATGCGCTGCTGATGATATGTGTCAGGAGCTGG
+CAGGGGAACGTCATTATAGGTCTGGCACTGATGGGCAAAAAAACTTTCCTTAACAGGCCT
+GAGCCACTCGCTGATAAGTACACTTTGCGTATAGGGGGGGTGGGCCAGCACGCTTACCAG
+CGAACTTTCAACTGGCCGGATATGTGCCTCTGATAAGCAGCCACTCCGCAATGACTTAAC
+CAGGTCTTCCATTGCCCGGACTTTTTCCTGACTGTATTTATCGGGCAGGCTGTCAATGGT
+CATCAGAATACTTTTACCATCATTGTGTTCATGATTTAAAAATCCATCCACAGCGTTCTC
+AGTCCAAAGGAGTGGCATTTGTATCCAGATATCACCTAAACGAATAAAATCTCCGCCCCC
+TGATTTTGACGGAGGTGATGAATTATCCGGTTCATTTAAAATAACGCCAGAGAGGTTTGC
+TTTGTGATGCATACACGTATTTTTTAATGTTGTATTAATAAAAGAGGGCTGTTGTTGTGT
+AAAAACTGAATACTGTAAAAACGCATTATTCATATCTGAATGACTAAATTTCGTATTGCT
+GCAGATTGCACCACGCAGTGTCGAATAAGTGAACCGGCATTCGTCAAAATGTAAATCAGA
+TATATCAGAATGAGCGAAATTTGAATTTGAAAAGTTGAACCCCTTAAGGATATCGCCGTC
+TCGCTCCATGAAGCTGGAAGGCAATATTTCACTGAATAAAATGTAACGGAAATCTGCGCC
+TGAAAAATCAAGTTCTGTGGTCGAGAGAGTTTCTCCGGCTTTCTGTCGTAAAACTGCATC
+CGTGAGTTTCTTAGCCCATTCGGCAGGTGATGACGGGGAAGACGTAGCCTGAAGTGAGAG
+GGAGGGTGATACTGGTGGTGTTCTGGCTTCAGAAACCGTTGGCCTGTTATTGGCTGATAC
+AGAGACTCCACCGGGGAGTGGGGCCGCACCTGTCACTCTGTAATTATAATCACGTGATTG
+ATTTGCAATATTCTTATGCATGAATGCTGTAGTAATTTTTGAGACATCTTCCGCTGAAAT
+ATTTTTCTTACAGGTGTTATTTGTGTCAGTAATATTTTTAACAGTAATCAATGTTTTGTT
+TAAGGTGTTTTTATCTTTCGGATGAAAGAATTTTTTTATTTTTTGTGGTAACGCGAATTC
+AATCGGTGAGTCCTTTCCTATTTTAAATTTTTCATTTAAAGATATAGGTGTGTTTTTAAC
+GCTGGTTATTTCTGAGGAGAACCGGTTTTTCGTACGCTCATGGATAGTTTTAACTAATTT
+TTTAACCTGGAAGGGAATGGTGGAAAAATTAATTCTGCTTGATGATATATTCATTAAAAT
+CCTTTATCAACATCTGTTATGGAAAAACGCTCTGGCTTTTTAACGCCTTAAAAGTAAGTT
+CCATATGTTGCTATTGCAATAGCGATCACAATTCATCATATTATCTGGCATGTTTCTTTC
+AGAAAGTGTCCATTCTGTCATTATGTTTTGAAATAACCCACCGTGTGGTGGGGGCTGACG
+TATCTGCGGAAAAATACAGGTATAAGGGAGCGGGTCGGGTACCGAAGCCCATGGATGCGC
+AAAAGTGAACCCGCTTCGATGCCCAACCGTTGCCAGGCCAATCCGCTGGCGCCTGATTGA
+CAGCTCCCCGCCCTGAAGGACGGGGATTCCCACTTCAACGAGCCGAACCTAAGCCGCTTT
+GAGCGATTCAGGATTTACAGGCTCTCCGTGGGCTAACACTGCCAGCCCGGCAGCTTTGAT
+ACTACGTGCCGCGTTAACGTCCCTGTCGTGGTCAGTTCCGCACTCAGGGCACTGCCATTT
+ACGAACATCAAGAGGCATTTTTTTCATGGTGAAACCGCAACAGCTACAGCGTTTTGAGGA
+CGGGAAAAACTGGTCAATGGCGACTACTGACCGCCCGGCCCATTCGCCTTTGTACTGGAG
+CTGGCGCACAAGTTCGCCCCAGCTCGCGTCTGCTATCGCTTTGGACAGCGACGGGTTGCG
+GAGCATGTTCTTCACTTTCAGGGATTCGACGCAAACAACTTGGTTATCGTTAATCAGTTT
+GCGGGATGCCTTGTGCAGGGCATCCAGTCGGCAATCAGCAATTTTCGCGTGGAGTCGGGC
+CACCTTTAAGCGGGCTTTGGCGCGGTTCTTTGAGCCTTTGGCCTTTTTGCTTAACCGGCG
+CTGGAGTAGTGCCAGGCGAGCCGCGTATTTAGCGGTATGGCGGGGATTGCCGGACCTGAA
+TCCGGTATCGGTGACGAACAAATCTTTTAAACCAACATCAATGCCGACCATTGAAGAGGT
+GATCGGCAGTGATGCGGGTTCAAATTCGCAAAGGCACGAAACAAAGTACCGCCCTGCGGC
+ATCTTTGGAAATGGTGACGGTAGACGGCACGGACGGCAGCGGACGACTCCAGCGCACGTC
+TAAGGGGATTTTGCTCTTTGCCATGTACAGCTTGCCGTCGCGGTATTTAAACGCGCTCGC
+AGTGAACTCAGCCGCCTGCCTGTGCCGTTTGCTTTTGAATGTCGGATATGCAGCCCGTCC
+GGCGAAGAAGTTAGCAAAGGCGGTTTGTTGGTGGCGCAAAGACTGCTGGAGGGGAACGCA
+GGAAACGTCGTTAAGCCAGGCAAATTCCGGCTCCTTTTTCAGCGCCGTAAGGCGAGCGTT
+GGCCTGTAGGTAACCGATCTTTTCCTTTCGCTCGTAGTACGCATCGGTACGCCAGCGGAG
+GATGGAGTTGTAGACGAAACGCACACAACCGAACGTCTGAGCTAAAAGCTCAGCCTGCTC
+AGTCGTGGGGTAAAACCGGTATTTATATGCGCGTTTCATAGCCTCACATATTAAAGAGGA
+AAATGTGATTATGCAAAAGACAGTTAGCCGGAAAACCGCCTCCTTTCCTCCCCGGCCTGA
+AGGCCGGGGTTTCCCGGAGGCATTCTGATGACTGAAAATACTCTGCTCCGGGACGAGCTT
+TCGTGATGTTGAAAAAATACCACTCCCTCCTTTCAAAAAGCGTATCAGCTTGATAATACG
+TTTGAGAGCGAGTGCTTAGCTAACCCGGAGATTCACTATGCAGTTTTCAACGACCCCAAC
+GCTGGAAGGACAAAGCATCGTGGAGTACTGCGGTGTGGTGACGGGCGAAGCCATTTTAGG
+TGCCAATATTATTGGTGCCTGGTCTGACGCCCGGCGAGTGGCGCTTTATCCCTGCATCCA
+TATAGTCGATTGCCTTTTGGAGTTCTTCAATCAAAGTAATGGCTTTCGTCCGTGAGATAC
+ACATAAACTGGTCAAGGAACTCTTGCAACGTCAGTAGCATTCCTGAACTGACAGATTTTG
+AAGTGAGCTATTCACTTCTCACGAACGAGGTCTATCTGTCCACCTCATTTACAGACAACA
+TGGCCTGTATACCAAACTGGCCGTTGGAATCTGTACTGGTCATATGGTTATCTGATACTG
+TTTTTTTTGTACAGTTCATTATTCGGTGGTTGTGTAAGTGTAGTCAAGTGGATATGCCTG
+ACTGGAAAGAATATTGTTTGTTTGATAGGAGCTAACTTTTTGTTTTTGCTGAATGTTTGA
+AATAAAGTAGTATTCTTTCTATTTATTATAACCACATGATAATAAATAAATTTTTTCCGG
+TCTTGAAAACCGGCGACCCGAAAGGGTTCCAGAGTTCGAATCTCTGCGCTTCCGCCAGAT
+TAAACAAGGGGTTACCGAAAGGTAACCCCTTTGTTTTTGGGCTGTTAGAATACACTTAGA
+ATATTCACTTAGAATATTTTCCCTTGTTCCTTTAACGGCAGACAAAAAAATCCCGCCGAA
+GCGGGAGAATTTCAGGCCTGGATGAGACGCTTAAACAGCAACTGTTTGATGTCCTGACGG
+TGCGACAAAATCGCATGTGCTGTTACTGTCGAGCCATCCACCGAATACAAAACACGATAC
+CCGCCTGCGGTATTGCATTCCCGGTATTTTGCCACCCCGAGTTTCATCAGTTCCGGGCAA
+ATCTGACAACCGAGCGGAAACTGGCCTACCTGTTTCTCAAATTGTTCGAGAATTTCTGAA
+ACCACAGGTTTAGCTTCTACCTCATGCCGGTGGAGAAAACTTGCGATATCGTCGACGCAG
+GTTTTGACGGTGTGTGTGTATTCGATTTTGACTTTTTCCATTACTGGATCCTTATATCAA
+TTTCTCTCATATAAGCCCGTCCAGTAACTGCTCCTTTGAATATACGTTGCCATTGGTTTT
+GTCCTGCTCTGACAGGGTAAGAAGTTTCAGAAGAGCAATGGCGTTTTCCCGCTCCTGTTG
+CTGAGCATATGACTCAATAACATACGCGGGTACACCATTTTGAGTTACCAGTATTGGCTC
+TGACAATTCGAGAGAAGCAGCATTCTTCTTGACGAAGCTGATCGTTTCTACTCGCATTAG
+GCGTAACCTCGCTTTAAATAAAATCCTCAGGATTGTTGATTCGGCCTAAATATAGACCAT
+ATTTAGGCCTTTGACAACTATGCGAACTGGCTGATAGCCGGGATATCAAGGGAAGGGGTT
+ACTTTAACCTTACGATCGTAAACCAGTACCTGGCTCTCGGTTTTGTGGCCGGAGAATAGC
+TGCTTATCGCGACTCGATCCTTTATAGTCAGAAATCGCCTTTGCTTTGATGTCGTGGAAT
+GTACATCCGAACGGTGTTCCGGCTTTTTGCTCTGCGGCTTTTTTTGCTTTGTCCCACCAC
+TTATTAAGTGTCCTGCCCGTCACCTTTTCGCCGTTAGCGTTGGTGATAACATATTTTCCA
+TTTTCGCCCATAGTATTTCTCGCGAGTTGAAATGCGGAACGAAGGCGAGGAGACTGCTCC
+TTAATTTGTTTCTTCCCGGTTTTTGTTCTGCTCAATAAACAAATCAGCATCCATCACATC
+ACCCGAGACCTTCTCCAGAACGTCCCCTGGCGGGCGGCGCACAAATACGAAACTTCCATC
+GCAACGCGTAATGTAGGTGTGGTTTCTTCATAAATCGCCGCATAATGCTCATCACTGATG
+TAGACGGTACGTGGTTTCGAGATAAATTTACGTCCCCTTTTTCAGGGGTTCCCCTTCACA
+TATCCACGTGCAAATCCCCATCCGTAAACACGGCTAAGGCTCGCGAGCTGTGTCTTACTT
+TTCAGCCTTCTCTTGCCCATAAAAATTCTGATGTGTTCTGTTTTTACCGTGTCTGCACGC
+ATTTTCCCAAAAACAGCCAGCAGATTACGCTGGGGCTGGTGATACTCTTTTTGAATTCGT
+GGTGCTGGCTCGGTACTGGCATTTTATCGGGGATATTACCGGGGGGCGAAATCTGCATGA
+AAATGGAATACCAGGAAGGAGATCAGGAACTCCATCTGTGAACACGGCTCAATAATGAGC
+AGACTAAATGGAATATGTCCTAAATTTGATTGAAAGCGTTGCATTAAAGATATTAAAACC
+TTGAGGATATTTAAGGATCAGTACTGGATGGATGATAGTGAGATGATGTGAGGTATATTT
+TCAAAAGAAATTAATAGCTGCTGTATTTTTTATATTAATAATATAAAAGGAAATGAAATA
+TGCCGTTAAGTTTTTCAAGTTTAAGTTTAAATACCTTTGATGGGAGCGGGAGCATAGATA
+CATATACGTTGGATATGCTCGACAGTATACGTAATGAAGCCAGACCTGCTGATGGCGGGA
+CTGGGTCGACTGAAATTCAGGTGCAACTATCTGATGTGCTATACCAGGTATGCCATCGGC
+CCGATAAAGGCTTATTTAACGTGGTTCCGTTGTGTGAGCCGGGGCTGGATCGTTTTTCTT
+GTCAGGTAAGGGAGGGCAATGCAAAAAAGCTGGCAAAAGAATTAAACATTTCATGGAAGA
+TTGATTTATGTAATTTTCAGGTTGAATCAGGAAGTTTTGCATGTTCTGAAGAATATTTAA
+CATGTCCGATAACGATGGCTATTCCAACAAACGGTATTTTTGTTAAAGCATCATCACGGT
+CAGATGTTTGTCACTTATTTGATAAAGAGGCATTCTTCAATGTACTGTCCCTGGAGTTAA
+GACACCCTTTGAGTCAGGAGCCTATCCGTAGTGATATGATAGTTAGAAAGAGCGAATGTT
+ATTTTAATACCGAACGTGATTGTTTTACCTTAAGATAGAATCTGATTAAACATTATCAGA
+TGAACATGAACTTTGTACGGACAGGCGGAGGCGGCTGTCTTCACGGCTTACGAGTCTGAG
+GAGTAAGAGGCCCGGCAGCCAGAAATCTCCGTCACCTTCGATATGTCAGGTATCCTCAAC
+GCACCCACATTCAACCCGCTACGGCAGGTTTTTTAATGTTCGGGAAATACTGGCACGACA
+AGAGGCTGCGATGGAGGCCTGATAACGGACGAGGTTTACAACAATGGCTATTCTACGCAA
+TACGAAAATATTTTGCGTCTGGCCGGAACTGGTGATGGGGAGATATTAATCGGATGGAGT
+GGGGTAACGGTGCGCCAGCTCCCGCCTATCTCTGTGGCCATCGTGATGCCGCTGACGCTG
+AGTGGTCCGAATGGGCAATGCTCTACACCTTACTAAATCCGCCACTGGTTCGTATCCAGT
+AGGGGAGGCGATTGTATGGCTGTCTGATGCCACTCCAGCAGGTTACGCCCTGATGTACGG
+GCAGTCCTTCGATAAATCTGTTTACCCGCCACTAGCGATAGCCTATCCAGCCGGCGTTAT
+TCCGGGCATGTGCGGCTGGACAATCAAAGGTAAACCCGCAAGCAGCCGCGCAATGTTGTC
+ACAGGAAATGAGCGGTAACGAATCGCACAGTCATAGCGCCAGGACGCAGGATACCATAGG
+GAGACTGGTAGACTGTGTTGATACCTCAAGCCCCACCAGGTCGGAAATACCAACATGATG
+CGTTTTGTACGGGCTGGATTTCCGGTACACTGTTGTACTCATATTCACACTTAAAATATT
+CTTATCATTCTTATAAACAATTTATATAAATTGTTTTGCATGTTAGCATTCCATATTGGT
+TTAAATTCACAGGATTTTTTAAGAGGTATGACCACTATAGCAATTGTTACTGCTTATTTT
+GATATAGGCAGAAGCCAATGGACATCTCAAAATGGATTTGCTCCATGCATTGAACGAGAT
+ACTGATGAATATATGGCCTGGTTTTCTAATCTTGCACAACTTGAAAATGATATGGTTATT
+TTTACCTCACCTGACCTCAAACCCAGGATTGAGGAAATCCGGAGAGGAAAACCAACAACG
+ATTGTTACATTAGATTTCAATAAAGAATTTCATCATATCAGGAACCGGATTGCCTCTATA
+CAGTCAGATGTAACGTTCAGGCTTAGAACACCTGTCGAGCAGCGCGGGAATCCAGAGTTC
+CTGTCGGCTGATTACGTTTTACTCTGCAATCTGAAAACATACTTTGTAAATAAAGCTATC
+AGGCAGGGGTTGATCAAAGACGACATGGTTGCCTGGATTGATTTTGGATATTGTAGAGAT
+TCAGATACCACGAATGGAATAAAAACGTGGTCCTGGTCCTTCAATAAGGAAAAAATGCAT
+TTTTTTACGATTAGAAGGGGTCTTAAACTTGAAACACTGGAATCAGTATACAACTGTATG
+TCAGGTAACCGTGTGTATATCATCGGTGGCGTTCTGGTCGGAGCGCTGGAAAAGTGGCAA
+GAATTTTACAGATTGGTGTGGCATTGCCAAAAAAAGGTGTTGAGAGAAAATATTGTGGAT
+GATGATCAGGGGATATTTCTAATGTGTTATTATTATAGACCTGACATGATAAAGTTAAAC
+TACCTGGGTAAAAACAAGTGGTTTGATTTATTCAGATGTAAGGGAAGGCGAACGATTCGT
+ACTTTTTTTCGCAAGATGAGAATATTATGTCTATACAAATGAATGTGTTAATTTATAAAA
+AGCCAGGCATGTAGATTATGCCGGGCTTTTAAAAACTGAGAGATTTATTTTTTACCCTGT
+ATCTCTAAATGAGACTGGTTTTCATTTGCCGATTTCACTCTGTCATTATTCATTTCACTA
+TTAACAATCTTTTTATTAAGCATATAACCAATGAGACATGAAAGGATAGACTTAATCATT
+AGACCACTTAGCCATCTGTCCTTGCTTCTGAATTGTTCAGCGAATGAACAATCAAATTTG
+TCATTGGTAGATTTATATAGAAAGGTATGTACCATTGCTCCCTGCCTATCATAATCCCAT
+GACCTTTATTGATCATTTGTTGATGACACCAGATGCCAGGTCGGAAATGGCGTAAACCCA
+GCATCGCAGGAACCCGGTAGCAGACTGTAAGGGCAGATAGCACTTCCGGGCATATATCTA
+CTGAAAAATCAACATATATAGAATTGACTCCAGATCAGAATAATGTATTTCTATTCCTCC
+TCCGGTGAAAGTGGTTCCTCCTTAATCTGCACTAAGCGTAATGCCATGCCCGGTTCAAAA
+TGCTGGTAATCCGCTCCGTAGTCAAACCACAGTTCTTCCCCGGCGGAGATGTCGCGTGTG
+GTGAGGTAAAAGGTAATATTCTTTCCGACAAGGACCGCGCTGACGTTCTGTCTTGCTTCT
+GCCTCCGCGGTCCGGCGGCCAAATACCGGGTTGTTAATCAGGCTGAGGAGATTTCCCTGC
+GGCCAGGCAGAAACGATTCGCTCCTGGCTTCGTGTGGCAAAGTAATAATTACTGGCTTCC
+CTGCCGTATTCTTTTTCATATTCATACCGTACCGTTTCGCTTTCCAGCAGGCGGCCGGAG
+TAGGGCCCCAGTACGGTGAAGGCGGGAAGGTCAGTACGCGCGTAAACGGTGCGCCCCCGG
+TAGCCGTCGCTGTCATCAAGAGGAATCGACACGGTCATCATGTCATTCATGCGCGCATCA
+TGGTTACCTTCATTTTGCAGGAACCACTGGACATCCTGATTAATCCGGGCTTTTGTCTCC
+CGGGGGAGCCGGTTAAAAAGGCTCCCCCAGAGAGTGACCTGTAAGGTCTCCTTTCTGCCT
+TCTGCCTGTGCCAGAACCGATACCGTCGGGTCACGCCAGTGCTGCAGAATCGGCAGGTTA
+TTGTTTATCTGATGCGTCCGCCAGGTCACGGCGTCTTCCTCTTTCTTAATCTGTTTTGTC
+GTTGGAACCGGAATATCTTCCCCTGCCACGGGGATGGCGCGCTTATCGCCGCTGCTTGCC
+AGAGATGTATCCGCCCTGACGGTGAGTGACCCCCTTCCACCCGTGGATGTTGAAGGCTGT
+GAACTGTCCTGCGTGACAGTGGTGGTGAATAACGTGCTGCCGTGGGGCATTTTGCTGTCT
+GCCGGTGCCAGAGATTGTCCGGTACGTTCGTTGGATATCCCCTGTGCCTGCGCCCATGTT
+CTCTGGCCGCCAGCCTCGCGTGTCGCCTCCGTCGACAGGTTCCGCCATGTCTGCATCGGG
+GAATCGGTAACAGGGGCATTCCTTTTCTTTGACTGCTGCAGCCGCACTACACCGCGGGGT
+GCCAGTCCGGTGTTTGTCAGAAAGGTTCTGGCACTTCCGACGGATATTCCCTGTGCCTGC
+GCCCATGCTACCCAGCCACCAGCCTCGCGTTTCGCCTCTGGTGTCATGTCCCGCCACGCT
+CGAATCTGTTTACTGGTAATAGAGGTTCCTTTTCCCTCTGGCGGCCGCAGGCGCGCCACG
+CCGCTGGAAGTCAATCCGGTGTTTGTCAGATAGTTCGCTGCACTTATGATATTTATTCCC
+AGTGCCTGCGCCCATGCTTTCCAGCCGCCAGACTCGCGTTTTGCCTCCGGTGTCAGGTCC
+CGCCACGTCTGAATCTGGGTTTTGGTAATAGGGACGTCCCTTTTCCCGGGCGGCTGCAGC
+CGCGCCACACCGCGGTATGTCAGTCCGGTGTTTGTCAGAAAGGTTCTGGCACTTCCGACG
+GATATTCCCTGTCCCTGCGCCCATGCTACCCAGCCACCAGCCTCGCGTTTCGCCTCCGGT
+GTCATGTCCCGCCATGCTCGAATCTGTTTACTGGTAATAGAGGTCCCTCTTACTTCTGGC
+GGTCGCAGGCGTGCCACGCCGCCGGGAGACAATCCAGTGTTTGTTAAAAAGTTCGCTGCA
+CTTCCGACGGATATTCCCTGTGCCTGTGCCCATGCTCTCCAGCCACCCGCCTCGCGTTTC
+GCCTCCGGTGTCAGGTCCCGCCACGTCTGAATCTGGGCGTCGGTAATAGAGGCTCCTCTT
+CCTTCTGGCGGCTGCAGTCGCGCCACACCGCGGAGTGTCAGTCCGGTGTTTGTCAGAAAG
+CTTTTGGCACTTCCGACAGATATTCCCTGTGTGTGCGCCCATGCTCTCCAGCCGCCAGAC
+TCGCGTTTCGCCTCCGGTGTCAGGTCACGCCACGCCCGAAGTTGTTTGTCCGTAATGGAG
+GGGCGCTTCGCCTCAGCCGGCAACAACCGCTCTATGCCGCGCGGAGTCAGTCCGCTGTTT
+GTCAGATAGTTCTCAGCATTCCTGATGGCTATTCCCTGTGCCCGCGCCCATACTTTCCAG
+CTACCAGCCTCACGTTTTGCCTCCGGCGTCAGGTCACGCCACGCCTGAAGTTGTCTGCTT
+GTAATGGAGGAAAACTTCTTCCCGACCGACAATAACCGCGCTACGCCGCGGGGAGTGAGT
+CCGCTGTTTGTCAGATAGTTCCTGCTACTCTCGATGCCTATTCCCTGCGCCCGCGCCCAT
+ACTTTCCAGCTACCAGCCTCACGTTTTGCCTCCGGCGTCAGGTCATTCCACGCCTGAATC
+TGCGCGTTGGTAATGGAAGGGAGCTTTGGGCGCGCTCCAGGCTCTGTTACGGTAGCGGTC
+CTGCTGTCAGAGCTTACTGACAACGGTAGTTCTTCCTGGGAATGTGCTGCATGCCATTCC
+GGGTCGCTCAGAAGGAGTGTGACAGTAGGAAAGTTGCTGCTTTTACCGGCGGCAATTGCG
+CATTGGGTTTCACCTGTGCCGACCATTCGCTCTGCCGTAAAATTTGCCTGCCGTCCCGGG
+GACGCCAGTGCTTTTAGCCTTAAAAAGCGCTTCAACCTGTCCGGTGCCGGTGTGCCTTCC
+TCCGGCTGATAAAAAACGCGAAAGCAGTGTGCAGCCTCATCCTGAGCGGTCAAGGGGAAC
+CAGTCCCGGATATCGTTCCACGCCCGGCTTAAGTGGGTATCTGAGGTGCTGCTGGCTGCT
+GGTGCGTGAAAATGAATGACTGACCCGATACCCCGCATGGTGCCTCCTGCTGATACCCGT
+CTGGTTTAACGTAAACAGGAGAACGCTACCATCGCGCCTTATAATTTTCTTTTAAATAAT
+GTCCATCTGCATGAACGTGCTCCGGTCCTGTCGATTTAAATCGGTCAATTCCGTGAGTGG
+CCGAGTACACAACAGGGGGCGAAAAACTGTGGCTATCTGACTGGGTAAGCCGAGGCAGAA
+CGCTTTCATTGAGCGCTTTAACCGGATATACCGTACAGAAATACTTGCTTTTATCTGTTC
+AGAACACTGAATGAAGTGCGAGAAATTATAGATAATGGTTGTCAGAATATAACTGTTAAC
+GCTTGTATGTATCACTGAACAATATGAAGCCGGAGGAATATCGACAACCCCCTTATTTGG
+CCGGGAACTAAAAAAATACATGGAACTAAAATGAGTCTATTTACAACTGTTTCATAAGGG
+TTCAAAATCAACCGTTGTGCCAGGAATCTTACCTGACAACCTGTATGCCACCCTCAAATT
+GTTGCGTTGAGCCTGCTCCACCAGTGAAATAATCGTGATGAAAAATAGTCCAGGTTGTCA
+CAAAAAAACGGATATATAATAATTAGTCGGTTAAAATCGCAGCGGTCAGTTTAATTGGTG
+ATTAATTAAATAAATATAGTTACCAGTCTTATATACACGTTAATTATTAAAACAATCACT
+CTACGGTAGAGTAATGGTTTAGATTTGTTGTGCTATGAATATCATTATGAAGCGGCATAA
+TGCCTTATGAATAAATAGGCGAACAGTCATTTATCATTATGACGGTTAACTTTCAAGTAA
+CGGGTGGAGCATTATGATTTGTTGTTATCAATCGGTGAGGCAGAAGGGGAGAAAAAGAGA
+TGAAATACCAAAAGCGACTAGCGGGAATGATGGTTATTACCGTCATGATGATGACGGGAT
+GTTCAACGTATAATCCCGTACAACTCCGTCAGCATCAATTAGAAAGAAACTATACTTATT
+ATCTTCTTGATCCTCCGCTGTACGAAGGAGATGTAGTAGAATATAAATGTAAAGACGGAA
+GTCAGGATACAGTGACTATTCAGAAAGTAACGCCGCAGTCATTAATCACCAGTACTGGCC
+AGGTTATTCCACTATCTGATCTGACCTCACTTGAGAGAAAGGATATTTCCAAAGGGAAAA
+CCGCTGCTGCTGTGGGGGCTGGCGTTGGCGTGACGGCGCTGGTTATTGCTGCGATTTTTG
+CTGCCACCCTGTCTGCCGGATTAGCTGCAATGATGGTCCATGGTTAA
+>NC_015761.1|provirus_3084741_3115735
+TCAGAGCCACAATGGTCGCTGACCACCAACAGTCGGGTGCGGCGGTGCCGGGTCGATGGA
+TCCCGGAGTAACAATAAAGCGTTCTATCGTTTCCATTGTCATAAACGTACAACTGCAGTT
+GATATTCTGGCACTGGTGGTAGCGCTCTTTCGTATTTTCGGTTAGATAGCGGCTTGTTCG
+CGCATGTGCGGCATGATGGCACTTCGGACAATGAAACATAACCCACCTCTTATTCTCAAT
+TCGTGAACCAATAATAATCACTAATTCACTTTTTGTGAATACATTTTATTCATCATCCGA
+TTCTGCACTGTACTCCACATCAGAGAGTTTAACCTCAAGCTCTAAGCCCGTCGTGAAGCC
+ACTATTATTCATATTGTGAGTCACCTTACTGATTAACCACGATTGCTCGTCTATGACGCG
+CTTAAAGCCTGACACGCGCACCGGTGTCTCAGGGAATAAATCAGCCCTACCAAGCGCCAG
+CGTAATTGAAAACTCCGCAACGCCTCGCTGCAGCTTATCCCACTTAGCCTGAGCGGCGCG
+CATCGCCTGCGCCTTAGAAGCGTAGACCGTCGTCAGCGCCAGTACGTTATCGGCCTCACC
+GGCCATATACTCACCCTCGCGAGCCTCCGGCTCTTTTCTGGACTTCGTCTTTTTGCTGAC
+CGGCTTTGCTTTCGGGTGTTCCAGTGCGCGAAGGTGCTTCTCTTTTGGCTGGCGTTTCAG
+CGTCACTTTCTGTTTTTGCGGCTTCGGGTCTTTGGTGTGCAACCATTTAGCTGTTACACC
+GGTATAAGCTCCGCGGTCGGCAATGGCAAACTGATGACGGTCGCCGTCACTGCGGGTCAG
+CGTCATTTGTGGAATGGGCTTACCGCTGGCCGTCAGCGCACTACCGGCTTTCAGAAACAG
+TAGTTTTCCCGCTTTAACCGATACAGTCGCTCCGTTTCGGTCAGCCAGCCGGGTAAGAAA
+TACCGCGTCGGATTCCTGCGACTGGTCGATATGTGGTACCGGTATTTGTTTCAGCGAATC
+CGCGACGCTGGCCGTCAGTTTGTTACGCTTTGCGATGGTGCTAACCAGTTCGCCGAGGGT
+GGTGTCGTGCCATGATTCCTCGCGCCGTGAATTGAGCGTGCCGCGAAAGTCTGCACTACG
+CGCCCGGATGGTCAGGGTATCAGGCGCACCCCGGTGCTCAATCTCATCGACCGTAAAATC
+GCCTTTATTCAGAAGCGCCGAACCTTGCCAGCCAAGCCACAGCGTCAGCACCGCCCCGCG
+CATGGGTAATTCGACTTTTCCGTCGGTATCGTCGAGCTCAATGTCGAGCTGGTCAGCCTC
+AAAACCCCGGTTGTCGGTCATGGTGAGAGAAATCAGCCGGTTACTAAAATTGCTGGTAAT
+GTCCTGGCTGTTCAGCGTTAGCATAAATGCCGGTGCAAGACTGGCACCGGCGTCAATGGT
+CATGCCCGTAATCATATGGTCAGCCCTCCGAGCGCACCCTGCAGCTTATCGGTCAGATTA
+CCGGCAGAGCCGAGAAGCTCGCTCGCCTGTTTATTCAGGTCGCCAAACATTGCCGTCAGT
+GATTCATCGACCCGTTTTAGCGAAAGCGTGAAATCAATCTTTCTTGCCGCGCCATCGCTG
+AAAAACTCGGCGTGCGTGGTCGACACCTTATCGATGATATACATCCCGAGGATTTTGCCG
+GTCCCCTCAATCAGCGGCCACGCCCTGCCCTCATCGGCCATCAGTTCCACAGCCAGCAGG
+GATATATGACCGCCGGTAATGGCAGGGTAAAGCGTACCGGCAAGCTGTATTGAGGTTTCC
+CCCTCGCCGAGAAACTGATATGCAGGCGGTTTACCGACCCGGTCATTAGACGCCCAGCGG
+TAATCTTTCGAATGCTGCATTGACTGATAAGGCAGAGTACGGAGTTCAAATACAAACATG
+CCGAGAGCAAGCATCATCGTTTAATTCTCCCTTAGTCGTGGCTCATGCTGGCGCGCTGAC
+GCGCACGCTTTTCGCGCTCAATTTGTTCGAGTGTGTCGCGTAGCTGGCGGTCGAGTTGAT
+GCCCCGGAGCAACACCGCCCGGTAGCGAAATGTTGTATTCGCTTTTGCTCTGGTCGATGT
+AAGAGCGTCCCGCCGGTGCGGTAACGGGCTGATAAGCCTGATACCCGCCATAGGTGCTGG
+TCGCCGGAATGTAGGAATTCCCCTGCGTGGCGGCGTTGGTTTTGGCGGCGGTCTGGTCGA
+GGCTGTCCGATTCTTTGTTGATGATGCCGAGCTTTTCGAGAAGCCAGTCGACACCACTGC
+GTAGCTTGTTGAAAACGTTCAGCGGTGCCATCAGCGCTGAGGCCAACGCCTGACCGAAAA
+TAACGCCAGCATTTTTACAGCTATCGAGCGTCTCCTGCGTAGCTTTGACCGGTGCAATCA
+GGTCTTTAAACCATTGCCAGACTCCGCGCAGCTTCTCACCGAGTCCGTCAAAAATGGGTG
+CCAGTGGTGCAAACATTTCCCCGACCGGAGCAAAAGCACTCATGATGCCCTCAATCACCC
+CCGAGAAAAATGCGCTGATGGGCTCCCAATATTTACGGATAAGTAGCGCCCCGGCCACAA
+TCGCCGTCCCGACGGCCACAATCGGCCAGGTGATTGCACCGAGAGCTGTCACAATGGCAC
+TACCGGCAACAGTCAAGGCGGTACCCATCACGCCAGCGGCGGCAATGATGGCGTTAATCC
+CCATGACAACCGGCCACGCAACGAGACCAATGCCACCGATGATACCAATCAGAGCAAGTG
+CGCCCCCGGCAATAATGCCGATAGTTGTCGCCAGACCTTTGTTTTTCTTGATCCAGTCGT
+CGAGCTTTAACACGTATTGTGTGGCGGTTTTGGTGAGTTTACGCAGCGAGTCCTCTTGCT
+GGTCAAAAAGGTCGGTACCGACGGCCTCATAAGCCGACTGGAACTCTTTAAAGTCGCCGC
+CGAGGTTATCCTGCATAACCTTAACCAGTTCCTCGGTTTTACCGTCCGAGGCTTTAAACG
+CGGCAGTGAGCCGGTCAAGTTTTCCGCTTGAGGCTGCTTCCATCAGTACCGCCGCCGCCG
+AGCTGGCCTCCTCGCCGAAAATGGTTTTCATGTACTCGCCGCGCTGGCTTGTCCCGAGGT
+TGTTTTTCTCAAAGCTGCGCTGCATTTCTTTCAGGATGGAGAATATCGGGCGCGTGTTCC
+CCTTGCTGTCTGACGTTTTGACGCCGAGTTCCTTAATGGCCTCAAACGCTTTTCCGGTGG
+GAGCCTGCAGGCGGCTGAGAATGGCGCGGCTACCCGTACCCGCCATTGACCCGGTGATTT
+TGGCGTCGTGCAGTGCACCGACCATTGCGGCGGTTTGCTCGATGCTTACCCCAGCATTTT
+TCGCCACTGGCGCGGCATAGGTCAGCGCGTCGCTCAGTCCGTCAAAATCGGCGGCGGTTT
+TGTTCATCGTCATCGAGAGAACGTCGCCAATGTGAGCAATCTTGTCGTTTGAAAGTTGAA
+ACGCTGATTTCATCCCGGTCAGCAGCGCAGCGTTTTCCTCCATTGAGCGCCGGTTTGACA
+GCGCCATATTCAGCGTGACTGGCGTCGCCGCCTGAATGGCAGCAGCGTCACCGCCGCTTT
+TCGCAATGATGATTTGCGCGCTCGCTGCGTCATCTGCAGAGGCTGCAGTATTGTCGCCGA
+GCTGGCGAGCCTGTTTGCGTAGCGCCTGCATTTCTGGCGACTGTTTATCAACCCCGAGCA
+CAGCTTGCAGCTCGGAATTTTTCTGTGCAAAGTCATAACCGGGCATTAGTAATTTAACCC
+CGGCCATCGTTCCCGCCGTCGCAATACCGACCCCGGCAGCGCCTGCTGCGGCCATGTTAC
+CGGCAAGCTCTTTACCTGATTTATATCGTTCTTTCACCCGGCTTAATTTCGCCTGCTGCG
+CACTGACGCGCGCCAGTGCATTACGCTGTCGGTTAAGCTGCGCCGTCGTTTCGCTGATGG
+AGGTTTTGAGTCGACGTTCATCGGCAGACAGGGTGCGGGTATTGATACCGGCCTGCATCA
+GCTCGGAACGCTGGCGCTGTACCGATGTTCTCAGGCTGTTATATTTCATCTGCAGCTCAG
+AGGCGGCACGTTTTGCCGCTTCGAGCGCCTGCGCCTGCGCGCGGGTCGGACTGGTGGTGT
+TTTTAAACTGCACAGCCAGCTCACCGGCTTCGCGCTTTGCCTTGTCAAGCGCCTGACCAG
+TCACGGCCAGTTGCGCGCTTGCCTTACGAAAGCCGTCGATTTTCGACGCCTGACCGTTCA
+GGTCGCGCAGACCCTTTTGTGTGTTGCGAATATCACCCGACAGGGTTTTACTCGCGGTCT
+GGATGGATTTAAGCGGTCGGGTCGCCTGGTCGACCGCTTTCAGCAATACCTCAAGCCTCA
+GGTTATTACTCATTGTGGTTTCCGCTACGCTGCAGCGCCTTTTCGCGCCATGTGATGAGC
+TCGGTCAGGCTCAGGGAACAGAGTTCTGATGGCGGCCAGTGGAATATCACTGCGATATCC
+GCCATCAGGTCATCAGTCGACAGGTCTGGCGGGAAGTCTATTCCGCCGAAGCTGGTGACA
+AAAAACCAATCACCTTAGCGGCCAGCGACAACATATCGGGCAGGTTCATCGCGGTAAGCT
+CCTGCGCGGTGAGCGCGGGGTAGGTCATGCGGGGCAGCACCTTAATCAGGGCGTCGACTT
+CGGACTGCGCCACCGCTGCCAGACTGACGCCGCGCAGGGTACCGGCGTTCGGCTCAATCA
+GGGTGACTTTATCAATCGTCTGACCGGCGCGCTTAATCGGTTTGTCCAGGGTCACGACGT
+TCGGGTTTACGGTGTCAGTTTCATTTCCAGCCGTATCAATAAATTCAGCGGTTTTACGTG
+GTGCTTTTGCCATGATGTTTTTCTCTGTTCTGAATGGGGTTAATAACCGGCCAGCAGTGC
+TGACCGGTCAGGGAATTACAGCCCGATTGCGCGGCGGTGCTGCTCCAGACGGTCGACGCC
+GTTCACCTTCTCGACCATGTTGACGGTGTCGATTTCGATGACGTCGCTGCCATCAATCGT
+GAGGCGGTAGTAGGTGCAGACAGTCGACAGTTTGGTCGAGGTGTTTTCACCCTGCTTATT
+CTCACCGCCGTCGATTTCTTTATGACGGCCACGCATGACCACCTCGACCGCCACGATTTC
+GCCGGTGTCGTCGCGCTGGTAAGAACCAGCAAAACGCAGCGGCACAGCATCAGCGCCCGG
+GGCGGCGTACTGCGCCCACAGAGCCACATCAGGCAGGCCGCCGACAGACCATTCGACGGT
+TAATGCATCGTCGTCGAGGCCGAGATCAATCGCTGCCGCGCCATTCATACCGCCGCCGCG
+ATAGTTTTCGAGCTTGCGGGTCAGCTTCGGCAGCGTCACGGATTCAACAACGCCCATGTA
+GCTGAGGCCATCGTTGAACATATTCAGGTATTTGAGTTTACGGGGTAGTGCCATGTTGTT
+TCAGGCTCCTTAGCTGTTGACCGATTCGGCCAGATTCACCAGATATTTATCGGTGATACG
+CTGGCGCAGGGTCAGGCTTTCCAGTGGCGGAACTGGTGTATAGTCGTAGTCGATATACAG
+TTTCCCGGCCTTGAGGGTTTCCTTGTCGTTCGATTCCTCATCGAACCAGCATTTACCCTC
+CACGATGTAGCCGTTTGATTTCAGCTCGCGGAATTTGGCGTTAATGCCGTCAACAATGTC
+ACGAATGAGCGTGGCGGTAATGGGCTTGTCGACCGCCCACATGTGCGCCTCCGCCATCGT
+GTCGGCCAGTACCTGCGCGGTGCGGGTGTAGTTCTCAAACAGAAAAAGCGGGTCATCCGA
+GCAGGTGCGGTTACCCCAGAAGCGGAAACCGTCCTTGCGTACCAGCGTTGTAACCCCGGC
+CTCGTTGAGCAGGTCAGCATCGGTGCCGGATGCCTGCAAATCCCAGAACACTGAGGCGCT
+GATGCCGGTAACGCCCTGTACACCAACGTTAGACAGGGTTTTGTGCCAGCCGACAGTCTG
+GTCGATGTAAGCACGCAGGCCGAGTGCACGCGCAGTGGCGTAAGCCGTTGCGGTGGTATT
+TTTGACGGTGTCCCATGCGAGGAAATCAGGCCAGATAACCATCAGCTCGCGCTGGCTGAA
+ATTTTTACGATATTCCATCGCTTCGGAAATAGTCTTACATCCCCACGCGCTGAGGTAAGC
+AAATGCACGTAACTTAATGGCAGCCGACGCAAGCGCAACCGCGACCTCTTTAGTATCCAG
+CCCCGGCACCCCAAGAATACGTGGCTTGACGCCGGTGACGGCCTGAGCGGTCAGGAGAGC
+CTTGATACCGGTGTATTTACCGTTCTCATCCGTACCTCCGATAATGTTGGAAACAGTCTG
+TGCGAGCGCAGCTTCCTCGTCATCGCCGGTTCCATCCTCAACACGCACAACAACAGTGAC
+GGGTTTTGACTGGTCTGCGATGGCCTGCAGTGATGCAGCCAGCGTGCCTTTTTTACCGGC
+TTTCGCAATGGCACTTTGCACATTGGTAATCAGTACCGGTTCATTGAGGGGAAATAGCGT
+GGCATCTGCATCGCTGGCTGTACAAACCATGCCGACGACCGCAGTCGCTACTGTGGAAAT
+AACACGCGTACCGTCATTAACTTCGATGACCTGCGTGCCGTGGTGAAAATCACTCATCCG
+GTTAACTCCGTGGTTAAGGGGTGAGTATATTTTCAGGTCAGTACACAAGAGGGGGCTATT
+TGTACCGGCTGTCAGGTTGATGGCACAACGACAGGAAAAAGAAAAGGCGGGTAATAAACC
+CACCTGAATATTTAGCGTGGTATATCCGGCCAGTCAGGCGCAGATGTATCCACCCTGTTT
+ACCATTACGCTGTAGAGCTCCCATGCTTCCAGCCGTTTAAACTCTTCATCTGTGGCAATT
+TTTAGTTTTACTGCCCGCGCCAGCGGTGCAATGGCTGATTCAGCCTCAGCAAGGCGGCGA
+ACTTTTTCAGCCTCCGCCTTTTTACGCAGCTCTTCCGGCGAATAAACCCGTTGAACGACT
+TTACCGTCTTTAAACTGCCAGCCGCCTGAAATATCAGCGCGACGGTTTTCATCCGTATCA
+GGTAGCTCCGCCACGCTCTGGCCTGCAGGCCATAAACCGGAAATATCGCGCGTGATACAC
+GTAATAACATCGTTATCGTCGTAGGTAATTTTCAGTGTGTCTTCTGAAAATAATTGCTGG
+CATGCATACCAGTCCTGACCATCCTCTGATTGTAGATGCGCCGCACCGGCGAATAATGTG
+TCGTCTGGTTCCGGTGTATACGGAATGAAATTTTTAATATTTAAAAACTGCTTGTTCTTT
+TTATTTTTTGCCGCTGTCATAATTATTCCTTCTTATACACTTGGGGCTGTCACCCACGTA
+TCACCAACCAGATACTGAATTGGACGGTAATAAACCTTGTCATCACCACCTTCCATTTCC
+CAGCTACCGTCAGTATGGAACCCCGTCACCACCTGTCCGCCGCCAAGCTGAAAATCACGC
+CACAGACCGCCAGAAAGCGCCACGGGGCCAAGTCTGACCGCTTTTACTACATTGTTGTGA
+ATCCATGTACTTAACCAGCCATTTCCCCATAACGAACCAAAGATATCACCGTTATTCTGA
+TAAATAGCGCCACCTATATTTAACGCGTTACAGTAGACGATACCGTTAACAGTAAATGAA
+ATACTTCCGTCCGTATTTCGTTGACTGTATAAATGCCATCCCTGTTCATCGCTCAGCTCA
+ATGACTGTTGGACGTTCTCCACCTCCCCACAGACTTAAACCAGCATTCAGTGCAGAATTG
+TTACCACTCGATAACGTCAGTGTTTTTCCGTTGCCGGTGCGCACGACACCAGTAGCGCGA
+ATATCTGCCAGCATGTGCAGCCCGGAATTGTCGATATAACCGACCTGGGCACTATTGGCA
+TAAATACCCAGAACGCCGTCACTGTGCCACTTAAACCCTGTATCGTTATCGCCGAATACA
+ATCGAATTACCGCCCAGTGCATTGTCAGTACCAATACCCAGTGGGCCGTTAAGCCGCCCC
+CCGGTAATCGGCAATGCACCCACATCACTGGCTGAAGGTTTATTTACGGTGTTGTAGTCA
+ATAACCCACTGGCGGCTGGTATTCGGTTCCGTTCCCCAGTCCTGGCGCTTTGCGTTCGCG
+CCCATATGCGCGTAATAGTGCTGAAACCAGACTTCACCGATTTTCTCAACAAACAGATAT
+CCATAGCTGTACAGCTTGCTGCCATCCGGATAGGTCGGAAAATCAGCGACCGTATCAGAA
+TTCGACACCGCCACCCGCCACCATCCTGGAGTATTAGCTGATGCCATCGTGCCGTTATCG
+GTAATCTGTCCAATGGCATCGGCGGAAATAGCCTTCACATCTGACGCCCACAGGGTGATA
+TCCCCGGATAATGGATGCCCATTGACCTTACGGTCTGACGGGACGCGTCCGTTCGCATTA
+TCCATAGCCGCTTTAACCGCTTTCGGCGTTGCGGCCAGCGTCTCAGACGTGCTGTCAGTG
+GCATTGCTGAGCTGGATAATCCCTTTACGTGCTGTAGTGGCGTCCTGAGCTGTATATTTC
+GCGTTAGCAAGGTCATATGCCACCTTGACCGCTTTCGGTGTCGCGGCAAGCGTCTCAGAC
+ACACTGTTAGTGGCATTGCTGAGTTGCACAATGCCTTTACGCGTTGTGGTGGCGTCCTGA
+GCTGTATATTTCGCATTAGCAAGGTCATACGCTGTCTTGACAGCTTTCGGCGTCGCTGCG
+AGCGTTTCAGACTCGCTGTCTGTCGCGTTACTGAGCTGAGTAAACCCTTTTTCTTTAAGA
+GTGGCATCAGGATGACGACGGGATTTTTCATGTTCGGCGAGCCTGTCGTCGACATAATCC
+TGCGTCGCCATCACCATCGTTGAGTCAATGGAAAGCTCCACAGACTCGACACTGCTGACA
+ATGATGACCATGCGGCATGTCTGCGCACGCCCTGAGCCCTCGGCCAGTTCTGGCTTGTAG
+CTTTCGGCCATATTGGCGACAGCAATCAGCGTCCCTTCATCGTCATAAAGGCCAAGCTCA
+CGCATCCAGAAGCCGCCCACCTCCGGCGGAATAACCAGCTCGGCCACAATGTAATTACTG
+TACCGGTTGTCCTGGCTGATTTTATTCAGAGTGTGACGCCAGACCTCATTAACAAGCTGC
+GTCTGACCGGCATCAGGCACCGGCAGTTTTCCACCGCCGTCACCAACAGCCATAACGTTA
+AGATTTATTTTCTTACCGCCCGGCATGGTGGCCGCAGCAAGCTTAGCGGCTCCGGCAGTG
+GTGATAACGGTTTTAAATTTCGTGCTCATTATTCCTCACTTATCCCGGGTAAACCGTAAT
+AATATCGCCATCGCAGGACACGCCGCCGGTATACAAATAACCGGGAATGTCCCGGACAAT
+ATTCAGGCCAGTCAGATGACGACTGGCTGGTTTTGCATCCGCAATCAGTCGTTCCATTTC
+GAAATACATTTCCTCGGTAATGCCACTTTCAAGCACCCCGATATCAAGCCGGAATGTGCC
+GGGCGGGTCGCTGCTTTCCCACCATTCCGTTACATTGATGACATAGCCGAGAGGCTCCAC
+TACCCGACGGATTGCGCCGATAGTCCCCTTGTGGCAGTGAATGAAATATGCATCATGGAT
+AACGGCACGTTTTGTTCCCTCCGGCCAGTTCTCATCCCACCGGTCGACAGAAAATGCCCA
+CGCCAGCCACGGCAGCAAATTTTCCGGACAGGTGTCAGGGTTCCACAACGAGCGGATGTT
+GACCGGCGTTCTTTCAATCTCAGCACATGCCCTTGCGGCGGCAACCTCCAGTGGCGATGA
+GCCTACCGGCAGCAATCGTGAGTCATTCATCAGAGCCCCCGATTACAAGGCTGTAGTCAG
+TGCAAAAGGACGCCTGTGTGTTATCGAGAACAATATCCGCGACCGGTGCCGCCAGCTCCA
+CCCGCTGAACACCCTCAACATGCAGGGCGGCATAAATCGCTGATTTACGGATATCGCGCC
+CGAGGCGGTGCTGCGCGCTGATATAGGCTTTCAGCTTTGCCTCAGCCGCCGCCCTGATGG
+GTTCACTTTCCGGGCCGGGATAAAGATAAAGCGTGGCGTTAATCTGGTAGTTAACAATTT
+CGGCTGACTGTACCGTCACCCGGTCAGCGACCGGCCTGACATCTTCTGCGTTCAGGGCAT
+TGCGCACAATTGCAAGCAGTTCCTCAGATGCGACGCCGTTGTTTTCACGAGACAGCACGG
+AAATCGTCACACAGGCTGGCGACGGGCTGATAACTGAAATATCGCCGACGCGCCCGTCAG
+CACTACGGCCGTGATACTGGTACGATCCGACAGACCCCGCCACGCTCAGTCCCTCAAAAG
+CCTGCTGTATACGCAGACGATAATCGGCGTCGAGTTCCATTTCTGCCGGAGTGGGTGGAA
+TGGTGGTGTCATCAGCAGGCGTGACGACAAGGCGCTCAACACTGAAATTCGCCCCGATAT
+TATCGAGGTCACTTTCTATGGCATAAGCCAGCATCACTGCGCGTGCAGCTTCATTGACAC
+GCTGACGCCAGATAACCTCGCGGTAGGCGTTTTCCTGCAGCAATTTAACAATTGGCTCAG
+ACTCAAGTGCGAGCGTCCGGGCGACGGCTTCCTGCTGGTTTTCCGGATAGAGCGAAATCA
+GCGTTGCAATGCGCTCCGCAAGGATAGTTTCATAGTCCAGTTCCTCGACCACATCAGGAA
+CAGGTAGCAGACTCAGGTCAACAGTTGCCATAGTGGTTTAACTCAGTGAAACAGTGGTTG
+AAACTGACGCACCGGTATCGGTACGCATCCCGGTAATATCGACATACATTTCGCCAGTGT
+CGCCACGCTCAAAGCTGATTGAGGTAAGCCTGATGCGTGGTTCCCATTTCTGGATCGCGG
+AATAGCACGCCACCATGATTTGCAGCCTGAGCGCCGGGTTTTGCGGCATATCAATCAGCG
+CAGACAGGAGCGAGCCATATTCACGACGCATTACCCGCGAGCCGACCGGCGTCAGCAGAA
+TGTCGCGCATGCTCTGGCTGATATGCTCACTGTCACTGATAGCGAGGCCGGTATTGCGGT
+TCATCCCCAGATAACGCGCCGTCATCTGGTGCCCTCCGTCCAGCTCCCGCCCCGTTGCAC
+GCCGCCGTGACCGTGGTCATCGACCTGTACGCCGTTTGATTTCAACGTGCCACCGGTATG
+TTCGATGTTTCCCCGCATGGTGCCGCCTTTCTGCACCTCAAGCGTCGCCGTCGTCAGTTT
+GTTGGTGCATACCACCTCCGGGGTGTCGAGGGTGATACGTTCTGCCGCTTTTACCAGTAC
+CACCGGCACGGTGGCGGTAATGGACTCCGATGCCGTCACATCGGCAGTCTTGATGCCGCT
+GACCGTCAGTGCACCGGTTTCCGGCTCATACTCCATAACAGCGCCGTCGGGGAACACCAC
+ATGCCACGCATCCGCCGAGGCTGACGGGGCAGGGTTATCGTCGGAGAAAATCCCCGGCAG
+CACGAAAGCAGTATCAAGCTCGCCACCAATTGCCAGCAGCAGCACCTGCTCACCGACCGA
+GGGAGCCCACCATGTCCGCGAACGACCGGCGCGGGTGGTCAGCCAGTTCAGCCATGCAGT
+CTGGATCCCGCCGCTTTGTACGCGGCACAGCCCCTGCGCGGTATCGACCTCAGTCACCAC
+ACCTGAGCGGATGAGGTTGCGAATCGCGCGCGTGAGCTCCTGTATTGTGGATAACGTATT
+CATAGTGCAAGGATGCCTCTGGTCTGGAGTCGCGCCAATTCGCGCGGCTCCGGTGGTGGT
+TCACACAATATTTATTTACCGAGATGCCTGATAATGATGTCTTCAATCATCTGCTCATCG
+TCGCGGGTGAAACCGAGCAACGGGCGCGCCGCGTACTGCACATCCCGGCTGTGACGATTT
+GGCCGGTCTTTTAGACCATACTGATGCACCCGCGCCATGCGCTGTACCCTGCCGGTAAAT
+TCCACCACCGCCGCACTGTCGCTGCCTTTGGCTTTCATAAAGCGGTTAGTGCGCAGTCTG
+GCGAACATTTCGCGCCTGATACGGCCTTTCTTACTTCGTACCGGCTGGCGCTTTCGGGCG
+GCATACGGGGTGCCGTCGGGTGCCTGCTGTCGCCTGATGCGCTGCTGCTGACTGGCGCGC
+AGTTTTTTTGCAATGTCAGCCGCCATTTGCCGACGCGCCGCCGGTGACAGGCTGGCAATC
+AGACCGGTAAGGCGCTCCTGCAGCGCGGTTAACTCACTCATCCCACTTACTCACCAGCTC
+GCCGTTAACGTACAGCTCGACCGGGCGCGTCACTGGCTCAGGCAGCGGTGGCTCAGGGGC
+ATAGCTGACATGCAGTGCGCCGTCGACCTCTTTGACGAGCGTGCGCTCGGTGAGTCTCAG
+GCTGATACTGATATCGAGCGAGTCGTCGTTATTGATATCAATCACCCATGTGAATCCTTT
+CTCCCGCCCGTCGTCGGTGGTCATAATGTCCGGCTGATGCTCACGCAGCCATGCCTGTAC
+CGGCACAAATATCAAATCGAGGTCGCCGGTAAAGTCAGTCACCACCACGTTAAGCACGTA
+CACCTTTTCAAACGACAGCGAGCTCTCCAGTCGGGAATCCGTATGCCCGTTATCAGCGAA
+CAGGCGCAGCATATCGGGGTTGTTTCGGAGCTGCGGCACGGCGTTAATCAGCGCCTTGCG
+CAGGCTTTTGTGCTTCTGCATCGAGTTCATCCTGACAGTGTTTGACGGTTTTGACCTGTA
+GCGCGCAGGCGGTCAGCGCGCCCTCAAGGCGGCGGATATCAGCGCTCAGGTCACCATTAG
+TTTTCGGATCACTTCCCGGCATCGGGCAAAGGCTCACCCTCGGGCATCCGCTGACCACAA
+TCACCGGCGCTGGCGCAGGCGGCGCGGGTGTGCAGCCTGCGCACAGCATCAGGCAGAGGA
+GCGTTATACCAGCGGCGAAAGGCTTCATTTTCATCAAGTAACCTCGTTATCGTCTGCTCG
+CGGCGGTTTGCTTCTGCGCCTGCCTTTGCGAGCTGTTCGCGCAGTGCCACCTGCGCGGAT
+TCATTACGTCGGGCGAGCTGGCCGGCGACACTGAGCTGATTTTTCAGCATGCCAATCGTC
+GCCTTTTGCTCGCTCGCAACGCGGTTTGCCGTCTCAAAGGAACGGGATAAATTGCCATTC
+TCATGGCGCAACCACATCAGACCGAGCACGGCCAGCACAAACAGCGTTATCAGGACTTTC
+ATGCCACCACCCCGCCAGCCGTGCGCCAGACGGTAACCAGCTTTTCGAGACTGTGCTCGC
+GCTGGCCGTAACCGGCACCCGGCAATGACGCCCAGATATTCCGGCAACGGGAAACAGCAC
+GCTCAATACGCCCCGCCCGGATATCGTCAATAGCACCGCGCTCCCGGATTAACTGGATCG
+CGAGCTTGTCCTGCGACAGTGGGCTGAAATCAGGCAATGCGAGCTGTTTTTTATAGTGCG
+GCCAGAACATATAAAGCTGCTGGTAACGCCCCGATGCCGTGGATTTCTCGCCACGGCGAT
+TAAACACTTTCGCGGGTCGGCCATGTGCGAAAGGGTGGTCGCTGTAATCGGTGAAAATCT
+CTGGCCTGCCATCAAGGCCGGTAACAATGACGTCGTAGCCACGGTTTTTCGTCAGCGGAT
+GGTTCGCCGTTCCTTCGGAATACGCCAGCATGTCCAGAAAGGCGGCGATATTCTGGTGAG
+TATTAATGACCGGCATCGCCTTCCCCCTTCTGTGACTTAAAGCGGCGCTGAATGGCGATT
+TCCACCACCTGATAACCGGCAATACCGAGCATGGATCCAATACCGCACACAGCGGGCAGT
+GACATATCAGGAAACTGCACCAGAACAACACCGGCGACCATTGAGACAAAACCGCCGAGC
+AACATGCGCCCGATAAACAAACGCGGGGTGATGGGTTCACCGCCTGCCAGCACTTTTCCG
+ACCACAATCAGTGCCCCAATCACAAACAGTGACAGGACGCCTTTTTCCCCTTCTGTCATG
+GTTTACTCCCAAAGATTGATAGTTTCAGTTACGGGTGAAGACGGCACATCGGGCAGGTCA
+ATTGCCGTGCCATTCGGCAGAATGACGCCCAGCTCAGACAGGCCTGGATTAGCCTGCAGC
+ACCGTTTCAACCACGCCCTCAGTGCGCCCGTAATACCTGGCGCAAATCACGTCGAGGGTG
+TCGCCCTGCATCGACCTGACCTTCATCAGAGTTGGCCCACGATGCAGCGCGGTTTGTCCT
+GCAGACGCGCGACCGACCAGCGCATATCCCGCCACAGGTCATCAATGGTGGTTTCGACGC
+TGTCGGCTTTTTTGTCACCCTTGCCGGTGGCTTCAACACCGCGATAGCGCTCATACAGGG
+TGGCGGTTGCCATCGCCGTTACGGCGCTCAGATAGTGGAAAATACGCACATTCTCGCCAT
+CGATTTCCTCAGCAGGCACGTCGGCCAGATGCTTAAACCCGGCGGCAGTCTGGCGCAGCC
+GGTAGTCGTAAAGCTCCGCATTGGTTTCCGCCATGCCAGTTCTGATGGCATGGCGCAGGC
+GCGCATCGGAAACCGTCTGCTCAAGCCGCATCAGCTCGCGCACACGCTTCGGATCCACAT
+CAGGGAAAAAGAACGTGTTTTTAATTACTGCATCGCCCGTCTCCGGTACGGGAATCACCA
+CGCCCGGTACGTCCTGTGGTTCGTCGGGCTGGTTCAGAATCACTGTCGTCATGACAACCT
+CATCAGGTTGGGCGGTGGACGCCGGTCGCTGTCAGGGTCAAAACCCGCTTTGACCGGCGT
+GCCGCCCGGCTCGGGGAGCGTTCAGTTAACCGGCGGTTTTTACCGCCTTTGGTGGACGCC
+CGCGCTTTGCTGCCGGTTTGGCGACAGGTTTGCGCGTGCGCGGTTTAGTCGTTTTACGGG
+GTGGTGCCTCCGCTTTTGGCTTCAGTGCGCGTTCCAGCCGCTCAATCTCTTTGCGCACAC
+CGGCATTGCGGTCGAGCTGCATCGCACGTTGAAACTGAGCCAGTGCCTCAGCATTCTGAC
+CGATATCGCGCAGGGTCAGGCCGGTCACCTTATGCAGACGGGCGCGCACCATATCGGGAA
+CGTCAGCGCCGTCGGTCAGGCTGAGGGTGGTCAGCAGTAATGCGAGGTCGACAGGCTCAC
+CGGCATCGCGCAGGCGCAGTGCGGCAAGCGCCACCTCCTCAACCAGCATGTAAGGCGTCG
+TGCGGCGATGGTCAGTGGTGAGGCCGTATTTCAGCGCATAGGGCGCAATTTCCAGCGCGC
+CAGCGATATCACCGGCATCAAGACGCCACAGCATGACGGTCATGACAATGTCATCCTGCG
+CACCGCGACCATCAGCCAGCACACCGGCGACCCACGGCGCATAGAACGGCAGCAGCTCGC
+GCTTTTTCTCGGCTTTACGTTCGTTTGAACGGATATTTTTTAACGTGCGGCGGTCATCGG
+CCAGCTTAACCAGCATCTGCTCATAGGCGGTTGCATGGCGCAGTGGGGCTTGCTCCCGCT
+GCGCGGCTTGAGAGGCCGAGACCCGCATCATGTGACGCTGTGCGGGGCTCGTCATGGTTT
+AGACTCCGCTTTCCGGTGCTGCAGGTGCGGTGAAATCGCCCAGGGTGATGTTTTCCAGCA
+GGCACCCGGCGGCATACGCCTCGACCACATAGTCGATATTCATCGACTCGTAGTTTTCCA
+CGCGGTCACGCTTGGGGTTTTCGATGACTGAACGCCGATGACCATCATCCATGAAGTAGA
+TTGAGAGATTTTCCATCGTGGTCACCAGTACAGCATTCGCAGGGAAGTACGGCACGCGCA
+CGGCAGGCAGGTTGCCGATGCGTTTCTGGCTGATGATGGTATCCGCAGCGAGCGACTCGC
+TGTTTTCCTGCTGCTTGTTAACCAGCGGGAAATATTTATCGGCCAGCAGCTTACGGCCAA
+CGATGGCAACCAGTTTGGTTGAGTCCTGATAAACCTCATCAATCAGGGTACCTGTCGCAT
+CCATTACCAACGCGTCAAGATTCTCATAGTCGCCGTTTTTACCGACACGAATCACATCGG
+AAACGACTTGACCCTCATCGTCGGTGATTTTACTCATCACGCGCGCCGGTGCTTCGTTAC
+GGTACTTCTGCAGCCAGCCGACCGCTACATCCTGCAACATTGGATTAGTTTTGCGATTCG
+AGGTCGGCGCACGATGAGTACCGTTAAATCCGGCCATGATGAAATCCAGTGCCTGACGCT
+GGATAATCGCGTCACGGATGCGGCGCTGGAAGTCCTGAAAACGCGCCCACAGGTCGAGCG
+TCTTGTAGCGCAGGTGGAAGTCAAAGTTGACCTGGTTGCACTCGTACAAATTGGACTCAA
+GCGCGACAAAGTCAGCAGTTTCACGCTCATCGTCACCTGAGGTGTCGGTCGTGCTGGCAA
+TAGTGCCATCCACACCCACACCGATTTTTTCACCTTTCAGCTCATCAACCGGAAAAATGT
+TAATCATCTGCAGAAATGCGGATGACGCCTGCACGGTGTTCATCAGCGTTTGCGTGACGG
+ACGGCTCGACGGTGAATTTTTTGCTAACGTCATCAACGCTGATGCCGTTCAGTTTGGCGA
+GCTGGGTCAGATAGGCATTGAACTTAAAACGGGTTTCCTGACGCATAGTATTTCCTGTTT
+GAATTAATCGGTTAGTCACAGCATCGGGCGGAATTGCCGCCCGGTTCCAATCTGCGGTTT
+ATCAGCAGTCGGTCAGCAGCTCGTCGCCACCGCCGCCGCTGGCTTTCGTGCGTCGCGGCT
+GGCTGAAACTTTCGGTTTTGTCGAGGGTGGTTTTCAGGGCGGAAAATGCCTGGCTGGTTT
+CTTCAACCTTGCCGGTCAGTTCCTGTTTAAAGGTGGCTAGCGCGGTTTCCATATCGGAAA
+GACGCTTATCCTGCGCAGTGAGACTGGTCTGCACATGTTCGCTGACGGCGGTCACCGCCT
+CATGCACATCACTCATGCGCGCATCGTCGCTGACCTGCTTACGGCTGAAAATGGCTTTCA
+CCTTGTCGGCCAGGCTGTTAAGCACTGTGTCGGGAACATCTTCAAATTCCAGTTCGGCCA
+GCGTGGCGACTGAAAAGACATTTTCAGGACTGGCCTTAAAGCGCTGCAGCGGGTTGTGCT
+TCGCCTTACGGCAGAATTCGAGGTATTCAGTGCCGAGGCTCGCAGGGTCATCAGTGACCG
+CAAGGCCGACAAGATAGCATTTGCCGGTGTTACCAAAATTCGGCTGAATTTCCATAGAGG
+TATAGACCTTCTGCGCGGCTTTATTCATCGCGATAAGGTCATCGGTTGGGGTGATTCTGG
+CGAACAACGCCCATTTGCCATTCAGCGCAGAATCGTCGTCAATCTTTTCGGCTTTCAGCT
+CAACCACATCGCCATAACGTTTAAACATGCCGTCGGGCAAAAGGCCGCGAATGTGTTCAA
+GGTTAATACGGCAACCGTAGACGCGCGGGTCATAGGTTTCGGCCATTTCCTGAATATCGC
+TGGCGCTGATAATGCGCCCGTCGCAGGTATCACCCTCGACGCCGATGCGAAAGAATTTTG
+AGACTTTTTTTGCCATTGTCAGGAGTCCTGAGGTTGGGGTTACGGGTCAACGCCAGTTTC
+CAGTCTCAGGACTCGCCAGACCACCAATGACGACTGGATAACCTCCCACACAACAGCACC
+TTAGCGAATCACTGGCGGCCATTAAGTAGCCTTGCCCTGAATCCACTACGGCGAGGCATC
+AATGACCATTTCCACCGATACAACCTTATTGCATGACCCGCGACGACAGGCATCGCTGCT
+TTACTGGCAGGGCTTTTCCGTGCCACAGATTGCCGAAATGCTGCAGGTCAAGCGCCCGAC
+CGTGCAGAGTTGGAAACAGCGCGACGGCTGGGACGGCATCGCACCGATTTCCCGTGTCGA
+AAGCAGCCTTGAGGCGCGCCTGATTCAGCTCATCGCCAAGCCGCAAAAGTCAGGCGGCGA
+CTTCAAAGAGATTGACCTGCTCGGGCGGCAGATTGAGCGACTGGCGCGCGTCAACCGCTA
+CAACCAGACCGGCAACGAGGCCGACCTTAACCCCAACGTTGCCAACCGTAACAAGGGGGA
+GCGTAAGAGGCCGAAAAAGAACTTTTTCAGCGATGAGGCTGTCGCAAAGCTGGAAGAAAT
+TTTCTTCGACCAGTCTTTCGAATACCAGTTGCAGTGGTACCGGGCAGGACTGGCGCACCG
+TATTCGCGATATTCTCAAATCCCGCCAGATTGGCGCGACGTTCTACTTTTCCCGCGAGGC
+ACTGCTGCGCGCGCTCAAGACCGGCCATAACCAGATTTTTCTGTCGGCCAGTAAAACGCA
+GGCTTACGTGTTCCGGGAATACATCATCCAGTTTGCGCGACTGGTTGACGTCGACCTGAC
+CGGCGACCCGATTGTCATCGGCAACAACGGCGCAAAGCTGATTTTTCTCGGCACCAATTC
+CAACACCGCACAGAGCCATAACGGCGACCTGTATGTCGATGAAATATTCTGGATCCCGAA
+TTTTCAGAAGCTGCGCAAAGTCGCATCGGGCATGGCCTCGCAAAAGCATCTGCGCTCAAC
+TTACTTTTCGACACCTTCCACGCTGGCGCACGGCGCTTACCCCTTCTGGTCTGGCGAGCT
+GTTCAACAAGGGGCGCGCCAGTGCCGCTGACCGCATCGAAATCGACATCAGTCACAGCGC
+GCTCGCCGGTGGGCTTCTTTGCGCTGACGGACAGTGGCGGCAGATTGTCACTATTGAGGA
+CGCCCTTGCCGGTGGCTGCACCCTGTTCGACCTCGACCAGCTCAGACGCGAAAACAGTGA
+TGAGGACTTTAAAAACCTGTTTATGTGCGAGTTTGTCGACGATAAGGCATCGGTATTCCC
+GTTCGAGGAACTGCAGCGCTGCATGGTCGACGTGATGGAAACATGGGAGGACTTCGCCCC
+GTTCGCCGACCATCCATTCGGCTCGCGACCGGTCTGGATTGGCTACGACCCGTCCCACAC
+CGGCGACAGTGCCGGATGTGTCGTACTCGCGCCGCCGGTGGTTTCGGGTGGCAAGTTTCG
+CATGCTGGAGCGTCACCAGTGGAAAGGCATGGACTTTGCCGCGCAGGCAGAAGGCATCCG
+CAGGCTCACTGAGAAATACAACGTCGAATACATCGGCATTGACGCAACAGGCCTCGGTCT
+CGGCGTATTCCAGTTGGTGCGCTCATTCTACCCGGCGGCACGCGGTATCCGTTACACGCC
+AGAAATGAAAACCGCAATGGTGCTCAAGGCGAAAGACACGATTCGCCGTGGCTGTCTGGA
+GTACGACGCCGGAGCAACTGATGTCACACAGTCGTTTATGTCCATCCGCAAAACCATGAC
+CAGCAGCGGGCGCAGCGCCACCTATGAGGCCAGCCGCACCGAGGAAGCCAGTCACGCTGA
+TATCGCATGGGCCACCATGCATGCCCTGTTAAACGAACCGCTTTCTGCCGGTAGCGGCAT
+GCAGCCTAAATCTATTCTGGAGTTCAACTAATGGGTAAGCAAAAATCCCGTAAAGCCGCC
+GCGCAGAAAGCCCGCGCACCACAGCAACTGAAAGCCAGCGCACCGCAAAAAATGGAGGCA
+TTCACCTTCGGTGAGCCGGTGCCGGTGCTCGATAAGCGCGATATTCTGGATTACGTCGAG
+TGCATCAGTAACGGCAAATGGTACGAGCCGCCGGTCAGCTTCTCCGGGCTGGCAAAAAGC
+CTGCGCTCTGCAGTGCATCACAGCTCGCCGATTTACGTTAAACGCAATGTGCTCGCAAGT
+ACCTACATTCCGCATCCACTGCTGTCCCGTCAGGATTTCAGCCGCTTTGCGCTCGACTAT
+CTGGTATTCGGTAACGCCTTTCTTGAGCAGCGCCACAGCGTCACCGGCCAGTTAATCAAA
+CTGCTGACTTCACCGGCAAAATATACCCGGCGCGGGGTCGATGACTCGGTTTTCTGGTTT
+GTGGAAAACTTCACTCAACCGCATGAGTTCGCACCCGATACCGTGTTCCACCTGCTGGAG
+CCTGATATTAATCAGGAGATTTACGGCCTGCCTGAATATCTCAGCGCGCTTAATTCCGCC
+TGGCTGAATGAATCCGCGACGCTGTTCCGCCGCAAGTATTACCAGAACGGCGCGCACGCA
+GGTTACATCATGTATGTGACTGACCCGGCGCAAAGCGCGACTGACGTCGAATCGCTGCGC
+GATGCAATGCGTAACTCTAAAGGGCTCGGCAACTTTAAAAACCTGTTTTTCTACTCACCG
+AACGGGAAACCGGACGGCATAAAAATCGTGCCATTGAGCGAAGTCGCCACAAAGGATGAC
+TTTTTCAACATCAAGAAAGCCAGCGCCGCTGACCTGATGGATGCGCACCGCGTACCTTTC
+CAGCTCATGGGCGGCAAGCCTGAGAATATCGGCTCAATGGGTGATGTTGAGAAGGTGGCA
+AAGGTCTTTGTGCGTAACGAGTTATCACCCTTACAGGACAGATTCAGGGAGGTAAACGAC
+TGGCTCGGCATGGAGGTCATCAGGTTCAAAGAGTACACCCTCGACAACCCGGAATAACTT
+AGGTCAGCTTAATCTCTGCGCTCATCATTGAAGATACAATCTGCGAAAGCTATAGTGCAT
+CAGATATCAAAATAATGGATGCGGAGATTAATATTTTGGAAACTAATTTTGAAATAACCC
+TGGAAGGTTTCGCTACTGAAGAAGAAGCAAATAATATCGGTAGGTTCACGCTAGAAGCCA
+TCCGGGCTTTAAATAACAATCTCAACCTTGAAATCTCAAAATTAAAATGCATTGTTATTT
+CCTATAACTTTAGCGAAGCCCTTCAAAAGATAACATCCACTTACCAACACAAATCTCCTA
+GTTCATACACCAATAGCAAACAGGGTGCAGCCGTCGGACAATTAGTATCAAAAATTGGCA
+ATGATGGGCTATGTGAAGAATATACCCTTGTACTATCTATTGAATTTTTTGCTGAGCTTT
+TCAATGATGGAAGCTTCTTAAAATTGAACGAAGAAGGATACCGCGCAGTCATCCATCGTA
+TTCACCATGAATTAGTGCACGTACATGAAAAAAACTTACTAACATGCTTAGCCCAAAACT
+TTACGGTCAACGAGTATGGCAGCGCGCTTCTTATCTCAGCCACGCGTGCATGGTCTGAAT
+ATCTCGCTAATTACATGTCTTCAGGGTCAGCCCCTCAAGAGACTATCGATTTATTTCTAG
+AGAATCTTGATACCGTTGTAAATGAAGTATCTGACGAGATTGGAAAACTCATCTGGGACT
+ATAAACGCTATAATACGCCTCTGAGTGAAATGTATCTCGAAGTAAAAAAACGCATCAGGC
+TTATCATCAACTCTTATGCTTATGCGATGGGTTATGTCCACTCTCTAAATATCAATATTA
+AAGAATACGATCCAAAGCTATCCCTTACACTATCCAACTCAAAGATAAGATATCAATTAT
+CAGAATTAGGCATTGCTTTTCAGAATCTTTATGGCAAGTTTAATGACCAGCACATTACAG
+GTTTTGATGATTATCGGGAAATAACAATAGTCATTAGTGAAATATTCAAGCAGTTTGGGC
+TTGTTTTAGAGTGTCCCGATTGGTCTAGTGACTGTGAACTCTACATACATGTAAATTAGT
+TTAATCATTGTAAAAACATTAGCAGTTTGAATCTCGCCATTCCTGTTAAGCCGCTGTCTC
+TAGGCGGCTTTTCCATGCACACCACCGTCACGCCTCAGACGCGCCACACGCGCACAACCA
+CCCCCGACCACCAACGAACCGACAGCGACCACGAAAGCGCCATCACGACGCGCTCAGACG
+ATAATTTTTAATATTACGCACCACCGCTGGCGCGCAATGCTTTCCCCGCCACGCCTGCCC
+GCTTTATGGGTCGGTTTTAATGCAGGTGCATGACCACTCTGGAACCGCGCCAGCTCTGAC
+AGAATACGCTCAGAACTGGCACGACTGGGGCATGCAAAAAAATGCACCTAAGGCATGCAT
+CATTTACTTGCGTACTCTTTACTCATTTTTTTCGCTGTTAATTTTCGCAAAAATACCTTC
+TTGAATGAATCCAATAGATGACATCTTGTCATGCTTACCAACAAGAAAGTCTTCAAATTC
+CTGAAAGTGCCCTAGAATACACTCTTGAATTTTGTCAAATACAGGTGTGAATTCATTTGA
+GTTGATGAGAGAGGTGATTTTTGTTGCGAAACCTATGCTATCAACACCAAATGTATATGA
+GTCATCATCATTTTTTCTGAATTTGAAATCTATTTGGAAAGGCGACTGTGGGTAAGTATT
+AGAGTCTTTATAGACGGTCAATATAAATCCTAAATGCCAGAACCCATCATCCCCCAAATG
+AGTAGCTCCAGTGGGAGTATATTTCGTATTTGGTTTTTCATCTTTATCTAACGGGATTAT
+TTTATATGCTTTTTCATTATCAATCCCAAGATAATCTAAATAATTTTTAATCACGTGACC
+AGAAAAGTTATACGCATCAAATCGAGTATCAGAAAGTTTGTTCCGAAACTCGGTATATGC
+ACTGCACAGCTCTGTAAACTTTGACATAATCTATCCTCTTTCGATTGTAAGTATCTAACG
+CCTCGCAGGGCTCGTTGTTCAACCCTGCCAGTACTGAAAGCGAGTTTCAGCACCGGCAGC
+GTTCGTCACTATATTGTTTAATTGTCGAGTATCGAATCGACCTCACCCGTTCGCACGTTG
+ACGCGTGCCGCTACGGTTTGTTTGACCACACCACCATAAGCATTAGTACCGCGAAACGTT
+GTTTTTACAACGGCATGCGGGTCTTTATTCAAAATCAGATGGTAGACCGTTGAAACATGT
+TTATAAGAAGAATCATCATTCATGCTGGCTTTTATCAGCTTCTCTAACGGGCGATAAGAG
+CCATCCCAACCGCTAAAATTACCCTGAAATGCGTCAAGATTGATTTTATTATTCAGGGAT
+TGTGGATCCTTCTCGAAGTCGTTGAAACACCACCCCAACACATCACCGAGCTTTAACGCA
+TCATCTTTCGTAAAAGTGTACTCACTCATACAGGCATAAAAAGCATCAGCAGAGCTTACC
+GGTACACCTTTGAAGCCAACATAGCCTTTAACGATATCGTGCCGGGTTTCTTTTGGCTCA
+TTGCGATATTCTTTGAGAGTCTTATCTGCGTACTCAAACGTTGGCGTAGTCGGTTCCACT
+TTAACCTCCGGCACGTCAGTTTTTGCCACAGGCTGACTTTTTTCAGTCGGCCATAAGATT
+GAGCCAATAACACCCAGCGCCAGACAGCCACCGAGATAAACCGCACTGGAGCGCTTACGG
+TTCGGCATTCGAACCATCGACGGCTTGATTAACCCCACGATAAAAGCAATAAAGAGAGCC
+AGAGATAAAAATGCTATTACGGTATCCATGATTTTCCTTAGTGTGTAATCCCCATACAAA
+ACAACCCCATGCTATCAAACATGGGGTCGAGGGTTGCACATTTTTCAGGGATTAACGCCA
+GCTCTCATCTTCCCACACTTCCTGAAGGATGCTATCCAGCGCTTCGCGGTCTGAATCTTT
+ATCGAATCCCATCAGCTCGACACCGGTCATGGCTCCCTTTTTAACAGTAACGCGCGTTGA
+GGGGAAAACAGACTGTATTCGCCTGGTCAATTCGCATTGAAAAGCATCAATTACCGGCTG
+GCCGATTTTTTGGTCTTTATCCAACGTGATATTTACTTTCACCTTGCCCTCCTTTGCAAA
+GGTTGCATCAACAGGTGGCGCGGAAAAAACAACAGAAAAATTATTATTTTTCATTAGGTT
+GCCTCTTGCTATCTCCGCGATTAGATTCAATGCAATTTCACGATCTCTTTCCTTACAAGT
+ACCTTCAGCAGTCAGACGCGCAATCATTTCGACCCGCTCAATCATAACGTGCTCGTTTAG
+CTCTCTATCCACACAACCTCCATTACGAGATACTGTATATACATACAGTAACACGTAATA
+ACAAAAGGTGTGAAGAAAAAATCACAGTTAAACACACTGTATGTACATGATATGGATGAA
+TATTAACGGTTATATTTTCGTTGCGAGTTCAGCTAAAGCCGCAACACGATTGAGGATTAT
+CCTAGCCTTAGCCTGATACGATGGTGCTGAGGTAAATATTTCTCCCTTGGCCGTTCCTCT
+CAACCATTTACCGTTAAAGCAACTTTTACCACCGGCCATCAGGTGCAGGGCTTCGCCCCG
+GCTGATTGTGATGCCGGTAGTCAGATGTATCTCGTCGATAGTTTTCGCTATAGCTGCGTT
+TTGCTCATCCGTTCCGTGGATAAATTTTCGCCGTATTGCTGGCTTTTGCTTCCTGAGTCG
+GTTTGTCAGCTCTCGTTTTTCACGTCGACTTAGGGGTTTAGATAAATCGAGTTCCGGTGG
+ATCGCTTTCGCTTCCCGTACAGTTATTGACAGAACTCCGAGAGGGCGCAGGAGCGCCCTT
+AACGTCAACGGCCAAATCAACGGCACGCTTCGGCACAATTTTCCACTGCGTTAGCCGGGT
+TAAAATCGGAGTGCCAGCACCAATAGCGGAATCGTATACGCCACGAATGCAGACGGTTTC
+CTCACCATACTGATTAAACTCGGTGCGCGGTTCATACAGTGTGCGCACCTGCAAATCATC
+GCGACGGACAAACGGCCCACCCTGCGCATTAACGTAACCAGCCCAGTCACCGGCGTCAGC
+GGCATCATGGACGGCGGCAAACTCAACGCTCAGACCGTGCGCGACCTCGGTATCAGCGAG
+ACGACGCAATTCACGGTAGACCGTCACCGGCGCACCGCCGATAAACTGAAACTGACGGAT
+GTGCCAGCGCGCCGCCCATGCTGAAACGGCGGGCGCCGTCTCTTTTAGCAGCTCACCGCT
+TTCGTCATCGGTCTCGTCATCGAGAGCATAACCGTCGATGTTTTTAGAAATGTATTTCGC
+GACATAACCGGTAGCACTGCCTTTCTCCGGGTCGATAGCCTCAGCATGAAAGCGGGCTTT
+TTTAGCCTTATCACTTTTAAGTTCGTGGCGGTCTTCCTCCCATGCATAATCGCGGATGAT
+GAGGCGCACGCGCTCGACGTCTTCTGGCAACATGAACATAAGCATGTGCCAATGCGGCGT
+TCCGTCGTGATGAGGCTCGGCAACACGTATGCCGAAAATGCGAATTTCTTTCCGATGTAG
+CTTGGCACGAATGCGCGCCCAAAGGCCGGTTAGGTAGCTCTGCGTGTCCGACGGGCTGGC
+GCCGTTCCATTTGCTGTTACGGTATCCCCCTTTAGTCGTGGCATGATATTTAGACGGTGC
+GGTCAGAGTGTAAAACTCCCCGACGTATCCGAGTTCATTGCAGATATTTTCAAACCCACG
+GATGCGGGTCATCAGCTCGCAGCGGCGTATCGCAGGGTTAGCGACCGAGCCGTCAAATTT
+TTCAATCAGGCTGATACGGTTGCCGTCTTCGTCTTCGAGATCCAGACCTTTGAGAAATTC
+ACGAGTGCGGCGCTTTTGTTCACGCCAGTCAGTCACGCAGTTTTTACTCGCATAGGCATG
+CTTTTTCTTACTGACGTTACCGACAGTAATTTGCAGATGTTCGCGCCATGCAGCCGCAAT
+GCGACGAAGACGACCACGCCACCACACATCGTTAAACATGCGAGCGATGGCCGGGGCGAT
+TTCATCTTCTCCGACATATTTCTTTGTCACTCGCTCCCAATGCGGAGGGGTAACATTGAA
+TTGCAGAGAAATAAAACCGGCGCGCATGTACCAGGTGTACAGCGTTTTAAGCTCGCTAAA
+TCCGGTGTCATCAATGTCAGCCAGTTCAGCGCGAATGAAATTCGCGATATCAGCGGCCAA
+AAGGTCGATATCGGCGCGTGACATGTCCGGGAGTCGGTTATATCTGGCAACCATATTGAC
+CATGCGTGACGCCAGATATTGCATAAGTTCAGTATCAAAATGACTGCCAAAAACAGCGGC
+TGATACATTGCTGTTGATACCCGCGCACTCGTATTTTTTTGCGACCAGTTCAAGACGTGG
+CAATACCCTTTTGCAGAAACTTATTAAAAAGGCATTGGCTCGTTGACTGCCCTGATTTTT
+CTCCAGCACAGCAGCGGTGCGATAAACATCAAAACGCACGCATTCAGGCTGGAGAGAAAG
+CACCTTTCTCGCATGCAGCAAAGCCGCGAGCATACGGTCGCGGCGATATTGTTGGTCATA
+GGTAAGATATGGGCTGGCTATTGCCTGTTTTGGAAAATTCCATACAAAGGCATAATCAAT
+CTCACCCATAGCCTTTGCTGAGACAGGTGTGTCTATGACTTTATTCACTGAAGAAGATCC
+CACCCAACGCCGCTATGTTGATTCGATTACAGAGGTGACAGCTTTCGAAGCTACGAAAGA
+ACCAATGAAGATCATTTCCGCATCCGACATGCTGGGCATTTGCGATGCTTTTCTTTCTGA
+GACTCAATGCCACATAGCAGACCGGCTACCTCTTTCAATAGCTGGTCGGCATGAGCTAGG
+TCGGAAAATTGAGTGGAATTGTCCACATAGCTGGAAACCACGCGAAGAATGGTCAACACA
+TGTTCGGCACGCCTTACAAATTTTAAATCGACGTTATTTGGATACCCCAGTATCTCAACT
+GGATGACTGGCAGACCTGGGAAGAACTATCGACAGATATTCATGTGTCGGCTCGCTGTAC
+TCGGCGGACTGTTGAGTTTTATCGCTCTGGAAATCCCCAGCATTTACCGATGTCGACTGA
+GCTTTTTGCTGTTCCCGAAGTTTTTTCAAAATTTGTAGCTTCGATTCTTTCGGGTGATAT
+TCACCCTGTTTGGATGTGGCATGCTGACGCAGCCAAAACGCCGCGATGCCTCGATGGGCT
+TTATCCCAAATACGCGCCGCTTTCTTGAGCTGGCTTAGTGGTCTGGTAGTCATATCGCAC
+CCCGATAGTGTTTTAATTTAAGTTCGGCGATTTGCTGGCAGGTCACGCAAAAAGCCACGC
+CCGGAATCGCAGCGCGGCGAGCTTCCGGGATTGGTGCGTCACATTCTTCGCAAAGAAAAC
+GGGAAGGCGCAGCGATACGGCTGCGCGCGTTGCTGATGTGGCGCTCGCGGTCTTCCTGCT
+CGCGCTGTTGTGCTAAATCCATTGCGTCGGCCATTAGTGCAGCTCCTGTGATTCATTCTC
+AAAGCGGGTTGCTTCACGACGCAGCAGTTCGGCAGCTTCGGTGCCGCTCATACCCTCTTT
+GGTGATATGGATAGCCAGCGCCTCAAGGCGGATGGAAACAGCGAGCGCGCGGTCTTTACG
+CTCTTCTTTTTTTGCATCGATCAGCAATACGGCCAGCGCATCACTATCAGTGTTAAAACT
+ACGGATTTCGGTATTACGCATAATTGATTCTCCTGATTTCGGGCAATAAGAAGCCCGGCG
+GGTTTACGCCAGATAATTTCTTTTTTTTAATTAGCTATAACCAAATACGACGGCTGGTTT
+ACTTTTCAATTGGCTGATAATTTCAGCTTTCAGGCTATCTTTAAACTGCTTGCAGCACTC
+CCATTCCGGGTCAACTCGTAAAATTATCCCATCGCGGGTTTTAATTTCAAAACCGTCTTC
+CATGTTCGGAATCATGGCACCTAAAACAATCCTTAATTCATCGCGTGACATGTTTAACCC
+CTTTAATAATAAAGTGGACAATACGAATAATTAAAAAACCTGACGATTTCGGCGGCTTTG
+TTTTCAGCCCTTTTAATAATTCGGACTGTGAGTGGCTCGGGTGCCAGCGCTTGCCGTCCT
+TACCTGCGATCCAGCCGTGGCCGTAGTGCATGCCGGGGCTTTGTTTAACGAGCAGAGACG
+CGAATGACGGTTCACTTTTCAGCATACGCACCTCAAATCAGCCCGAAGGATGCGCCAATA
+CCGCTCATGGTATCGACCACGCTCGACATAGCGGGATTAGTCTGCAGACGCGCATGCAAC
+GCCAGCGCCGACAACGACAACATGCGAATGCCAGCATTAACGCTTTCAATCATGTTGTGC
+TTACGGGCAGAGGTCAGGCGCTCGTCAGAGGCTGCACCGCTCGCCAGCTCGCCGAGTTCA
+CTCATTGCACGCATGACATAAGACTGCAATTTGTCTTTAGCCAGCTCATTAACCGGCACG
+CATGGCAGGCAATGAATCTGCGCCAGAAAACCATCAACGAGGGTTGAATCTTCGGTCAGG
+TCAGTCAGCAGCCACAATTCAGGCGGCGTGAACTGGTGAGGCTGTTCCGGGTTGAGCTTG
+TTACGTAACGTCTGAACATTCATACCCGCACGCTCGGCAAGCTTCGCCATGTTGTGACGC
+TGCGCAAAAGCCCTGCACGCTTCGTCATAGTGGGGATGTTTGGAAATCTGAAAATCAAAC
+ATGTTGAGCCCTCAAAATTCACATAAAGTGAATTACGCACCAATAACGAGTTGAAAACGG
+GAATGGCCCAATGCCTTACGCATCTGTTCCTCTTTCCAGCGGGCATAGTAGATACGAACT
+TGACCGCCAGCACGTTTACAGCCCTTACGGATAACGCGAGGTTCGATAGGTAAACGCGGG
+TTATCTCCGGTTGTCCAGCGGCGCGCGGTGCGGTATGACACCCCCTCAAGTTCTGCAAAC
+TGTTGCAGGGTGACGATGGGGGCAGGCACTTTGATGATTGCGATTTCAGAAGCCATGTTG
+CATGATTCCCTATTTGCCAAAGATTGCAATTAAAGGGCCACCGTTTGCCAACATAGGGCC
+ATCAATTGCGTAGGTTTAGCCAAAATATACTTCCCAATTGAGAAGTAGTAAATAGGTTTT
+ATCGATATGAGAATAGATTCTTTAGGATGGAGCAACGTTGATGTACTGGATCGCATCTGC
+GAGGCTTACGGGTTTTCACAGAAAATTCAGCTAGCTAACCATTTCGATATTGCATCGAGC
+TCCCTCTCTAACAGATATACCCGAGGCGCTATTTCGTATGACTTTGCGGCACACTGCGCT
+CTTGAAACAGGGGCCAATCTGCAGTGGTTACTTACAGGAAAAGGGCAACCGTTCACATCT
+TCTGCGACAGCCGAGGACACAATGAGCATCGAGTTATTCACATTAAGTGAAGAAATACTC
+AAAAGTGATGGTTCTATAACAGTCGACGCTCATTTTTTCACAAAGCCGCTTACAGATGCG
+ATGGCTATACGAACGGAAGGAAAACTCCATTTCATTGATAAGCAGGCATCACTCTCTGAC
+GGCCTTTGGCTGGTCGACATAGAGGGTGGAATTAGTATTCGAGAGCTAACAAAACTCCCG
+GGTAGAAAATTGCACGTTACTGGTGGAAAGGTTCCTTTTGAGTGCGGTATTGATGACATA
+AAGACGCTGGGTAGAGTGGTAGGTGTGTACAGCGAGGTTAATTGATGACTGTCCGTAAAA
+ACCCCGCTGGAGGTTGGATTTGCGAACTTTATCCTAACGGGGCAAAAGGCAAGCGTATCA
+GAAAGAAATTCGCCACCAAAGGTGAAGCGCTGGCCTTTGAACAATACACCGTACAAAATC
+CGTGGCAGGAGGAAAAGGAAGACAGGCGAACGCTAAAAGAATTGGTCGACGCATGGTATA
+GCGCTCATGGTATTACCTTGAGAGACGGACTAAAACGCCAGCTAGCTATGCACCATGCCT
+TTGAGTGTATGGGCGAACCACTCGCACGCGATTTCGATGCACAGATGTTTTCCCGCTACC
+GGGAAAAGCGGCTAAAGGGTGAATATGCCCGTTCAAATAGGGTTAAAGAGGTTTCCCCTC
+GCACGCTTAATCTTGAACTCGCTTACTTCCGCGCGGTGTTCAATGAGTTAAATCGCCTCG
+GCGAATGGAAGGGTGAAAATCCTCTAAAAAATATGCGCCCTTTCCGCACAGAAGAAATGG
+AAATGGCCTGGTTAACTCACGACCAGATTGCGCAACTGCTCGGAGAGTGCAAACGCCATG
+ACCACCCTGATTTAGAAACAGTGGTGAGAATCTGTCTCGCCACTGGCGCTCGATGGTCAG
+AGGCTGAGAGCCTGAAAAAAAGCCAGCTCGCGAAATACAAAATCACGTACACCAACACAA
+AAGGCAGAAAAAACCGCACAGTTCCCATCAGTAAAGAGCTTTATGACTCCCTACCTGATG
+ACAAAAAAGGCCGACTGTTTAGTGATTGTTATGGGGCGTTCAGGTCTGCTCTGGAAAGGA
+CAGGCATCGAATTACCGGCCGGGCAACTTACCCACGTTTTACGGCATACCTTCGCCAGCC
+ATTTTATGATGAATGGTGGTAATATTCTGGTCTTGCAGCGCGTGCTTGGTCATACCGACA
+TAAAAATGACGATGCGATATGCGCACTTTGCCCCTGACCACTTAGAGGATGCCGTTAAAC
+TTAATCCACTGGCGATGAGTGGCGATAAAATGGCGGTAGAAATGGCTCAAACTGGCCCTT
+AGCTGGTCAAGAGTGGCCCTTTATGTCTATGATTTATAAAGCAACCTATTGATTTTCGGT
+TGTTCTGTTAGGAACTCATAATCGCTTGGTCGCTGGTTCAAGTCCAGCAGGGGCCACCAA
+ATAAAACAAGGGCTTACGCTAAAAACGTGAGTCCTTTTGTTATCTATGGAAAACCCCCAG
+CCTAGCTGGGGTTTTCCATAGACAAAAAAAGCCGGTCGTTTGACCGGCTACTTGTTGTTT
+TAGTTCTGTGACGCTTTCCCGTCAATACACTGATATTCGACGTAGACGTCCATTTGTCTG
+CATCCTATTGGGCTGGGATCCGTACATTGTGACGTCTGGCCTCCGAACGCCTCGGCGCCA
+TCATATCCCCACACCCTGCATTTTTGGGCGGCCAATGATTGGCCCTGATTCATATCTACG
+CTCGCTTTTTCAAACGCGCCGTAACTTTCGCCAACGTGATACCCCATCCTGATCGTTCCA
+TCGGCTTTACTTCCTCCGACGGGTGTCATTTGCTTATGAACAGTGCAACCAGAAAGTATT
+AAAAAACCAAAAAGACAAAATGCAATTTTTTTCAT
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_017033.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_017033.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1731 @@
+>NC_017033.1|provirus_1052334_1094910
+TCAGCGCCGTCCCAAGCCCAGCCTGGCAGCCATGGAGCTGGCGGAGCGACGAGTGAATGA
+CGCCTGGGTTGAGGCATTGTCCCGGTTGCGATCCGTGGAGGTGTGGCCTGTTCCGCGGCG
+GCCCAGAGCGCAGATGGCCTGCCAGCCCGACGTGGCCACGATCCGGATCAGGGTCGAACG
+CGTATTGTATGAAAGTGTGTCCATGGTCCCGGCCTCTTGGTCTAGACGATCTCGACAATG
+CACCCTTGCGTACGGCAACGCGACAACTTGGCCGCTGTTGGCGGCTCGGTCTGATGGACT
+TCTGCTTGTGAAGCGACATCCCCGGACCGTGCGGGACAGGCTCGGGTCCCGTTTGACCAG
+GCCTGCAATCGTAGACTGCACTTGTTGATGTTAGCTGGGTGTTATGCGCAGGGGGCCAGT
+CCCGGCTTCGCATCGAAGAGACACATGGATGGCCGTCCCCATGCCAGGGCCGTCATGCCG
+ACATCGGGGGGCATCATCGGCTGGCCGGGCGCGGATCGACTGCAGCCACCCCATCCAGTC
+CGGGCATCGACGGTTTCTTGCCAGCGGGCGACACGCCATCTGGTGGCTCAACTACACAAA
+AAATCAGAAAAGACTCGACGCCCCGAACATATGCAGGCATACTACTTCGCTCCGCTGCCC
+GAGTGGTGGAATTGGTAGACGCAGAGGACTCAAAATCCTCCGCCGCAAGGCTTGTCGGTT
+CGAGTCCGACCTCGGGCACCAGCGGAAAATCAACAGGTTGCAAGTCTGGTCAAAAAGTGA
+CCATTTCCGCAATCAGGTGACTTTTCCGCAATTGCTACCGTGTGGGTGTGACTTTGTCCC
+CACGCCGGTTCCGGGTGTAGTGCTCCGTCATGGTGACCGAGCTGTGCCCCAACTGCTTCT
+GAGCTTGCCTGATATCGCCCGACGACTCTGCCTTGTCGGTGCCGGCTTTCGCTCGCAGAT
+CCCTGAATTGGAAGTTTTCGAATTTCACCCCGGCTTTGACCCTGGCGCGCTGAAAGGCAC
+CATTGAGCATCCGGTATGACATCGTGCCGCCTTTGGCTGTGGTGATCAGTTTCCGGGTAA
+TGGCCCCCATGCGCCGCTTTCGCTCCACCATTGCATTGATCAGCTCGGCGAGCTCGCCCA
+CGACTTCGATGCGCCGCTTGGCTCCGGTCTTGCCCTGGACGACTTGCAGCTGTCCATTGC
+GGATATCGTCCTCATCCATGCTCAAGGTATCGGCGACGCGCTGACCGGTGAGGTAGGCCA
+GATCCATGGCATCGCGCAGCGGCTGCTCGGCTGCCGTCCACACAGCCAGGAAGACCTCGT
+CCTCGATGTAGATGTCGCGGCCGGTTTCCCGATTGCCTCGCACGCCGGCGCATGGATTGG
+GGAGCTTGGTGTAGCCCATTTCCCGGGCCCAGTTCCAGATATGCGAAAGCAGGGCGCGTT
+CCCGATTGGCGCGGACCTTCGCCTTGCGCCACACGATGTACTGTTTGACGTGCTGCGGCT
+CGATGGCCTCAAGCGGGCAGGGCGGATCATCAAAATAGCTCATGAGCATTTTGACCTCCT
+TGAGATTGCCCCGCTGAGTTGTCGGCGACTTGGTCGGCAGCACCTCGGCGATATACCGAT
+CGGTGACATATCGCAGGGTGATGATCCCTGCCGGCCGCTCATGACCTTCGCGCTCGATTT
+CGGCCCAGCGCTTGATGGCCAGGCCATAGTCCGTACCGAGGGGCTCTTCCTTTCGTGGTT
+TGCCGCCGTGGTCGTAGTAGTAATAGGAGCGAGTCCCGCGCTTGCGGATCCGCAAGTGCG
+GGATAGCCCCGGGGTTGGATGGCCTTCGGCCCATGTCATGCCCTTGCTTTGTTGGAGGCC
+CAGCGTTTGGTAGGCTGCTGTGAGCTGGTTTCGCCCTCAATCGCGCTACGGGTAACGATC
+GGCCAGCCGCCGGCGTCCAAGTGGTGCCGGATGCCATTCGATACCAGCACACGGATCTGT
+TTCTTTCGTGTGTAGGCCCGCAGGTAAGCCGCGAGCTCGGTTTTGCTCAGAGCAATCTTT
+TCCGCCGCTCCCATCACGCTCCCTCACGATTTCGCGCCATGGCGCCGTCGATGGCAATGT
+CCATTGCCTTTCCAATGAGCATCGTTGCTCCTGATGCATCGTCATCCACTAGAAAAGGCG
+GCTCGATCATGCCGGCGGTAAATCCAGTTTCAGGGTCGGGAGACTCGATCGCTGCGAATC
+GTTCGGAATGGTCTCGAAGCCATCGGTAGCGCCGCGCATCCAGCATTGCCATTTCGAAAT
+CTGCTGTGTCGATGCCCTGCATATCAGTTCATCCTCCGAAGCATTAGTGCGGGCTCCGAT
+CCTTTTGCCTGCTCTACTCGCTTATCCATCCAGTCCGCCGTTGCCTCCTCTCCCGCGAGT
+GCTCGCATCGCCTCAATGACGCCGATCATGAGCAGATCCAGGTAGTCAGCTCTGGATTCC
+ATGTCAGGTAGCTCATCCATGAACCCAAGGGCGGCAATGACTTCTGCAGCGCTTTTGTCT
+TGATCAACCATAGTTCTGTTTCTCACATTCATTGCGTGCGGCCAGCCCTGCAGCTGCAGG
+CGGCATTGGCGTGGTGGTGTAGATGGCCCGGATCGTGCCGGCGGCGGCCGGGCGAGCATC
+GGGCGGGAGTTCCTGCAGGCCGGCCAGCATCTGGTCCAGCGATACCCCGGCGGCGCGGGC
+CTGCTCTGCGGTGGATGCGACTTGGGCGAGTGAGCTGCACCAGGTAGAAGTTGCCGGTGC
+CGGCTGCGATGCCAGCGTGGCGGCGAAGAGCAGGGCGGGGATCACTGAGTTCCCTGGATC
+TGTAAGCTAGGCCGACCGATCGGGCGAGCGGAGGTCGCATCAATGGCCGCCGGCAACTGA
+CCCACTTCGTCGGCGAGGCGGATAGCGTCGATCTCGACCTTCACTGCGTTGATGTAGGTC
+CCAGCGACCAATGCCGTGGCTTTGGCCCGCTCGATGACCTCGGGGTTCGACTCCGGATCA
+CCCAAGGATTCCAGCATTGCAACCAGGTGATCTCGCACATCGGACATCTTGTTCTTCATG
+ACTGCTGCCTTTTGTTGATCTTGCGTTGTAGGGCACCCTTGAGCTGGATGAGCTGGGCGA
+CTTCCTTGGGATATCGGGTGTGGTAGCTGTTCCGGCGCATCAGTTCGGCTCGGCTAAGCA
+GCTCGAGTCGGTCGGCCGTGATAAGTGAGGCCTCAACGGTTGCGCAGCCTGGCTTGAACA
+CCACGGCGTGACCCGGCGGAATGGGGCCATGGACTGCCTCCCAGACGAGGCGGTGTACAG
+CGACCCACCGTCTGGCCGGGTAAAGCGAGGGATCGTCGGTGACCTTGCGTTCAAGGTAGC
+CATCCCTGCAGATTCGCTCGCTACCAATTGGCCGGTAGTTGTGCTGAGCAGCGCCGGCCA
+TCTTTCCAGCCTTGAATTGAGTTTCAGCCATTCGACCCGGGGCCCAGCCTGGAGGATGCT
+TCTTGCCTTTGTTGGCAGGAGTTTGGCCAGGCTTGAATTGGGTGGCGATCATGCGCGGAT
+TTGTCCGTCCTCGAGCGATGCGGCCGGAGACATCGCTGGCCATGAAGGCCTCGCTTTTCC
+TGACGCCGAGTGTGGCGGCCCGCCCGTAGATTGCCGGCTTGGACCTGCCCATGCGGCGGG
+ATAGATCTGCGCAGGTGATGTCGGGGAAGAACTCACGAACCATGGCGTCTTCTGCCTTTG
+TCCAGGGTCGACGGCTCATGCCAATGCCCTCCGGCCAATATCAGTCAGGTCATACCTGCC
+CTTGCCGGCGTGGCGTAGCAGGCCTGTACGAGCGAGGCGGCGGAGCTTTCCGGGCGGTAG
+CGCGACGGCACCGGAGGCGAACAGCTGGATCTCGCCGCGCTCGGCCGGCAGGACCAGCTC
+GGGGTTGATCGGATCGGCCGGCGCGGCCGGGATCTCAGCAGCGGTATTGCCGGGCATGCT
+TCCGTAGCCTATTTTCGCCAGCCCCTGTTCGGCCTTGCGGACCATGTCCTGGGCCGATTC
+GCTCTCGCGCCAGTTGGGGTAATCCTCGAGCCAGTGATCGAGGAACGTTTCTGCCGGGGA
+GGCCATAACGGTGGTTCCTGTGTAGCCGCCAGCTATCGAGCGGCGATGTGGGTGGTCAGC
+ATTTCATTGAGTGCTGGAGGGATATCGGGGAAGTGCAGCCAGGGCTGCTTGAATTGCGGG
+GCCCAACTGCATTCGCCTGCTGCGTCTCCGACGCAATTCCTTCGACACCAGGCGTTAGGC
+TTGCCATTGAGGACCTTGACCCGGACGCGGTGGAGCCGTGAGTCAAACCAACCATCAAGT
+GGCTGGAACATGTCGATGGTCGGCACAGAGTTATCGATGGCCATCTGCAGGCCTCCGTTG
+GCTAGAAGGGGATATCGTCGTCATCGAAGGGCGGGGCGCCCTGATCCGGCGGAGGCTCGT
+GTTGCTGGGCATGGCCGCGCTGGTTGGCCTGCTGGCCACGACCGCGGGAATTGCCGGGCT
+GCTGCCGGTTGCCGCTGGATCCACCATCGCCACTCAGCATCTGCATATCGGTGGCGATCA
+CTTCCGTGGTGAAGCGCTTGATGCCTTCCTTGTCGGTGTATTCCTTGGTGCGCAGCGAGC
+CTTCGATGTAGACCTGCCGGCCCTTGCGGAGATACTCCTGGGCAATCTCGCCCAGCTTTC
+CGAATAGCACGACGCGGTGCCATTCGGTGCGCTCCTGCCGCTGGCCGGACTGCTTGTCGT
+TCCAGGTCTCGGCTGTGGCGACGCGGAGCTGGCAGACGGCTGTGCCGCCGCCGGTGTATC
+GCAGCTCCGGATCGCCACCGAGGTTGCCGACCAGGATGACCTTGTTGATGCCGCGGGCCA
+TCAGTGGGCAGGCGCCGGGGAGGTGGCAGTCGAGCGCATTTTTGCGGCGTGGAAGTCCAA
+AATCACCGAGAGCCACAGCCGGATAGCGTTGGGTGTAAATCCAGCCCGGATCAAGGCCTG
+ATCAGCTGCGCTTGAGGCTTGCGGATCTTCCGAAGCGCTGCACATCGCGAGGCCCCCAAC
+CATGGCCATCAACTGGCCTTTGATGGACATGACTTCAGCAACAAACTCAGCCTCACCAGA
+GGCTTCGGCGCGTTTAGCTATCGAATCGACAAGGTCCTTGAACGACTTTTTTTCGTGAAT
+CACGGCATGACTCTCCCGTGCCGGCCCAAAGAGCCAGTAGCAAAATGTGTGTTGTGGGGT
+GACCGGTGAGCGCCGGCCGCGCGGTGGGTCAGGAGGCTTGGGCTGCGTTGTCGGTGGTGC
+TGGGAAGAGTGGCGTCCTCGATTTGGATGCCGAGTCCAATCTTGCTCACAAGGTCATCCT
+GGGAGGCGAGGTCAGCGCGGATGTGCTTGCGAACCACGTAGGCAATAGCCTGGGCCTTGG
+ATGGTGCTCGGACCAGGTAGTCTCGGGCCAAGCCGGCTTCGCGGGGCGCATCGATCAGCT
+CATTCGTCACGAGGTAGATCCGTGCCTTGGCAGGCTGGCCTGTATCGGTCGGGCCGTGTC
+TCACGAGCCACCTCCGAGCATGCCGGCAAAGGCCAGGGTAAACATGGAGCCAAGGAAGAT
+GCCGGCGGCCATGTATGCGGCGCGCAGAGCTTGCCCGCGGCCGGTGGTGATGGGAGGGAT
+GTAACCCATGTTGGTGATCTCCATCCGCCCGGGGGCGGTTCTGCGTGAGATGTCTCACAG
+TTGTGGCGGTGCGGCCTAAAAATGAATGAGCGAGCGACGCAAGACTTGTATAGGATCAGC
+GGTTGCTCGGCGGTTCGAGCTGAAATCCCTGCTGATTGCAGTTGCTATGTGGATCTGAAA
+CGTAATGTGTCACCTGTAATGCCTATGCATGGATATTCGTCGCTACCCCCGCTCCTGTTC
+CTGACTGGACTCATTTGTGCGGCTGGCTTTTCAATGGTCTTGAGGGCGCTCGGTGACGAA
+AGGGCGTACAAGTACTGGGCATTGAGTCTGTGGGCAGGTGTCTTTTCAGCTGCCTTGATC
+ATCATCTTCCCCAGTCACCGTCCTTTGGCTGTGGTCGTGTTAGGCCACGCCGCACTGGCT
+GCATCACAAGTCCTTTTGATTGCTGGCTTTTTCAGGTACTGCCGCCTGAAGTGGAGCGTT
+ACAGCTCTGATTGTTCCTGCTGTTGCCTACACGGCTGCTCAGACGGCGCTGTATCTGTTC
+GGGCTAGGAAGCTTCCCTAGATTCGCTCTGTACAGCCTTGCTGTTGCAGTTTGGGATATT
+TGGTCCGTCCAGCTTCTTTTGCGATACCTCCCGGGACAGGCTTTTTACGGGAGTCGTCTT
+GCCGTGCTCGTGATCTCGGTGCATGCGGCATTGCATACCTTCAGCCTTATCCTGGCTTCG
+TCGGACCTTTTGTTTGGACTCGCGAAGAGCGCCAGTGAGTCGCTGCCGATCTACTACATT
+GCGATTTGCATGAGCTTGGCGAAGGCCTTTGCGTTGCTTGCGATGGTCATCGAAAAGCTG
+ATCAACGATCTAAAGATTGCCGCCGAAATTGATGGCATGACAGGCCTTGCAAATAGATCC
+TCGCTCATAGATCGGGGCGAAGAATTGCTCATGCGGTGCAGAGAAGAGGGCGTCAAATTC
+GCTGTCTTGTTCGTGGATATCGACCAATTCAAAGCAATCAATGACGACTTGGGGCACCAC
+GCTGGGGACATTGCCCTAAAAGCATTCGCATCGATCGTCAAAGACATCTTCGACGAAGAG
+GATGACATCTGTGGCCGCTATGGTGGTGAGGAGTTCGTCTGCCTCCTTACAGGCGATTCG
+GCCACCAACGTTGTGCGGAAGTCTGAGATGCTGCGTAGCAGGCTGGCTCACAAACCGATC
+CGGATCGGTGGGCATGCGCTAACCATGACGGTAAGTATTGGCGTCGCAACTGATGATGGT
+GAGATCTGCCTGCTTAGACTGATCAAACGAGCTGATGGCGCACTATATGAGTCCAAGAAC
+TCAGGTCGAGATCGCGTCACTCTGGCAGTCTGATCTTGAGGGCGGGCCTGACTCATCCTT
+GCTGGGTTAGAATCAGGCACCCGGTTGAATGGTGCTGGCATGGCTATTTGCGATAACCCA
+GACGTGATGGATAAGGTCTGGCAAGGCCTGGTTGATGTGGTCAGCCGATACGATCCGGCG
+ATCCGTGGGCATCTTCAGCACTGGGTGCAAGAGGAGCTGGACCGGTTACCGCCAGAGGCG
+GGGCAGGCCTATCTACGTGCCTCCTCAGGGCGTGCTGTGATCGAGGCTGAGGAGCAGGCA
+GAGCTGTCTGCGATCCTGCGGTCACTGAAGAAGACGCTTCACGAGGATGCTCGAGGCAAA
+TTGCGCGGAGTGGTCTAACAGGGCGTCTGCTTTCCAGCTGATCCGTAGTTGCGATGTTCG
+GATTGGACTGGCGACTGGGCATTTCCAGGGGATTTCGGAGTTTTCCATCGCGGTGCTGGG
+CGGCCGCCTCACGGCGTCCAGGCTGCTGTCTACAGCCGCCAGTCCAATGCCCCCGGCTAC
+TCGCAGGGGCGGCGAGGTCATGTCACCCAGCGGTGGTTTGCGTCGTCCGAGGAGCGCGCT
+TGCACCGGGCCATGGCTGCCGAGGTTTTGTTGTGCACGCCCACTCACGGCTTGGACGCTC
+CGGACTGACTCCGGCTGCAAGGCATTGGGCTGCCGCCTGGCGGCCCCGCTACGGGCCATT
+CCTTTTCCCAGCGATGAGATGGCACTCCGGGTGTTCAGCGCCCCGGCCGGCGCAATTTCC
+AGGCGGCAGGCCAATGCCTACTCATGGGGTGAGCGGTTTGTCACTGTTCACAGGTATGCG
+GCCAGAGGAGATTACGTTGTTGATGAGCCGCGGGATGAGGTCAAACAGCTCGCGGTCCAT
+GTGCTTGAAGTCAACGCAGTGGATCATTCGCAGGCGCTCATATGACTCGCATGTCTCTGG
+TGTCTGGGGGATGTTGAAGGCCCCGACAAGGTCATTCAGAGGGCAGATGTCGAAGAAGCC
+GCTGCTTGAGCCGGATCTCTTCTGCCAATCTGAGATTGACTTACGCAATACGGCGCGCTG
+CTCAAGAGTTGCCCCATCCGGATCTGGCCATACGATCATGTCGATGAATGATGGCGCTCT
+CTTTATGGTTGAAAACACCATCGCTCCAGTGTCGATGGTCACTTCCTGCTTGGCTGCGCT
+ACCGCCAAATAGGCGTGCGATGATCGCTTTCATGCTTTGCTCGTTTTGGCGTCGAATTGT
+GATGAGGTCTGTCGGGCCCGCTACGGCCCTGTCCGACGCAAGAGGCGCCGAGTGTTCAGC
+GCCTCGGCCAGCGCAATCCCAAACCCCATCACAATGGCCACTGTCTCCAATGGCCGTTGC
+TGACCTCTATCCAGGCTGGTCAGGCCTTGGCTCCCTATGCATGTCCAGCGCAGCCTTGCG
+GGTGCGTGCTCCGGAGATCCTCAGGGAACCGTCCCGTTGTGAATGAGCGGGTGATGCGTG
+CCGGGCGTTTCGCGCCGGCAATCCAAATATAGGTACGACTATATATTCATGCAAGCATGC
+CTATTAAGCAAGCTTATATTTGTTCATCATTTGTTTATGATTCTGTGCATCCTGTACTTG
+GGCATGTAGAGCAGGCGCATACGCCTGACGAGGGTTACAATGGAGCCACCATCTAGGGGA
+TAGATATGCTCAAGAGAATGTTGCTCGTTGCAGCCGGCTTGGCTATGTGTGGCCAGGCAT
+ATGCCATTACGTATGGCCAATATCAGGCCGCTGAGTCCGAGCCTGGGTCGGTTGCTGCTG
+GCGCTATGGGCATGTACCTAGTGGGGGCTAATTGCCGGAGCTCAGATGACCAATGCCTAC
+GCAAAGATTTCAGGTCATGGGGCGCTTTTTTGCCCGCCCGGTAAATTGAAGCTGGACGAT
+AGGGTTGCCGCAGTATTGATAGATCAGGAGGCCCCCAAGGGCCATGCGACTGATGACACG
+GACATCGAGTCGATTCTGATTGCGGCCATGGCTCAAGGCTTCCCCTGCAAGGAATGATCC
+AGGTTATCGGCTGGCGCTGACAGGGAGGGTTGCTGATTGGTCTGATTGATGGTCGTCTGC
+ACATGGTGGTCTTTACGCCACGCGCTGGCGCGGTGCACGTGATCAGCTTCCGCAAGGCCA
+ACGCCAGAGAGGTTAAACTGTATGAAAAAAGCACCAAACCCCAGCAAGATTGATGCTGAA
+GCTCCTGAGTGGGGCGTCGAGGCCTTCGGAAAGGCCAGGCCAGCGCATGATGTACTTCCT
+GGAATCTTTGGCGAGAGGGTGGCCAAGGAGTTGCTGCGCCCACGGGGAAGGCCGCGTGTA
+GCTGAGCCCAAGGTCGCGACCAACGTACGTTACTCTCCGGAGATCCTCGATTACTTCAAG
+GCGGATGGCCCAGGCTGGCAGACCCGCATGGAGCAGGCACTATGCGAGTACATCTCGGCG
+CATCCGAGGGCTTGAGGCACTAGACTGCTGCTGAGCATAGCTGTATGAGATCTGTCGCAG
+TGGATGAGACGCCGCTATGTCAAATTCCCAGCCATGTAATGACCCACCGCTTTCTGCTCA
+GGTCATGCGGTTAATGTAGCGGCGTAAGCCTCATCCGGGGTCATCATCTTCAGTGCCTGA
+TGCGGGCGTTGTTGGTTGTAGAAGGCGATCCAGTCGGCGATCACCCGCAGGGCATGGACC
+TGGCTCTCGAAACGATGCCGGTGCACGCACTGCCCGCAGCAGAATGGCATAGCCGAGAGC
+CTAGCCCGCACGATCAAGCGTGATTACGCGGCCTTGATGTCCAAACCTGAGCCGGCCATG
+GCCATGCGAAACCTCGCATTGGCCTTCCAACACTATAGCGAGCATGATCCCCTTAGCGCC
+CTGAAGTACCGCCTTCTAGTGAGTACCGGTGCCGATTGGCGTCGTTAAACCAAGTGTGAG
+TCGGTGTCCGAAAATATGGGGAGCACTCCAACTATCAAAGACTCATGCTGATCGCCTTAT
+AGATCGCATTGGATTGAGTGTCGTGTTATGCACATGTTATCCACAGACTGATCGATTGAG
+AGGTGCTAGACTTGCACACAAGTTTTTTCAAAACTCCCGTTTATCGAGGATTGCTATGAG
+CGAGCGACTGACGAAAGTTCCGACCCCGCAGGGCGAAGTTGAGGGTAGGGAAGTGCAGAT
+TGTTGAGTCCTTAGAACGCTGGTCTGACGTGACTCTTTCTGACGGGACGACGTTTCGTGC
+AAAAATTAATATTGTTAACGTTGTTCGCATTGATGGTCAGTATGATGCTCAAGGTAATCC
+TTCATACATGATTAATGCTCAGCCAGCTATTGCAATGGTGCACGTTCCTGACGAACTGCG
+TAAAAAAGGATAGGTCTTATGATCGAATTCCAGAGCAATATCGGCACAGTAATAAATTAT
+GGCTCTAACTCTTTGATGCCTATTTCGGTGTTAATTTCAAGAGATTCGCCCTCTGTGGAT
+TTTGACTCTAGAAATGCTGGTAAGCACTCCTGTTTTGGAGGTGCGCTCGAGCCAATGTCG
+GTGAGTGCATTTACTGGCCATGATTTTGCCATTAAATCTAAAGGCAGGCCATTTGCTTTC
+AGGTTAAACCCTTCTTTGAGATTTATTTCGGATTCTCATGATTATGGTGAAGCATCGTTT
+AGACTGTTGGCAGAGAAGTTGAAAGACGATGTGAGGATGTCTTCTTCGCTTTCGGATATG
+GAGTCCTCTAAATATTTTAGAGATATCTTATCAATGAATGGGGATGTGGTTAGATGGATT
+TTAGAAGATATTAAGAGTAATAGGAAGGATCCTTTCCCTTGGTTCAAGGCACTGCGCTTA
+CTGACAGACGAGGATCCAGCCAAAATTGCACCTAGAGGGGACTGGGTTGCAATGGCTGAT
+AAATGGATTGCCTGGGGGGAATCTGATGGGCGATTGGTTTGATCTAGCTAAAGAGAAGGG
+TTTTCCTAGACTGACAAAAAGCTCGTCTCGTATTACGAGTACTGAAACAAGTAGATACAA
+CTGTCTCGCATGGGCTGCAAATGTAGAAAACAGGTGGTGGTGGCCATATGGAGACGCTTG
+GTGGCCTGAAAATGTGCCGCGAACACTTGATATCGATTCATTGAAGGCGGCATACAGGAC
+TGTTGGATTTGTTGATTGTAATGACGGATTGCTTGAGGCGGATATAGAGAAAATCGCCCT
+TTACGCATTGAATTCAGAATTTACCCATGCTGCGCGCCAGCTCCCAAGCGGAAAGTGGGC
+TAGTAAAATGGGGCATAGTCATGATATCGAGCACGACTGTGTGACCACCGTTGAAGGCGG
+GATTTATGGTGAATGCGTTGCTTATATGTGCCGGCGCCGTGCCATAGATTGACTATTTAG
+ATCAATTGCAGGACGCCAAAGGTCGGAACTCTTTTTTGAGTGATTACCTTCTTGCCTTAT
+TTAAAATGCATATACCAGCAGGTGTGAGTGATCAGCGGTGTAGTGTGCTCGTCACCATGC
+GATCCAAGTCAACGAACAGAGCATCACGTTCGGTCTTCGAGGCAGGTGATGCCATAAGGA
+AAGCGGCCACGATTACGCTATGGCCATCAGGCCAGGTCAGGATACCGATGTCGTTGTAGC
+TGGAGGTTAGGCACGTCCAGTGTGTAGGACGTGCCGCTTTTGTCCGCAAGTCGTAAGCCT
+TGGGGCAGTCCTCGCCGCAGGCGTTCCGGCTTTGTCTGTGCCTGCATCAGTGCAAGCAGC
+GCGTGTGTCGATGTAGGTGAGAGCAGGGCGCCATGTTGCAATTTCTGGAGAAAGTCCGCA
+TCCACCCGCATGCCTGTGATGCCATGTGCGCGCAGGAAGGTCGTGACCTCCTGCGGCGGA
+ACCAGCTTGAGCAATGCATCGACGGCGGTGTTGTCGCTATCGCTGACTGCGGCGGCCAGT
+AGTTGTCGAACGGTGTATGTCATCCGCCCGCCGTGAAAATGCGCACCGATGGACGGTACG
+GCGGAGCCACAGACAACATCTGAGCGCGTCAGCGTTACTGTATGTTCCATCGACAGCTTG
+CTGCCGCTGGCCTGAGCGACACCGCTTCCGCAAGGTGAGGTCGCCGGACGCTTACGATTG
+CCTCAGTCATTGCACTCAATTGATGACACGCCCTAGTGCACCAACAACGAGGCGCACCCT
+GTTCAGGCCTGACATTTTTCATACCCTGGAGCTGGATCGGGTAATGATGCTGCACCAGGG
+GAGGCTTACACGTCGTGCTTGCGTGGACTCATGGTATCTCCAGGTCAGATGGCAGTGTCC
+CGCCTGTGGCCCGGTTACACAAAATCTAGGACACCCTCAGACCTCAAATTTTCAGCCCTT
+TCCAAACCGTCCGTAATTTCGGGGTAGAACCCCTTACGAGAAGCTTCGCCGAGTTGGGCC
+TCGTGCCGCTGCTAGCACTCCATTGTGCTGGCAGACATGGCGCGGCTTACAGTTCTTCGT
+CGCGCTTCATCTGGATCGCTCCCAGGACGCGGCCAGCAATGCAGATATCAGAGGCCTGAT
+CAGGCCGGTAGATATCCGGGTGATCCGGATCGGCCAGGCTCACAACATGGAAGCCGTCGC
+GACGGATCTCGATGCGCTTGACCAGGGCATGGCCATGGAGCAGGACGACGAAGATACCGC
+CGTCCATGGGGTCTCGATCCTCAATGTCCACGAACACGACATCGCCATGCTTTATGCGCG
+GGGTCATGGAGTGTCCGCGAACTGTGAGGAGCTTCACTCGATCGGGGCTGACGGCGCGGC
+CAACTTTCTGACGGACCTGCCACTCGGCGATATCCACTTCCTGGAGCACTTCCGGCTCTT
+CACTGTTCAGCACACCTGGCCCCGCTCCGCCTGCACCCATGACTTGGAAGCGAAGGTAGC
+CTTCTGGTGTCTCAGATCGTGAGATTCCCAGATGTTCGAGCGGGCCTCTTGGGCCTACGC
+CAGTGGCCAGCCAGCGAGGGGATACGTCAAGCACGTCTGAAAGCTCAATGAGCGTGGTGT
+CCTTGAGGCTCTTGGTTGAGCCTGACTCCCATTGATAAGCCGATGCTGCCTTGACGCCTA
+CCCGTCTGGCTAGCTCTGCCGGCTCACTGATGCCTGCAGCCTCTCTGGCTTCTTTGATTC
+GTTCTGCGAGCGTTCCAGTCATGTAAGGGAGCTTATATGGTGCATGTATAGTTGTGCTTG
+CATGATAGATGTAAGCAAGCCTATTATTGCGCCATGAAAAGCGCACCTAAGATCACGAAG
+GCAGAAGCAATTTCGCCCTTTGGCAGCGGCTACGCTCTTGCGAAAGCCCTGGGAATTGCA
+CCAGCGTCCGTATATCAGTGGCCTGATGGCATGCCTATACCTGAGCTTCAGGCAATGCGC
+CTGGCATTTTTGATCCGGCCGGATATTTTCGGCCCAGCTCAGACCAAGCGTCGTAGTGGT
+CACGGTAAGGCGGCGTGATGAATCGACTGATCCTTTCCGATAGCGCCGCCGTGATTGCCC
+TGGCCATATACCTGGGCATCCCCTTCGAGCTGATTCCCCGCGCACTGCGCAACCTGCTGC
+TGATGGCCTGGGGCGCGTTCGTGCTCCTGCAGATCGCCGGCCGGTCTGTATCTACCTTTT
+CGCTTTTCATGAAGCGCCGCCCATCGGACTGCACTCCGGAGGCCAAATGATTCCTGCCGC
+AATCGTTCTGCATGCCAATGGCATGTTTATCGAAGACGACTCTGTCGAAGTTGACTGCAT
+CGTGCTTCCGTTGACGGACTGTCTCGACATCAGCTTCCACCGGATACGAACTGGCGAAGC
+AGTGTTCCAAGCACACTCGGTGCTGGCGACAGCGTCGACCAGCCCGCGTCGATCAGCTTT
+TCGACCAGGCGTCCTATGGCATCGCCCCGTGCGTCACGAAGAACCTGTAACCAGCCTTTC
+TTGTCCTCGTCCGGAATGCTCATGCGCTGGACCTGAGCCTCAAGCAGCTGACGGAGGGTG
+TCCTCATGAAGCTTGACGGTCACCGTTCCAAGGATGGCGCTGAGCCCTCCGTCAGCACGC
+ATGAAGTCAATGCCGGCGGCCGTTATGCGCGCTCGAGCCATCCCGTATTGGGAGGGATCC
+TCAACGTATGTCTCAAGATGCGCAGCAATCATTCCGTGCTCATCGAGATAGTGCAGGTTG
+CGTGCGACTTCGCCAGTCGGGTCGTTCTTGATGGCCTGACAAAAGTCTTGTTGCTGCGGG
+TATGCCTTAAGCAGCTCTTCAAGAATCTTGCGTTGATGGTCTCGCGCAAATCTTTCCATG
+GACTCCATCTTCCGGTGAATACCAATGACTGAACTGTCGCATTCCAAGGGCGTCAGTGCC
+ATGAGTATCGTTTTTCATGCCTCCCGCAAAGACCTGGTCCGGAGCATCGCCCGCGATGCC
+TTCAACGCTGGCGATCTCAACCTGATGAACTACGCGGACCGGATCCAGGAGCTGTACTTC
+ACCTTGATCCCGCCGGCGAGCCAGGACACCAACCTGCGCCAGCCTTGTGATGATGCCACC
+GGTGAGCGGTTCGAAGCTGATCGCCGCCACAACCGGCAGATCGTTGAGCGCTGGGTGAAA
+GGGCGGGTCGCTGAGTTCCCTGACGATCTGGAAGAGCCATGGGTCATGGCATTGCCCGAC
+CAGTGGCGTGACAAGGCGCTCACGGAGCTGTCGGCCCGCTATGGCTTACTGCCTGCGCCG
+ATCCCCAGTGGCGGCCATACAGCGGCATGGACCGGCGACATCATGCAGTCCATGGCCGAC
+GTCCTGCGTGACTTCGCGCCTATTGCCGAGGACGGCGTGATCAATCATCTGGACGCCGAC
+GATCTGCCGGCCTTCATCCTTTCCAGTGCAAAGGCCATGGGCATTTTGTCGAGCATGCAG
+CGGCAGGCAAGCGAAGCCTTGCAGGAAGCCGAGCGGAGGAAAGCACGGTGAACTATTACC
+AGCGCCATATCGGCGACTACGCCCGGGATACCGGCCATCTGTCCCTGCTGGAGCATGGGG
+TCTACATGATCCTGCTCGATCACCATTATGCTTCTGAGGCGGGCATTCCCGATGGGAAGC
+AGTACCGCCTGGCACGTGCACGCACGCCCGAGGAACGGGAGGCCGTCGACAACATCCTGG
+ACGAGTTCTTTGACCTGAAGGATGGGGTTTGGATCAATCGCCGCGCACATCACGAGGTGC
+TGCGCTTCCACTCCACCATGGCCGACGATGCAGATCAGAAACGCGGTGCTGCAGAACGCC
+AGGCAAAGGCCCGCGCACGTCGCTCGGCGCTGTTCGATGAGCTGGCGACCTACGGGGTGG
+TGCCCGACTTCAACGCCTCCATGCAGCAGCTCCGCCACATGCTTGATGAGGTGAAGTCAC
+AGCGTAAGTCACAGGCTCCGTCACGTAACGTCACGCGTGACGTTACGGCTAACCAAGAGC
+CATTACCCAATACCCATTACCCAACAGCCAATACCCAAGAGCCAGTAAACCTCTCCGTAG
+GTGAAGTTGCTCAAGACTTGGGAACTGAGGTTCTAGGGGAGGTCTTTTCCGCGCGCACGG
+CAAATGCGCCGGCAGAGGATCTGGATGGCAGGGTGATTGACGCCTGCAAGGCACTGCGCC
+GTCTTGGGGTTACCAGCGCTAATCCCGCGCTACCGAACCTGCGGGCGGCTATCCAGGCCG
+GAGCGTCGACGGATCACCTCGTCGCGATCACGCAGCAGCAGATCGAGGACGGCAGGGCGC
+CCAATGCCAACTACATCGCCCGCAAGGCGATTGGCCAGATCGAGGACGCCAAGCGACCGG
+CGCCGGTCCGCGCCGGTGGCGCTGGGATCGCACAGAACAAGCAGGAAGCCATCGAGAACC
+GCAACCGCAGTGTCGCCCAGCGTTGGGCCAGCTCTGCCAACGAAGAGCCCCAGGAGGCTG
+AATATGCAATCGGGTGATATGAATGGTTTTGCCGAGATGCTCTCGGAGGTCATGGCCTAC
+TACGCCAAGGACGTGAGCGAGTTCATGCTCTCGGTGTTCTGGGACGGGCTGAAGATGCAC
+GAGTTCCAGGACGTGAGCCGTGCATTCACGCTGCACGCTCGTGACCCGGATCGCGGCCAG
+TGGGCGCCGAAGGTGGCCGATATCACCCGCTTGCTTGAAGGCTCGACCAGCAGCCAGGGC
+ATGACGGCTTGGTCGAAAGTCGACAGGGCCATTCGGTCGGTCGGCGGCAACCAGTCGGTG
+GTCTTCGATGAGCCGCTGATCCATGCCGTGATCTTCGACATGGGCGGCTGGTCGAAGCTC
+TGTCAAACGATGGTGGATGAGCTGCCTTTCGTTGCACGGGACTTCGAGCGACGCTTTGGC
+GCCTATCGCCTTCGCCGCGAGCTTCCGGATTACCCCAGCCACCTGATCGGGAACCACGAG
+GCTCAGAATCGCCTCAATGGCTTCAACCGTGTTCGCCCGGTGCTGATCGGCGACGAGCAC
+AGGGCCCTGGCCGTGATGAATGGCGGGTCCAACGGGAGCCCGCTACGGATCACGCGGATC
+AGCGACGAGGTTGCCCGCATTGGTCAGGCGGCAGCACTAGAACACGGAAAGGGGCAGGCG
+GCGTGATCATCAACCTGCCGCCCGGCACCCATGCCACCGAGCTGTCCCTGCGCTTCGCCC
+GCTTGGGTGATCCCTCCAAGCCGATGACCTGCGGGCAGTGCGCTCATTTCATTCCCAGCA
+CCAGCAAGAGCTGCGGCTATGCCGAGCGACCTGCCGGCCAGGGCGATGCAGCTGCCTGCA
+TTGAGTTCGAGGTGGCACCGTGAGGGCCTTCAAATTGATCCTTGGTAACCGGCAGAGCGT
+GTTTGATCTGGCTGGCATCGTGCGCGAGCACGTTCGTCAGTCGACCTTCGAATGGGCTCT
+GGTGATTCGTCCCAGCGGTGACGCGGCCCTGTACATCGCCACCACGCAATCGACCCAGAT
+GACGGCTCACGACCATCCGGAGCAGATCGTGGGCGTGTTCACGCGGATCCATGATGTGGC
+AACGATCCGCCGTGACATTCAGCGCTGGGTCGATGCCGACGGCTACAACCAGAAGCTGGC
+TCCGATCCGCCTGGTCGAGGGGCGCAACAAAGGCATGTGGGGCGGTCCGATGTTTCGTGA
+ACCCCGCCGGATTGCCCCGCTGATGCATGGCCGCCGCAAGCCCCGGCCGACGTGCCCGGA
+GCATGGTATCCCGTTGCCTCCGGACAGGGACTGGCGCGGCCGAGCTATCAACGGCCCGTG
+CCCGATGTGTGTCGCACGCCGCAAAGCCCGGGAGGGATTGCTGTGAAGGGCGGTCGTCAT
+GCGGCGCAGGCCACGGCCGTCCAGCGCGACCGGATCGTCATGGTGAAGGAGCTTGGATGC
+ATCTGCTGCCAGATGAACCGAGCTGCTGGTCGACCCACGGCATTCTTCGGCGTGGCTGAA
+GCGCATCACCTGCTGTCTGGCGGTCGGCGGCGCGGTCATGAGTACACCATCGGACTCTGT
+CCCTGGCACCACCGTGCCGTGCCGCCGTTCGAGTCGGCCGGTACCGCCGATATGGTGCGC
+ATGTTCGGCCCCAGCGTGGCCACCGGCAGCCGGGCATTCCACGAGCGGTACGGTACTGAC
+GACGAGCTGCTCGAGTACCAGGAGCAACTACTGGCCGGCGCGCGGGCGGTGATGCGGGAG
+GTGGCGGTATGAGAAAGGCAGTGTTCACGGCATCCTGGGTAGCGGGTGGTTCTATCGCCG
+GCGTTCTTCTGTTCTTTGGCCTGTTTTGGGTTGCCAGTCACCTTCATGGTCTATGGGCCG
+GTGCATTTTGCTGTCTACCCATGTGCGCATGGAGTGCAGGGTTCATTGCATGGATGAAAT
+ATCCAGGAGCAAAGGATGAGCAAGCGAGCACATCCGAGATGTCGAAGGCTCGCCAGCTGG
+CAAAAGGGCAGCCTTGCATGATCGGAATCGCAGGCACGTGCAATGGAGACCCCGAGACGA
+CGGTATTTGCACGTTACCCAATGGATGTCTACTTCGATATCGAAATGAGCTCAGATGACG
+AGTTGGGGGCATGGGCCTGCTCAGCTTGCAATGCTGTGCTGGTTAGACGCCCCCCTATCC
+TCGAAGAGTTTTTTTTGCAGTTGAGGCTCTTTCACGCCGAAGGCGTTCTGCGCACCCAGC
+ATGCGATAAGGGAGATGGACAGGTGAAAATGCATTGCGTGGCCACTGAGCACGCCGAGCA
+GGTCGCACTGATGCGCTGGGCTGCCGCAGCCGTGAAGCGTCACCCGGATCTGGCGCTGTT
+GTTCGCCATCCCTAACGGCGGGCAGCGCCACAAGCTGGTGGCGGCGAAGCTGCGGGCCGA
+GGGCGTTCGCCCAGGTGTGCCCGACCTGTTCCTGCCGGCGCCGCGCGGCCCGCATCACGG
+GTTGTTCGTGGAGATGAAGCGCACCGTAGGCGGCGCCGTCAGTTCGGTCCAGAAGGTCTG
+GCACCGCGAGCTGGCCGCCCGTGGTTATCACGTCGTCGTGTGTCGTGGATGGGAGCAAGC
+ACAGGCCGCGATACTCGAGTACCTCTGCATGACAGGTGTCGCGTGATTGCCTGGACGCGC
+GGCAGCCAGCCGCCGGCGCAGGGACGCTACTTGGTGATCGAGAAGGTGTACCAGCGCCCG
+ACATTCGGGTCATGGCGCCCAGATCTGGGTTGGTGCATCGGTGGGCGATGGATTGGGCGC
+AACGCGGTCGAGGCCTGGGCCGATGAGCCGGCAAGTCCGGAATGGTTGAACGATTGCCGG
+ACACAGCCGGCGGCAGCAACGAATTGACGAACGAGGATCTGAACAACATGGCACACATCG
+GCAAAATGCTTGGCCGGCTGAACCCCAAGACCCAAACCTACTCCGACTCGGCCGGCGGCG
+TTGTCGAGCTGAGTGCACAGGACATTGCCGCCGCGCTGGCGTTCGTGCCGGCCGGACTCG
+GCCGTGAGCTGCTTTGCCATGTCTGGTGGCCCGGTGGCGCCGACCGCACGCGGGCACAGC
+TGGATGCGGCTGTGATGGAGCTGCTGGCCAATGAGTGGCGCATCAGGGAGAGCGCAATGC
+TGGATGCGATGCTTATGGTGGCGACACCCGATGTCGGCCGCCGGCGTGCGCAGGATGCCT
+ATGCCCTGGCGCATGCCAATCGCTGGCCGAGCTGGGGAAAGGTGCAACAGGGATTGCTGC
+AGCCGTCACCGGTGTACGCGGCACTTCGGGACGCGGTGCTTTTCGAGCTGCGCACCGGTC
+ACCATGGCGATGCGGACTCCGGCGCATCGGGGGCGATGAGTGATCGAGAGCGGGCAGAGA
+TGATTGGACGGTCCCATGTCACCTACATGAACAACGGATGGCGCCGGGTATATGAGTGGC
+TGCTGGATCGCTGCACAAGCGAGGTGGGTGTCGCTCAGCGAAGGTTTGGACGGGCGGCCG
+CGTAAGCCGCCTCGCACTGGTAGCGTGCAGCACTACCATTTTTGAGGGTAAATTCCCTAT
+CGTGACGAAAGCCCCGCAATCTTGTGGGGCTTTTTTACGCCACCTTGCAACGGGTCAGTT
+ACTGCGTCGCAGCCTTCATTGGCGACACGGTGAATTGCATCGCCAGACCCAAGGCACTGC
+TGATCCGGGCCATCGTTTCGAATCGCGGCTTGCTGCCGGGAGTCAGTGCTTTGTAAAGGC
+TTTCCCGCCCAAGGCCTGACTTGCGGGCAATCTCGCTCATACCCTGCGCCTTGGCAACAT
+GGCTGAAGGCGCGGAGCAGTTCGTCCTGATCACCATCGACCATCACCTGGTTGAGGTATT
+CGGTAATCGCTTCTTCGCTGTCGAGCAAGCTGGAGAGATCGAAGTCAGTCAGTTTCGTGG
+TCATTTTGGATCTCCTTGGCCAACTGCTTGGCCTTGTTGATATCTGCGCTTTGGCTACTT
+TTGTCGCCACCGCAGAGCAGAATGACGATCTGAAGGTTGCGAATCGTGTAGTACACCCGG
+TAGCCAGGGCCTGTTGGGATCCGCAGCTCTGACACACCGTCGCCAACAGGCTTGTGATCA
+CCGAAGTTGCCCTGTGAAGCACGTTCGATGCGCCGAGCAACAGCGATCTTCGCCTTGAGG
+TCTTTGACCGAAGCGATCCAGCTACGGAAGCCATCGGTCTGCTTGACGATGTAGTTCATA
+GGCCAATTGTATCCAAGTGGATACAGTGATAGCAACAATATCCACGAAGTGGGACGCTCA
+TGAGCCACGTTATCGAACTCGTTACGCTGGATGGCGAGCATCGTGTCGGCAGTATGGATA
+TCGCCTCATCTCTGGGGATCCAGCACAAGAATGTGCTCGAGCTGCTACGCCGTTATCGCG
+ATGACTTTGCGCAGTTCGGAAGGGTCGCGTTTGAAACGCGACCCTTTGAAACCCCGGGTG
+GCAGCCAGTCACGTGAGGTGGCAATGCTGTCTGAAGATCAGTGCTATTTGCTGCTTACCT
+ACAGCCGCAACACCGTGCGGGTCCGGTCGCTCAAGGTAGCGCTGGTGCGGGCATTTGGCA
+GCGCGCGCCGCGAAGGCATCTCCCGGTCGCTGACCGCCTGGCAGGAGCTGCAACGCCTCG
+AGATCGAGAACGCCAGCTCGCTGACCCGGGCATCCATCGGCTCGCGCCTGATGCTCGAAC
+GCAAGCGCGCCTTGCCTCAGTTGCGGGCCCGGCGCGAGAAGCTGGAAGCGCAAGTCATCC
+TGCCGATGTTCGCCTTGCCGAACTGACGGTCCTATCCACTGAACAGGCATTCCCGCGGCT
+GCGGGTTTTTTTATGCCCGGAGAATGAGCATGAGCAAAGAAGCCGCACTCGCGGTGGCGA
+AGATCTCGCCGCCCGTAGCGTGGCTGTATGGCGAGATCACAGGTTTCTGGCAATGGATGG
+GCGGCGTCAATTGGGGCGTGGTCACCGGTGCCCTGACTGCGCTGTACACCCTCTTGATGA
+TGATCCACCTGCTGGCGCACTGGAACCAGCGGGGCGTGCGGAGTGAAGACGATGGCAATC
+TCCCGTAAGCCCGCGGCCGTCGCCGGCCTGTTCGGTTTGGCTGTGGCCATCGCAGGCTGG
+ATCATCGCGCCATCGGAAGGCAACAGCCCTGTGGGCTACGCCGATCTCGCTGGTGTGCCG
+ACGGCATGCCTTGGCCACACCGGCTCGGGCGTGGTTGTCGGCCAGCGATACAGCGAGGCG
+CAGTGCCAAGCCTGGTTCGCCAGTGATGTCGGCGCGGCCGCTCGTGGCGTGCAGGCCTGC
+ATCCATGGACCGATGACCAGCTACCAATGGGGCGCGTTCACTTCAACGGCCTTCAATATC
+GGCGTCGGACAGTTCTGCCGGTCATCGATCGCTGCCAAGGCCAATGCCGGCGACATGCCG
+GGCGCGTGCGCCGCGATCTCGCTGTACGTGTATGCCGCGGGCCAGCCGCAACCCGGATTG
+ATACGGCGTCGCGCGGCCGAGCGTGCGCTGTGCGAGGGCCATACCTGATGCGCGTCATGG
+CCGGAATCATCATTGCCCTGGTGCTGGCTGTGGCTGGTGTCAGCTGGCACGACATCCACG
+AGACGCGGGCAGCGGCGAAGGCTATCGCGGCCCGCGACGATGCCCATGCGGCCAACGTGC
+AGCTGCAGCTGACGCTGCAGACCGAGCGCAACAACACCGCTGCGGCCAACGCGGTCGCGG
+CGCAATACGAGAAGGACAAAGCCCATGCCGAACAAACGGCCACTTCGATCGCTGCTGATC
+TGCGTGCTGCTCGTATCCGGCTGCGCCCAGTCTGGCGTTGTCCGGCCGCAACTGCAGTGC
+CCGCAGCCAGCACCGGTACCGGCCAGCCTCATGCAGTTACCGACGTACAGGCAGCAGCTG
+CAGCAGCAGTTGTTCGAGTCGGCGCCGATGCCGACGCACAAGTGAAGGCGCTGCAGGCTT
+TCATCCGATCACAGCAACCGGCCGCGGCCGGCACGGCGAGTCAGCCATGAATTTCATCAC
+CACCATCCGCTGGCTGTTCCGCCGGCTTTTCGTCAAGGAGTCACCCATGACCGAACCCGT
+ACAGCCGGCTGTCGCCGGCACCGCCGCCGTGGCGCAGCCCGCACAGTCCGTGCAGCCCGC
+CGTGGTCCGCACCGATGTCGTCCAGGCCCAGCCCGTCGTGGCGGACCCGTCCGTCGAGCA
+ACTGAAGGCCGAGGTGGCTGCGCTCAAGGCCGAGCTGGCCAAGGTCGAGCCTGCGCGCCA
+GAAGTTCGTCGAGCTGCTCAAGTCCGTCGGTCATGACGTCGAGCTGGTCGCCGACGAGGC
+CTGGGCGCTGGCCAAGAAGGCCATCTGACCGCGGGGATGGCCGTGGGGTAGGTCCCCGCG
+GCCTTCCCGCATCAAATGCGATCCATTCCCATTTGCGCCCGAATGGGCATGGATGGGAGT
+CATTCGCACCTAGGGTCCTCCTGAGGCCCCCCTGGGCCTGCTACGGGTGATCAACACCGC
+GATCCTTCGCTACATACCACCTTTTTTCGGCATGTCCGTGTCCGGTTCCGGTTGAGCAAA
+AATGGCCCTGCAAAAGGACATCGCCGAGCACCTGGATTTGAGCGATCGGCAAGTGCGCCG
+ATTGCTCGCAGATGGCTTCCTGCCTAGCTCCAAGGGCACTGGCGGCTATGATCTGGACGC
+ATGCCGGCTGGCCTATATTCGCTATCTGAGAGGCCTCGGAAACGGGCAAGTAAAAGCGGA
+CACGGCCCCCCTCGAAGACCTCGATCTGGACCCGTTGGCCGAAGAGAAGCTGTTGCAGCA
+GAAGCTGCGTCTGACCGCGGCTCAGGCCGATGGTCAGGAGCTGAAAAACGATATCAGCCG
+CCGGCGCTCGGTGCCGGTGGATTTCGCCATGTTCGTGCTGAGTGGCCTGGCGGCCGAGGT
+CGCCTCGATCCTCGACACGCTGCCGCTGACCATGCGTCGGCGACATCCCGAGTTGGAGCC
+ACGGCATCAGGAAACGCTGGAGCGTGAGCTGGCCAAGGCGCGCAATCGCGCCGCCGGGCT
+GGACGAACGCCTGCCAGGACTGCTTGATGAGTATCTCGCCAGCCCAGATTGATGAGCTGG
+GCCGCGCGGTCAAAGCTGGCCTGCTGCCACTGGCGCGGCCTGAGCCGCAGACCCCGGTGG
+AATGGGCCAACGATCATTTTTACCTGAGCTCGGAATCGAGCTATCAGGAAGGGCGCTGGG
+AAACGCTGCCGTTTCAGGTCGCGATTCTCAATGCCATGGGCAATGACTCGATCCGCACCA
+TCAACGTGATCAAGTCGGCCCGCGTGGGCTATTCGAAGATGCTGCTGTGCGCAGCGGCCT
+ATCAGACCGAGCACAAGAAGCGGAACATCCTCGCGCTGCTGCCGACGGACGATGCGGCCG
+CTGGCTTTATGAAAAGCCAGATCGAGACGATGATCCGCGACGTGCCGGCCGTGCGTGCAC
+TGGCGCCCTGGTACGGCACCAAGCATCGCGACAATACGCTGACCGCCAAGCGGTTCAGCC
+ATCGCAAGCAGCTGTGGTGCTTGGGCGGCGCCGCGGCCAAGAATTACCGCGAGAAGTCGG
+TCGACACCATCATCTACGATGAGTTGGCCGCCTTTGAGCCTGATGTGGAATCGGAGGGTA
+GTCCGACTTTCCTCGGTGACAAGCGCATCGAGGGCTCGACCTTCCCGAAGTCGATCCGCG
+GCTCCACGCCCAAGATCAAGGGCACCTGCCAGATCGAAGCTGCGGCGGGTGAGTCGCCGT
+ATCTGTTTCGGCTGGCCGTGCCTTGCCCGCATTGCGGTCAGGAGCAGGTGCTGAAGTGGG
+GTGGCAAGGATTGCGCCTACGGCATCAAGTGGGACCCCGACAAGCCGACGGATGCCTGGT
+ATGTCTGCGAGCACCATGGCTGCCTGATCCGGCAGCACGAGCTGCAGCCCTTGCAGGCCG
+AGGGGCGCTGGGTCTGCGAGCACACCGGTCTGTGGACGCGCGACGGGTTGGATTTCTTCG
+ACTCTGCTTGCGAGCCGGTACCGACGCCGGAGTCGATCACCTTCCATATCTGGACGGCTT
+ACAGCCCGTTCACGACCTGGTCGCGGATCGTGCTGGATTTCCTCAAGGCCAAGAGCGACC
+CGAACAAGCTCAAGACCTTCGTCAACACCACCCTGGGCGAGACCTGGGAGGAAGAAACCG
+GCGAGAAGGTCGAGTGGGAGCAGCTCTACGGTCGCCGCGAGATCTGGCCGGGTCTGCCGG
+CGCGGGTCGGCGTGCTGGTCGGTGGCATCGATACGCAGGATGACCGTTACGAGGGTCGGG
+TCTGGGCGTTCGGTCCGGGCGAGGAAAGTTGGCTGGTCTCGCGCTGGATCCTCTACGGGG
+ACCCGGCCAGCGAGGAGCTTCGCCGCAAGGTGCGGGAAAAGATCGCGGAGATCTTCGCCC
+GCGAGGACGGTGCCCGGATGCGGGTATCGATGTGGTGCTGGGACTCGGGTGGTCATTACA
+CCGATGAGGTCTATGCCGAGAGCAAGGCCATCGGCGTGCAGTGGGTGATTCCGGTCAAAG
+GTGCCAGTCGGTACGGGCGGCCGATCGCCAATTTCCCGCGGACCAAGAACAAGGCCGGGG
+TCTATCTGACTGAGGTCGGTACCGACAACGCCAAGGAGCTGATCTACAGCCGTCTGAAGT
+TGCAGCCGACCCCGGGCGAAGCCTCGCTGGGCGTCATTCACCTACCGGCTGATGATGCGA
+TCTGCGATCAGACCGAGCTGCAGCAGCTGACCGCTGAAACCAAGGTCATGAAGATCGAGA
+AGGGCCAGCGGGTCTACCGCTGGGACGCCAAGGGGCGCCGCAACGAGGCCCTGGACTGCC
+TGGTGTATGCCGTGGCGGCCCTGCGCATCGCCCAGCAGCACTTCGGACTCAATCTGGACA
+CACCGCCGGCCGTGGCGACTACGCCGCGGGCGCGGCCTGCGCGGCGCGGCACACGGAGCA
+AGGCAAGCTAAATGGCAACGACATCCCCCGAAGTCATCCAAATCCAAGCACGGCTGACCC
+GGGTGGTGGCCGCGATCGATGCGTTGATCAGCGGCGCCCAGGTGGTGCGCTTTCGTGACC
+GCGAGGTGCGCCGTGCCGATCTCGGTGAACTGCGCAGCCTGGAACAACAACTGCGCTTGC
+AGCTGGCCGCCGCCCAGGCTCGGGCCGCGCGGATGGGCCGCAATCGCGTCAGCTATGTGG
+CGATCTGATGGGCATGTTTGGCAAAACCTCCATCCGTGACCGGATGAACAAGCTGGCCGT
+GTCCTATCTGGCGGCGGGCGGCGTCAAGGCGCAGGGTGGAGGCGGTGGCGTGGAGACACG
+CTGGCGCGGTGCCTCGCGGCTGCTGCGCTCGATGGTCAGCTGGGTACCGGGCGTGGGCAG
+CCCCCGCCGGGACCTGCAGCGCTACGAGCGGCATATGCTGGTCGCCCGCTCGCGCGATGC
+GATGCGCAACCATCTGATCGGCCGTGCGGCGGTGAACCGGGTCCGCACCAGCGTGGTCGG
+TACCGGCCTGCTGTGCCGGCCCAGCGTGAATGCCCAGGCCCTGGGCCTGAGCGAGGACCA
+GGCCGATACCTTGAATGCGCAGCTGGAGCGTGAGTTCCGGCTGTGGTCGGAAGATCCGCG
+CGAGTGCGATGCCGAGGCCAGCAGCAATTTCCACCAGCTGCAGAGCCTGGCCCTGGTCAG
+TGCGCTGACCGGCGGCGATGTGTTCGTGACGACGCCCAGCATCGAGCGCGAGGGCGCGAT
+CTTTTCGACCCGGCTGCAGCTGATCGAAACGGACCGGGTCAGCAACCCGGACGGCATGCC
+GGACACCGACAACCTGATCGAGGGCGTGGCCTTCGACAACAACGGGGCACCGACGCACGT
+CTACGTGTGCAGCGGCTACCCCTACGAGCAGAAGATCCGGACCATGCTGACCTGGCAGAA
+GATCCCGGTGTTCGGTGCCGTCACGGGCCGGCGCCGGGTGCTGCAGATCTGGTGTGATCG
+GGATCGGCCTGGCCAGAAACGCGGCGCGCCGTATCTGGCACCGGTGCTGGAGCCTTTGCA
+GAAGCTGGAGCGCTACAGCTCGGCCGAGCTGATGGCGGCGGTGGTCAGCGCGATGTTCAC
+GGTGTTCATCAAGAAGACGCCGGAAGCCGATCCCGCCAGTCTGGTCCAGAACCCGCTGGT
+GTCGATGGGCGGCCATGACGAGGCAGACATTCCGGTGCCGATCCCGGACGAGCCGGGCAC
+GGTGGAGCTGGGCGAGGGCGCGGTGGTTGATCTGGCCCCGGGCGAAGAGCCCGCGGTGGT
+CAACCCGGCCCGACCCAATGCGCAATTTGATCCGTTCTTCATGGCGATCGCCAAGGAGAT
+CGGCGCGGCGCTGGAGCAGCCGGTCGAAGAGATCCTGATGCACTACAGCTCGAGCTACAG
+CGCGGCACGTGCCGCGATGTTGCAGGCCTGGCGTTATTACGAGATGCGCCGGTGGTGGCT
+GGTCTGCGATTTCTGCCAGCCGGCCTATGAGCTGTTTATCGATGAGGCGGTCGCACGCGG
+CCGTATTCATCTGCCGGGCTATGCCGATCCGGCCCAGCGCCGGGCCTATACGCGGGCCAT
+CTGGATCGGCCCTGCACGGGGTGCGATCGATGAGCTCAAGGAAGCACGGGCGGCGCAGGC
+GCGCATCGATGCCGGCGTCAGCACGGAAACCATGGAGACCATGGCGATGAGCGGCGAGTC
+GTGGGAGGAAGTGATCCAGCAGCGGGGCCGCGAGATGGAGCGCCGTCGCCAGCTGGGCCT
+GATCCCGCCGACACCGAAACAAGCCCCGGTCCTGCAGGAGCAAGAGTGATGATCAACCTG
+GCCGACATGGCTGCGGCGCGGCCGTGGCTGATGATGCCGCAGTCGCTGGAGCGGCTTCTG
+GCGATTGCCGACCGGCAGCTGGAACCGCAGGCGCTGGAGACACGCCCCGGCGATGAGCTG
+CGCAATACCCGCACGACCAGCGTGCGTGATGGCGTGGCCATCGTGCCGGTGACCGGCCCG
+ATCTTCCGCTACGCCAATCTGATGACCCGGATCTGCGGCGCCACCAGCACCCAGGTGCTG
+GCGACCGATATCCAGGCCGCGCTGGATGACCCGAGTGTGCGAGCCATCGTGCTGGATATC
+GATTCGCCCGGCGGCGAGGCCAACGGCATCAACGAGCTGGCCGAGATGATCTTCGCGGCC
+CGCGGGCAGAAGCCGATCGTGTCCTATGTCGGCGGTACCGGCGCCAGTGCCGGTTACTGG
+ATCGCCAGCGCGGCCGACGAGATCGTGGCCGACGAGACGGCCGTCCTCGGCAGCATCGGC
+GTGGTGCTCGAGGTGATGCTGGCCGACGATGCGCCTGGCAAGCGCCGGCTGCAGATCGTC
+AGCCAGAACGCGCCGAACAAGCGGCCCGACCTCAAGACCGAGGAAGGGCAGGCCAAGGTC
+GGCGACATGATCAACAGCATGGCCAGGGTCTTCGAGGCCAAGGTCGCGCGCAACCGCGGC
+GTGGCCCTGGATCAGGTCGGGCCGATGGGTGACCACGGTGGTGTGCGCATCGGCGCCGAT
+GCTGTGGCCGCCGGCCTGGCCGATCGGCTGGGCTCGCTTGAATCTGTGGTGGCCGAGTTG
+AGCCAGCGCAGACCCTCTCCTTTCCAAAACACTCGGAGGTCCCCCATGGGGCACAAAGTC
+AGCAGCACCGAAGAGCTGCAGCAAGCCATCAGCGCGGGTGTGGATCCCGCCACCATCGAA
+CTGATTCCCGCCGCGGCGCAGGATGATCCGGCGCTGGCCCAGCAGGCGGCCGCCGCCGAG
+CGTGCACGCATCCAGGGCATCAACGCCTTGGCGCGGCCCGGTTTCGAGAAGGAGGTCGCT
+GCGGCGATCGAGAGCGGGATGCCGGTGGCCGAAGCGGCCCTGTCGATCCTGACCGCCGCC
+GGCGAGCGCGGCATCACCCTGGAAGGCATCGCCGCTGATGCCACCCATGCCCGTGGCGCT
+GCCCCGGGCGAGCAGGCCACGGCCGCACGGGAGTTCAACCCTCGTGCGATCTGGAGCAGC
+CGTAAAGGAGCGCAGTGATGACCACTCTGACCATGAATCCCCGCACCGGCGAGTTCCTGC
+TCAGCGAAGCCATGGGCACGCGCTCGCGTGACCAGGTGTCCCTGGCGGCCACCGCCGCGT
+ATATCCCGGCCGGTACCGTCATGGCCAAGGCCACCGATGGGACCTGGGCGCCGTATGCCG
+ATCCGGTGGCCGCGGCCGCCGGAACCAGCACCGGCACCACGTCGGGCACGACGGATACCA
+CGGGTACCGAGACCACCACGGCGGCCACGACGCCTTCCGAGGTCGGCGTGCTGTATCGCG
+GCGCGCAGATCAACACCGATACCCAGCCGGCGGTGATGGTGACCCGCGATGCCGAACTGG
+ATCAGGTCCTGCTGATCGGCTTGACCGACACGGCCAGCAGCCTGCTGGCCGCCCAGGGCC
+TGATCCTGCGTTAAGCGCACACCTCATCACCTCTACACACAAAGCCGCCTTCGGGCGGTT
+TTTTTATGGGACACATGCATGGCGACCCTCGATATTTTCAATGACAGCGCGTTTGGGCTG
+ACCTCCCTGACTGCGGCGATCAATCAGAACCCGGAAGGCCAGGCGTCTCCGGACATGCTC
+GATGCCCTCTTCTCTGAAGATGGCGTGACCACCACCAGCGTGTTCATCGATCGTCAAAAC
+GATTCGCTGGACCTTGTGCCTGCCGCCGAGCGCGGTGCACCGGCCAGCCCGACCCGATCG
+CCGAAGCGCGACGGTATCGACTTCCGCACCATTCACCTGCCGACTGACGGCGTGGTGCTG
+GCCGATGAAGTCCAGAACATCCGAGCCTTCGGACGTGAGAGCGAGCTGGAGCAGGTGCAA
+GGCTTTGTCGACAAGCGCCTGCTCAAGATGCGCCAGCGGCTGACCGCAACGATCCGTTAC
+CACCGCATGGGCGCGGTCGCCGGTCAGATCTACGATGCCGACGGCAAGACCTTGCTGTAC
+GACCTGTTCAAGCAGTTCGGCATCAAGCAGCAGGTCCAGGCCTTGGGGCTGGCGACTTCG
+ACCAGTGGCATTCTGCAGAAGATCGTCGCGGCTCAGCGCATGGCCGAGGATGTGATCGCC
+GGCGCTGCTCCGATCACCGGCTGGCAGGCGGTCTGCGGCCGTGGGTTCATGGATGCGATG
+ACGGCCAACGAGGACATTCGTCAGTCCTTCCAGCGCATCAACGAGGGCACCTTCCTGGTG
+AACAACTACCGCGGCGGCTTCCCCTATGCCGGCGTGATGTGGAAGGAGTACTACGGCAAG
+TTGGGCAGCACCGAGTTCATCGACACCAACTCGGCGTATCTGATCCCGACCGGGGTGCCC
+GATCTGCTGATTACCCGCTTCGCGCCGGCAAATCATATCGATGTGGTCAATACCACCGGC
+GTGCCGTATTACGCCAGTCTGGAGATGATGAAGCATGGCGCGGGTGTGGATCTGTTGGCG
+CAGTCCAATGCCCTGAACATCTGCACCCGCCCGCGGGCGATCATCAAGCTGACCGCCTGA
+TGTTCCGGGACCTGGTCAGCCAGATGGACGACCAGGTCTTTCCGGCCCTGGGCGATCCGG
+CGGTGCACAAGGGCGAGACGATCCTCGGGATGTTCGATGCGCCGTGGCTGGAGCCTGAGT
+TCGGGCGTCAGCAGACGGCGCTGCGATCACCGGTGTTTGTGGTGCGTGACGCGGTGGCGG
+CGGCCATCGCACCGGGCGATACCCTCGATCTGCAGATTGAGGGCATCGATGCCGGCCTCT
+ACACGGTGACCAAGCTGGAGCCTGATGGCACGGGCTTGATCACCCTGGTACTGAGGCGCG
+CCAAATGATCGAGCTGAAATTCTCGCTGGCTGATGCCCGCAAGCTCGAGCAGTTTCGGCA
+GGCCGCCCCGAAAGAGGCGGCCGATGCCCAGCGCCGGGCCATCAACAAGACCCTGCGCTG
+GCTGCGCACGCACATGTCACGGGCCATCAGCCGGCGTGATCGCATTGCGGTGACGGCGGT
+GCGTCAGCGCCTGTCGGCCTATGCGATCCGCCCCGGCGGCAAGCAGGGCAAGCTCTGGCT
+GGGTCTGGATCCGTTGGAGGCCTCGCGGTTGGGCAAGGTGCGCCAGACGGCGACTGGTGT
+CTCGGTCGCAGGTCGGCGCTTTCGGGGCGCCTTCTACCAGAAGGTCTATGGCGGCAAGCC
+GGACGTCTGGATCCGCACCCACAGTAAGCATTTCAGCACCTCGGCTTATCCCGGGGTGGC
+CATGGGCGGCCCTGCCATCGATGAAGGCATGTCCGGCCGCTTTCCGGTGGCCAAGGTCAA
+GGTCAGCATCGAGGACGTGCGCGAGGAGTTCGAGCAGTGGGTGGACCGTGCTGCCGAGCG
+ACTGGCGGTCGTGCTGCAGCAGGAAATGCGCTACGCGATGATGAAGGCGATACAGCGATG
+AGCAACGACGAAAGTGCCGGCGACATCCAGTCGGTCGATCTACCCGCTGTCAGCACGGCG
+ATCGCCTCGACCTTGAGCACACTGTTCCCGGCCTTCGTGTCGGTGCAGGCCATGCCGGAT
+CAGGGCGAGATCATGGATCTGCCGGTACCGGCCGTGTTTATTGACCTGGAACAGATCGAG
+CCGGCGCCCGATCCCGGCACGGGGCAGTCCGCCGTGCGCTGTAGATTCTGCGCCTATCTG
+CTGATCGGCCCGGAATGCCAAGGCCATACCCGGCTGCTGGGCAGCATGGTGACGGCAATG
+ATTGCGGCGCTGCGCGAGCAGTGCTGGGGCGTCTCGGCTGAACCGGCCGAGTTCGTGGAG
+GCGATGCCAGATGGCAGCCGGCCCGAGCTGGACAATCTTGTGGTCTGGTCGGTGCGCTGG
+GATCAGGTGATCTATCTGGGCGAAGCCAGCTGGGACTGGGCGGACAGCACCGGCTTGACC
+CTGCTGGTTGGGATCTCGCCCGAGGTCGGGCCTGAGTATATCCAGGACTATTTCGATCCA
+AAGGAGCGGCTCGATGAGCTATCCACTGGCCGAACATGACCGGATGATCGCGGCCATGCT
+GCTGCCTTGCGTGGTGGAGGCGGTCGATCCGGTCCAGCAGCGGATCAAGGTCAGCAACGG
+CGACTGGATCAGCCCCTGGGTGCGCTGGCACAGCGGTGCGGCCGGCGCGGTGCAGATCTG
+GCGCGTGCCCAGCGTGGGCGAGCCGGGTGTGCTACTCAGCCCCAGCGGCACGGTGGCGGC
+CGGGACCTTCGTGCCAGGCCTTTTGAGTGCGCAATGGCCGAACAGCGAGAGCTCGGCCGA
+TGTGACCTCCATCCAATGGCCGGACGGTACCCGTATCGCCTATGACGCCGCCAGTGGCGC
+GCTCACGGCGGCGCTGCCCAAGGGGCAGCTCAGTGCATCGGTGGGGCAGGTATCAGCCGT
+GCTGAGCGAGCAGAGCGCCGTCCTCACGGCACCCAACATCAAACTTGCGGGTACGGTCGA
+GATCGAGGGCGATCTGACCGTGTCCGGTACGGCCCAGGCCGCGAGCTTGTCCAGCCAGGG
+CGGGATTGACGCGAAGGGCAACATCCAAGCTGCCGGCACGGTGCACGGCAGCAACCTCTG
+AGAGAGAAGCCATGGCAACGACCACTGATTCGGGCGCGACCACCGCGGCCGCGGATACGG
+CCGCAACGACGGCCGCCAATACCTCGAGCACCAGCACGACTGCGTCCGCTACCGCGGCAA
+CGCCCGCAACCAGCAGCACGGCGAGCACGACCGCCACCCGCACCACCGGTACAAGCTCCG
+CCACGGCGACCACCGTGACGCCTGCGGCGCCGACCCTGCCGGTGACCTTCAAGGATTTGC
+AGTATCTGAGCCGGGTGCTGATCCTCGATGACGGGCGCACCTTGCAGGTCAGCCGTTCCA
+AGGTGACGGCCTACGATGCGGCCGCCTATGCGTTTCTGGCCTCGCGTGTGGACTTCGCCA
+AGTCATGATCGTCGGGATGAGCCGCACCACGGGCCAGCCGGTGCATGGTGTGGCCTATCT
+CGTGCAATGCATCGAAGACGTGCTGACCACGCCGCTGGGCAGCCGCCGGATGCGTCCCGA
+GTACGGCTCATCCATCCGCCAGATGGTCGATCTGCCCATGAACGAGGGCTGGAAAAGCGC
+CGTGCAGGCCGAGACCGTGCGGGCGCTGTCCCGCTGGATCCCGACCTTCAAACTTTCCTC
+CGCCCAGGTGGTGTCCGTGCTCAATGGCACGATCAGCTTCACCGTGAAGGGGCAGTACCT
+GGGTGACAACGTCACCCTGCAGGTGAGTGCATGAGCCTGATCGATCTTTCCCAGCTGCCG
+GTACCCGACGTGGTCGAGACGTTGGCCTACGAGGATATTTTCCAGGCCCTGCTGACCGAC
+CTGATGGCGGCTGCCGGTGACAGCTGGACCTCGGCGATGGAAACCGACCCGGTGATGAAG
+CTGATGGAGGTCTGCGCCTATCGCGAGCTGATGCTGCGGGCCCGGGTTAACGATGCGGTG
+AAGGGCTGTTTTCTCTCCACGGCAACTGGTTCGGATCTCGACAATCTGGCGGCGTTCTTC
+CAGGTCGAGCGGGAGACAGTCATGCCGGCCGATGCCAGCACCGGCACCGCGGCGGTGATG
+GAGAGCGACGATGCCCTGCGGGTGCGCGTCGGCCTGGCACCATCATCGTTCTCGGTAGCC
+GGGCCGGAAGAGGCCTACGAGTACTGGGCCCGCACCGCTTCGACGCACATCGTCGATGCC
+AAGGCGACCAGCCCCAATCCCGGCGAGGTGGTGGTGGCCGTGCTGGCTGACAGCGCGGAT
+GGCACGGCCTCGGACGATATCGTGGCCGCCGTGCAGGCGATCCTGTCTGATGACGATGTG
+CGGCCCATGACCGATCAGGTCACGGTGCAGTCAGCCGCGATCGTGGGCTTCGCGGTTGCG
+GCGACCTTGCCGACGTACTCAGGGCCGGATCCTTCGGTGGCGCTCAGTGCGGCTGCGGAT
+GGCCTCAACACCTACCTGGCCAGCGCCAAGAAGATCGGCGTGTCCGTCACGCGGGCGGGC
+ATCATCGCCGCCCTGAAGGTGGCGGGTATCCAGAACGTGATCCTGACCGAGCCGGCCGAA
+GATGTCGCGATCAGCGATACCCAGGCCGGCAACTGCACGGGCATCACTCTGACCCCGGGG
+ACGACCGTTGACTAGCCTGCTACCACCCAACCGCACCAGCTTCGAGGCGGCGCTGGAAGT
+GCCGCAGGAGCGGGTCGATGCCATCCCGACGCCACTGGCTTCGCTCTGGAACCCCGACAC
+GGTGCCCTCGGCGCTGCTGCCGTGGCTGGCCTGGTCGCTGTCGCTGGAGAGCTGGCAGTC
+GTACTGGTCCGATACCGTCAAGCGCAACCGAGTCCGGCAGGCGATCACCATCGCCCGTCA
+TCGCGGTACTGCCGGTGCCGTGAAGGCAGCGGTGGAAGCCTTTGGTGGCTATGTGTCCAT
+TCGGGAGTGGTGGGAAACCACCCCGAAGGGCACGCCGCACACCTTCGCCTTGCTGCTCAC
+GCTCTCCGGCGCCGATGGCAACGTGGCCACCGCCGAGTACGTCGACGATGTGATCGAGGC
+GGTCCGCCAGGCGAAGCCGCTGCGCTCGCATTTCACCTTCACGCAGGGCATCAACGCGAC
+GGGTTCAGTCGGCGTGATCGCCGCGGCCCGCCCGCTGGCCTATGCGCATCTGCAATTTGA
+TGGAGCTTCCTGATGGGTTTGACAGTCACCATCACTGACGCCGGCCGCGCGGCGCTGCGC
+AACGCCGCCGGCAACGGCACCAATGCGGTCACGATCGCTGCGGTCGGACTCAGTTCGCAA
+GCCTTCACGCCCGGCGCGGCCATTCCGGCCGAGATCAAGCGGCTGACCACGATTTCCGGC
+GGCGCCACGGCGGCTGATACCATCCACGTCACCGTGCTGGACTCCGGCGATGACGATTAC
+TCAGTGTACGGTTTCGCGCTGTACCTCAGCGATGGCACGCTGTTCGCCTCCTATGGGCAA
+TCCACGGTGATCGTGGAAAAGTCCGCCCAGGCCATGATGCAGCTGGCGCTGGATGTCCGC
+TTTGTCGATGTCGCGGCCAGCAGCATCAGCTTCGGCGATGCCAATTTCATGAACCCGGCG
+GCGACTGAGGACACGCTGGGCGTGGTCAAGCTGGCCAGTGCCGATGATGCGACGTCCGGC
+ACGGACAATCAGAAAGCGATCACGCCGCAGGTGCTTTCCGGGCTGCTGACGCCGAAGATC
+AACAATCTGCAGAGCCAGCTGAATACGGCGGTGATGACGATCCTGCCGGCGGATGACACC
+GTCAACACCCGGATCAATCTCTTCGCGGTGAACGATGCGACAGGCCTGCCGTTTGTGGCT
+GATGCCAAGGGCATCACACGCCAGCTGGCGACGGTGTCCTGGTCCTCGAACCTTGTCGGC
+CAGGAGGCCACAGCGCGGCAGAGCGCAGATCAGAACCTGCAGAATCAGGTCAATGTGAGG
+ATCCCAAGTAATCCCGGCACGGGGTTTCAGTCCATCACCAACCTGACATTGTCAGCAACG
+GGGCAGCCCATCTTTGTCGGCTCCGGCGGAGGGACGACCCAGGGCATCACCACCTTCAGC
+GATGCGCAGACCAATCAGGTTCTGCAGATCGGCTACCAGTACAAGGGGGATTACCTCTCG
+ATCAATGTCGGTGGCTCGTGGGTCTATGGCGCGACCCAGAGCTGGGTGAACAACCAGATT
+GCTGTCGAGACAAAGCGAGCATCCGGTGTCGAATCGGGTCTGCAAACCCAGCTCAACGGC
+GCTGCGATGACGCTGACGGTGGCCGATGATGGCACCAATCAGCGTGCGGCACTGGTAGCC
+ATCAACAAGGCCTGGAATCTCCCGTTCATCACCTCAGCCCAGAATGTGGGCTATCACCTG
+GTGCGGACCGAGCCGGGTGCGGGGTTTCAGGCGGTCACCAATTTCTCGCTCAATGCCGCG
+GGCCAGCCCATCTTCGTGGGCTCCGGTGGTGGCACGACCCAGGGCATCACAACCTTCAAT
+GATGCGCAGACCAACCAGGTGCTGCAGATCGGTTACCAGTACAAGGGCGACTATCTTTCC
+ATCAACGTGGGCGGATCGTGGGTCTACGGCGCGACGCAGAACTGGGTCACTGGCAACTTC
+GCCGGTCAGCAGGTCGACACGAATACCTTCGGTGTCTCCAAGATCGGGGTGAGCAAGCAG
+GTCGGCGCCGGGATCCAGATGCTGTGGACCTATGGCACGGACGGAGTAGGGCGCTGGTGC
+CCGATTTCCGCACCGGGTAATGGCTTCTATTTCGCCACCAACCTGACGATGGGGGCCGAT
+GGGTCGCTCTATGCCTTGTCCTCGAAAGATGGTGCGACCAACGGCTATGCACCAAGCTCC
+TACGGCACCATCGCCGGGGGCTACTACGTCCGCATCGGAAACATACTGATCCAGGCGTTT
+TCAGCAGGCGTGCTCAGTGCAGGCGATTCGATTGCATTTCCGATTGCCTTTTCAGCCGCG
+CCAGTGGTGTCCACGACCGTCGACAACAACCGGGACGGCGCCAATCGTCCGGTCGCCATC
+AATCCGACGGTCGGGACAGTGACTGCATCGGGTTTCAAGATCAACATCGCCGCCATCTCG
+GGGGCGAACCAGCCGGCAGGTACCGGCCAGGTGTGGGTATTTGCCATGGGGCCTGCATAA
+ATGACTGACAACACCGACGAGACGGCACCGGTGGCCACCGCAGCTGCCGTGGACATGGCG
+ACCGATGCGACATCGAATGTCGAGACGCAATGGCCTGCCCGCTACTACGCCAGCTATGAC
+ACGTCCGCCACCGGGCCCACCGAGGTCTCCGGCTGGTATGACGTGTGGGGCATGTCCAGC
+ACGGCGAATGTGCCTGCGGCTGCGGATATGCTTGCGCTTACGGTCGAGCAATGGGCTGCT
+CGGCTTCCGTATGGGCAGGGCGTGCATGAGGGGGCCATTGTGGCCTACACGCCATCCAGC
+ACCGTCACTCTGGCGGATCAGGCTGGATTCGCCTACCCGGCAGCCGTCGCGACGGTACAG
+AGTGAGTACGGCGTCCTCAACGAGCCAACACCCGATGACTGGGTGACCTATTTGAAGGCG
+CTGAAGGCCATCCGGGACGGCACCGACACCACCAGCACGGCGCTACCGGCTGCACCCGGT
+AGCTGAGCCCTAGCAGGCCACATTTCACCGATTTAGATGCCCGCTGATGCGGGCTTTTTC
+ATGCCTGGAGCTTCTATGCCTTCCACCAGTTTCTTTCATGGCGTCACGACCTCGATCGTG
+ACCAACGGCGTGCGCACCATCTCGGTGCCCAGCTCGTCGATCATCGGCCTCGTCGATACC
+TTCACCCCGGGCGCCGGCGCATCGGCCAGTGCCGATACCCCGACCCTGATCACCTCGCTG
+ACCGATGCGGCGGCGGCCTTCGGCTCGGCGTCCTCGATCTACAAAAGCCTGCAGCAGATC
+TACAACGTCGCCCAGCCGGTGATCGTGGCAGTGGGTGTCAACGCGGCCGCAGGCTCCACC
+ACGAGCACCAGCGGCACGACCACCACCGATGCCAATGCGCTGACCTCGGCGATCATCGGC
+GGCGAAACCACGGCCGGCGCGCGTACCGGCCTGCAGGCGCTGCTGGATGGCCAGTCGGTG
+CTCGGCTACCGGCCGCGCTTGGTCATCGCCCCGGGTCAGTCCGCCAATCAGGCGGTGGCC
+ACCGCGATGGATACCCTGGCCGGGCGCCTGCAGGCCATCGGCATCATCGATGGTCCCAAC
+ACCACTGATGACGATGCCACCGCCTACGCCGCGAACTTCGGCAGCAAGCGACTCTTCATG
+GCCGACCCCTATGTGCAGGTTTATGACACCACGAGCAGCAGCACGGTGGCGCTACCCAGC
+AGCCCGGTGATCGCAGGCATGTTTGCGGCGACCGATGCGCAGTATGGCTACTGGGCCTCG
+CCTTCGAACAAGGTCATTGCCGGCATCACCGGTACCGTGCGGCCGATCGAGTTCCTGGAC
+GGTGATCCGTCCTGCCGTGCGAACCTGCTCAACAACGCCAACATCACCACCATCATCCGC
+GAGAGCGGCTTCCGGGTGTGGGGTAACCGCACCCTGTCCAGCGATCCGCTGTGGCAGTTC
+GTGACCCGGGTCCGCACCGTGGACATGGTCATGGCGGCCGTGTTGGCCGGCACCCGTTGG
+GCGGTCGACCTGGGCATCACCAAGGCCTATGTCCACGAGGTCACCGAGTCGGTCAACGAC
+TTCATGCGTGACCAGAAGGCGCTGGGCGCGGTGATCGATTTCGAAGTCTATCCGGACCCG
+GATCTGAACACGGCGAGCGCGCTGGAGCAGGGCAAGATTTACTGGCGCATCCGCTTCACC
+GACGTGCCGCCGGCAGAAAACCCCAACTTCCTGATCGAGGTCACCGATCAGTGGATCACC
+GAGGTGCTGGACAGCACCACGACCTCGAGCAACTAAGGAGCCGGCATGATTCCGCAGACC
+CTCTTCAACACCAATCTCTTTGTCGCCGGCGTGTCCTTCGCCGGCGATGTGCCGACCCTG
+ACGCTGCCCCAGCTGCAGCTGGCCACCGACGATTACCGCGCCGGCGGCATGGACGGCACC
+ATCGACATGGACATGGGCCTCCAGAAGATGGAGGCCTCCTTCACCACCAATGGCGTGCGC
+GCGGAGTCGCTGAGCCTATTCGGCCTGGCCGACGGCAACGGCTTCTCGGGGACCTTCCGC
+GGCAGCTTCAAGGGGCAGGGCGGCGTGACTACCGCCGTGGTGGCCACCATCCGCGGCACC
+CTGAAAACCATCGACCCGGGTGACTGGTCGGCCGGTACCAAGGCCGAGATCAAGCATACC
+GTCGGCGTGACCTACTACAAGCTGCAGGTCGGCGGCACGGTGATCTACGAGATCGACCCG
+GTGAACGCGATCCGCATCATCAATGGAACCGACCAGCTGGCCAGCATGCGCAGTGACCTG
+GGCCTGTAAGGAGCCGACATGACCACGAAGAACGAAAAGAAGAACCCCTGGCTGGATGTG
+ACCGATTCCGGGGCCGTGATCCGCCTTCGCCGGGTGAGCGAGTGCAATGGCGTCAAGGTC
+GATCGGCTCTCGATGCGGGCCCCGACGGTGAAGGACGTGCGTACGGCACGCAAGGCTGCG
+GGCGAAGATTCGGCCGACCATGAGATGCAGTTGTTTGCCAGTCTGTGCGAGGTCAGCCTC
+AAGGATCTGGAGGGGCTGACGATGGTCGACTATGACCGTCTGCAGGCCGCCTATTTTCGC
+CTGGTGGCGGACGACGGGGCTGTCGCCGGCGACTGTGCATAAGCTCGCTGTGCAGTGTGT
+CCGACAGCTGGGCATCCAGCCGTCGGAAGTCGATCGCATGACGGTCACCGACATGCTCTG
+GTGGCTGCAGGAGTCGTAGGGAAGGACCATGGCCAGGAACATCAATATCGGCCTGGTCAT
+CGGCGGCGCGATCGCGTCGTCCATGGGCCGGGCCTTCGATGACGTGCAGTCGCGTATCGG
+GCGGCTGGAGAAGACCGGGCAGCGGGCCCGCGTGCTGCAGCGGATGATTGGGGAAACCCA
+GGAGCTGCAGCGGGACTATCAGCGTCTGGCCGCCACCGGTTCATCCATGGCGGATAGGGT
+GCAGCGCAAGCTGCACTCCAATCTCGATGCCTTGCGTGATCAGGGTGTGGCCGTGGCCAG
+CCTCGAGGCGGCCTACCGCAAATTGGGCGCGACCGCCCGGCGGGCGGAGTTTCGGGCGGT
+GGGCACCAGCAATTTACAGACGGCTCGTGATGGCCTGGGGCAGACCGTGGCCCAAGGCGT
+GCGCGTAGGCGCGACCGTGGCGGCACCGGCCTACACGGCGGCCAACTTTCAGGCCACGGT
+GCGCGATATCGCCATCAAGGCCGGGATCGCCAATACGGGGCAGGAGAGCCAGGTCGCCCG
+CGGCATCATCGCCAATGGGCAGGCCAACGGCATGGGGCGCGGCCAGATGGCTGACCTGGT
+CAATCAGCTGGTCAGTGCCGGCATGGATCTGAAGCAGGCAATGAGTTACGCGCCGGTGGC
+GGCGAAGTTCTCGGTGGGGCAAGGTGTGTCCGGCGAAGATACCGGCAAGCTGATCTCCGC
+CATCAGCCGCAATGCCAAGATCACCACGCCCGAAGGCATGGCCAAGGCTCTGAGCTCAAT
+CGCCTACCAAGGGCAGGCTGGTAACTTCGAGGCCGAAGACATGGCGCGCTGGTTCCCGGA
+TCTCTTGGCCCAGATGCAGAAGCTGGGGCTGACCGGTCAGGACTCGGTGAACCAGCTGGG
+TGCCATGCTGCAGGTTCAGCGCAACGTCGCCGGCACGTCGGACGAGGCCGGCAACAACCT
+GGTCAACTGGATCAGCAAGATCGGCGCGCAAGAGACGGTCCAGAACTACGCCAAGGCCGG
+CATCGATTATGCCGGCTCCATGCAGATGAACATGACCAAGCATGGCATGTCGGCCCTCGA
+GGCCAGTTTTGGCCTGGCTGAGAAATACATTGAGGCGGTCGATCCGAAGCGTGCGGCGGA
+CATGGCCAAGGGACTGGCCGGTATCGACAAGACCCTGGATCCCGACAAGGTGCGGGCGCA
+GGTGGAAGCGCTGAATCAGCAGATGCGCACGGGGCATATCTTCACCGATCTGCAGGTGAA
+TGCGGCGCTGACCGCCTACCTGCAGGGCCGCAAGCTTTATGGGCAGCTGAAGGCCGACTC
+AGCCAAGGCCGGCGATATCCTGGACAAGAATCTGGCCCAGCGCAGGCAGACCAGCCTGCA
+GATGTGGAAGGAGGCCGGCTATGCCTGGGACAACGCGCTCAACTCCATGGGGCAGGCGAT
+CGAACCGCTGACCGACAAGGTGGCCGGGTTCGCCAAGACGGCGGCGGCTGCGGTGGATAC
+CGTTGCGACCAAGGCGCCCGGGGTTGCAGAAGCCGTGCTTGGCGTTGTGGGCGGTCTGGT
+GGCCCTGAAGGCTGCGGCCGTGGCCTTTACCGCAGTGAAGGGGATCTACCAGATCGGACG
+CTCTGTGACGGGCAAGGGGTGGCAGCCGGAAAATCGCCCGGCAGGCTTGCCCACCGGCTC
+CGGCGGCCCGATGGATCGAGGTGGCGTGGTGCCCGTGCGGGTTATCAACTGGCCCAAGCA
+GTTTGGCCCATCAGATGAGCCGGGTGGAGCCGTGGCAGGGGCTGAAGGTAGCCCTAGTGC
+CGGTAGCCGGATCGGCAAGGCCATCGAGGCTGCCCGCGGAGCGGCGAAGTTTGGTGGCGC
+GCTGGCCCTGATCGACGGCGCCATCAATGCCGGCAGCGTCTTCGCCACTGCCAAAACGCG
+AGATGAGAAGTTCAGCGGCTATGGCGGCGCGGCCGGCGAGACGGTCGGGGCCACGGCGGG
+CGCTGCCGCCGGCGCGGCGCTGGGCTCGATCGTGCCCGTCGCCGGCACAGCCCTTGGCAC
+CATCGCCGGTAGCATCATTGGCGGCTGGGCCGGCAAAACCCTAGGCGAACTGGCCGGCAA
+GCATCTGGCCACGAGTACCGCGGAGCACGCCGATGACAAGTCCTCGGCGGATGCCGACAA
+AGGTGCGGCGAACTTGCCGCCGATCCAGGCGGGGCCGTTCTCGCCCACCATCCAGATCAA
+TATGCAGCAGCCCACCGGTGATCCGCGAGCCTGGGCCGAGCAGGTCTGGCCCATTCTTCA
+ACAGAAGCACGCTGATTACCTGGGCCGACTCCAGCGTGGCCAGCTCTTCGATGCGCCGAT
+GGTGTAACCCATGCCGTATATGCAAAACATGCAGGGGGCGCTGCAGTCCCTGGTCAGCTC
+CGGCGCGGCCGGTCAGCGCAGTCTGGACAGTATGCTGGGTCCGATGAATACCGGTACAGC
+CCAGCTGACCAGCTCGGTGTCCGAGATCAGCAGCCTGCCGTTCCTGTCCTCGGGCGATAG
+CCAGTCGATCCAGCGGGTGACGCGCCGCATCGTCCAGGCCCAGGCCATGGTCGGCAAGGT
+GATGAACACCTATACCCAGGTCAATCGGGTGGCTTCGGGTGTGGCGGCCTCCTATACGGC
+GCTGGGCGGCCAGGTCACGGCGGCCCGTAATGCGGTCAGCAAGATCATCGGCAAGGTCAA
+TCCCTCGCTGGCCAGCGCCATCTCCACATCGATCCTCAACCCCACCACCAGCCATGCCGC
+GGCGGTGAAGCCCTTTCCGCATCTGCTGATCATGCAGCCGGTCGTCTCGGGCGGCACGCC
+GTTCTATTTCAACCTGGACACGGCGGCTTTTGATTCGCTGCAGCGCCAGACCAGCTATGG
+CTGGCAGGGGCAGGAGCGTCTGGGTCGGCGGCCGGCGCAGCAGTTCGTCGGCATGGGCAC
+CGACAAGATCACCTTGTCCGGCGCGATCTATCCGCACTTCAAGGGCGGCCTGACACAGCT
+GGACAGCCTGCGCACCCTGGCCGGTACCGGCAAGCCCTACATCCTCACCACCGGTTACGG
+GCAAGTGCTGGGTACCTGGTGCCTGAGCTCGATCAGCGAACAGCAATCTGCGCTGCTGCA
+CGGCGGTATCCCCCGCAAGCAGGGCTTCACTTTGGAATTTGACCGCTATGGCGACGATCT
+ACAGAACCTGTGACGGCGACCTGCTGGACATGCTGTGCAACCAGCACTATGCCTCGCTGG
+ACGGAACCGTCGAGGCGGTACTGTCCGCCAATCCCGGTCTGGCCAGCCAGGCCCAGCCTT
+ATGCCGCCGGCATCCAGATCATGATGCCCGACATCGCCACGCCTGTTGAGACCGAGGTAC
+AGCTATGGGATTGAGCAACACACCGCTGGCTCGCGTCGAGGTGAATGGCAAGGACATCAC
+CGCCCTGATCACCGACCGGCTACTGATGATCCAGACCATCGACAAGGCCGGCATGGAGGC
+CGACCAGTTCGAGATACGGCTGGATGACCGGGACGGCAAGCTGTCGCTGCCGGCACGTGG
+CGCCGTGCTCAGCATCTACCTGGGCTATGCCGAGCAGAGCGTGGGCCTGGTCGGGCAGTA
+CACGGTCGACGAGATCGAATATGCCGGGCCGCCGGACAGCATTGTCCTGCGAGGCAAGTC
+GGCCAGTATGCTGGGTTCCGGAAAAAGCACTCGATCGGGCAGTTGGGACAATGTCCCGCT
+CGGCCAGATCGTGGCCGACGTGGCCGGCCGCAATGGCTGGACGCCGCTGTGCTCAGTGGC
+CGATGTGGTGGAGCGTGCCGACCAGGTCAAGGAGAGCGACTTCCACTTCATCACCCGCAT
+TGCTCGGCAGCATGGCTGCACCGCCAAGTTGGGGGGCGGCAAGCTGATCGTGGTGCCGCT
+AGGCATGGCCAGCAGCGGCAGCGGCAAGAGCATCTCGGCCATCACGCTGACGCGATCGGA
+CCTGACCCGCTTCCAGTTTCAGCTGGCCGACCGGTCAGCCATGGCCTCGGCCAAGGCCGG
+CTATCTCGATCCGGCCTCTGGCAAGCTTGCCATCGTCGACGTGACCAATCCCAATGTACC
+CGACGGGCTGCCCGGCGTGCATGTGGACCGACACCTGCACCCAAATCGTACAGCGGCCCA
+GCGCGCGGCCAAGGCACGCATCGATGCCTTCAACCAATCCACTGCCCTGGTGCGCCTAGA
+GATGCCGGGGCGCACCGAATTATTTGCCGAGCGCCCCATCAGCATCAACGGCCTGAAGAC
+CGGTATCGATGGCACCTATATTGCGAGCAGCGTGGAGCAGACGCTCACGCGGGCAGGTTG
+GAGCACGACGGTTGAGTGCAATGGTGGGAATGATGGGAAGGCAGCGGCATCTGGCAAGCG
+GAAGTCGGTGCTGAAGGTTATTGATGCTGGTGAGTAA
+>NC_017033.1|provirus_1557694_1600481
+TCACTCCCCCTCCTTGTATTCCGGGGCGGCGGCAAGAAATGTCCTCCAGATCGTTGACGG
+GAAGGCATTCGGGTTCTGCTCATCCAGATAGGCCGCCACGTCCATGGCCTCGGTGAGCTG
+CTCCGGCACCAACTTCCACCCCGGCGGCGCTTTGGTGAGGGCGGCCATGATGCAGGCAAA
+GTTCTCGGGCGTGTATCGGCCGCTGATCACCTCATCCTTGATCAGTCGATGAGATCCAGT
+CGATGCGCAAATATCCCGTGCCATCCTCTCCAGTACAGTCATGGCCATTACTCAACCCTC
+CCTGTTTCGGCAAATTGGGCCAGCATCCGAGATAGACGCCGCGCCTCTTCGCGGCCTACC
+TGCACACTTCTCGTCGGCCTGCAGGTGCTGCTACATACCAGCCAGCATCGGCCGCCGATC
+ATCTGCAGCTCGATCGACTCGGTGCGGTCGTTTTTGAGTCGGATCGCATCGGCCATTACT
+CAATCACCTCGCGCACGTGGATGCATTCGATACATCCGTTATCAGCCCCTTGATCAGCTG
+ACTCCTTGCTATCGCAGATATATATCTCGCCGTCAAAATACAGATTCACCCAAAACTCCC
+GCGGACTCACCTCCTCGCTGATGCGGTATTTATCACTTGCGTGAAGATGGTCATTTTTAC
+CCCACGCGCACCATGAATCAGACATCCAGCACTGAACTTTCTTCCCATTCTTCATTCCCT
+GAGCCGCGGCAATAACGCCATCCCACCCAGTCACGGGCTCGCCCCATTTGATTCGGTCAG
+TCATGCCATGTCCTCATCGGTGATGGTGTGTTCCTGGATGTTTTTGATGGCACCGAACAT
+CGCGGGCGGCAGTTCGGATAGCCAGGAACGCAGATGCTTGACCAGAGATTTGTGGTGCGG
+GTCGAGAAGTCCAGACTCGTAATCGTCTGCCAGAAAACCATGCTTCTCCTTCGCATGGTC
+GGCCATCGAAGAGATGACTTCCCATGAAAGGGTGCTTGCCGACAGGTGTTGGTATGGAGT
+GAACTGGCCAAACCTGATCACCGATCCAGCACTGAGATCGCCACCCGATGCATCTATGGC
+ATCCCCTATGGTGTCGTACAGGAATGCGTCGTCTCCGGGACGCTCCCACTTGATTTGTGG
+ATCACCCATCGTTCTGTTCCTCACATGCATTGCGCGTGGCCCACCCTACGGCTGCAGGTG
+GCATCGGCGCGATGGTGTAGATGGCCCGGATCGTGCCGGCGGCGGCCGGGCGAGCATCGG
+GCGGAAGTGTGTGCAGGCCGGCCAGCACCTGATTCAACATGATGCCGGCAGCGCGGGCCT
+GCTCGGCGGTGGATGCGACCTGGGCGAGTGAGCTGCACCAGGTTGGCGCGGCCGGCGTCG
+GTGTGGCCAGCGCGGCGGTCAGGAGTAGGACCGGGACCATCACCCCACCTCCGGCGCGTC
+AGGGATGGGCATGTAATGGCTGTAGTTGGTTGACACTATTTTGCCATTGGGTGACTTCCA
+GCATTCCTCGATGTCATCCCATCCCGCAATTGCTTTTGGATAGATGGCAGCCAGTGTTAG
+CTGACCTAGAATGACATTTCCAGCGGCCTTTTCTGACCCATCAATCGGCAGCCAGCGCGG
+GGCGTATTTGGCGTGGGCGGCTTTCCATGTCTGCCAGTTCAAATCAACCTCACGGCCCTC
+CAGAGCCATGTACCGCGCATGGTCCTCAAACTCATCTCGCAGTGCGATTACTTTCTGCTC
+AGTGCTCATGCGGCCATGGCCTCCATGTTGTGGGCCGGATCGAGGTTCGCCCGGGCGATG
+GCAGCCAGCGGTGGCGGGCTAACCGAATTTCCGCACATGCGCGTGCTGGCGCTGATGCTG
+AGGCGCCGGCCGTCAGCGGTGCGATCGATGATGTAATCCGCGGGAAACCCCTGGGCCCGG
+TAAAGCTCGGCCGGCTTGAGCATCCGCAGGCCGATATCCACGATGACGTAGGGCGTGCCC
+TTGATGGTTACAGTGACCAGGGCCAGCCGGTCGCGGGTGGTGACGGTGTCGAGCGGGTCG
+CGCAGATTTTCGCCGTGAGCCGTTCCGTAGTATTTGATCAGGAATGCCGCGACGCGCAGA
+GCTCCATCGGTCTGCTGCTGGCTGAGAGTGCATGTCACCAGTCGCTGCTGGCTTCCGCTC
+CCCACGATGGTCGGTGCCGGCTGTCGAAGGTCATTCCCGGCCCCGGTGTAGAAGCCGCCA
+TTGGCCTGCTCGAGAAAAGCAGATACGACACCGAGAGCATGTGCAGCACCTGCCGGTCGG
+GCTGCACCGGCACCGCTGGTGATCGTGGGCACCGGCTCAGTAATCGCAACCCCGGCCCGG
+ACATCGCCTCGGATCTTGATCAGGTGCGCCGATACGGCGGAGAAGTGCCCACCTTTGATG
+CCGCTGACCTGTGTCCGCAGTGGCTCATCAGCTGCAAATACTCGCTGGCTGCTGCCGTTG
+GCATGTTCGGTGAGGAATGCTGCTGCTGGGCCCGGAACAATGAACGGCTCATCTGTATCC
+AGCACGAATTTGTGGATGCCCTTGGCGATGCGCCGGCAGGTGGCATCTGCCAGAGGCCTT
+GCCCGCTCGAATATCGACGGGCAGGGTATCGACCAATCGATGCAGTCGGCGGCGGTGACG
+AGCGGCTGTAGGCCGAGACCGCGGCCATGGGTCTGTGCTGGCCAGACAATGGGCAGCCCA
+TCCCGGCGCGCGATGAGAAAAAGTCGCTCCCGGCTGGTGCCGGCACCGTAGTCGCTAGCG
+ATCAGGAGCCTGTGCTTGACCTGGTATCCCATGCCGCGCAGCTCATGAAGGAAGCGCGCC
+CAGGTCTGACCGGCTCGGCGCTTGTCGGGGACCAGGAATTGCTGGTCGACCGGGACACGC
+TCACCACGGAGGGCGACAGTGCCGTCCAGTTTCACAACGCGTCCGGTCGCCGGATCGCGC
+TTGGCAATCAGCGGACCCCAGCTGCGGATTTGTCGGACGTTCTCCAGCGAAATGATCCGC
+GGCGCACGCCCGGCACGCGCCAGGGCTCCGGCCCACTTCAGCACAACCCACGATAGCGAC
+CGGGTGGCCCGGCTTCGCGGTTGGCCGCCCTTTGCCTGGCTGAAATGGGTGCAGTCCGGG
+CTGGCATGGAACCAGCCGACCGGGCGGCCGGCGACTTCTCGCACTGGATCGGTCTGCCAG
+ACATCCTCGCGGTGATGAACGGTAAACGGGTGGTTTGCAGCATGCATGCCGATGGCGTCG
+GCATCATGGTTGATGGCGATATCCGGATCCCGCCCCAGCGCCTGCCGCAGGGCCTCACTG
+GCTCCGCCACCGCCGGCAAACAGGTCCACGATGATTTCTCCCGGGTGTAAGCGGCTGAGT
+CCGGAGGTGCGCGGGAAGTTGAAAGTAGGCTGTGCGCTCACGCCACCTCCCTCCGCTCAA
+CCCTGGCCCGAGGCTTCGGAGGAACCCGAATAAACCCCATCCAATGCTCCAGATCTGCCA
+TTGCCACGGCGAAGATGGAATGCTCTGGATGGCACTCGCCAGTGCCCGACGCATTACCCT
+GGTAGACCCCGACAAGTCGGCTGGAGTGCGTGACCAGAAACCCGTCATATCCGGCCTCGT
+GGTGCGTGACGAACGCAACGCCGCCGGTCTCGCCGATGTACACCGCGATCCGACCATGCT
+CCAGCGCGTTCTCGCTGATCTCTTTCGCTATGGCATCACTGCCACGGCTGATGTTTCCGA
+GTGATTTCATGCTTCGTCCTCAGGAGGCCATTTTCTCGGCCACTGTTTCGGGCAGATCCG
+GGAAGGTGCCCCACGGTTTGGAAAACTCAGGGGCCCATGGTGAATCGTGGCCGCAGGCCA
+TCTTTCCGCAGCGCATACGTGGCTCGCCGTCTCGGACAAGCACTCGCATACGGCCGGATC
+GCCAGTCGAACCAGCCGTCGAGCGGCTGGAACATGTCGATGGTTGGAAGGGAGTTGTCGG
+CGGCCATGGTCAGGCCGCCTTACGCTCGGTGAGGCCGAGGCCGACATCCTTGATCCGAGC
+CATCATGGCCCGCAGCATGTCGAGCACCTGGTCCTCGCGGTACAGCTTGGCTGCACGATC
+GGTGCCGGCCGGGTTGAACCCGAGCTGGGCCAGTCCGTCTGCAGTGATCGAAAGCGGTGC
+GATCAAGGCGCTGATGTCGCCCAGCTTGATGGTCTTGGCAGGGCCTGCCGGTTGGGCGAC
+TTTTTCGGCCTTGGCTGGGATCTCGTCCGTTGATGCCGCAAAGTGGCTCTGCGCCTGAGG
+TGCGGACTGGACGACTTTTGCAGATGCCGGCGGAGTCTCGTCCACCACCTTGGCCGCATC
+CTGCTCGCGGGACAGCTTCTCGGCTTCTTCCTTGCGGATCTGCTCGCGCTGCCGCTCCAG
+TCGCTCAGTCTCCTGCCGTTCGAACTCGCCGATACGAGCCGCGACCAAGTTGCGGAGATC
+TTCAGGCGACTTGGTTTGTGCCAGCATCACCCGATCGGCAAACAGTGACTGGTGCTGATG
+TTGATTTTTCAGGATGCTGACGTTGGCGCGGATGGTCTCGGCCCGCTGGCTCGCAGCGAT
+CTTGATGTCGGCCACGGCCGTACTGACTGCGTCCCGCATGCTGCTGATCGATCGCTTGCC
+TTTGATCGATGCGCCGATGCCCGCCAGGGTGGCCTGGTCCGGCCGCGGCGCAAATTCACC
+GAGGCTCACAACCAACTGCTCGTAGTGGGCCCTGGCTGCACGGATGCCGGCGTCGACGAT
+CTCCTGTCGGATGCTGATGTCGCGAGCCTTGACGCATTTTTCCAGATCAAGACGGATACG
+GCGGGCCTCTTCCTTCAGCTCATCCATCGCCCGGAAAACCGCCTCGACCGGCGCGGCATC
+GGCGAGCGCTGCAGACTTCACCGATTCCAGACGGTCTTCCACGCCCTTCGCCCAGGTGAT
+CGTCTTCCTGGCATCGGCGAAATCTTCATCAGTCTGCAGATCCCGGTTGATACCGCCGAA
+CACAGCCATGGCATGAGTCTTGAACGCATCCAGATTCGATGCGGTGACCATGCCGCTGAC
+AGCCACATGCAGGGCAGGGAGCTGATCCGGAGCCTTGCCGACCGGCGCCGGCGCCACTTC
+CTGCTCCGGCTGATAAGCGGAAATGTCCTGCTCGAGCTGGGCCCAGCCGGCAACAATGCG
+CGCACGCAGTGCGGGATCTGAGAGATACCAGCAACCACGGCTATCGGACTGGATGTCTCC
+ATCCCATGATGTCGCCATAAACAGAGCCCTGTCTGCGCCGGATACCATCATCTGCTGCTC
+TAGCTGGGCGCAGTAGATCTCCGGAAGCACGACCTCATCGCCATGAAGCGGGATATGGCC
+ATCAGCGACATGCTTGCGCGGAATCGCTGATCGCAATGCCATGTTGAGCGTTTTGTGCTC
+CCAGATGGCATCTTCCATCATCGTCAGGCCGTCGAAGCTGGCTGAAAGACGGCCCTCGGT
+GCCGACGCAGGGGAACAGATCTTCGCCAATGACTTGTTCGGCCAGAGGCCTGCACAGCGC
+CTCAATGCGATGGCCTTCATCAAAGATGCGTTGCAACTGCGGGGTAATCTCGCGCTCGAT
+ACCAGTAGCCAAGCGCTTGATCAGCTCGCTGCGCGACTCATAGGGCGACAGTCCGAGCAT
+GGCTGGTGCATCACTGGCATTGAAATGCGCAGAGCGGTGGGCATGCCATTCCGGCGTGCC
+CTGGGTGAGCTTTACGATCTTCATTCGACTACCTCCACCTCGGTGGTTTCGAGGTCACGG
+ATGGCGCCCAGCTGACCGGGCGTCAGGGTGTATTTGGTATGGACCATGGCGATGATCTCG
+TCGGCAGTTTTGCGACCACTCTGGATGCGCTCGGACCAGGTGCCAAAGTTCTTGTTGAAC
+TCGTCATCCGAGTAGGGCGGAAGCTCCTGTGCAATCCGCTCAGCCCGCTGCGTGGCGCTA
+TCGGCCTGCGATACCGTGATCCGCTCTGCCTCATCGTGGTCATAGATCCCAACGAATCCG
+AAAGCGATACGCGAGCACTGGATCATGGCCTTGTGGCGTAGCATCCGGCGCGGGTGGGAC
+TGCCAGGGGCCTGCGTTGTTTCGCTTGCACTCGGCCATCCACTCGGTGACGCGAATCGGG
+TGCGATCGATCCTTGCGGTAGATGATGCAGGTGCAGCTCTGGTCATCCTGTTCAAAGTTG
+ATGCCATCGAACTGGGCGTGACCGTTGATGATCCGCGACCATCCATCGACGCCAACCACC
+GGAACGATGCCGCCCTTGTCCGGGAAGGCATAGATCTCTTTCGTCCAGGGATTGAGGCCG
+TACTGGTTGGCAACCATGAGAAGGGCCGCCATCTGCTCGTCGGTCACGTTGCCCTTGAAC
+GCGGTGGACTTGAGCGTTTCGACCAGATCCTTGGAATCAACATTCAGCAGGCCGAGATTC
+TTGGCCAGGCCATCGACCTGGGTGGTGACGAGTGCGGACATAACAACTCCTGCCGGCCTG
+CGCCAGCACAATCAAAAGGGAAGGGGATTTGAATTAGTGGAAGCCGCGGGGCGGCTCTTG
+GTAATTTCGTTCGGCTCGTCCGTAAGCCCATGACCAAAGCAGCGCTTCGATCTCTCGCCA
+GTCCTTGGTGGCCACAGCCTTGGCCATGGCCTCACAGTCGTTGGGGCGGTCGAGTAGGGT
+GGCGAGAAACTCCTCGGCCACCTCAGGATCTGCTACGGACCGGATTGCTTCGCGCTCGAT
+GATCGATTCACGATCAGCTGCAGCATCGCCGGCGTGGTCGCATTGCCAGCCGGGAGGATC
+GGGGAGGTATAGGGTCATTCCTCCACCCCGTCATAATCGTCATCGACTTCCATCCAAGCC
+GAGTCGTCCTCGGCCTGGTTATCTGGATTTCCGGGATGGGTGCAGCTACCGCATGGCGGG
+GTCAAGTGGCACGAGCAATTGCCCCCGTCAAATTCGGAATCAAAATCGGCTCGCTCGGCT
+TCAGCCTCAGGCGTCAGTACACGCTTCATGCCGCCATCTCCTGCCTCGACCCAGCATCAT
+GCGCATCAGCCATCTCCGTCAGGCCTGCGATCAACTCGCGGATGCTACTCATCGGAATGC
+ATATGGACACAGCCATGTCGCAAGTGGTCCGATCAAACACAATCGCAGCCCGGCTAAATG
+CCGTCTCACCCCGGTAATGGATGTAGGTGGTCAAATTGCTCTCGCTGCCTATGACCTTCA
+TGCCACACCCCCGGCGATCAGTGGCCACTTCGGATGGATGGCCAGCATCAGGCCAAGGTC
+CGTCTGATTGAACCGGCCGAACCAGCGGCAGGCCGCCTTGCAGCGCTTCGTGTTGGATTT
+CATGACTTTCTCCAGGCACAAAAAAAGCCGGATGGCCGGCTGTTGGTTGATTAGATTTCG
+ACGGGCCTGCCGTCTTTCAGTGAGTACCAGACATTCGGCTTGATGCCATCCTTGCCGACA
+ACGCCTGCCCATACGTCGATGATTTCGTGGTCCTCGTTGCGCTCAACGAGGAATAGGGCA
+TTTCCGTCTGTGCCCATGACTTTCCCCTCATAACCCGAGGCCATGGCTGCTCCCCAGTCG
+CCGGTCGAGCTGGCTGCGCCCCAGTCGCCGGTCGAGCTGGCTGCGCCGTAGTCGCCGGTC
+GAGCTGGCTGCGCCGTAGTCGCCGGTCGAGCTGGCTGCGCCCCGGTTGCCGGTCGAGCTG
+GCTGCGCCCCGGTTGCCGGTCGAGCTGGCTGCGCCGTAGTCGCCGGTCGAGCTGGCTGCG
+CCGTAGTCGCCGGTCGAGCTGGCTGCGCCCTGGTAGCCGGTCGAGCTGGCTGCGCCGTAG
+TCGCCGGTCGAGCTGGCTGCGCCCCAGTCGCCGGTCGAGCTGGCTGCGCCGCGCTCATCC
+TTGGACTGATCGCCATCCGCTTTCTTTGCCCGACTGAACGTAAAATCGATGGCCGCCTTG
+ATGATGCCCGGCAATCCGATTTCAGCCTTGATTCCAATCTTCTCGCAGGCCAGCTTGTCG
+CTTTCCCGATCCACCTTCCCGGATGCCTCGATTACTGCGAAGCGTGCACCTGCGGGCGGG
+TAGTATCCAAACACATCGAGCGGATACTCGCAGCAGTGGAAGCCTTCGTTGCAGGCCTTC
+ACCTCGCCTTCGTGGACATACTCCTTGCCGACCTCATACTGAAAATCTCGGCACTTGAGA
+TCCTTGTCAAAGCCCTTGTAAGCCACGATCACTTCGTTTGCCATGAACTTTCCTCAAAAA
+AAAGCCAGCTCATGGCCGGCTTGAAAGTGGTAGATACGGCATGTGCCGCACCGATAGAGA
+ATGAGTGGCTGGGTATTGCGCCGGCCTCGCACGGCTCAACGCCATCCAGTGGCGGGGTAT
+TGCCGGCCTATCAGTGGCCGGGTCTTAAATCAAATCGACTTACCGCCAGGCAGCGCCCGA
+TTTGCAGGCAGATGATCGGCCCGCGTGGCGTTGTAGCGAATCTTCTCCATGGCCGCGCCG
+AACACGTCGAGGTGAAGGGCCCCAGCCAGATCGAGGATCCGGATCACCGCATCGGCCATC
+TCGACTTCCATACCCTTGCGCTCAGGCAGATGGTCGTCCATCAGATCCTTGCGGAACGCC
+TCCAGCGCCTCGCTGACTTCGGAATGCACAAGGGCCAGCTTGCCGGCGATGAAGTGCTTC
+CTTGCATCGGGATCGCGCCACGCCAAACTGTTCCACCAGCCGCCATCGACGGCCGCGCCG
+TGGCATAGCGACTGAAATGCCTGCAGAGACGACAGGCTCAAGCTGTGTGCTTGCATATTT
+GCGCTCCTCTGCGCGTTGAATTGTGATGGGGTCTGTCGGCCCGCTACGGCCACATTTTTC
+ACCAACAAGGAAGTCCGAGTGTTCAGCGCCTCGGTCAGCGCAACCTCAAATCCCATCACA
+ATGGCCCCTGCTACCAAGGGCCAAAGTCTCTGCCGATCCGTCACTTGGCTGAACATCCCT
+CAGATGCTTTGACCCGCCGTGACCGGCAGCTATTCGGTTGTGGAAGATCCCAGGCCGTGG
+GTCAGCGTTTCGCTGCGGCGCGGGTTGACTATACGAAACGCATACCAACGAGGCAATGCG
+AAACGCATAATTTATGGATGCGAATCGCATACTGTTCAGCGTCCATTTATCTAAATCTCA
+CCCCGTGAGACGCGCACAGGCCATCATTTCCCCACCAGGAGGAAACATGGCCAAAGAGAC
+GATTTACGTGGTGCAGACGTGGGTGGCGGGGAAACGCGGGCAGTTGATCGCCGATCCGCC
+GATACCGATGACGGCAGAGGATGCGGCTGTGCGCCGGGCCTACAGGCTGGAGGAGGATAA
+GGCCGCGGTCATGGTCTTTGCTCAGACGGCGGACTCAGAGACGGGCGACTATGATGATCC
+AAGGATCATCCTGCGGCTGGGGGAGGAGGTGGAGATGGGGTAGGGCATGAAAAACCCCGC
+CGGAGCGGGGTTAGTGATTTATCTTGGCCTGTACCGCGGGCTGCATGCCCGTTGTTGGCT
+GAGCGTATGCTGGAACTTGAATGATGATGGGGGCAGCTTGGGTCGCTGAGAGCGTCGATG
+GCGGCTTCCACAGGGTATTCATAGCAACCACCACTGCGACGAGTGTGCCAATGATTGTTA
+GCACCGTCGCAAGCATCCACCCCTTGATATCACTGCGCACACCTTCGATGTCTGCCTTGG
+TGGCCAAGGTAGGCAAGATGGTGTCTAGCCGTGTTTCAAGGGTGGTAAGGCGCTGTTCCA
+TACCTCCATCATGTGTTCCACCACCGCCATTTGCAAGTGCTGGGCCAATAGCTGCCGCTT
+GCAGCGGATCCATGGCGCCAGGAAGGTAAGTTACCTTAGGCATCGTCGGCGGCCTTCTTT
+TCTGGGTTTCTCCTTACCCACTGCGACACGACGAATAGGTCATGGCTCCTGATATATCCG
+CAATTACCACATCCAAGAGATATTATTGCCCTTCCTGCTACGCTCCCACCCAGTCGCTCT
+ACCATCCCACTATCTGGTCTTGGATTTTCTGCGAAAGGGATCATTGTGAATAGCCCAAAT
+CTATTTTCTGTTCCGATATAGAACCATGCTGACTCGCCGCAGCACGAGCAATTAGGGCTT
+AATGTTTTTTCTCCAAGAAATCTTCTGAAATCTTCCTCAGTTACAGATGTAACTGGCGGT
+GATAGTATTCTCGATTTACCATCGTTCATTCATTTGCCTTGACTGAGTTGCAATATATAA
+GTGAAATATCGATTCTTTTTTTGGATTGCACACCTCACTCCGCCAGCATCAGGCACTCGG
+ACCAGCGATTCACTTCGGTACAGCCTTTAATAGGGGCTTTAGGCTGTTTGCATTGGCCTT
+ACCCCAGGCTATCAGTGCGGCCTGCAGGCGGTCAGACATGTTGTTCATGTCTGCGATGCA
+TGACTTATCGTCTCCATGTCGACATAACGTGTTCTTCGGCTCTAGCTCGTCAAACTGGAT
+AGCCATTTCAGTTTGGATGATTCTTTCCAAGTTGATTGGTCCATGAAGGAAGGCGTCCAT
+TGCGATCTTTGCAAGTTCAGTAATCACTTCATCTTGCTGGACACAGGACCCCATCTCGAC
+GAACTCGACGCCCTTGCCGTGAACGATGCAAGCCATATCGATGCGGTCACCCGGTTTTGC
+CATCTCAAGGAACTTCGAGTCTCGGACGCTAATATATGCAGTTACCATCTGCATTTTAAT
+GATAAAATCATCATCACTAAATTTTTCAGCTCCTCCAAAGTATCCATTCACAAAAGTGTA
+CTTGTTTCGGTACTTGGCATCAGCGCCAATTGGATTCTGCATAAATTCAGTGGCGATAGT
+TAAATCGCGCGTGCTAGGAATGACTAGTTTTCGCCATAGTTCGGCATGTTCGCTTTTGCC
+ACCATGGACAAAAGTCAGAAGATCGTTAGAGAAAAAAATCCTTAAGAAGCGCTGCTGTAC
+TGCGTCTGGATGTATGGCCTCATCAATAGTCGCCGACCGTGCATTGGAAATAGTTGCAAA
+AAAGGCAAGCGCTGAAATAAATACAAGCGCGACGAGCCTCATCAGAGCTCGCCTATCACA
+CGCGCCTTGATCGTCTCGTACTCCGAGTCGCTGATCAGACCCTGGTCGAGCATCTCCTTG
+GCGTTCTTTAGTCGTGCCGCGGGATCGGGATCGGTCGCCGGTTGGCTTGATCCAAATCCA
+CCCTGAAATCCACCAGATTTCGCCCGCATCTCTTCCAGCTCACGATGCCGGCGCTTCTCG
+CGCCAGGACTGCTCCTGAGCCTGGGCCATTCGGTAAACCTCTTGGGCCTCAGCCTTCCTC
+AGCCCATCGATGCGGTATGTGACCACAACACCGCCGCTTGCCAGATCGGGCTGAGTGAGA
+TGCCGGATGATGACTGAGCTGCTGAAAATTCCGACCCGGATATTGGCATCTTTCACGTCC
+TGCCAGCGGATGTCAGTTGGCGTAAAGCCACCGAAAAGCCCGCGCGTCATACCGATAATA
+CGACCAGTGGTCGCTGCCAAAAGAGCTCTTCGATGGGTGATCGCAAATATGCGCCTCTGG
+ACAGTAGATGCCCTTACGGACTCACCCGGGACCAGCATGGATGTGATGTACGAGAAGGCC
+TTGGCCGGTACGCCCTCAAGGCCAAGGGTAGAGTCTGTGCGCATTACCTTTCCCCAATAA
+GCGGCCGGTCTAGGGCCGCATGCTCCTGATCATTGCCAGAATCGCCTGCTGCTGGGCTTC
+AGATAGGCCTCTCATTTCACGTGCTACAGATGCCGCAATTGGCTCCTCTACGAGCTCTGC
+ATTGCCTGCCATAGCATCCAAATCGGTCTCCAGCACATCCAGGAGCGCCCTCAGTTCGTC
+CACTTTCCACCTCGATCCGCGACTGCCATTGAACCATGCGGCCACCGTCTGATACGCAAC
+AGCGATACCGCGAGTGTTGAGCGCGTCCGTGATCTGCTCGATTGAAAGATTTAGGGCTTC
+CCGCCGAGCGCGGAGATTAGCAATGAACTGACTCAAATCCTGAGACTCCATATGGATGTT
+GTCAGGGTATCGCGAGCACTTGCGCGCAAAGTATGCGAATCGTATAGTTGCAACATATGC
+GAAACGAATACCTGCCCATGACCGAAAAAGAAGAGCTTTCCGCTTACGTCCGTGATGCGG
+GCGGCATCTCGTCTGCTGCGCGCAAGCTTGATATTCCATACCAGACACTCGCCGCGGTGA
+TGAATGGCAATCGAGGCATCGGACGGTCCCTGGCCAGCCGAATGGAAAAGGGTTCTGGTG
+GCGTCCTGAAGGCTTCGCGCCTTATTTGGATTGCCGCTGAGAAAAAGGAGGCTGCATGAA
+CGCCTCTCAGCGTCAGGTCTTGTCCTCAGTCCTCCGGCTCGCCGCCGGCCTCAATCCTCC
+TCAACAGGATTGTCCTTCTCCCACTGAATGCGCTCATCGAGGATCGCGGTGTACTCGCCG
+GTCATCTCGGTCACGAGATCAGAAATCCCGCGTGGAATTTGTCCGCACGAAGCAGCGATC
+GATGCAGTGGCAACAGCTTCAGACAAGCACTCATCAATCCGACGCCGGCAGTGCGGGGCG
+TCGCACGTATCCATCATCAGGGCCTTGATCACCGCGTCTTGCGCGAGTGACCGCGCATAG
+AGATCAAGAACCAACCTCTCCAGATTCAGCTTGGTATCCGACATGTACGAGAACCCTACT
+CATATCCGCGACAAAATCATCAAGGTTCGCCTGAACGCCGACGAGCGCAATCTCGTCGAC
+GCATTGGCCCGCATCAACAAGACCCAGCCCTCGGTCTTCCTGAGGGACCTGGTGATCCAG
+GGTCTTGCTGTCGTGACGAAGGATACCCCCAAGCAGAGCGCCGCCTGAAGGACCCTAAAT
+AGGCCCTCAGGAGGGCCCTCTAAATGACAGAAGACCTTCCCATCGACCTGACGCCTGCAC
+AGGCGGACAGGATCTCAGCGTTTGCGAAAGAACAGGGCCTGACCGTCGAACAGGCCGTTA
+CCAAGCTGGCCCGTGAAGCGATCAATGAGCGCTACGTGCTGCCCAAGAACCGGGGATCAG
+TTTTGCCCATAAGGGCCCTCAAAAGGGCCCCAAGAGGTCCCTCTCATGACTGATCGAGTC
+ATCCATACGCCTGCATCTCGCGCCACCGATCCTGTGTCGTCGCACGACGCAGAGATGCGC
+GTCACGCGCTCCGGCTCCAGGCACTCCAACCGCCTCGCTGTCGTCGAGGCTGTTCGCCGC
+TACAACGACGACATGACGTCTGCCGAGATTGCCCTGGCTGCGGGCCTTGATTACCACGAG
+GCTGCGCGCCGGCTGCCCGAGTGCGTGACAGCCGGCGATCTGAAGAAGGGTCCCATGCGC
+GTCTGTTCAGTGCGCGGGACTCTGGTCTGCTCGTGGGTGATGGCATGAGCATCGAGATGA
+TGAATGAGGTCAAGCCTCTAAAGATTGGCCCCACGCGAAAGGCCGTCATGATCTGGCTGG
+CCAACTGCGCCAATCATGACCGGAAATGCTGGCCCAAAATGAGCGACCTGGAGGATTGGA
+CGAACTACGGTCGGACGGCAATCATTGAGGCGATCAAGTCCCTCGAAAAAGACGGCTATT
+TGACCGTGGATCGATCGGGGCGGAACAACGTTTACACCATGAATCAGGTCCGCCAGACGG
+ACCAGTCCGTCTCCCGGACCAGTCCGTCTCCCGGACCTCAGAAGTCCGTCTCCCGGACCT
+CAGGAGTCCGCCAGGCGGACCCTAACAGTAATAAAACCAAAATAACAAACGAAGAGGAGA
+GAGTCGGGCGCATCCAGGCGACCTCGATCTCCTGTCCCGACGGCATCAGCGACGACCACT
+GGTCGATGTGGATCGCCCAGCTTCAGAGCGACGGCAAGGAATCAATCTCCCGCCTGCAGG
+CCGCCAAGCTCCAGGTCCTTCGCATCGTCCGTGATGGGGGCGACGCCGAGGCAGTCATCG
+AGGCCGCCGTGCTCCGCGGCTGGCGCGACCTGCAGGACATCCACGCCGAGATGAAAGCCA
+GGGCATCGGCCCGCAAAAACAATCACCAATCCAGCGCCGGCGATACGGCCGGTGGATCCA
+GCACCCGCACCGGAGTCAACTACCGTGGAAACCGCACATCAGGCCGCAAGCTCAGCGCTG
+TTGAACAGGTCGAGGCAGCCATTGCAGAAAACGAACGAGCACGAGCGGACGCTGCAGGCG
+CAGCATGCATCGCAGCCGAAGGCGCCGCAGACCATGGTCAATGCTTTTTGGGCGCGGATG
+GCGACGATGTTCGGGCATAGCTGGGTGAGCCAGTACGGCGCGAATCCTGCCGGGTTGGCG
+GGAGATACCTGGGGCACCGTTCTTGCTGGCCTGACTGGCGAGCAGATCGCCCAGGGCATG
+CGGGAGACGCTGGCACTGGGTTCCGATTGGCCGCCGAGCGCTCCGCGGTTCCGCGCCATG
+TGCATCGGCATCCCGTCGCTGGCCGCCACGCAGCACGCGATGCGTACCGGTGCCACCGAC
+CCGTTTACCCGGCAGGCCTGGACCTACATCGACTCGTTCCAGTTCCGCTCGGCCGATGCT
+GATCAGGCCGCTCGCATGATGCGTGACGCCCACGAGCTGACGGTGCGATTTGTGATGGAC
+GGCGGTGAGCTGCCCGCCGAGCCCGTCGCGGCGATTGCTGTAGACCCGGCGCCCGAGCAT
+GTGCCGGCCAGTCCGGATTTTGCACGGCAGAGGATCGAGGAGATCCAGCGTCAGCTGGGT
+GCGGGAGAGGTGGCATGATCGAGCGCATCTCCGACACGAACGATATGTCCAGCGCAGCTG
+AGGAAATGGCCCGGATCGCTGCAGCTCAGTTCCGTAAGCCCGAAGGTCCCGCAGCCACCG
+GCGAATGCCTCAACTGCGGCGAATCACTGCCGGATGGCCTGCGCTGGTGCGACACCGATT
+GCCGGCACGATTACGAGCGTCGGGAGGCGATGTCCGCATGAATATGGACGTTCTCATCTA
+CCGGATTCTGGCAGAAATGGGTCCGATGACGATCAGTCAGATATCGACGGAACTGTCCTG
+CAGCAACCGCAGTGTTCGCCAGCCTCTGGACCTTCTGGTTAATTCGGGGAAAGTATCGGC
+TACCCACTCGGTGAAGGGCGGATCTTACTGCGTCACCTATGAGGCCGTCGCATGACTGCC
+TTCGCCTGCGCCCATCACATCGCCCGCATCGGCCGGCTGCCCAGCGCCCAATGGCGTGCC
+GAGGTCAACCAGCTCCCCGCCGACTGCGGTCGCAACGATTGCACCACCCGGAACTGCCAG
+CGCGAAGTCCAATCGCGCCTTGAGATGCAGTGGAAGATCCGCCGAGCCAAGAGGAAAGCA
+GCATGACCCAGACATTCACCCTCAACGCCGGCGGGGTAGAGCGCGCCGATGTGATGGCCA
+GCGCTGTGCGGTTCATTGCCGGATTACCTGGATCCAAGAGCTGGAAGGTCGAGATCAAGG
+AGTCCCGCAAGGGCCGCACCCTCGACCAGAACGCAGCCCTGTGGGCCGTGGCCTATCCGC
+CGCTGCGCGAGGCCACCGGCCACAGTGTCGAGGATCTTCACGAGTATTTCTGCGGTGAGT
+ATTTCGGATGGACCGAGTACGAGGTGATGGGAAATCCCCGCAGCCGGCCGATCCGGACCA
+CGACGACCGGCGAGGATGGTAAGCGAGACCTGATCGACGCCCGGACTTTCAGTGACTTCT
+ACGCCACTGTGCAGCGCATTGCTGCCGGCATGGGAGTGATCATTCCGGATCCCGATCCGT
+TCCATGGGGACGCCGGGAGGTGGGCGGCATGAAGGTTTGTCCGATCAAGCCACGGATTGC
+CGCAATCTTTGGTCAGTGGATCTGTTTTTCTGACGACTGCGGAGGGCGAGGCTTAACGCC
+AAGGGATGCGTACATCGCGTGGTTTTTGAACTGGTCTCAAGGCGGCCAGAGGGCATTTCG
+ATGAGCGCACCCAAGATGACCAAAGCCCGCAAGCTGGCCAAGGGGCAGCCGTGCATGATC
+CGCATCCCCGGCATTTGCAATGGCAACCCTGAGACGACGGTGCTGGCTCACTACCGGCTT
+GCCGGCTATAGCGGCACCGGAATGAAGCCGCCGGACGAAATGGGGGCATGGGCCTGCTCG
+GCGTGTCATGACGTGGTGGATGGGCGGGTTCGACCAAAGTACTCATGGATTTCTGGTGGT
+GATGGCAGCCTCCTTTCCAGTGATCGATTCTCCAGTGGTGCGATCAAGCTCATGCATGCG
+GAGGGCGTCATGCGCACCCAACAGGCGATCAGGGAGATGGGCCGATGAGGGCGATCATGC
+TGCATATCGGGCTGGGCCTTGCGATGTTCGCGGCCATGCTCCCGGGCCATCCGGCGCTCA
+AGAGCATCTACCGGGCAGCGGCAGAACGGACGGAGGAGCAGATCCGGGCAGAGCAGAAGC
+GGGCCCGAAAGCTCGCACGGCCGGCGTGGAGGCAGTGATGGTCATGATGCCCATCAAGAC
+TGTATCGGTCCTCAACGGATCGCAGGGCAACTGGCGGCCGGCTGCCGCACGCCGACGCCG
+GCAGCGGTCGGATGCATTCGTGCTGTGCCCGCGGGCCAGCCTCCCATGCACCGTGACCAT
+GACGCGGCTATCGGCCGGCACGCTGGATGACGACAACCTGCGCAGTGCCCTGAAATCAGT
+CCGGGATGGCATTGCCGACCGGCTGGGAATTGATGATCGGGATCCGCGCGTGAGCTGGGC
+CTATGCCCAGGCGAAGTGCCCGCGGGGGAAATTCGGTGTTCGCGTTGAATTTGAATCAAA
+ACAGGGGATCTGACCATGGCGCATATCGGCAAACTACTGGGGCGGCTGAACCCCAAGACG
+CAGACCTTCACCGATGCCTCCGGCGGCGTTCCCGAACTCACCCCGCAGGATATCGCCGGG
+GCGCTGGCGTTCGTGCCGTCAGGCCTCGGTCGCGAGCTGCTGTGCCACGTCTGGTGGCCT
+GGAGGTGCTGAGCGCACCAGGGCGCAACTGGATGCGGCGATCATGGAGTTGCTGGCAAAA
+GAGTGGCGCCGCCGTGAGGACGCACAGCTGGACGCCATGCTGATGGTCGCAACACCCGAT
+GTTGGCCGCCGCCGGGCGCAGGATGCCTTTGCCCAGGCCCACAAGGAGCGCTGGCCGAGC
+TGGGGGAAGATGGAGCAGGGCATTCTGCAGCCGTCAGAGGTCTACGTGCGGATCAGGGAC
+GCCGTGCTTATGGAGCTGCGTGCAGGCTATTTTGGTGATGCTGACTCAGGCGCAGGCCGC
+GCATGGAGTGACCGTGATCGGGCTGAGATGATCGAGCGCTCGAATGTCACTTACAGCACC
+AACGGATGGAAGCGAGTCTACGAGTGGCTGCTTGATCACTGCGCGAATGAGGTCGGCATT
+GCTCAGAGACGATTCGGACGTGCAGCCGCTTAGACTGTTAGTGTGAAGCACTAACAGTTT
+TTGGGGTAAATTCCCTATCGTGACGAAAGCCCCGCCGGGCACTGGCGGGGCTTTGACTTC
+ATTAATCAGCTGTTGCGAAGATGGTTGAAGAGATCAAGTATTTCCCTTACTGATGATGCA
+GTGATGATGTTGTCCATGTCTAGATCATGAGGTGACGGGCCAATGACTGATTCGCCCTTG
+ATGTTCCACGAGCATCCCGTGTCGACTGCCTCGATATCTATCGACCCCGAGAATGTCTCG
+TCTTTGCTCGATGGGTTGTAGCCGTCAATGGTTCCGAACTTTCCAGATACGGTTCTGATG
+GGCATTTCAAATATCTTCACATAAGTCATTTTCACAATCTCTTTGATTTTCAAACGAAAT
+GAGCTTCGGATTCAGCCGTAGCTGTATTTATTGTAGCTAATCGGTGCTTTATGCCTCTTC
+CCCTGCCAATCGAGCCGCAGGTGGCACTGGCATCTGTCATCGACCCAGCCCTTGAACAGC
+TTCCCCGTGCCCTTGATAGCGATCAGGCCGCCGTTCTGCTGCTGGCGATTGCCATCCAAG
+AGTCGGGCCTGCGTACCCGTCAGCAATATGGCGGACCTGCACATGGCCTGTTCCAGTTCG
+AGACGGGCGGATGCAGCGCAGTACTGGGAAGCCCGCTCAGTCGGCCGCTGCTGTTGCCAG
+TCCTCACGCAGCATGGCGTGTCGGCCACTCCTCAGGCGATCTATCAGGCGCTGCTGACGG
+ACGACATCCTTGCCGCCAAGGTTGCGCGTTTGCTGCTGTGGACTGATCGCCGCGTATTGC
+CGGCCCTCGGCGACATCGAGGGCGCCTGGAAGTACTACTACCGCAACTGGCGGCCCGGCG
+GCCCACGGCCTGACCACTGGCAGGTCAATTACCGAATAGCGCTCACAGCGCTTGGGAATC
+ACACATGTCACTGAGCATCTTCGCATCCATCGGCGTGCGGGCATCTGCTGTCGTCGCTGG
+TTTTGCGGGGAGCGTGGTGCATATCGCAGTCACCGAGCAGATGACCCGGGCCCGTGCTTT
+GGCGGCCATTGTTGCCGGCACCGGCTGTGCCGCCTATCTGCCCGACTACCTGGTGCTGCA
+CTACCAGCTGCCGGCGCCCATGACCAACTCAATCGCGTTCGTCTGCGGCCTCTGCGGGCT
+ATCGGTCGCACTCCGGGTGCAGGCGATGATCACCAGCGCATTTCATGGAGGTAACTCCAA
+ATGATGCTCGCAACGATCAACATCCTGTCAGCCCTACTGGTGTTGGCCGTGTCCATCGAT
+GCGGCTCGGCGCCTGTCATTCCGCTGCCACCCGGTAGCCACTGGCGGTCATGTGTTGATG
+GCGATTGCCGAGATGGTGTGCATCTACCAGACCGCAGACCTTCGCAGCGTCCCTGCCTGG
+GTGGCAGTCATCAACCTGGTGCTGTCCTACATGGCCATGTCGTCATACCTGCACATCGAG
+CGCACAGGGAGGTTCGGCTGCAAATGAGCATCGCAACCATCATCGCAGTGCTCAATGGCA
+TCTGGACCCTTGGCAAGAACCTGATCGGCGCCTTCAAGAAGAAGCCGGCAGGGCAGGGCG
+CCGAGGATGCCGCCACTCAGGCAGTAGCTGCCACCAACACCGAATCGAGCGAGACGGCGA
+GCATCGCCCGCCAGTCGATCGCATCCGTCCAGGAGTCAGCCAATGCTGCGCGTACTGAGA
+ATGACCACCTTGCTGCTGATGCTGCTTCCGCTGGGAGCGTGCAAGACGCTGACCAAGTCG
+TCCAGCGAGCCATCGCCGCAGCAAACGCAAAACTTAATCCAGGTTCGGACCATCAAGCCG
+ACCGTCCTGTGTGATATGGGAGATCTCCAAAGTGACCCCCTCCCGAATTATCCAGCTCTG
+CCTGGAATGGTTCCGCTCGCCGCTGATAAAGCCCGCGACGTCTGGGCCATCGGCGTTGCC
+GGTCAGTACGGCCAGCTCGCCATCCGATACAACGCAATCCTTTCCTGTCTCGCCGGCTAT
+CGCCAGCGCGGCCTTATCAACTGACGAGGTTATCCCCATGTCGTTTTCCCTGTCCAAGAT
+CGGTGCCGATATCACCGAGGCCGTATCCGCCGCCGAGGCCGTGGGCGATGCGATCAAGGT
+CGTCTACAACTCCGTCGCCCCGCTGATGGACTCGGCTGAAAAGGCCTATGACGGCGTCAC
+CGATGCCGGCGGCACCAAGAAGGCTGCAGTGCTGGCGAGCGCCAAGGCCGTGGCCGAGGC
+CCTGGGGCAGGACTGGAAGAGCATCGAAGCCGGCGCATCGTCCCTGGTTGACGCCATCAA
+GGGCGCCTACAACGTGGCGAAGGACATCGTCGATCCGGCGAAGTCGACCACCGTCGCCAG
+CGCTGCGGCGTAAGGGGGTAGATCATGACTGTCAATGTCGTGACCGAAGACGGCACCATC
+GCCGAGGTTTCCACCCCGAGTGATGCCTCCGGCTCCTCCTATACCCTCCCGGCTGCCACC
+AGCTCTGCCCTGGGCGGTGTGAAGGAGGGCGCGTATGTCGCCAATGCCGGCGAGTCCACC
+GCAACGGATGTGGCTGGTGCGGTAACGTCCATCAATGCCGTCGCCACCCAACTCAATGCG
+CTGATCGCATCGCTCCAAGCATCGGGCGCATTGGCTGCGTCCAGCTGATCGAGGTAAGTC
+ATGGCCGGCAACAAATCAACGAAGCCGGCCACTGACTGGGAACGCATCGAGGCGGACTAC
+CGGGCTGGCGTGCTGTCGATCCGTGAGATCGCTGGCAATCATGGGATCACGGATACCGCC
+ATTCGTAAGCGGGCCAAGGCCCATGGCTGGGAAAGAGACCTTGCCGAGAAGATCCGGGCA
+AAGGCCGAGTCCAAGGTTCGCAGTGCAGAGGTTCGCACCCAGGTTCGCACTGAGGGCGCA
+ATCTCGGATCGCGAACTGATTGAGGCCAACGCCGAGGTCATCGCCAACGTCCGCATGGCC
+CACCGGCAGGATATTGGTCGGGCACGCAGTCTCGCCATGTCCCTGCTGGCTGAGCTGGAA
+TCGCAGACGCATCACCTCGATATGGTGGATCAGCTGCGCGACCTAGTGGTGAACAGCGAG
+GACGGCATCGACGCCAAGCTGCTGACGATGTTCCAGGCCGTGACCTCACTACCTGGTCGC
+ACCAAGACCATGAAGGAGCTGGCCGACTCGCTGCAGAAGCTCGTGACGCTGGAGCGTGAT
+GCCTATGGGCTGGCCGAGGCATCCAAGGTTGAGCTGACCGGCAAGAACGGTGAGCCGATC
+CAGCAGCAGGTATCCCATGTCGATGAGCGCACAGTCTCAGCGGTCATCGACCGACTCAAC
+GCCGAGTTCTGAGGGGCTTCCCCTCGATCTGGCGATCATCAAGCAGCTGTGCGAGCGGGA
+TCACCTGTTCTTCAGTCGCTACTTCTTCAAGCACCGGCAGGGCATCCGCTTCCTGCAGAA
+CTGGCACCACCGCCGGATCTGCTCGATTGTCGAGGATGTCATTGCTGGTCGACGTAAGAA
+CGTCGTCATCAACGTTCCGCCGGGCAGCTCCAAGACGGAGCTGGTGGCAATCAATCTCAT
+CGCCCGGGGGCTTGCCATCAATCCCCGGGCCCGGTTCCTGCATATCTCCTATTCGGATGA
+CCTCGCGCTGCTCAACAGCGAGACCGCCAAGGAGATCGTGCAGTCCGAGGAATACCAGGC
+GCTGTGGCCGCTCTCGATAGCCTCAGACGCCAAGAGCAAGAAGCGCTGGAACGTCGAGGC
+CAATGGCCAGAAGCTGGGTGGCGTCTATGCGGTTTCGCTCGGCGGCCAGATCACTGGCTT
+CCGTGCCGGCCACATGGCTCCCGGATGGCAGGGCGCGATCATCATCGATGACCCGCTCAA
+GGTCGAGGATGCGTACAGCAAGACGAACCGCGACAAGGCGAACCGTAAGCTGCTGTCCAC
+GGTGAAGAGCCGAAAGGCCAACCCGGACACGCCGATCATCATCATCATGCAGCGCCTGGC
+TGAGGAAGACCCCACCGGTTTCATCAAGTCCGGCAAGCTGCCGGGTGACTGGGAGTTCAT
+TGAGATCCCTGCGCTGATCGACGATGCATACATCGCCGCACTGCCCGAGGATCTGCAAGA
+CGCGGCGTCCCAGGGCGATGCAGATCAGGACGGCCGGCGCAGCTACTGGCCCTACAAGGA
+GCCACTGGACGATCTGCTGGCGATGGAACGGGCTGACCGGTTCGTGTTCACCGGCCAATA
+CATGCAGCGGCCCAGCCCGCTCGGCGGCGGCATCATCCAGTCGGCCAAATTTGGCCGGTA
+CAAGGTGGTCCCGGAGATGGTCAAGCGGGTCATCTTCGCCGATACGGCGCAGAAGACGGC
+CGAGCGCAACGACTACTCAGTGCTGGAATGCTGGGGTCTGGGCAAGAACGGACGCATCTA
+CCTGCTGGACCTTCTCCGCGGGAAATGGGAGGCGCCTGAGCTGAAGCGCAAAGCCATCGA
+CTTCTGGCACAAGCACCTTGCTGTGCCGGCGTGGCCGAATGGCGCCCTGGTCAAGCTGAT
+GGTCGAGGACAAGGCCTCGGGCACAGGCCTGATCCAGGACATCCGGGCATCGGGATTGAT
+CCCGGTCGAAGGTATCCAGCGCAACACCGACAAGCTGACCCGCGTCATGGACGTGGTCAG
+CTATATCGACTCTGGCTATGTGCACATCCCCGAGGATGCGCCATGGATCAGCGACTTCAC
+CGCCGAGTGTGACGCCTTCACGGCGGACAACACCCATGCACACGATGACCAGATCGACCC
+TATGGTCGATGCCATCAACAACCTGCTGGGCACCGGCAGGGTGCTGAGCGTCTGGGAGAA
+ACTGGGCCAATGAGCCGAGGCAAACGGAAAACGCCACGGCTCGGCACGTCAGCAATGGCG
+CGCGACTCGGCCAAGGCCAGGCGCAAGACCATCGACAGCTTCGAGAATTTCGAGGCTCGG
+GTCGGCATCCAGGCGGGCAACCTGTCGGGCGGTGCCGGCTACACGTTCGATTTCGTCTCG
+CGCAACCGCGTCGAGATGGAGGCCATGTACCGGTCCAGCTGGATCGTCGGCCAGGCCGTC
+GATGTGGTGGCCGAGGACATGACCAAGGCCGGTATCGAGCTTCGGTCTGAGCTGGACCCG
+AGCGACGAGGCCAAACTGCTCAAGGCCATGACCAAGATGCAGCTCTGGGATCAGCTCTGC
+GACACGCTCAAGTGGTCACGCCTCTACGGCGGCGCGGTCGGCGTGCTGATGATCGACGGC
+CAGGACATGAAGACGCCGCTGAACATCGACAGCATTGGTCGCGGCCAGTTCAAGGGCATC
+CTGCCGTTGGACCGTTGGCTGGTGCAGCCCTCGATGGAAGAGCTGATCACCGAGTACGGC
+CCCGACATCGGCAAGCCGAAGTTCTACGACGTGGTGGCCGACAGCATGGCCCTGCGCCGG
+CAGCGGATCCACTACACCCGCGTTGTGCGCTTCGATGGCGTGGATCTGCCGTACTGGCAG
+CGCATCAGCGAGAACCTGTGGGGGCAGTCTGTCGTCGAGCGCCTGTATGACCGCCTCGTG
+GCGTTCGACAGCACGACGCAGGGCGCGGCCCAGCTGGTCTACAAGGCCCACCTGCGAACC
+TACAAGGTCCCAGGCCTGCGCGAAGTGATTGCCATGGGCGGCCCTGCGCTTGAGGGCCTG
+CTCAAGCAGATCGACATGATCCGCCGGATGCAGACCAACGAGGGCATGACCCTCATGGAT
+GCTGCCGACGAGTACGAAGCCCACCAGTATTCGTTCTCCGGGATGGCTGACATCCTGCTG
+CAGTTCGGCCAGCAGCTTTCTGGCGCCCTGCAGATCCCACTGGTCCGCCTGTTCGGTCAG
+TCTCCGGCTGGACTGAACTCGACCGGCGAGTCGGACATGGAGATGTACCGCGATGGCATC
+CATCAGCGGCAGGAGCGCCGTTTGCGCACGCCGGTGGACACGATCCTGCGCATCCTCTGC
+CGGTCGGTGCTGGGCATCGACGCACCGGAAGAACTGGACTTCGACTTCGTCCATCTCAAG
+CAGATGACGGCCGAGGAAAAGGCCAATGTCTCGAAAACGACCACGGATGCCGTTATCCAG
+GCATTCGATGCCGGCCTCATCTCGCAGCGCGTGGCTCTGAAGGAGCTGCAGCAGTCGAGC
+GACGAGACCGGCATCTGGACCAACATCAGCGACGAGGATATCGAGGCGGCCGACGATGCG
+CCGCCCGATCCGGGAGAGGGCGACTTTGGCGAAGATCCATACCCGCCGGAGCCCGGTGCC
+GACCCGGAAGGCGGAGATCCAGTACGCGGCCAGTCTGAAACAGGTGGCGGCCGCGATCGG
+TCGATTGATCGCTGGCTTCGACCCTGGCGATATCGGCGCGCTGCCTGATATCCAGTCTCG
+GCTGGAGCAGTACAGCTACAACCTGGGCGACTGGGCGCATCGCACTGGCCTGAGGATGAT
+CAAGGACGTCAACGCCCGCGATCTGAAAGCATGGCGCGAGCACTCGCGGGACATGTCCCA
+CGCACTTCGCAAGGAGCTGCTGAATGCTCCGACCGGCCAGGCATTCCATCAACGGCTGAC
+GGAGCAGGTCCACCTGATCCAATCCCTGCCGCTGGACGCTGCGAGGCGCGTGCATCACCT
+GACGACCGAGGGCCTGACCAGCGGCCGGCGTGCTGAGGACATCGCCAAGGAGATTGCGAG
+ATCCGGCGAGGTGTCGGCATCGCGGGCGATCCTGATCGCTCGGACTGAGGTGTCCCGCAC
+GGCATCAGTTCTCAGTCAGGCCCGCGCCCAGCATGTCGGTTCGACGGAGTACATCTGGCG
+AACCTCGCAGGATGGCGACGTCCGGCCTGGGCATAGGGCCATGAACGGCACCGTTTGCAG
+ATGGGCAAGTCCGCCGGGCATCAATGAGGGCACGGCGAGCAAGCCGAGAATCATGCACCA
+CCACCCCGGCTGCATCTGGAATTGCAGGTGTTGGGCGGATGCGATTATTGCGGAGTGAGT
+TCATGGTCCGCATTCATCCTGACTGGAATTTGAGCCGTGATTGAGCAGACTGGACAGATT
+TAAAAAGCTGGCCAATAGACACCAGTTGATGGCATGATTCGGCGCCGCAATATTGCGGCG
+CAACATAGGCATGACATGGCTACCGAACTGAAAGAAGATCAGAAACTTAAAGCGGACATC
+ATGGCTAAGATTTTGGCAGGTGCCATCGATGGCGCGACCCTGTACGCCATCGGCCATGGG
+CGCGCAAACCTCAAGTACTCCGGGATGCTGAATGGAGCAAAGCGGATTGCCGATGACATT
+CTCAAGAAAGTCTGATCCATCGCATCAATGTAGAACGAAGGCCCGCACTGCGCGGGCCTT
+TTTTATGGGCCAAATATGCGCTTCTACACCATCCAAAAGCTCGGACCGAAGCGCGAGCTG
+ACGCCCGAGGGCTTCCTGCTGTGCCTGGACGTGCCGGTGGCGCGCACTGGCGAGATGATC
+TACGGCGAAGGCGAGGTGCCCATCGAGGGCAGCATGGACGGCCTGATCCGGATCACCCGG
+ACGCCGGACGAGGTATTCCGTGCCGAGACACTGGCCAGTTGCCAGGGCAAGCCCATCACG
+CTCGACCATCCTGACGAGTTCGTGACGCCTGAAACGTCGCGCACACTGTCCATGGGGTCG
+ATGCAGAACATCCGGCGCGGCACTGGAGCTGATGAGGACGTGATCCTCGCCGACCTGCTC
+ATTACCGACGCGGAGGCTATCAAGGCCGTGCAGGCCGATGGCATCGAAGAAGTCTCGCTC
+GGGTACGAAGCCGACTACGAGCAAACCGAACCCGGCCGCGGGGTGCAGCGGAACATCATC
+GTGAATCACTGCGCCCTGGTGCGGTACGGGCGTTGTGGCCCGCGCTGCGCGATTGGGGAC
+AAGGAGACTGTTATGGCCAAGCCCGTCAAGCCCGGGAAGAAGTTGTCGTTCAGCGACCGA
+CTGCGTCGCGCCTTCATGTCCAAGGACGCCGACGAGGCCGAGAAGCTGGCCCAGGAGGCC
+GAGGACGCAGCCGAAGAGGAAGAGCAGAAGCGGCGCGAGTCGGAAGATTCCGGCGACGAT
+GATGACGGCGACGATGGCAAGGGCCGGGACAAGGTCGGCGACACCGCCACGCTGAAGCTG
+CTGCGATCGATGGACAAGCGCCTCAAGTCGTTGGACGAGCGCATGTGCAAGATGGAGGAC
+GCCGAGGGTGATGGCGAAGAGGAGGAAGAGGCGGAGACCAACGACGCCGGCGACCTGACC
+AGTGCCGAGGCCTCCCCGAAGGTCGATCTGGATGGCGTGAAGATCTACACCGGTGACGCC
+CGCACTCAGTTCCGGCAGCGGCTGGAAATCGTATCGCCCGGCGCCAAGATGCCGACCTTC
+GATGCCAAGACCACTGATGCGGCCATTGCCGCGAAGCTCTGCGCGTGCCAGCGCCGCGCC
+CTGGGCGACGCCATGAAGACCGACGGCGGTCTGAGTGCAGTCTCCCCGTTCCTCGGCGGA
+CTCGATCCGCAGACCGCCCCGATGGCCGTAGTCAATGCCGCTTTCACCGGAGCTGCCGAG
+CTGCTGCGCCGTCGCAACAACGACCACGGCAGCATGAGTCTGCCCAACCAGCGGCAGATG
+CCCAACAGCATCGCCGACATCAACAAGCGCAGCCAGGCCTACTGGGCCGACCGCGCCGCA
+CGCTGAGGAGCTGACATGCCCGCCTATCTGTATCGCATGCCGTCGGGTATCCCCGGCGAC
+GTCACCCGCTATTCCGTTTCCACCATCGAGCCGGTCCCGACCGATTCGAGCAATCCGTTC
+GCCAGCTTCGGCATCCCCGGCAAGATCGTCAGTGGCAAGTTCGTGCCGCTGGCATCCGGC
+GACACCGATGTGAAGGTCTACGGCTTCCTGGTCCGCGCCTATCCGACCCAGAACGGCGTC
+AATCAGGCGCTGGGTGCCGATACCCCGCTGGCTGGCGTCATGGGCAATGTCCTGCGCCGC
+GGCTACATCGCCGTGAAGCTCAATGCCGGCGTGGCCGCGCTGGGCGCTCCGGTCTACGTC
+CGCGTCGGTGGCGCCACGGACTCCCAGCCCATTGGTGGTATCGAGGCCGCGGCCGACGCC
+ACGGCCGGCAACACCATCGAGCTGGCGAACTGCACCTTCATGTCCGCGGCTGATGCCTCG
+GGCAATGTCGAGATCGCCTACAACCTGTAATCCCCCACAAAGCCCTGCCAACGAAGCCCT
+GCCATCGAGCGGGGCTTTTTTGTGGGCGCGATTCGAGGAAACCCCCGATGAGTCAACTGA
+TTCTCCCGCGCTCGGTGAAGCGAGCGTATACCCGCGATGGCCTGCAGACCTTCGACAGCC
+GCACCATCGACAGCTCCGGTGCGTTCCTGGTCGGCGAGCTGGAGCGCCTGGACTACCGTC
+TGCACGAGCCGCTGGCCGCAGTGACCTGGTCGCGCGATATCCATCTGCGCGAAGATGTTT
+CGATGGCCGACGAGATGTCGAGCTTCACCAACAGTTCGTTCGCTGCCGCGGGCGGCATCT
+CCCCGACCGGCAAGGCCTGGGTCGGCAAGGACGCCAGCGCTATCACCGGTCTGGGCCTGG
+ACATCGGCAAGACCATGCATCCGCTGTCCCTGTGGGCCATGCAGATCGGCTGGACCATCC
+CGGAACTGGCCTCGGCGCAGCAGCTGGGCCGTCCGGTGGATCAGCAGAAGTTCGCCGGCA
+TGAATCTGAAACACCAGATGGACATCGACGAGCAGGTGTACATCGGCGATACCGTGCTGG
+GCCTGGAGGGCTTGGTGAACAGCTCGGCCGTCACCACCACCAACGTGGTCAACGGTGCGA
+GCGGATCGCCGCTGTGGTCGAGCAAAACCCCGAAGGAAATCCTTGCGGACTTCAATGCGA
+TTTTGAATCTTGCGTGGGAGGCATCCGCATATGCGGTGTGCCCGACCAAGGTGCTGATTG
+CTCCGGCGAAGTACTCGATCCTGACCCAGCCGGTTTCTGAGGCGGGCAATATTTCGATTC
+TCGAGTATGTTCGGACCAACTGCATATCGCACAACGTGAATGGGCGTCCGCTGGACATCC
+AGCCGGTGAAGTGGCTGGCGGGCCGCGGAACCAGCGGCACCGATCGCATGGTGGCCTACA
+CGCAGGAAATGGACCGCGTCCGCTTCCCGTATGTGCCACTGCAGCGCACCCCGCTGGAAT
+ACCGCGACCTGCGTCAGCTGGTGACCTACTTCGGTCGCCTGGGTGCTGTGGAGTTCGTGT
+ATCCCGAGACCCTGGCCTACGCCGACGGCTACTGAGGAGGTCGATATGCCGAGGATCAAC
+GTGACCAAGGCATTCACCTTCACCCATGCCACCGGGGAGCGACAGCGCTTCCCGGTGGGC
+TGTCACGAGGTCGCCGAGTCCGTGGCCGGGCACTGGTACGCGCATGAGCACAGTGAGCCT
+GTAGCTGATGCAGACGTGATCGAGACGGACACACCCGCAAAGCGGCCGCGCCGCACGAGG
+AAGGCCGATGGCTCTGACACTGACGCCTGACCAGTTCAGGGCGGACTTTCCAGCGCTGGC
+CAGCACCACGACATATCCCGATGCGCAGGTGAATTTCTGGATCGAGCTGGCAGCTATCCG
+GCTCAACGAGGCCCGCTGGGGCAAGCTCCTGCAGTACGGCGCCGAGCTGTTCGTGGCTCA
+TAACCTGGTGCTACAGGCGCGGGATATCGCGGATGTGGCGGCCGGCGGCGATCCGGGTGA
+GGTGACGGGCCCGGCGACAGCCAAGAGCGTGGACAAGGTGTCTGTGAGCTACGACGCCCA
+GTCCGTCGCACTGACCGACGGTGGCTTCTGGAACATGAGCAGCTACGGCATTCAGTTCCT
+GCAGCTCGCGCGCATGATTGGCACGGGCGGTATCCAGCTATGAGCATCAAGGTCAAGCAG
+GACAAGGTGAACGCCATCCTGCGGTCTCTGCAGGGCATGGAGCGAAAGCAGGTCATGATC
+GGCGTGCCGTCGGACACCTCGGACCGCCGAGACCCGACGCAGCCGATCACCAATGCCGAG
+ATCGCTTACATCCAAGACAACGGATCGCCGGCGAACAACATCCCGGCCCGGCCGTTCATG
+CGTCCCGGCATGGATGATGCAGCGCCCCGCGCGGCGGTGCAGATGAAGAAGGGCATCACC
+GGGGTGCTGGATGGCGATCACGCGGCTGGAGAAAGGGCTCTTGATGCTGCCGGCATCGTG
+GCATCCAGTGCGGTGAAGAACGTCATCAACTCGGGCAATTTCACGCCTCTTGCCGATTCC
+ACCCTGGCTGCCCGCGCGGCACGTGGACGCGCCGGCGCTCAGGAAGAGCTGGATCGACGC
+GATGCCGGCCATGCGCCGGGCACGGATCTGGCGAAACCCCTGGTCGATACCGGCCAGCTT
+CGCAACTCGATCACCTACGTCGTGCGATCCACGGAGGACTGATGCGCCTCAATGTTTCCC
+GTGTCCTGGCCTCGCGAGAGTTCCGGGACACTTCACTCGTCCGCATTCGCAACACGCAAA
+CCGTCGGAGACGATGGCCGTGCGGTGAATGCCCAGGACAGCACCCCATTTTCTGGCGTCG
+TGACGAACGATGCCGGGTACATCCTGCGCCGCTTCCCGGCGGCCAGCGTCGTGTCCGGAT
+CGATCCTGATCACGTCGCAAACCCCGCTCACGTCGGGCACCCCTGACCTGGATGCCGACA
+TCGTGCGGTGGCGCGGCCAGCAGTACACCGTGTCGATGGTCAATGACTATACGACCTACG
+GCCAGGGCTTCACCGAGGCCATCTGCAATCCGCTCAGCCTGCAGGGAGGTGCTGACAGTG
+GGTAATGACTCTTCCACTGGCGGATACCTGCTGCCGGCGGCGGGCGGCCCGAGCTTCGAT
+AACGCCCTGGATGACGCCATCCAGCAGGCAGTGGTCGGCATCACCGGATTACCGGGCAGC
+CTGGTCCGCCCACGTTGGCAGCCCATCGTGGCCAAGCAGCCGCCCATCGATACCGACTGG
+TGCGCCATCGGCGTCACCGATACCGAGCCCGACGACTATCCGGTGCAGGACCAAACTGCT
+ACCGGGTCGGATCTGATCGAGCACGAGACGATCACGGTGCTGGCCACCATGTACGGCCCG
+CAGGCGGCAGCCAATGCCAAGGCCCTGCGCAACGGTCTGTATGTCGCCCAGAACCGCGAG
+GGGCTGCTCGCAGCAGGCATCAACCTGACGGATACCGGCAAGCCGATAGCAGCCATGGAT
+TTCGTCAATCAGCAGTGGGTCCGGCGCTACGACCTGACCATCCGATTTCGTCGAAAGACG
+ATCCAGAACTACGACATCCTCACCATCCTCTCAGCCGAGGCGGATGTGCACACTGACACC
+CACGAGGGGTAAATCATGGCCCGAGGCCTTCCCGTATCACGCATCATCAATATGAGCGCG
+GTCATCGCATCCGTCGGCGTCGCGACCGCGGACTTCAACTCGCTGCTGATCGTCGGCGCA
+AGCTCGGTCATCAGTATCAACGAGCGCCTTCGCTCCTATGGCTCTCTGGCCGATGTTGCA
+TCGGATTTCGGCACCAGTGCGCCGGAATACCTGGCCGCTGCGCTCTATTTCGACCAGTCG
+CCCCGGCCGAGCGAGCTGTATATCGGCCGCTGGGCCAAGACGGCCAGTGCCGGCGAGCTG
+TCCGGCGGTGTCCTGAGCAGTGCCGCGCAGGCCATTGCCAACTTCACCGCCGTGTCTGCG
+GGCGGCATGGATATCACCATCGACGGCACGGCCAAATCGCTGAGTGCGATCGATCTGTCC
+GCCGTGACCAATCTCAACGGTGTCGCCTCGGCCGTCACCACGGCCCTGGCTGGCGTCGCC
+ACCGTGACCTGGAACTCGGCCACCAATCAGTTTCAGGTGGTCAGTGCTACCACCGGCGCC
+ACGTCTTCGGTGGGCTACGCCTCGGCCCCGTCCACGGGCACGGACATTTCGGCTCTGCTG
+GGCCTGACCTCGGGCGTAGCATCGGCACCATCCGACGGTATTGCTGCCGAGGAGCCGGTG
+GACGCGATCACCGCACTGGATGATGCCTCGGGCGGCTGGTACGCCTCGATGTTCGCCGAT
+ACCTCGCTGACCATCGCGCAGCACGAGGCAGTGGCCAGCTACATCCAGGGCGCGGCGCGC
+CTGCATCTGTACGGCATCACCACGCAGGACAGCCTGGTCCTAGACCCGACATCGACCACC
+GATATCGCCGCCGTGTTCGCCGGCCTAGCTCTGGATCGCACGGTCCTGCAGTATTCCAGC
+AGCTCGCCCTATGCGATTGCCTCGCTGTTCGGCCGTGCGCTGACCGTGGACTTCAACGCC
+AACAACACCGCGATCACCCTGAAGTTCAAGCAGGAGCCCGGCGTTACTGCCGAGACCCTG
+ACCACCACGCAGGCCAATGCGCTGGAGGCGAAGAACTGCAACGTGTTCGTGAACTACGCC
+AATGGTTCGGCGATTCTCGAGCAGGGCGTGATGAGCAGCGGCGCATTATTCGACGAGATC
+CAGGGTGTGGACTGGCTGCAGAACGCCATCCAGACCGCGATCTTCAATCTGCTGTACACG
+TCTACCACCAAGATCCCGCAGACCGATGCCGGTGTGGCCCAGATTTGCACCACCGTCGAG
+GACCAGTGCGAACAGGGCGTTTCCAATGGCCTGCTGGCCCAGGGTGTCTGGAATACGACC
+GGCTTCGGATCGCTGTCGGAAGGCCAGACCTTGACCAAGGGATACTACGTCTACGCCGCG
+ACCATCGCCAGCCAGTCCACGGCCGACCGCGCCGCGCGCAAGTCCCCGCCCATCCAGGTT
+GCCGCCAAGCTGGCCGGCGCCATCCATTCGGTCGATGTTTCGATCACCGTGAACCGCTGA
+GGTAGACCATGGCAACGTACAGTTTTCTCGATGTGGCTGCCACGATCACCGGTGTGGGCG
+GATCTTTCCGCCTCGGTAGTGGTGCGGGTGTGGCTGAGGAAGGCATCTCGTATGAGATGA
+CCGAAGACAAGAACAACATGACCGTGGGCGCCGATGGCCAGGTGCTGCACGCACTTCATG
+CCGGCAAGAGCGGTCACATCACCATCCGGCTTCTGAAGTCGTCGCCCCAGAATGCGAAGC
+TGCAGGCCATGTATGACGCCCAGTCGTTGTCCAGTGCCACCTGGGGCCAGAACGTCATCA
+GCATCCGCAACTCGGCCGTGGGCGACGTGATCGCCTGTACGCAGGTGGCATTCCGCCGCT
+CGCCGAGCAACACCTACGCGAAAGACCCGAACGTGATGGAGTGGCAGTTCGATGCCGGCC
+AGATCGACGCGATTCTTGGCGAATACTGAGGAATGACCGATGCAGTTTGAAATCAATGGT
+CGGCAGTACCAGTCGGCCAAGATGGACACCCGTAAGCAGTTCCACGTCGCCCGCCGGCTG
+GCCCCGGCCATGGGCTCGCTCGCCGCAGTCGCGGCCAGTGGGTCAGTCGACAATCTGTCG
+GTGCTGAGCCCGCTGGCATCGGCCATCGCCGCCATGCCGGATGCAGACTGCGATTTCGTG
+CTGGATGCCTGTCTGGCCGTGGTCAGCCTCAACCAGTCCGGATCGTGGGTACAGATCGCC
+AACCGATCCGGAGGCCTGCAGTTCGACGAGATCGAACTGGGCGAGATGCTCCAGATCGCG
+GCGAAGGTGATCCAGGAGAACCTGGGCGGTTTTTTGCCCGCAAAGGCCGCACCCCTACCG
+AAGCAGTAGGGTCGGCCGGCAGCACGGATGCATGGGCCTGCCTTCCCGACGGGGAGGACT
+GGCTCCTGCGCCCCGTCGTGCGAGGCATGTGCAAATTCGAGAGCCTGATCGATGGGACGC
+TCGACCTAGAGCACATCGCCCTGATGAATGACGCCCTCGATGTCGTCGACGAGAACCGGA
+TCAAAGCGGAGCGGAAACAGTCATGAGTTCGGAAGTCATCCGCGAATACCTGGTGTCGCT
+CGGCTACAAGATCGATGGCGACAGCGAGCGCCGATTTACTGAAAGCCTGGGTGGGGCCGC
+CAAAGATGTTGCGGCCCTGGGAGTCGCAATGGCGGCTGCAGCGACGGCATTTGTTGCTGG
+CGTGGCCAAGATTGCCGGCGGCATGGAGCAGCTGTATTTCGCTGCTCAGCGGACCCATGC
+GGCCGTGGAGAGCATTCAGGCCCTGCAGTACGCAGCCGCCCAGATGGGATCTAGCGCCGA
+GGGCGCTGCCGGCTCGCTTGAGTCGCTGGCGCGCTTCATGCGTGAGAACCCGAACGGGGA
+GAACTTTGTTCGTAGCCTGGGTGTATCTACCCGCGATGCGAATGGTCAGCTGCGCGACAC
+TACCCAGATCATGGGCGATCTCGGCAAGCGCTTGGCGGCCATGCCGTATTACCGCGCTCG
+GCAGTACGGATCGATGTTCGGGTTCGATGAGCGCACGCTCATGGCCCTGCGCTCGGGCAT
+GGGCCAGTTCACCGACCAGTATCAGCAGATGCTGCGCGTGGCCGGCCTCAATTCGACCCA
+GGCGGCAGCCGCGTCGCATGGCTTCATGGTGCAGCTGCGAGAGGTAGCGGCGTGGCTGCA
+GATCCTCTCCCAGAAGGTCTACACGGATCTGGCACAGGGTATTGGCGACGATATTGAGCG
+CTTCCGGGTCCGTTTTATTGCGGACTTCGGGAAAATCTCGCACATCATCGAGTCAGTGGT
+GAAAGGCATCCTGTGGGCAGTCGACATCGTGACCAGCTTCGGCATGGTGGTGGCCGATGC
+CATCGAGGGCGTGATTGGCTGGTTTCGTGGACTCGATGCCAATTCGAAGCATGTCGTGGA
+GGCCATTGGCGCGATTGCTGCGGCATGGGTAGCGCTTGACGCGGCCATGGATGCCAACCC
+GATCACGCTGGTGCTGATTCTGGCTGCGGCAGTCGCCTCCCTATGGAATGACTTCAAGGT
+CTGGAAGCGGGGCGGAACAAGCCTGATTGATTGGGGTAAATGGAAGCCAGAAATCGATCT
+GGCGAGCGCAGGCATTCACCTAATCACCCATGCCATCGAGGCATTGGTGCATATGTTCGA
+GCGGCTCTGGGAGCAGACGGCAAAGATTCGATCCGCTGGCCTTGGCGAGATTTCAAAGAT
+TGCCCATGGCATTTGGGATGCAACCTCAGGCGCGCGGCAATGGTCCCTTCAGGCCCAAAA
+ATCCATCTGGGATTGGGCCACCGGCGGATCCCCGCAGGTCGGGCAGGACGCGCAGGCACT
+CGCCGCTGCTGCTAACCAGATCCGCAATCAGGTCACAGGCCTGCCATACGAGCATGGCCG
+GCCGGGCCCAGATGCTCCACGAGGCATCCGCAACAACAATCCCTTGAACATCCGTCACGA
+TGGCGGATCGTTCAATGTGTATGCCACGCCGCTTGATGGATTGACAGCAATGGCTCACCA
+GTTTGCCCTGTACTACTCGGGCAGGTCCGCCACCGCGCACCATGAGGCACTGCACTCCAT
+TCGTCAGATCATTTCGACGTATGCACCGCCCAAGGATGGAAACGATACACAGGCCTACAT
+CGCCGACGTCTCCAAGCAGACCGGCATCGATCCAGATGCTGACCTGAATTTTGCTGACCC
+GGCGCGGATGCAGGCATTCATGCAGGCCGTGACGCGCCATGAGAACAGCGGACGGAACCC
+CTATGACAACAGCCTGTTCGCTCAGGCGATTGCCAATCAGGGGGCATACCCGAAGGCAGT
+GGGCGTGGATCGAGGATCAAGTTCCGCACAGCTTGCTGATGGCTTCAGAAAGCTCCACGA
+GCTTGTCAGCACCATTCACGGCAACCTGCAGGGACCACAGATTCAGGGTCTGCTTTCATC
+GCTGATGGATGCATACCCGGCGGCCCAGGCAGAGAACAATGGCGCATTGAGCGGAGCCAT
+TGCAGATGCGGTGCAGCAGATCCAGAAGCTTCAACCTGGTCAGCAGTTCGATGCTCGGGC
+ACTTACGCAGCGCCTCGACGATCTGTCGCGACCTCGGCTACTTGCAGACGCATCCACTGC
+GGCAGCGGCTGGCCAGCCTGCGGCGTCACGGTCAGGCAACACATTGAACCAGCAGACGAG
+CATTGTTGTGCATGGCGCCACCGATCCGCAGGCTACGGCCAAAGCGATTCAGGAGCGGCA
+GCAATCGGTGAATGAGCGGGTCACTCGGAACATGACGGCAGGGACGGCGACATGAGCATA
+CTCAGCACAGCCGCCGTTCTTGTCGGCGGAACCGTGGCGGATATCCTGATCACGCAGAAG
+CGGCGAATCGGGACCATTTATCCGCAGGTGACCATCTCGGAGCGCATGCACGACGAGCTG
+GCCATGACGGACAACCCCGTTGATTCGGGTGAGGTCGTCACCGATCACTCATACAAGTTA
+CCGGCCGAGCTGACCATGCGCTGCGGATGGAGTGAGAGCGGATCGCTGTTCAATGACATC
+GACAGTCTGCAGATCGCATCTACTCCCAACGAGGCCTATCAGAACCTGCTTTCCCTGCAG
+AAATCGCGCCTTCCGTTCACGGTCACGACCCCGCGTCGACAGTACAGCAACATGCTGATC
+CGATCCCTGGACGTGACCACGGATGCGGCGACGGCCAATGTACTGATGGTCGAGGTGGTC
+ATGCGCGAGGTGATCATTGTCAGTACCCAGCAAACGACCATGGCGGCAGCCGAGGATCAG
+GCCAGCCCGCAGGACACAGCGGCCACGACCAATGGCGGGGTGAAGCAGGCGACGGTGGTC
+ACCGATACATCGGTTTTGAGCAAGATCGGGACGGGTGTAGAAAGTGCATTCTCCGCGATT
+ACTGGAGGGTAAAGCATGGCAAAAACTGTCTACCAGATTCCCCTGGATGCGGCCGGCCAG
+ACCATCCAGGCGATGATCGGCTCAGTGCAGTATCAGCTCACCGTTCAGTGGCGGAAATTC
+TCCGGCTGGGTGCTAGATATTGCCTCTACGGATGGGACTGCCCTGGTGTCGGGCATTCCG
+CTTGTCACCGGCGTGGATCTTCTGGGCCAGTACGGATACCTGGGCATCGGGGGATCTCTG
+CTCATGGCTACCAATGCCGACCCCGATGCTGTGCCGACCTATGAAAACCTTGGCACGACT
+AGCAATCTGTATTTCGTGGTGACCTCATGAGCCAGTCTGCCCAGCAGTATTTGCGCCAGG
+TACAGCTGGTGATCGGCACCCCTGGCGGCCCGGCGGTCGATGTCTCTGATCTTCGCGTGA
+CCTTCAATGTGCGCTCAGCTTCGGTCGAGACCCTGAAGTCCGCGAACATCCGGATCTTCA
+ATTTGGCCAAGGCCACAGCATCGAAGGTGCTCAACGAGTTCACTTACATCGAGCTGCATG
+CCGGCTACCCGAACAACATGGGCATGATCTTCCGCGGCGAGATCTGTCAGGTGAAGTATG
+GCCGCGATCAGAACATGGTCGATACCGTCACCGAGATCCTGGCCCAGGATGCTGACACGG
+CTTACAACCAGGCGGTGATCAGCAAGACGCTGGCCAAGGGCTGGACCTACGAGGATCAGT
+TCAGTGCGCTGATGCGGCCTTTGAACAAGTACGGGGTCAATCCTGGCTTCTCGCCCAGCC
+GGACAAACAGCCCGGCACCGCGCGGAATCACCATGTACGGCATGGTCCGCGATGAGATGC
+GGATCCTCGCCGAGGATATGGATTGCGACTGGATCATGGAGGACGGGTTCCTGCACCTGA
+TTCCGTCCGATGGATATATCCCAGGCAACGTGCCGGTGATCAATGGCATGACGGGTATGG
+TGGGTATCCCAATGCAGACCATTGAGGGTATTGAGGTGCAGTGCCTGCTCAATCCCCTGG
+TAAAGGCGGGCGGGGCGGTGAAGCTCAACAATGCCGAGATCGCCAAGGCGGCCAACCGCG
+TGCCGACGAATACGACAAACGGCTTGCAGCCGGTTGCCGGCCTGGATGCGGATGGCTTCT
+ATCGCGTTGCGTGCGTGACGCATACGGGCGACACCAGGGGGCAGCAGTTTTACACCTACA
+TCATCGGCTATTCGGTCGATCCCAATCAGGCTCGGCCCATGGTTGGCCCCTCAGTTACAG
+CGGTGCCCGGATAATGCGACCCACTGAGCGATACGAGGACCACGAGCATGTCCTGCGCGA
+GATCATGCGCTCTGCGCGCACTCGGCAGTGGACATGCATGCCTGGGCATTTCGTCAGTTT
+CGATGCCGGCACATGCACCGCCGTCGTGCAGATTGGGATCGCTGGCCAGCAAACAAGTGA
+CGGCGTATCGACGGCCGTGCCGTATCCCGTGCTGGTCGATGTGCCGGTGCAGTTCCCGCG
+GGGTGGTGGTGCGGCGCTCACGTTCCCCATTGCCGAGGGAGATGAGTGCACGGTGCATAT
+CGTGGACCGTGCGATTGATGGCTGGTTTGAGTCCAGTGGCATCCAGCCGCCGAGCAGCAA
+GCGACGGCAGGCGATAAGCGATGCGTTTGCAGTCCCCGGCTCTCTGTCGAAGCCTGCTCG
+GCTGCAGAACATCAGCACGTCCACAGCGCAGCTGCGGAGTGTGGATGGCAAAACCTATGT
+TGATCTGGACCCGACTGGCCAAGTGGTGAAAATCACTGCGCCCGGCGGCCTGGTCATCGA
+TGCGCCCAGCGTCAAATGCAGTGGCACAGTCACAGCATCGGGCGAGATCACCGGCAACGG
+CATCCCACTGTCCACCCACACTCATTCAGGCGTGCAGTCAGGTTCAAGCAGTACCGGCAA
+GCCGCAGGGGTAGCCATGATTTACCGAAAACTCAACGCGGCTGGTGACTACTCGTTTGGC
+GCCGGCCCGGGCGACTTTTACCAAAACTCTCCAGAAGCGGTGGCTCAAGCTGTACTGACT
+CGACTTCGCCTACTGGTAGGCGAGTGGTTCCTTGATACAACTGCCGGCACACCCTGGGCT
+ACCCAGATACTTGGCAAGGGCACATCGTCGGTCTACGACAGCGTGATCAAGAATCGCATC
+CTCGGGACCACTGGCGTCCAATCCATCGACTGCTACAGCAGCTCGGTGTCCGACCGGAAG
+CTGTCAGTCACCGCAACCATCACCACCGCATACGGAAGCACGACCGTGGAGGCATCGCTT
+TGATCACGACCACGGCCCCGACAATCGGTGCTTCGGGCATCAGCGCGCCGACCTATGCCG
+AGATTCTCGCCTACCTACAGGCCAAGATGCAGGCTATCTATGGCGACGACATCTATATCG
+ACCCGGACAGTCAGGATGGCCAATTCATCGCCATTCAGGCGCTGGCGATCAGCGATGCGA
+ATGCTGCCGCGATACTGGCATACAACAGCCTGAGCCCATCCACTGCTCAGACCTCGGCCC
+TGTCGAACAATGTCAAAATCAATGGGCTTACCCGGAACGTGGCGAGCTATTCCACGGTCA
+CCGTCACATTGGTGGGCGTGGCCGGCACGATCATCTCTGGCGGCTCAGTGCAGGATGCAT
+CCGGCAATCTGTGGAGCCTTCCAAGCAAGGTTACGATTCCGTCATCCGGCACAGTCGACG
+TTACCGCTACCTGCCAGACCGAGGGCGCCACTGTGGCGGCCGCAGCGTCGCTCACGACTA
+TCGCCACGCCGACGCTTGGGTGGCAGTCGGTCAGTAATGCAGCGGCGGCGACATTGGGCG
+ATGCTGTCGAAACCGATGCCCAGCTCAGGGTTCGCCAGGCCAACTCGACCATGGCCCCCT
+CCCAGGGGCCGGCCGACGGCATTGTCGGCGCGATCTCCGATATCACCGGGGTGACTCGGG
+TCAAGCTCTACGACAACAACACCAGCGCCGCTGACAGTAATGGCATTCCGGCCTATACGC
+TTGCTCTGGTGGTGGAGGGTGGCGATGCCGAGGCCATTGCGAGCGCATTTGCCCTACGGA
+AAGCGCCGGGTGTGCCCACGGCTGGCACTACCACGCAGACTGTCACCACTCCGGGCGGGA
+GCAGTGTACCGATCAACTTCTATGCTCTGGGCGAGACGACCATCAGTGTTGCCATCGGTC
+TGAAGGCCGGGTCGGGATATAGCTCGGCCGTGGGCGAGCTTATTCAGGAGGCGGTAGCTG
+CTTGGATCAATGCTTTGGACATTGGCGCCCCGGTGGTCTGGAATCGCCTCTACATCCCGG
+CGAATTTGTCGGGAGATTCCAGCAGCAGCACCTACGAGATCACCAGCCTGGAGATCTGCA
+TCAGTGGGGGCGCGCTCGGCACCGCGGATCTTGCGATTCCATTCAACTCAGCGGCTTATT
+GCACCGCTGATGATGTGGTGCTGGCGGTGACCTCATGACGGCCTATGTCAGCGACTACAC
+CGGCCTGATTACCTCCGAGCACTCCGACAAGCCCAAATTCTCCGCAATGGTCCAGGCCAT
+GGCGCAGTGCTGGGTTGATTACCAGAACGCCATGCAGTCGCTCGTTGATGCGATGAATCT
+CGACACTGCGGTCGGCGATCAGCTGGATATTCTCGGCAGGTGGATCGGCATTACCCGCAA
+CATCAACGTGCCGATCGATGATCTGTATTTCGCCTACGACGATGTGGATGGCATCGGGCT
+GGATCTCGGTATCTGGAAGACCCCGAGCGACCCAACGACGGGTGTCACCCAGATGGATGA
+CACCACCTATCGCGCAATCCTGCGAGCAAAGGTAGGCGCAAATCACTGGGACGGCAGCAT
+CGAGGGACTGGAGCCCATCCTTAGCGCGATCTTCAGCCCAGGCGGAACGACGGCAAAAAT
+CGTCGACAACGGCGACATGACCTACAACGTCAATTTGACCGGGACCGAGCCGACCAAGCT
+GCTCATGACACTGGTCGATGCCGGATACATCCAGTGCGTTCCGGCCGGCATGGCCGTGAC
+CTACACCTACACCGCATAGGCCCGCGTTTGAAACGCGACCCCTGCAGGCGCCTTTGAGGC
+GCCTTTATTGTGCCCAGAGGAAACCATGGCCACACTTGAAAATGATTTCTTGCCGTTCGC
+CACCGGATCTGGCGCCAATGTCGACGACCAGGCGACTTATGCCGATGCAGCCACGACCGG
+GACGGGGTTTGTGTCTGGTATCGCAAAGTCCGCGTCTGTGAACAAGGTTCTACGTCAGGC
+CTCGACGATGGCTGCCGTGATTGCCGCCCTGATCGTGGATAAGGCCGCGGTAGCGGTTAC
+CGATGATGGGAGCGTGAGTACCATTGAGGCGAACCTGGTCACGGCCATTCAGGCTGTCGC
+GCAGGCGCTGGACTATCCAATCAGCCAGGTGACGGGTCTGCAGGCTGCGCTGAATGCGAA
+ACTGGATGCAACGGCAAATGCCGTGTCTGCGAGCAAGCTGGCCAACACCTTCAATCTCGC
+CCTGACGGGCACGGTGACTGGCGCAATCAACATTGATGGATCGCAGAACGTCTCGCTGTC
+GACATCCATTGCCGATGCAGCCCTCTCCGAAAGCATGGTGAACGGCCTGCCGGCAGCGCT
+GTCCACCATTACCAACACGCTTGCGTCGGCCAGTGATGGGACGAATCAGCGTGTAGCCCT
+GGTTGGCATCAACATCGCCTCTGACGCACCCTTCATGACGAGTGCGCAGAATGTCGCCTA
+TGACCTGATCAAGTCGGCGCCAGGAAGCGGATATTTGCATGCCCGCAACCTGACCCTGGA
+TGCCAGCGGCAACCTGATCGCTGTGGATAGCGCAGGCAATACGCGAGGTTACGGTACGAG
+CGCATGGGTTACCACGCAGATCAGCGCAGAGACCGCGCGCGCCGAGGCCGCCGAGTCCAC
+GCTGACCACCAATCTTGCCGCAGAGGTGACGCGAGCCAAGGGAGTGGAGGCCACGATCAC
+CAATACCATCGCCTCGGCTGATGACGGAACGAACTTGCGCATCGCGCTGGTCGGCATCAC
+CAAAGCGACTGGCGTTCCGTTCATGGCCAGTGCGCAGGGGGTGACGTACAGCCTGATCAA
+GTCGGCACCGGGGACCGGGTTTCTTTCGGCCCAGAATGTGACGCTGGATAGTTCCGGCAA
+TCTGATCATCGTCGATAGTGCTGGGAACACTCGCAATTATGGCACCATCAGCTGGGTTAA
+CACTCAGGTTGCGGCTGAAGCAGCCCGAGCCAAGGCGGTCGAGTCAACCCTGACTTCGAA
+CTTGGCGACAGAGACCGCGCGCGCCGAGGCCGCCGAGTCCACGCTGACCACCAATCTTGC
+CGCAGAGGTGACGCGAGCCAAGGGAGTGGAGGCCACGATCACCAATACCATCGCCTCGGC
+TGATGACGGAACGAACTTGCGCATCGCGCTGGTCGGCATCACCAAAGCGACTGGCGTTCC
+GTTCATGGCCAGTGCGCAGGGGGTGACGTACAGCCTGATCAAGTCGGCACCGGGGACCGG
+GTTTCTTTCGGCCCAGAATGTGACGCTGGATAGTTCCGGCAATCTGATCATCGTCGATAG
+TGCTGGGAACACTCGCAATTATGGGACTAGCTCCTACGGGACCATCTCCGGTGGCTACTA
+CATCCGCATCGGAAACATCCTGATCCAGGCGTTCTCTGCAGGGGTCCTGAATGCCGGTGA
+CTCAATTGCATTCCCTGTAGCTTTCTCTGCCGCGCCAGTGGTGTCCACGACCGTCGACAA
+CAACCGGGACGGCGCCAATCGTCCGGTCGCCATCAATCCGACGGTCGGGACAGTGACCGC
+GTCGGGTTTCAAGATCAACATCGCCGCCATCTCGGGGGCGAACCAGCCGGCCGGCACCGG
+CCAGGTGTGGGTATTTGCCATGGGTCCTGCATAAATGACTGACAACACCGAAGAGACGGC
+ACCGGTGGCCACCGCAGCTGCCGTGGACATGGCGACCGATGCGACATCGAATGTCGAGAC
+GCAATGGCCTGCCCGCTACTACGCCAGCTATGACACGTCCGCCACCGGTCCCACCGAGGT
+CACCGGCTGGTATGACGTGTGGGGCATGTCCAGCACGGCGAATGTGCCTGCTGCGGCCGA
+GATGCTTGCGCTTACGGCCGAGCAATGGGCTGCTCGGCTTCCGTATGGGCAGGGCGTGCA
+TGAGGGGACCATTGTGGCCTACACGCCTCCCAGCACCGTCACCCTGGCAGATCAGGCTGC
+CACAGCATACTCGGCGGCCGTCGCGACGGTGCAGAGTGAGTATGGCGTCCTCAATGAGCC
+GACGCCGGATGACTGGGTGACCTACCTGAAGGCGCTGAAAGCGATCCGGGATGGAGTCGA
+CACCACCAGCACGGCACTGCCGGCCGCGCCGGCGGCATGACGAAAAGCCCCATCCCTCGC
+GGGGTGGGGTCTTTTTTGTGCCTGAAGCTCGACCATGAAAAATCAATGACTTGCCAATTA
+TCCGCCGTAGTAGACAATCCATCGCTACGAGGTCAGATCATGAGCAGCATTGCATCCATC
+ATCCGAGAGCTTCGCATTGCGCGAAAAGAGCTGCGGCCAGCCGACTTTGTTTTTGGAGTG
+TTGATTCCAACGATGGTCTTGGCGCTAATCAGGAAGGGGTCAGTCCTTTACCATCTGATC
+ACGATAGCGGGACAGGTGGCGGCCGTCGCAGCCTGATCTTGATGGCCATGGATGGCCTAG
+TCCAGCTTCGATGCCATATCCGATGCCGACTCCCGGTAGTAGATCATCAGCGACTGCAGG
+TCTCGATGACCGATGGCCCGAGCAAGCTGGAGTACATCCAGCTTTTTGCTGAGTCGCCAG
+ATAGCTTCGGCCCGGCTGTCATGGAAGTGTAGGTCTTGAATGGTCGTTTTGTTCCGCACC
+TTGCGCCAGAGAGCATCCCGATTCGCATCCGATAGTTGGAAGCATGGGGCATCATCGCGG
+GGTAGGGCCTCCAGAATCTCAATGGCTCGAGACGATAAGGGAACGTCGCGGGCATCACCA
+TTTTTCGTTTTGGGAAGATGGGCGTAACGCTCACTGATGTGAACATGGTCCCATGTAAGG
+GCGGTGATCTCGCCGGAGCGCATCGCGGTCTCAATCGCAAAAAGGAATGCAAGCCCGATC
+CGATTTGTTGATGTCCTGCAGGCGAGTCCCGCATCCAGGCCAAAGGCCAGACTTATCTCT
+TCCACCTCTGCCTGGGTGATGCGCCTCTTTCGGCTATCTGGCTGATCGGGGAGCTGCATA
+CCCTTGATGGGGTCATGGTTCATGTAGAACCACTCTTCTCGGCAGTAGCGAAACATCGCC
+CGGAGCATGTTCAGCTCGCGAAGCATGGTCGCCGGCGTGACGCTCTGAAGGCGCTCATCG
+CGCCATGCAATGATGTCTGATCGATCGAGGTCTTGCATGCGCACCTTGGCGATGCTTTTG
+GACTTGAGTGATCGGCATTTCATCACCTCCCATCGCCCTGCGCCTCGCGTGGGGGCAACT
+TCTCGCTCGTAGCGCTCAAGCGCATCAGAAACGAGGCGGGGGATGGTTGCTCGGCCAGAT
+GAAACGGCCTCCTGTTCAATGGCCCATGCCGATGCCTGGGCCTTGGTAACGAAGACCTTA
+CTCTTGCGCTGACCCTTGATCAGAACCTGCGCTCGCCAGCGCTTTCCATGCTTGAAGATG
+CTTGCCAT
+>NC_017033.1|provirus_2089294_2107522
+CTATGCCCGAACATCGTGGCCATCCGAACCCAGAAAGCGTCGATCATCGACTGCGAGGCC
+TTGGGCAGCTGGCTGTGCTTCTGCTGAGGCTTCGGCCTGCTTGCGGATTGCGATGGCGGC
+CTCGACGCGTTCGACCGCGCTGAGCTTACTGCCGCCACTGCGGCCTGCTGGATGGTTTGC
+ATGGGCTGATCCTTGGGTGACGGGCTTGGGGCCCTCGGCATGGCGATTACGGGCGGTTGT
+GATGGCGTAGGCGAACGGCTTGGCCTTGTTGCGGAACTCCGCAGCTGTGGCTGCCAGCGT
+TTCCGGGGTGATGCCCTCGGCCAGAGCGGCGAGGAGATCCGGATGCTGAGGGTTCACGTC
+GGAGCAGCCGGCCTTGCGCATCAGCCGGCAGGCTCGAGCGGCTTCGGTGATCGTTGGGCC
+GTCGTCGCTTGAATCGCTCGCGCTCGTGCCCGCGTCTATCTCTCTCTCTTGGTTATTGGT
+TACTGGTTTATGGATACCCGTGTCTTCACATGTGACAGGTTGTGACGTCACATCGTCTGT
+CACGGGACTTGTCACACCTGTCACGCGTGACAACATCTCCCGAAGCTGTGACATGGGCGT
+ATCAAATCCCGCTGTCACACCGTGACGCTCGAGCTCAGCAAAGAGATCCGCGCGGCGCTG
+CCTGGACTTCTTCTGGCGTTCTCGCTCGTTTGCTTTCTTGCTTTGTCGATCCGGTTCGCC
+TGCGCGGTAGGACGCAATAATCGAGTCGGCACGATGCTGCCGCCAGAAGCCGTCTACCTG
+GACGAAGAACTCCTCGAGGATCGCGTCGACCGCAGCCTTCTCTTCTTCAGTGCGGGCACC
+AACAAGTCGATATGCCCTGCCCTCTGGAATGCCTTCCTCGGACGAGTAGTAGCGATCCAG
+CAGCAGCGTGTAGACGCCATGCTCGAGGATCGTCAGATGGCGGGTGTCCCGGGCGTAATC
+GCCCAGGTGGCGCTCGTAGTAGTTCATTGCCTCCGCACCTTCCGCGCGATCGCGGCGACA
+AGGCGAACCACGATGTCCTGGACAAGGTGTCCGGCGTGGCTGGTGTCCTTGGACTCGCTG
+TGTGTGATCACGCCATCGGCCAAGGACTCGCGGACGGTGCCTGCAAGCCCGCCGCTGCGC
+TCGACCAGCTCCAGCACCAGGGCGGTCACGTCATCCTCTTTCTGCTGGGCAACTTGGTCC
+AGCGGCGTCAGGGCAAAGCCATGGCTGGCAGCCAGCGCGTGCAGGATGCGCACATCGCCG
+GTGATGCCCATGAGGCGATCAGCCTCCGCCAAGGTCAGGTGGTTGCGGTCATAAGTCGGA
+TTGACCTTGTGGCGAAGGATGCCGGCTTGCAGACCCAGCCGCAGGGCAAGGGTCTCGGCG
+CCACCGGGATAGTCATGCACCGTGGCATGGGCAGCATCAACGACGTTCATACGGAAGGGT
+CTCAAAAAGATGGAGCATCGGTTTTGCTGTACTGGCAAGATGGCAACTCACCACCTTCGC
+CACTTGTGACCTGCTCATGGATTTCGCTTCGATCACCGGCCTCGCCTCCTCGACGATCTC
+GACAATCACTGGCGCCAAGGATCTGATCAGCGCTGCCGTCGACATGCGGGACGCTGCGAA
+ACAGAGCGCGGAGCTCGTCAAGGCCAATGACCTTTTGCTCAAGGCCCAGCAGAGTCTCCT
+CACGTACACCGGCCAGCTCATGGAGCTGCAGGGCAAGTACCTCGATGCCTGTGAGGAATT
+GCGAAAACTGCGAGAAGCCGAAGCGGACCGTGGTCGCTATACGCTCTTCGAGGTCAGCCC
+CGGGGCTTTCGCTTATCGCGCATATGCCACCCCACGACTCAGCACAGCTGGCGAGCCATT
+GCCGCCGGAGCCCGAGCATTACGTCTGTCAGCCGTGCTATGACCGCGGGATCAAGTCCGT
+CTTGCAACGCTTCAACCACTACGGGTCGATCTATCTTCGGTGCTCCATCTGCAAGCAGGA
+CTTGCCCACCGGCCGTACAGAGCCTTTCGGAGGTATTTGATTGCTTCACGCAGCCACCAC
+CTGCCCCGGGCTGGCGGGCCTCGGAGGTGAGATGATCGACTTCACAGACATTCCAGTCAG
+CTTCGAGACTGCCTGGACGTGCTGATACGGGACTCGGCGCCATTGAGAAACAGCCTGACT
+GCTGATCCCGCAGCAACGAGCGACTTTTGCCGGGCCGCCGGCCCGCTTGATGATGTCTTT
+GATGTCCATAAAGCTAAGGTAAGTCATGCTTACCTTTATTGGCAAGAGATACTTCCGTGC
+GCCTTGTAAATTTCCCTTACATACTCGCCCCATGAGCGATCAACTTTGGAAACGAATCAA
+GGAGGCCAGGACGGCAGCCAAGCTGACTCAGCAGGCTGTTGCTGACGCCTTTGGGATTGA
+TCGAGTCGCCGTCTCTCTCTGGGAAAGTTCAAGTGATGCCCGGCGAACGAGGCCAGATAT
+CGGCCGGCTAAGGGAGCTGGCCAAAATTACTGGCGTGAAGATGGAGTGGCTGCTAGGTGC
+GGATGGAGATCCAATCGGATCCACCCATCTCGTCTCACGAGATGAGACAGACCCGGCGTA
+TGTTCGATTCCCTCTCCTTGAGGGTTACGCAGGCATGGGGCCTGGAACATTCATCAGCGA
+CTACCCCGAAGTGGTCAAAGACCTCCGCGTCTCCCGCGAGTGGGTCTCGCAGAAGATGCC
+AGGCATCCCCCATGACGTGATCCGCGTGATCACCGGTCGCGGCGACAGCATGCGCGGGCA
+GTACAACGATGGGGATCTGATCTTTGTCGACACACGTGTGAAAAGCTTCGATCAGGACAG
+CGCGTACTGTTTCCGCTGGGCCGGCCGCGTGCAGGTGAAGCGCCTGCAGCTCATCAAGCC
+CGGGATCGTCCGCATCCTCAGCAAGAACCCCGACTATGAGTCGATCGATGCTGAGGTCGA
+GGAGATCGAGATCGGCGGGCGAGCCATTGCGGCTTGGACCTTGAGGGAATTTTGATATGG
+CAATTGAAAAGAGGCTTTATCAGCAAAGCCACTATATTGGATACAGTGCTAGTAAATAAA
+ATACACTTACTAAAAATCAACAATTCAATATCCGCACCACCAACATATAAAGCACCAATC
+CAAGGCAATAAGAAATGAATGTCAACTATTTTGGTTATTACCTTCACGACCACAAAACCA
+ACAAAGACTACCAGATTGATCTATCAGACCTATTTGACTCAATATCAAATAACAAATACC
+CAGATATAAATAGCAACCTCTACTATAATGGAGATCGAATATACCCACTCCCCTATCTTG
+GATCAACATACCTGCTAATTCAATCAAGAGACAATGAGTTAATAAAATTTATTGAAAGGG
+CAACATTGAAACATGAAGATCTATCGACCAAGCTAGGCACGGCGAATTCAGTCGGAATGG
+CAAGCTACGTTAAGTTCGAGCCTAATTGGATAGCAATAGTTAGCAAGGTTTTGTCGCCAA
+GGATTCAGGCGCTATCCCATATAATTAATCACTTTATTAGATGCCTAGGTAGTGACTTAG
+AATTTAAGCTCGCCGCATTTAATGATAAGGTGTCAAAAAAAGATATTGTCAAATTAAATC
+ATGTTAGCTCAATATCCATTGGATTGAACGCCTCCAGCTCGTTAACCAGTAAGTTGGTCG
+GCACACTTTTAGGCAACGGGTATCCAGCCACCTCTGATATCGGAGGCATAGAAATCAGAC
+TGAAGCCATCGTCGTCTAAATCAAATTTGAAGAAAGACCTTCAAAATATAGCCATTAATA
+TACCAGACTCTGATATCGATGAATTAGATGCTCGCGGCAAAATTGAGGCGACTGACAGAA
+TGAGGGATCTATATATTCATGGCTCTGGTGGACTTAAAGATTTCATCAGGCCTAGATACG
+AACATGAAATACCTTCATCTATTACTAAAGCTGCGTCACTAAACACGGCCCTACAAGCAA
+AAATAAAGGAGTTTAGTGGTGACCCGAATTACATCAAAACTAGCGATCCCCATGCTATTG
+GCCTTAACTGGTAATTCCCTAGCGCTACTTTTGTACATCCTATCCTTTACCAAAAAAGGT
+GGCGCACTACTCATCACCCTTGGAAAAAACTCCGATAATTTTGCAGCAATGTCCGCCAGT
+GCAGAATTCTCCATGCTTGGCTTTCTATCTGCAGTAATGGCCTTATTTAGCATCATAGGA
+CAATCGGAAGCACTCAGGCGTTACCGTATTAACGGCTACTTATCCAGCCTCTTGATCACA
+TTCTCCTTCGCGCTACTTGAGACTGCGATCGCCTTCACATCATCGCTAATCCTATTCTTT
+AAGCCAGTCAGTAATATATTCATCACGATTGCTTTCATTGCCCTAGTCGGATCATTCGGA
+ATGATGTGTGTCACCTTGATACCATGCATAGGCCTTCAAATAAGAGCATCGAGCGAAGAA
+TGAGGAGCCTCATACTCCTAGAAAACAATCTTAAATTCACGACTTATCAATCAAGGCCAT
+TATTCACTTATTCACAAGACCCAAGCATTGCCATGTGATTATTTCCCACAAGTAAATACC
+CAATTCCATCCAACTCCAAGAAGCCACCGCCAAGTTCTTCGATCGCTACATCGCCAAGGA
+TCTCAACCTGTCCCCAACATGGTCAGATCCAAAGAATACGGATGGGGCAAGCGGGCCAGC
+CCCGAACTATGACCGAAGTGGTTGCTATGCCCTGCTCTCCGGCGATGAAGTGATTTACAT
+CGGCCTGGGACGCTCTTGGAAAAAGGGGCGCTACAAAGAGCACGCAATTGGCGTGCGTCT
+GAGCGCTCATGTCCTGCTCGTCGACAAGGCCACAAACACCTACATCACGCGAGAAAAGTG
+GCGCGCGCTGGGTGTCGATTCCCTCATCACCATCGGCTTCCCTCACGAGATGTTTTTCCT
+TGCATCGGCGCTTGAGGACTATCTGATCAATGAGCTGAAGCCTGAAGGTAATGGGGTTGG
+GAAAGGGCGATGAAACTTCTAGCTTATTCGACCAGAGCTGTAACCACATCAAGTCGTGGG
+CGAGTGAGGGGTACACCTCAGCCAGACTGATCAATCACCCCTTAGGCGACACAGTACCTC
+ACAAAAAAGACACAAAGACGAGTTGTATTTAACAATTTGATCACCCCCCTTCAAGAGGAA
+AGCCTTACCTCACCACCCTAATTAAGATGCATCTATCACCAAACTCAGGATTAAATATCA
+TGTCGGAAAACAATAAATCCACTGCATTCAACGACAAGTACTATGAAGAACATTTCAACC
+TAGAATTCCTTCCTAAGAAATGCATGCTATGCCAATCAGGATCATTAAATAGAAAAGGCC
+ACCTCATACCAAAATTTATATCAACCCAGATAAAGAAGAAGCTTGATATACCCACACTTC
+GCTACAGTACAGTAACCGACCAAGGATTGATTAACGAGGGCAGGCATCGGCAAGACACGC
+TGGCATTACAGTTTCTGTGTGATAATTGTGAGAATAGGCTCGGACTGGCTGAAAGTGCCT
+TTTCGAACAGTCAATTTCGCCCACGTCTTGAAGGCGCCCAAATTCCGGATATGGATCGAT
+TAACTCATGACTTCATAACATCTATCGCATGGAAATATGCGACCTTCAATAGCTTCAAGA
+AAGTTGGAAGCAACTCTCTTTCAAGAATAGAGCCTGAGATCGAAAAAGCGAGAAAATATT
+TAGCAGGAGAACAAGAAAGCAATCCTTTTGATATATACTTCATAAACTTGGAGCGCGTGA
+GTGAGGTAATGGAGAATACAGACTCAAACAGATTTCTCTACAACATAACTCTCCGCGATC
+GAGAAATAAATCCAATCCAACTGATTGGAGACACTTGGTTTCCCGGCACCTCGTCAGGAA
+TTCCAATAATAACAGTTAGGCTAGGACCGCTATGCTACATTATAGCTCCAAGCGGTCACT
+TGCATCTACTCAGATGCATGCCTGAAGAAAGGCCATCGCCACACAACATAGTGGAATTGG
+AGGTGACGCAAGATATTATCAACCTGCTTATATCGCTAGAAGGAGGATTTATTGATGGCA
+TCCCATCAAGAATAAACAATCCAGCCATGGAGTATGAGATGAGATGAGATGCAAACTTCT
+CAATCTCCACAGAGGCCGCATATCACTAGCGACATAATATTCAGCACGCCTGACTTGATG
+ACATCATCAATAAAATTCCTACTCCCAAGTTTTTTTCATACACTACCCCACGTCTAGATC
+CGCCCCAAGCCTCAGGGTGGTCCTCGGCTCATCGTAGTCGCCCGTCTCTGAGTCCACAGT
+CTGGGCAAAGACCAAGACAGCGGCCTACTCTTCTTCCAGCCTGTAAGCCCTGCGCACCGC
+CGCATCCTCCGCCGTCTTCGGTATGGGGGTTCGGCGAGCAGCTGACCGCGTTGCCCTGTA
+ACCCACGTCTGCACCACATAGATCGTTTCTTTGGCCATAGCTCCTCCTGGTGAAGGAAGC
+ATGGGCCGTGCGCGCCTCTCGGTCGGCACAAACATAACCATATGCTGAACAATTGTAGGA
+TTACCTTACCCCCCACACGTAAGTTTTACTTGCCTTTAAGTGTAAGTATGGCTTACCTTT
+ATCCCGCGCCGCAGCGAACCGCTGACCAACGGCCTGGGATCTTCCACAACCTAGCGGGCA
+CCCGAGGATGGCATCGCCATGCGGAGGGCCCAGGGTCTGACCAGCCCGGATATCGGTCGC
+CGTGCGCCTTCGCAGAGGGCGCATTGGCATGGCGGTTGGCGCTTGCGCTGACCGAGGCGC
+TGAACACTCGGAACCCTCCGTGAGACATGTGGAATGGCCTGTAACGGGGCCGGCCAGCCG
+CCATCCCAATTCGTCACCCTGCCCGCTCGGGCTATCTCGCGCTTTTCCGCGCACCTTCCA
+CTGGAACCACAACATGAGCATTTCTACTCGCATCTATCGCGTCGTCGTCAACGAGGGCGG
+CGATGACGAAAGCACGCACCTGGTGCGCGCAAACACCCCTGACAACGCTGTAAAGCATGT
+GCTGACGAAGCAGATCAGCGCGAACGTCGCCACCCAGGACGAGCTGGTCGAATTGGCCAG
+CCAGGGTGTCGCCGTTGAGACGGCAATCGTCCATGATAGGCCGGGCAAGCCGGGCCGTCC
+GAAGCAGAAGGCGGCGTAAGCAACACCCTGCAGGATGCAGGCGTAAAAACCGTGCGAGGC
+CGGCGCAATACCCGGCCACTCATTCCCCACCGATGCGGCCTATCCCGCATCGATCCGCGA
+CTCAGCTGGCAGCCGTGCCGGCTTTTTTTGTGCCTGGAGAAAGTCATGCACTTCAAATCT
+GCTCAATACCGGCTGCTGGCAAGCATGCCTCAGTACCTCGACTACACCATGGGCCAGCTC
+GCCGCTCTGTGCACTGTGAACCCGAAATTCCCGCTGATTGCCGGGGGTATCCAGTGAGGT
+CGACTACCCAGTCTTTCATCCGCCGGCGCTTCAGGGGCTTCACCCTCTATATCTCGGCCA
+CGGCCATCAGCGGAACCCACGATGTGCGCTTCAACACCGGCGCCGGCGAGTTCACCCTCC
+AGATGACACCGGACGATATCGAAGGCGTGCAGTCGGTCCTCGAGCAGGCACACACCCTGA
+TCGATGCGAACCTGCCGGGCCGCTGTCGATCCTGCGCAGGAACTGGTGAATATGGTGTAG
+GAATCGGCATTCCTCGCGACTGCCCGGCCTGCTCGGGAACTGGCCTCAAATCGCGTCAGC
+AGGTGGCGGCATGACCGACAACGACAAGACGCTGCGGGATGAGTTTGAGGAGCGCGCCAA
+GCGCTTATTTCTTCCAATCGAAAGGAACAGATTCGATCAATACCGGGATACCCGCACTCA
+GCATATGTGGTGGGGGTGTCAGGCCGCCCACGCCAAATACGCCCCGCGATGGCTGCCGAT
+TGATGAGGAGGTTAAAGATGGCAATCCCCTCCTAGGCCTACGAGTACAGGACGATGCTGT
+CTGCCTCGCCTACTGGAATGATGAATCTTTTTACAACGTCTGGACTGGGGAGAAGGTCAT
+TCTTACTCACTATCTTCCAATCCCTGGTGCGTCGGAGGTGGTGGCATGACCACCTACCTT
+CAGCCGCCGGGCATGTTCTGCGATCGAGCCGGCGAGAAAAGGGCTGACGAAGAGGAGGCC
+ATCGAAAGGCAAGTTGCCTCTGACCTCTCCGATCCAGACGTCGCCGAGGAATGGCTGATG
+AGTTCGATCGACCGCTTCGACGACACCAAGGCAGCCGCCCAGGCACTGGCCCGGGGCGAC
+CTGCACTCGTTCCATAACATCTTCGCCCACTGGGTGCAGGCGCAGACCGAACTGCGCTTT
+GAGCAGAAGCTCCGCGGCTTCCACTGATTCAAATCCCCTCCCTTTTGATTGTGCTGGCTC
+AGGCCGGCAGGAGATCCCCATGTCTGAAATATCCGTGGCCAGAGCACAGAACCTGGCACA
+AATTGAGCGTGTAAATGCGCTACTTCCCACCTCGATCGGTGAGGCCATGCAACTCGCCGA
+GTTCATGGCTAAGTCGGATCTCCTGCCTCCGCACCTAAAAGGCCGACAGGGCGACTGCCT
+GCTGGTGGTAATGCAAGCTCAACGCTGGGGTATGGACGCCTTATCAGTGGCCCAATGCAC
+GTCAGTTGTTCATGGACGCCTCTGCTACGAGGGCAAGCTGGTTGCGGCAGCCCTGTACTC
+ACAGAAAGCCATCGATGGCCGCCTCCACTATGAAATCAGCGGCCATGGGCAGGACGCCTC
+CATCGTTGTAACTGGAACACCTCGTGGAACTGGTCAGACTCAATCAGTGTCAGGCTCCGT
+CCGCAAGTGGCGAACGATCACGATGAAGAAACAGGATGGCGCCCCTCCCAAGCGGGTCGA
+CAATGCCTGGGACACAATCCCGGAAGACATGCTGGTCTACCGCGGAACGCGGCAATGGGC
+GCGACGCTATGCGCCTGAGGTGATGCTCGGGGTGCAGACGCCCGATGAAGTTGACGATAC
+ACCCATGCAGACCACTGTGATCCACAGCACGGCTGCATCCTCTCCTGCCATTGAACCGTT
+GATTCCTTATCCGGAAGAAGAGTTCAGCAAGAACTTCGACACCTGGCTCGGACGCATCCA
+GTGCGGCCGGAACTCCGCCGAAGAGGTGATCGCCAAGCTGCAGACCAAATACACCCTGAC
+GCCCGGTCAGCTGGGCGCCATCCGTGACCTCGAAACCACCGAGGCGGAGGTAGTCGAATG
+AAGATCGTGAAGCTCACCCAGGGCACGCCGGAATGGCATGCCCACCGCGCCCGTCACTTC
+AACGCCAGCGAGGCCGGCGTGATGCTGGGCATTTTCCCTGGCGTGAAACGCAGCGACCTG
+ATCAAGGTCCGCGCCACCGGCATCGAAGAGGAGATCTCCACCTTCGTGCAGAAGATCTTC
+GATGACGGTCATCGCTTCGAGGCACTGTGCCGGCCGCTGGCCGAGCTGGTGATCAGCGAG
+GACCTTTTCCCCTGCGTCGGAGAGGATGGCAAGCTGTCGGCCAGCTTCGACGGCCTGACG
+ATGATGGAAGATGTGGCCTGGGAGCATAAAACGCTCAACTCGGTGCTGCGCAAGGCATTG
+CCGGAGGCGGCCCATACCGGTGGCACGATTCCGCTGCACGGCGAGGATGTCACCCTGCCG
+GCGCACTACTGCGCACAGATGGAGCAGCAGATGCTTGTCTCCGGTGCCGATCGTACGCTG
+TTCATGGCATCAGTCTGGGATGGCGACACGATGGTCGAGAGCCGGGCCTGCTGGTATCAC
+TCCGACCCCGAACTGCGCGCACGCATCGTTGCAGGCTGGGCCCAGCTCGAGCAGGACATC
+GCGGCCTTCACCTTGGAGCCGGAAGAAGCTGTCGTCGTAGGCAAGGCACCCGACCAGTTG
+CCCGGCCTGCACATCGAGGTCACCGGCATGGTGACTGCCTCGAATCTGGAAGCGTTCAAA
+TCTCAGGCGATGGCGGTGCTTGGCGGGATCAACCGGGACCTGCAGACCGATGAAGACTTC
+GCCAATGCGGAAAAAGCAGTCACCTGGGCGAAGGGCGTAGAAGATCGCATCGATGCGGCC
+AAGGCCAATGCGCTCGCCCAGACCGAAACCATCGACACCCTCTTCCGCACCCTGGACGAC
+GTGAAGGAGGAGACCCGGCGTATCCGCCTCGAGCTCGACAAGATGGTGAAGGCTCGCAAG
+GTCTCCATCCGGGACGAGATCGTCGACGCCGGCATCCGTGCAGCAAGAGCCCACTACGAT
+CAGCTGGACTCGAGCCTGGGCGAGTATGCCATCCGTCCCGATCACGCCACGTTTGCCGTG
+ATCGGTGCATCGATCAAGGGCAAGCGATCGATCAGCAGCATGCGGGACGCAGTCAGTACG
+GCCGTGGCCGACATCAAGATCGCTGCGAGCCAGTTTGCCGAAGTCATCCGCGCCAACATC
+AGCATCCTGAAAAATCAACATCAGCACCAGTCACTGTTTGCCGATCGGGTGATGCTTGCA
+CAAACCAAGTCGCCTGAAGATCTCCGCAACTTGGTCGCGGCTCGTATCGGCGAGTTCGAA
+CGGCAGGAGACTGAGCGACTGGAGCGGCAGCGCGAGCAGATCCGCAAGGAAGAAGCCGAG
+AAGCTGGCCCGCGAGCAGGAGGCGGCCAAGGTGGTGGACGAGACTCCGCCGGCATCTGCA
+AAAGTCGTCCAGTCCGCACCTCAGGCGCAGAGCCACTTTGCGGCATCAACGGACGAGATC
+CCAGCCAAGGCCGAAAAAGTCGCCCAACCGGCAGGCCCTGCCAAGACCATCAAGCTGGGC
+GACATCAACGCCTTGATCGCACCGCTTTCGATCACTGCAGACGGACTGGCGCAGCTTGGC
+TTCAACCCTGCAAGCATCGATCGCACCGCCAAGCTGTACCGAGAGGACCAGGTCCTCGAA
+ATGTTGAGGGCCATGATGGCGCGGATCAAGGATGTCGGCCTGGCAATGTCGGAACGCAAA
+GCGGCCTGACCATGGCAACCGACAACTCCCTTCCCACCATCGACATGTTCCAGCCGCTCG
+ACGGCTGGTTCGACTGGCGATCCGGCCGTATGCGAGTGCTTGTCCGAGAAGGCGAGCCAC
+GCATGCGCTGCGGAAAGATGGCCTGCGGCCACGATTCACCATGGGCCCCTGAGTTTTCCA
+AACCGTGGGGCACCTTCCCGGATCTGCCCGAAACAGTGGCCGAGAAAATGGCCGCCTGAG
+GACGAAGCATGAAATCACTCGGAAATATCAGCCGTGGCGCAGAAGCCGCGGCAAAACAAA
+TCAGCAAGAACGCCCTGGAGCATGGACGTGTCGCGATCTTCATCGATGAGACAGGCGATG
+TTGCCTTCGTCCCGCATTACGATCGCCAATATGGCGCGGCGCTGGCGACTCTTTCCAAGC
+AGCTCGTCGGAATTTATGAGGGCAACGCCTCAGGCACCGGTGTGTGCCACCCGACGCAGT
+CGGTCTATGCCATCTCCAAATCGGACCTTGAGCATTGGATGGGGTTTATCAGTATCCCGG
+CCGGTGTGTGCGCGATGACTGAACAGAGGGCTGCAGCATGAGCGCTGCTGAAAATATTGA
+TCCGGCCGAAGGCCACCTGTGGGGTTATGAGGACTGCGCCAGGTATATCGGCGTGGCCCG
+GTGGACCTTCGTCAACCGAATCAGCAAAGAGCCGGACTTCCCGCGCCCGGCCATCGAGCT
+GTCGAGAAAGATCCGGCGATGGCTCCCCGAAGACGTGAAGGACTGGGCCTATCGCTCCCG
+CCGCCGGAACCGGCGTTAACCCAGCTTGGCCGCCATATCCGTGGCGGACTCCCGGTAATA
+GATCAACAGGCTTTTGATGTCCCTGTGACCGATGACCCGGGCGAGCTGCAGCACATCCAG
+CTTCTTGCTCAGGCGCCAAATGCCTTCCGCACGCGTGTCATGGAAGTGCAGATCCTCGAC
+GGCCGCCCTATCCCGGTACTTTCGCCAAATTGCATCCCGCTGCGCATCATTCATGCCGAA
+GCATGGCTGATCGCCATCCCTTGGTAACGCCTGCAGTATCTCGGCGGCAAACGTGGACAG
+AGGAACGTCCCGTTTGTCGCCGTTTTTCGTTATGGGGATATGCACATAACGCTTATCGAG
+GTGAACGTGATTCCAGGTCAGCCCGACAATCTCGCCTGACCGCATCGCCGTCTCGATGGC
+AAACAGAAAACACAGGCCGACGCGGTTGGCCAAGCTTTCGGCTCGCAGCTCATAACCGAC
+ACCGAAGGCCTGGCGGACGCACTCAATCTCATCATCCGTAAGCCGGCGCTTGCGGCTCTC
+TGGTGACTTGGGAGCTGCAAATCCTTCGAACGGGTTATGGGTCATCCAGCCCCATTCCTC
+TCGGCACCGCCGAAACAGGCCCCGCAGCTCGTTCATCTCTCGCCGGACCGATGCCTCGGA
+GACCTCTTGCAGCCTGGCATCCCGGTAACGAATCAGGTGATCTTTGCTCACCTCGGGTAT
+CCGCACCTCGGCAATGGGATCCAGCATCAGGCGCTTCACGCGAGCGATATCCCCCCGTGA
+TTTGCCGGCATTCACATGCTCGTCGAGCAGGCGCTTGAGGGCATCTTCCACCAGCATCTT
+CTGCGCAGGTGCCTGCTTGCCCTCAGCCTCTTGGCGAAGGGACCAGCGCTGCGCTTCGGT
+CTTGGTGGAAAACGACTTGCTGACGCGCTGGCCATGAACCATGACCTGGGCTCGCCAGTT
+TGTGCCGCGCTTTGTGATGGATGCCATGTCGCCTCGCTGCTGGTGCAATCTCTGGTGCAA
+AAGTGGTGCACTAGGGTGCAACTTACGGCAATTTCTGGCAACTAAAACGAGAAAGGCCAC
+CCCTTGCGGAGTGGCCTAACTCGTCGTTTTCTAGCGTTTTTGCAATGATTTGCAATGTAT
+CGCTAGTTGGTATTGGTGCCAAGAGGGGCATCGAAAACCGCATAGAAATGCGGACTATCA
+ATGCCAAAAGAAAAATATGCCCCCCAAAAATGCCCCCAGACCGGCCGCGCTTGAATGAGA
+CAGCATGGGACAACCGGGCCATCTGGCGAGGATATCCACCCGTCGCCACTGTAGAAATTG
+ACCCGATCTGATTGGTGCCCCTTTAGGGCACTCGATCTGGTGCAGAATGTCGCAGGTTGA
+GGGGGGGGTAAAAGTGCGGAGGTTATTACTTTTTCGGTGTTCCAGGTGTTCCACCCCTCC
+TAAACCCGCATGGTTAAGCCATTTCTCAGGCAAAAAAATGGAACACCTCCAAAAACGGCA
+GGTGTTCCAGGTGTTCCACTTTTGTCGGCGAGGATCAGCGGCGATCAGCCCTCTGCGGAG
+AAAACAGCCGCGCCCTCAAGGACATAGAACCGCCCCTTGCTCAGACCCCGCACACGCACG
+GATTGCGAGGCCTTGCCATCCTTGCCCGGCTGCAGCCATCCCGCGGCGATCAGCGTCTGT
+GCCGCCGCCTTCGGGTTGAAGCCCCGCACCAGCTCCTCGAAGGCCTCCGGCATGACCAGG
+TACTGCTCGCGCCGATCCTCGGCGCCCGGCTCACCGACCTGCAACTTGCGACGAAAGCCG
+ACACGATGTGCCACCGGCCGGCGCTCGTTATCGTGGTCCTCCGGTTCGAAGCGGCTATCG
+CCATGCGCCTCGATGAAGGCCTTCACCTGAGACAGCAGCGCCGCCCGCTCGGCATCGGCA
+GGGCCGCCGCGGTCAGCCAGCCACTGGCGAAAACAGATCCGGATTGCTTGCGCTGCCTCG
+CCCTCGGGCCAGCCGGTGATGCCGTAGGCCGTCGCCAGCTCGCCGGCGGCGCCGATCAGG
+GCAAAGCGCCGGGCCACGCGCCGGACTTGCCCGCCGGCATCTTCGGGCACCAGGTCCGCC
+AGCATGTCGGTCATGCTCGCCTCAATGCGTCGACGCGATGCACGCTGGTCCGCCGTCAGC
+TGCTCGAGAAAGGACAGCAGCGGATGCCCGTAGTGTGTCGCCGCGGCCCGCTTCAACTGC
+TCGGCCACCGCGCTGGCGCTGCTGCCCACCGGCACCGACTCGAACATGCCATGCCCCATA
+CCGGCATCCGCTGCCACGTCGATCACTCGCACCTCATGGCCAGCCCGACGCCGGCCGCCC
+GACTCCACCATCAGATCGCCCATGCTGACCTCACCCGAGGACAGAAACGCCGTGCGCCAT
+GTCGCCACCGGCCGGGCTCGGCCACTGCGATCTGATCGCCCTTTGCCCTGCCCGTTGGCC
+AGCATATAGGCGACCCTGCTGGCGTCCTTCGGCTCCAACTGGCCCAGCTCATCCAGCGGC
+AGCATCAGGTCGTTGTGCAGGGTCGCCACGCCCTCGAGCGCGTTGTCGGTCTGCCGCCAT
+GTTCGCATGTAGGCCGGCGGACCATAGACGGACGATGCCACCAGCACGGCAGTCGTCTTG
+CCGGTGCTGCTCGAGCCCCGCAGATGCACGCCGCCACCGTCCATGCCGGCCAGATCCAGG
+CACGGTGCAGAGAAAGCCATGGAGACCGCCAACACCAGGCGGCTATGCCCGATGCAAACC
+TTGGCCACGCTATCGGTCCAGCCCTCGAGCGTGCCGCCGGTGGCGACTTGCGCCGCACCC
+GGTGCCGTGGTCTGGAAGATAACCGCCTCAGCTGCTGTCGGGCCAAAGGTGCGATCAGGC
+AGCGCAAACACCTCACCATGCCAGCCGGTGCGGCTCACGCTCCGCGCCTTCTGAGTGGGG
+TTGGCCTGGGCGATGTAGTCCATCAGCAGCTTGCGGGCGTGCTGGGAATTGGCGATCACC
+AGACCTTGCCCCAGCAGCTCTGCCCGCAGCTCCGCGCCATCGGTGGCCAGCATGGCGCAG
+GGCATCGCCCAGCGGTGCGCCTTGCCGTCCCGATCCGTGAAGGCCAGCAAGCGCCCCCAT
+TCTCCGCCATCGGCATTGCGTGTCTCGGCCTCGACATACAGAGGCGCGCAGATCCACGTC
+GCCGGCTTGTCGCTGTGCGGGTCGCTGAAATAGACCCCGTGGCGTCGGCCTTTGCCACGC
+TCGACCACTTCAAAGCCGGGCCCGGCCGGCGGTTCGGCATTGCTCACCACCAGGGCGAGC
+GGCGGCAGCGACTCGGCCGCTTCAATCGTGGAGCTGGACATGATTTTTGACCTCGATAGA
+TTCGGGCGTGCCGCCTTGCGCGGCCAGGGTGGTGGCGTAGTCGTTGAAGTCGCCGGGAAT
+GGGTGGCACGGCCAGCGCCGCACCGATGGCACAGGCCGCTTGTGTCGCCGCCTGCACACC
+GGGATTGCTGCCATCCGGCTTGGCATCGTTGTCCGCGCAGATCGTGATTGGCAGATCCGG
+GTAGCGATCGCGCATCACCAGCGCTACCGCCAGCAGGTTGCCGGCACTGAAAGCGACCGC
+CACCGCCTGGCCGGTGCTGGCGTGCAGACTCTTGGCCGTGGCCACGCCCTCAGCGATCAA
+CAGTCCGTCGCGGACCTTGCCCAGCAGGCAATAGGCGCCGCGGACCATGCCGCCGGGCAA
+AAACCGCTTGTCACCGTCGCCGCGGATACGCTGCAGGTTGACCAGGCGGCCCTCGGCATC
+GTGCATCGGCACCAGCAGCTTGCCGCCAGCTTCCCGCAGCCCGTCAGCCGTCACGCCTTT
+ACGTTGCAGGTAGGGATGCCGCGGACTGGCCGGGCTGGCGCGCTGCCACTCATCGAACGC
+ACTGCCGGCGGCACGCCGCTGGCGGTGACGTTGCTCGGCATCGCGTGCGGCGCGGGCCTG
+CTCGATGGCGATACGCTGGCGCTCCAGCTCGTCGGCCGTCATGGTGCGGCCGGACTGGCC
+CAGCACCACAGTATGCTGCCCGCCTTTGCGCCAGCTCCCGAACACCGCGACAGGTCGCTC
+CGTATCAACATACACCACGGCCCAGCCATTGCGCTTGTCGCGCCGGTCGCCTTCATCGTG
+GAACCTGCACAGCACGCCATCCAGGCGCAGCCGGGTCGGATCGGTCGGCGTGATGCCGTG
+CTGGCGCATCGCGGCCACCAGGTCGGCCAAGAGATTGCCGGTGTAGCGGCTCATGCCAAC
+ACCTCCCCAGCGATCACCCTGGCCATGTCGGCCACCGTGGATGGATTGAAATGGAACTCG
+CCCGGGTCGTCGTTGAGTTTGATCTGCTGCCAATCGCTCACGTCATGAGGCCAGCTGGTC
+AGCACCCGACTGGCCGAGCCCTGGGACCGATTCAAGGCGGCCATGCGCTCGGCCGCGGCG
+CGATCGGTGGCCCAGACATTGCACAGATACAGGATCGACACGCCCGGCAGCGGCGACGGC
+AGGCCCGCCAATGATCGATGATCTGCCGCGCGCACCATGTCGGCATATTCCCGGGACAGC
+CGGCCGACCTGCGATGTACGGATATCGCCCATGATCGAAACCACGAAGTAACGTTTCATC
+GCGGCACCTCCCCGCCGGCAGCTGCCGCCCGCAAGGCTTGGTTCTCTGCCATCAGCTGGC
+GAACGGTCGCCCGCAGCTCGGTGCGCTCGTCGTCGTAGTTGGCACCGGCTTCGACAAGCA
+GGCGCTGCATCTGCCCGTAGACAGTCCGCTGATCGGTCATGGTGGCCAGGGTCTGAAACT
+CGGCCCGAGCATCATCCGCAGTCAGGCTGGCACGCTTGGCCAGGATCGCAGACCGGAACG
+ATGCTTCATCCAGCACGGTCCACAACTTCACGAACACGTCGCGCAGGCCGCGATAGGTCG
+GGGTGTTCAACGGGTCAAAGCCCGGCACGGTAACGGCGCTCATCGCAGCACCTCCACCGC
+CATAAAAGCGCAGGTGGACAGCACAACGCCGGCAACGAACGCAGCGAAGATATCCAGATC
+CGTGCTGCTGACATGCAGCCAGCCAGAAGGCCGGAAGGAAAAACGAGACGTGTGGGAGAT
+GGTGCAGGTGCGTGCAGACGCACCCTGGGCATGATGTGCCATGGTGGGGTTCCTTGAGAG
+ATTGGAACCGCCGCGCACAGTCGCCAAACCATGGGCGGCGGGATGCAACGGGTTGGCGAA
+CCGGTACTCAAGGAACCCGGCAGGCCCGTAGGCCTCCCATTGCACCCCGCCATAAGCTGG
+GCATGACGCAACAAAAAAGCGCCGAGTTGGCGCGTTGCGCCTCGAGTAAGTCGGGTCGCC
+AAACCCGGCCCCGGATTGTGCCGGGACGTGCGAATGGTGCGCGCTGGCGCATGCGATGGT
+CAAGCGATTTTGCATGGCTGATTCCTGATTTCAGGCAAGCCGCCCCCGTCCGGCCCGGAA
+ACTCCATGGCCGGTGGGCACGGTATGGGCTGGGGGAGTTACGCCGCTTCGGGCGTGCTGG
+ATGCGATGCGCAGGGTGTAGATGGCCACGCGGGGATGCTTGCGGCCCTGGTCGTCGGTCA
+TGGCTTGGAGCCGTGTGTCGATCAGATGGCCGGCTTCGCGCAGCTCCTTGATCCGTGCGC
+CTGGCATCATGATGTTGAGGTGTCGGCGGGCGTACATGGTGCTGACTGGCCCGAATCGCA
+GCGCCTGCAACATCCGGTGGCGCTGGGCCGCCGTGCTGGTATCATCAATGCGCGAGATTG
+ATGCGATGGGGCTTGCCTTCGGGTGAGCCTTTTTCGTGTCCGGCGCCCGCTGGATCTCCG
+TCACCAGGCGCATGCCGCCTGTCTGGCCAGCCGTCCCCGGCAGTGCGCGATGACTGGCGG
+CCAGATCCATCAGCCGCTGCTTGCGGTCCTCGTAGGGGATGCCCTGCCCCAGCAGCATGA
+TGTTGAGCCCTTCCAGCCTCCCGACCAGATCCAGCTCGGCCATCGTCATCTGGTCGCGGT
+CGCGCCCGGCAAACTTGCCCGTCACCACCCAATTGATCAGCTTTGCCTCATTCATGTAGT
+GATGGGGCTCCGTTTCCTTGCCCTGGGCAGCGCGTACCGTCTGCAGCATGGCCGCCTGGA
+TCTTGTGGCTGCTGGCGGCGACATGGCGCTGCCGGCGCCAATCATCCGTGCGATGCGTCG
+ATGCCTCGTAGGCGTTGATGACGCGCAGGTAGAAGGCAGGACTGACCCACGTCGCATAGG
+CGATGGCCAGCTGCTTGATGACATAGGTGCCGATGCGCTGCTTGGAGGCAATAGGCGTAA
+TTCCGCCTTTTTCGATTTCAGCGACCAGATCCTGGGTCTGCTGATTCTCGAGCCAATACT
+TGGGGCGGTGCCGCTGTTCGCCGCCGGCAGCTTGATGCAGATCGTTGAGGCAGTAACGGC
+CGGCCTTGTCCATCCGGATCGATGTGCTTGCGATCGACAGGCCATCCAT
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_017095.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_018014.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_018068.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_018068.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1081 @@
+>NC_018068.1|provirus_1361108_1399802
+TCATTCCCCTTTGTTAATCTCATCGATGTGTTTTTTATAGATGGTTGTTATTTCACGAAG
+AAGTTTATCGGATTGCTCATCCGTTATTTTACCTTTTTTTCGTAATCGTCTTAATTCTGC
+CAAAGTATCTTGAAGATATGGATGTTCTAATATTTCATGCCTAACTATAACGGGTATTTT
+TCCGTACCTTTGGAACAAATCGTTATCTTTGACGCTATAATAACTGGCAAATTCTTCAAT
+GAGTTCATCAGAAGGCATTCTGACGCCCTTTTCGATTTCAGATAAATATGAAGGGCTTAT
+ACCTAATGCCTTACCCACGACTGGCTGCGTTAAACCTTTCTGAGTACGAAGGGAATGAAG
+ATATTGGCCAGTGTCATATTGTCTTATTAGCTGCTGATGTTTCTCGTCCTCCAACATATC
+ACCCACGTTTCGCTAGTTTATTACCATAATATACAAGCTGACATGTAAATAACTGTCTGC
+TATATTAATTCATATCAGATAACTTCACAAGCTTGTTAATATAACAAAGGTAAAGAGTGG
+TTAATTTAACAAACATGAGTAGTATTGTTATCTTACAATGTTATCGTTACCAGTCTTAGA
+CGATTTATGCAAAATAGTCTCCTTGGCATCACCGAGGAGGCTATTTTTAGTTAGGAGGTG
+AACGTTTACGAAACTTGTGTATATTTGTTCGCCATGCAAAGGCGACATCGAAAGAAACAT
+TGCGAAGGCACGAGAATATTGCTTGTTCGCGATTAAACAGAACTGTTTGCCGATTGCTCC
+GCATGTTTTTTACACTTCGATTTTAGAGGACACTGTCGAGGAACAACGCAGAAATGGTAT
+GGCAATGGGCCTGGAGCTGTTGAGCATATGCCAGGAGCTGTTGAGCATATGCCAGGAGCT
+TTGGGCTTTCGGAGATAAGATTTCAGCAGGAATGATGTCCGAGATCGAAGCTGCCGAACA
+ATTGGGAATTCCAGTCGTGTTCTACAGTGATAAGTGCCAAAGGAGAATTTTGAAAGGAGG
+TGAATAAGCCATGAACTTGAGTAAGGAAAAGATAACCTATCTTATTCAACAACGGGGACT
+CACTCAGAACGAACTTGCTCGCGCCCTAAATATTCGACCGGGTTCATTATCCAATGCGCT
+ATCCGGTAAACGTGGGGTTGGGAGGAAGATTCTATCCGCTTTGCTCAGGGAATTCCCAGG
+AGAAAGTGCTATGAGTCTTACCAAAAGGCAGGTGGCAGTATGAAGATGAGCCCATTGAAA
+GGAGGTGATCCAGCTTATGCGCACAGCAAAAAGGCCCGTCGGTGCAGCAACACCCAACGG
+ACCCGATACAAAATATAACCAGTAAGAGTATACCACGGGAACATGAACGAATCCATATCG
+GTTAGAAAAGGAGAGAAAAAACCTTCATGAGCGATGATTTAAAGGTTATCGAGCAAAGAG
+ACCTTCTGGGAAATGATTTTAGGATATACGGAGACATGGAAAATCCATTGTTTCTGGCCA
+AAGATGTAGCGGAGTGGATTGACTACGATCCCAGTAAGGTCAATGAGATGGTTGCTATGG
+TTGATGACAACGAAAAGCTGACCGAGACAATTTCGTGGTCAGGTCAGGGACGCAAAATGT
+GGTTCCTCACCGAAGATGGACTCTATGAAGTTCTCCTTCAGAGTCGAAAACCCAACGCTA
+AAGAATTTAAGAGGCAAGTTAAGCAGATTCTTAAAGATATTCGGAGGCACGGTCTATATG
+TAACAGATACCGCATTAGAAAACATGCTCACCAGTCCTGATTTTGGTATAAGGCTCCTTA
+ACGAAATTAAATTAGAACGAGAGACAATTTCTAGGCTAGAACAAAAAATCGAAGAGGACA
+AGTCCAAAGTCGCTTTTGCCAAGGCGATTGAAGCAACAAACGATACCATCTATGTAGGGG
+ACTTGGCTAAACTTCTTAAGAAAAACGGTACGGATATTGGGCAAGCGCGGTTATTTGAGT
+GGCTGAGGCAGAATGGTTATCTAATGACGGGATTCAGTAAAAATACACCGATTCAGCGGT
+CTATAGAAATGGGTCTCTTTGACGTTAAAGAAGATGTGTTTACCTTTCCCAATGGGGACG
+TTCGGATCTCCAAAACTCCAATGGTTACGGTAAAAGGGCAGACGTATTTTATAAATCTGT
+TTGCGAAAAAAGAAGGAGACATCAGAAGAAGTGAACCCACGGTTGAAGTGGATATCAATA
+ACGCGCGATGATTAAACTCCTCCCACATCAGCAATCGGTTCTTGAACAAACAAAAGCCTT
+TCACCGAGTCGCCTATTATTTGGATATGGGCTTAGGCAAGAGTTTTGTTGGTTCAGAAAA
+GATGCACCAACTCAAAACGCCTTTTACTTTGGTGATCTGCCAAAAATCTAAAATTGATGA
+TTGGGCAGCTCATTTTCGAGAGCATTACGACTATAACGTTTATAGTTTCAACAAACAATT
+TATCTCGGAAATTCCGGAACACTCTGTGCTCGTTATCAATTATGATCTCGCCTGGCGGAG
+ATCGGAGTTATTAAAACTATCCAACTATACGCTGATCCTGGACGAATCCTCTTGTATCAA
+AAATGAGACACGGCGACGATCAAAGTTTATCCTCAAACTGAAAGCGGACAATGCCATCTT
+GCTTTCTGGTACTCCCACCGGGGGGAAATATGAGGAACTCTGGAGTCAATGCCAGCTGCT
+TGGCTGGGCCATTTCAAAGCGCCTTTATTGGCAGCAGTTTGTTAAAACGAAAATATTGGA
+GGTCGGAGGCTGTCCCATCAAGGTTGTTACTGGGTATAAAAATGTGGATCGTTTAAAAGC
+CAAGCTTCGTGACTATGGTGCTGTCTTCATGAAAACCGAAGAGGTTCTGGATCTTCCGAA
+AACCATGGATCAAATTGTTAATATCGCTATCACGAAGGAGTACCGTCGCTTCAAAAAGGA
+CCGGGTAATCGATATCAACGGTAAAACGCTGGTAGGAGACACACCACTGACCCAGCTCTT
+ATATCTCCGGCAGTTAGCCGGAATGTACAACGAGAACAAGATTGAGCGTTTGACAGATTT
+AATTCAATCAACAGGGGATCGCTTGATCGTGTTCTATAATTTTGACCTTGAATATGGGGT
+TATTAGGAATCTTTGTGAGAAAACGGGTAAGCAAGTCTCTGTGGTCAATGGGAAGCTTAA
+GGATTTAAAAGCCTACGAAGAACACTCCGATTCGGTAACGCTGGTTCAATATCAGGCGGG
+AGCCATGGGTTTAAACTTACAGCTAGCCAATAAAATCATCTATTTCTCACTCCCATTATC
+CAGTGAATTATGGATGCAATCTAAAAAGCGAATTCACCGGATCGGACAGACCCAAACGTG
+CTTCTATTATTATCTGCTCACAAAAGGAACCATTGAACCAAAAATCTTAGAAACCCTGCA
+ACAACGTAAAGACTTCACGGATCGGCTATTTAAGGAAGTGGACCATGACTGAAGCAGAGT
+TCCAAAAACAAGTCCAAGAATTCCTCCGCCGCCAAGGGGTTTGGTATGTGAAGTATTGGG
+GTGGAGGACGGTTTACCAAAGCAGGAGTCCCCGATCTTCTATGCTGTGTCAACGGTTGGT
+TTGTCGGCATTGAGTTAAAAACGGAAACGGGCAGAGTATCAAAACTTCAAGAATACAATC
+TCACTAAAATCCAAGAATCGGGTGGACAAGCTTTTGTTCTCCGTCCAAGCGGATTCAAAG
+CCTTTAAAGAGTTCATCGAAGGGAAGTGAACAAACTGCAATTCAGCCACAGCCGAGTCAA
+TACCTTCGAAAAATGTCCCTATCAGTTTAAACTCCGCTACCTGGACAAACTCACCACGAT
+CTCCGACTCCTTAGCCGATGATGCACTGGTTGTTGGTAACGCCCTCCATCTGGGTGCTGA
+GAAGGACGAACGAGCGATGTTGGAGTTTTACTTCTCCAACTATACCGTGATTGATGATTT
+GCACATCAACGAAACTATGAAACTGACCGCCCTTTTACGAAAGCTTAAGAACCATCTTGG
+CAGTATCTCCGGCCAATTTAGGCAGGAATATAAACTTGAACGGCCCGAGTTTAAAGGTTT
+TGTGGACTTGATCGTGACTAATCCAGATAGAACCGTTGATGTCTACGACTTTAAGTATTC
+CAATCATGTAAATAACTATCTCGATTCCAAACAGCTTCATCTCTATAAATTCTATCTCGA
+ACGGGAAGGGTTTAACGTTCAGCGAATCGGGTTCATCTTCATCCCCAAAACCTCTATCCG
+TCAAAAGAAAACGGAAGATCTTTATCAGTTCAGAAAGAGACTCATAGAAACCCTCAGCAC
+AATGGAAGTGCAAGTGGTTTACCTCGATTACGATTTCCAAAAAGTTAAAGAGTTCTGGGA
+CTCTTGCGATTTGATTGGTGAGACAATCGAGTTTCCTAAAAACCAAACGAACCTGTGTAA
+CTGGTGTGAGTTTCAGAAATATTGCCTAGAAGGGATTGACTATATGTTATTACCAAGTGC
+CGAACGTCGCCAAATTGATGCTGTGAGTAAGAAAGTCATCTGGATTTACGGTGCTCCATT
+TACCGGCAAGACTTACTTTGCTAATAAATTCCCAAGTCCTTTGATGCTCAATACTGACGG
+AAATGTCAGGTTTGTAGATGCACCGTATATCGCCATAAGAAACGAAGTAACGGTCGAGGG
+ACGGCTGACTAAAACAAGATTGGCCTGGGATATTTTCAAAGATGCCATTGCCGAATTAGA
+AAAGAAACAGAACGAGTTTGAAACCATTATTTTGGATTTACTCGAAGACACTTACGAGCA
+TTGCCGACTTTTTATGTATGACAAATTAGGCATTGAGCATGAATCGGATAACAGCTTTAA
+AGCCTGGGATATGGTCAGAACAGAGTTCTTATCCACGCTCAAACGCCTCATCAACTTGGA
+CTATAACATTGTTCTTATTTCCCATGAAGATATGTCTAAGGACGTGACTAAACGAACGGG
+AGACAAGATCACAAGGATTGCTCCGAATATTCAAGAGAAAGCTGCCAACAAAATCGCTGG
+GATGGTGGATATCGTGGCCCGAGTAATCAACGAAGACGATGAACGGTTCTTAACCTTTAA
+AACCAGTGAGGTAGAGTTTGGTGGTGGTAGACTTACACTCATTGCTAAAAAAATACCCTT
+GGAATATGAATCATTTGTCAAACTATATGAGGCTGTGCAGAACTCGGTTCCAGCCAGCGA
+GACAAAGACCCGTCGAGAACGGAAGAGTAAGGACGCAATGGAAGAAGAGGTTACCCAACA
+AGCAACTATTGAAACACCAGAGGAAACCGTATCTGATGAACCCAGCCTGAAGGTTGAGCC
+AACCCAAGGTCTAGAAACACCTTCGCTCAGTGAACCTCCGAAACGATCCCGCCGTACCAG
+AACACAACAATAAAAGGAGATGGATTATTCATGGCAACAATATGGGAAAAATTCGACAAA
+GCAATTGATACAAAGGCACTCAAGGAAGACGTGTTAGCCGCACAAGAAAACAAGCAAGAA
+TATCGGGATGTTCCGAAGGGCCATTATGAAGTGAAAATAGAAAAACTGGAACTTGTCGAA
+TCGAAAACGAGTAAGCCGATGGTGGCCTGCTGGATGAAAATTCTGAGTGGAGAGTACAAG
+GGACAATTAATATTCTACAACCAAGTTATTCATGTTGGGTTTGGCATTCACAAGGCCACT
+GAGTTTCTGCGTTCCTTAGATAGTGGTATTGAAGTTACCTTCGATAATTACAAACAGTTT
+TATGAATTGCTTCTGAATATCTTAGAGGTGATTGAGAACAAATTCGAATATGAAGTTGAT
+TATGGGGAAGACAAGAAAGGCTATGGCACCTACGTGATTAAGGAAGTCTTTGAAGTTTAA
+CAACATGATTAGGGGATTCGCAAGAGTCCCCTTTTTCTAAAGATACGAAGAGAAGAATAC
+CGCTCAGGGGTATAACAGAAATAATAGGGGGTATAGGCATCGTGAATAGTCAACAAAAGC
+TGAGTAAAACCTCTAAAAAAAATCGAGAAGAACATTTTGATCAACGAAATCACGAGGGGT
+ATTTTGATCTTACAGCATTCCTTGCTTTAGAGAGAATAATCGATCAAAACAGACGGCAAC
+CGAGGCCTGTCCCAACGAGGCAATCCAAATGATCTTCTTCGATGCCGAAGTCTTCCGCTA
+CGATTGGTTGTTTGTGTTCATGAATACAGATACCCAAGTAACGACTGTCATCGTGAACGA
+CCCGGAGAAACTCAAACAACTTTACGAACAATACAATAATAACGTCTGGGTCGGATTTAA
+CAGCCGACATTATGACCAGTATATTTTTAAAGCGATCCTCTGTGATTTTGATCCATATGA
+AGTGTCACAGTGGATTATTTCAAATAGACAAGGTGGCTGGGGGTATAGTGGAGCCTTTCG
+GAAACTACCGTTTTATACCTTTGATGTCATGACGACTCGCTATCACGGATTAAAGCAACT
+TGAGGGGTTTATGGGGAACGACATCCAGGAATCCGATGTGTCGTTTGATATCGACCGTAA
+ACTCAGTTCAGAAGAGCTGGAAAGTGTCATTCAATACTGTCGGCACGATGTTGAGCAAAC
+GATCGAAGTATTTTTGAACCGAATAGAAGAGTTCGAGTCTCAAATGGCCCTCATAAAATC
+CTTCAAACTCCCACTGAGTTATATCAGTAAAACGAAAGCCCAATTAACCGCCGCTGTTTT
+AGAAGCCGTAAAGGTCGATCGTAATGAAGAGTTTGATATTGTCCTGCCGGACACTCTGAA
+AATCCAAAAATACCGGCACATCACAAACTGGTATATGAAACCGGAAAATCGGGATTATGA
+GAAACAGCTCGAGGTAGATATAGCCGGAGTCCCCCATGTTTTTGGCTGGGGTGGGCTGCA
+TGGAGCGATACCAAACTACCAGGGCGAAGGGATCTATCTGAATGTCGATGTGGCCTCATT
+TTACCCGGCAATTATGATTGAGTACGATTTTCTTTCCCGCAATGTGGCTGACTCCACCAA
+ATATCGTCAGATTCGGGATGAACGTTTAAGGCTTAAGGCTCAGAAAAACCCCATGGCCAA
+CCCCTTGAAAATTGTCTTGAACAGTACGTTTGGGGCCTCCAAGGATAAATACAATCAGCT
+CTATGATCCTAGGCAGGCCAATAACGTCTGTGTTGGCGGACAGTTATTACTGTTGGATCT
+TATCGAGCATTTGGAAGGTTCTTGTAAGCTGATCCAATCAAACACCGATGGATTGTTTCT
+TCAGGTTCGGAGGGAGCGAGACGTTGACCGAGTTAGAGCCATTTGTGCGGAATGGGAGCA
+GCGCACGAGAATGGTCTTGGAGTTTGATGAGTTTGAGCGAATTTTCCAGAAGGACGTTAA
+CAATTATATCGTCATCCAAAACAACGGCAGTTATAAATCCAAAGGCGCTTACGTCAAAAA
+ACTCGACATTTTAGATTATGATCTTGCCATCGTCAATAAAGCCATCGTGAACTATTTCAT
+TCATAACATTCCCGTCGAGCAGACCGTAATGGCGGCGGAAAAACTCATCGATTTTCAGAA
+AATCGTTAAAGTCAGTGAGAAATACACGTATGCCACCCATGGAAATGAGCGAAGGCCGGA
+AAAAGTGCTCAGAGTTTTTGCGTCAAAAGTTAGGACGGACCCAGGAGTTTTTAAAAGGAA
+GCAAGTGAGGGATGATTTCAGGATTGAGAAGATAGCAAATACGCCTGAGCGATGTTTCAT
+CATGAATCATGATATTAACGATGTCGAGATTCCAAGAAAACTGGATCGGAGATGGTATAT
+CGATCTAGCGAAGAAACGGATTGAAGATTTTTTTGGTCATTAAATATCAGTACGGAATTT
+AAACTTAGTGGAGGTTCCTCCCAAAATAAACCCTATTTAGATTAAAAACTGGAGGAAAAA
+CCTCCAACTGAAACTTATCACCCTTCGAAATATGTAGATATTCACTTAAAAAGTGGAGGT
+TGAACCTCCAGAAAATCGCTTCTCAAATGACAAAAAATTGGAGGTTAGAATGGAGTTTTA
+CAAAGGGTATATCCCTACAAGAAATAAAAAACCACTTAAAGAGTTTAAAGACGGCAATAA
+TTTTATAGTTCTTGACTGGGCTAGGAAACTCGACGAATATGCCGGAGTGCTTGCTGAGGG
+AGTCATTCTCATCGATATAGACGACATGGAAAGTTCTGATATCGTCTTACGAATCCTCGA
+TGACCTTAGTATCCAAACCCTTGTTATTGGAACGACCCGAGGAAAACACTTCTTATTTAA
+TAACACCGATGTGACCACTAACAAGACCCACACGAATACTGCTATTGGTATAACCGTAGA
+TATCAAGCTTGGCTCAAGGAACTCTTATCACATTTTAAAGTTTGATGGAGTCAAAAGACC
+TGTTCTTCGTAAAGCTGATGAATTGGCAGAACTTCCAAAGTGGTTGCTGCCCGTTAAGAG
+TAGCATTAGTTTCTCTATCTTGGAAGAAGGGGATGGACGGAACCAAGCCTTGTTCAATTA
+CATCCTTACTCTGCAATCCGAGGGATTTAATAAAAATGAGATCATTGAAACGATCGGGAT
+CATCAATAAATATGTTCTCAAGGCACCTTTGGAGCAGCGTGAGATTGACACCATATTAAG
+AGATGAAGCCTTTAAGAAAAAATCCTTCTTTACTAAACAAGGATTTCAGCATCAAGACTT
+TGCTAAGTATCTGGTGCGAGAAGAACACATTGTCTGGATCAATAACGTGTTGCACATTTA
+TAAGGACGGAATTTACTCTGACAAGCAACGAGACCTAGAAATCGCGATGATCCGCCATAT
+CCCAGAGCTCACTCAATCTCGGCGAAGAGAAGTCTTGACCTATTTAGAACTTGTTGCAGA
+CCATGTGGAAATGTCACCGCCTAATTTTATCGCCCTAGGTAATGGCATCTACGATCTAGA
+GATGGACGAACTTCGGGAATACTGTCCCGAGATTGTGATCAAGAACCGGATTTCCGTTAA
+TTATGAACCGGAAACCTATGATGAAACCGTGGACAAGACCCTAAGTAATATCTGCTGTCA
+AGATACGGAACTTAGGATCCACTTAGAAGAAGTCATCGGGTACTTGTTACTGCGCAGAAA
+CGAGTTAGGGAAATTTTTTGTTTTAACAGGTTCAGGATCCAACGGTAAATCCACATTCAT
+TGATATGCTCAAGTATTTTCTCAAGCCGGAAAACTACTCAGCCTTAGCTCTTGGAGAACT
+TGGTCAACGGTTTAAAACGGCAGAAGTGTTCGGAAAGCTCGCGAATTTGGGAGATGATAT
+TTCCGGTAAGTATATCGAAGAAACCGATATCCTAAAGAAACTGGTCACCGGAGAAACGCT
+TAATGTGGAGAGAAAAGGAAAAGATCCCTATGAATTTGAAAGTTACGCCAAATTGATCTT
+CTCAGCCAATGATATGCCTCGGATAAACGATCTTTCAGATGGACTAAAACGTCGATTAGT
+CATTATTCCGTTCAATGCCAAGTTTAGCAGCAGTGATGCGGATTTCGATCCCTTTATTAT
+CGATAAATTGCTCTCGGAGAAGGCCATGAAATATCTGCTGCGAATCGGGATTGTTGGGCT
+CAAGCGCGTACTGGCAGCCAAGGACTTTATCAAACCGGCAGTGGTCAAAAAAGCATTAGC
+TCATTATGAACTTGAGAACAATCCGTTACTTGGGTTTTTAGAAGAACATCCGAAACTCAA
+CAATGAACTGGTCAAAGATGTTTATTTACGATACGACCTATGGTGCCGTCAGTGTAATCT
+CAAACCCTTAAGTCGGCCTATGTTCGGTCGCGAACTGGCTAAATACGGGTATAAAAGTAA
+AACCGTCACCCTCCAGGGTGAAAGCAGCCGAGTTTATGTCATGACAAATCCCCGTAATAA
+ATAAGGAACATGTGTAATCTCTGAAAAGGGCATGGTTCAACGGACTCGGAATTAAAATGA
+CAAAATGACAACGGGTTTCGCTTTCTTATTATAGGAAACTTACGAAAACAAGAGTGCTCT
+CGCGCATTAGATAGTAATTATAGTGTATAGAGATTAATATAATACATCTTTGCAAGTATC
+ATGCCACGTTCAAAGTCCGCTAAAATCAAGGGCTCTGGTGATTGGAAGAAGATGGGGATT
+AGACGTTTAGGGGCAAATCATCTGTAATTTTTCTGTAATTTATGTGTCATTTGTTGTCAT
+TGAATCAGATGCATTAAAACGTATGACCAGATATGAATTTTATTGCCGTAGCAATCGTGA
+CAGGTAACAGTATCATCCAACTGCCAAAGAAGGCTAAATCACAATCCATAATAAGCAAAC
+CCTCCTTCGTTCGATTTTGCTTATTATTACCAAGATGTAGAAATAGTTGCATACCGAGTA
+ACAAAAGTAATCGGTAGAGAAAGGGAGGGATTAGTAATGAGGATTCGAAGCAACAACGTT
+AGAGCGGCCTTCATTTTTGAAGAACTCGAACGAGCCAACCAAATTTATGGGACAAGCTTT
+CATTCTCCTCATGAAGGCTATGCCGTGATGTTAGAAGAGATGGATGAACTCTTTGAAGAA
+ATCAAGAAAAAGAATCCCGACAAAGATAAGTTGATGGAAGAAGCCGTACAGATTGGCGCT
+ATGGCCATCAAGTTTATTCAGTCTCTGGAACACTGGCCTTGGTTGGATTTAAAAATGAGT
+GCCCATGAATTGAAATGCCTGCAGTGTCGGTACGCTGTCCTCACGGCGGATAAACTTGCT
+GAATTAGAAAGTGATCCATGTTTAAGTTGCAATAAACTGTGCCAGTGGAAGCCTTAAAAT
+AACACTGCATATCCACAAAGGTAAAAAGTGGATAAGTATGTTAATAACTGTAAGTTTTTG
+TGGATAATCTTGCTTCACGAAAGGAACTATTTCGGATTCTAAGGAGGAAGCTAATGAATT
+ACATCGAGGAAGCCGAGAATTTGCTCTTATATTATAACGATCTTTATCGGAGCGTGGAGA
+ATTTGAATCGTGAAATTTCCAAATTGATCCGTTACCAAACACCGAGTCCCCTCAACGCGA
+TCCAATTGGAGGAGACGGGTGTTCGGTCCAGTAAGGTCGAAGACACGTATAACATGATGT
+TTAAACTTAAGACGATGGTAGAAAACAAGGAAAAGACCGAATTAGAATTAAAGGAGATCG
+ACCGAATACTCGAGGAATTGAGTCAGGATCCGGGATGTGAGTACTACGGGCAACTTTTAA
+AAGAGTGGTATATTTACGGAACAGCGAAGGAGAAAATAGCGGATCTTATTAAGTCATCCT
+CACGGAATGTGTATCGTATTAAGGATCAAGCTATAAAAAAATTTGCCGTCCGATACTTTG
+GACTTGATGCAATGAGAGTCGTTTAATGTGGCAAAAAGATGGCATACTTTTTTGACTTTG
+GATGTGCTAAACTAGTATCAGAAAGAGAAGACGTTCCGATGGGAGCGTCTTTTTCTTTTG
+GTTACATCACTCATTTGAGAATTATGGCTGCCATACGGCGGCCTTTTTTAGTTAGGAGTG
+GATATGAATAAATGCCAATATTTTTCACCCAACAAACTAGGATGCAGAGTTAATTGCGCT
+AACTGTAAGCGTTGGACTGGTACCGAGTGTAAGATTGAACTGCAACTCTTTAATCGTTAC
+GAGGACACCGTAGAATTTAAATTCTACAATCGCTTGATGCGGGAAAACAAAGGGGTTAAT
+GGTCCGCTATGATGATTAAAGAAGGCGTTTCCGAAAGGGTGCCTTTTTTTAATACACTCC
+TCTCTTTTTATATAAAGCGGTCTTCGGGCCGCATTTTTTAAAACATGTCGCTGATGAGCG
+ACTTTGAATAGACGGAGGTCACCGCAATGCAGAAATTTACGCCGCGGCAAAGCAGCTTTA
+TGGCTAAAACACTACGAGATCTCATTCATGCTTATGGGTTGAGTAAAGAACAATTAGCTG
+GGCTCGCTAAAGCGTTTGGTGTTCAGGAGACCTCCGTCAAAGGAATGGAAGTTGAGTTGA
+TTCGGGCGATGAATGATGGCGAGGACCTGGATTGGAGCAAGAAGAGAAGGTGATGGACTG
+ATGCCGACCAAGCCAAAGCGTCCCTGCTCTTATCCAGGTTGTCCCTGGCTAACAGCAGGA
+CGATACTGTGAGCAGCATCAAAAACAAGTGTCCAAAGAATACGATTTAAGGCGAGGTTCC
+GCAGCTAGTCGTGGTTATGATTCAAGATGGGCTACGACCCGCAAGCGTTACTTGCGCGAG
+CATTCCTTGTGTGTAGAGTGCTTAAAGACCGGCAAACTCACGCCAGCTAATGTTGTCGAT
+CATGTTATTCCTCATAAAGGAGATATGGTTAAGTTCTGGGATGAATCCAATTGGCAAAGT
+TTATGTAAACGGTGTCATGACAGAAAGACGGCAAAAGAGGATGGACGTTGGGGATAGAAA
+ACGAATGGTGATCCAAGGGGTAGGGGCGGTCATAATCTCTACAGCCTTGGCAAATATTAC
+CGGGTGCTTGGTCACACGCGAAATTTCGCGAATTCAAAAGGGGAATAAGAAATCTAAAAG
+CCACATGAGCACTGACGTGTGGCCTTTAAATAGTCAAATTTAAATCAAAGAAGGAATGAT
+ATATGGCTCGTGGAGGAGCACGCAAAAATGCCGGACGACCTAAAAAGCCATTGGATGAAA
+AATTGTTAGAAGGTAATCCCGGTAAACGCCCATTGACGGTTTTGGCCTTTCCGGAGACAG
+TGACCCAAGCAGAAGCTCTGCCACCACCACCCGAGTTTTTGGTGGATCTGGCTAAAGGGG
+TTGGCAGGTGTCCTAATGCTGAAACTATTTTCGAGAATGTCACTACGTGGTTAGAAAGAA
+CTGGTTGCGTTAATCTGATTCCGCCAGAACATGTTACAGAATATAGTTTGCTTAAAGCAC
+GATGGTTGGAATGTGAAGCCATGAACGCTAAACACGGCCTACTTGCCAAACATCCCACCT
+CCGGACAACCGATTGCCTCGCCTTATGTTCGCATGAGTATTGATTATTTGAAAGCCGCTG
+ATTCAGCATGGTCACGTATTTGGAATGTGGTCAGTCAAAATAGTCAGAAGGAATTTAGAG
+CGAATAGCCCTCATGAGGATGCCATGGAAAAATTATTAAGTGGCAGGTAAATCAATCAAA
+GTTTAAAAATATTGCACGCTGATCAAGCGTGCTTTTCATATTGGGAGGAACTATGGATAT
+TCAGAAAATACCTGCCGAAAAACTAAATCCAGCGAAATACAACCCTCGTAAAAACTTAAA
+ACCGGGTGATACGGATTATGAAAAGCTTCGCCGCTCAATCGAAGAGTTTGGTTATGTAGA
+ACCCGTCATATGGAACAAGCAAACCGGCAACATCGTAGGAGGCCATCAACGCTATAAAAT
+ATTGACAGAACAAGGTGTCAAAGACATTGACTGTGTTGTGGTTGATATGGATGAGCAGCA
+TGAAAAGGCTTTAAACATTGCACTGAATAAGGTAGCCGGTGAATGGGATATGCCGCTACT
+TACGGATTTATTGAAGGACCTAGATGAGTCCGGCTTTGAGGTTTCCTTAACCGGTTTTGA
+AGCAGAGGAACTGGATGAGTTGTTTGGAAACTCAGGCACTGAAGGATCTCAAGAGGTTGA
+AGAAGACGACTTTGACACGGATGCTGCTGTTGCCAAAATTGAAACTCCGATCAGCCAGCG
+TGGGGATATTTGGCAATTGGGTAAGCATAGACTGATGTGCGGGGATTCGACCTTAAGTGA
+AGATATGGCTAAACTGATGGACGGACAGCAGTGTGACCTTGTTCTGACAGATCCTCCCTA
+TAATGTCGACTACCAAGGGGCTACCAAGGATAAGTTGAAAATCCAAAATGACAAGATGGA
+AGACGATAAGTTCCTAGCGTTTCTAACCGATGCATTTACCCAGATGTATGAGCATTCCAA
+AAAGGGTGCTGCGATTTATGTATTTCATGCCGATAGCGAAGGTTACAATTTCAGAGCTGC
+TTTTAAGCATGCAGGTTATACTTTGCGTCAATGCCTAGTGTGGGTAAAGAACTCCATGGT
+GTTAGGTCGCCAGGACTATCAATGGAGGCACGAGCCCATTCTCTACGGCTGGAAAGACGG
+AGCAAGCCATAGTTGGTACTCAGACCGTAAGCAAACAACGGTTGTAGAATTTGATAAACC
+TCATAGAAATAGTACTCATCCAACAATTAAACCCCTAGGCTTAGTTGGATATTATATAGA
+AAACTCTAGCAAGGCTGGAGATTTAGTACTCGATCCCTTTTCAGGGAGTTTTTCAACGGG
+GATAGCATGCGAACAAACTCATAGGATTTGTTATGGTATGGAAATGGACCCCAAGTATGT
+GGATGTATGTGCTTCGAGGTATATCGAGCATAAAGGCGGGAGCGATGATGTTTATCTGAT
+TCGTAATGGTGAGAAGGTAGCCTGGAAGGATATAAAACAAGTATAACTTAGGAGCGTAAA
+ACGGATATGTCCGGCTGAACGCTCTTTTTTATTTCGTAATAAATGAAGGATGTGATCATC
+TGCGAGATTTAAGAAATCAAAAATTTGGAAATCTGACAGTAAAAGCTGAAGTTGGTCGAG
+ATAAAGGTGGTCGTGTTCTTTGGTTATGTCTATGTGACTGTGGCAGAGATCATATTGCCA
+GAGGAACTGCGTTAACATCGAAAAATACAAAGACATGTGGTAAATGTAACTCGGTAACTT
+ATAGATTATCAGAAGACGGTGACCACATGGTAATGACATTTTCGAATGGAACTGAGCTTC
+TAATTGATTCTGAGGAAGGAAAAAGAGTAAAATCGTACAACTGGTTTCTTAATGAGAAAG
+GTTATGCATGGGCTAAGATTAATGGACAGCGAATTAGACTCCATCGGTTTCTCATAAATG
+CTCCAGCCGATCTCCAGGTGGATCATATCAATAATATAAAAGTTGATAATCGAAAATCTA
+ATCTAAGGCTTGCAACTAATAAAGAAAATAGACGAAATGAAGGACTTCGGAAAAGTAACA
+GTACTGGGGCTAAAGGTGTCAATTTTGATAAGCGTCGTAAAAAATATAGGGCTTATATTA
+CAGTTGATGGTAGATATATTCATCTTGGATACTATTCCACAATAGAAAAAGCATCCATTG
+CATACGATCACTCCGCAGAGCAATATTTCGACGAATTCGCTCGCCCAAATGATCTCACAA
+CAAAGACCCCCGAGCTGGTGTCATTTTTATTTTCCGGCAAAGAAAAAGAACTTGATTTAT
+CAGCCCGGTAGAGTGATGAATGTACACAACCAAAAATGAAAGGTTGTGTACTCATGGTAA
+ACGAACTCAGAAACTACAAAGTCAGACATGTGGGTGGTCGCGAACGGATTGTTCCAGCTA
+AAAATGGAACGGAAGCCAAACGCCAGGCTTGCAGATTTTGGGGCTATAAACCGAACGATT
+ATTGGCTTGGCATTACTGCCTGCTCAGCAAACCTCATTCCTGCCGGAAAGGTGGGGTGAG
+CCATGACGAACGAAACCTTCACCTTAACATTTAAAGTCACAGGACTAGAACGTAAGCAGA
+TTGCCTGTATTATTGGTGAAGCTGTCGGGCAGGATATTAGCTACGCAGGTGCTCCAAGTT
+TTTTCTACAGGGCTGGCGATTGGACGATTGACCGGGACAGCGTTATTACTTCCCCAGAAA
+CACCACTCCATGATAAAGACAATCTTCGGAAAATACTTGCTGCTTTGAAAGCTGTTGGGG
+TAATTGCCGAAGGAGACGGAACCGTCACACTTCCACTCGATGGACATTCTGGAAACACTT
+TGAGAAACGCGATTAATCTTATTTGGTGTAAGCAGAGTCTATTAAAAAAATCCTTTGATC
+GGCAGACCGACATGGTACCAGAAAGTCTTGTAGGTGTAATCAACGCCGTGCCGATTGATA
+CCATGGAAGAGTTTGCCGAGGTCGTAAACAATGGCATTGACCAAGGAACCATCATTGGCG
+ACAGCAACTTGGATTTCGACCTGGCAGAACAAACGGTAAGTTTTAGCTTCATGAATGCCA
+CCTTGGAATTTGACGAAGTTCTTGCTTTTATAACCTTTTGCCATAAGCTCAGCGTACAAT
+CGAAACTGCAAAAGTTTAGCTCAACAAAGCAAAAAGAAGCTGTTAATGAAAAATACGCCA
+TGCGCTGCTTCCTTTTAAAATTAGGATTTATTACAGAAGAATTCAAAACCGAGCGCAAGA
+TTCTTCTTCAAAAATTAGATGGGAACGCCGCTTTTCGTACGATTGAGGCACAGCAGGCAG
+CGGAGTCAAAGCGTAAAACAAAACAGGAGGCGAGTTAATGATTAACCAACGAGAAAAAGA
+CAAAATTTTGAGTCAGGAACGATGTTCTCGTTGTGGCAGTCCATTGACGATCCGAACAAT
+GTCGAAAATGAATATAGATATCGTATGTATGGACTGCGCGGAAGCTGAAAAAAGCCATCC
+CCGCTACCAGGAAGCTGCCGATGCCGAACTCGAACAAGTCAAAGCCGGAAACTACAATTA
+CTCAGGTCTGTTTGCTGGTGAGAAATACCCGTTCTAATATTGGTCAAAAATAAAAGACAG
+CCCGGAAAGTTCTTTTAAAAATCAAAATCCAAACGCTGCCTATCGTACAATCTAGGCACA
+ACAGGCTAGAGATGTTCCTTTATTGCCGCCATAGGATATTGAAAATCACTGGGAGGATAA
+TGAGGGTTAAGAGGACAAACAAAAAAATCTGAGCGATTGGATGAGCCCAGTTAACAGTCC
+TTCCTGCTATGGGCCACATTCTGAAGGCTTCATGGATATAAGCTTTAGGGACAAACAAGT
+TTCCATCTTCTTCGTTATAGTAAATTAGGGAGTTGTTATGTGTCCTTCGAAAATCGTCAA
+CTTCCTCATCCGTCCATTTTCGTTTGGCCATATCTAACCCTCCTTTTCCAATCACTGATA
+TAAAAATATTTTACCATAATTTAGTAATGTAATAAAACAACAAAGATTGGGTCGATTTAT
+AAGGTTTTAAGTTACCCAGATTCTCGGTAAGAAATTTGTAGAATATTGTAGTATAATTAG
+CCTAAAAGACATTAGGGGAGAATGATATGCAGTTAATTAACCGAGAAGACGAAGATGAAA
+TTAAGGTTGTAATCCATGAATTCTTAATGACAAGTCAGGTTAATTCGCAGGAAAGTATCC
+CCATTGAGTTATTAAAATATCTACGTAAAGCGGACAAGAAGATTGAAGACGGTCTCTTGC
+TTAATGAACTATGTGATTTAATCGAACAGAAACTTCGCAATAGTAATTCGCGTTAAGGTT
+TAACTTTAATTAGAATATTAATTTTACCAAGGAACTTCGTAAGAGGTTCCTTTTTTGGTT
+GCCCTATTTACTATGAAAGGAGGCTGCTACCATTGGTAAGAAAACCGAGCCGTACTTGGA
+TAAGGCTAAAGCCGAACATGCCATTCAATTCATCAACCTGCTAAAACACACCAAAGGTGA
+ATGGTATGGGCAGCCCTTTAACCTGATCCCTTGGCAGGAGACCATTATCCAAGATATTTT
+TGGGACCATGAAAGCGAATGGTTACCGGCAATATAATACGGCATACATTGAAATTCCTAA
+AAAGATGGGAAAAAGTGAACTGGCGGCAGGTATTGCCTTACTTCTGACCTGTGGCGACTT
+TGAACATGGCGGTGAGATCTACGGCTGTGCAGCCGACAGACAACAAGCCTCCATTGTTTT
+TGATGTTGCCGTTGAAATGGTTGAACAGTGCCAAGCCTTGAAGAGCCGGATTAAGCCCGT
+ACTTTCTCAGAAACGTTTGGTTTATAAACCGCTTAATAGTTTTTATCAGGTGCTATCAGC
+GGAGTCGTATACAAAACATGGCTTGAATGTTCATGGCGTTGTTTTTGATGAATTGCATAT
+TCAGCCCAACCGAGATCTTTATGATGTCATGACGCACGGTTCCGGTGATGCCAGAAAGCA
+GCCGCTGTATTTTCTGATTACCACTGCGGGAACCGATCGTCATAGTATCTGCTGGGAGGT
+TCACCAAAAGGCTGAGGACATTCTACAGGGCCGTAAAGTCGATCCGTCCTTTTACCCAGT
+GATTTATGGTGCGGACGATGATGATGACTGGACGGATCCTAAAGTATGGGCCAAAGCGAA
+CCCGTCACTCGGTATCACCGTTGATATTGAGAAATTACAAATTGCTTGCGAAAATGCCAA
+GCAAAACCCTGCCGAAGAAAACTTATTTCGCCAACTTAGATTAAACCAGTGGGTCAAACA
+ATCTATTCGCTGGATGCCCATGGAGAAATGGGACCATTGCGCCTTCCCAGTTAACTTGGA
+AAGCCTAAAAGGCCGGGAGTGCTATGCAGGACTAGACCTCTCCAGCACGACGGACATTAC
+AGCGTTTGTCTTGGTTTTTCCGCCAGAATATGAAGGCGATAAATACCAAGTGGTGCCTTT
+CTTTTGGCTGCCAGAAGATAATCTGGATCTAAGAGTGCGCCGTGACCACGTTCCCTATGA
+TACTTGGGAAAAGCAAGGCTTCCTAAAGACTACAGAAGGGAACGTTGTCCACTACGGATT
+TATAGAAACCTTCATCGAAGAACTTGGCAAGAATTACAACATTAAAGAAATCGCCTTCGA
+CCGCTGGGGAGCCGTCCAGATGACGCAGAACCTTGAGGGCCTTGGCTTTACCGTGGTTCC
+TTTTGGTCAGGGCTATAAAGATATGTCTCCTTCCAGTAAAGAACTCATGAAGCTGACCTT
+GGAAGGAAAACTGGCCCACTCCGGCCACCCGGTACTTCGCTGGATGATGGATAATATCTA
+CGTTAAAACTGACCCGGCGGGTAATATCAAACCGGACAAAGAAAAGAGCACCGAGCGCAT
+TGATGGTGCCGTCGCTTTAATTATGGCCTTAGACCGTGCGCTCCGCCATGAAAACAATGA
+CTCAAGCGATGTGTACAACCAGCGAGGAATGCGCAGTCTGTAAGAGGGAGGTGAGACAGT
+ATTAAACTCTTCCAACGAGCCAAATTCTTCTTCGGCCAAGGCTTCGATGACTATATCCAG
+CGTTTCTTACTCGGGGATGATGTCAGCGACTTAGACTATCCCGGTCAAATGGATGCCAAA
+ACAGCCATGAACTATTCGGCAGTTTTTTCGTGTGTTCGGGTCCTTGCTGAAGCCTTGGCC
+GGAACTCCAATTATGCTTTACCGCAAAAAAGAAACCGGCGAACGTGAAGTCCGTAATGAC
+TTAAGTGTTTACGACATTTTGCATAACCAACCCAATGTAGAAATGTCGCCGTTTAATTTC
+AAAGAAATGTGTATGGTCTCTCTGAACCTGGGAGGTAATTCTGTCAGCCAAAAGTTGGTC
+AACAAATATGGCGATTTAGTTGGGCTTTATCCCTATGAATGGCCCAAGGTCGATATCACC
+AGAGATCCAATCACTAATAAGTTAGTCTATAAAATCCGGGATATTAACGGCGGCAAACAA
+CTGAATTTAGCACGGGATCAGGTTTTCCACATTCCGGGTTTGAGTATGGACGGAGTAGTG
+GGAGTGTCGCCCATTGAGTATCTTTCCTCAGCCATTCGCTTGGGCCTTTCTTATGAACGG
+TTCGGGGTTAATTTCTATAAAAACGGAGCGAACTCATCCGGAGTGATTGAGTACCCCGGA
+GCCTTGGCTGACACGGCTTATGAGCGTTTAAAGAAGGACTTTGCTAAAAGTTATCAGGGA
+CTGGCTAATACCGGAAAGCCCATCATCTTAGAAGGCGGGGCGAAGTTCAGTCAGCTCGCT
+ATTAAACCTGCCGATGCCCAACTCATTGAAAATAAGAAATTCCAGCTGGAAGACATCGCC
+CGTATTTACCGCGTACCCCTTCACTTGATCCAAAACTTAGATGGAGCGACATTTTCAAAT
+ATCGAACAACAAAGTCTAGAATTTGTCATGTATACGATGTTGCCTTGGTTTAAGCGCTGG
+GAGGAAAATGTTAATATGCAGCTTTTGACACCTCTGGAACGCAAAGCAGGGTTTTATTTG
+GAGTTTAATATTTCATCGCTTCTCCGGGGTGACATGCAAAGCCGGGCGATGGCTTATGCC
+CAAGGTAGACAGTGGGGCTGGTTATCCGTGAACGATATCCGAAAGCTTGAAAATATGCCG
+CCGATTCCTAACGGAGATATTTATATGATGCCGCTGAACTTTACCGAAGCTGGAAAAGCA
+CCCTCTACAACGGAGTCGGCGGTGCCGGAAGCCTTGGCAGAAGAGACTTACAAGATGATG
+ACAAGGAGGTGATGACCATAAAACCCTTTTGGAAATTTCAAGCAAAAAATGAAGCTCCCT
+TGATCGGTGAACTTTTGCTTTATGGGGATATCTCCAGTACCACTTGGTGGGGTGATGAAG
+TGACCCCTGTGGCATTTGCACAGGACCTTAAAAATCTCGGAGATATTTCACAGCTTAACA
+TTTATATCAACAGTGGCGGCGGAGATGTGTTCGCGGGTCAAGCGATCTATTCCATGCTCA
+AACGTCACCCAGCACAGAAAAATGTCTATATTGATGGTCTGGCCGCCAGCATCGCCTCTG
+TTATCGCGATGGCTGGCGATGTTGTTTTTATGCCGAAAAACGCCATGCTCATGATCCATA
+AAGCCTGGACCATGGCCATTGGCAACGCCAACGATCTTCGTAAATTGGCTGATGATATGG
+ACAAAATTGACGAAAGTATACTTACAACCTACCAAGCGAAAACGGGCTTAGATCCCGAAA
+CTATTACAGAAATGGTTAATGCTGAAACATGGCTGACAGCCGATGAAGCCGTAAAACTTG
+GTTTTGCTGATGTGATTGAAGATAGCAAGCAAGTTTCAGCATCCATTGCCGATGGTCAGC
+TTATGGTTAATGGTCAAACCATGGACTTAAGCCGGTTCCGTAAGACTCCGCAGTTCGTTA
+ACAAAGGAGATCAACCCCAGGTTCCCCAAGATCCAAGGATACCTACGTTAGAAGAACCAA
+ACGAAGAGCTGAAGGAAGAACCAAATAACCAGGCAGTGGAAAGCAAAGTAGCCGCACCAC
+TGCCTATTCGTTTGCCCGAGTTACGAAACTCCGGTCGAACAATATCCTCCACCAACGAAG
+CTCTGATCCGCCAAGCCATGGATTGTCTGGCTGAAGTCTTAGGTCAACTGGACAACTCAG
+ACGAACAACCTGACGGCGATGACATGGGCATGGATGGCGACGGAATGGGAACGGACGCCC
+CTGAAACAAATGGGGAAGAGAATCTTGGAGAGGACGATGAGGACGTTGGACTCTTTGGTG
+TTTCCCTCTGCCAAGCACAATTAAATTTAACAAGAAGGAGACTCGATTATGGATTTTAAA
+GCTCTACTCAAACAAAAACTTGATGCCCAGCAAACCCTCATTGATGCAGCGATGGTCAGT
+GGAACAGGATTTAGTGCTGAACAGCAAACCCAGTTTGATACTTTGCAAGCAGAGATTGTA
+AATCTGGAAAATACCATTAAAGCCGCTGCAGAATTGGAAGCTCGCCAGAAAGAAATGACG
+AACCCAGTCAATCAGCCGCTCTATCCTGAACCCAAAGCCAAAAAGGAGAAATTCGCATCC
+TTTGGTGAGCAACTGCGTGCTGTGATTGAAGCTGCAAGACCGGGCGGTTCTATGGACAAT
+CGGTTATCCATCAAAGCCGCTGCTGGGCTCAATGAAAACGTGGGCAGCGATGGCGGGTTC
+TTAGTGGATGATGACTTTTCGAAAGAGATCCTAAAGAGGGCTTATGACACAGGCATTTTG
+GCCAGTCGCTGTAATAAAGTGCCGCTGAGTACCAATGCCACGGGACTAAAAATAAATGCC
+ATTGATGAAAGCAGCCGAGCCAACGGTTCCCGTTGGGGTGGAATTCAAGCTTACTGGGAA
+GGTGAATCCGACCAACTTTTAGGCAGCAAACCAAAGTTCCGACAAATGGAACTGAACCTT
+CATAAACTGACGGGACTATGTTATGCAACGGATGAACTACTGACGGATGCCACTGCCTTG
+GAATCGGTGATTTCTCAGGGGTTTGCGGAAGAATTTGGTTTTAAAATGGACGATGGCATT
+ATTAATGGGACTGGAGCTGGGATGCCTTTGGGGATCATGAATAGTAAAGCTTTAGTAACA
+GTACCCAAAGAAAACAGTCAAGCTTCAGGTACCATTAACATTCAAAATATCGTTAAAATG
+TGGTCACGATGTTGGGGTCAATCTCGCCAAAACGCCGTATGGTTCATTAATCAGGATATT
+GAACCTCAGCTCTACACGATGGCTTTATCCGTTGGGACAGGCGGTATTCCTGTCTATATG
+CCAGCGGGAGGGATTTCCGGTTCACCTTACAGCACACTGTATGGTCGTCCAGTCATTCCC
+TTGGAGCAGTGCCAAACGCTGGGTACTGTCGGTGACATTGTACTGGCGGATTTGTCGCAG
+TACCTGATCATCGACAAGGGTGGTCTTAGCGCAGCCTCTTCCATCCATGTTCGTTTTTTG
+TATGATGAGAACTGTTTCCGGTTTATTTACCGCGTGGATGGACAGCCTGTGTGGAACACA
+GTTTTAACTCCGGCACGTGGATCGAACACACTATCACCGTTCGTCGCATTGCAAACACGC
+TAATCATTTTTTATTGAAGCAGGAGGTTAAAAACTTATGTGTTGTATTCCCGAAAAAGAT
+AAACCCCTTGAAGCTATCACTCCACAGGCTGGCGGTGCTATTACCGGAGTCTATGTAACC
+CTGCGGGATGCTGAAGATTGTTATGTTCTGGTCCATATTAATCAGGCAGTCGCGACAGCC
+GTGGATATAACAATTGAACAAGCCACTGACGTTGAAGGCACCGGCAGTAAAGTCATAACC
+ACTGCCGTTCCTATTTGGGCAGATCAAGATTGCGCCTCTTCTGATGCCTTGCTTCGACAA
+CCGGATGCAGTAGCCTTCACTACTTCAGCTACCCTTGCTCATAAACTGGTTGTCTTTCAG
+ATAAACCCGTCTCACTTAGATGTAACAAACGGCTTTGACTGCATCACCGTCAAAACGGCG
+GCTTCCGACCCGACCAATATTACCGCCGCCCAGTATATCCTCAGCGATCTGCGCTTTGGT
+GGTTCAACTCCACCTACAGATATCACGGACTAATTCTTGTAACTGATTAGATAGGGAGGC
+AGCCTTGCCTTCCTATTTAAATAATCAATACGGAAAGGATGGATGCTGTGAACTTAGTCC
+AAACAGTACCTCCAGCCGTTGAACCTTTGAGTCTTCAGGAAGTGAAGGATTATCTCCGAG
+TCGATGATGATACCGATACCTCAGAAGATCAATACCTAGGCGCCTTAATCACTGCCGCCC
+GGGAGTACTGTGAAAGCTTCCAAAACCGCGCCTATATTACGCAGACTTGGCAGATGAGCT
+TTGATTACTGGCCCAGTTATGCCATCAATATTCCGCGTGGAAATCTGCAGAGAATAACTT
+CTGTTTCTTATAAAAATTCATCGGGCGTTGTAACAACCCTGACAGAAACTCTCCAATATG
+TTGTCAGTACACGCGGAGTTTTAGGCCGAATATCACCGCCTTACGCTCAGCCCTGGCCGC
+CTTTTATCCCATTTCCCTTGGATGCCGTTGTGATTGAGTTTGTCTGCGGATATGGTGATA
+CGGAGGAGAGTGTGCCGGAAAAAGTGAAGCAGGCCATGAAATTGTTGGTCAATCATTGGT
+ACGAGAATAGGACTCCTCTCACAGAGTTAAAGCAAGCTCCGGCAGAGATCGCGTTTACAG
+TATCTGCTTTATTATGGCAAGACAGAATCGTGGTGGCATAAGGTTGGTGGCTAAAAATGA
+ATCCAGGCATACTGCGGCATAAGATTAATATCCTGACCACAACGGAAGGAACCAATGAAG
+CAGGAGATACCATTCTCATTCCATCGGTATATAAAACTGTGTGGGCCAGCGTCTCTCCGG
+TCTCAGGTAAAGATTATCTTGAAGCGAAAAAGCTCCAAGCTGAACTGACCTATAAATTTA
+TCCTTCGTTACACTTCAGGGGTAACGCCGGACATGCAAATTGAGTTTAAAGGGCGAATTT
+TTCTCATTCAGGATATCCTTAATCCTTTAGAAATTAATGAGACTATAGAGATTATGGCCA
+TAGAGAGGGTGATTAAGAATGGCTGATGATTTCGAAATAACCTTTCAGGGTCTTGACCCG
+TTAATGACTCGGCTGAAGGAAGTGAGAGCACGTTATCCCTACAAGGAAGAGGAAATGCTG
+CTGACATTGGGAGCCACCTTAAAGGCCAGTTCTAAGGATAAAACTCCTTTAGGAAAGCAC
+AAAAAACATCTAAGAAATCAATATAAACTTTCTAAGGTTCAGTACAACCGAGATGGTTCC
+TTTATTACTATGACCAACACAAGTTCCCATTTTCATCTGATAGAAAAAGGCCACCAGATT
+GTCGGTAAAAACGGGCAGGAACATGGCTTTGCCCAAGGGCTGCACATGGTTGAAACGTCG
+ATGATCGAACTGGAACAAACCTTACCGGATACACTTGGGGCATGGTTGGACAGTATCTTA
+GGCAGTGTGTAATGGTTACTTTATTAGCCGTCAAGCGGGCCATGAATCAAGTGCTGGCGC
+CTATTGGTCTTAAGATTTACGGAAATGAGGTCAAAGAGGGCTTCTCCAGACCTTGTTTTT
+TTGTGAACCTTGTTCCGGTAAAGAGTGAAATCCTTAAGAAAGACACCCGAGAAAACTCGT
+TGATGGTGGAGATGGTTTATTTTTCAGAGAGTAAAACCGATTTGGAAAATCTCCAAATGT
+ATGACACCCTTCAAGGACTTCTTACGCCTATTCTAGTCATAGGGACCAGAAACCTACTCG
+TCCAGAATTTTCGGGCTGAAGTCATTGATGAGCTAGACCATATTTATTCTGTGAAATTCG
+ACCTGAACTTTTATGATGAAATTGTGGATACCACACCAGAACCCGATCCTATGGAGACAT
+TAACGATTCAGTTAGGAGGTCAATAAAGAATGGGACTTCCCGATATCGAGGTCATTTTTA
+AATCCCTAGCCGTCAGTGCCATTACTAGAGGAGCGCAAGGGATTGTTGCCTTAGTCTTAA
+AAGACTCCGTTCATAATGGATCGAATATTTATACCGATCCAACCAACATCCCGAAGGACT
+ATTCGGCCTACAACCTCAACCAAATCAACTTGGCCTTTCAAGGGGGCGTGCAAACCCCAA
+CCAGTCTGATCGTTTATGTAGAACCGAGTGATGCTGCGGACTATACCGCCGCCATGAACT
+ATTTGGAAACCGTAAAGTGGGATTATGGTGCGGTTCCGGGAATCAGCTCCACGGATGCCC
+AGACGGTGGCAACATGGTTAAAAGCCCTTCGAGATACCAAAGATATTAAAGCCAAAATGG
+TTCTTCCCAACACGGCAGCCGACCATGAAGGAATTATTAACTTTGCGACCGATGGGATTG
+TCTTATCTTCGGGAACGGTGAATGCCACCGATTACTGCAGCCGGATCGCTGGAATATTGG
+CCGGAACTCCTCTTACCATGAGTGCTACATTTCAGGTGCTCCCGGAAGTGATCGATGTAC
+CGCATAACAGCAAAACACAATTTGACACCCTGATTAATGAAGGCCAGCTAGTCTTCATGA
+ACGATGGTGAAAAGGTAAAAATAGCGCGAGCCATCAACAGTTTAGTCACGCTGACACCAA
+CGAAAACGGCGGATTGGCAGAAGTGCAAGATCGTCGATATTATGGATCTTCAGCACAATG
+ACATTATACAAACCTTTAACGATAACTATGTCGGCAAAGTCCCCAACGATTATGACCATA
+AGTGCTTACTCATCACGGCCATCAATGCTTACTTGGAAGGGTTGGAAAACCAAATGCTGC
+TTGATCCCGGTAAAAATAAAGTGAGCCTGGACGTGGAGGCCCAAACCTTATATTTACAGA
+GTAAAGGCATCGACACCAGCACCATGAGTCAGTTAGACATCAAGAAAGCCAACACGGGCT
+CTTTAGTTTTTCTAACCGGTACCGATCGCCCGCTGGATGCTATGGAAGATCTAACCTTAA
+ATCTCTATTTAAACTAGGGAGGTGAAGCATGAATAACTATACTGCAGATCAGGTCCTAAA
+TGGCACTTGGGGAGAGATGTGGCTGAACGGAGATTTCATGGCTGAAACCATCGCCCTGCA
+GGCCAAAGTGACCTTGACCAAAACTGCCGTGGAGATGTGCGGAACCTTAGTGGCGGGGCA
+AAAGGTCACGGGAATGGAACTCAAAGGGACCCTTAAAATGAACAAAGTGAGTTCGGCGAT
+GATTAAAGCCAACTCCGACAATATGAAGGCGGGTAAAACGCCGGAGTTTACCATCATCTC
+CAATCTGGATGATCCGCAGGCCTTGGGCGCTGAACGAATTGTCCTTAAAGGCGTTATGTT
+TGATGAATTGACTCTTGTGGATTGGGAAGCCAAGAAGAATGGGGAAGAAAGTATCCCGTT
+TACCTTTATGGATTGGGATCTCTTAGACTTAATCTAAAAAATCTCTTCCCATTATATAGG
+GCATTAAACTATTGATTTGGAGGTCTTATTGGTGAACTTAGTAGAGCAACTCTTAAAAAT
+GGATGCTGGACTCCTTGAAACCCCTTCGAAGGTAATAACCATCCCATCGAAAAAGCTGAA
+AGAGCCCCTCGATTTTCCCTGTAAAGCCGTGGATCCGGAGAAGTATGCCGAGATCCAGGA
+AGGGGCGGTGGAGATCCGTAAAGGTGATGTTAAGAAAATCAATATGTATTCCTTAAAGAC
+GCTCATTGTGATTGAAGGCTGTCCCGAGGTATTTAAAAGCAAAGAGATTATGGAACATTT
+CGGAGCACCGACCCCTAAAGAGTTGGTCAAAACCCTCTTACTCAGCGGAGAGATCGATGA
+TCTGTATAACGGGATCAATGAGCTTTCTGGTTATGAGAAGGATGCAGAGGACGAAGAAAC
+CATAAAAAACTGATTCAGGGAGATAAAACTGTGCAAACAGCTTATCTCCTTTTTAAGTAC
+AAAAACATGAGTCCCAAAGAGTTCTACGATAAGAAACCCGGTGAGAAGAAAATTCTCCGG
+GCGTTTTTATTTTACGAGTTAGCAGAACGAAATCGGGAGAACAGCTCTTAATAAGGCGGG
+AAGGAGGTAAAAACCATAGCGCGAGTGATTGATGCTGTGATTCAGCTTCGTGACCAATTC
+AGTGGAACTCTTCGGAATGTCAACGCTAATCTCTCAGTCTTTCAACGACAGGCCAGCTAT
+GCCGGAAGAAACATGATGTCGGTCGGTAAGGACTTACAGAGTGTGGGTAAGACGTTTACC
+AAAACACTGACTGTTCCTATTGTTGCGGCGGGTGGAGCACTATTAAAGCTGGGACAGGAC
+TTCCAAGATGCCGAAAACACCATACGAGTTGGCACGGGTGCAACCGGAAAAGATCTTCAA
+AACTTAACGAGTGATTTTAAGGCGACTTACAGTCAGGTGAGTAATAGCATGGCTGACACC
+AGCAAAGTGATTGCTGATTTAAATACAAGAACCGGCTTATCCGGTAAGCCCCTGCAAGCC
+TTGTCCGTTCAAATGCTTAACCTCTCAAAGATCACGAAAGAAGACTTGAATACTTTGATT
+CCAGCGACCACGCGGATGTTTCAGGATGCCGGGCTTAAGCAGGCGGATTATTCGAAGGCA
+CTCGACTATACCTTCAAAGTCAGCCAAAATACCGGTATTTCTGTGTCAAAACTTCAGGAG
+CTGATGACTCAGTTCGGTGGTCCTTTAAGACAAATGGGCTTTAGCTGGCAAACGAGTGCT
+GTCATGCTTGGAAAGTTTGAAAAAGAAGGTGTTAACACTGAGTTGGTTGTCGGGTCCCTT
+CGGATTGCTCTCGGTAAGATGGCTAAGAAAGGGATCGCTGATCCTTCAAAGGCGTTGCAA
+GAAATGATTACCAAGATTAAGGACGCTGGCACAGCTGGAAAGGCAAACGCCATGGCCTTG
+TCGATGTTCGGAGCTAAAGCCGGGCCGGATATGGCAGCCGCTATTCGGGAAGGACACCTG
+GACTTAGACAATCTCCTGCGAACCATTAAGAACAGCCCGGAAACGATCGACCAAGCCACT
+GCCGATACCATGACCTTTGCGGATAAAATGGCGAAAGTAAAAAATCAACTCGCCGTGGCG
+TTTGAGCCGGTGGCTACCAGCCTATTAGATTCTTTAGATAAGCTACTTCCGAGTATCAAA
+AATGTGGGCGATACCATCGCGAAGTTTGCTAAAAGAATTGCGGATATGTCACCTCAGCAA
+CAGGAAATGATTCTCAAGTTTGCGCTTATGGCTGCCGCAGCAGGGCCGGTTATTTTTACG
+GTTGGTAAGCTAGTTTATGGGATGGGTGATGCGGTAAAAACATTTACAAAATTATCTCGT
+TCCATCTCTAATGCAGGCGGGATTTTAGAGTACCTTCAAACTCCAGGCGGCATGGTGATT
+GCCATTATTGGAACTTTAACAATCGCTGGACTATTACTTGTAACCCACTGGGCACAGGTA
+ACAAAGTCCTTGAATGACTTTAAGACGGTTTTGAAAAATAATGAAACAGCCATCCGAAAT
+GTAGCGATAGCCCTTGGCGTTATTTTTGGACCGGCGCTGGTGGGGTTGGGTGTTCAAGCA
+CTCATCACGGGCGGTCAAATCACCGCTGGGTTTATTGCTTCCTTAGTAACCTCAGGAATT
+GAAGCCGCTGCAACCGGAGCCGTTTTTACAGGAAAACTAATCGTTTCTCTCATATCTTTT
+GCCCTTCAAGTCTGGAAAACTGTTGCTGTTATTGGTATTCAGACAACTTTGTTCATTGCT
+CAGAGACTTGGAATTATCAGTGCCGCCGAAGCAACGAATATTATCACAGCCGCCCAATGG
+CTTTTTAATGCCGCCATGAATGCGAACCCGATTGGTGTTGTCATTTTAGCCCTTGCGGCT
+TTAGGGGTGGCTATCTATGAGGTTGTCCAGCATTGGAAAGATATCTGTACTTGGGTTGAA
+AAAGCATGGAACTGGCTGACGAAATGGAATGGAACTCAGCCTCAGGATAAGAGCCTCAAT
+GTTACCACCAACGTGGCAACGTCCGCTGCGACTACGGCCCACAATGCGCTTGGAACCAGT
+TATTTTGGAGGCGGCTCCACTTGGGTAGGGGAGAATGGGCCAGAAATACTCACACTCCCT
+AAAGGTTCTCAAGTCATGGATCATCAAACGTCAAAAAGATCAACAGGGAAGAATATTTCG
+ATCGCCAAGCTCGCCGACACCATCGTTGTCCGGGAAGAAGCCGACATTGATAAGATTGCC
+ACGGCATTGGTGCTTAAGCTTCACTCGGTCGCTATTAACACGGCTTAGGGGGTGACATCC
+ATGGAATTTTGGCTTATGCAGGATAAGGAAACCCTCCAGCTTCCGGTTCCCCCTCCAAGT
+TATACGGTCAAGAAAACTCTGAATAATACTTCTGTGATTGTTGAAAGCATCGGCGAAATT
+AGTTTTATTGGCAAGCCGAAACTCGCTGAAATCCCGCCCATAAGTTCGTTCTTTCCGAAA
+AAGGATTATAGCTTTTGTCAGTATCATACCTTTCCAACGCCCAAAGAATGTACCGACCTT
+ATCGAGAAATGGATGGCCAGCGGTAAGCCGATCCGTTACCTTGTAACTGGGACAAGTATT
+AATACACTTTGCTCCATTGAAAGTTTTGAGTATGGTGAGCAGGATGGGACGGGGGATGTT
+TATTTTACACTGACACTTAAGGAATACAAGGTGATCCCTTCGTGATCAAAATTTACAGTA
+ATTACTTTGGGGGATCGACCGACATTACGATGTTTTGCAAGACCGTGCAGTGGTCCGGCG
+ACAAGTCGCAAGTGGCCCGGAAAATTGACGTAACTTTAGCCTATGCCATTTTTGACAAGA
+CCCAGCCCAATACCCAAATTTCGCCCGGCACCATGGTATGGCTTGTCGATGATGTGGAAG
+GTGAGATTTTTCGAGGTATTGTTTTTGTTCGCTCGCTCAATTCCAACCAGGAACTACAAT
+TCACGGCTTACGACCTTTTGATCTATTTTCTGAAGTCCAAGGCCACCTATAACTTCAAAA
+ACATTACAGCAGAGGCAATAACGGCGAAAGTTTGTCAGGAAGTTGGGGTGAGTGTTGGAA
+GTTTAGAGCCAACCGGTGTGAACATCAGCCTCATAGCCTCGAACAAAACCCTATATGATA
+TCATCATGCAGGCTTACAGCTTCGCGTCGTACTCCACAGGAAAGCAATATTTTCTCCTGA
+TGAATGGAACCAGTCTGAACTGTATTGAAAAGGGTCAAAACCTCATAAATTTTACGCTCG
+ACCCTAAGGTCAATTTAATCAATGCTGTCTATGATGACTCGATCGAACAGATGATTAATA
+AGGTGAAAATTTATAACTCCAAAAAGGAGTTTACCGGGCAAATCCTAGAGAACAAAGACT
+GGGAAAGTCACTACGGAATCCTCCAGGACACGTATACAATTAATAAGTCTAAAAACACCT
+TGATTGAAGCGTCGATCCTCCTTAAAGGGATGGAGCAGGAGGTCGAAGCCACGGCACTCG
+GTAATGTAAACGTCATCACCGGCACCGCCGTGAAAACCAATATTTTTTATGTCAGTGTTC
+TCCAAAACGCCACTTGGTATGTCGATACCGACGTTCACACGTGGGAAATCGGCACGAATA
+AATACACCATGAAGCTTAATCTCAAGAGCCATAATTTAATGGACATGAAGGAAGGTAAGG
+TCGATGGGGAATAGGGAGGCAACATGAGGTCTAAAAATCCATACAGCGAAATGATTAAAA
+TCATGCAGGACCAGGGAGCGAAATACAACCCCTTTTCGGTTCAATTGGCGACGGTGATCG
+CTACATCTCCGCTTACGATTACGGCTGGAGAACTTCAATTAGCCGGGGATAATCTATTAG
+TGGCCGATTTTCTGCTAACCAGTTATTCCCGACAGATTAACCTTCCAAGCCCAACAGTCA
+GTGGTACAACTTCAGATGGCACAATAACAAGTCTCAGCATACCAAATGCCACGCTAAATT
+TCACAGATGGACTCAATGTAGGTGACACTTTAGCCGTAGTTCAGGTCGATAGTTCTACCT
+TTGTTATTTTGGCAAGGGTTGTGAGTGTATGAGCATTTTTCCGCAAAACTTCGAACAGGC
+CCTCATCACATCCAACGGTCTGGGTTCTTCTGAGTTACCTCTGGCGAAAGAGTATGGTTG
+GGACTTTACTAATAACACGTTTCTTCTAATTGACGGCAAGAGTGTGTTGGTAACCGGAAG
+AGATGCCGTTAAGATTTGGGCTTGGAAAGCATTACAGACTCCAAAGGGTGTCTATAAAGC
+CTACAGTCTAAACTTTGGAAACGAACTGGAATCGCTGATGAATCAGAGCCTATCAAACGC
+AGCCATGTCTTCAGAAGTCGAACGGTATTTAAAAGAAGCGCTCTTAGTTAATCCCTATAT
+TACCGGAATCTCTAACATTACACTGTCTATTGATGGTAGTAAAACCAGCGTAGATTTTAC
+GGCAGAGACGATCTATGGTGAGGTGACCATGAGTGTATAGCGAAACCAGTAATGTGATTT
+TAAGTCGCATGCTTTCCAATGTATCCTCAGATGTTGACAAATCCGAGGGTTCTTTTATTT
+ATGATGCAACCTCTCCGGTGGCCATTGAGATTGCTCAGCAAGAGGCCAATCTCGACCAAG
+TAGCCAAGAAGTTTGATATTACAACCTTAAGCGGCGACGAGTTGGCCATGAGAATCTACC
+AACGGACAGGCATTTCCCGAAACCCAGCAACTTATGCCACGGCAGACGTAACCATAACAG
+GTAATGGAATGATTAATACTGGTGATTTGGTTCAAACACCTGGCGGAGTTCAGTTTAAAT
+CAACTCAGCAACAAACCATCAGCGGATCGGCAAGTGTTCATGTTGAAGCCCTCATCGCTG
+GGTCAACAGGCATGGTTCCAGCCAACCAGATCACTCAGTTTCCGGTTGCCATCGCTGGTC
+TTGTGAGCGTCACAAATTCTAATCCGACGCAGGACGGCTTTGACGCAGAAAGCGACTCAG
+CCCTTTTACAAAGGTACTATGATTATATTCAAACTCCGGCAACGGGAGGAAATATTGCTC
+AGTTTATCAACCTCATGAAAGACTTCACGGGAGTCGGTGATGTAAAATTCTATCCAACTT
+GGAACGGAAACAACACTGTAAAACTGGTCATAATTGACGTGAATAAACTGCCTCCCAGCA
+GTGATTTAGTCGCAGCAGCTCAGGCTTATATGGACCCAGGTGCCCAAGGACTCGGGCTGG
+GTGCTGCTCCGTTCGGAGCTTTTACCACAGTGGAAGGTGCATTCGCTAGTACAATAACCA
+TTAATTTTACAGCGGTTAAAGATTCGGATTATACCGATGAACAACGGCTCGCCAATGTCC
+AAGCGAATTTAACAGCTTATCTCCAGGCGATTGCCTTCGTTGATAGTACTGTTAGTTATG
+CCAAGATTGGGTCGGCAATTTTATCGAGCCAAGGGATCTTGGATTATACCAACCTAACGG
+TCAATGGAGGAATTTCTAATGTTCCTCTCAGCTATACCTCGGCACTGACTGAAACGCCGG
+TTCTGGGGGTGGTGACGATTGCTTAGCGATTCTCTTCCTTATTTCATAACGAGCACTCAG
+TTATTTACTGAGTTATTCCAATCTGAAGGGCAAGAACTGGATGGCCTGGGCGCTGATCTA
+TCCGATTTAGAAGCTCAATTTAACGTTGATACGGCAACATGGGGCTTGGATTATTATGAA
+AAAGAACTAGGAATACCCACTGATAACACAAAACCTCTGTCCTATAGGGCCAGTGTTATA
+AAGTCCAAGTGGCGAGGCGGCGGGAAGCTTAACTCCACCTTGATTAAAACCGTCTGTGAT
+GCCTTTACGAATGGAAATACGGAGGTGACGTTTGATGGAACCATTAAGGTCAAGTTCAAT
+AGTATTCTGGGTATACCACCCAATCTCAATGATTTAAAAGCAGCAGTCTCTCAGATTAAG
+CCAGCCTATTTGGAGCTGGTCTATTTGTTTTCCTATCTGTTGATTAACGAAATTCATCAG
+GTAATGACCATCAACCAGTTAGACTCAACCCCACTCAACGAATTTGCCGGAGGTGTTTAG
+ATGGCTAAGACAACGCCGAACTTGGATCTTTATGAAGTTGATCCTGCCTCAGACGGATCG
+CTGACCTTCAACATTCAGACCATGCTCAATGACAACTTTGACAAGATTGACTCAGCCATC
+CCGGCTGCACAGGCAGCAGCTCAGAGCTACACAGACTCCAAGTTTCCTGTTCAAGCTTCT
+GAATTGAGCAATGGTGCTGCCACCGATGCGGTGATTGGAAATCGAACTGGGGACCCAACG
+CTGGCTTCCCCTTCGAGCACCGGAACGATGACTCAACTCTTTGGTTGGTTGATGGGGAGG
+GTCAAGGCGATATCTGGAACGACAAACTGGTATGATCCTCCAGACATAAATCTAGCGGCT
+TTGAGTGCTCATAAATCCAGGCATGCGATAGGCGGCGCTGACGTGTTATTACCTTCAGAT
+ATTGGGGCTGAAACTCCATCAGGAGCACAGGCCAAGGCTGCCACAGCCCAAACGGCAGCT
+GGGTCTTATACAGATTCTTCGGTAGCAGGGGTTAAGTCGGATTCCATCAACTATAAACGT
+ATTACATCAATGGGAGGTCTTTATTAATGGCAGTAGGCGACAGAACGCCAACGGAACTGG
+CCCAGTCAGCATTAAGTGCCACGGCAACGAACTACTTCACCAACGCAGGGTCAAGTTATC
+GAACCCAGATCTTAGAGGTTTGCTTAGTCAATACTGGTTCCTCTCAACGAGTTGTAACTC
+TTTATAAAAATGGGTTGACTGCAAACAATCAGATCGCCAACTCTATCACACTCCCGGCTA
+ACACGTCAACCATTATTGACTTGAAACTTGTAGCCACCGGGGTACAAACGTTTGGAGCCA
+ATCAAGACTCAGGAACTGATGTCACGATGACGGTCAGCGGCATTGTTGAACAGATAGCGT
+AGGTGATGAGATGGGTATTCGATTATTTGGGGCTGTTCAAGGTATAAAGGCCCAGGTTCA
+AGGGTTACTCCTTGGTTTGGGAACGGGCGGCAATGCCAACGCCTCAGAGGTTCTTAGTGG
+AAAAGAGGTTACAACCGACGTTGGACAAATAACAGGAACCATGCCAAATGAAGGCTCCGT
+GACGCTTACGCCGGGGCCTTCTGACGTTCCTATCCCGAAAGGATACCACGACGGGACTGG
+AAAAGCCTCGGCAGTTGTTGTACCTGCAGCTAATGTCCTAACCGGCACGACAATCGCAGG
+GACAGCAGGGACCATGCCTAACGAGGGAGCTGTTACTATAACACCGAGCAATGCAGCCCA
+GGCTATCCCGGTGGGGTATCATAACGGATCTGGAACCGTCCCGGCAGTTGTTGTACCGGT
+AGCTAACGTCCTAACCGGCACGACGATCGCAGGAACAGCGGGAACCATGCCGAACCGGGG
+AGCTGTGACAATCACACCAGGAAGCACCGCACAGGCAATCCCAGCGGGGTATCACAACGG
+ATCGGGAACAGTTTCGGCGGTGTCGGTCCCGGCAGGGAATGTTTTGACCGGCACAACGAT
+CGCGGGAACGGCGGGAACTATGCCGAACCAGGGAGTGCCGACATTCACGCCGTCTACTTC
+CGGCGACACTTCAATTCCTGCAGGGTATTATTCAGGCGGGATAGTAAAGAAAGCATATCC
+TGTAGGAAGCATGGTATCGAACGTCACGGTCGAGCAGATAGCGTATTCAGCCAACCCCAA
+CAGTAGTGGCTCCTCGTATGGTATCGCTGTCGATTCGCAAGGTAATATGTATCTATGCGC
+TGGAAGTATACTGTATAAATACAACGCAGCGGGATCACTTGTGTGGTCAAAGAATGACTT
+CTCCTATTTTGGCGTTTTCGTAGACCAGTACGATTATATCTACGTTAACCACAACAATTC
+TAACCTCCATAAGATGGACGGTTCAGGTAATACGGTCTGGAATAACGCGGTAGGGGTGCA
+ACAAGCATATAATATCACCATTTGTAATTCTGGGTATATTTACACCTACGACGGTGGCAC
+AAGTACCCACCCCACAAGAAAGCATGACGGTTCCGGCAATGTAATCTGGACGGATACAAC
+AATTGGTAGTAACTCTTGGTTTTCAGACACAAATTTCAGTACCGAAGTGACGGTTATTTC
+AGGATACGTGAGTGGAACTAGCATGGCAATCAGAGTGGTAGATTCAAATGATTCGTTACA
+ATGGAATTTAACTGCTTCTGCTTCAGCAATGTCTAACTGTTCCGGAGCGGTTATGGGTTC
+GGATGGTTACGTGTACGCCAGAAATGGCACTCAGGTTGTGAAACTAAACAGTAGTGGGGG
+CCAAGTATGGTCTGTGCCTATAAATGATACCTACACCTTAAAAGGAAATATAGCCATTGA
+TAACTCAACCAACATTTATATTGTTGAATACCAAACAGGCCATAGATATATGAAAATCAA
+TTCAAGCGGTACCATTCTATGGACCTACACGGCATCAAACATGACCCCATACGCGATTAA
+CGCAAATCATAGCGGCAGCTACGCATGTGCAACTATCCCATACGCAGGAGGTACTGTATT
+TTATGGTGCTACCCAATATCTAATTAACGGCTAGGGGGAAACTTTAAATGATATTTTTAG
+GTAACTTAACTATCATAAATCCCAACAAATCGTTGGTCAATTTCATTCATTATATGCCTT
+TAGACACGGACCACGGGATGAAGGATACAAACGGAAATCTAATGACCCAGGACGAATTAA
+ACGCGATCGGTATTCTTATTGATTCAATACCGCAGCCAGCCCCGCCCAATGGATATTATG
+TCTCCGCAACCTATGTAGATCCAACTACGAAGGACGTATCATTCGACTACGCACAAACCC
+CTAAAACTCCTGAACAACAACTAGCAGATTTACAGGCCCAAAACGCTCAAATGCTCTTAG
+CCCTAGTACAAGGAGGTTTGATGTAAATGGATTGGGTATCGATTTGTACAAGTTATTACC
+AAGCAGGATATTATGACAATACTTCACTAAAAGTATTTGTAGTTAAAGGTAAGATCACTG
+GGGCCGATTATAAGACAATCACAGGCATTGACTATGTAGCTTAAATTTGGGAGGGGCATA
+AAAGCTCCTCTTTTCTAATAAAAGAAGGGGGAGATGACCATTGGGCGAACAGGATGATCT
+AAATACGCGAGTTGCTGTCCTCGAAACCAAAAACCTAGCTCAGGAAGCTAGGCTCAATTC
+TCTAGAGATCGACGTGGGAAAAAAGTTCGACCGCCTTGAGGCTAAGCTGGATCAAGTTTT
+ACAGGCTTCCCGTGGACGACCAACGTGGATTGTGGCTCTGGCGATTTCAGGACTCATGAC
+GATTGTTACAGGACTAATTGTTTATTTGGTGACCCGTTAAGAAATCACCGAAGAAGGTTT
+GTCTGCATATTCTAAATTAAACGATGATCCTTGGTACAGTCGAAGGATATAGCTCTCGAT
+CGATTGTACTGAGAAGCTTAAATAAGGATGTCCTATGATGGTCCATCTGAGCTCTTCAAA
+CATCTCAGGAAAGTTGGTTGAAAAATTTCAAAGAGGAGGGGTCTTGATTGGATCTATCGT
+CGACGATACCCATAGTTGTTGCTGCAGAGGCGATCAGTGCCGTGATCTTTGGTTATTTGG
+GCTATGCGAGAGGGGTTAAGAAAGAATCCATGCTGGATGGTCAAGATAAGGGAAGTATCG
+AGTCAGACATTAAGTATATCTTGAGAAGGACTGACGATTTGTTAATGGAGCAGAAGGAGA
+CCAACAAGAACTTTCATACTTTGTCCGAACGTCTTGCACGGGTTGAGGAAGGAACTAAGT
+TAGCTCACAAGCGTATTGACCAGCTTGAAAAAGGGGAACGACGAGATGTTAGAAGTCCAT
+GTGATTAAGCGGACGCTCACGGAAATTGTCATTGATCCTTCACACGCAGAGAGGAAAGAA
+TCGGCAGAATTTCGGCGAAGTAAGGAACGATTGAAAGCCGATGGACATTATAAATGTTGG
+ATATGTGGAACCACAGAAAATCTCCAGGTCCACCATTTTGGAGCTGAGTGGAGCTTAGAA
+AACGTGACGGATTTTGAAAAGCTCAAGGTGTTTTGTGAAGAATGGGACCCCTATGGTTAT
+GGGCGGCTTCTTAGAAACCTGCCCATAACAACCGTCGATGATGTTCGAAATATGTTGGTA
+CTCTGTCAGGAACACCATACGGGTGGTTCTAAAGATGGTGCCGCCAACGGAATTCATGAA
+ATAACCTTACCAGTATGGCTGATTCAGAAATTGGCAAAGCAAGGAGAAGATCCTGTTCCA
+CAAGACGGTGAGTCTGTAGAGAACGTGATTAAGAAGATCACGGATTTATAAATCGTTAGA
+CTTCTAAAGGGAATATCATTATTTAGTCTCCCGAATTAGGGTGGCTTTTTTGTATGCTAA
+AGAAAGTAATTTGTCAGAAATATATACTGATAGCTGGCTATAGGAGGTCAAATGAGCTAT
+TCAATCAAACAAAACTTTATTGCCGGACTACCTAAAGAACCCTATGACAACGGGCATTAT
+GTCGGAGTAGTTGCACACTCGACGGCCAATAACGGCGACTCCGCCGATGGAGAGCGCAAT
+TTCGAATCGACTACTTGGCAAAACGCGTTCGTTCATTTCTTCGTGGACGACCAGAAAATC
+CTTCAAGTTGCCGATACCAACTATCTCTGCTATGGAGCTGGCCACACTGCAAACCATTTG
+GGTTATGTTCAAGTGGAGTTGTGCCAAACAACAGATCCAGTTAAGTTCAAAGCAGCTTAT
+GAGAAATACGTTTGGTTGCTTGCAAAGCTCCTATATAATAGGAAGCTTCCTGTCGTGGAT
+GGGGTTACTCTGATGTCCCATGCTCAAGTTTCAGCCAAGTGGCATGAGACGGACCATCAA
+GATCCGATCGAATATCTAACAAGCCACGGAAAAACATGGGCTGATTTGGTCGCTGATGTA
+ACGGCTCAATATAACTTGCTGGAGGAGGAAGATAGAGTGTTAAACGTTGCAGTATTACTA
+TTCACGAAGGACGATTTTTGGAGTGGGAATGATGTTGCTGCTAAAAATGGAAACTGTGCA
+CTATTTATAAGAGCAGCCAACCAGTCCGTTCCGGCTGAGGCCCAGAGTGCCAAGCAATTA
+ATTGTTGTTGGTGGGCCAAGCGCCGGGCATCCGAACGAAGTCCTGTTATCTGGCAAGGAC
+AAATATGCGACCGCTGCTGCGGTTGCTAAGTATTTGGGACAATAAAAAAGGGGGTATTTT
+AGTGTTAAACTTTATTCTGGCTTCAAAAGTTCTCGTTACCCTGGAGACAGTTCTGGGTTT
+AATATTAGCGGATTTCATTTTTGGAGTGTTGCTTTCTCTTAGAAACAGTAATTTTAGTTT
+CAGTAAACTGCCCCAATTCGTTGAAACGAGCTTGGTTCCTTATATTGGTGGTCTTCTTGT
+GTTGGCTCTCTTTTCTAATGTAAACACTGAGCTAGGGACGCTGTTTTTCACGATTGCCGC
+AACGATTTCAGCGAAATTTCTAGCGGATATTGTAACCAAAGCGGGGCAGCTGTTTAATGG
+ATTGCAAATTCAGAGTCCGTTGACTGTGGCTAAATCAGATAGCAAACAGGAAACAGTTCC
+CGTACAAAATGCAGTCCAAACGACGGATAATGGTACTGCTGGAGATGCGCAGTAA
+>NC_018068.1|provirus_2072558_2098541
+ATGGAAGATAGATTACTCACGAAGGAAGAGGTTTGTGAGTGGCTTAATATCAGCCGAGCC
+ACACTCGATAGATGGCGCAATCAGGGTTTGCCCTATTTAAAGACTGGGAAACTTGTTAGG
+TTCAACAGAGGTAAAGTTCAAGAGTGGCTTAATCAGCAGACTCACAACCAAAAATGAAAA
+GGAAGCCGCACCCCATCTCCGCAAAAAGACAGTGCAACTTCCCACATGAAACCAACCTTG
+TAAAGGCTGAACTTCTCTATAAGTATAGCAGAATGGGCCTCTTTATTACAAGTGTTGGAA
+AAAGAAAGAGGCGAGGATAGATGACCACTTTAGAAAGTCAAGAAATGATCCTATTAGGCC
+GCCAAATAAAAATAGGTCCTGAAGCAGAACGGTTTAAACGGTATGAGTATCTCGTAGGTG
+AATTATTGTGGTCCATGCGCGAGGACGGTTTTAAAGAAGGGGTAAGTCATGCAATTAAAA
+TTTTAGACGAAGATTCCAGAATTTCATAGCAGTCTTAAATTCTTGAAAATCCGTAGTATA
+TAGCTATGGATTTTCTTTTAATTTAGACCCTTGTACCCTACCACTATGGTCTCCTTCTGT
+AAAATAAAATTTCATAAATTATCAAGCATCGTCAAAAAGGCCCTTCTAAGCCTCTGAAAT
+TAATGAAATAATGAATACCCCTTGCCCCCTCCTGAAAACGGCAGGAAGGGGGCATTATGC
+ATGTCTCCGTGAAATGTAGCGGATATCCAATGACCTTCAATATCATTTGAATCATTATCA
+AAATTTATATTAAAGAAGAACTATTAAAATTGATAATATGTGAAAATACTAATTGAAATA
+TCAATTAAAATTTGATATTGTTGAGGTATAATATTTTACTAAAGAAAGGATGTAACAAAA
+CAAATGAAAAACGAAACAAAATGGGAAGATCTACCGATTATGCTCAGCCCTATACAAGCG
+GGGAAAATTCTTCGACTTAACCCTGAAATGGTCCGAACGTTGGCCAAGGCGAAGGCTATT
+CCTGCCATCCGTCCAACGTCTAAGTTTCTGATTCCACGCGACGCTTTGAAAGAATGGATC
+GAAAAAAATTCACAGGTAGTGGAGTAAAATGGAAATTTCCACGAGGAATAATATCAAATA
+ATATCTCTAAATCCTGCGTTTCAATTCATAATCAATCAAAAGAGACACGCGATTTTGAGG
+AGGTATTCACAAAGCCTATGAAGAAGAAAGGTGGTGAGATATCTATGCCGGGGTTTATGA
+CGCTTGAAGATTTATGTAAGAGCGGAAAAATTGCCTACTTAAAGCTTGGAGATGCCGTTT
+TGATTAAGATAATTGATGAGAGGGAGAATGATGACGATGACTAAGATTAAAAAAATCCTG
+TTAACTTCTTATATATTGATTACCCTTATTTTCACAGCCGTTGCCCCAGCCTTCGCGTAT
+TACGGGGCTACCGGTGTCAGTGGGGAGATTTGGCCTCCGGTACTCACGGGGTGGACAATT
+GCTACTGGCGGGGGAAATTCAACGATTAACTGGCATTTTAGCGACCCACTTTTTGGTGGT
+TCGACCGGTGGCGGTATCCCCGATCTCTCGGCTCAGTATCCAGACTGGGATAAGCCGAAC
+AACATGGATATTGTTCTTTGGGCACAGAACCATCATTATCAAATGCCGCTGAATAGTAGG
+TTTTATTGGTTCGCACTTCACCCGACCGATAAACAACCAACAAACTACACAGGCCCAGCC
+CCATGTTCTTACACACCGCAAATTCAATCTATCATCGATGCTTCGGGCTACACTCCTGCT
+GATTTTTATAATGCGGGAAAGGCTCCGCTGAGTGGTTCAGCACCTAAAGCAACTACAACT
+TCATCGCCAGTCTCAACTCCAGCTCCAGCACCTAAAACAGTATCAACCCCAGTTGCTACT
+CCCGAACCCCCTGTTGTCTCTGGTCCTCCTGCACCCGTCGTTTCAAAAACTCAAACGCCA
+GTGTCACCAGAAGTTGCAAAGCAACACTCTGACCCAGTGAGCGACCCTTCATCATTAACC
+TATGCAACTATCACCAAAATCGACAATGCAAAACAAGCTGCGGATGATAAAGCCCAAACG
+GATTCCCTAAATAGGAAGCGATATATAGTGTATGGTCTGTTAGCGTTAGCACTTGTGGTT
+TCGATTGGTTTTGTTCTTTCTATCTATATCCGTGAATGGAGGACCAAAAGGAAATGAGAA
+AGTTAATTTCTATCCTTACGGCCCTCCTAATCCTGGTCTTTCCCGCCATAGCATCGGCTC
+AATGTGGGATTACAACTTGGGATTTCGACCCACAACGGACGGCAACCAGCATATCCAGTT
+CCAGTACCGATCCATGGGTTCTCGCGCAGGGATCAGGAAAGGTCGTGTCCTATGCTGGGA
+AACCCGTGGTCGTTCATATTCCCTCGATCGACGAATCGTATGCGCCTAACCCGGTAACGG
+GAGACGTTCCTAAAACTGGCGTATTTACCTTTAACCAATTCTCATCAACGACTGCCATAA
+CAGATCCCATCGGATACACGATGTACCAGTATACCTGGGATGATGGAGGATGGGGACATG
+TATGGAAGTATACGATTAAATCCGGTGATCTCGCCGAAGGCAATGTGATTACTTTAACAG
+CAGCCGACTTAATCGCTGCATTTCCTTGTGGCTATTCAGGAGGAACAAACTTTGCGAACG
+CCCCGTCGGGTGTAACCATTTCAAACGACGGGAATTTTGTGGCCGTCGGAGCTGGCAATA
+AGCTTTATTGGTGGCCCATCGGAAATCCGGGGGCAACGCTATATAGTTTTATAAACGGCA
+ACTCTGACTTCGACATGTGCGAAGCTTCACCAATTATCACCCCCAACGGCTATATTGCCG
+TCGGATGTGATAATGGCGGATTTGTTTCCACCGACCTCTCTGGCAATACTCATAATTTCC
+TCACCTCTGACTCAGTTCTTGGCTCAGGCGATTCTTCCGAAGCAATTACCTCATCGCCAT
+CATGGAACCCAATATCAAATACCATATGGTTCGGTATCGACTCATATTCTGCACCAAGGC
+TCGTTTCCTTTGATCCATCAAACGACACAAGCACAATCGTTGGTAAAGGCACTATTTTAA
+CTCCAGTTTTTTCCCCAACGCCCGTGGATAAGGTGTCCGGAGATGTGTTTAATACGGATT
+ACGGTGGAAATGCTTATCGTTGGAGTTCATCCGGCAATCTTATTCAAAAATGGATAACTC
+CGAACGGGGTAACGCACGTATGTTCAAACATGGCGATAGCGAGAGACGAGAACGGGAATG
+ATCATGTAGCATGGAAAGATATGAACCGTCAGCTTGAAAACGCCATTACTCCATCGGGGT
+CATTCTGGGTTGAATCGGGTGGAACAAATGCTCATGATGTAATGGATCCGAGCTTCGTGA
+CCAGTTCAGTAGGCGACTATATAGGTGAGGCTTTCGTTGATCCGTCCTCAGGGGAGGTAT
+ATTATTCGCCACAACCGAATAGCGCAATATCTACAAACCCCCATTCCTACGTACCCATTA
+ATCAAAATAATTATGGCGTCATAGGCGATTACATCGACATGGTTTACGACGCTGATATCG
+GTCCTGTAATGAGTCCAGCAAAATCAACGTCCTATACCTGGTCCAACGATGCAAATGGTT
+CGCCTGGGATTTTGATTTATCTCCTGAGCCCCGTTTCTCTTGAAATGTGCGTCGCTGGTC
+CAAGTGGGGTCGTATATGCGCCGCCAAACAAGACGATCACGGGTTTACCTGGAGATACAG
+AAAATATTACAATGTTCGCACCGGGGTTAGATTTGAGTGGTGATACCAGCGATGGTTATG
+GTGTTATTCATATCACCGGTTTCCCGGATGGTAGTTCAGCAGATAAACAGGTAAATTTCG
+ACTGCAATACCACAGACCTGATAACCGGTTCAGGGAGTGCAGCGGCTTTCGATTCGACTA
+GTATTACCTTGCCGACGTCTAGCGCTAATTACACGCTGACCTTAACTGAGACGCTCTATG
+TCAAAGATCATAGTACCGGAGTAATGGAACAAAAAGATTATCCATCACCGACGATAACGA
+TTAATGTTCCTGTAGTTGGTGTTGCCAGCCCGGGCAATCTCACAATATCGTCTTATCACA
+ATGGTGACACAAACAATTCGGGCATAGACGCCGGGGGATACCCAAACTTGGTAACTGGTA
+ACCCGTTGAAATTCAATTATGGCGACACAATGTTGGCTGATCTTGTAATCCCGGTCCCAG
+CGCCACCAGCCGGATGGCAATATTATTCATCAGTTTTAAGCGGGTTCATAACATATCCAG
+TAAATACGCCAAAGCCGACCGGCACAGCGCAAATTGGGGAGCCACTGACGATTGCTTCAA
+CAAAAACAGCGACCTTTTCAAAGAGTACGAGGGCTGGAAGTCAAGAAAATGGGGCATCGG
+TGAACGACAGTATTGCCAGTTTTCCTGTAGAATGGCCTACGTGGAGGCCACCGATTGGAC
+TGCCAGGGTACGATTGGGACTCAACATTAACAGCGACATGGACGCAAACCGTTACCTATG
+TACACCATATTAATACACCTGTGGGGGGGTTCTCACAGTATAGAACTTATACTCATAGTG
+ATAGCACCCCATCACAGGAGTTACAGAGAACAGGTACGGATATTTACTATATTCCCGCAG
+CGAGGGAGCCGTGGATGAGATAAAGAAAGGGTTGATTTGCGAAATGAAAAAATCAATAAT
+GCTTCTTGTTTGTTCTGTTTTAATTTTGTTTTCGGGCGTTTCAACAGCCCAAGCATTTGA
+TGATAGTCAGCATAATCTTGTTGGCGGAGTTGATGCTGCTTATCAAGTGGTCACTCCTGG
+TCACTCTTACACATTGGGTTACAAACTTTATGGAGTTGATTTGACGAGTGCCTGCAAATT
+TAAACTAGGAGAAAATCCCGAAACAACCCTATAAAATAAAGATCACCCAACAACAAATGG
+AATTATATGGACTTCGCAACCTCCAAAAAATGCAAATTGTGGTGTCTCTACCTATGGCAG
+CTTATCTGGTAATGTTTTTGTAATGCGCCCATTATCAGAAATCCCATTAGATTGTCGAAA
+TGAGGAAGATATAACTGGTTTAATACCGTATAATTTTTCATCTGTGAAACCTTTATCTGT
+ACATGTTCCGACACGAACTACTTTAACTGGAGTTAGCGGTGGTGGGGATTTAATTCGTTT
+TAGAATCCCTGGGAATGGACACACCCCAATACCGGCAAAAGTGAACATAAAAATAATAAT
+TTTGGGGGCTATTGGCATAGCACTGGTGTTCGGTGCTGCTGTTTTTGCGATTAAGAGTAA
+ACAGAGGAGGTCACACAATGATTAAATTTATCCGTTGACCTAGAAAGCCTTATACTTTGC
+GAAAGTCCTATACTTTATAGCTTTATTCATTAATTAATTCATTAAATGTCATGAACAATC
+TCAGCCATACTCTCGCAAGGCTTTCACGGATTTACTAATGAGGTTAAAAACGCTGTTTTT
+TCATGACTGATTGACGCTTTGAATCATCATTTGAAATGATTAATAAATGTGTATTTATAC
+CTAGCCTATCATTGCACGAATGAAAGTAGTTTTGATTTGTATGGACATAACGCGAATCAA
+AACTATTTTCAACGACTAAACATTCACTGCCACAACGGTTTCAGGCGTTTTAAAGTGCGC
+GAAGTATAGCACTTCGAAATAGGTGAGAGGCTCCTGAAAATGTCTACAATCTAGACTCAT
+ATTTTATTTCGTTTAATATTTAATTACCTATATATAAGCTATTAAATATTGAATGTTTAT
+ACGATATGGATAAGCTATTAATTTTTACTAAAAACACTCTATAACAACCTATCCTCACTG
+GGGGAAAATGACATATCATTTTCGCTCAATTTCAAGGATAATGTTTGATTAAATATCAAG
+GGGAGCTGTACGATGACACAAAAAAACAGAGTTATATCAGACCGAAATATGGAAGTTGAA
+ATTATGGGAGATATACTCGAAATCAGGATTAATCTTGCACGATCAATCGGTATGACCAGG
+AGCGAAAAAAATTTTTTGCTCGCCTCGTCCAAAGGTACTCTTCAGATTGGTCGTGATCGC
+GAGGAGAAGATGGTTCTTACAGTCTATCGACCGAAGCCGGCATAGGATTAATCGGATAGC
+TATTGAGAAATGAGGGCTGATATTGCAGGCGAAAAACATTGATGCAGAAATTCAGGGAAG
+TTTTTTAACAATACGAATAGATTTAACAAAATCCTTCGGCGAAACAAAAAGCGGAAAATA
+TGTTCTAATAGCTACAACAGACGGAATTAAACCAGTGGGAGATGGGCGCACTGAAAAAAT
+GACGATAACTGTATATCGCCCTAAGCCTTGAGTCAGCTCTCAAAGAGGAGTGGTTCGCAT
+AAAAATAGTAATAGATCGTTCCTATGCTAATTTCAGCCTTTCCGAGGAAGCCTGGACCGC
+CTACGGGAAGGAAAGACCTAAAGACTTAAACAGTATTGTCTTCCGATCCGATCCCGACCT
+GATTCGTGTGGTCGAGCAACTTGGGGAAAGGGCAAACGGTCAGTCACAGTTCGGTCCGAA
+AAACAAATTAGAAATTGTAGAAGTCCCAGATGAGATTCCGGTTCGCATTGAATCTTATGA
+TGGGAATGAGTGGGTGGCTGAGGAACATAGGGTTTGGGGGAAGGACGAAAAGATATAGAG
+CACCAAAAAACTCACCTATTTAAAAGGTGAGTTTTTAATCTGATTCTTGACTGAACCTGA
+CTGACTCTTGACTGAATGCTACCGAATACTTAGCGATATTTACGGGTTTTTATTAGGTAT
+TTTGCTCAACCCCCGTTATAATTGAAACCCGCTAATCCGCTTGTAGAGTGGCTTGTATCA
+ATGCTTTCAGGGTTTTAACCCAAAAGTTTTTGGACATAAAAATGGTGCGGTCGAGAGGAC
+TTGAACCTCCATGCCCTTGCGAGCACTAGAACCTGAATCTAGCGCGTCTGCCAGTTCCTG
+TCCAAATCTCTGAACGCTTACATACATAAGGATTATAGAGTTTTTAAATAACTGAAAAAT
+CTAGTGGGGAACTAATTACCTGTAATTGTTTGCTATTTTAGCACATAACTTGTCATAAAT
+AAACTATGTATAAAAAGAATAACAAAAATAAAAATTTTATACGTTTAGAAAATCCCGCAA
+ACTTGCTTATAGCAATACTTTCACTAATTATCCCTAGTGTGCTTAATATGGATAGTATTA
+TCTCAAACAATAAATCAAAATATTGTCCTACTTGTGCTAAGGAAATTAAATTAGAAAATG
+ATAGGAAAATCCAAAAAGAAAGATATTATAGTAATAAATTCTCGCAAATAGAAAACGCTT
+AAAAGTCACATATATCAATACTTTTAAAGAATAGATGTAATTTTGTATATATGAATATAA
+TAACAAATTAAAATATTGTCCAACTTGTGCAAAAGAAATTGAGAAAAGTAACTGGGTGGA
+AAGAAAAAGGAGACAAAGAAATAAAAATGTCACGAAATAGAAACGCCCTGAAATTCAATT
+ATAGAAAGGGTTTGACGATATATAAAACAAAACGTATTAATAATGGTAAAGAAATAACAT
+AGTATTATCAATGCTTCCAGATTACATTGTACTTTGTTTCTCAATGGTCACTTAGGGAAA
+GAAATATCAAATGTTAAGAAAGCAGTGAAGTTTTAGAAGACCCTTATACACCAACCCTTT
+CAGGATTCATCAAAATCAAGAACATAGCAATATTAGTATTTGTACTTTATTTCTTAATGT
+CCTATAAGGGAAGAAATAAAATTTAATCGCGTTTTAATCAAAATTATCAAAATTAGTGTA
+AATCATAAAAATCACACCCTTCAATCCCTTATGTGGCAATGGTTTCAGAAATTAGTTAAA
+TTGCTGTATATGGGTATATAAGCATTTTTCACGTAATTAGTTAAAGCGGATTCTACAGTC
+CTACTCGCACAACGGTTTCAGGGCTGTCTATCTTCCTTGTATATGGTATATAAACAAATT
+CAAAATATTTGCTTATTATGATACTAATAGTAGCCAATCAAATAATATAATCAAATTAAA
+TAATCATTCTAATTATGAATACTAATAGTTGTCTACCAAATAATATTTACATTTAAAATT
+ACCAATGGCTGGTAAAGTGATAAGTATATTATATTAGTGTTTTTGTACATAAAAAGCGAG
+AAAATAGAAAACGTCTAAAACTGGCTTGTGACAAGGGTTTGATAATACATAAAACAAAAC
+GTATTAATAATGGTAAAGAAATGACAAATGTGAAGTTTTAGAAAAACCTCTTAACCCATA
+TCCAACAATCATTTCAAGGTTTGTTACAGCCATTCTAATATGGATATAGTTAAAAATCGT
+GGAAGGAAAACAGAAATCCTCTGTATCCCCACAGATACAAGCGATTCCAGTCACGCTCTA
+GCCGTTGTAATGTGGATAGTATTTTAATAAAAAGTAAAAAAAATAAAAATGTTCGAAAAT
+AGAAAACGCCTGTAACTACACTCCTGTAATACTTACAGAGGACACATGTATTTTCTTAAC
+TTATGATATATAGTATTATTTTTTTTATTTAACTTCTTAATTAACTTTTTAACTCGATTA
+TCCTCCACCTTCAGCAAGTGGATTATAATACATTACTAGTTGAAAAATTTAAGTCATTTT
+ATTCCGTTGCGTCTCGTTGGGTAGCTAGACCTGACTCCTCCAAAACAAAGGAAAGACGAT
+AAGCATAGTGAGTATTCTATGCAAAGGTGCGACCTAGTTGTTGCACCTTCTTCTTTATGT
+TTAAATATCAATTCTAAGTTTCAAAACACCATCAATTGATGGTAAATTTATACCTATCTT
+TCTTAGTTGGTATAATTCTATACCCATGATAAAAAAGTATAGAAAAATCAATTTAAATGA
+CCTTCTAAGGCGTTACAAAATGATACCCCTTACAATTACCCTACTTAACATTTTAAACTC
+AATACAGCCGATTTAAAATGAAATATTGATTTTTACCATACCCGCAAACCCTTGATATAA
+GCCATTTTTAAAAATGCCATTTTTTCATCATTAAGGGGATTCCACCCCTCTTTTGATGAA
+TTAAATATATCCCAAAAAACGAATGGAGGTGAAACAAATGACAAGTAAAATTGTAAGATT
+TATAACTATTAATTTTTCATTAAATCCAAAATATTACATTGTAAAATATGGTTTGGAAGA
+TATTGCTAAAACAATTGAAGATTTCAGAAACGATTTAAACAAAAGGAGATGAAACAAATG
+AGATTAATTAGATTTATGAGACATCCAATAAAAAATGCATTAATAGCAATTCAAGTAGTT
+GGTTCTATATTGCAGGAATACCCAAAACAAACCTTAATCTTTATTATAGTTTATTGCCTA
+GTATATTACTTAAACTATTAAAACGGAGGTGTGACAACAAATGCCAACAGATACACTAAA
+AACATTTTACATAAAATCAATGCGACTTGCAGGTTTCTTAATGCAAAGGGGCTTTGTCCT
+CCATAGCGTGATACCTGATAGATTTGATACTGCTATGCCCAAACGCAATGTATTTACATT
+TACTAACTGTCCAGAGTTAATTGATGCTATAGACGATTATAAACAAATGAGAGGAAGTGT
+ATAAAAATGGAACAAACATTAAAACAAATAGAAATGCAATTACTCCGTATTGAAGCACAA
+CAATTAAATTTCCACCTTCAGATGATGAATATGATCAAATTGATCAATCAAAATTTAGCC
+AAAATCAAAAAGTAATCCTTTGCTAGAGATAGCAATTTTTTTATGCCTATTTTTTATTTA
+ACTTTTTAAAATCTGAAATGAGGTGGTGAAATGGACTTAAATGCAGAGCTAATAAATCAA
+GTTTTGGGGCAAGGAATATTCGCAGTTTTATTTGTTTGGTTGCTTATGTCTGAAAGAAAA
+TCTAGTCAAGCAAGAGAAGATAAGTTGATGCTCCAACTAGAAAAATCTAATGATGTTTAT
+ACGAACGTCATTGAAGCGGTAGATGCCCTTAAAGATACTATTATGAAACAAAAATAAAGG
+AGAGATAACGAATGGAATTTACACCTGAACAACAAGCCCATATTGATGGATTACTTACTG
+AGCATAAGGAAAAATGGGAAACTGAAATCCTTGCACCTTTACAAACAGAACTAGCAGGAT
+TAAAGCCAGTTGCCAAAACAGATAAGGAAAAAGAGATTGAAGCCAAGGAACAAGAACTAT
+GGAATAAAGAAAAATCTTTACATATCAAGGAAAAAGGTCTTAGTGATTTTGCTGAATTCT
+TTAATGCTAATACCATTGAAGATTTAGATATTCAAGCGGAAAAACTTAATAAAATCCTAG
+AAGCCAAAAAACTTAATAATGCTTATGTTCCTAGCGGTCATAAAACTGCTGATGCTTATG
+CACAGGCAGAAAAATCAGGTGATACTCAAACTATGATAGGCAGTAAACTGTCTAAATTAT
+TCTCTTAATTTATAACTAATATTAAATAAAAGAAAGAAGGAATTTTATAATGATTACAAC
+TGCTAATTTTACCTCTTTGGAAAATATTAACCTTGCTAAAGAAATAAGTTTGGTAAGTCC
+GCTAGATACTCCTTTCAGCACCATGCTTTTAGGTGGAGGTAAATTCGATACCACTACTTC
+AAAGATTGATACTTGGAGAACAAAATCCCTTGATAATACTGCTGATATTTCTCAGGTTGA
+AGGTTCAGAAACTTCTGTATTCCAAGCAAGCGCAAGAGCAGAAATGTCAAATGTTTGTGA
+AATTTTTAAAAAGGCAGTTTCTGTTTCTGGAACTGCATCCGCTTCAGGTATCACAGGCGT
+TCCTAACTCATTCGCTGAGGAAATCAACGACCGCTTAATCGAAATGAAAGTTTCGATGGA
+GAAACAACTTATCAATGGAGTTAAAAATGATGGTTCTGCCACTCCTTTTATTCGCAGAAT
+GGGTGGATTATTTTCCTTTGCATTGGCTGAACAATCTATTTCTAATGCTACTGCTGGAAC
+TCTTGCAGAAGCAGACGTAAAAGACACTGTAAAAGCACTTTGGACAGCAGGAATGGCTAC
+AGGTCAATATATTGGCATGGTTAATGCTGACCTCAAAGAGCGTATTGATGCTTTATATGA
+TGGAAAATACAGCTATATTGCACAAGAAAATTTGTTTGGGCTTGTAGTTTCTAGCATTGC
+TACTAATTATGGCACAATCAAACTCTTACTTAATCGTCATATGCCAGTTGATAAAATGGT
+TGTATTTGACCCTGCATATCTTAAAATTGCTTATCTTCGTCAACCTCAATTTGAGATGTT
+AGCAAAGACAGGTGACTACACTCAAGGTCAAGTAATTGCTGAATTGACTTTGAAAGTTAT
+GAATCCTAAAGCAATCTCAGTTTTAACTTTTGCCTAAAAGGTCAGAGTTGGTCAGGAGAG
+GGTGAAATATCCCTCTCTATATTTTTATTTAACTTTTTAACAATTTGAAAAATGAAGGAT
+GTTTTTAAAATGCTGATGACAGAGGAATTAACGGAGCGACAATATTATACATTTACAAGG
+AAAATCAAAAAAATTAAACTTCGACAAATTGCTGAGGTACTTGGATGTAGTGTGCCACTT
+CTCTCAATGTGGGAGACAGGCAGGACAGACATAAACGATTATTACGTCAAAAATTACAAG
+CAATTTATTGATAACAAATAACCTATAAACAAATGAAAGGGGTTGTATTAATGTTTGTGG
+TCGATAAGGGCAACAACGATTGCCTTCTTGATTCTGTAAAAGAGAGGGAGGGTGACATTG
+TGATTTAACCATAGCATGGTTAAATTTTACGGTACATTATCAATAGACAAACAACATATT
+GAAAATGAAATCCAAAATAAAGGAGAGATTTCCGCAATGGTGTTCTGACAATGAGGACTA
+TGAGTTGATGCTAACGGATGATATAGATAGTTTGGTTAGTTGCGCTTTACTTAAAAAAAT
+TAAAGGTTATGAGACAAATTACTATTATGATTTTCAAACTATTTATGAGCTTAAAGAATC
+AGATGTTCCTGCAATTGCAGTTGATTGTGATTTGGTTAATGGAAGATGTTGGAGTAATCA
+TGTAACAATGTTGTCCGCTAAGGACAGTGTCAATAAAAAGAGTGCCAACTTAAACAATAT
+CGGAAAAATATCAAGAGATAATTACTTTCAAAAGTTTTGTGGTAGCACAGCAATTCAGAT
+ATGGAGTTTCTATGATATTCCTCTACCAGAGACAGAAGAAGGTAAGATGGCTTTACTTTG
+TTTAGATGTTGGATTTAAGGGACACTACGATTCAAGATTCATTGAGATACATTCGAAATA
+TCTCAAGGCACTTGGATTCCCTGAATTAATTGAGGTGCTAGAACGGCACACTTCAACCGA
+ATTCTATGATCTGATTAGGAAATATAATATGGCAAGCAAAATAAAACTTAATAAAAATGG
+TATGCTCACCACTGACATAGACATTGCAAATTTGCAGTGTCTTTTTAGTTTGGATTTATC
+TCGCCCTGATAAACCATTCTACATAAGAAGAGAATTTACAAGAGATTGGCCTACATGTTT
+AGTCAACTATAAGACATATACAAAGGATGATTTTCCTGAGATGTTTAGTGTGGCTCTAAT
+TAACAGAAATAAGGTTTGTTTTACAAAAATTAAATAGAGTTTTGAAAGGACTGGGTAAAA
+TACTCAGTCCTAATATTACCAAAAATGTTCGAACAATTATTCTCAAATTAATTGTAATGT
+TCGGAATTATCATTGACCTTAAAGAAAAACAAGAGTAGAATTTTGAAGCGAAGGAAATGA
+ATATTCAAACAAATGAAAGGAAATGCTAATGAGAGTTTCAGATGTGGTTACTATAAAAAA
+GGTTAAATCTTGGATGCCAGGCGATGTAATAACAATAAAAGCAGGTACAGGAGTAGGTAA
+ATCATATTTTATAAAAAACAATCTATACGCCTTAGCCAAAAAAGAGGGCAGTAAAATTCT
+TTTATTAGTAAATAGAATTAATTGTAAAGATCAATTTGTAGATGAAATTGGTAAGGCAAA
+AAAGACGGATATTATTGATATTAAAACCTATCAATATATCGAAAATAAAGAAGCCAATAA
+AAATTATTTTGATTTCAGTGAATATGATTATATTGTTTGTGATGAGTTTCATTATTTCAT
+GAGTGATGCGGCATTTAATATCAATACCGATTTATCTTTAAATGCAATTCTTGCCCAAAC
+TTTCCCAGTTAAAATATTTATGAGTGCTACGGGCGATTACATGAAAAATTATATAACTGG
+AGTTAGAAAAATAGAAACGATTGATTATGAAGTCCCTATTACATACGATTTTATTAAAAG
+TTTAACCTTCTTTAATAAAGATGAAACACTAGAAGCATTCATAGAAGAAGCAATAGCAAA
+GAATCATAAGGCCATTTTCTTCATCCAATCAGCCACAAAAGCATATGATTTGTACAAAAA
+ATACAAAAAGCATTGTTTATTCAATTGTGGTAAAAGTGATAAACATTACAAATATGTGGA
+TAAAGAAAAAATCAAAGAAATGCTAAAGAAGGAAAGATTTGAAGATCAAATTTTAATCAC
+TACTACCTGCATGGATACAGGGGTTAATATAAATGACATTGACCTGTATCATATTGTTTG
+TGATGTTAAAGATATCGGCGTTTTAGTTCAGTGTATAGGCAGAAAACGCCTAGAAAATAA
+AGATGATAAAATTTATTTGTACGTTAAAACTATTAATAATCAATCATTAGGGGGCATGGA
+AACCCAATTAAAGAGAAAAGTTAATATGGCTGATTATTTGCGAGAACATACCGTAAAAGA
+ATATCTTGAGGAATACAAAAGACAATATGATACCAGTAACATTGTCTATAATGACACGGT
+AAAAGAAGATAATAAATCAACACTAAAAGTAAATGAATTAATGTTCTTTAAGGTTAAAAC
+AGATTTGGCTGAATTAAGTTTCATGAAAACTTATGGTGATTTTGGTTATTGTAAATATCT
+TGCGAGTAAATTTGGATTCCGAGATGATAACGGATATTATAATTATCGGACTATTGAAGA
+AGATTATCAAAAAGATAAGATTGTTAATTTTATGGCAAAGGTTGTTGGCAAAAAATTAAC
+AAAAGAAGAACAAAATGAATTGATTGATATAGTTGATTTAAGAGATTCTAGGAATAGACA
+ACAAAAATCAATAGGACAATTAAACGAGTATTTTAAAGCAAATAATATAAAATATTTTAT
+TATATCTAAAAAAAGTGGTCCAAAAAGATATTGGGAAGTAAAAGAAGATAATGCGCAAAA
+CAAAATGGGACAAAATTTGGAATAACCTCTATTATAGGTTTATCCATAAATTGTCCCAAC
+TAATTATTATATCATATTGCAAATATAATTCAAGAGTATTTAATTAAAAATAAATATAAA
+AAGTATTTGGCAGTTGCCCACGGTGGGCAAATGCGAGGTAATAATTTTGATATTTGCTTG
+GGTTTTGCGACCTTGGGGCGCGAAACCATAGCAAATTCAAATTATTGCCCAATGCCATAG
+GCAAAAGTTTAATGTAAATCTTATTTCAATGAATAAGAACACAGGGCGCTTACCAGCGGG
+GTATGTCTGTCGGGTGCAGTGGCTCCCGCCAGCCATAAATATAATTTTAATTGTTTTTAT
+AATTGGTTTCAAGAAAAGGTACTTCATATTGAGGTGCCTTTTTTTGATGTCACTAAGAGT
+TACCATTACAAAATAATTATAGGAGTTGATACAAATGACTTTAGACGAGCAATTAGCACG
+TACAAATTTAAAATATAAACGATATTTTCGGTGGAAATTCAAACTATCTACAAGAGGTAG
+AGCATATAAAGAACGTCCGTTGGAAGAAATCATGAAGATTGATTTAATAAAAACAAGGGA
+AACATATTACGCTTGGGAAAAAACGGAGGAATATCAGAACTTAGTCAATTTACTTATTAT
+GTCAAATGCAGGTAATGATTTATTAGAAATTTATAATGTCATGCTTGATAAAGCAAAAAA
+AGGTGATGCAAAGGCAGTTGATACTGTCATTAAACTTCAGAAATCTATTGCATCAAGCAT
+TAAACAGAATAGTAAAGATAATAATTCTGCTCCTGTTGAAGATGAAGAAGATGATCTTGA
+ACTATGACAATGAAAAAGGAAACAAAATTAGAGAAGATTAATAAGGACTTCTTTTTGTGG
+GCTAAAAACTTTGTTCAGATTATTGATAATAATGGAGATTTAGTTAAGTTTGTTCCGAAT
+GAGCAACAGGTAGAATTCTTTAATGGCATGGATAAGTTTAATATCATCGCCAAGAGCAGA
+CAATTAGGTTTTTCAACTTTGATGATGATATATTGCTTGTGGCTTGTTTGTACCAGACCA
+AATACTAATACTATGATGGTTTCTTATAATGTTGAGAGTACACAAGCACTATTTGAGAAG
+TTGAAAATGATTTATGCAACTATTCCTGACAAATATAAGCCAGCAGAAAAGCGTTCAAAT
+AGAATGGAATTATTTTTGGAGAACGGTTCTAAGGTAATGGTAAAGACCGCAGGTAATAAA
+TCCTTGGGGCGCGGAATGAATTTACAGTATATCCACTTGTCAGAGTTTGCTTTTTATCCC
+GATGACCAACAAAAAGATTCATTAGTGTCATTAGAGCAAGCACTTGCAAAAAATATGGAT
+TCAATGATTGTTGTTGAAACTACTTCTAACGGATACAACTATTACCAAAAACTATTTACA
+AAGTCCTATAAGGATAAATCGAGCAGATATAAAGCATTTTTCTTTCCTTGGACTTCTAGT
+GCCACTGTAAGCCAATTCAAACACGAGTTAAACATTGCTGAGGATTGGTTTAAGGCCAAT
+AATCATAATCATAGATTGATACCTGAGCAATTAGAGAAGGATGAATTACCTTTATATAAT
+GCTAAAGTTAGTTTGAAGATGATAATGTGGCGTAGATGGAAACTTCAGGACATGGCATTA
+GAAGATTTTCAGCAGGAATTTCCCTTTACTCCTGAAGAAAGTTTCAGGGCCACAAGTCGA
+TCAATATTTAATGAGCAAGCAATTAATAATAGTGTTATGAATCTACTTCCTCCATTGAGG
+AAAGATGAACTAAATATATCTCTCCCTGATTCCCTTGCTAGTTATTATGGCAGGGGTTTT
+TATATGTTCAAAAATGTTAAGCCAGGAGAACGATATTATGCAGGAGTTGATACTGCTTCA
+GGTAATGGTGGAGATAATTCAACGATTAGTGTTTATAGTTCGGAGGGTGAGCAGGTCGCA
+GTGTTTATGGATAATAAAATACCTATCTATAAATTTGCTGATGTTGTTTATGACTTGGGC
+ATGATGTTTAACTATGCCTTTCTTGTAGTGGAGAAAAATAGTTTTGGTCAGTCAGTCATT
+GAGAAGTTAAGGTCTGAACGCCAATATTTAAACATGTACAAGATGAAAACTTTTGATGAT
+AGAGGTAAGAAAAAGTATATGGTTGGTTGGATTACTACAGCAGTTTCAAAACCAAGGTTA
+GTCCAAGATTTTAAAGAGCAATTTGAGAAGAATTTGATTTTGATAAATGATAGCAGCACT
+CTTGATGAAATGAAGATTTATGTTGAAGCCGATGGTAAGACATCAAATAAGCGTGGAGAT
+GATTTTCACGATGATTTAGTAATTGCTTCAGCATTGGCAGTTCAGGGGCTTAAATGTGGC
+AAATGGTATTTATAAGAAAGGGATGAAATAAATGAATCTACAAGAGTATATAAATGCTTA
+TTATGATGGAGATGAGTATTGGTTTATACAATTTACCAATTACAGTAATTCTCATGTCAA
+TGTAAGTCAGCAAAATAATGTACCTTATGTATATAGTAATCAGGAACGCATCATGAACAT
+TATAAACATTAAAGATTATTTAAGTGGCAAACATGCCATTTTAGATAAATCGGTTGAAAT
+GTGGAATGGGAAAGAATTCCATCCGAGAACTATTGTTTTGAATTATGCCAAGACGATATT
+AAACTTCTCGACAAGTTATTTGCTCAAGAATCCTGTCACTATATCAGGAGATGAAGCAAG
+TGTACCTATAGTCAAGGATGTTTATAAAAAAGGCAATTATAATAAGATTGATTGGGACAT
+TTTAGATAAGGTATGTAAATATGGGTCAGTGGCTGAGTATGTTTATATTGACAAAGACAA
+AGAGATTAGAAGTAAGTTAATACTGCCAGAGGACAGTTATCCTGTTTACAATGATGAGAA
+TGAATATATTGGATTCGTTGAATACTTTACTTCGATTATGAATGTAAGTTACTGGAATGT
+TTTTACTGAGGATAAGGTATTAAAGTATGATGACTTTGGTGGAGAGATAAGATTAGTAGG
+TGAGTTTAATAATCCTTCAGGTTTGCCGATTATTTACAAAAATAAGAATGAGTTAGATGA
+AACAGCAGGGCGAAGTGATTTGGAGGATTATGTAAATATTGTGGATGCCTTGGAGGATTT
+AATTAGTAAATATACGGATTCAATTTATAAGTTCATTAATCCTATACCTGTAGTTGTCGG
+GCAGAAGTTAGGCATCGGTAAATCAGGTGAGGGTGCTATACCTTCTACATTAGTAGGAAC
+AGGATTACAGTTAGATGATGGTGGACAGTTTAGTTTTGCTAATGGTCAATTAGATTATCA
+ATCCTTTGAATCAGTTTGGAAGATTTTATATAACTCATTACTTCAGGTTTCTAGTGTTCC
+GGCTGTATCTATGGGTGTTCAGGACGTTAGCAATTTATCAGAAGTAAGTATTAAGTTATT
+GTTCTCTCTTGCTGATTTAAGAGCAGGTATGAATGAGATGTATATGAGAGAGGGCATAGA
+ACAACGATTTAAGGCGTTTGAAACATTACTTAAAGCAAAAGGTATAGTGATAGATGCTAA
+TGCTTTAGATGTAGTATTTGAATACGCAAGGCCAATGAATCAGACAGATATAATCAATGA
+TCTAAAGACATTAAGAGATATGGGTGCTATTAGTTTACAGAGTACATTAGAACAGTGTCC
+TATGACATATGATGTGGCTATGGAGTTAGAGAGGATTAAGAAGGAAGATAAGGCAAAGGT
+TAAGAAGCAACAGGCACAACAACAAACATTTGATAATAATGGGAATGTGGTTAGTGGAAG
+TGATGCTACCAATAACAATATAAATACAGATAATGGTAATGTAAATGGTTAAGTGAGATT
+AAGTGATACTAGATATAGTGGTTAATTTGTTTTGTTAATACTAGATGTAGTGTTGCATTA
+AGTTATGGATTATATAAGCGTTTGATTATGAATGTAATTGTTCTAAAAAATCGCGCGTGT
+TATAATATCTATATACCCATATGGGGTATAATTACTATAATTTTGCTGTATTCAATATGT
+AGGTGGCACTCACTCACTGACATAATAACCAACAAAAAAGCATAGGTGCTTCAAATCAAG
+AGCATCTATGCTTAGATACATTGTAATTATCAGAATTGTTTATTGGGTCCGATAATGAAC
+ACTATGTAAAGTAAAATATGACACAATAGACATTGTGTAACATTAGGTAAAATGGCTACA
+ATCCGCTTATATCAAGGGATGTAGGGTTTGGGGTATTACTTGCCCATTTACTTGTTAAAA
+TCTAATTGATAATGACTAGGGAAATTCCACCACTCATGGACATTTATAGGGTAATTATAT
+AGCATCAAATTGAAGTTTTAATGGAAATAGGGGGCTGATTCGATACCCCTTTTCTGAAAT
+GAGTCGCCATAGTTAATCCAATTTTACACGTTCAAAGTAAATTTTGAATCCTCAGATTCA
+CTTGGAATAAATTCATACCCACAAAACTCACATTTCTCTGTTCCATAAGGAGAAAACTCC
+CCACACTTAGGACACTTTTTTTCATTCCTCGAAATTATTGCAGATATTAAAACCCCAAGG
+ATACTAAAGAAAAATCCTGCAAAAAACCATGCTATAAAAGAACGATGTTTTGCCCATGCT
+ATTGCTCCACTGATGATTCCGCAGATTATACCAAAAATAAACCATAATGACATAACATCA
+CTTGATGGAGTAATCAAGTTGAATTCCTCCTTACTACTTAAATACAATTTGATTCAAAAC
+ATCCGCTTAATAATTTCTTTATATCTTTTATCATCTATTTCTATTAAACACTTTTTACCA
+TTTTTAAACTGAACAGCTAAAGTATGGATACCTTTAGATTTAGCAGAAAGACCTGCTAAT
+AATCCAACTGGGCCTAATAAAAATCCTCCAAGCAATCCTCTGCTTATTGCACTTGAAGCA
+CTTTTTATGCTTTCCTCCGTAACGATTTCATAGTGTTCCACATTTGATTTACTAATATCT
+TCAATGTTATATCCCTTTGAATCTTCAATGTATACTAAACCAGTCGTCCACCCAATGCGG
+TAATTAAAATAATCACCAGCAATAACAATGTTTTTTGCACTCATCTTAAATCACTCCTCG
+TATAATTAATTTAGTTCCTGCCCCACGAGTCCAAAAAACTAATGGAACGTGGGGTATTTA
+AATGACCAAAGAAAACTGGAAATTCAGTTGGTTGGTCATCATCAACAAGATGCGCGCAGA
+ATAACGCATACCCCATGCAGTCGTCGTGCCTGTGGGCAGTGTGGACAAGTCAACCCCAAA
+GCACACTTCAAATTCGACTTGTCCAAAGCCTGAGGGAAAGCTCTTTTAAGATAGACCCAT
+AAGGGCTTTTCCATAGGCTGGCACTGTCCACAGGCTCAGGATAAGGAATACCTGAGTAAT
+GATTCCTTAAGTCGTTCTTTGACAACAAAAAAGTATTTAAGTTTGTTGGGGTTTCAGGCA
+AAATGATACCGTGAGGTTCGTTCTGGTAAGGCCTTTCACTCCTTGAGGCTATGACCTCTT
+ATTAAGTCTGACTGCCAGCCCACAATTTGAACTTTTAACTCGAAGGTTGCACAGCTTAAA
+GGGAACCCCTCCGATGGTAGCAGATCGGTTGGATCCGAGGTCTTTTTAAGACAAGTGCTG
+ATTCGGCGAGGTTGTTGACCTGTTGTGGTGCCTGGTCCCAACGTTAATCTTACAAATTCT
+TCGACTCGGAAAGTGAGGTGATTTTACTTGAGTTTATTTGTCGGTATAGATGTGAGTTCC
+AGTGATTTTAAAGTGCGAATCTTAGATGAGCGTGGTAATGAACCAGTTAAAAGGCTAAGG
+GTTTTGAATGATCAGCCTGGTTGTGAGCAAGTTGCCCGATATCTCTCTGAAGCCTGTAAT
+AAAGAGAATGAGGACCGGCTGGTTATTGGTTTAGAGGCCACTTCCGTGTACAGTTGGCCG
+TTACAAATGTTCTTAGCGGAAGACCATTGTTTAGCACCTTTACAGCCCCAAATTTATTCC
+TTTAACCCCAAGGTCGTTGCTAATTTCAAAAAGGCTTATGTGGACCTTCCGAAGAACGAC
+TGGATTGATGCCTGGGTCATTGCCGAACGTTTACGCTTCGGCCGGCTCCCGGAGGGCTCT
+CAGGTCGATTTCCGCTACTTACCGTTACAGCGACTCACTCGCTTTCGTTGTCATCTGATC
+GAGATGATCTCCAGAGAGAAGAATTATTTCCTCACGAACTTGTTCTTAAAGTTTAGCACT
+CTTGCCCAAGGTACGGTTTTTAGTAATACTTTCAGCGTTACTTCTGAATCCTTGACACTT
+GAGTTTTTTTCTCCAGAAGAGGTTGCGGCTCGACCGCTTGATGAACTGATTGATTTCCTC
+ATGGAGAAAGGAAGAAGTCATTTCGAGGATCCGGAAGCCAAAGCCAGAGAGTTGAAGGAA
+GCCGCTCGCAAGGCCCATCGACTACGTGGAAGCCTATTGCAACCCATTAACCTTATCCTA
+GCCACGAGCATCGAAACCATCCACACTTTAGAGAAACAGGTCAAGAAAATCGATAAGGCG
+ATCGAAGCTGAAATCAGGCATTTCCCTAATACGCTCATTACCATTCCCGGTATTGGCCCT
+GTGCTTTCAGCTGGTATTATTGCTGAGATTGGAGACATCCGCCGTTTTCCGAATGAAGGA
+GCCTTAGCAAAGTTTATTGGGCTAACCTGGCGTTCTCACCAGTCCGGTGATTTTACAGCC
+GATGACACGCCCTTAACTCGAACCGGCAACACCTACTTGCGAAGTTATATCATCCAGGCT
+GCTAACCTAGTACGCCAAAAGGAACCAGAGTACAAAGCCTTCTACCAACGTAAATTCTCG
+GAAAGTAAGACTCACCATCATCGCCGTGCTCTCGTGCTTACTGCACGCAAACTCGTCCGT
+ATGGTTGATGCTCTGCTACGCAGCAACCAAATCTATATGCCACATGGCAATAGGGGGATT
+GCAAACTAAGCATGAACTACGAGAATTGAAGTCCCATTTTTGTAACTTGTTTCCATTTCA
+TTTTGGGAATAAGAGGGTTTTTTATTGCCTTTTTTGCCAACGGATAACTAACTTACTGAA
+AAATTGACTCACTTAGGGTCTTGACATATTACCGAAGGACTTAATTTTGAACCGCGGTTA
+ATATTCCATTGTCAAAATACAAATAACCTCCGTTATCATATACCCATTGCTCATGTGTAC
+CGTTAGCAGTAACCGTTCTATTGACCTCATTTGGTCTTCCCCACGAAGAATCTAAAACCT
+GTTGTTGAGTCATTCCTATTCTGACACCTTGTGTTTTCGCTAATGCTTTAGCTTTTGCTT
+CTTCCTCGGCACGTTTTTGAGCTTCTAACTTGGCTTGAGCATCTGCTTCTGCTTTAGCTT
+TGGTTTCTGCTTCGGCATTTTGCTTTGCTAATAAATCATTGTATTGTTGTCTTCTTTGAA
+GGAGTTCTTTTTGGACATTCTCATCAAGAAACTTGGTAACGGTTAAGTTTTGAATTTCAT
+TAATTGCCTTTTGATAATCCTTTGAATTAGCGTACTGGTCAATTTTTGTCATCTCATCTT
+GAGTATACATTTTCTTACTTTCAGCTTCTTTTGATTGTGCATCTTTATAACGTTTTGTAT
+CTTGTGCTGAAACATAACTAAATGACCTATAAGCATCTAAATAATTCTTATCATCAAATT
+GTTTTAATCCTAAATTATAGTTTTGAAGCGAAAAGCTTAAATTTTTACTTAACTCCTGCT
+TATCGACAATAGCTTGATCTGTGCGATATTTTAGGGCATTACTATAAAACGTTTCAGCAT
+CGTTGAATTTTTCATTAGAGAAACTATCATTTCCCTTTCGAACATTATCATTAAAAAGTT
+TTGAGTCATAAAGTGCTTTTAGTGAGAGGGGGACTATACAAACGACAAGAATAATGACTA
+TAAGAAGAATTGTTTTTCTTTTTTCGGTATTAGATTTTATTAATATTTCTTTTATGGGAT
+TCTCCATTTTCAAATACCTCCCAAAATCTATTTATACCAAAAGTATATACCCGTCCTCGG
+ACATTTTTTTGGTGAATCATGTCTATAGGATTTGTCTTATTACGTAGTATTTGAGAAATT
+AATAGAACATTCTGAAGTTTAGCAGGAAAATATCTATCTATGTTGAAAATGGAAGCGAGA
+AAGAGGTGAATAAGGTGATTGAAATCAAGCCAACTCAAAAACAAGTATTGAAAGTTTTAT
+TGGAAAATAAGAATACTTGGCTTACTGATATTCAGATAAGAGATAAATCAGGGTTGAATT
+ATTCCCATGTAAAAACTGCCTTGAAGAAGTTTATGGACAACGATTATGTTTTCTTTGATG
+GAAATAAGAGCTTTCAAATTTCACCTGATGGGGAAAGTGCTTATTTAAGTTAATTATAAA
+AAATGGAGGGATATTTTATGACAACTACAAAAGAAGAAGTGATAAAGATTTTGTCTCAAA
+CATATGACGAATGTAAGAAACAAAATTACAGCTATTTTATGAGAGAAAAAATACCTAACT
+TAAACGAATTAATGTTTAAATTGAGATACCTTGAAGATGAAAAACTTATAAAATATTTAG
+ATGCCGATGATGGATTGCCTTATGGAATGTTTAAATTTAGGATAACTTCTAAAGGTATTG
+ATTTCTATGAAAATGAAATAAAAAAAGTAACCGAATAATTAATATTCATCTAATCCCCTA
+ATTTATGGGGATTTTTTATATCCAAAATTAAAGGAGGAAATCAACCATGACAAATTCAGA
+CCGCTTAATCATGGAAATCAAAGGCATAGACCTTACACCAGATGAATTAAATATATACCT
+TGAAGAAAATTTACTTGTTGGTACAACTGAATATATTCCAACTTCAAAAACAAATAAGCG
+CAATATCTTAAAGGCAGCATTATCAATTCTTGAATCGGTTGCCAATCAACCTGATTTGAT
+GAAAAATTATAAACAGGATGATATTTCAATTTATCAATTCCATGAGAATCTTGAAAAGAG
+AATAGATGCACTCACATATAAAATCAGACAAATACCTGATGATACTCAAACTTATGCTGA
+TGGGGCTTCATTTTTTTATATGTTTGCTGATTAAGAGAGGGGATAAATGAATGGTGAAAT
+TATTTGATCCTGATGCTTCAAGCTTTAATTATATGCTTGAGCAAATGGGTAAAGATTTAA
+CTTTGAATGATACCACGCAAATTAGAGCCATATTGTCCTCCATCCCTGTCAATGCAAATA
+ATCATGATGATAAATATATATCCACCTTATCCCCTCTAAAACAAGGCGATAAGGTGGATT
+ATTTATTGTCTAAATGGCTTGTAGTTTCTCAGGTTAATGGTCAGAGGATAGTAAAATATA
+AGGCGATTATGCGAAAATGTAACTATAATGTGAATTTTAATTTTGATGGTTACGTGAAAA
+ATTTCCCTACTTTTATTGAGGGTAAAATTTTTGATGTTCAAAGTGGTCAATATATTATGT
+TACCTGTAGGTAAAATCCTTGTCACATTGCAGGAGAATCCTGATACATTAGCCATCGTGA
+TTAATCAACGTTTTATTTCTATGAATTCCCCTTGGAAGATTACAGGCATTGATAGGACAG
+TAAAAGGTTTAATTACTTTATCCTGTGATTTAGATTTATGGGGAGCAAACGATGATAAAA
+TCAATGAAATTGCTGATGTAGTTACTTATACAGTTGCATTTACTGATGTTTCACCTGTTT
+CAGTTGATATTGGCTCAACTTATCAGACAAATATTTCAATGGCAAAAGATGGAGCGAGTG
+TAACCTTCCCTGTAACATATAGTTCTGATAATGGCAATGTATCTGTTGATGCTAATGGTT
+TACTAACCGCATATACTGAGGGTACGTCAATTATCACAGTCACAAAATCAGATAATCCTT
+ATGTAAGTGCAACTTTAGAAGTGACAGCAAAGGTAAATCATGTTCCTGTTGTTGTTGACC
+AAATATTACCTAATGTTACTTCTTTACTTCAAACTACGTCTCAGGATTACACGGTTTACC
+AATACGTTGATTCTGTCGCGAATTCCGACACCTTTACTATAACTGCTTCAGGCCCAACAA
+CCACTTATTACACTTTGACAGTTTCAGATGGAAATCATTTTACTGTGTACAATAAGCAAT
+ATATCGCAACAAAATTGGTTATTACCTGCACGAATAATAGAGATGCTTCGCAGGTTCAAA
+TATCCATAGATTTAAGGGGATTGTGGTAATGGAAAAGGGATGTACTTTAATTACATCCCT
+TAAATTTAATTACTTGTAGTTACCTTCAATATAACAAAACGCATAGTTTTGACTGTTATC
+ATCATCATAAACAAACCATTCTTCTGTCAAATCATTGAACATGAGAGGGTATTCTTTACC
+TGCTGTCAGACAGAAATTGCTTACTGACGGAATCCAAACCTTTGCATTATTGATTCTAAT
+TTCATCTTCAAGAAAATGAGGAAAATTAATTATATTAGCCATGATTTAATCACTCCTTGC
+AAATCTTTACCCTTTTCAGTATGCCAATCACAACCTAAAAAGGCAATATTTAGTTTTAGA
+ATGGAATTACATTAGGGGCATTTCAGTATTTGCATGGTCAGCAAACACCCCCTTGTAATT
+CCATTTTGTCTAAGGGGTTATATTTTTCAAATTCCTCTAATTTATCATCCGTTGACCAAT
+ATAAATACTTTTCAACTGTTTCAATCGTTCTATGTCCTAATTGTTCCCTGAGCGATGCGG
+TAGACCCACCATTTTTGAGGTAATTGATGGCATATGTGTGCCTATACGTGTGAGGTGATA
+CTCTGATTCTAGGGTCAATATTGGCTTGTACTCCATATTCCCTGAAATTTTCCTGAATGG
+TATTGTCGGCAAGTTTTCCACCATCCTGATTTTGAAACAATATATCAAAAGGTTTGGCAT
+TGGGAAGGCATAGGCGAATGAAACGTTGTAATTCAGGTTTAATTTTCTTAGCCATTCCTA
+CAATTCTTGGAGTTCTGTTTTTACTTTCTCGAATGAGAATTCTATTATTCTTAAAATCAA
+TATCAGAAATAGTTAAATTAAGACATTCACTAATTCTCATTCCAGTGGATAAAAGCATAA
+GCATCATGCAATAATCCCTATATCCTGCATGTCTGGACTTATCTGGTTGTTTTAACAGGT
+TTTTAATATCTTCATTTGAAAAAGGGATAATAGGTTTTTGGTCAATTTTGCCCTTTTTAA
+TTTTTGCCATTGGATGATCTTGAATGATTTCTTGCTCAATAAGGTAATTGAAAAAAGGGC
+GAATAGATGCAATTGCTGAATTAATAGTTGCTTGAGTATTGTTTTTAGTTTTACGCATGA
+AATTAAGGAAATCCTTTATATCCCTTTCAGTAATTTCATCAACTAATAATGAGTGTTCAT
+TTTCTTCCAGATACTTCTTTAAATACCCTAAATAAAAGCGATAACCTTCAATAGAACCTT
+GAGTTAGATTTCTTTCCTCACAATGAATTAAGTAATCATCAAATTGAATTGAGTAATCGG
+TAGGTGCTACTATTTTTCTTGATTTTCTTTTGACAGGGGAAATAACTGCTGATTTTCTAG
+CCAT
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_018515.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_018515.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,888 @@
+>NC_018515.1|provirus_3418112_3436097
+CTATATGAGACATCCTCTGATGGGCCTCGCTGCTGTATACACCAGTGTTCTTTGGACAGC
+ATCAATATCCATCCCGGTAATTTCTCCGTCTTTCACGGCAACTTTATAGGTGCAAATGGA
+GGGATGACGTTTGGAAGTAAACTCCATGTCTTCCCGCCGCTCAAAGATCACCTTCACCGG
+CTTGTTGGCCTTTTTGGCTGCAACTGCGGTTTGACAAGCAAGAATGGAAGGGAAGGCTTC
+CTTACCGCCAAGGTCCCCGCCGGTGACATCCTGGATAACCTGAACGTCCTTCTTCTCATA
+ACCCAGAGCCTTAGCCACTGCACCATGGACATAATAGGGACACTGCAAATCACTCAAGCC
+TTCAACGGTGAGAATCCGTTTTCCTACGAACTTCGATACTTTCTGCACGCAAGCCTTAAG
+CGCTTTGCCATCCACTAAAACCATACATGTCCCGCAGGCCCCTTCACTGCAGCCATCTTT
+TACCGAAGCAATCCGCAAATCGTCTCTTAAAAAGAGTAATAAACGTTTGTCACTCATAGC
+AAAGACATCTTCACCATTGATATTTAAGGTAAACATAAATAACCTCCTGTCTTATAATGA
+TTCAACAGCTGGTGTTATGAATCATTATAAGTAGGAGGTTATACTACATCAAATTCTTTC
+TCAAAAGCACTTGCTTTATTTGTTTGTATTCCACTGATATCAAGGCAAATTTAGCTCTGC
+CAGCCTTCATCAGTATTCACTGGATTACTCTTACCGTAGCAAGATCAGGCTTGCTGAACG
+CTTGAGATCACCATAATAAAGTACAAAGCAAACTTAGCATAAGCACTAACTGCATCTCCC
+TTTTCAAGCTTAACAAACCCCTCACATTCATACCTGTTTCGGCTTTTGATTCTCGTCAGA
+ATTTTTTATCCCTAATAAGTAATTCTTTGCACTAGCATAAAATATTTTAGCCATATCCGA
+AAACATTGTATAAGTAATAAACAGCCGCGCAGTCCTGGGCAGTAACCGGTAACCATAATC
+AACTACAAAGGAAAACTTTTCATCCCCGTTTTTGAGCACCAGACACTCTGCTTCCTTCTC
+AGCTCGGAGCATAAGCGAGAGAATGATCTGTGCAGCCTCAGCCTTCCCTTGAGTTACCAA
+GAAGGTGATAAAGCCTATAACGAATAGGATTATCCCCCAGTAATTCTGGAGATACGCTAA
+AATAACATCCACCTCTGTTTTCCTCCCTTTCAAATACAGCTGTAGATAAACTTAAACCTT
+TTTGCCCATACCCAATCCCCGGAACTGACCAATGCCCCTTCAGATTTTCTCAGTTATTGT
+TTTGTGTCATGGTATACTCAAAAACATTAACGCTGTCAGTGTTGCGCTGTACGGCTCCTT
+TTTGAGCTTGACCTGCCTCAACTGCCTTTTTTACTTCGGCGATTGCAGCATCTTGATAAC
+TTAATGCCATGGTCTGCTTGTCATTTAGAATGACACGATACATAACGGTAGGTACTGGAT
+TTAGAGCAGTATCTTTAACCGATTCTGTATAAGGGATACCAACAGCACGGCTGAAGCCCC
+TGCAGATTGCCGAAGACACCGACTCATCAAACCGGTCTTGTTTCATGAGTGCCTCTTCAG
+CGGGATTTGAGATAAAACCGATCTCCACCAAGACCGCGGGGCAATCCGTTTCCCTGAGCA
+CGTGGAGATTATTAAACTTAATCCCCCGATTAGTGAGGCCAGTTGCAGCGACTAACTCCT
+TCTGGATCTCCTTAGCTATCTTTTCTCCCTTCCCGCCAGCTCCTAAGGCTATCGTTTCAA
+TTCCGTGGGCATTGGGATCTGTGAAGGAGTTGGCGTGGATTGATAAAAAGTAGTGTGGCT
+TATAGTCGTTCGCTTGGTTTGTCACATCCCATAGATCTCCGTCTTGAATTGCAAGGATCT
+CCCAGCCGTTCTTTTTCAACTTCGTGACGACTAATTCTCCAACTTCTTTATTTTGCATGG
+CCTCCTGATAACCTGTTGGCCCAATGGCTCCAGGATCATAACCAATGTCTTTAGGGCCGT
+GGCCGTAGTTTATGACTGCTTTCACTTAACCAGCTCCTTCGAATAAAAAGCTCATTTAAT
+AATTGCGATTACGGCAATCGCTGTACTAATAAAGGCCCCGACGACTGTGCGCCAGAGCCA
+TGTATTGTTTGCTTCGAGTTTGTCGATACGGTGAGAGTTTGATTTTGACCTAGCTTCCGT
+TTCTGTAGCCTTGTTTTCGATGCAGTCTACCTTTTCTCTCAATCCGTTTTGGGTATCTAG
+TTTTGTCTCCACTCTCACGAGGCGTTCTCTTATGTCTATTAGTACTTCTTGATCGACCAT
+ATTGCCACTGTCCTTTCTAGAGACATAAAAATAACACCCCGTATTTAGGCGTTTTCTGCG
+CATAATGGGTCAACTGCGTATTAAGCTGTTTGCCGTTGTGATGATAATAATGTAGATAAC
+TCTTGATATTCATCTGTAGTAAGTCGTTCTCCTGCGTAAAAGACATCTAGCATTTCATGC
+ATTTGTTCAAACGAGATGAATTGTTTTTTTTCAATTTTCGATTTGCAAAGTGTATAAGTT
+AATGTATGCATGTAAAACTCCTCCTTATAATCCTAGTTCCATCATAATTAATCTATAATC
+GAGGTTTAGTACATAATCCCTTAAAATTTCGTTTTCGGTTGGTTGCGGTTCGGGTTCTGG
+TGGTATATCTGTTAATTCAAGAATTATTAACTCTTCGTTCTTTATTTCGTAGTAAGCTTG
+TTTACTACCTATAGCGTCGTACGTATCTTGGGATATTTCGTATAGAATCTCGTTTTCTTT
+CACTCGAACTATAGCACCTTCTGCTACAGCTGCGCAATTAGTAACTACGCTTTCTTTTTT
+AGATACAACGGCATAGTAACGCAAGTTTAGCCCTCCCTTTATTGTAGTGCGTACACTTCG
+TTTGTTTTGTAATCAAGTGTTGCGTTGGCGTACATATACGTAGGACTTGAAGTGTTGCCG
+TTGTAGACGTCAATTCTTATTGAATAAGAAGCACCTACAGCTATATCTGTTAAGTCAATA
+TCCGCGCTCAAGTCACGACCAGACGCGTAGTAAACCTTTTGGACTCCGTTTAAATAAAAA
+CGCGTCCCATAGCCAGCCGCTTGCGCTGTATTCGAGGTAGCGTTAAATCTCAGTGACTCC
+ATATTGATAGTCAGTGTGTCGTGGCCCTTTAATCGGGTAAGGCTGACTGATTTCAAAGTA
+CCCCATGTGTTTTGCGCTACTACAGCTTCGTTCCACGCCATAACTATGTGCGAAAGAACG
+TACCTAGTGTCTGACGTAGTAGCCACCGACAAAGACGTAGCTTTAGTTATGGCGGTCTGT
+ACAGCTGCTGCTAGGTCGGTTGTTGGAATACCTAGAGCTGGCTTCGAATATTTAGAATTC
+CACAGCGTTTGCTTTTCGGCAGTAACATGTTTCGCCACATCCGCCAAATGCGCAGCAAAA
+TCCACCTGCCCAACCCTGCTCGTATCAACAGGATGAACATGATCTGCTCTGGCATATCTC
+TTCGAAGCCCCTACTCCCGCTGTCCCATTCATGGTCGGTGCAGTTGTCCCGGCCTGGCCG
+AGCACAAAAGCGGTTGTAGCAACCTGTGTCGTACTCGTATCAACCGCGGCAGTTGTTGCT
+GTAGGCGTTCCCTCAAGTGCGGGCGACACCAACGGTGCCTTGGTACCGATGAGTGTTGCC
+GTCGTGGCCGCATAATTGGGGTCACTCCCTAAGGCATTAGCTAGTTCCTTTAATGTGTCC
+AGGGCAGCAGGAGCGGAATTAACCAAACCAGCAACTTTGGTATCTGTATAAGCCTTTGCA
+TTAGCCTCCGCTGTATTCGCTTTCGCCTGTGCCCCAGCCGTAGTTTCCTTTGCCGCCACT
+GCTGTATCCAACAGATCCGCATTATCATTAAAGTCTTGGATATTGACAACATCTGTACCT
+TCGGGCTTTTTTAACCCTAAATTCGCCGTCGTTTGCATAGCTTATCTCCTTTACTCATAC
+ACTCTCAGTTCATTCCAAGTCATCAGGTTCACGCTATTCCAAGTGAGATATTTCAAAGAA
+TCCCACCAAGTATAGGAATACTTAAAACTGTAATCTAAATGGGACGGCTTAATTTGTTCC
+AGCATCTGAATAAACCCTGGCATGTTAGACGGGATACCTTTTACCCCAATAAACCGTACC
+TCAAAGCGATATTCTGCCGGATACTCGATGACATCCACCTCCCCGCCCGAAAAGGCGGAT
+GCAGTATCCAAGATCATATGCTTGGTGGTTGTGCCAGAGCCGCGAATTTTTGCTTTTATA
+GACTCTCTTCTCCGCTCGATAGGCTTATTAGCCTCTGTCGTTAAACCTAACTCGCTTTCC
+CAGCAATCCAATCTCCATGTGGCAGTATCCACAAAACATTGACTCAGCATATCGTCAATG
+GCATATAAAAAAAGACCCATCTCATCCGATGCAGTCTCTTGGAGTTTTTTCATTTCTCGA
+ATGCTCTGATAATACTCAGGCAAATATCTCATGAGGTCAGGAATCGTGTATTCAGTCAGA
+TTACCGTCACTGCCCTCTGTGCCAAAAGTGGTTGTGCCATAAAGTTGATTTCCATATCCC
+ACTAGACTTACACCCCCTTTAATTGGTCCCAGGTTACTGCGCCCTTGGGCATAGCGTTCG
+CGACGATCGCTTGGGCCACTCTTTGGGCAGTCCATAATCTGGTGGATGTCGCAACACCTG
+CTTCTGCTTCTGCTTGAGATACCGTGCTCCAAGTGCTTGTATGAGCCAGTGTTCTGGTTG
+ACCCATTGATGCGGGTAATGATTCCCGTAGTCGTTGTCCATACGTCTCCATTAACAGGGC
+TCGTTGGTGTTACACCATGGGGAAGGTTAAGGGAAGCCGTGGAGTCTGTCGAGGCAGGAA
+GATTAATCTTTCCCTCAAAAGTATCCCCAGCTTTATTTGCCGGAATATAAGCCAGGGCAT
+CTTGTTTCGAGTTCCATGTAGACTTCTCTGCATCTGTAACAAGTCTATTGCTAGAATCCT
+GAGTAATTGCAGAAGGACTATGCGTATGTGCGCTTGGCGCAAAGGTGCTTGGTTTCTCGG
+TCACACCAGACCATGGCACACTTTCTGCTGCCTCAGCCGCATCGACTTTACCGTCATTAT
+CAGTGTCATAAATACTTTTTAGCATATCTCCAACTGTTTGCGCCGCGACAAGCAACTCAT
+TGCCGCTATCCGTTCCAATATAAAGTTTTTTGGTATCCGTACAAAAACCTAACTCACCTA
+TAGCCAGCGTTCCGATACTGGCTTCAAGACCACGCCTAATTTGGATCATTACTTTCCTTG
+GCATATCATCTCCTCCCTAAAAGGTTCCTCCATCCACGACAGATACCATCAGCCTGTTTC
+CGTTGCCAGCATCATAGACAATACTGCTGGTATCAATGTTGGCTTCTATACCAGTGCTGT
+TGACGAGAATTCCTTTCCCTGCTTTAGCACTCACTGTGGTTGTTCCTACCGCGATCCCGT
+TTCCCGCCCCAACTGTTATGCTGACCGTGTCTGCCTGACCGCCTCCAGTTAGACCATTAC
+CGGCGGTGATAGTTTGCAGAGCCCCGCCAGTTCTTACCCAAGCGGTTCCGTTCCAGGAAT
+ACACTTTTTGCTCATCATCGACATAACATGTCCAACCTGTCTGGGGTGTGTAAAAAAGCC
+AAGATGCACCATTCCACTCAGCAATTTTTGTAGCCTGGCTGACCCATGCCCCAGTGGCAC
+TGGCGGGAATAATATATCGGTCTCCCGTCGTTGGCGACCCAGGGGGAGCGGTAAGATTCT
+GATCCTTGACGCTTGCTTGAGGTTCGATATTATGTTTGGCTAACTCAATTTCGTTGTTTA
+TTTTTTGAGCACTCCACAAATCAGTTATCGTCGTCCCGGCGTCATTGATCAATCTGTGTT
+TAGCAGAATCGTCAATATGAGTCTTTATTTCTACTGCAGTTTTAGTGTTCGTTCCATCGG
+ACACTTTATTAACCTGACCATTTGTGAGATCTGATTTTTTGACCTTGGCATAGGTGGTTC
+CATCAGCAATGTCATCTAAGGTTCCCGTCAGATCCGTCAGTTTTTGCGCATTGACTCGCT
+CCCAGACTGCACCATCATCCAGGTAGAGATTACCCACATTAGTTCCGCTAGTAACATAAT
+AAAACCTTCCCGATACTCCTGCATTAGGCCGAGCCGCTTCTGTGCCTGATAGTACCCGAC
+CAACAAAAATATTGGCGATTCCGTCCCCGATGTAAACTTCCTTAGTATCTGTGCATAGTC
+CCATTTCCCCCGTTAACAAGGCACCCAAAGCGATCAACTCAGTTTTTGTACCACGACGAA
+TTCTTATTGTTTGGGCCACAAATTACACCTCCTCCAAAAATGTTCCACCATCAACGATAC
+CCTTTTTCTTATAGCTCTCTAACGCTTGTTGAGTCGCTATAAGACTTTCTTGCAGTAAAT
+TGATATCTTCTGCCTCCACCATATCCCCGAGAGTCTCATAGGTCACATACACTTTACCCA
+CACTGGCAAAGATTTTAATCATCCGCTTCCAAGGGGATTCTGATGGGATTGAAACAATAA
+AGTTTGTGATCTCTTCTCCAGCAAAACGTGACTCCGTATAAACCCTGATCGTGCTGTTCG
+TGATATTGTCATGGCCTAAAAGCCCGCTATACACCCCCTCGAAAATTGGCAGTTCTTCTT
+CAACGGCATAAGCACTGCCATCTGGCTTTCTATTGAACTTTGGCGATAACTGGTCAATCT
+GCTCAGGATAGGGCATTTTTTCATACCCCCAGTCCTACGGTTCCAAGCACCGGTATTTCT
+TCATCCCGTAAAGCAACGTTTGCATTGCCGTTATTAAGCGTTAAACTGACATAGTCAATG
+ATGCCAGGTGTGCTAAGCAGTAATGTCCCAACTTTGGCATAACTGACATAGGTACCCGTA
+AAAGCCATCTCTTGCAAATAGGCTTCCATGGATGCACTAAAAGCATCTGTCACAGCTTGG
+ATAGCATAACCTGAGGCCAACACTACTCCAGCTGAAACATTAACCCCCTTAGCGGCTGCC
+GAAACAACAGTCACTGCAGCACCAATTGGCCGGACGGTTTCAAGGTATTTCATAACCTCA
+TCCACTAAGGTTAAGGAGGCTGGCTGTTTTTCGGTATCCACTATGGCAAGCTTCACTGTT
+CCAGGTCCTGCCCATAACGGAAAGACTTTGGCATCTCCTACGCCGGGTACTTCTGTGGCC
+CACTGCCGATACTGAGCAGCATTTCCCGAGGTTGCCGGCTGCCGAACTCGCTGCAGATAT
+CGCTTTCTGAGCTCGTCATCCGACTCTGTATCTACTCCAGGAATCAAAATATCGACCAGC
+TCCGCCCTTACAAGTCCACTAATAAAGTCAATGGGCAACATAGTTCCGAAGTTCTGGTTT
+CCTCTGCTTCCTGCAATCTCACACTCCAAACTATACTGACCGGTTGAAATTCTTTCCATA
+GTCTGATAGTTAACCTTCTCTATGGAAAAGCGACTGCCCACGGCCACCTCCAAAGGTAGA
+TTATCTTTTCCAAAGAACAGGGCTTTCCGTAGTGCCTTCGTAGCAGCTTTACGAGTTACT
+CCATAATCTGCTGTCCTGTATTCCAGATAGTCTCCGCTTGAAGTCTGAGCCGAGAATAGC
+CTTAGATTGATCTCTAGCCCTGCATAGGCCTGAGCCAACTCTGCTGCAGCCGGGGATAGG
+GCATCATAAATGATGCTGCCCTCTCGTTTGTCTAGGTCTACGTCAACCCTGTCCAACATT
+CTTTTCAGTATTAACTCGTAAGTTTGTGCTTCATACACTAAACCTTCACCTCCTGAGTCA
+TATCAAAGCTCCCATAGCTGCTGATCACTGTAAATTCAATCAATAGACCATCCCCTGCAG
+CTGTGATTTGAACATTTTCAATAGAAGAAATTCGATCATCTTGAGTCAGGGCTTCTCCAA
+TCATCCGGCTTATTTCCGATTGGACAAAAATCGGATTGCTACCGATTAACTTCTCGAGCT
+CAGAACCATAGTTAGCTGTGTAAATCAAATGGTGCAAGCGTGGAGTCAGCAATATCTTAT
+AGACGGACTGCTTGACTGCCTCGATTCCGTCTAACCTGCCTACAATTCGATCTTTGGCCA
+CATCCAGCTTCCAAGTGAGTGACGGCTGCTCTATTTCTTGAATCGCATCATTGGTTAAGG
+TTCTCCCTACAGGAATCATAGCGTCACCACCTTATCTAAAATTACAAATTTTTGACCACC
+CTGAACTCGAAGCAACAGAACCATATCTCCAGCCTTGAGACCTCCGCGGATTACGATCTT
+GGTTGTTAGAGCTTTGGCACTATTTCTCGATGAACCGTCGTCAGTGTATTGGTGAGTATG
+CTCGAGATCAAGTTCAAACGAAGTCATACTTTCCGGTACCATTAAAAAATCCGCCGTAAG
+CGTGAATCGTTGATCGACCATCACACTGAGCGGATTAACTGTCATGACTTCTCCAGACAT
+CACGGTTACGGGGTTAGAGGCTCCCACTGCGTCCATTCCTGCAGTCTTTATGACATCCAG
+TAAACTTGCCATTATATCACCTTCATAATTGCTTTAAGTTCTAGGCTCATTTTATGATCT
+GCTCCGTCAAAACTATGGGTACATTCATCCACCAGAAAAGGCTGATTGATTCCGTACTCT
+TGAATCTGGATTCGAACATAGCTTCCTGCCCTTACCCGAAGATCGCCGATGGCTTCAATC
+TTCAGAGTCTTTGACTCTCGGTTTTTCAATGTGGCCAGCGTATCAAGAAGCTCATTGATC
+TGAGCAGAGTTCATGTCTTCGTCCACACTTTGGTAGAGCTGTAGGACGCCCCACTTCGCC
+ATATTTACGCTGTCTTGGGCACAATAGACCTCACGCCTGCCGGTGTCTTTGTTGTCCTTA
+TAAAGCTTAATTTTGTTATAGGTGTCGGAGTCAATCGATAGTTTATGGACATAGTCCGTC
+ATGAGACTATTATCCCCGACGACAAAGTCCAGCAACAGATCCTCTACATTTCTAACGGAT
+AAAGAACCGAAGTCATCGAAGAAGACGTAGTTTTTTCCAGAGTTAATAAGGGTTAGATCC
+AACGCCTTGCAGATGACGTCTAGAAGCTTTTTATCGTTTTCGCTCATGGTGGGAATCCTG
+TAGCCGGTATCATCAATTTGGCCGAGCTTGAGATTGAAGTCGGCAGCGATCTTTTGAACC
+ACCTCAGACGCTGTAATGTTGGTAAACACATAAGTATCATTGGACATGAGGTAGCGTATT
+TGGTCATAGCAAGTTATCTTAACTGCCTCATCCCTTCCCCCATCAATGGAAAAAATATAG
+CCAAAAAAGGCCTTGGCTCCATCTTCTGCCCTTTGAACGCTGACAATATCCCCATTACTA
+TATTTAAACGTTTTGTCTTGGCCAGGGGCGTTTTTGATGAGTGTGAAGTCCAAGCTGCCT
+GCTTTACCAATCCGGCTGGTTTTCCAGCTCACATCGGCTACCAGGCTAGAAATGTCCCAC
+ACGTCGCCGTCTTTCTTATCGATTAGTATTTTCAGCATAACCAAGAACCTCCTTTTAGGG
+CAGCTTTAAAACCCTGCCGATCTGCAGTCGCTTGATCTCGGCATCAGTAATATCGTTTAT
+TCTCTGAATTTCCGGCCAACGTGCTCCGTTGCCAAGAAACTGTTTGGCAACTGCCCAAAG
+TGTATCACCAGCCACGAGTGTATAAGTTTTAGGCTGTTGTGTCTCATCCGGGCGCGCTGG
+AGCTGCTGTTGTCGCAACGCCAGCAGCGCTTGGATTTGAGCTGATCTCAACCTTCTGTGC
+GGTATAGGGTACATACATTTTCAGCTTAATGTTGTAGTCAATGTCTCCTGCCCCACCAGC
+TACTTCTTTCCAGTCGAAACTCTCAATACTGGCCAAGGTGTTGATATTGTAGCGATCAGA
+AATAAAAATAAAGCGAATAGGCTGTGCGGACTCCATCCACTTTACGATGAATCTTACGTA
+TTCAATGGGCTGCAAAAGGGTTTGTACCGTTACAAATGGATAACGCTGAGCAGGGAAAAG
+ACTGCTAAATCCATATTGGCTGAGCTTGAGATTCTTGATCACATTGATTTCTCTTAAACC
+AACAATGTCATAAGTCTTGCTGCTTATGGCTTCGCTGATTTCAAGGGACCCCGGCATAAC
+AGGTAGTTGAAAGATTTCAGCCTTGTCATTAAAGCTCAATTCTATTCCATACGGCATTAC
+GCATACACCCCCTGAGCAGATGAGGAAATTTCGCTCTCCAGCATCGTCTTAATCTTTACT
+ATAATTGAATCTACACTCTGCCCGTTGTGAATATCCCCTGTTGTCACGGCCACCGTCGGA
+GTAAGGGTCACAAAGTTTTGAATGTTCTTCATTTCAGCCAGTTCACGCATAGTCTTTAGG
+TCTTCGCTGGAGATGTCCACGGTGTTGTTTATTTTACCGACTTCGTTGACGCGGTCGATG
+GCGGGAATACTGCCTGCTCCTCCGTTCCAGCTATTCAAGATTTTTTGTTGATCCAAAGTC
+GAAGTATCCGCCTTTCCCAAATCAGCTAGACCAAATTTCTTCTTAATATCATCGAGGCTG
+ATATTTTCAATAAAATCTTGTCCGGCTTTTTTAAATTGGGAGAAGTCAGCCTGAAATTCG
+ATTTCCTGTATCTGTTTAGCATCTATGCCTAGAAGGTCACCGAAAAATCCAGCCACTTTG
+TTAATCGCATTGATAGCATTGTTGATACTTCCAAGGATAAAGTTTATTGCGCTCTGAACA
+ACATCCACAACGAACCCAAAAGCTGAGCTAAATACATTCCTAATGCCGTTTGTGACTATA
+GCGAAGGTCCCTAATGCTGTGATTAACCCTACGATTAAAGCTATAACTATTCCGATAGGA
+TTCATGCTCATCACAAAATTGAACACTCTTTGCTTTAATAAGGCAAACGATATTGCTCCC
+GCTAATTGGAGAGTTACCAGGGACCAGCCAGCTGTAAGCGCTGTGATCAATGGAATTAGT
+GTCCCCGTGATAAATATAACTGCGTTATAGATTCCCCAAGCTGCTGCTATCCCTAGAATG
+AATGGAGAGAGCCCCACAAGAATGATTCCCACATTATAAGCGACATCGCCAATCATTGAT
+AACCCTTGTAGTAGAAGAGGCCAGACTCCTTCCCCGGTACTCACGAGCCACTGAAGGCCG
+GTAACGATCAAGAATAAACCTATGCTCAGACCCTCAAAAAATGGCTGAAAGCTTCCCTCC
+TGAAAGGCATCATTCAATCTAATCATGAGAGGAGTAAGGGCTTCAGTGGCTTGTTGCCCT
+GCATCAGCAAAGCTGGATTTCATATTGTTCGTTAAAATTTCCAACTGTTTTGTTGGAGAC
+TTCATCATTTGATCAAAGGCCGCTTGTCCCATATTTTGTTTTTCGAGGAGCTGATCAAAC
+GCTTTAATGAAACCATCAATGTTTCCCGACTTGCCTAGATCCTCAATTTTAAAGGCCTCC
+ATATCGAAGTCTGATATACTGAAGCGTTTAGCCAAAGAAGCGGTGTTGCCGGACATCGCT
+TCCTTAACAGCGGATGCTGCCCCTTCAATCCCATTGCCAGCATTGTCAAAAGCGTTTAGA
+CGAAATGCAAAATCATTCAGCTTGGATAGTTGGTCTACATTCTGGGTGGACGAAAGAAAT
+GTAAGACTACTCTGCAAGGCTTTATTGACATCCTGCCCGGTGGCGAGTGCCTCCCTTTTG
+AACTTATCGAACATGGCAGTCCCAATTTCTGTATTTCCGGTCCGGGCGATAAACATATCT
+TGAGTTTTTCGCTGCTCCATTGCGCCACCAATGCTTGCTTTTCCTAACTCCGTAAACATT
+TCGACAGTTGCCTGGACGCGAGAGGATGCATTAAAAAACTTCAAGATTGAATCAACTGTT
+GCCAAATCGGAAACCTCCTTTTGCGCATAATAAAAAGCACTCTGTTTCGAGTGCTTATAT
+GCTATGATAAATTTGGTAACAGAAAAGGCTTGCAGGGCGGTCGGCTTATGATTTCATTCG
+CGACATTGGTGGTGTTAATACTTTCTTTCCATAAACGGAAATAGACCGCCCCTGCCGAAA
+GGTTTGCGGTCTATCCGTCACCCTAAGCCGTCCGCCCTTTTAAGCGGCTGTTACACAAGG
+AGTCATGTTTGCAGCATGGCTTCTTGCTGTTACGATACGTAACTTCTGTCTTTAGCATAC
+CATAATTGTTGAATTTTAACACAAGCTGAAAGATAAATCAGGCAAGTTTGAGGCTTAAGA
+CTTGCCAATATCTCCGTCGTACAATCCTCTTCCTTATAAATCCTACTGATCAATTGCCCC
+TGTCAAATAGGAAAAGAAGAAGCTTAGGAACACTAGACATTATTTCTTCTTTATCTTCGC
+CCTATCTTGTCTTTCCTTTTTAATTCGAATATCAATCATGGCAAAGATAGCGGCCTTAGC
+TTCTCGTGTTTTTTGGGCCAGCTCATCGGGGGGAATATGGAGTTCGTGGAGGGCGTAGTA
+AGCGTAATTCCACTCACCCTCGCCCTCCTCAATTAGTTTTTTACCTCATCCATCAGGTCT
+TCCAGGCTTTGATCAAAACCGTTCAGTTCTTGCACCTGCTGAACAAGGGTCGCATATTCA
+CCGGGAAACAGCATCTTGCGCAGCAGCTCTTCAGCGCCTATGACGCCGTAAGATTTTTGC
+AACTCAGCATTTTTCAGATCAGGGAAGCTGACACTTGCCACGATGATTTTGGCCAGATAG
+ATGTTCTGATCTATTTCAGACTGCTGTGAACCATTTTTTCCCTTAACTTTCCGAGTGGCT
+GCTTTTCGGTACTCTTCATTTTCAGCTTCAGTTATGCTATGGATTTTCCAGGGTATTGAC
+TTGCCGTCATTGTCCTTAAACCGCTCGGATATGACAACCTCTTTGCTGAGATCAGATCCT
+GCATTTTGCGCAAAAAATGCTTGTAAATCACTCATTTTCTCTTCCTCCAGAATTTCTGAT
+TTCTATGATAACTACCACGAGGATACGACTTATCTCACAACCGGAGCATTAAACTGGTCC
+AAAAGATCAAAATCGTCAAACGTAAAGGGTAATTCTTCCTCCAAGGGGTCATCTGACGTC
+GCATCGAAGGCTGCAGCCACCACGCTGTCCAAGTTGCAATCCTTGAGGACGGAGGTCTGT
+TTGCCAACTGTAGAGGCAGGGTCCTCATTGACAATCTGCAGATCAAAGTAAAAATCTTTG
+CCCGTCTTGATATATTCCATCATCAGCGCCCTGAACATGCTCGTAAAGTAATAAATCGTC
+AGTGTTCCGGTCCCAGACCAACCGGCTGCCTTTTTGCCGACGTTGGTTTTTCCCAATATC
+GGTACATCAGCCTTCGTTTTTTCGATAGTCGCTTCCACTGTTTTGGCATAAAACAACTCT
+TCCACGCGGCCATTAATTGTGACAAAAGCCTTACCTTGCTTTCCGGATATTGCATCTTCT
+GCTTTAAGAAATGCCATAGCTTATCTCACCTGCACTTTCACATAGATTTTCTCAATAGAA
+TCTACCGGCTGAGCATATGCCTCAATATAGACACTATCTAATTCATTACCCGTTTGGACT
+GTCAAATCTGCTTGAGAGTCAAAATTCTGGACAGCATCCATGCTCTGAAGTGTTTCCATA
+TATTTGACACACTGGGTTTTTAACAGGTTTCGTCCATCAGCATTATTGGATACCTGCCCA
+ATGTAAAACTCACTGAAAAGCTGGACAAAATCGTTATTAATTCCATCGAGAACTCTGATC
+ACGCGGTTCTTGGCAAACTGCTTACCTTTTTCTAAGCTCGATGTGGTTAGAGTATTAATG
+TCCTGCTCGACGATGGCTCGGTTGTCATTGGCTGTGAAAATAAATTCCCCAGCCCGCAAC
+GCTGCAATGATCTGTGCATTGGTATACCTCGGAGCTACATCCACTGCCCCATCATAAGCC
+TGATAGGTTAGAGATTCATTCACTTGAGCACCTGCAGTTGCACCGGCTACCCAGGCAGTA
+GCTTGAGCTGCACTGAGGGTTGTGCCGTTGGCAAGAATGACTCCGTTCTTCACACTGATC
+ACGCCTTCATAATCAGCTGTTGGATAGTTTTCCAGCACGACCTGAATCTTTTTTCCTTCG
+TTATCTCGAAGACGTTGGCAAAACGCTGCGAATGTTGCTTTAAGAGTATCGTCTGTCGAA
+GGCAAGGCTATTGTGTTAAAGTCATAGATCTCGACTGCTGCCAAGTAGTCAACATAAGTC
+TGATTGGTGATCGTGCCATCTGCTCCTCCCATCAAAGGGACGCCCGCCGTTTCTGTCAAA
+GCTCCTGTGCCCGAAAATACGACCCAATCATTTTCTACCAGATCCGCGATATAGGGAACA
+GTTTGCTGATCTACTTCAGCCCCATCCACTAATGTGGTAACATCAAATTTAGTATTATCG
+TCAATGTTTTCCTGAATGACCAGAGACACATCATTCCCTCTGATACCGCCCCATTTGGCT
+GTGACCGTAAGGTTACCAGTTGTCACGGCTGCCTTTGTCCCAACATTAAGTCTGTATAAA
+AGCAGGGTTTTGGCTTGTTTCAAAGCCTCTCTAACTAAAAGCAGTTTGGCATCCCCCATC
+GGATAGCCCAGCTTGACGAAGGTATCTTCACCCGCCTCAAGGCTGATGATTTTATTAGGC
+TCACCCCATGAGAGCAAAAGCGGAAGAGAAACAATCCCTCGCTCTCCAAGTGCACCTACT
+ACCTGGGGCTCTGATTTAAAATTAACATACACTCCCGGTCGTATTTTATTTTGAGTCGTC
+CATGTACCTGCTGCCATCTTATTTAGCCTCCCTTTTTAGAAAATCCTCAAGAATCTTTTT
+GACCTGATCGTGACTGTATTTCTGTCCTTCTTCCAAGAGCGCCTCCAGCAAATCCTTGCG
+GAAATATTGCTTGGACTTCAAAATCTGCTGTTTACTATAAATCTTAGGGAGCTGCTTATC
+TCTTTTTTCAGTTTTAACCACGTAAATATCCCTCCTGTCTCATAGACCCCATTAATGGAT
+CTGGTTCAACACTTCGCTTAACATGAAAATTGTAAGCCACAAACCAATGAAGTACTCCGT
+TGACAATTTCGTGTCGCATTCCGCTGCCTCTAACGAGGCCGCCGTCCACGCTGATCAGCT
+CCAGTTTGTCATACAATTGCTCAGCCATGTCATGTAAGGCCTCATTACTCCCTGCAAAGT
+AATGAATATCGAATAAGTGATTGCGCTGATAATGCTGACCCAGCAGCTGATTTTGTGACA
+TAGGAAACAGCTTTACATAAAAATAAGGCTCTACCAAGCCTTGATCACTCTCTTCGCTGT
+ATGTGCCAATATTGGGGAAGCTCTGATCCAGAGCGGCAATAACGCCATCTAGGACACTAT
+TGACGGTGATCATCAAATCATCTCCTTGACCTCGACCGATTACGATTTTTTAGAGCAAGC
+TGATTAGCTTTGGCTCATAAATCTCGGGCGCTGTCCAATTTTTCTAATGGACATTGTTTT
+AATGAGTTCTTTAAAGTCTTTCATGATCGCTGTTCAGATAAGAGTTCTTAATGTGTCAGA
+GTATTACCCCCCTCTCTTCAATCCTTCCAAAAGGACTTGCTTAGCCCCGATTGTTAGAAC
+TATTGTCCCCAAACCTTGACTCTTCTGAAAGAACTAGCCGGAACAGAATCTCGCTCATAC
+CATCGTTACTCCTCGGTTTCTTCGCATCATCCGGTCCCAAGCCTTAAACTGGGCGGTATC
+CTCGTAGTTCTCCTTAAACTCGCCTTTATCCCCACATAGCTTCCCCGTCCATTTTAAACA
+GTTGGCACAGGTTTCTTTAAGTTTTGGTTTTGGTTTTATTGGTGAGAATAAGGGGCAGGG
+TTTGGTTCTGGTTTTCACGGCTTGCACCTCGCTTTAATGAGATAAAAATGAACGCCCCAA
+ACATCGGAGCGTTCTAGCCAGAGGAGGATTATGTTAGAGCGGGTCTCGTTCCTAACTTCT
+TTCACAATATTATTGTATCACGCTTTTTTCCAAACAAAGTGCAAACCCTCTGCCAAAAAA
+GTGCCAAACTTTCACTCCCAACTCCCCTAATCACGTTTATATATTCCTAATAAAATAGCC
+ACCTCTGACAACAGTTCATCTCTTACACGATAATAAGTCCGAAGAGGTATTTTCATCTGT
+TTTGCTACCCACCAGTCATAATTATGTTTACTAAAGTAGCGATACTCAATTATCTTCCTT
+TCGTCTTCTCCAAATCCAGCGAGGATAATATCTATCTCCCTGATACGAAGTGTACACTCA
+TTAATCTCTCGCGCTGTCTCCCAACGTTTTGAAGCAATCCCCGCTGTTTGATCGCTAGTC
+TTTGTGGATGCTGGAGTTAGGGAGTAGCTCGCTGTCGTCTTAGGTAGTTCGTTTCCCAGC
+TGAGCATTCAAAATGCAAAGCCGCTTTTTATCCTCCGGATATTGAGAAAGTCTTCTGATC
+GTTAGCAGGTACCACTCAGGCTTTTTGCTTTTTTTCTCTGCTTGATCATCCATAATATCC
+CCTTTGAGTTTTAACATTCTTACATCCTCCTCTCATAAACGTCAACAATCTTTACCTCTT
+TCGGGTTAATTTGCAGTTGTCCTATTTCATCTTGTATTTCCGTCATTCCCTTCTCTGTTG
+ATCTAGTGGTAATTGTATTGTATATCCGTCATTTGCTCAAGGCGAAAAAACCCCTACTGA
+GTTTAATTAGATAGCTCGTACTTAAATTTGCGATTACTCACTTGTATTTCCGTCACATTT
+GAAAAATTAAATTACTTGTTGTTCCGACAATTCTGCTCTATAATATAAATGTCTGATATG
+CCGAACAAATATTCAAGGAGGGAACACCGTGGGTGTGGGCGAGCGAATTAAACAATTCAG
+AAAACAAAAAGGTCTTACTCAAGTTAAACTTGCAGAAAAGGCCGGAATTTCAAGGTCCTA
+TCTAGCTGACGTGGAATCGGATCGATATAATCCAAGCTTAACCACGTTAATAGATCTTGC
+TCAAGCTTTAAATGTTACCGCGAGTTGTTTCCTGGATGACAAAGAAATAGATTTCAGTAA
+CCTTATTCAGCTATGTAAAAAAAACGGCATGTCCCTGAGCTCTCTTGGTGCGATATTGGA
+CATCTCGCCAAAGGAATTAGATCATATACGATCCAACAAGCTCCCCGTTGAAGAGACTAT
+GTCTAAAATTGCCGATCATTTCGAATGCACTTGGGATTATCTTATTGGCAAAACTGACTC
+CCCCGATGATATCGTCTTGGGTGGAAACTCCATTTCCATCCAAGATCCAATTTCAACCCC
+CCCCCAGAAAGTTGGAAGTTCGGTTGAGCCCATAAACATTCCTTCCACCATCGCGGCTCA
+TTTTGAAAATATGAATTTTACAAAGGAAGAAACTGAAGAGATCAGCAATTTCATTAAATT
+CATAGCCTCTAAAAGAAAAAAGTAGTCTTGCGCAAGGAGATGTCACATGAATTATGAGAG
+TTTAATTTTGGAGCTTGAAAAGGAAGGCGTCGAGGTAATAGAGCACAAATTCCACAGCGA
+ATCTTTGAAAGGTTTATATTTTGACAATGTGATAACACTTAATCCTTCAAGTATTATAGA
+TGAAAAGGAAAAAGCATGTATTCTAGCCGAAGAATATGGACACTATCGCACATCCTTTGG
+AAATATTCTAGATCAGAAAAACACCTCCAATATAAAGCAAGAAAAAAGAGCCAGAAATTG
+GGCCTATGAAAAATTAGTACCCTTAGAAAAACTCATCGATGCATTTGAAGCATGTATTTG
+TAACCGTTATGATTTAGCTGATTTTTTGGGAGTGACGGAAGATTTCTTAGATCTAACACT
+TGCCCACTATAAAGAGAAATTCGGCCTGTATGTGGAGTGTAGGAACTACCTTATTTATTT
+CAGTCCTCTCGGCATACTTCGCAAATTTGATAATACCGAATTCTAA
+>NC_018515.1|provirus_4659544_4694673
+TCACATCTTCCATAAAAGCCACCTGCAGGTATTAAGTTCATATTTGATCTCGAAAATTTG
+TACTTCACCTTTGATCTCGCTCTGACATTTAAAGATGAGCATACGATTGCCAGCAAGTTT
+TTCTTCGGACACGGAAACTACTTTATCAATTTTAAGTTCTTTTTCATCAAGCTTGAATCT
+TAAGGGGTGGGGTTTGCCGTTCTCAAACCAAGCTAAGACCTCGATGGGGGCTGCTAAGAG
+TTTCACTTTTCTACCCCCACTTCGTAATTGCTAATGAGTAACTCCCCGGCCTTACTACTT
+TTGTCAGTTCTGCAGACCGAATATCTTACTTCAATCGGGTTAATGTTAAACCCGGTATAC
+AGCTCTCGGATCTCCGGATGGTCATTAATACTCAGCAAGAACTTTCCTTGAATTTTTGCA
+AGGCATTCCTTAAGCCTGATATGATCTTCTTTCGTGAATGGTTTGCTCCCTTGGCTTTTG
+TAGTCAGCTAGGCCGTAATAAGGCGGATCGCAATAGAAAAACGTTGAGCTTCGATCATAA
+CTGGAAATAATTTTTTCGACATCTCTATTTTCGATGATTGTATTTACCAGTCTGTCCCTC
+ACGGATGTAATGTTATCCCTTACCCGCTCAAGAACCATTGGCGGCTTTTTCAAAGGAGTA
+ATCATGAAGTCCTTCATCAATGCTCCAAAGCTGAAATGAAGTAGGTAATAGAATCTGACT
+GCCCTATTTACATCGGATGTACCGGCGAGGCTTAATGCTTTGTATTTCTGGAAGATCTCT
+CTTGAAATAAGCAAATAATCAAAGGCCTGAATGAATTGTTCGGGCTTTTCTTTTACGACT
+CGGAAGAAGTTGACCAGTTCAGAATTTATGTCGTTATAGACCTCCACTTCGGAAGGAGGC
+TTTTCAAAGAGTACCCAGCCAGCTCCACCAAACGGTTCACAATAGCATATATGCTCCGGG
+ATCATTTTTACGATGGTCTTTCTTAATCTATATTTGCCACCCATCCATTTGATTGGACTG
+TTCATGGTTGTTCCTCCTATACTAGAACATATGTTCTATTATAGGGTATTTCAAGGAAAA
+AGAAAAGACCCCATAAGGGGCGTTTTCGAACAGGCTGGGACTTGAATTGGACAACGTTAT
+TATAAAATTGAGTATTAAATTAAAACAACAAAGTATTTATTGCAATAGTAATAAAAAGTT
+ATATTATAAGATATATACCTATAATACAATTGTAATATATTCCCACTCTTTTGGAGGTGA
+AAAAATGTTCGAATTAGAAAAGGAGATGACACCAGTAGTAACAAATAATCTAGGGATCTT
+TTCTCAAAGAATTGCAAATCACGAGAATCTAGCTTTAACCTATGAATTACCAGTGAAATA
+TCGTCTTATTGATATGGCAATTGCCTACGCTCTTCCCGATGGGTATTTCAATAATGTAGA
+ATCATATAGCCCATTAAAATATATCAACAATATCCTTATGGAAATACTATCTATATTTTA
+CTTGTACCCTCAAGTTACAATAAAACGTCTCCAGAAAGAGCTCTTCATGAACCCGGATGA
+ATTAGAAAAACTTTTATATAAGCTTATTAAGCATAAATTAATCAAACAAGTATCACGAAT
+GTCATATCAAATTAATGATTTGGTTAAAATAGACAGTCTTGGTATGATATCTATAGAACT
+TAAGTTGTGTAATTGGAGAGAAGCTTTAGGACAAGCAGAATATAACCTTATGTTCTCTGA
+TTACTCATATGTTGCCCTCGACAAAGCTAGAATTCCTAATAATGGAGTAGATTTGATTCC
+ATTTTTTAATAGTAGAAATATTGGCTTATTATCCGTTTCAGATGATGGTAATATTGAACT
+ACTTTTTAATCCTAAGAAAAACCGGAAAATTGATAAACGTTTATACACAATGCAACGTTT
+GAAAATACTGCAAAGTATTATCTCAAGTCAAAAATGGTACTTGTATTCGAAAATAGGAGA
+ACCTAAGTAAATTACTGTAGGTTCTCCTATTTTATTTATAGGTATTCATCCACAAAATTA
+TCCAAAACTTCTCGCCAAACACTTATATGATTTCCATTTTCACTTAAGGGATTTCCTTTC
+AGCCTGCCCTTCATATATTCCATTTTTGCCTCTGCATCCTGAAGCCATGTTTGAAGATAC
+CCTATTCTATCCCCTATAGAAGGTATTTCCCGAATATGCTCTGCTTGTTGAATTAAACTA
+ATTACTCTGTGCTTACTAGCCGCACTTGTATTACTACGGCTTTCTGTCCAAGATGGTGGA
+ACCACAATTTTTTTGCCTTTTACTCCTAGTGATTGAAGTAGTGGATCACTATGAATAGTT
+ATAATATCTGACTTAAGGTACCTTAATAATTTTAAATTAACAATTTTCTTAAGATCTCTT
+TCTGAATAAAAATCCCCGATTAGACTTGTTGAATAATACTTCGGTAATGACATGCCTCCA
+TCTTTATCTACGAAGTCATTCAAACATAATCTTCGCTCTTTAGTTGAATATCCACTTCCA
+AATGCTGTTGCACCGACAGCCAAGCACAATAAACCGAATGCATCTGCAAAATTTATAATT
+ACTTTTTTATCTTCCACGTACCCTAAATTATATGAGAGTTCTAATAGCACCCTCGCAATA
+TTGGCCTCAACAATCTGGAGCGAAGAAGTACTCTGCTCTACAACAATATAGTACCCATCT
+ATTTCTGATAAAACAGACGCATTGTCTAATAATGTTTGAACCATTTGATTATCATTAATA
+TCACAATCAAGTAAAGCCTTATCGGATATTGCAATTGTTGCAAGGAATGGCTTACTGTAA
+TTACCTTTCAGCTTACTTGCTGCCTTTAGCCATTTAAGTTGTTCACTGAACTGATCTTCG
+CGATTAACAACAAGTGGTGTGGGAATAATTAGATCTGTAACTCCAACTAGTTCTTGAAGA
+GCAAAGCAGGACTTTATACATTCTTGAATTTCTAATTCGGAAGAATACGATGATAGACTA
+ACACTTAAATCCCTTGAAGAAATAATATTAATCTTTCCAGATATACTCTTGGTCGTTCTT
+ACTTTTGGCTTTGAACTCTTCGTTTTTTCATACCAAGGATAAGAACAAAGATTTGAAAAT
+GTTTTCTTACATCTATCCTTATCGATACCATGAAGGTAATATTGAGGATCAAGCAGTACA
+GTAGATAAATCATACGCTTGCCTCTTACATAGCTTGTCGCTATTAATTGAAGAGCTGGCC
+ATTATAACCCCCTGAGGGTCTACCCCATCTATTGTACCGAAATGACCTCGATTATATAAA
+AACAATGTCACTCAACTCCTAAAATATCAAATATTTCCGTCCAACCTTTTGGTCGCTTAA
+AAGCACGAAGTTCTGTTAATTTATAAATAACCTTTTCAAGAGTATTAATAATATTTACTT
+CTTGCGGAAACTTCGGTATAGGGGTATTCAACATAATATCCTGCCTGAAATTATAGGGAT
+GATACCCAGCCAAGCATTGATATGCAACAATCCCAAGTGCGTACAGATCAGCCCGAAGAG
+TAAGATTCTTTCTCCCAAGAAACTGTTCCGGAGCAAGATACCCTTTTGTCCCAAAAATAA
+TTCCGTATTCAGTTAGTGATTCAGCATCGGCATCAAGATGTTTTGCAAGCCCGAGATCAA
+TCAATATAAAGTCTCCATTAGTATCGAGAATAATATTTTCAGGTTTAATATCACAATGAA
+CCACATCTACCGCCCATAATGCCTCAATCGCTAGAGAAATACAATGAATCAATCTTATAG
+TTTCCTGTTCAGATAACTTTTTTCCCGATTCCAATAGTGCTTGGAGATTATCGCCACTAA
+TAAAGTTTGTGATTATATAATAGCAATCTAAACCCCTTATTACCTTTTTTCCACTTCCGT
+ATAAAGTTACGAGGTAAGGAGAATCAATTTCTTTCAATTTAGCAATTTCAAGTTCAGTTC
+TACGATGCTGATGATCAGGACCATAAATTTTCAACAAAATTTCGCGTTGTGAGTTATTAT
+CAATTGCTTTAAAGACAGCTCCTTCTGCCCCTGGCTTAAGACTATCAACAGATTTAAGGT
+TAGGAAATAATGATATAACTTCAGCCTCTAATAAAGGCGGCAAAAAAGGCGAAATCATTT
+TAGGCCTCCTTAAAATTTTAATAAGTTTATAATAGTTCAATAATTTACAATATACTATTA
+TGGCATAAAGTTAATGACGAATTCCCACGAAATTAGTCTTATAAATTAAAAAAAGCCCTC
+TCGCTTTGAAGAGGGCTTTTGTCATAATAATTATACAGATTGTTGTACTGGTTTTAACTC
+CAGATTAAGCACCTGCGATGGTGTTTCCGATATAGATAGCACAGGATCTGGCTTCTGCCC
+TTGTTGCTTCATCACAAAGACAGCCGCCTCAGCCGTACTACGAATAACTTGTTTTAGATC
+CGGAGTAATCTCGCGGCCAGTAAGTTTAATCATATTCATAGCATATTCGGTGGCCTGATC
+TTTTCTCAGTTCCGGAGGTAATTGCCCACTATTATAAAGTTGCTGCGCCGAATGTACCCC
+AGTTTGTGTAACCTTGAGGATCGTATCAATAACGTTATCTACCGGATCAGGAATAATTGG
+TTCTAATACTGCATGTACAGATTCAACGGTATCCACGACAGCACCTGCAACCTGCAGCTG
+CTTCCCTGTATCCCTGCCCTGTTTGACTAACGTCTGGATACCGTACATCGTCCCAAAGAA
+ACACATCAATGATAAACCAGCAATTAATAATGTAATCGTTTGAACACTCATCTTATTTCC
+TCCTTTTTAAGTAAATTGGCAAGCGCTTGGGAATATTAAGCTCCAGTAGCGCTGACTGCA
+GCTGCAGTATCTCCCCAGGTCTTTCCGGAGAGAATCGTTTCGTTTGGATGGCCAACGGAT
+CCCCCGCCAACGATAGTTAAATGCTCTGCCTTATAAATGTCTGCCGGGGGAGTTTTATCA
+TCAAACCTGAGAAACACTGCACAGTTTCCAAGCTTAATTGACTCTCTTCGCGCCGGTACC
+AGGTAATCCTCAATTCCATGAGCTAAGACCGCCTCTTTCATCTCATAGACCTCCTTTTTA
+ATAACATTCGCGCTGACACTTACGCCAAAATGATCACCAATCCCCTGAGCGATGGCCAGA
+GCAGCCTGATCTATTTTGGCTAAGATCACGCTTTCCTCAGAATTAATAAAACCGTACTCA
+ATGAGCACGGCCGGCATATCTGTCCACTTTAATACATACCAATTTGCATATTTAACTCCG
+CGGTCAACCATTCCCAGTAAAGCCATTCTCGCCCGGATAGCCTTGGCCATCTTCTCTCCT
+TCACCACCGGCTGCTAAAGCATAGACTTCGTTCCCGTAAGCTTTCACAGCTGCCGAGTTA
+TTATGGAAGGAATAGAATGCATCGCCGCCCAAGGCATTTGCCACTTTTACCCGATTCTTT
+AAGTCGAGATCATCATTGTATGGTGCTGGCTCACAGAAGTCTTTATCTGTAGCCCTAGTG
+AACTTTACTTGGAAGCGGCCGGTTGCTTCGAGGATCGCCGCCGTTTTCTTGGCCAGCATT
+AAGACGTTATCCTTTTCCTTGGTCGTTGGGCCTACTGCTCCCGGATCCGGGCCGCCGTGG
+CCCGGGTCGAAGACCAGGTCATATATTTTCAATTCAGCCAAATTACTCACCTCACTTTCC
+AAATATGCTAGCTAAAAACTCAGGGTTGACGTTCTGTCCAATGGCTGCAAGCGTGATAAT
+AATGGCTATAATTACAAAACCCTTGATGATCCATTGTCCCCCTGGGGTTTGCCAAAAACC
+TGCTTCTTTTGATGACTCTTCGTGTAATGTTTCTAAGGTTGAAATCCGCTTTTCCATCGT
+TTCTAATGTCTTAGAGGTTGTCTCTAACAGCTGAGTAAGCTGAGTGATAATGATCTTTAA
+ATCTGTTATTGTCTCACTGTGCGCGTTTAATCTGCGTTCAGCTACCTCAAGTTGCTTATC
+TAAGCCTTTATGAGTTCGTTCACAGGATTGCTCGGTGACTAAGTTTTCCCCCACCATAGC
+CCCACCCCTTCTTTGATTATTGCTACCAACAACAAGCTCCCAATACCGTTAACTTGGCCT
+TGGGAACTTATTGTGCGCTTTATGATTTATTGGTGTCCTTAAACTTAGCCAAAATGTTGC
+ATGCAGTATCACAAGTTCCAACTGCACAGATTCCAATTAGTAACCCTTTCGCAAAACACT
+CTAATATTGAGGCACACTGCAGCAGGCCAAAGCTGCTGAGGATACCTAAAGGAATTGCGA
+GCAAGTGTGCGATTCTTCTACTTAAGCCTAACTTCTCGAGAGACTCTACAATTGCGTAGA
+CAAATCCGATCAATATTATCAGTTCAGCTGCCATAGATTACCACTCCTTCACAAACCAAT
+AAGGCTTGTTCTCCTTCTATGGCATAGTATGTTGATGATTCGGAATCCGTGAAAACACTC
+TAATTAAGCCCTTCTTCGAGATATAAAGCAGCATTAGTATCTTCTAGGCAATAAAAATAA
+CGCCCCAAGGCATTTAACTTCTCTGGAATCTTCACTATGCATTAGCCCAGTATGGCTATC
+TCCCTCGTAGCTACTTCCATCTCTACCTCGGTTCTCAATGTTGTGTTTGTTCCGTTTAAA
+AGTTCCCATTCGGTATTGGGTACGTCTTCGATGGTCATTCTCTTACCCATTACTAACGTC
+GCATAGGCGTTTACGAGTCTTTTTTGAACTGCTGTCATATTAATCCTACCTCCATCAAAA
+TATTTATAATCAATATCTCTGTCTCAGCTTTTGCAATTTCATCTCTGGACGGGATAAGGC
+TATCCAGTAATTCTTGCTCCTCATGTATTGCCTCCACCTGTGCCGAAGCCTCCTTCATTT
+CAGCCTGTGAAGGCAATTGGAGGTCATGGTTAAGCATAGTCACAGTTGTGATGTCGTTGG
+TGGTAATTACGATGAAGTCAACATTATGCTTAGCCTGGGGGTAAATATGGGATACAGCCT
+CTACGTAGTTCATAGCATCGCCTCCAAAGAGCTTAGCTGGTATTCAATGAGGATTCCCAT
+TCCCCCATTAGTTGCTGACACAGCCGGAACGGTGCTAACGTTGCAGGTACCATTTACGCC
+CTTAACCCCACCATCTAGGACAATCTGTGACGGTAGGATATCGGAGTCGGTAATGGTTAT
+TAGGAGTCCTCCCCCACCGCCTCCACCGCCTCCACCCGAAGCACCCCAGGTATTCTGGTT
+CAAATTAGCCCCATTGGAACCAGCTGTCCCGTTGCCTCCGCTAACATCAAGGGTGATGGT
+ATTGACGATGGAGGGGGATATGACAGTCAGGAATCCTCCCGCTCCACCTCCGCCACTTCC
+CCCAGCGCCCTCGTAAGTGAGGGATCCATTTCCACTACTATTATATCCCCATCCACCTTT
+ACCGCCTGCACCTCCGAAGGATCCTCCTGCCCCCCCGGGTCCACCCTGACCCCCAGAGTT
+ACTAGAGCTGGTAGTCCCCCCGGCGGATCCACCCCCACCGCCATCCGAGATGGGTACCTC
+GGGAAACTGAGTGGTTATTAGGGCTGGAATGAACAGGTAGTTTAAATATTGCCATAGCCA
+CCCCTCGGGAGCTATACCGAGAAAAGAATTACTGCCTATGCTACTATATGAGGCTCCTCC
+GGCATTATTGGGGGCTGATTTCAGCCCCAGGGCTGATATCGAGCACCCGGAACTGGGATT
+GCCCGCCTGGGGATTAGAGTTGTCATTGGTGTTAGAATAGGATCCAGGACTACCATTACC
+TCCAACTGATCCTTTGGCGGTTATAATACCAGTACCAACTATGCTATTGGCAATAATTAT
+TAATGATCCTCCAGCAGCACCACCAGCTCCCCCCTGTCCAGCGTATGAGAAGCCGTTTTT
+TGCTAAACCTCCGAGGGGTCCTGGGGCCACGGTGAGAGTTCCGTTTACGCTTAGGGTCCC
+CTTCACAAAAACCACAGACCTGTGGGGAAAGGTTAGAGTAACTCCAGCGTTGATGGTTAA
+ATTATCGTAATGATAGACTGAGTCCGTTAGGGTCTTATGCGTTGAGATCGTTACATCCCC
+GAGTATTCCACTTCCGTAATACAATTTTATTCACTCCCCTATAATTTAATAATCTCAAGG
+GTACTATTGGCTCCCCCATGTTTGTAGCCTGCGTTGGTGGCCGGAGAATTGACAGCGGTA
+TTTACCTTATCTTCGCTTTTCAAATAGACTACCCGGTGCATTTTAAACATAAATTTATTG
+CCACTAGCTGTTGGGGGGTCAGAGATCCAGATGGTATCCACAATGCTTTCCATGAGTCCA
+TTAATAAATAACCCGTAATTAAACTCATACCTATCGGTAGTGGTATCGAATATAAAATCA
+AGGTTGGATAATATCAAGTAATATCCATTCTCGGGGGCAGTATAAAATTGCCCGTTTGTT
+AAAAGTGACTCCTCGTCGCTAATGGTGTTGCCGAAGGTTACGGTATTCCATCCAACATAC
+GATGTAAAGGTAGTAGTACCTTTGGCCTTTAAATAGTGTCTTGGGGCTAGCTCTAATTTT
+AATATTCTCCGAAGTAATCCCATCTGATTAGCAAAAAACATCTTCATCGAGGGGGCTTTT
+CTTAGGAACTCCCGAGGAACTTGTACATCAGCTCCGAGAGGAGTAATGCCACCTGCTAGT
+CCCTTTCTGTGGGGAGTTGAAGTCACCATGTGAGCGTTGATGACATCCGAAGTATCATCG
+AGGTCTTCGGTAAGTGAGTCAATTTGGAGCTGGAGGTTTCCAGCGGCATCAACGCTTAAT
+TGATCCTTCATGCTGTTAAACCAAATGATAAAATCATCCTGAAACTGGGCTTCCACAGCA
+TCCTGATCAGCCTCGATGGCTAATACCCAGGCGTCATAAGCATCTTTTTTGTCGGTAGTC
+CACGTGCTAAAATCCCCATCGTATTCTGTTTGCTTAGCTGCGTACCAATCCATGTACTGG
+TTAAAGATTGCCGTGGTATCTACTTGAATTAGGCTGTTGACCCATCCGCATTTGGTGGTA
+TCCATTCGCAGATCAGTAATATTAGCTTGTGTAACTTCTATTGCACCGGCACCGATATAA
+ATCTCAGCCAGGGCCAATTCATAGATATCAGCATCCCTTTGAATCGCCGGGGCCACCGGC
+AAGCTGGCAAACACGCCTTTTTTTATAACCGATGTGATCTTTCGTAGAACGGTATCCAGC
+CTGACCACTAATAAATCTTTCCGCTTTAAAGCACCGTCAGCGACATCTATTGGGATTACT
+AGATCGGAATCGTTAAGGTAATAATACCCGTTTATCCATGCCTTGCCCGCTTTTAAGAGA
+ACAGACATCCCCCCGTTGGCCATAGCTTGAAGGCTTGTCGTTGGGTTGGGGAATACGCCG
+GTCGTAATAAAGCTGTTAAAATACGCCGCGTAGTCAGATGCTTGGTATTTTCGATCGCCA
+CTGACTGAATTAAAAAAACTTGATTTCTCCGCCAATTCTTATCACCTCATTTTCTGTTTG
+ATTTTATCGAGTAATGTTGGGATGCTGTTTCCAAAGGTGACATTAATCCTTACTCCAGCT
+TCCTCGTAGACCTCTTGAATTTCAGTGATTCGTGCATTTATAGTAACGCCCCATTTTTTA
+CGAACACAAGTCACTATATCCCCAAGATCAAAGTCAGTTTTGTAAACCAGGTTAGCATTT
+AGATTTATGACACTGTCAAAGGTTCGGTTCTCTACTCCTTCAGAGAGCTTAGAATTACCT
+CGCTCCGTTAAAGTTTTCAAATAATCTGCATCCGACAAAGTTACGCCATTAACAACGTTC
+GTAAGATCCTTGGCGTCCACAAAGTCCTCGAATCGGTTTAACCCTGTGGAGGATCCAACG
+GTTACGAGCTTTCTAGCTGTACCTTCACCCATACCCCCTACAAGGGCTGTATCCCGATAG
+TTATTGATGCTCTCGGTATACTGTTGCGTGAGAATGTTCTCAAACTCTTTACTGAAGACC
+GCCCGCGGATTAACGCTTTGATTTATGGAACGATCTAATCCCGCGTACACATCGAACACT
+AACTTTTTATTGGATGTATCAAAGCTAACCCTATATCCCAAATCAGAGAGTGAGCATAGG
+TTCTCAATTTCATCCAAGAGGTTTTTATAACTCACTTGATAGTTAACTGTTTGAGAATAG
+CCTTTTAAGGTGCCTAAACTAAGGTTTGGTATGATTCTTTTATTATCCGTTGGAGTAATG
+CTGTGCTTGTTTACAAGGGTTCTCATGGCATTTTCTGCTGTGCTCTGAAGTATCTCCTGG
+CCCCATACAATGCGTCTGTTCAGATAGGCCGAGAGAAATTTTCCCTTAACGACGAGAATT
+TCTTTACCTTCCACGTCTTGATCCATTTGCCTGAATTCAATGTACCCTGCTTCATCATCG
+TTATTCTTCCAAACGACATTCCCCCTTTGGAGCATATCAAGTGTGTAAGCATCTAAAGAA
+CAATGCAGCTCGAAATCGCCGCATTTAGAATAACGGCGATTCCACTGCAAGGACGTGAAA
+TTATCCATAACCCCCAAAAGGTTAAGGTCTGAATTGTAGATATACAAATCCATCATTACA
+CCCCCAGATACTGAGGCATGTAGTAAATGGTTACCTCAAGGTTGTCTAGATTTGTGTCTG
+AGTTATACCTAAAAAGATTATCCCCTACATCCAACTGTAAAAAGGTACTGCCAACGTCGA
+TGTAGTTAAAAGCGTTCGTTGTGACACCATTCAAATCACTCCTAACCTTTTTGTTGCCAA
+AGTATGTGGAGACCGTAATTGTTTCGCCAGCAATCATTTCTTTATTAATTTTGATGAATT
+CCTGAGTGTTCACATTGAGGATAGATGGATTCGTAAGGGTTGCAAGCGCCTTAAACTCTA
+CTCGCATTCCACACTCAACATCGCCGCCATTAAATACATTCACGATCAAAGACGGTTCTC
+TATGTCCCATCTCAATGCCGTCTTCAGTTAACTCTAGCTCAAAGCTAAAATCACCCACCC
+AAAGAGCGATCTCTTCCTTTGATTCATCGATATCAGTCCAGAAAGGATTACTGGCAGTCA
+TGGAGATTAAGCAGTCATCGTATGAAGTGTCCGTTATCTTGAAAAATGGCATCTTGTTAA
+TGAGGCATTTTACTTTTCTCTCCTTAACATTATCCTTGTAAATTAGATACCCCTCTCCGT
+ATTTCGGGTTAAATATGGCGTTGATTTCGTCTCTATAGGCCGTCAGTTCGTCCTTAGATT
+TAGCCAATAACATAACAGTAAGGGTTATGTCCCTCTCGTTTAAGGTATTGCCTAGGTATG
+TCCTCCCATCCTGGTTAACCCCTTTAGAGTTATAAATGGTTACATTGTTAGTCGTCTCAA
+TTTTCTGCAGCAAAAAAGGAGCAGTATTTGATAGTTCAATACTTACCCCTTTTGCATTGA
+CATAGGTCACCTTCCGCACAATACCCCCCCTAGAATGCTAACGCTAACTCTTGCAGGGCT
+CTTTTGTTTTGCCTTGCTGTCTCGGCAGGGCTTACAGCTGCAGGGCTGTAGATGTTCACC
+GTTTGATTGATAGCCTTCGAATTATCGGCATTTCCTGCAGAGGCTGAACTTTTAACGCGA
+CCTTCAATCATTTTTTTACTAAGAACAAATTCACCCCTTTGGGCGATAATCGGAACCTCA
+TCGGGTCGAAGGTCTAGTCCAACCCACCCACCCTCGTGGAACTTCGCATAGTTTTCTTCA
+TACTCTTCTTTTGAACCGTTTCGGTATAAAGTTTGACCAGTTTTATAATTAGTAATCGAA
+TATTGACCCGTCTTTTCATTATACGAACCAGATTTAGTGTTAATGGTTACTTGACCATTC
+GTTTCAACAACATTACCTACACCTTTGACATTAGTAATACTAGTACCACTTGAGCCTCCA
+CTGCTTCCTCCTCCTGATCCAGAAGAATAAGTTGGTTCTTTGATACTAGATTGCAATGCC
+TCGGAAAACTGTTGGCCAATGGTTGTTCCGGCAGTAACAAAGGCCGACGCTTTACTTGTG
+ACCGTGCCCACTATGTTATCCATAGCGGCACCCACGGCAGAGGCTTTATTTCCAATGCCC
+AGAATTAAGCCATCAATGGTGTACTGACCAACTTCTTGAAGTACCGTTGAAGGCGAGTGG
+ATACCCAGTATTTTCTTAATCCAGTTAGGCAGGGATGAAGCCATTTCCTCTACGGTGCCT
+TTTAGTGATGCAAGTTTATTGCTGATTCCATTAATTAAGCCCCGAATGATGTCTTGACCG
+ATCTGCATTAGGTCAATATCTTGAAGAAATTGTTGCGATTGATTCCATTTTTCAACGATG
+GTTGTTCTGACAGCTTCCATTTTGTTGTAGATAGCTGTTTTGATCGCTTCCCAGGCATTT
+GAAATATCTGTCTTTATTTCGAGCACCTTCGCCGAAATGTATGCCTTAATAGCCTCCCAA
+GTGGTACTGAGCCAAGTCGATATACCCCCGAAGATCTCAATAGTTTTGGTCTTGACCGTT
+TCCCAATTCGCAATAATCAGCACTGCAAGTGCCATTACTGCTGCCGTGACCCATGCCACT
+GGCCCCATAGCCATTACCCAAGCCGACGCCATCTTTGCGGCGTGTAATAAACTCTGTACG
+CCCATCCATGCCCATTTTGCCACCACGATGGCTGACTGCACTACTAATATAGTTACCGCT
+GCCACTGCTCCCACTCCTGTTGCAGCCCATGATGCTACAACCACTAAAGCGTGCGCAGTA
+CTCTTTAGGCCCATTAAAAGCCAATCTGCAACTACCTTGGCAGATGCTATTCCATTGACA
+ATTGCTGTTTTTGCTGCTTCAATCCCCATGACTATCCAGGCATTAATCACGACCGCAGCG
+ACCGCTCCAACAATAGGTACTATAATAGCCTGGTATTGGACAAACCAATCAATAATCCCA
+CTAATAGTTTTTGCTGCTTCGTCAATGGCTCTCCCTGCCACGGTAAACGCATATTCGATC
+TCATTTTTGATCAGCGGCATATTGGTAATAATCAAGTTCGTAAATTCATTAACTTTTGGC
+ATTACTTTTTCACCAAGGGGGATGAGGATAGACGTTTCCATGTTTCGTTTTATGCCTTGA
+ATTGCGAGACCAAAGGTATCATACTTGACTTCGTTGATTTTTCCGAGTGCATCCGTTGTC
+TTACTTATTCCCCCCTGAGTATTCGTTAGGGCCTCCATGCCTTTTGCTCCAATATCTTCC
+CACATGGTTCCAAAGAGAGCGACCCCTGCTGCTTCCTTTGCAAGTGGATCCTCAAGTGCA
+AATATTGCCTGAGCCGTCTTGTCAAATGCCTCTTTTGCACTATCTCCACCTTGAGCAAAG
+GCCAGTGACATTTTGCCAGCATCTAAACCTAACGCTTGAAACGCTTCGGTAGATGCTTTG
+CTTCCATCCTTGGAACGTATACCAAACTCTTTCATGGCATCGCCTAGTTTGTCGATATCA
+AAAACACCGGTAGCTGCCCCGTTCGCCATCATGTTGAACATTTCTTCGCTATTAAATCCA
+AGCTGTTCGAAATGAACACTGTACTCATTAATAGAGTCCAAGAGGTTCCCGTTTTTGTCG
+AGACCCTGTTGTGCACCTTGGGCTATAAGGTTAAATGCTTCATCGCTAGTAATCCCAAAT
+CGCTTCATCATCATGTCTGCAGTTCTTGTGCTTTCCGCGACCTCAAATTCAAAGGTATCT
+CGCAGCATTAAAGCATCTTTGGTCATGTCTTCAAGCTCTTCGCCTGTTGCACCAGTTTGC
+TTTCCGACTTCTGCCATTGCCTTAGCGATGTCCTCAAAGTTCTCGCCAAGATTAGCATTG
+TAAATTTCAAGCAACGTATCTTTCATGCCGATCATGGCTTCATCGGTTACCCCGGTTTCG
+GCTTGAATTCCATTAAGTGCCTTTTTTAAATCATCACTAAAGCTAACTGCAAGTCCACCA
+ACCGCCAGAGCCGCCGTACCCATGGCCAGGACTATTCCGGCGCCCACCTTCGCAGCGCTG
+GACACCATTTCGCCGAATGTTTTTGCTGTGCCCTGAGCGCGTCTGTCGGTGTCGTCTATA
+CGAGCATTCGCGGCATCATTGTCGATTAAGATTGATCCAAACAGTCTAAATATCTCTATT
+TTTACCACCTCCCATTCAATGGCATAAGAAAAACAACCCTTGTTAAAAGGTTGTTTGTTT
+TGTGTCATTGCTTTTTGGCTTCATGCGCTACAATAATCGGTAGCAGCTCATCAATAATCT
+CCTCGGCCGTTATTTCTGTGTGCTTCAGTTGTGGTTTGAATAATTCGTTCTTATAATCCT
+CAAAGCTTTGAGGGTGGATATACCCCAGTACCATATAAGGATAGAGACTGTTCCACATAT
+CCCAAGCCCATTCCTCTTGCTCTTTGGTAACAGCTTTTGCAAGTAAGCGCACCAGGTGTT
+TGAGCTGTATTTTGCTGGCTGAATTAACACCATAATGGCTATACAGTAGGTTGATTGTTT
+TTGGATAACCTACCGTATAGCATCCTTGAAAAAACCAACGGCTTCTTTATCTGAGAAGAT
+TTCTTTGAAAGAATTCATGGTCGTAATAAAGTTCTGTGCCTTAATTTCCTCGACTGCCTT
+GTCCTCGAAAACAGCGACAATCTCAAAGACTTCGTTTTTAACTTTGCCTGAGTTCTTAAG
+GACAAACTTAAACAGGTTAATCCCTGCACTCATTTGGTCAAGGCTCTTGCCTTTGTTTTC
+TTCCGCAACCTTTTTGCGGTATCCGTCGAGGTCTAGTTTATCGTATAGATCCACCACATT
+GGGGAGCATGTCAAAGGCTTTTTCCGTTGTTAACATATTTAATTCCTCCAAAATTAGGCG
+GGGGGTCCCCGCCTTTTGTTATCCTGCTACAAAAGGATCTACAATCGCTGCAACATCTTC
+GATTTTGTACAGGTCTGCGGCATCATCAAACGCATCCCAATGCGCCATGATCTCAAGCCC
+AATCTCAGCTTCGCCCTTTGGCTTTGCAGCCAACTCGAAGGAGGATTCGCTCATCGCGTT
+ATACAGAGTGATTTTTTTGTACTCGTTATTCATGAGCTTCGCGAACATAGTCACATTGTC
+CAAGTATGCGGTGTCTTGTATCCCGCCAATATTTGCGCTCTTGGCTGTGATTGTTTTCGC
+CGTGCCGTCGTAGGTCGCCCAGGGCATTGCGATAGCTAGGGTTTCCATGCTTGTGTCTAG
+GACCGTAACGCTCAGGCTTGCCGTTACACTCTCTAGGACTTGCATGCCCTTGCTTTTGCC
+ATTGCCTCCGTCATATTCGATGTCCCTGATTGTTGCATCGACCTTAAAGCCCCCGCCCCC
+TCTAGTGGGTCCTAATCTGCGCTGTGTCGCTAGGCCGTAGTCCGCAAAGACGATTCCGTA
+GTCGACTTGGACGTTTTCGAGTTGAGTTTGTGTAAGTGCCATATTTATCACCCTTTCCTA
+AATAGTTTTCCTGAGAAGTTGTACTGGCGACGCTTGATAGTTTTGTCATCATCGATCAGC
+GGGAGCATATTTTCGAGGTAAAAAATTATTGCCATTTCAGGGTTTGTGACCGTTGTTTTG
+TCCAGGGTTTTAACGCTGGTCATAAGATTCTCTAGTTCGGTAGTGTCAGGGTTTTTGCTC
+CATCCATCCACACTTAGAGTACATAACTCGAACCCTTCGCCATCAGGATAGAGCTGGAAG
+TCGAACACTAGGTAAGGAAAAACCGCTGTCGATGGTGCCTCTTGGAAGTAGGCACGAGGG
+TGGATTGTTTTGAGGAAAGCCGTTAAGGATTTCCTTAGTGCGATCATGAATCCGCCTCCT
+CATCCGCTACCTCTGGTAAGCCGTTTTCTCTTAGGCTCTCGATTTGCCTGATAGAGTCAG
+CTTGCAGTTCGCGAATTTTGGCAAGGTTACTGAGAACAGGAGCACGAAGGTAATCGGTTC
+CCTTCATCCTTACCGTACCGAATTGCACTAGGTGGGCATGGAAAGCATATTTATAACCCT
+TTTTCTTAGCTCTCGCCCTGCTGTAGACTCCGATTTGAAGAACGGGGGTTTCATTCGCCC
+TTCCTTTTACCCATGAGCCAACATTCTTTTTAAGCACACCTTCATGAATAGGAACTGTCC
+TCTTGATTTCCTTTCTCAAAAACTTTGCGGTTTCCCTAAGTGCTTGTTTTTCCAACTTCG
+CTATGGCCCCTTTTACGGCTCGGGCATTTGACTCAAACTGCACACCCATTTACACCACCC
+CATTCACAAGACCCTGACAGGTAAGCTCTGTGTCCTCGCTGTTAGGCTCAAACGTGCGAA
+TAATGTTGTACTCCTTGCCGTCGAATTCGAGCTTTCCTTCTCCTGCATATTCACGAGTCC
+ACACAACAAAGCTTAGTTCTGGTCGAAGGCCGGTTGCTTTCGCCTGGTAAAATTCAGACT
+GGCGTATTGACTTTTTTTCGGCAAACACTAGGCGCTTTGTTTTGGCTTCGATAAAATCGC
+CCATATCATTTTCGCTGATAGTAGTACTAATCAGGTAGATTGCTTGATCCGGTCTATTCA
+TGGCATACTCACCGCTTTAAGTTGAGTCATAAGAATATCAAATGCTAAGCTGAATTTTAC
+TTCTCCGCTTTTTAGATACCAAATATCATTTACGCCAACGGTAAGCGTTGCAATCCCTAA
+CTCGTTCTCGACGTTCTCAATCGTTACTCCAGCATTCATCATGTACTGTTTTACTGCGAT
+TGCTTTGATTGAGAGAGTCGAATCTGTATACTCGCCAGTAATCCCTAAACCGGTTTTTAC
+TTTCTCCAGTAATTCTTCGTTCGTCATTTACTCACCCTCTGCGGGATCTAAGGAAAACGG
+GACTAAGACAATAGTTAGCCCCGTTTTTTCCATCTCATATCGAAGCTTTTGAGATAGTTC
+CTCATGCTCCCGGACCGTGAGTGGCCTTGTTGCTTTCAAATAAAGAACGCCCTCAGTCTG
+CTTTACTTCAACAGCTTCAGGCGTCTTGCTTTTAGTTCTAGCCATTTATGCCACCGTCCT
+TAAACAAATTAGGTTCCGGAGTAGCTGTAATAGGCAAAGGTGTTCTTAGCAAACAATGGT
+TTACCTCCGGAGTACAGCTTGCCTCGCCACACGGTTTTATCCTCGGAGAACTTCTCAGAA
+GCATTGGCTTCGATGACAAAAGCCTCTGATTCATTGACAATATAGGTTGAAAGATCACCG
+TACAGCACAGAGTCCGTATCCGGCATTTGGGAAGTAAACACCACCGGCTGCCCGGCAATT
+AAGTAATTGGATTGACCAGGACCGCCTTGCACTGGAAGGACGGATACTAAAGGCTTCCCG
+GCGGCATCGGTGATTGCGAAAAACCGCTTAAAGAAGGTACTGCGCTTCATGACCCAGGTA
+GCATTATCTCCATAGGGACTCTCCACCTCTGAACAGATCAAAGCAATCTGCTGCCAATCC
+ATCAAGGAATAGGTTTTGGCGGCTGAGGGTGCAACTTTAAGGGCTGCAATAATTCCTTGG
+AAGGTCGAGGTATCCACCGCGCCGTTTAACACGTAGTTTTCAAGTAAGATCCCAATGTAC
+TTACCAATTTCCATGGCAAGGAACTTTTCAAAGGCCGGAATGCTGTTTCTGAGCAGCAGA
+TTCTTAACAACAATCGTTGCCACAACGGCCTGCTGTGAAATTTTCACTTCGGTAAAGGTG
+AAGTTGAGGGTTACTGTGCCGTCGGGATTCTCCGTCGGTGCCTCCGTGGTACCAATTGGC
+AGGGACACGTCCCCTGTAAAGCCAAACTTTGTGATAGCCGTGTACAGTCGACCGTATTGT
+TTGATGACGGAATAGACATTATCGAGAGTGGTTTGGGGAACCAGGTATTCAGCACCGCTG
+GCCACACTTTCGCCGTTCATATCCGTTACAGAGCGCTTACCAAAGGCCATAATGTCGGCG
+TCTGCTTCACTGATTTTCCCATTGAGATAACTTCGATAGAAAGCATCCCTGTACTTTGCG
+CTTGAGCGATAGTTCTCTTCCGTTAGATCGCTATGGTTTTGCTTACCGAACATAAATCCT
+CCTCGTTTCTCGGTCTCCGGTGCTTCCTGGAGCCTTTCATTGATCTCGTCCAAGCGTTCA
+GACATACTTCTAAGGTTGTCGGCGACTTCGTTCATGTCTTCGGTGGACATATCCCGATGA
+TTTTTAACCTTGCTCTTCAGCTCCAACCGCTTTTGTTCCAACTCTGACTTTTCTCTGCGG
+AGTTCCGCCGCCTCTTTTTGGGTTAGTTTCATGGATTCGTTCCTCCTCTTTCTTCGTTAT
+CTTGTAGGGTTTATAACTGACTGATCAGATTCATTAAGGCCAATTTAAGAGCAGTATCGT
+CAGCCGGTGCAGGTGTCTCAGGCGTCTGCTCTTCGGTAATAATGACCGTTTCTTCATACG
+CCGGGAAAACGACGATACTTACCTCATAGACATCATTAATCTTGAGGATGACGTCAATTT
+TGTTTTCCCAGTCCGTGGCGATCATGGCATTGTTATCGAACCAAAAGGACATACCATCCA
+CAATTTCATTTTGAACTCGGTCAAAGACGTAATCGTCCAACCAGGTATTTCCTAAGGTTA
+CCTCAATGAACAGGCCGACTTCGTCTACAACCGTCCTCATATTCTTCCCTGCTCTACCGA
+GCACCCAGGACGTGGCATGATCCCACAATAAAACAAGCTTTGAAAGATCAACCCCTTCCA
+AAGCTTTCTTATCAACCTTCTCGATCCACTTACTCCCGCGATAGGGGCGTCCCGGTGTGT
+CGAAGAGAATTGGGTACCCCCGCAATCTCCTGACGTTTTGGCCATCTACCTCTTCGCTGA
+TCGCTCGAAATTTTGACCGATCATCATCAAAGAGCATGCGCTTTTTAGACTGCTGACTCA
+GGGGTGACTTTTTCTCCGCTTCCTTGCTCATCGCTCTCTCCTCCTTTCTGCTCTACCACA
+TAGCTCCCGGGACTTAGGACTTGAAAGTTTTTGTTTTCCAAGAACTTGTCTAATTCCGGC
+GGCCCTTTGGTGATGCCGAGCCGTTTTCTGATCTCATTGCGGTTCATGATGGTTCCATAG
+ACCATTTCTTTGTAAAAGGCGGTCTTAGCCGCCAGGGTACTGATTTCCAAGTCCACCAAT
+TCTGCCTGAACGCAATTTCCGTGAAAGATTTCTGTTTCACTGAATAAGGCATAGGTGGAG
+GTTTCTTCGATTTGCCACACCCAGGGTTTGATGGTGTTGTCCACAAACTGTTCAAACTGA
+AGTTCTGAGGCGGTTCCGTTAATGATTTCGTAACTGACTCCAAAGTAGTTATAGAGTTTT
+CGGGTGATGTCATCCAGCAGCTTGGTATCCAAAGGGTTGAGCTTCATGTCAAGATTGTGG
+ACTTCATACTCAGCGCCGATCATTCCGAAACCGGTTGTGTTTTCAGCCGTGAGAAACAGC
+TCTTTAAACTCATCCAGCTTTTTCTTCATGTCTGAGCTCTTCAGTTGAGATTTAACTTGC
+AGCAGAGCAGCAATTCTCTGGCTGTTTTCGCTGTCCTTGACTGCTTGATTTTGCATGGTG
+TTGACAATTTGAACATAGTTTCCGGAGGCCTGTTTACTAGATCCTTGTTTACCGTCCGGG
+AAGCGCTGCAGGTGAATTAAGTCGTCATAATAAAAGGGATAGCTTCCGCCTAACGTGACG
+ATAATTCTCCCCTGGGCATCTTGGTTGAACTCACCAAGCGTAAAGGGTAGTGGCCAAAGC
+CAGCGCAATTTGCCGCTATGTTCATCCCATTCAGGCATAATAAAACAGTTATTAGTCAAC
+AGCACTTTCGTCATGCAATGAGTCCAGAAAACCTGGGGACACTGATAAGGATTGGTTCTT
+ACCTTCAGGACAAACCCCAGGCGGTCATTGACTTGATTCATGTTACCTTCCGTGTCTGCC
+CGGATATGGTAGAAGGGAATGCTGGCCACTTTTTCGGCGATAAAGTTAATGGCTGTCCGG
+ATTTCCGGGATGTTGTAAATATTCCCCCCGAAGAGCTGCGTCAGAGAATATCCCCGGTTC
+AGCAAATCAATGACCTTGGCAGCGGTTACTTTTTCTTTCTGAAAGTAACCGGCCACATAT
+CTTAAAAAACCCAAATGATCACCTCTTTTCTACGGCTGAACTCTAACTTATCCCTTGCTA
+ATCGTTGGCCAACCATGAGCCGTTATGCATAGGCGCTCTATGGTGTTTGCGACAGAGCAG
+GCTGCTTCTGCATTCAGGGGTTACTTTGCTTTCAAGATACTATCTTGTACTTTCTCCAAG
+GCTTCAATCTGCTTTTCGATGATGGCTTTATATTCCATAAACCTTCCTCTCTTTCTACGA
+CTGATATTCTTCGAATAAATCCTGTACTTTTTTATAAGCAATATAGGCCATTAAATAGCT
+CATATACCCGTCAATTCTCGCCTTACTCTTTGCCTTATCCGGCTGAATGTTTGCGTTGGT
+GTCGATCTTAGCTGCCGTATTCGTGGTACACCACCGGAAAAGGCCATTGTGTCTGCTGAA
+CTGTACCACTTTGTCCTCAAAGAGCGATCTCGTTTCCTTCATGGGTTGGGAAAGACTTTT
+TGCTCCCATGGCCACGGAAAAAACCACACCGCGACCTTCCTTGTTCTCTCGCGGAAAGCC
+TGCTATCTCCATGTCGCTGGCGAAGTCCTCATAGTGCCAGCGGTCTGCACCGATCTTCCA
+GAAGGTTACCCCATAGGTTTCGGCCAGATCAACGTACCATTGGACAACATCCTTCCTGCT
+TACCATGCTTCCCTCGCAGATATGCAAGAGCTCATGGTTAAGTCCATCGCTTGCCCCAGT
+GCTGGTAAAGCTTTCGTAGGCCATTTTATCGGCCTTGCTGTTTTGCTCAATCCTTGACCG
+GGCAATGAAATATTTTTGAAAGAGATACAGCTTACCTTGGATCGGTACCAGGGCCGAGGA
+TGCACAAAGGTCTGTGGTCTCGGAAATATCGCTGGCACCAACAGCATAGCGATCCTGTAT
+CATATCCTCGATCATATCGATGGCGCATTGATCAACAATGGGGAGATCAAAATAGATCAT
+GCTTAAGGAGCTGGCCCGGTTAAGATGCTTAGCCAAGAACGATGGCATTTGCGCTGGATC
+TTCCAGGGCTTTTAGATATTCCCCTTCGAGGTAGCTCATAGTGGGTCTGGCTTCCCCTAA
+TCCTGGGTTAGCCTTGATCCAGCACTTACGATCCTCCGGCTTGTCGTCATCGTCGATCCG
+GAAGATCATCGGGAAGACACGTTCTTTACTTTTTCCGTTTAAGACCTTTTTGCAGCGCTC
+GAAGATGCTGTCAAAGATTCCTTCGCGGACAAAGCCAAAGGTTGAGATGATAACATTTAG
+TGGTTGAGCTCGAGCTCCTTGGGCCGATGAGAAGACATCGTAAGTGTTACGGTTTTTGAT
+GGCATGAAGCTCATCGATGACAACTCCATGAGGATTTAAACCGTCCTGTCCTTCGCTATT
+TTTACTGCCGGCTTTCATGTATGAGTTGGTGGCAGGAAACAGGATCATCTCAGTGTTGTC
+TTTATCCCTCTTAGTCCGCCAATGTTTTTTGGGATTATCCTTGGGGGTCAGAACATCGCT
+AGTCTGCAAAAACGATTTCGCCGCTTCATAGACGATGGCTGCTTGAGTCTTCATGGTGGC
+CAGACACCAGACCTGAGCAGCCGGTTCTCCATCGGCCATTAAGAGAAAGTCTGCAATGGC
+TGAAATGAAGGTGGACTTGCCCCATTTTCTGGCCACGAATAGGATCATTTCCTTGAAGTA
+TCGAACCGTCATCTGCAGTTCGGTGTCGTAGATCTTAAAACCAAAGATGCAGGCGGAGAT
+ATACTTTTGCTCAATGGACAATTCAAAGGGCTGCCCGGCCCACCGGCCTTCCTTGTGCTT
+AACCAGCTTGCAGAAATCAATAAAGGCCTCTACGTCGGTATCGTCGTAGAAGACCTTTGG
+GTTTTTAAGTAAGGATTCAATGAGTTTCTTTAACTTTTTGATGTCTTTACAATGCTTTTT
+GGGCTCTCGATCAACATAATCATGCCAGCTTTTTATATATTCCGGAGCAATAACCTTAGG
+CTTAGCCACCTTTCCCCCGCCTTAGGATAATCTTTTCGAAGGCATCCGGCTCCGAGGCTT
+TGGGTGGAGGACCCTGCGGCGTTAAGTCTGTCAGCTGCTTGATTATGCTCATGTGGTTCT
+TCACCATCGTGTTGTAGATCTCAACCTCAGGCGATTTCTTTGTTCCGTGTTGGTTTTCTC
+CGTTCTGATATTCAGAGACTGTGCCTTCTCGGTTGATGGTTTCCTGCAGATCCTCAAGGG
+TTATCGTCATGAAGGCGGCGTTGGTGATCAGCGATAAAACTCGGTTCATGGTATCTTTGG
+GCATATTCTTGAAAAGACGCTTAAGTCTTTGGATCTCTTTCTTAATTCGCTCTTCTTTCG
+ATAAGTCTTGAAGTTCCTTTTTCATGGTTTTATCACCTCCCCACCACACCCCCCTATACA
+GATCTGACTCGCGTAATAAATAACCTTCCCTCCCCGGTCCCTGGAATTTATTATTTGTTT
+TCAGAACCCGGGGGGGATGATTTCTTAGGCAACATACTTAAAGGAACTACTGTTCCCGAA
+CATTTATTACATCTTAATCCATCTATTATCCATGGCTTATTATGGCTGATTGTATATCCG
+CAATCAATGCATTTATGCGTGGGCTTTAGCTTCTTGACCTTGATTGGATATCCTTCTGGA
+TAGTCCCTTTGTAATACACGCATACCTAGTATCTGTTGGCATTGATGTATCCCATTTGTA
+AAATCAGTCATATCTGAAGTGTGAGTTATCTCTAGTTTTGCAAACTCATTCCATGCTGCT
+TGAAGCGCATCCATAACTCTGCCCTCATGCTCCGTTAATCCGTCTTTTCTCATTAATATA
+TCAACTCCCTTCTTGGCTAATTGGCGGTATTAAAAAGTCTTGCAATCCTGTACTTCTTCC
+GCTTTTATGGTTATGACAATCAGTGCAAAGGTATTGCAAGTTTTCCGGATTATATGCTAT
+GTTCCAGTCATGCTTGTTTGCATCGGTTAACTCAATAATGTGATCTACTTCCTTGCCTGG
+CTTAATGATGCCTTTGGCATGGCATTCTTCGCAAAGACCGTTAGCTCGGATTATGACAAA
+CTGCCTCGCTGGTTCCCATTGTTTATTCTTGTAGACTTCTGGATGCCTTGCCATTTACAT
+TGGCCCAGATATACCTTTGTTCGACCTCATCAACCGATCAAGCGCTTTAAATCCCTTTGT
+ATCCTCGAACTTAATCTTTGGATGAGGTTTAATTGGCTTTTTCTTTAGAGCCTCATTAGC
+CATGTTGCCCTCCTTTTAGGCATAAGAAAAAAAAGAGCCTCTCGGCTCTTGATCCCTTTG
+GTATTAGTGAACACATCAAAGACATATTTCAAAAATCTTCACAGCTATACATTAACATAT
+AATCGAGGTCTTTTAGTGCCATGGCACTGCCACCTTTATGCCATCTTACTGCCAATCGAT
+GAACAATTAAAATTTAGCTAAAAGTATTGTCATTTATCAAAGGAATTGGAAAGTTATTGT
+AGAAAATATTTTAGATGGTTATCTAGAAAAACTGAACTATTATGCTATTGGTATCTACTA
+TTTCATGTGCTGATAATGGGAGCATCCCGACACATGTCTTGTATTCATAGAGTGATCTTC
+CGACACCTGTGAGAGAAAAGCAGTTAACAAATTTTCGATATTCAATTCAGAGGAAGATGA
+GGATTTTCATGAGTATTAACAAATAACTATTTTTGTCAGTTCGTGGGACAGGGAACTTCA
+CATAAACAGTGAATTTGCAAAACTTGAGAGGATATGAATGTAATAGCCAAACTTCGCAAA
+TTCACAGAACGTCAGGCACCATTAATAAAACCTACTATAAGAAAGGAGACTTTATTTGTT
+TGGGACAATAATTCTAGATGCGTTTACTAAATCTGAAACTATGGAAATTATCGAGGCTTT
+GGATGAATTGGTCAATCCATTAGATAACTATGGTTGGGCTTCAGCAGGTATATATAGTTT
+TTGGAACTATTACACCAAAGAATTGCTTTACATTGGATTAGCTGTAGACCTAACGGAAAG
+ATTTAAGCAGCATAATGGTATAATCCCTATGGATCCAAACGGATGCAAAAAGGATAAGAT
+AGAGGAATATTTTGGGTCATGCGATAAACTTGGCTATACAATATTTGTACAATCCTCAAT
+GTCTCAACCTGCTACTCATAGAAATAAACAACTATGGAATGGACTTGATATTAAGATGTT
+TGATGTTCAAGATTACCGTGATGACCTGGTTAGGGATGACATTCGAAGAGTTGAAGGTAT
+ACTTATTGAATCATACCGAATAAAACATGGGGATTTGCCACCATGGAATAGAGTTGGGGG
+ATCAATACTCGGTCAGCAATCTGTTAATCCAGGGAACTATAATGAAATTGTTGCAAGTTT
+TAGTTCTATGGATCCTAATTTATTAACGGCTAGGTATTCTCTAAGGGAAATATCTAATAA
+CCCAACATTTGAGAGATACGAGAACACTATGCATGCAATTAGAATGCATATGTTATTATG
+GGGGATGTCTTTTGGTGAGGCACGAAACCTTATTAAGAGATCTGATAGTACTGGTTTTTT
+CGAAAAAACAATACAGGAAATGAACCGTGCAGGATATTTTAAGCGACTTCTAGCGATATA
+AGAGATTTATCTGAGCTCACATTAAATTATAGACAAATATTTTAGTAGGGACTATATAAA
+CGAAATAATCTATTACAAAGTTAAATGATGGAGACTAACACGGGATTCCCGACACTTAGA
+GGAAGATACATCCCGGTTGGGATGCGTTGGGAATCCTTGGACATTGCGCGTTAATGCTTT
+AGGGTTTTAGTTTAAATTGAAGGAGAACGATTATGGATTTTTTGGGAACATGGGAATCTG
+TGTTAAGCATTGGAGGAATTATTCTAGCTATATTTGGTATATTAGCAACTAAGTATTATT
+ATGATAAAAGTGAAAAAAAGTTCATTAAAGCATTAGAAACTGAAAGAGCTCGGATAAAAG
+AAGAGTACAGTAATTTTCTTGCGAAGAACTTAGTAAAAATGAAACTTGAAGAAGAAGAAA
+TCATTCTATCAAGAGAAACAGTAAAATTAAGTATTCTGGGTAAGTTTAATAGAACAAATA
+TACTATCAGAACCAAACGATAAAGAAATTGATGAAATAATTACAAGAACTTATTCCATCA
+TAGAAGAACAGGAATTTGTTAGTACCTCGGTTAAAAGATATATTCTAGAATCTCTTTCAA
+AGACTATACAACAACAACATACTTTAAAATCTGAAACTATCGAAAATAGGTCAGAAATAA
+GTAATTATCAACATCTAATAGATATTTCAAGCACGCAATTGTTATATATATTATCTGGTT
+TCAGTTGTCTCTTACTAATAATATATTATGGGATAAGTCATTATGGTATTAAATCCGAGT
+TTTTGATGAGTGTTTTAATAATGGTTTTTATCGCTATCCCTTTTATGTTTATGGCTAATA
+TGCCTTTTAATTTTTTTAATCCGAGTTTATCGTTTTACTTCAAGTTACATTCATATTTTA
+ATATTGGTTTAGTTACAGTTCTTATGTTAATAGGGAAAACATTAAATAAAAATGATCCTT
+TATACAATGTATTCAGTAATATTATAATGTGGAGTTTGGCTACTCTGCCAATAAGCTATT
+TCTTGTTTATTACCATTAAGAAATTTAAGAAAAAAGATTAGTTGTCTTGTAACATGACAA
+ACATTACCCCGTATAGTTGTTTTACTACATCCGAATTACATTTAGGGTAGTAAAATTATA
+ATAGCTGTTTTAACCAAATTTTTTACCATCTCTCATATCCAACAATATTAGGGCTAGTAA
+TTTTCCAGCCAACTTATAATTATTCAAATTTAGATGAAGAAAATTTCTTTAACTTAAGTG
+AATGCAATTTAAAGACTCGCACAAACAGGCGGAAAGGCGTCTATGAAAGAGTAAATTCAT
+TCCATCCCCACTCTTCGAAACTAATCTGCTCCCTACTAACATATCCAAACATCTGAGCAG
+CCATCACTATCAACTCCTCTTTCATCCTGTAATACGACCTTACAGCCATCCCAATTTCCC
+CGGCTATCCAGAAATCCTTATTAAACCGCTGCATATACTTAAGCTCTATCAGCTTTCTCT
+CCGTTTTCCCCAAGGAGCCAAGAATTATATCAACCTCATGGATCTTGTGCCTCAGCTCCC
+TAATCTCGGTTTCAAGCTCCACTCTCCTATCTACATAGCTGCCCGTCTGATCGCCTGTCT
+TTCCAACGGAACGTCCAGGGCTTAGGCTAATCTGAGCCGTATTACTAGGAAATTCGTTCT
+CAAGTTGTGCATTAAGTATCTGTAGACGAAGTTTGTCCTGCGTGTAGGTCGTAAACCGAC
+GGATTGTTTGTCGGTACCACAACGGCTTTACACGCTTTTTCTTTTCCTCAGTTGCGGCTT
+CAGTTGTCTCCAAGCCCCTTACCTCCTTATTCTCATTTAACTAACATCCTGTCCTTAGAG
+TTATTCACTTGACCCACAAGCAAAGCAATGCATACTAGCGCCAACCTTGACAGTCTTACC
+CCCACACTCTTTGCAGCCAGCACCTTCCCTGTGGTAATAACAATTTTTCATCTTCGGATT
+CTTAGCAAGGCTTTTTGCCCTGCACTCCTGGACATCATTTTCAGTCTTCCTATCCGGATT
+GCAGCAGAATTTATGTCCACACTTAAGCACCTTTCTTGCCTCCGATCCGCACCCACCGGC
+AATCGTCCGTATACACATATTTGCATTTATCCTTTTCCACACAATCTTTGCACTGACAAG
+CGCCAGCTTTACATTTGCGGCATTGACACATTCTTTTCCCTCCTTGCCAAATCCTGACCA
+GCTTCCCACTCTCGATAAATCGCGAACCAATCCTCAGCATCCATGCAGACTTTCCAACGT
+TCCCGGTCTCGTCTAAATGCCACAATGGGCATTTCACCCTCTTTGGCATCCCTTCGACTT
+TGAATCATGGCTTTTTCGATATTGAGGGCTTCGACTCTTTTACATTCGATGTGGATCCCC
+GGGAGGCCAACGACATCGTCTCCTTCGAGCCCACTAAATTGCTGGCCACGTCTGCAATCA
+TATCCTTGATCCCTACAGAGCCGAGCAAACTCGCGCTCACCGGCTGCACCCTTTTCTCGA
+CTGTTTGTCATTGCGCTCTTTTCAACTCCTGTTCGTGCTCAGCATCGTAGATCGTCATTT
+GATACTCGGCTTCTCTAACGGCCTCAGCAAACTTCTCAATCCCGTGTTCCCAAAGCCCGT
+GCCGGTGGATGACGTCGGAAAACTCTTCTACGTCATGTTCGCGAAGATACCAATTGTCCG
+GATCATCTTTCTTGGCCCATTCTTTTCTGATGATCTTACCGGTTGAAGGATTGATGACTT
+CCATGCCTGTTTTTCTTTGAATATGGCAGAGCTCATGGTCGAGCAGGGCTTTAAGCTTTT
+CTATTTGCCACGCCTCAAATGCTAGCTCAATAATAAAAATGTGGAACATCTTGCCTGTTA
+GGAATCGCTCAAAGCTTGTACACTTCTTGCATTTGCCTGTCCAGTCAACACCGCTGTCAT
+CCCGAACGTAATACTCTATAAGTTCCTTGGCATCCTTGAGATGTGGGTGATGATCATCAA
+TTAATGCCTCAGCTATTTCTCGAACTCGAGGTGATTTTTCGTAACCCATCTCTTTCCCTC
+CAATTCTTATTTTTACAGGTAAAATGCATCGTATTTCCCCGGCTTTGGCGGCTCAGGAGT
+CTTGTCCCCTGGGTCTCTATTGCGTTTGTAGTCTTTTTGGCGATTACGCTCAGCCTCTCG
+AGCATGAACCTGATCAACGGTCAAGATTCCAGATTCACGCCAGTCTTTGAGTACGCCCCT
+CAGATAGTGCATATTTCGTGCATTAGCATCAAGGCAACACTTAAGGGCTTCGATTACAAC
+CGCGTCCGGATCCGGACTTCCCCGAGTGAAAAACTCATCACAATAGGCCATAATCATGTC
+AGTCTCACCTTTGGGGATTAAACGCCCCCAGTTCTTTTCTGCCCAATTGACTGCCCGGGT
+ACCAATGGCCAAGGATACGATTTCGCTCAAATTGTTCACGTTTTTAGGGGTTTCAGACAC
+AGTTTCCTCGGGTTCGTTCACGCTCTGCCTAATTTCCTTACTTCCGTTGTTGTCGTCATT
+CTCGGCTTCGTTATGAGGGAAACAACAATCAACATTCAATATAGGGGATTCAACATTCAA
+TAAGAGGGATTCCGCCGGGCTCGTCATAACTTTTTCACGGCTAGTAAATACCTTTAAATT
+TTTAGGTTCGTCCTTGCCGTTTATTTTCACGGCTCGTTCATACCTATTTACGGCTTGGCC
+ATTTTCGGGCATATTTGGCAAATCAGACTCACCCTCTTTAGGGTGTGGTTTCTGATGTTT
+CGAAAAATTAACAATCTGAATGCATGAAATCCCATCAACTGTATAGCGAACTATAAACTC
+CGGATCTAATAGGTTAAGGAGTTCATCAACGTTGCAATCGTCATAGGGCAAAACTTCAGC
+TTTAATCCGCTTAGGCCGATCTTCGAGCTTACCCTTACGGTCAGCTAGTCCCCATAGTCC
+GATAAATAGGAGGCGGGCCAGAGGCGGCAGCTCCCCTAATTGGTCGTTTGCAAAAAAGCT
+TGGTTTAATGTTTCGTGCCCTGGCCACTCTTAATCTCCTCCTTAAACCTCAACCAAAAGC
+ATGCTCCCGCAATCCGGGCAATGCTCTTCTTTCCAGCAATCAGCAAGGCCAATTCTTAAA
+TGAATTTTCACCGGCCTGTAGGTCGTGTGGCGACAGTCCATGCAGATCTTGCGCTTACGG
+GCAAATAGGCCCCAAAGTAGATGTCTCATCAGTTTCATAAGCCTCCTCTAAAACGGACAC
+ATTTCCAACTCAATAACCTTCCCTGGCTCCGCGACCTCAACGTCCTTGCCCGTTAATTCC
+CGAATCCCTCGAACCATCCTAAATGCATCTGAATTGCCATCAGAAAGGTGAATCAAAACG
+ATTTTCCGAACCTTTGTTAGGTCATTTGCTTGCAAGAAATCCTTTACATTGTCTAGGCTA
+AAGTGGCTCTCGATCAGCCGGTTCTTTAATGATTCCGGGATCCGCCCGGCCTCAATATTT
+TCCTCAAGGATATCTCGGCAATAGTTGCACTCAACAAGAATGTAATTTAGGTCCCTGAAT
+CTGTTCCGGATGTAATAGGTGTCTGTGGCAAAAAGCAGCTTTTCACCGGTCGGCCAATAT
+TGTATGAGATATCCTAACGGTTCAGCACAATCATGTTCAGTTCGGAATGGCAGGACTGTA
+AAGTCCCTTGTTATAGGGAATTGCTCCCCTGCCCTTACTACTCCAAGACGATGACTTTCA
+ATTCCCAACTTATCGGCTGTCCCCTTACTTAAAAAGGTGTTTACTCCGAACTTAGTAAGC
+TCCTTGACTGACTTTGCGTGATCCATATGTTCATGAGTAATTAAAGCTCCGCGCACATTG
+AACAGATTAAAATTAAGTCCCTTTTGTATCTCTTTGAAGGGGACGCCTGCATCCAAGAGC
+AGGCTCCCCGTTGGTGTTTCTAAAATGTAACAGTTCCCTTTGCTTGATGAGCCGATTATT
+TTAAGTTTCATATTAGAAGTCCGGCCCTGTAGATTGGTGCTCTACCTTGTCATTTTGAGA
+CTCTGGAGCGGGAGGAACCTCAGGCCCCGCTGCTGGTTCGGCATCAATATCAACAACCTC
+TTGATTCGCCTCTTGGGCTATTTCGTTAGCAGCACGACTTTCTGCATCCTCATCTTTGTC
+AGAGGTCAAAGCTGTAGCCATTTCAGTGGACAAAAATCCATAGTGGGACAAGAGCTTTCG
+CATAGCTGTCTTGATGGCCATCTCATCAAAATTCGATTTCCAGGCCGATGAATCATAGCT
+GAAGCTTTTGCTGTAGCGTTTCGCATGCGCAAGTACTTCATCTGCTGTCATGTACACTGT
+TTTGGTAAAGCCATTAGTGAGCTGCATATAGGCAAAGTATCCCTGGGCCTTTGTGCTGGT
+CGGCTCACCAGTAAATTCAACTTCTCCCGTGAGAATGTTCTGCTTAATTTTTACGCCTTC
+TAATAAAACACCAGCATTCAAGAACTTATATTGGCCAGTCCTCATGGCGAGCTGGATGTA
+TCCTTTGTATCCAAGTTGGAACTGAGGGATGTAAACACCCTTTGATTTATAGGGAACAAC
+ATAAGCAAAGCCAAGCTGTTTGTTGATAGGAAGCTTAAGTGTTGCTGCCTTTAGGCACTC
+CATAATAACGGTCTGAGGATCGCATTTTTGCAAGTAGGTATCACTACCATATAGATCAAT
+GATTGAGGCCAGGAAAGCCCCGGAATTCTCATTGAGTGCGTTTTTAAACTGTTCCTTGAC
+GCTATCGACGTTTAAGACAGCCTTAAGTTTGTCCATTGGTTTAACTGTAATGTTGGCCAT
+GTTTATTTAACCTCCTTATTGCTTTTCAGATTTGCAATTTGTTCTGTTATTTGTGCCTTG
+ACAAGGTCCCATGCCTCCTTGTAGGCATCTTCTACAGAATTACCAAGGCACAATTTCAGC
+GGTGACTCCCGCCTCGGCAGTAAACGATTGATGGTTTCCTAGGTTTTTAACATACTTTGA
+AGAAACGCGAATCTCTTTACCGTTCATTCAGCAACCTCCACTCTAAGAACCTTATCCAGT
+TCACTCTTGAAGAGGTTGATAACTTGGCTCTCGGTTTCAATAATTCGGGACACCGACTCG
+CGGAAGTCGATAAAAATTGGGGCTGTAGAACCGTATTGGGATGCGAGTACGTTGATACAA
+TCCAGACCGGCATTAACCTTCCCTGCGTGGTTCACATCTGACCACGTTACCCCATCCACC
+ATAGCCTCGCACATTTCCTTTACGCCGCCATTAATTTGGTCATCAAAGAGCTTCCACTTG
+ACCATCTTGAACCGACTATTGAGGTTGCCTTCCAGTAAATTAACTTTGGCCTTGATAAAT
+CGCTCGAATAAGAATTTCTGCCTCTCAAGCTCACTCAGATGGGCTGCAAGGGTTCGCTCT
+TCGTCCTTGAGCTCTTCGATCCGTTCTTGAGTCTTAATCTGTACATCTCGGTTATTCAGA
+ATCTTATTGAGCGAATTAATCTGTTCTGCGACCTCATTCTTTTGCTTGAGGAGTTCGGCG
+GTCGTGTCTTCGACCGGCTTGTCCAGCTCGTCTTTAATTACTTGCTGCCGAGACAAAAGA
+CTTGTATATTCGGTATCGGCATGATAATTAACTGTGCCAGTAAGGCCCTCCATGTCTTTG
+AGTTCTTTATCAATCTCGGCCAAGCGTTCAGCTATTTCCTGAAGCTTTGCTTCTTTTTGC
+AAAAGCTCTTCGCCGAACTTCGCAGTATCTGCCTCAAGCTTTTCTTTTCGGGCCTTAAGG
+GTCTTCCCTTCTGTATTAATCTTAGTAAATTCATTTTGCTTAGTAGTATTAAAGGCCTCG
+CGCATCTCATAGATCTGTTGCCCAATGTCATCCTCTGGCAGCTCCCTCCTGCATGTAGGA
+CAAATAAAGTTGCTGGGGTCAGGCTCTTCAAAGCCTTTCGAGCTTACCTCATTCCATTTC
+GTCCGGAGGTCAGCCATATTTTTAGATACCCTTTCTATTTCACTTGAAGAACTTTCGATC
+AATTCCTTAAGGGAATAACTTGTGGTCTCAAGCCGGTACTTTTCATTCTCAAGCTGCATC
+TTCTCGTCAGTGAGCCGTTTAGATCCGGCCAAGGCTTCTGTGTCTAATTCTTTTTTTCTT
+GCCCAAATGGCCGTATCAAGCTTGAATAATTCCTGCTGCTTCTGGCGGTATTCATCCGCT
+GCCTGACTGGCATCTAACATGCTTTTCTCGATCTTCCTGAGGACTGCTTTATGTTCGAGC
+AACCTTTCTTCGACTGCTAAATAATTAACATCTTCACTTAGCAGCGTCCGTGAAAGTTCG
+TTTATCTTAATTGGTATTGACTCAATATCTTTGTTAAGCTTCTTAACACCTTCGGCAATA
+ATCTTCTTTTGAGAATCTATCGATTTTCCGTCTAAGATGTCCTGCAATGGTGCTAGGTCA
+TCACTTGAGTCAATTACATCCTGATCCGTGACGTTCCCGCAGATCTCCATAAGTGTTTTA
+CGCCGATCCTCCCACTTGAGCTGGGTGCAAAAGTAAAACGGATTCGTCAGGAGCTTGAAG
+ACATTTTCGTCGATGATAGCGTTGATTTGATCGGTATACTCCTTCTTTTTAACAGGTACA
+GTGTCAATCCAATAAGAGGTTTGATGCCCTGTAAATTCCTTCGTGGATTCACCGCGTTTT
+TTTGTCCAAACCTCTTCGAGCATCTTCCTGAGAATTTTAGGCTTGCCGTTAATGAATAGA
+TGCAGCACAACTTCTGTCTCAAGATAATTAATATCGTTACCGTTCTTATCTTGGGGCTTT
+ACTGAGAAGTCAGCACGGTTAGCAGAATCCTTATTAAATAGCGCCCACAAAAAGGCATCA
+TACAAAGTCGTCTTTCCTGCCCCGTTCTCACCAAAAACAGTGGCATTTTGCCCGTTTATA
+TCGAGGGTAAACTCTTTTATACCCTTGAAGTTCCGGAGCTCCATCTTAGAGAGCGTTATC
+TTGTTCATTTCATTCCACTTCCCAACGATTCAAATTCTTGAAGTTCTGTGCTACAATCAA
+AGTGGTTAACTTCTTTTTGAGCTTCCGCGCCAACGGGAGCTTTTTTCATGCAAAGATTTA
+TGAGTGTTTCACCGTTATAGTCAATAAAATGGAATTCACTCGGTTCTCCACCAACAATCT
+CAACGCCGACATTGCCTCGGTATTCCATGCCTGGGAACATATCCTCTAGGACTCCATTAA
+GATCCTCCTGGTCGGCATCTAACGTTGAGATGATCGTAACTCGCATAAGTCCATTCCCGT
+GGAAATCTATACTTGCCTGGGACACTAAATGGTTATGGTTTTTGGCCAGGCCCTGAATAT
+CTAAAAGTTGACCTGCTGTGAGTTGTTTCATTTCATCCCTCCACCTTTAATTTTCAATCC
+AAACTTCCAATTCCCATATTCCGAACTCTATAGCATCACTCCGTTTCTCCATGTAAAGGT
+CTAGCCTATTCCCTCGTATTGCGCCGCCCCGATCCGTGACCGTGTAGGTATGTTCAAGCT
+TTGGGATATAGATCTTGGTTCCGAAGGGTAAGCTCGGATCGGCAGCTATCGTCCAACCCT
+CTTTGACCGGTTCACCGCTGGCTGTGATTCCTTTGCCGTCCCTTCCTCTGTCATTGGCCG
+TGTAGGCCGTGACGATCATAATTCGTCGTTCATGTTTTGTAGTTGTTCCTCGGCTAATTG
+GCTTTACGGAGACCAATACCGGCGGAGACTGTTTGATTGATTGCGGCAGCTCTGGACAAA
+TAGCGTTCGATGGTGTTAAACATAAGATCGCTGCCATTAATGCGATAACAAAAATCCTTC
+GAACTTTTGATCACTCCTTTTCTAAAGAGTTTTTCGACGTAGGCGCATACTATTGCAAAT
+TGGCATTTTGTCTTATCACGCTGCCCTGTGCATCCCCCGCATGTTTCTAGATGTTTGAAA
+AAGCGTTCACAGGTCATTATTGAGCCTTCTTCCCTTTGTATTGTCCCTCCATCGCATATA
+CTTTTGATAGTGATTTAACTTTCGCTTGGGCTGCTCAGTGATAATTGGGGTAAATGTAAT
+TGTGAATAGTCCTGTTGCCCAGTATCCTTCTGGCCCACGCTCCCACCTCATCCCACATCC
+ATCAATTGGACACCTAGCTCCTGTTTTACCTACCGGAAACATCATGGCTTGTCCACACTT
+ACAGAGTGGAGTTAACCCAATTGCTTCACTCAAAGTACCTCCCTCCTTTATGCAACATCG
+ACTTCTTCCTTCGCCTCTTCCTCGGAATCAAAACTTCCAGCAAACTTTCCGTCTATCCAG
+AGCTCTACATATCCCCGCTTCTGGATGATCGTATACGACATGGCATCACCTCCTTAATAA
+ATTGTTTTCCCTACTTTCCCCGGATGACCTATTCAAATAGATGGCATTATGAATTAATCA
+CATATTGCCCTTATTTTCCCCTCTCTCGGCATCCTCTTTAAGCAGTTGTTTAAGAACCAA
+TCCGGCTAACAAATTGATTCCTCTTTCTGGGTTAGGGTGTGGGATATAACTGACCGTAAG
+ATTAACTGTGATTACCTGGGGCTTACGTGGCATTCTCCCTTCCTCCTCTCGTGGAATTCA
+TTTTCGTCGGATTCGTAACGCTTCGCTTTGTTGCTATTTTCCTCAAAAAAAAGAGTCCAT
+TTAAAGTTCAACACTTCTCCAATTCTTTGAGCAACTTTTACGCTAGGCGTTCTTTCACCG
+TTCTCAATCATGCTATAATATTGCCTTTTTACTCCAACCATTTTTGCGACCTCTTCATGC
+GTCATATCAGCATTTATGCGTATGTTCGCTAGCCAGAATCGAGTCATCATCACCACATCC
+GTCTGTAAATTCCTAGCAACACTAAGTTGCTGTGCCTTCATTATATAGCAACATAACGTT
+GCTGTAAATATTTATGGCAACAATTTGTTGCTAAGTCTTTACGCAACATAAAGTTGCCAT
+TATAATGAATTAAAAGCAATAATATTACAGGAGGCCTAGAAGATGTTTCCTGACAGACTT
+TGTACGCTAAGAACTTCAAAGGGTTTAACACATCAAGATATGGCTGATATGTTAGGAATT
+ACGCGGCAAGCGTATAGTAACTACGAGGCAGGGAAAAGAGAACCAGATCACAGCACTTTA
+AGAAAACTGGCTGAGTTTTTCATAGTCTCAACGGATTATTTACTTGGGCAAGACAATGGT
+AAGATCGTTCCCTCATGGGCAACAGCTAAAGATAAACGAGATTTTAAGAAAATGCTCGAA
+GATGATGATGATTTAATGTTTGATGGAGTTCCTATTGAGGGTGAGGATCGACAACGGATT
+AAAGATGTTCTTACCGGCCTTTTCTGGGAAGCTAAACAAATGAACAAACGAAAAAAGAAA
+TCTGACAGCACGAACGACACCAAGAAATAA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_019897.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_019904.fasta.fasta
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_019936.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_019936.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,550 @@
+>NC_019936.1|provirus_2347508_2361929
+TCAGACTTCCAGCTCTAACGTCAGATCGCCCGACGCGCTGACCTTCGCGCATGGCGTCGC
+CTTCTCCAGGATGAAATGCGCCAATTCGCTGTCTTTGATTGGCATGCGTCCCTGCCTGAC
+CAATAACTTATTGATTTCTATGCACTTTTGTCTAAGCGCTTCTTGCTCTGTATTCGACAG
+ACGCAGGGTGGCAGGCATCGTCAGTTGACCCATATCAAATTCACCTCGTGAAGTGTACGT
+GCATGCATGTGATTTGTATTGACGCATGCAAGTTCACCGGTATACATTCCGCCGCAATGT
+GATTTGCATGCATGCATGCATAGGCGAATGGACTTCACAAATGCTCGACAAAATCCACCT
+CTTCGTACCGTTTCGGGTCGATGCCATCGCTACCAGCACCGGTAAGCGCGGCAACGAGCT
+GTTGGTGGTCGATCTGGAAGCCCTGGGCGTTCCGCTCCGTGCTACCAGCGTCCTTTCGGA
+CGGGAAGGGTGGTTATCAGGTCGAGGACATAAGCCACGCTTGGGAATCTCTCTCCACTGG
+CTTTACGCCGTTGGCGTTCAAGGTCTTTCACCAGTCGCTCGGCAAGCGCATTCAGCCCGG
+CGTCGAGCTGAAAGCCAGCCCTGCGAAGCTGCTCCAGGGGCACAACGTCTTCGGGCCTAC
+CTCGATCCGCAAGGGCGGGGAGGTCATGTTGAAGTGGCTTGCCGGCTCATATCCGAAGCT
+GTGGGCCTTGCTGGACTGGCAGGCTGCTGAGGTTTACGGGATCGACTGCACCTATTCCGC
+TCGCCTGCCCGATCAGCGCACCGCGCTACAGCTCGTCCAGGCACTTCGCGGCGTTAGCAA
+CGGCCAGACTCGCAACCGTGGTGACGACTACGAAACCACGGCTTATTGGGGCTCCAAGGA
+AACCCGCCTGCGCAAGCTCAAGGCGTACCTCAAGGGCCCTGAGTTTCGCCGCCAGCTCGA
+TGATGCCATCAAGGCCGCCAGAGCCTATGGCGGTGCCAATTTCGTTCCCTCCCAAGCGTT
+CGCAGCCCACCGGCTGCTCTCGGTTCTCCAGAATCCCGCGCTCCAGGAGTGGGCCGAAAA
+CCTCCTTCGTCTCGAAGCCACTGTCATGCACCGCTGGCTCGAACGCAGAAACATCCCGAC
+GAATCTATGGGCCCTTTGCGACTACCAGGAACGGCTGGAAGAGCAGGGGAGTTGTTTTAT
+TCAGTGGTGTTGGGAACAAGTAACTAAAGAACTGTTTGCGGCCTTTGAAGGTATCTCCAT
+GCGAGTAATTAATGACGAAAAAGTGCTGGCCGCACTTAAAGCCCGTTGGACGAAGTTCGG
+AAAGAACGGGAAAGCCAATGAGACAGTTGCTCTCAACCTGTTTCGCACATATCGCAGTAT
+CAAGGATTACGGTTGGCAGGAAACCATGGACTCTATGTCTCGTGCGACTTTCTACCGCCA
+CGTTGATCAGATTTGCGAATGCGGACTTTCAAAAGCTGCACTTCAGAAGTTGAAGATGGA
+CGATCAGAAGAACAACGTTGTTCCGATCCTGCGCTTCCTGCAAGTTGACTTCAGCGCTCA
+GCGTCCTGGTTGGTACGTTGAGCCGTCCGTGGAGGCTGCATGATGCGTTCTTGGGCCTAT
+CTCCGCGGCTTTCGTGATTACCGGCCACGCCGCATTTATTGCAATCCGTACCTGCTTTGC
+AGTTACGACTACAACGAATATGAGCGTGGTTGGTTTCAGGCTCATAAGCGCACCGGGCTT
+TTTTCATGATCGCCGCGACTATCAACGCCCTGGTCGTCACTATGTGCGGACTGTTGGTAA
+TTCACTTTCTCGGGCGCTGGGCCCGTTCATAACCGAGGTAATCACCATGCTTGTACAACT
+GGGCCTGTGCAAAGGCGTCACTTCCAAAGAAAAGCAAAACGGCATCATCGAACATTACTT
+GGTCCTTACCGCTCCAGGTAAAGACCAATTCGGTCAAGAAACCGAACAGTCGGTCGGCCT
+GAAAGTCTCCAAGCGTCAACTCGATTCAGGCATCGAGAATGCCTATAAGAAATACATCGG
+CCAGCAAGTTGCTGTTCCGGTATACGCCAAAGCCTGGAAGTCCAAAACTGGCACCGCTTT
+CGGCATGGACCTGTGGCTCTCCGATGACGGCCTGCCTGTTCCAGTTCAGCGCGTACAACC
+GCGTCCTGCTGCTGTATCTGGCGGCAACTGATGACAACCGGCGCTCTCATCTGTGAAGGC
+CAAGTAACCATCGCAAATGATGGCGCTCCCCTGTGTTCTGGTATGTGGCAATTAATGGCA
+CTACCACAACCTTTCGACCCATCCCAGTTACAACCTGCCGAACTGGGCGCATTGTTTGGG
+TACGGCTTCGGCTTAGTTGCTGGCTGCTGCATCCTGGGCATTGTGGGTCGATTGTTTCTT
+AACGCTATATACAACCCAAGCAAGGAGTAACACCATGGAAGCAATGATCACTGCAATTAC
+CGGTGCTGTTGACTGGGCTGCTGTTATCACTGGCGCTGGCACCATCTTTGGTGCGCTCGC
+CCTGGTCTATGTCGCCTTCAAAGGTGGCCAGATGCTCGTCAACGTCCTGCGCCGCGGTTA
+ATCCAGCGTGCGTTGAACTGGGGGCCTCGGCCCCCTTTTCTTTTTCGGCGGGGGATATTC
+AATGGCCGATTTATATCAGTGGACGTTCTTTGTTCTCGGTTGCGTTTGTGGTTACGCCAT
+CTTCGGGAGGCTCTAATGTTCCGCCTTCTATTAGCTTTTTCTCTCTTGGTCATATCCATC
+ACTGCAAAGGCTGAATCCTACTATTGGATCATTTCCTTTCCTGCTGACAATGCTAGGTAC
+GTCACTGCTGTTGCGGCTTGTAATGCAAACCATACCTATTACCAGCAACTTAACCCCGGT
+TACGACAGATATGATCAAAGGGTTGTAGTTGGTGAAACTTCATTTTATTGCGAAACCACT
+GGTTTGCGGCGTAATGCTCAGGGTGTATACGAGCCGTATGGTAGATGGGGAAACACTGCT
+AACCGTCGTGGAGATTCTTGCCAGCCGGGTGAAAACTACGACCCTAATGTTGGTGGTTGT
+GAGGTTCCCCCAGGTGAAATGGGCGAAGCGTGTGAAGGTCCTGATCCTGGCTTAACTAAG
+TTCGGCTATGTCTACAACTCCCAAGGCCAGTGTGTTGACTACACCCGAGCCGATACAGCA
+TCACAATGCAAACTACTCGCTGGAACGTCAGCACCAACTAAGATTGCGGTTGTATTTAAC
+GATGATGGATCGCCTCAGATCCCGCCGCCAATGAATGTCGGTGGCTGCGCGGGCATCGTT
+GCCTCTGTGGAGCATTGCGAAATGGCACCAGTTCGCTGTGGTGGTGCGTCTGGTAATTCC
+TGCATGCAGTCTAGTGTCAATACCTGCAAAGTCCTTGTTTCGTTCTCTGGCGCTGTCTCT
+GGTGACGGTAAGCCGCTTGTCATTAAGGGGCATGAAGGCTCCGAAGAGGGCGTTTGCCAG
+CCGGGAGATGCGTGTGATCCTGCACCTACGCCAATTCAAAATGAGGAAAAACCCTGTGTT
+TATGTCGAGGACGGGGAAGGTAGGCGTGTTTGTGATTCCAATAAATGGACGGGGCAACCC
+GGTGAAAAAAGCTGCGGTACTGTCAATGGTCAGCTTACTTGTATAGGCAAATCGCCGACA
+TCGAACGGCATCAGCATTGGTACTGTCGTTGAGGAAAAAGCCAACGTCGACGGCACCAAG
+ACAGTTACTAAGACCGACGTTCATAACGAAACCAAGTGCATTGGTGCGGGTAGTTGCAAG
+ACCGAAACCACGACCAACAAAACCGTCATCGTTAAAGACTCTGCGGGTAACACTATCGGG
+CAGTCTGGAAGCTGCACCGGTCCTAAGTGTGCAACTGATGGCAAGGGCGACAAGAATGGT
+GATGGTCTTGATGATTGTAAGTCGGGCGAGGATTGCACCGATGAAGAGGAGTTCGAAGGC
+CCAACTAACGGCGACGCTGGAAGTTTTGGCGATAGCCTTGGCAACTTCACCTCACGTGTT
+AAAGGCGCTCCGATCATTGCGTCCGCATCAAGTTTGACGTTCGCGTCTGGCGGCTCGTGC
+TCGATGCCTTCTTTCTCTGTGCCAGTTCTCGGCACGCTTTCGTTTCAGCCTATGTGCCAA
+TGGGCAGCTGATTGGTTCGCACCAATTAAAATGATCATGCTCGCGCTTTGGGCGCTTGTT
+GCTGTTCGCACCTTCTTGGAGGCCTAATTATGCTTGCCGACTTCGCGCAGTGGCTCAAAG
+ACTTCTTCCTTTGGTTGCCGCTCAAGATATGGGAAATGATGCTCGATGCTCTCGCGAGCG
+TCATTGAGGCTCTTCCTGTCCCCGACTTCATGTCGAACGCTCAAGGTTATATGTCCAGCG
+TCGGAGGTAATGTTCTTTGGGTGCTTGATCTGTTTGCCGTTCCCCAGGGCATGGGCATGG
+TTATGGCGGCTTTAGTGCTCCGCTTCATTGTTCGCCGCATTCCGATCATTGGGTGATATA
+TGGCTATCGACGCTTATGTTGGCCTTCCTGGTAGTGGCAAAACTTATTCGGTCGTTAAGT
+TTGCGATCCTGCCCAGCCTCAAACAGGGCCGTTTAGTTATCACGAACATCCCCCTCACTG
+ATCTTGCCCATCAGGATTACCCCGACCAGATACGCCAGCTCCCGCATAACTGGTATCAGG
+ATGAGAAACTGTTTGAGACTGTCCCTAATGGCGCTGTTGTTGTCCTCGACGAACTTTGGC
+GTCGATGGCCGAAGGGCATGCCCGCTGCCAAGGTTCCGTTTCGCGATAAAGAGTTTCTCG
+CCGAGCATCGGCACTTGGTAGACGAGGAGGGCAACAGCACCCGAATCGTCCTCGTTACTC
+AAGACCTGGACCAGATTGCCGCTTTTGCCACCATGCTTGTCGATACCACTTATCAGAGCG
+TCAAGCTGTCCGCCCTCGGAGCTAACAAGAAGTTTCGTGTTGATATCTACCAGGGCGCAG
+CAAAGGGTCAGAGGCCTCCTAAATCTCGGCTTCTTCGCTCGACTTATGACCGCTACGAAA
+AGTCGATTCACCAGTACTACCAGAGTGCTACCAAGAGCCTTACGGGCGTTGTTGGTGACG
+AATCCAGGGCGGACAAGCGTGCAACCATCTGGCGATCGCCGCTCATGATCTTCACCTTGA
+TATCTCCGTTTCTGATTGGCTTCCTGGTCTGGCAGATCGTGCAGTTTTTCGGCAACGGCA
+TGAGCTTCTCGAAGCGGGAACCAGAACCCGACCCAGTTGAGGCTCTAGCCGATATGCCCC
+TGGTCAACCCTATGCCTGCCGATCTGGCTCCTGCTGTTATCCAACAGCCGCAACAGACTC
+AACCGGCGCAGCGTGGTTATTCTGCCGTCTGGCGTGTCTCTGGCCACATCAAGCGCAAAG
+ACCCTGACACGAACAAGATGCGTGACGTGGTCATGCTTTCGTCACTCAGTGGCATTCGAT
+ATGAGCCTATGGAGAACTGCGAGCCCATCAGCATGGGTTTCGAATTCCAATGCGAGGTTG
+ACGGTGATTTGGTCACGCCCTGGTCTGGTCCGATCAACCAGAACATGACGGGCTATGTTC
+TTGGAGGGGCAACCCAATCCGTTGACGCTGGCAAGCAAGCGGTAGGACTTGGCGGCGAGC
+GTAGCGCTGCCGTCGAAGGACGCACCGCGCAGCCATCCGTTAATCCGATCTGATGCATAC
+GACTCTTCATCGCACACGTTCTGATTGGGCGCTTCGCATAATGGATGGCCTTATGTTGAG
+CGGTGTCCGGACAATGCCTCTGGCTCCGGGCGCCGGTTAACATAGGGCCGATTATGCGCT
+GCGCTATCGATCTCGAATCCCGCCTCATCAAAACCGCCGAGCTGTATGCGCCGGGCCGCA
+AGGGTTCCGACGCCGTGACTTGGATTCTCGACGACTACCCACGACTTGTTGCCGAGATCC
+GTGATCTGAGAAAGCGAGTCGCCCAGCTCGATGACGAAGGTGCCCAGCTCGATGCAGTCC
+TTCAGGAGCTGCGTCAGATCGCTGAGCGAATCAATCATCTCTGACCTGTCCCCCTGGCCT
+CGACCTCGCCGCTCGCGGCGATTAGTCGCCTGCACTGCTTCCTGTCGTGCTGCATAGCGC
+CTGCGACGATACCCCCGAAGGGGCCGCAACCATCGACCCACAAAAAAGCCCCCAGCGGCC
+TGTATGGCCCTCTGGAGGCTTCTCGCGATCTTCGTCCCACCGTCCCCCCACCAGCTCAAC
+CCGCGCCCCGATCTGCCCAAATGGAACAGCTCCAGGGCTTCTCTCTGCCGCTCTCCCAGG
+ATCATCAGCACCGCTGACGGTTAGGTCACGAAGTTGCAGTGGTTCCGCCGCGCTTTGGCT
+TCACCGGCGCAGCCGGGTCCACCATCTCTAATGGTGGACTCTTGTCTCATGGTGAGACTT
+TTGGGGTGGTTTTCAGACTTCCAGCTCTAACGTCAGATCGCCCGACGCGCTGACCTTCGC
+GCATGGCGTCGCCTTCTCCAGGATGAAATGCGCCAATTCGCTGTCTTTGATTGGCATGCG
+TCCCTGCCTGACCAATAACTTATTGATTTCTATGCACTTTTGTCTAAGCGCTTCTTGCTC
+TGTATTCGACAGACGCAGGGTGGCAGGCATCGTCAGTTGACCCATATCAAATTCACCTCG
+TGAAGTGTACGTGCATGCATGTGATTTGTATTGACGCATGCAAGTTCACCGGTATACATT
+CCGCCGCAATGTGATTTGCATGCATGCATGCATAGGCGAATGGACTTCACAAATGCTCGA
+CAAAATCCACCTCTTCGTACCGTTTCGGGTCGATGCCATCGCTACCAGCACCGGTAAGCG
+CGGCAACGAGCTGTTGGTGGTCGATCTGGAAGCCCTGGGCGTTCCGCTCCGTGCTACCAG
+CGTCCTTTCGGACGGGAAGGGTGGTTATCAGGTCGAGGACATAAGCCACGCTTGGGAATC
+TCTCTCCACTGGCTTTACGCCGTTGGCGTTCAAGGTCTTTCACCAGTCGCTCGGCAAGCG
+CATTCAGCCCGGCGTCGAGCTGAAAGCCAGCCCTGCGAAGCTGCTCCAGGGGCACAACGT
+CTTCGGGCCTACCTCGATCCGCAAGGGCGGGGAGGTCATGTTGAAGTGGCTTGCCGGCTC
+ATATCCGAAGCTGTGGGCCTTGCTGGACTGGCAGGCTGCTGAGGTTTACGGGATCGACTG
+CACCTATTCCGCTCGCCTGCCCGATCAGCGCACCGCGCTACAGCTCGTCCAGGCACTTCG
+CGGCGTTAGCAACGGCCAGACTCGCAACCGTGGTGACGACTACGAAACCACGGCTTATTG
+GGGCTCCAAGGAAACCCGCCTGCGCAAGCTCAAGGCGTACCTCAAGGGCCCTGAGTTTCG
+CCGCCAGCTCGATGATGCCATCAAGGCCGCCAGAGCCTATGGCGGTGCCAATTTCGTTCC
+CTCCCAAGCGTTCGCAGCCCACCGGCTGCTCTCGGTTCTCCAGAATCCCGCGCTCCAGGA
+GTGGGCCGAAAACCTCCTTCGTCTCGAAGCCACTGTCATGCACCGCTGGCTCGAACGCAG
+AAACATCCCGACGAATCTATGGGCCCTTTGCGACTACCAGGAACGGCTGGAAGAGCAGGG
+GAGTTGTTTTATTCAGTGGTGTTGGGAACAAGTAACTAAAGAACTGTTTGCGGCCTTTGA
+AGGTATCTCCATGCGAGTAATTAATGACGAAAAAGTGCTGGCCGCACTTAAAGCCCGTTG
+GACGAAGTTCGGAAAGAACGGGAAAGCCAATGAGACAGTTGCTCTCAACCTGTTTCGCAC
+ATATCGCAGTATCAAGGATTACGGTTGGCAGGAAACCATGGACTCTATGTCTCGTGCGAC
+TTTCTACCGCCACGTTGATCAGATTTGCGAATGCGGACTTTCAAAAGCTGCACTTCAGAA
+GTTGAAGATGGACGATCAGAAGAACAACGTTGTTCCGATCCTGCGCTTCCTGCAAGTTGA
+CTTCAGCGCTCAGCGTCCTGGTTGGTACGTTGAGCCGTCCGTGGAGGCTGCATGATGCGT
+TCTTGGGCCTATCTCCGCGGCTTTCGTGATTACCGGCCACGCCGCATTTATTGCAATCCG
+TACCTGCTTTGCAGTTACGACTACAACGAATATGAGCGTGGTTGGTTTCAGGCTCATAAG
+CGCACCGGGCTTTTTTCATGATCGCCGCGACTATCAACGCCCTGGTCGTCACTATGTGCG
+GACTGTTGGTAATTCACTTTCTCGGGCGCTGGGCCCGTTCATAACCGAGGTAATCACCAT
+GCTTGTACAACTGGGCCTGTGCAAAGGCGTCACTTCCAAAGAAAAGCAAAACGGCATCAT
+CGAACATTACTTGGTCCTTACCGCTCCAGGTAAAGACCAATTCGGTCAAGAAACCGAACA
+GTCGGTCGGCCTGAAAGTCTCCAAGCGTCAACTCGATTCAGGCATCGAGAATGCCTATAA
+GAAATACATCGGCCAGCAAGTTGCTGTTCCGGTATACGCCAAAGCCTGGAAGTCCAAAAC
+TGGCACCGCTTTCGGCATGGACCTGTGGCTCTCCGATGACGGCCTGCCTGTTCCAGTTCA
+GCGCGTACAACCGCGTCCTGCTGCTGTATCTGGCGGCAACTGATGACAACCGGCGCTCTC
+ATCTGTGAAGGCCAAGTAACCATCGCAAATGATGGCGCTCCCCTGTGTTCTGGTATGTGG
+CAATTAATGGCACTACCACAACCTTTCGACCCATCCCAGTTACAACCTGCCGAACTGGGC
+GCATTGTTTGGGTACGGCTTCGGCTTAGTTGCTGGCTGCTGCATCCTGGGCATTGTGGGT
+CGATTGTTTCTTAACGCTATATACAACCCAAGCAAGGAGTAACACCATGGAAGCAATGAT
+CACTGCAATTACCGGTGCTGTTGACTGGGCTGCTGTTATCACTGGCGCTGGCACCATCTT
+TGGTGCGCTCGCCCTGGTCTATGTCGCCTTCAAAGGTGGCCAGATGCTCGTCAACGTCCT
+GCGCCGCGGTTAATCCAGCGTGCGTTGAACTGGGGGCCTCGGCCCCCTTTTCTTTTTCGG
+CGGGGGATATTCAATGGCCGATTTATATCAGTGGACGTTCTTTGTTCTCGGTTGCGTTTG
+TGGTTACGCCATCTTCGGGAGGCTCTAATGTTCCGCCTTCTATTAGCTTTTTCTCTCTTG
+GTCATATCCATCACTGCAAAGGCTGAATCCTACTATTGGATCATTTCCTTTCCTGCTGAC
+AATGCTAGGTACGTCACTGCTGTTGCGGCTTGTAATGCAAACCATACCTATTACCAGCAA
+CTTAACCCCGGTTACGACAGATATGATCAAAGGGTTGTAGTTGGTGAAACTTCATTTTAT
+TGCGAAACCACTGGTTTGCGGCGTAATGCTCAGGGTGTATACGAGCCGTATGGTAGATGG
+GGAAACACTGCTAACCGTCGTGGAGATTCTTGCCAGCCGGGTGAAAACTACGACCCTAAT
+GTTGGTGGTTGTGAGGTTCCCCCAGGTGAAATGGGCGAAGCGTGTGAAGGTCCTGATCCT
+GGCTTAACTAAGTTCGGCTATGTCTACAACTCCCAAGGCCAGTGTGTTGACTACACCCGA
+GCCGATACAGCATCACAATGCAAACTACTCGCTGGAACGTCAGCACCAACTAAGATTGCG
+GTTGTATTTAACGATGATGGATCGCCTCAGATCCCGCCGCCAATGAATGTCGGTGGCTGC
+GCGGGCATCGTTGCCTCTGTGGAGCATTGCGAAATGGCACCAGTTCGCTGTGGTGGTGCG
+TCTGGTAATTCCTGCATGCAGTCTAGTGTCAATACCTGCAAAGTCCTTGTTTCGTTCTCT
+GGCGCTGTCTCTGGTGACGGTAAGCCGCTTGTCATTAAGGGGCATGAAGGCTCCGAAGAG
+GGCGTTTGCCAGCCGGGAGATGCGTGTGATCCTGCACCTACGCCAATTCAAAATGAGGAA
+AAACCCTGTGTTTATGTCGAGGACGGGGAAGGTAGGCGTGTTTGTGATTCCAATAAATGG
+ACGGGGCAACCCGGTGAAAAAAGCTGCGGTACTGTCAATGGTCAGCTTACTTGTATAGGC
+AAATCGCCGACATCGAACGGCATCAGCATTGGTACTGTCGTTGAGGAAAAAGCCAACGTC
+GACGGCACCAAGACAGTTACTAAGACCGACGTTCATAACGAAACCAAGTGCATTGGTGCG
+GGTAGTTGCAAGACCGAAACCACGACCAACAAAACCGTCATCGTTAAAGACTCTGCGGGT
+AACACTATCGGGCAGTCTGGAAGCTGCACCGGTCCTAAGTGTGCAACTGATGGCAAGGGC
+GACAAGAATGGTGATGGTCTTGATGATTGTAAGTCGGGCGAGGATTGCACCGATGAAGAG
+GAGTTCGAAGGCCCAACTAACGGCGACGCTGGAAGTTTTGGCGATAGCCTTGGCAACTTC
+ACCTCACGTGTTAAAGGCGCTCCGATCATTGCGTCCGCATCAAGTTTGACGTTCGCGTCT
+GGCGGCTCGTGCTCGATGCCTTCTTTCTCTGTGCCAGTTCTCGGCACGCTTTCGTTTCAG
+CCTATGTGCCAATGGGCAGCTGATTGGTTCGCACCAATTAAAATGATCATGCTCGCGCTT
+TGGGCGCTTGTTGCTGTTCGCACCTTCTTGGAGGCCTAATTATGCTTGCCGACTTCGCGC
+AGTGGCTCAAAGACTTCTTCCTTTGGTTGCCGCTCAAGATATGGGAAATGATGCTCGATG
+CTCTCGCGAGCGTCATTGAGGCTCTTCCTGTCCCCGACTTCATGTCGAACGCTCAAGGTT
+ATATGTCCAGCGTCGGAGGTAATGTTCTTTGGGTGCTTGATCTGTTTGCCGTTCCCCAGG
+GCATGGGCATGGTTATGGCGGCTTTAGTGCTCCGCTTCATTGTTCGCCGCATTCCGATCA
+TTGGGTGATATATGGCTATCGACGCTTATGTTGGCCTTCCTGGTAGTGGCAAAACTTATT
+CGGTCGTTAAGTTTGCGATCCTGCCCAGCCTCAAACAGGGCCGTTTAGTTATCACGAACA
+TCCCCCTCACTGATCTTGCCCATCAGGATTACCCCGACCAGATACGCCAGCTCCCGCATA
+ACTGGTATCAGGATGAGAAACTGTTTGAGACTGTCCCTAATGGCGCTGTTGTTGTCCTCG
+ACGAACTTTGGCGTCGATGGCCGAAGGGCATGCCCGCTGCCAAGGTTCCGTTTCGCGATA
+AAGAGTTTCTCGCCGAGCATCGGCACTTGGTAGACGAGGAGGGCAACAGCACCCGAATCG
+TCCTCGTTACTCAAGACCTGGACCAGATTGCCGCTTTTGCCACCATGCTTGTCGATACCA
+CTTATCAGAGCGTCAAGCTGTCCGCCCTCGGAGCTAACAAGAAGTTTCGTGTTGATATCT
+ACCAGGGCGCAGCAAAGGGTCAGAGGCCTCCTAAATCTCGGCTTCTTCGCTCGACTTATG
+ACCGCTACGAAAAGTCGATTCACCAGTACTACCAGAGTGCTACCAAGAGCCTTACGGGCG
+TTGTTGGTGACGAATCCAGGGCGGACAAGCGTGCAACCATCTGGCGATCGCCGCTCATGA
+TCTTCACCTTGATATCTCCGTTTCTGATTGGCTTCCTGGTCTGGCAGATCGTGCAGTTTT
+TCGGCAACGGCATGAGCTTCTCGAAGCGGGAACCAGAACCCGACCCAGTTGAGGCTCTAG
+CCGATATGCCCCTGGTCAACCCTATGCCTGCCGATCTGGCTCCTGCTGTTATCCAACAGC
+CGCAACAGACTCAACCGGCGCAGCGTGGTTATTCTGCCGTCTGGCGTGTCTCTGGCCACA
+TCAAGCGCAAAGACCCTGACACGAACAAGATGCGTGACGTGGTCATGCTTTCGTCACTCA
+GTGGCATTCGATATGAGCCTATGGAGAACTGCGAGCCCATCAGCATGGGTTTCGAATTCC
+AATGCGAGGTTGACGGTGATTTGGTCACGCCCTGGTCTGGTCCGATCAACCAGAACATGA
+CGGGCTATGTTCTTGGAGGGGCAACCCAATCCGTTGACGCTGGCAAGCAAGCGGTAGGAC
+TTGGCGGCGAGCGTAGCGCTGCCGTCGAAGGACGCACCGCGCAGCCATCCGTTAATCCGA
+TCTGATGCATACGACTCTTCATCGCACACGTTCTGATTGGGCGCTTCGCATAATGGATGG
+CCTTATGTTGAGCGGTGTCCGGACAATGCCTCTGGCTCCGGGCGCCGGTTAACATAGGGC
+CGATTATGCGCTGCGCTATCGATCTCGAATCCCGCCTCATCAAAACCGCCGAGCTGTATG
+CGCCGGGCCGCAAGGGTTCCGACGCCGTGACTTGGATTCTCGACGACTACCCACGACTTG
+TTGCCGAGATCCGTGATCTGAGAAAGCGAGTCGCCCAGCTCGATGACGAAGGTGCCCAGC
+TCGATGCAGTCCTTCAGGAGCTGCGTCAGATCGCTGAGCGAATCAATCATCTCTGACCTG
+TCCCCCTGGCCTCGACCTCGCCGCTCGCGGCGATTAGTCGCCTGCACTGCTTCCTGTCGT
+GCTGCATAGCGCCTGCGACGATACCCCCGAAGGGGCCGCAACCATCGACCCACAAAAAAG
+CCCCCAGCGGCCTGTATGGCCCTCTGGAGGCTTCTCGCGATCTTCGTCCCACCGTCCCCC
+CACCAGCTCAACCCGCGCCCCGATCTGCCCAAATGGAACAGCTCCAGGGCTTCTCTCTGC
+CGCTCTCCCAGGATCATCAGCACCGCTGACGGTTAGGTCACGAAGTTGCAGTGGTTCCGC
+CGCGCTTTGGCTTCACCGGCGCAGCCGGGTCCACCATCTCTAATGGTGGACTCTTGTCTC
+ATGGCGAGACTTTCCTTTGTGGCTTTTCTCGCTTCAAACCCTTGCGCAGCAAGGGCTTGA
+AGGTTTTTTCCTTTAAATCCTCGCGCAATCCATTGTGTACGTACAAATGTTTATGTAAAT
+TTGCGCCTAACTCAGCTTGGTGATGCGTATGACTGCCGATGACCGTGGCAACTCTTTCCT
+TCGTGATCTTCGCGCTCAGCTTGGTCGTGATCCAGAAACCGGCCTTACTGCCGATGAATC
+TACGCGCGAGCGGGTAAATCAGATTCTTGCGAACTTGGCCGACAACGAAGACGCTCGCGT
+GAATTTCCGCATCAATTCTGCCGTGAAAGAAGAGTTTGAGCGTCTTTGCCAGCAGCGAAG
+CTCAACCCTTAGCCGCGAGCTTCGACGCTTCATGATTCAAGCGATCAGCCGTCAGCGCTT
+CTGGCAGCAATAGGAGGAGGGCGCACCCCACCCTGAGGGCATGCCTTAAGAAGCCCTCCA
+GCGTCAAATTAGAGGCCTTGTGCCTTAAGAATCGAGCCCGAGCGGGCTAGATGCTGCCCT
+AGGGAGCGCCAACTCCCCAGGGTAGCTACCAATAACGATCTAATAAGGAGATCGATATGG
+CTGCTTCGAATGTTACTCAAGTACAGCGCAATGCTTGCGTTCACGCTTTTGGTTCCTTTG
+GCCAAAATCAGGTCCAAGCTGAAAAAATATCATGTTGGAAAGATGGTTCTTTCTCCGCTG
+ACCCGTTCGTTTTCCTAGGGCGTCGTATTCGAGTCGGCGAACAGCTTCAGGCATGCTATG
+ACGATGAGCGCGGCTTGGTTGAAGAGTCGTATGTGTACGAGGCGAAGGTTGTCGCGGTCC
+ACATAGGCTCGGCTGCTGACGGCATCGAGAGTTCGCTGCTTTTGCGCCCGAACGACGTAA
+ATCACGAAAACTACGTTGATATCTCCAGGCTCACAGTTCTGGAGGTGCTTGAGTGAAACC
+CTTAATGCTCGGAACCTTGTCCAGAGTACCAGCAGCACGTCTGCTGCAACTGGGCGAGTG
+CCCGCAGCCCATCAGCATGGGTTTCGAATTCCAATGCGAGGTTGACGGTGATTTGGTCAC
+GCCCTGGTCTGGTCCGATCAACCAGAACATGACGGGCTATGTTCTTGGAGGGGCAACCCA
+ATCCGTTGACGCTGGCAAGCAAGCGGTAGGACTTGGCGGCGAGCGTAGCGCTGCCGTCGA
+AGGACGCACCGCGCAGCCATCCGTTAATCCGATCTGATGCATACGACTCTTCATCGCACA
+CGTTCTGATTGGGCGCTTCGCATAATGGATGGCCTTATGTTGAGCGGTGTCCGGACAATG
+CCTCTGGCTCCGGGCGCCGGTTAACATAGGGCCGATTATGCGCTGCGCTATCGATCTCGA
+ATCCCGCCTCATCAAAACCGCCGAGCTGTATGCGCCGGGCCGCAAGGGTTCCGACGCCGT
+GACTTGGATTCTCGACGACTACCCACGACTTGTTGCCGAGATCCGTGATCTGAGAAAGCG
+AGTCGCCCAGCTCGATGACGAAGGTGCCCAGCTCGATGCAGTCCTTCAGGAGCTGCGTCA
+GATCGCTGAGCGAATCAATCAT
+>NC_019936.1|provirus_3233292_3242961
+TTACTGCAACCCACCCAAGGGGCTCAGCCTAATGGCGTCGCTCAAATGCTCAGGCGCAAG
+GTGTGCATAGCGCATTGTCATGTTCAGCGACGCATGGCCCAGGATCTCCTTCAGCGTCAC
+GATATGGCCACCGCCCATGATGAAGTGAGCCGCGAAGGTGTGGCGCAGGATGTGGCTTGC
+CTGTCCGCGTGGTGGCTTGATCGAGGTCGAGAGCAGGACCAGCCGAAACACGCCAATGCA
+GTTGGTGAACGGCCCGTAGGTTTGCCAGTGCTTCTTGATCGCCGCCGCCAGCTCGGGCGT
+AACCGGGACCATCCGCACCCGTTTCGACTTCGTATTGGCGAACACCAAGGCGTTGCCTCT
+GATCCGCTCCAGTCGCAGCGCTTGAGCCTCACCCCACCTCGCCCCGGTCGCCAAGCAGAT
+ACGCGCCACCATCGCCGGGTGCGGAGACGTGGTCCGCGCCTGGAGTGCATCGAGCAGCTC
+GGAGATCTGCGGCTTGGTCAGGTAGGCCAAGGGGCGCTCCTGCAACCGAACCGGACGAAT
+ACGGGTGAAAGGACAGGGATAGTCGATCACGTCGAGTTTATGCAGCTCGTTGTAAACGGC
+TTTCAGGTAGCCAAGGCGATTGTTCGCCGTCTTGCCGGTGACGCCAGCTAACATCCAACG
+CGCGCGTGTGGCGGCGATCTTCGCGCCATCCACCATACGAGCTATCGGATCGCCCATCGC
+CTTTGCACACGCTCGCAGGATCGCCACACGACGAACGCCATCGGAGAGCGAGACGCCGTG
+AAGGTCGAACCATAGCTCGACCAGCTCTGACAGCCTGCGCTTGTCCTTTGGCCGCGGTGC
+CCAATCGTTCGATTCGCTGCACTTGGCGCGACAGGTCGCCTCGAAGCGCATTGCCTCGGC
+CTTGGTCTTCAGCGTCTTGCGGAAGCGCTTGCCTTTGACCGGCTCAACATCGACCCGCCA
+GCGACCATCTGAGAGCTGCTGAATCGCCATCAGACCGCTCTGCCCCATCGAACGTGGCGT
+TCTTGAAGCAACGTCTTGATGTGCTTGTACAGATCACGCTCGCTCATGTCCTTGGCGGCG
+TAGTGGTCACGAATGACCGGCCAGCATTCCCACTCCTTCAGTCGATCAAATGCGGTTTTA
+GCGCCCACTCGCTCCCGTGCCAGCAGGCTTACGAAGTTTCCCAGGAATAGCTCCACGTTC
+TTGCCCGAGAAGCCCCGTGAGGTCTTGTAGTAGCGCTTGTATTCCGTTTCATCGACCAGG
+GAATCGACCGCCACGTCGACCCGCACGTCATCACGCATCAGCGTCCAGATCGGTTCGTAT
+TGCCCTGGGCGATGCAGCAACTTGAACTGGCACAGCCCGTAGCGCCACAGGCCGTCCAAA
+TGGGCGGAGAACGCCGCAAACGAATCCGTTTCAATGGCCTCGCCGGTCTTGGCACTGATC
+GACCCGCTGGCGAACTGCTGGATGACCGAATGGTGATAGCGCAGCTCGACCCGCCACACG
+TCCGCCTCGGGATCGTAGTTATCAGGATCGGCCGTATCGAACGAATCCCGGCGACGCCAG
+ACGCTTTCCCAGAAGTCGAGCTTATCGGTTGCGCGGGCCTGTTCGGTTTTGTTGTAGATG
+CAGAGCTGAACGCCACCGGCTGAGCCGAACATGGACGTTTCGCCACGACCGTAGACGCTG
+GACTTGGTCGCCCAGTTGATCTCGTTGATCCCCGAGATATCCCGGTGCGTCCGCGCACGA
+CAGTGCAGGCGTGCCACCAGATCCACCGGAGGCTTCCAGCCCTGGAGATCCAACGCCAGA
+TGGACAGCGCACTGGTTTCGTTCGCGGTGCGTCATCACGGCTGCGGCGTAGTAGTCCATG
+CGCTCTTGCAGGCGCTCAGGCGACAGAGCGTCGATGGCGTGCGGCGACACCTCGATTTTC
+AGGTGCGGCCCGATGTTCTCCAGCTTGGCGTTGAAGTTCTTGATCAGCAGAATGAAGCCA
+AGGTCGGCGTTCTGCAGCTTGTACTGGTAACCCGAGTCCCGCCCTACCCGTCCCGCGTGC
+CAGAACTCTCCAGCGAATTCGACCATGACGCCCGGTTTCTCGAACAGCGCCATGATCTCC
+GGACGGATCAGCCCGCGATACAGCTGGCGGACCGTATCGACGCCGCAACGCAGCAAGCGA
+ACGCCCGACAGGTCAGTCAGCTTGGCCGAATGGCTATCGAAGAACAGTCGCCCGGCTGGG
+GTTTCCTGAAAGTTCTGATCAACACGAATTTGGTCTTTAACGCTCATCTTCTTCTGCTCC
+AAATTGCAACGAATTGACACTGTTCAGTTGGGTTTATCTGACGTGTTACAGGGACGTCAG
+CGCGCGCGTTTGCACGCCGGCTCGTGCCTCGCCGCGCGTGCAAAGAGCGCGGAGCGCACG
+CGCGCTGACGGTCATCACCACAGGAATTGCCCCTTCTGGTACGGCACGACGGTCATGTTC
+GCGCCACCAGCGGGTTGCGCTGCTCCAGGGCGCGGCTCATGCATTGCCGGAGACTGGTTG
+TTCTGGACTTGCTGGGTTCGCTCGCCGGTGGAGCGATCAGGAAGGGTCGGATCGAAGAAG
+CCGTTTTCGACCACGCGCATGCAGAAGGCGAAGTCGGTTTCGACCCGCGTGCTCTGCTGC
+GTGTAGCACTGGCAGACGGTGGGTGTGCCGTTGACTACGGCATGCGCCATTCGCCCGAAC
+TCGCGGGCATAGGTCGCAGGGTCGGTGCTGGACATGCAGTAGAGCCTGGGAAACGACACG
+GGCCGCGTCAGCTCGTCGTAGATCGGCGCCGACGATGGGACCTGTGGTATTCGAGGCACG
+CGCCGTCCGATGTAGCTGGCGACGCTTTCAGGCGCATCGGTCTTCGCTTCGCCCACCGGC
+TTGATGAACGCCCCGACCGTATCGCGTACCTGATCGACCATGCTGCCGGCCGGCGCGCTG
+GTAGCCGTCGCGGCTTGAGCTTTTTCGGCTGCATAGCGTTCATAGGCGCGATAAACGAGG
+ATGCCGGCACCGACCAGCACGCAGATGGCCAAGACGAACTTGGTCGGCACCTTGGCCTGA
+AAGTGGTGCTTGGCGTTGCTGCTGGTGTAGGCACCGAAGTAGCGCTTATCCAGCCGCAGC
+GACTTCTTGTCGGCATCCTTGAAACTGGTTTTCAGCTCAACCTTCTCTACGACGACTTCA
+GATTCGAAGCGCAGTAGCTGGGCGGACTTGAAGACGCGCCAGTAGTGGATGTGCGTGTTG
+CACAGCCGACGAAGGTGCACATCGAGATAGCGCGGGTCCTGAGTGACGAGGTGCACCTCA
+TGGCCCTGGTGGCGCATGGTCTCGAAGCGGGTGATGTGCTCCGGTGGCCGCGCCCTGGGA
+TCGCGTGAGCCGAACCAGCCCTGCGCTTCGTCGACGACGATGATCGAGTCATTGGGCAGC
+TCAAACCATTTTTCAGGATCTTCGAACTCGAACCACTGCGCTTGCAGCTGATCGGGCTTG
+AGACCGTTGATGTTGTGGAAGTAGACGACGCGGCCTTCGGCGTGGGCCTTCTGGTCGACC
+TCGCGGATGGTGTTCAGGGTCTTGCCATGGCCGGGCTTGCCGGTGCGGATAACGAGCATG
+ACGGCGCCTCCTTATGCGTCGATAGAGGTGCCGCCCGGCTTATGCCAGACCTGATTACGT
+TTGCGGTCGGTGGCCTTGTCGATGCCGGCGAGGATGAAGCGCGTGGAGATCGCGGCGAAA
+TACAGGTTCACCACCACATCGAACTTCGCCAGTCCGAGAATCCCTTGGATGACCGGCCCG
+ACATCGCCCATCAGCCCGAACAGGTAGTCCTGCGCCTGGCCAATGATGAGGTTGAAGCCC
+ATGTAGGAGACGAAGCCGAAACCGATCATCTTCAGCACCATCTTCACCAGCGGCCCGACG
+ATGATCACGAGCATCTGGACGATGAATAGAAACTGCATCATTGACCTCCTACGGCGCGGC
+CCACATACAGGGCGGCAAGAACGGTGGCCACGGCCACGAAGAGGCCGCTCAGGTCACTGG
+CGGCGCGGCATAGCGGTTCGTAGCTGAGCTGGAAAGTGCGACCGCCTGCTGTGGTCAGGC
+TGAAGCTCTCGGCGGCGGGACAGGCAGACGGCAGAAAGCGGGTGCCCTGGTTGATGAACG
+AAGGCACGTCGATGACGCCGTTACCTTCATCCAGCTGGAATCGGTCACCGGTAACAGCCG
+CCTCGATGGCGGACTGCTGTTTGGGGAAATCGGCCATTTCCTCAGCGAGGCACAGCTGTT
+CCTTCTGCTGCCGCAGGACTTCGCAATCAATCGGGTCACCACTGCACGAGAACGCCGCAT
+CGCAGGAGCCGGCCGAGGCCAAACGCTCCGGGCCTTCTTCGCCTTCGCCTTCACCTTCCT
+GGCTTTCCTTACAACCAGACCCTTTGCATTCCTTGCTCTCATCGCCCGGGGTGCCATCAG
+GGTTGGTGCCAGAGGTGGCTTTTTCTTCGGCCGTGGTGGAGGTACAGGGCTTGGTGCCAA
+CGCAGACGGTCTTGTCGGTGGTGGTGTTGGTTTCCGTCTTGGTGGAGCCGTCCGGGTTGG
+TGGTCTTGGTGGTTTCTTCGGTTTTCGTGGTGTCCTCAAGCCGTGGCGCAGGCTTGCCAG
+TGGTGCAGTGCAGGTAATCCCCGGCGTTGTCGCAATTGAGCTGGCCGGGTTCTTTCAGCT
+TTTCGCTACTGGTGCAGTTGCGCGATTGGGAGCCGTCCGGATTGGTGACCCAGTCACCGC
+ATTGGCTTTCGCTGGTGAACTGCGGTGTGCTGTCGGCCGGGGGCTTGGACGGTGGCTGAT
+CAAAGACACTGCCGGGAGGTGGGTTGTTTGAAGTGCATTGCGAGCCGGCGCCCTGGTAAA
+AAACCTTGCAATAAACGGAGTTCAGGTCCTTGCCGGTGGTGTCTTCCAGAAAGCGATTGC
+AGCCTTTGACCGTGGCGGTGCGGCTGTAGAGGCAGCCGCTTTCGCAGATCGAGGACGGCG
+GCAGAGAAGGCGGCACGGACGGGTCCAGGGAGCCGGCGTTGTACTCGTGGACGAACTCGC
+CGGTTGCGGTGGCGCACTGGTCGGGTTCAGGGGCGACACACTCGCCAGTCGAAGGGTCGT
+AAGTGGAATCAGGAGCGCAAGAATCGCCGCGTCTAGCTGCTGCGTTGTACCAAGAACCGT
+AACGCTCAAGCTTCCCGGAATAGGGATTGATATTTAATCCATATGTACGACAGGTAAAAG
+ACGCTGTACCTTTTTCAATCTCCTGCTCAAACGAAACATATTGCCCGGAGTTTAATTGCT
+TGTAGTAGGCATGGTTTGCATTACAGGCGGCGACACCGCTGGAATATCTTATTAGCGGGT
+CCGGAAATTGAATGGTCCAATAATAATCTTCGGCGCTAGCGGGCAAGTGCCAGAGCAGCA
+AAGCCAAAAAAGCCCCAAAAATCCTTTTCATAATCACACCCGCCCAAAAAACACGAGATA
+AAACGCCAGGGTGGTGAGGATCAGGACGTACAGTTCGTAGCTCATGGCGTTTCCCTGGAA
+GAGAAAACCCCGCCGGAGCGGGGTTTGTTTGCTTCGGCACATGCAGTGCGCAATACCTTG
+GTTACAGGGCGCGGCGCATGTACTTGAACGCCATCGCGGCGATGATCACCGCGAACACCG
+CCCAGCCGATGGTTCCAACGTCAGTGCCGGCGGTATCCAGCGCCGCGGTAGCTTCAGCCG
+GGACGGCGGCGTAGACGGAGCCGGCCAGGGTGGACAGCGCGACAGCAGCGCCAACGCCGA
+TTTTCTTGATGAATTGCTTGTTCAGTTGCATGGGTGATACCTCACTGTTTCAGGGCTTTT
+TTGAGGACCAGGAAGCCGAACACGGTGGCGAACAGAACAATCGCTTCGCCTTGCAGCTCG
+GAGACTTGGTCCCAGGTCAGTGCAGAGCCGTAGAGGCTTTGCATTTCCTCGACCGTGAGG
+GCGACCAGCGAGCCGGAGCAGATGGGCGAGCCGTCGGCGCCTTGCAGCCAGTCACCGTCA
+CAGGCGAGGAAATTCATTCGCCGGCCTGCTCGAGGTCGGCGGGTTGTTCGGAGGGTTCGC
+AGTCGGGGCAGACGGCGAAATGGGGCGGCAGGCTGAGGTCGGGCAGCAGGTCGCTTTGCG
+GCGCGGGCAGCGCCATGAGCTTGCCCATGTCGTTTCCGCAGCAGTCGCAGTACACCCGGT
+CATCAATCAGCATGGCCGCCCCTCCCGGTTAGTTGGCTTTGGCCGGGTCGCCGGCTTTGG
+CCTGGGGTTGAGCTGGGGTGCGCGGGGTATCGGCTGCGGCGCGGGTCTGGACGGCTTCGA
+GCTGGAGCGCCAGATTCTTGCCCTTGTTCTGGCCACCCCGGGCAATCTCGAAGTGAATGC
+GCACCAGTTGCAGCGGCTCGAACTTAGCGCCGGCTGCGAATATCTCGTCGGCTACTTCGT
+CTGCTGCTGCCATGCCGATGATCGACAGGCCGTGTTCGGTCTTGCCGTCCGGCTCGTCGC
+CGTAGAAGACTTTGATGTACTTCTGGCCCGCTTCACCGTCGAAGCGTTGAGTGCCGAGAA
+ATGCAACTTCCATAGTCGAACGTGCCATTTGTGTTTCCTCTTTCTAGTTGCGCTTAATTG
+CGCTGCTTTGCTTTCTGCAGGCCGAGCGATCCCGAGCGAGTGAAAAAGTAATTTCACTGC
+GACCGGCTTGTTACTTGGCTTGCGGGTTATCTATAGCTGTATTTGAACGCTCTTGGAACA
+ACTATTTAGCAAGTATTAAAACAATCAATACTTCATTTTTTAATGAGACGAATAGTGCTG
+AATTGACACTTTCCATCTGAGCAAACATTAATTTAATTAATCATCCGCAACGCTGTTTAA
+CACCAAGGGCTCTGCCCTTGTCATCCCGCTCTTGCCGCCGAGGGCTCGGGAGCGCGGGAG
+GGAAAAGCGCTCCCGCACTCACGAGCGGAGGCTGTTTCAGTTCGTGCAGGGTCAAGGGTG
+CGCTCCGCCCGTGCTTCCGTTCGCCGGATCGGTGAAGCGTGATCCGACGAGCCGGGAGCG
+CGGCCCCTGACCTGTTCGGCCACGCGCTCAGCCTGATAACGCTCAGCGACATAGCGACGC
+AGCTCGACGAGAGACCGGTGTTTCGTTGGCTCGCTACCGTCCAACGGAATGAACAGAGGA
+ACGTCGCGGCGATAGGTAACGTGCCCATACAGCTCCCCGCCTACGGTCAGCTCCCGCCCG
+ATCTCATGCCAGTTAGGCGACGCGATACGAACCTGCATCCGCTTACGCCCTACCCCACCA
+GCTCGAACGGTTCGTGAATCGGCACGTAGGGCGTTGGCTTGCCCGAGTCGTAGATAATGC
+TCCACCACTTCGCGGGGCGCTCGGGTGGCGTGTGCTTCTCGCAGATATAGGCCGGTTCCA
+CTGTCCAGTCCGAGAGCAGAGGCTTCCAGATTCCACCAACGCACCCCATTTGCAGTGTGC
+GAATCGGCCGCGCATAGGCGGGGCGGCATTGGGCGCATGGTGTGGACCGGGAGGGATCGG
+ATTTCGCCATTTCGCGTCTGGACCAGCAGACAGAGCAGTCGCAGTCCTGGGCGTGCGGAA
+GGCGTTGATAGCTGGCCGGCTTCTGCATAGGCCATCCCCTCCCCTGGCTTTCCGTAGACG
+GCGCGGATCATGCGGAGCGCTCCTGTTCATTGGTGCTGGGCGAAGGACGCTTCCAGGCGG
+ATGACGATTTCGGCGTTCAGGGAGCGGCGTGCAGCCCAAGCGGACCGTTCGACCTGGGCG
+CGGAGTGCCGCAGGCATGCGCAGCTTGAATTGCGGGTCTGTGCGGCTCATTGGTTCACCC
+CCCCGGAAAACGCACCAAACGGGTTTTGCCCAGCTTCACGCTCTCGACAGCGCCAGTCCT
+GACCCAGCCAGCGACCATATCCACGGGCACACCGGCCAGAGCGGCGAATGCGGCTTGCGT
+ATAGAAAGGAGGATTCATGCGGTCCACTCCTGTTCCAGCAGCCAGCTACGCAGCAGCGCG
+CTGTTAATCATGCGGCGCTTGCCGAGCTTTACGGTGGGGAGTACGCCCCGGTAGACCCAG
+GCGCGGGCCATGGAACACGTCAGACCGTTACGTTCCGCCCAGGCTTCGACGGTTTCCACG
+TCCTGCTGTGGGGCGATCAGCTTTGAAGGTTCTAGCTCTTCCAGTTCCATGCTCGTTCCG
+TCACTATTCGTGGCAATGCCAGTTATTCAGCACTGCGTTATCCATAACGGATAACCTCGA
+AACGGATAATGCCATTGCTAATCCAAATTGGATACATCACATATAGATCAAGTAGCTATG
+ATTAAAGAGCGCGTTATAACTATTCTGAAAAGCTCAGGTATTCGGCTGCCCGAGCTGGAA
+GAGCGCACTGGCATCAGTCGATATACCTGGAACAACCTGAAGAACACAGCGCGAAAGCGC
+GAGATTAAGGCTGAGGAGATCGAAGCTATCGTTAAGCTCTTTCCTCAATATGCCTTATGG
+GTCGTCAGCGGAGAGATAGCGCCAGAAGCGGGGCAGATTAGCCCTGATTACGCTATTGCC
+GATTCAAACTTGCCGAGTCAAAGCGCGGGATAGCGATCACAACGGAAGTGACTAGGCGCT
+GGTATGCCCGCTTAAGACGTTAGAACAGCTTTTTGGAGCAGTATTAAGAATGGGAATCTT
+CGCAGAAAATTTAAATGATATTGAATCCTACTGCGCCAAGCTAGAAATGCTTTTATCGAA
+GCAAGAACTTATAGATCAGCGTGTCTCTTTATGCGTGCCCATGCTGAAGAAAATTTCAGA
+TGAACCTGACGCTTATGATAAATCAGCAAGATTAAATGCTCAGTGGATCGGCGGAGAGTT
+ACTTAGCATTATTGCCAACCGAAGAACCGACGATAGCTCACTGCAAGAATTAACACGTTA
+CCTGGCTCGAATAGCAAGAGAAACCACACTTCGAACCCCTTACATACCAAAAACACCTGA
+AAAAGAGCTTCTTGATTTTTTCGACTATTCAAAAAATCATGAAACAACCGAAGACAAGGA
+AACTTCAGATCTTATTTGGGCCTCCATTCCAAAATACATAGTAAGGGAGCATCTAGATGA
+AGTTTCTAAAAAAGAGGATGATGTAACCAACCAGGTTAAAAGCTGGGAAGACCAACTCAA
+AACATATAAAGTAACCATAGACTCATATATCAGCGAACTTAAAGAGCAACAAGGAAAATT
+CAACTTCGTTCGACTATCAAAAGCCTTTCACGAAATGCACAAGAATAAGCAAAAGGAGCT
+TAAATCAAACTTTATCGCTTTGATTTCTCTAGGCGCTTTAGTGCTTTCCCCACTAATTTT
+TCAATTTGCAGTAAAGACACTCACGAACACAGACACCACACTCAACACCCTGAGCACGAC
+GGAAGCATGGAAGCTAATATCTTTAGTTGGCTTAGAAGTGGCTCTACTTTATTTCTTTAG
+AATTGCACTGAAAAGCTACTACTCAACCAAAGCTCAACTTCTGCAAATTGAACTCAGGCT
+TTCATTATGCGCATTTATAGAAAGTTATGCGGACTTTGCAAAATCAAGAAAAACGAAAGA
+CGCTGACCCCTTACTTAAGTTTGAATCAATAATTTTTTCCGGCATTACACCTGACGATAA
+CAATGTTCCCAGCACCTTTGACGGCATAGATCAGATTTTCCGATTAGCAAAAGAACTTAA
+AGGAAAGTGA
+>NC_019936.1|provirus_4295725_4304306
+CTATCCCGCGTCTTGACCGGTCAAGTTTCGGTTGGCCTCGTCGTAATCGGGACTCGTCTG
+CCCGCACTCCGGAGCGATCTCACCGCTTGCGACCCATAAGGCGTACTGCGGATAGAGCTT
+CACCAGGACCTCGACCTCCTCTGTACTCAACCGCGCCTTCTTGTGGCGTAGGTTTTTCCA
+TCGGCTGTAGTTGATCTCCGACTTGCGGACCAGATCGTCTAGGCCAGCCTTATAGATCAG
+AGCAATAGCTCTATCCTGCATCGATTCCATAAAGGTCTAAGAATCTCTGAGTTCACTATT
+TGAACTCTAGGAATACACTGTTATTCTTTGCCTGTCAGTTCACTATTTACACTCTAAAGC
+TGCACTGACGTAGCCCTATAAAGACCAACATAGTGCAACAAAGGCCAAGGACATGGAAGG
+AAACCTACCGCCGATAGACCTGCTCAACGCGCCCCCTGTCATGCCGTGGCGCCAGTTCGC
+GGACTGGATTCGCATGAATGATGAACACGACGTGGTGTGGGGCTGGATTCGCAACGGCTA
+CATCCCGTCGCACAAGGTTGGCAAGTACGTGATGGTCAACGTGGCGCTGCTGGTTAAGCA
+GCTCATGGAAAAGGAGTGGGACTCATGATCCGCGCCGCCTACGGAAAGCCAGGGGAAGGG
+ATGACCTATGTCGAAGCTGACCAGCTATCAACGCCTTCCGCACGCCCAGGACTGCGACTG
+CTCTGTCTGCTGGTCCAGACGCGAAATGGCGAAACACGCTCCCTCCCCGTCCACACGCTG
+CGCCCAATGCCGCCCCGCCTCTGCGCGGCCGATTCGCACGCTGCAAATGGGCCGCGTCGG
+TGGTGCCTGGAAGCCTCTGGTCTCGGAGTGGACAGTGGAACCGGCCTTTATCTGCGAGAA
+GCACACGCCGCCCGACCGCCCCACGAAGTGGTGGAGCGTTATCTACGACTCGGGCAAGCC
+CACGCCCTACGTACCGATTCACGAACCGTTCGAACTGGTGGGCTAAAGCCAACCGCCCCC
+GCCGAAGCCGAACAGGTCCAGGGCCGCGCTCCCGGCTCGTCGGATCACGCTTCACCGATC
+CGGCGAACGGAAGCACGGGCGCAGCGCACCCTTGACCCGGCACAAACCGAAACAGCCTCC
+GCTCGTGAGTGTGGGGCAGCTTCACCGCCCCGCGCTCCCGAGCCCTCGGCGGCAAGAGTG
+GGATGACAAGGGCAAAGCCCTTGGTGTTAACCAACTAGAGAACACGCACAACGCGACGTT
+TTAACCGGTAGGCCAAGTAACAGATCACCTCGGCGAACTTGCGAGTTCACCGGTTCGGGA
+TCGCTCGGCCTGCAGAAAGCAAAGCAGCGCAATAAAGCGCAACTAGAGAGAGGAAACACA
+AATGGCACGTTCGATCATGGAAGTTGCATTTCTCAGCGCCGAGAAAGTCGAGTTCGACAA
+CGTGAAGCTGGTGAAGCTGTTTGTTGGTGACGAGCCAGACGGCAAGCGTGACCTCGGCAT
+TTCCATCCTGTCGATGAATGTCTCCGAAGAAGCCCTGGACGAAGTGTGGTCCGCCTGCGA
+AAGCCTCGATGTGCTTGAGCCGATCCGCGTCACCACCGAGATCGAGCGAGGCTCCAAGAA
+CGCCGGCAAGTTCATCGTCCTGCACGTTGAGCCTGTGAAAGCCGCCGCTGCTCAAGCCAC
+CAAGCCGACCCAGCAACCGACCCCAACCGCCAAGCCAGCCGGCACCCAGCCGGAACCGGC
+GAAGGCCAACTAACCGGGAGGGGCGGCCATGCTGATTGATGACCGGGTGTACTGCGACTG
+CTGCGGAAACGACATGGGCAAGCTCATGGCGCTGCCCGCGCCGCAAAGCGACCTGCTGCC
+CGACCTCAGCCTGCCGCCCCATTTCGCCGTCTGCCCTGACTGCGAACCCTCCGAACAAAC
+CACCGACCTCGAGCAGGCCGGCGAATGAATTTCCTCGCCTGTGACGGTGACTGGCTACAA
+GGCGCCGATGGCTCGCCCATCTGCTCCGGCTCGCTGGTCGCCCTCACGGTCGAGGAAATG
+CAAAGCCTCTACGGCTCTGCACTGACCTGGGACCAAGTCTCCGAGCTGCAAGGCGAAGCG
+ATTGTTCTGTTCGCCACCGTGTTCGGCTTCCTGGTCCTGAAAAAAGCCCTGAAACAGTGA
+GGTATCACCCATGCAACTGAACAAGCACTTCATCAAGAAAATCGGCGTTGGCGCTGCTGT
+CGCGCTCTCCACCCTGGCCGGCTCCGTCTACGCGGCAGTCCCGGCCGAAGCCACCGCGGC
+GCTGGATACCGCCGGCACCGACGTCGGCACCATCGGCTGGGCGGTGTTCGCCGTGATCAT
+CGCCGCGATGGCGTTCAAGTACATGCGCCGCGCCCTGTAACCGGGGTTTTGCGCACTGCA
+TGTGCCGAAGCAAACAAACCCCGCTCCGGCGGGGTTTTCTCTTCCAGGGAAACGCCAATG
+AGCTACGAACTGTACGTCCTGATCCTCACCACCCTGGCGTTTTATCTCGTGTTTTTTGGG
+CGGGTGTGATTATGAAAAGGATTTTTGCGGTTTTTTTGCCTTTGCTGCTCTGGCACTTGT
+CCGCTAGCGCCGAAGATTATTATTGGACCATTCAATTTCCGGACCCGCTAATAAGATATT
+CCAGCGGTGTCGCCGCCTGTAATGCAAACCATGCCTACTACAAGCAACTAAACTCCGGGC
+AATATGTTTCGTTTGAGCAGGAGATTGAAAAAGGTACGGCGTCTTTTACCTGTCGTACAT
+ATGGATTAAATATCAATCCCTATTCCGGGAAGCTTGAGCGTTACGGTTCTTGGTACAACG
+CAGCAGCTAGACGCGGCGATTCTTGCGCCCCTGATTCCACTTACGACCCTTCGACTGGCG
+AGTGTGTCGCCCCTGAACCCGACCAGTGCGCCACCGCAACCGGCGAGTTCGTCCACGAGT
+ACAACGCCGGCTCGCTGGATCCGTCCGTTCCGCCTTCCCTGCCGCCGTCCTCCATCTGCG
+AAAGCGGCTGCCTCTACAACCGCACCGCCACGGTCAAAGGCTGCAACCGCTTTCTGGAAG
+ACACCACCGGCAAGGACCTGAACTCCGTTTATTGCAAGGTGGTTTACCAAGGCGCCGGAT
+CTCAATGCACCTCAAACAGCCCACCTCCCGGCAGTGTCTTTGATCAGCCACCGTCCAAGC
+CCCCGGCCGACAGCACACCGCAATTCACCAGCGAAAGCCAATGCGGTGACTGGGTGACCA
+ACGCGGACGGCTCGCAATCGCGCAACTGCACCAGTAGCGAAAAGCTGAAAGAGCCCGGCC
+AGCTCAATTGCGACAACGCCGGGGATTACCTGCACTGCACCACCGGCAAGCCCGCGCCAC
+GGCTTGAAGACACTACAAAAACCGAGGAAACCACCAAGACCACCAATCCGGACGGCTCCA
+CGAAGACGGAAACCAACACCACCACCGACAAGACCGTCTGCGTTGGCACCAAGCCCTGTA
+CCTCCACCACGGCTGAAGAAAAGTCCACCTCTGGCACCAACCCTGATGGCACTCCAGGCG
+ATGAGAGCAAGGAATGCAAAGGGTCTGGCTGTAAGGAAAGCCAGGAGGGTGAAGAAGACG
+GCGAAGAAGGCCCGGAGCGTTTGGCTTCTGCCGGCTCCTGCGATGCGGCGTTCTCGTGCA
+GTGGTGACCCTATTGATTGCGAAGTGCTCCGGCAGCAGAAGGAACAGCTTTGCCTTGCTG
+AGGAAATGGCCGATTTCCCCAAACAGCAGTCCGCCATCGAGGCGGCTGTTACCGGTGACC
+GATTCCAGCTGGATGAAGGTAACGGCGTCATCGACGTGCCTTCGTTCATCAACCAGGGCA
+CCCGCTTTCTGCCGTCCGCCTGTCCCGCCGCCGAGAGCTTCAGCCTGACCACAGCAGGCG
+GTCGCACTTTCCAGCTCAGCTACGAACCGCTTTGCCGCGCCGCCAGTGACCTGAGCGGCC
+TCTTCGTGGCCGTGGCCACCGTTCTTGCCGCCCTGTATGTGGGCCGCGCCGTAGGAGGTC
+AGTGATGCAGTTTCTATTCATCGTCCAGATGCTCGTGATCATCGTCGGGCCGCTGGTGAA
+GATGGTGCTGAAGATGATCGGTTTCGGTTTTGTCTCCTACATGGGCTTCAACCTCATCAT
+TGGCCAGGCGCAGGACTACCTGTTCGGGCTGATGGGCGATGTCGGGCCGGTCATCCAAGG
+GATTCTCGGACTGGCGAAGTTCGATGTGGTGGTGAACCTGTATTTCGCCGCGATCTCCAC
+GCGCTTCATCCTCGCCGGCATCGACAAGGCCACCGACCGCAAACGTAATCAGGTCTGGCA
+TAAGCCGGGCGGCACCTCTATCGACGCATAAGGAGGCGCCGTCATGCTCGTTATCCGCAC
+CGGCAAGCCCGGCCATGGCAAGACCCTGAACACCATCCGCGAGGTCGACCAGAAGGCTCA
+CGCCGAAGGCCGGGTCGTCTACTTCCATAACATCAACGGTCTCAAGCCCGATCAGCTGCA
+AGCGCAGTGGTTCGAGTTCGAAGATCCCGAGAAGTGGTTCGAGCTGCCCAACGATTCGAT
+CATCGTGGTCGACGAAGCGCAGGGCTGGTTTGGCTCGCGCGATCCCAGGGCGCGGCCACC
+GGAGCACATCACCCGCTTCGAGACCATGCGCCACCAGGGCCACGAAGTGCACCTCGTCAC
+ACAGGACCCGCGCTATCTCGATGTGCATCTGCGCCGGCTGTGTAACACCCACATTCACTA
+CTGGCGCGTCTTCAAGTCCGCCCAGCTGCTGCGCTTCGAGTCGGAAGTCGTCGTAGAAAA
+GGTCGAGCTGAAAACCAGCTTCAAGGATGCTGACAAGAAGTCACTGCGCCTGGATAAGCG
+CTACTTCGGTGCCTACACCAGCAGCAACGCCAAGCACCACTTTCAGGCCAAGGTGCCGAC
+CAAGTTCATCTTGGCCATCTGCGTGCTGGTCGGTGCCGGCATCCTCGTTTATCGCGCCTA
+TGAACGCTATGCAGCCGAAAAAGCTCAAGCCGCGACGGCTACCAGCGCGCCGGCCGGGAG
+CATGGTCGATCAAGTGAGGGATACGGTCGGCGCATTCATCAAGCCGGTAGGCGAGGCGAA
+AACCGATGCGCCGGAAAGCGCCGCCAGCTACATCGGGCGGCGCGTGCCTCGGATACCGCA
+AGTCCCATCGTCGGCGCCGATCTACGACGAGCTTACGCGGCCCGTGTCGTTTCCCCGACT
+CTACTGCATGTCCAGCACGGACCCTGCGACCTATGCCCGCGAGTTCGGGCGAATGGCGCA
+TGCGGTAGTCAACGGCACGCCCACCGTCTGCCAGTGCTACACGCAGCAGAGCACGCGGGT
+CGAAACCGACTTCGCATTCTGCATGCGCGTGGTCGAAAACGGCTTCTTCGATCCGACCCT
+TCCTGATCGCTCCGCTGGCGAGCGAACGCAGCAAGTCCAGAACAGCCAGCCTCCGGCAAT
+GCAGGGGCCACGCCCTGGACCAGCACAGCCAGCCAGTGGCACGAACATGACTGTCGTGCC
+GTACCAGAAGGGGCAATTCCTGTGGTGATGACCGTCAGCGCGCGTGCGCTCCGCGCTCTT
+TGCACGCACGGCGAGGCACGAGCCGGCGTGCAAACGCGCGCGCTGACGTCCCTGTAACAC
+GTCAGATAGATCGAGTTGAAACCGTCCGTTATTGGACATTGTTGGAGATTCAAGAATGAG
+CGTTAAAGACCAAGCAAGACTGGACCACATCACGGGCAATCCGACCAAGCGTGGACGGTT
+GTTCGTTGACCCTGGTACTGCGGCAATCACCGATCTGTCGAAGGTCCGTCTGCTGCGTTG
+CGGCGTCGATACGGTTCGCCAGTTGTATCGCGGGCTGATCCGTCCAGAGATCATGGCGCT
+GTTCGAGAAAACGGGCGCGATGGTGGAGTTTGCTGGCGAAGTCTGGCACTCGGGACGGGT
+TGGCCGGGACTCTGGCTACCAATACAAGCTCCAGAACGCTGACCTTGGGTTCATCCTGCT
+CATCAAGAATTTCAACGCCAAGCTGGAGAACATCGGGCCGCACCTGAAAATCGAGGTGTC
+GCCGCACGCCATCGACGCGCTGTCGCCTGAGCGTCTGCAAGAGCGGATGGATTACTACGC
+GGCGGCAGTCATGACCAACCGCGAACGTAACCAGTGCGCCGTCCATTTGGCGTTGGACCT
+CCAGGGCTGGAAGCCTCCAGTCGATCTGGTAGCCCGCCTGCACTGCCGCGCGCGAACGCA
+TCGCGATATTTCCGGAATCAAGGAAATTCAGTGGGCCACCAAGTCCAGTGTTTACGGTCG
+GGGCGAAACGTCCATGTTCGGCTCGGCCAGCGGCGTGCAGCTCTGCATCTACAACAAGAC
+CGAGCAGGCCCGCGCAACCGACAAGCTCGACTACTGGGAAAGCGTGTGGCGTCGCCGTGA
+CTCCTTCGACCCGACCGACCCTGACAACTACGATCCAGGCGCTGACGTGTGGCGCGTTGA
+GTTGCGCTATCACCACTCGGTCATCCAGCAGTTCGCCAGCGGCTCGATCAGTGCGAAGAC
+CGGTGAGGCCATCGATACGGATTCGTTTTCGGCCTTCTCGGCTCATCTGGACGGCCTGTG
+GCGCTATGGCCTGAGCCAATTCAAGCTGATCGCCCGCCCCGGCTATTACGAGCCGATCTG
+GACGCTAATGCGTGATGACGCGAGGGTCGATCTACCGGTCGATTCCCTGGTCGAGGAAAC
+GGAGTACAAGCGCTATTACAAGACCTCAAGGGGCTTCTCGGGCAAGAACGTCGAGCTGTT
+CCTGGGAAACTTCGTAAGCCTGCTGGCACGGGAGCGAGTGGGCGCTAAGACCGCATTTGA
+TCGATTGAAGCAATGGGAATGCTGGCCAGTGATCCGCGACCACTACGCCGCCAAGGACAT
+GAGCGAGCGCGACCTCTACAAGCACATCAAGAACCTGTTACAGGAACGACACGTGCGATG
+GGGGCGTGCCGTCTGATGGCGATACTGGCACTGCCTGACGGTCGCTGGCGGGTCGATGTT
+GAACCGATCAAGGGCAAGCGATTCCGCAAGACCTTCAAGACCAAGGGCGAAGCCCAGCGG
+TTCGAGGCTACCTGTCGATCCAAGCTGATCGAAAGCCCGCAATGGTCACCAAAACCGAAG
+GATCGTCGTCGCCTGTCTCAACTGGTGGACTGCTGGGGGCGTCTGCACGGTCAGTCGCTG
+TCCGACTATGAGGGTCGGCGCGTCATCATGGATCGCATGGTCGAACGCCTGAAAGACCCT
+GTCGCCATAGCCTTCACTGCTACCGATTTCGCGGAGTACCGCGCCAAGCGCCTCTCGTCC
+GGCATCAGCCCGAAAACGCTGAACAATGAGCTGTCTTACCTGCGGGCCATGTTCAATGAG
+CTACGGCGACTTGGTGAGATCGAGTTCGAGAATCCGCTTTCGATGCTCAGGGCGATTCGT
+GTGCAGGAAAGGGAACTGTCCTGCCTCGACAGCCATCAGATCGAACGGCTGTTCCAGGTA
+CTGCGCAGCATGGTTCACCCACACGTGGAGCTGATCGCCACGATCTGTCTGGTGACCGGT
+TGCCGATGGGGTGAAGCGCAAGGGCTCACGATCAGTCGGGTGGGCGATGGCATGCTCCAG
+TTTGTGAACACGAAGTCGAAGCGTCGCCGTGTGGTGCCGATCGATCAGAAGCTAGCGGAG
+CGGATACGCCAGCACCTTCGGCAACACGGTGCGTTCACCAACTGCCGGGATCGGTTCGAT
+GAAGCTGTGGTGCGTGCGGGGCTGGGTCTACCTGCGGGACAAAAGTCGCATGTGTTGCGG
+CATACCTTCGCCTCACACTTCATCGCGAACGGTGGCAATATCCTGACCTTGCAGAAGATA
+CTCGGGCACTCGTCCCTGGCGATGACAATGCGGTACGCGCACCTTGCGCCCGATCATCTG
+CAAGACGTGTTAGCGTTTGGGCCTGCTAGGGATTTTCGACACTTCTTCGACACTCCCGCC
+TCTGAGCGACAGTCGGGGCAGGAAATTCCTTTGTAAATCAATAAGGAAGGCAATCGCACC
+CGGTGGTGCGGCCGGGCTTCAAACCCGGTTGGGGACGGCAGCCGTTCCCGGGTGAGTTCG
+ACTCTCACTGCCTTCCGCCATTTCGACTCACACGCCCGACTCCCAAACCCTCGACACCTA
+CCCCGCGACAGCCCGTCCCACCTCGCAATATCAAAAAGCCATCGCACTTCAACGCGAAGC
+GCGTCACAATCGCGGCTTTTCTTTCCAGGGATAGGAGAGACGTCGTGGGTAACTCGCCAG
+ACGAGCGCCGTGCGTTGCACGCGCTGCGTGACCATATCGATTGCCTACTGGCCGAAGGAG
+CGTCCGTTGTCGGTCGCGACCCGGTGCAGCTGAGTTTTCAGGGCCGGACGTTGACGGTGC
+AGCACGGGATACTGCTCAACGAGAACGGCCATCAGGACCTGATCGAGACGCTTGCCGAGC
+TGGAGTGGACGAACAAGCGCACTCGCGATCTAGCCATCGATATCTGCATCCGCCAGCTAG
+ACCATGCGATCAAGGCGAGCTGCTTCGACGCGCTGGAAAGCTCAAAGCCCGACAAGCCCT
+GA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_fasta/NC_021184.fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_021184.fasta.fasta Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2005 @@
+>NC_021184.1|provirus_19778_35564
+ATGCTGGATTTGAAATTTGTGCGGAATAACCCGGAAATTGTTAAAGAGGCACTACAGAAA
+AGAGGAGCTAGCATTTCACTCGACCCGTTTTTGGAACTCGATGAGCGCCGCAGGGAAAAG
+CTGGTTGAGGTGGAGAAGCTTAAAAATAAACGTAATGTGGTATCCGAGGAGATTGGCCGG
+TTGAAAAAGGCCGGACAGTTGGCTGAGGATATGGTACTGGAAATGCGGCAGGTTTCCAAT
+GCTATCAAGGATTTAGATGAAGAAATTCGTATTTTGGATCAGCAGCTGCAACAAACATTG
+CTAAATATCCCCAATATTCCTGAAGAGAGTGTACCCGTGGGGTTGGATGAAAATGACAAT
+GTTGAATTGCGGCGCTGGGGTGAGCCCAGACAGTTTGGTTTTGAGCCCAAACCCCACTGG
+GATATCGGTGAGGCGCTGGATATATTGGATTTTGAACGGGGCGGCAAGGTTACAGGTGCC
+AGGTTTCTTTTTTACAAAGGAGCCGGTGCGGCTCTGGAGCGTGCTGTATTTAATTTTATG
+CTGGATGTGCATACGAGGGAGCACGGCTATGTAGAGGTAATGCCACCATTTATGGTTAAC
+AGCAACAGTATGATCGGCACAGGCCAACTGCCCAAGTTTGCCGAGGATATGTTTAAAGTT
+GAAAATACTGATTACTATCTAATACCCACTGCCGAAGTGCCGGTAACCAATCTTTATAAT
+AATGAAATATTGGATGGCGATAGATTGCCCATTTACCATTGTGCCTACAGCGCTTGCTTT
+AGAGCCGAGGCAGGAGCGGCGGGACGTGATACACGGGGCCTTATTAGGCTGCACCAGTTT
+AACAAGGTAGAACTGGTAAAGTTCGTTCGTCCGGAGGAGTCCTTTACTGAACTGGAGAAA
+TTGACTCAAAATGCCGAGAAAATACTGCAATTGTTGGAGCTGCCTTACCGGGTGGTTGTT
+TTAAGTACCGGTGACCTGGGTTTTAGCTCTGCCAAAACCTATGATTTAGAGGTGTGGCTA
+CCCAGTTATAACAGTTATAAAGAGATTTCTTCTTGCAGTAATTTTGTGGATTTCCAGGCC
+CGGCGGGCCAATATCAGGTACCGGGAGGGTAAAGCAAAACCTCGTTTTGTACACACTTTA
+AACGGTTCAGGTTTGGCCGTGGGCCGGACGGTAGCCGCTATATTGGAAAATTGTCAGACT
+GATACCGGTGCGGTGAAAATACCGGCGGTGTTACAGCCGTATATGGGTGGCATTAAAGAG
+ATAAATTGACACTACTGAAGGGGAACGGTGTTATTGACACCTAACCTATACTGTGTTATA
+CTTCTTATTGTCTCTGGTTGATTGAAATTGACTGGAGGGGTGTCCGAGCGGTTTAAGGAG
+GCGGTCTTGAAAACCGTTGAACCTTCACGGGTTCCGTGGGTTCGAATCCCACCTCCTCCG
+CCATTTTAATTACCTGACAGCACGGAGAGATGGCCGAGTAGGTCGAAGGCGGTCGCCTGC
+TAAGCGATTATACGGGCTAAAACTCGTATCGAGGGTTCGAATCCCTCTCTCTCCGCCAGT
+AAAGAAAACCACGGATTAAAGATCCGTGGTTTTCTGATGGGTTTACTCTCACCATATCAT
+GGTTATCACTCATTTTTACCAGTTGACTTTTACGAGTGCTTTTGTTACAATTATATTTGC
+GGTGCTGGTGAAGCAACGCAAAGAAAAAACAATATGTGCCTGTGGCTCAATTGGATAGAG
+CATCTGACTACGGATCAGAAGGTTGGGGGTTCGAGTCCCTCCAGGCACGCCACAATTTTA
+CGGCGACACAAAAGTATATATACTAATTGTGTCGCTGCATTTTATTATTAATATACCACC
+ATTGGAAATACATTAGGCGCCTGTAGCTCAGAGGATAGAGCAGCGGTTTCCTAAACCGCG
+TGCCGGGGGTTCGAGTCCCTCCAGGCGCACCACTGAAAATCAAGGCCCGCAAGGATTTGC
+GGGTTTTCGCTTTTCTAGCGAAATTCGCTGAAAGGCTATTTTGGGAGCATTTTGGGAGCA
+AAGATAACAAACCGGGAGCAAACGAGACAGGAAAAGACAGGTTTTACGCCTGTCTTTTTT
+TTGTGTCATTATGAATAATATTCTGGTACACATTTTCTAGCTTGTCCGATATTGCCTTAT
+CGGCACTCTGTAAGTAGTGACTATAAATAGCCCCAGTGGTGGCCGGGTTAGCATGTCCAA
+GCCGACCGGATATATTTTTAAGTGGCACGTTCTGATTAATCAACATTGTGGCCGCGGTAT
+GCCGGAGGCCATGAAAGGGTAGGTGCGGCAATTTGTGTTTTTTAATAAACTTGGAGAACC
+ATTGCGATGGCCATTCCGGGTGCCCGGGCCTGCCGTCCCATGTGGTAAATAATCTGTCTG
+ACCCCTGCCATAAGTCAGCGACCTTTAGGCGGTCCTTAGTCCATTCTGTTTTATACTGTT
+TAATCAGCGTCATAACGAAACCGGGAATAGATATAACCCGCTTTGACGTTTCGTTCTTTG
+GTTCTTTCGTGATGGTGCCTATACCGGGTAGGTACTGACTGGACCGCCTTACGTTAAGTA
+AGGAGTTATCAAAGTCCACATCCTGCCATTCAATGCCCATGATTTCACCACGGCGTAACC
+CGGTGAATAGTGCTATGTAAACAAGCACCTGGTGCTTTAATTCTTCTGCTTCCAGGGCTT
+GCAGTAGGGTGGCAATGTCGTTTTCATCATAACAGGCGGCCGGCTTCCTGGGGACCTTGG
+GAGCTTCCACCCGGGCGGCCGGGTTGGTTAAAATTATTTGCCATTTGACGGCAGCGTTAA
+ATATAGTGACTAATAACCTGTGATGGTGAAGTATGGTTGCGGGCGACAGTGTACCTTCCC
+TGCCGTCCTCACGGATGCCGTATTCCCGCAAGTTGTCATAGAACTGCATTATGTGAAAAG
+GCTTTATGTCCTCTAATTTCATGTGGCCCATAGCCGGTAAAATGCGGGAGTCAAGCATTT
+TTTTATACCGGTGCTTGGTTTTGGGTGCCAAGTCTATTTTGGATTTAAGCCACTGTTGGC
+TAAATTCCGTGAAGGTGAGCCCGGAGGGTTCAATATACTGGCCCTTTTGCACCTCAGCAG
+AAAAAATGTCTAGCTGTTTTTTGGCTTCACGCTCGCTGGTGGCTTCAATCGTCCGGCGGT
+AAACTTTGCGATTACCGCCCGGGCCCGTCCCACCTGGTACGTTAAGCCGCCATTTGTTGG
+TCCCCCTGTTTTCTACCCAGCCAGCCATTATTCTGATTCTCCTTCTTCTGAGAACATTAT
+TTTTAGCATAGCGAGTACGCGTTTCCGTTCATACTCAGTAAGAAGTCTGCCATTATAATA
+TGCTTCCTTTTGATGTTTAAGAAGAAAAGCTATGTCATATAAATCTTGTCCAGACATTAA
+CTTAACTGTTGTTACGCTATCAACTCCCTTTGTTGCTATCTCACCAGGCACAACAAAATT
+CACTTTTGGGAAAATAGAACCGCTAGGAATCTGGTCAATGTACATCCTGTTGGTAAGAAT
+AATATCGTAAATATCTACGTCAAGTATTTTTGCAATTTCTTCTATTACAGAAATAGGCGG
+TACAATTTCACCGCTTTCATATTTTTGTATCACGCGTTCAGACTTGTTTATTTTTTTAGC
+TAATTCCTTTTGGGTTAGTTTTTTACTTTTTCTCAATTCTCTTATCTTGGTGCCAATATC
+CAATGTATTCACCTCCATACCAATATACTACCATAACACGAATTAAAAGTACAGATAATC
+AAATAAAAACTATTTACAACGAACTATAAATACGCTATTATATAATTAGTACGAATTTAA
+AATTCGTTAAGGGGGTTTAAATAATGCATAAAACACTAGATCAGCTTAAAGACGATGCCC
+AACATGTATTACGTGAAACAATAACTGCTAGAGAAGTAGCGGAAATGCTGGGTATTAGTG
+AGTGGGCAGCATATGACTGGGCACGGAGAAAAATAATACCGCACATCAGGGCAGGTAAAC
+GCGTGCTGTTTAGGCGGAGTAGCATTCTCCAGTGGCTGGAGGCACAGGAGCAGGCTAGCG
+TTACGGTAGAGCCGGAAACTGCAGGAAAAATACGGCGGCTGAAATAATCGACATAAAAGC
+AAAAGCCCGCGCGGGGCGGCACGGGCAGGCGGTAAGGTAGGTGTGATACAGTTGCATGCT
+CCAAATAGTTTATCACGAAAAAGTAATATCTTTCAATTGGTTAAGCAAATTAATACAGTG
+GACATTATTCATAAATACAACATTGCTAATATGCACCGGCATGGTCGCTATTGGGTGGGT
+TTATGTCCAGTTCACCAAGATAAAAAACCCAGTTTCTATACTTTTCAGGATAATAAATGC
+AAATGCTGGGGATGTGGATTCTACGGTGACGCTATTGACCTAGTGGCAAAGGTGTATGGA
+CTCAGACCCATTGAGGCGGCCCGGATGATAGCGCGGGACTTTGGTATTGAGGTGGACAAT
+AGGCCGGTATCATTGGAGGCCAGGCGTAAGGCCAAGCAGTTGGCCATTGAGGCAGCCCAA
+AAGCGTGAGATTGAGAAAATCTTTAAACAAAAACGGGATCGGGCGTTAGAAATACTTTCT
+TTGTTCGTGAGAACTACCAACCATGTTTTAGCTGCTGGGGGTTATCAAGCGCATTATGAT
+TTAGCTGAATTGTTACATAAAACCGACTACCAAGAGTATTTGACCGAATGCTTGTTGAGT
+AAGGATCCCGACTTACAGCTTATGGCATTGACCGCCCCGGAGGTGCAACAATGGCTCGAA
+TAACAGCAGACGAACTCCATGAAAAAGCAAGAGATGACCCAGAGGTGGCTAAAGTGTTGG
+GGTTATCATCCTTCTGGGAAAAACTCCTAAGTAAAGATAAAAACGGTAGGATTTATTCCA
+CAATTAATAACGCTCTTTTGATATTGCGGAATGATGAAGCGTTAAAAAGTAAAGTGGCTT
+TAAATGAGTTTGCAAACCAGCTTGACATTAGGGGTGCTTTACCCTGGGGGAAGGCCAAAG
+GTACTTGGTCTGACAGTGACGATGCCGAATTAAGATATTATTTTGAGACTAGCTACAACT
+TTACTGGTAAAAGCAAAATTGATGATGCCTTTGCCATTGCCACAAGCCGGTTGAAATTTC
+ACCCGGTGCGGGAATATTTGTCAGGGCTGCAGTGGGATGGGCAGCAACGGCTTGATGCCT
+TGCTGATTGATTACTTCGGGTCTGAAGATAACGAGTATACCAGGATGGTGACGCGAAAAT
+CATTCACGGCTGCTGTGGCCCGTGTATACAAGCCTGGCATTAAGTTCGACACCATGCTGG
+TGCTGGTGGGTAACCAGGGCATAGGCAAGAGTACCTTTTTTCGTTTACTGGCCGGGGATG
+AGTGGTTTACTGATGACCTGCGGATGGAGGATATGAAAAATAAAACCGGTGCAGAAAAAA
+TGCCGGGAAAATGGATCATCGAAGTTGCGGAACTGGCCGGGTTGAGAAAAACTGAAGTTG
+AGGAAGTTAAATCATTCCTAAGCCGCAACTTTGACCGGTACCGGGAACCGTATGGCCGCC
+GATCAAAGGACCAGCTAAGACAGTGTATCCTTGTGGGGACTACAAACGCCGTGGATGGCT
+TCCTAAGGGATCAAACCGGGAACCGGCGCTTTTGGCCCGTGAGGGTGAGCCGCGGGAAAT
+TGAAACCTTGGGAAATCGATAAGGTAAGGAATCAGATATGGGCTGAAGCCAAAAAGTATT
+ATGAGACTGGGGAAGCGCTTTACCTTACGCATGAGGTTGAACAGTTAGCCACGGCGGTGC
+AAGAAGAATACACGGAAATAAGCCCATGGTACGGGTTGATTGATAAGTATCTTAGTGAAA
+AATCTATGGGAGTTGTCTGTGGAATTGAAATTTGGATACATGCCCTTAGTGGAGACAAAA
+ACAAATATGGCCATAGGGAGCAGCAAGAAATAAGCAATGTCATGAAAAAAATACCCGGAT
+GGGAACCAGGAGGGCGCGAAAGAATACCGGAATATGGACGGCAGCGCGTTTATAGGCGAA
+TATCCTAAAACCTGTCCACCTGTCCCATACCTGTCCCACACCTGTCCCCTTACGGACATA
+AGGCTTTCCCCCTCTTTGGGACAAGTGGACAAAGAAAAAGATAATAAGTATTTATATGAT
+TATAAATAAAGAAAAAATATATATATGGTTTTTTCTGTCCCCTGTCCCAAAAAAACTCGG
+AAACCTTGCAGGAGTAAGGGGACAAGATGGGACAGGAACTATCTCAACCCTGTCCCATAA
+AAGAGCCTGTCCCATATTGGAGTTGGTTACAGTAGGGGGTGATTGTGGTAAATGAGTAGG
+ATAAAAAAGGCCACTGAACAAGAATGGCGGACAATTGCAAATGAAGCAAGGGAACTTAGG
+GACCGTATAGGTAAGTTAAGCATTCAAGCCTGTCCATATCTGCCAGTTAAACTTACGGAT
+GACTTAATGAGGGCACAGCAGGTAATTGATTTATTCCGTGCAAGGGCAGAAGATGAAATG
+TTTAAACGTGGGGGTATTAAAGATACAGATATCTGGTATCCCGGAAAATGATAATAAAGG
+TGATGGCGATCTATGAAATACATACGCATTCAGATGCCCAAGCACATACTGGTACTCACC
+GACCAAGAGCTTGAACGCCTGTTGGCCCGGGACCCCAAGTTATGGAAGCTGGCCATCGGT
+AGGGGAAAAGGCTTGCGGCGTTATCAGGCGGCCAAGGCGAGAGCAAATAAAGATAGGGGT
+TGAGAACATGGAAGTTTCAATTATTCCACAAAAGAAGTTTGAATGTGTAGCGGGACGCGA
+TTACTTAAAGGCCCGAATTACATTGATTGTTTCAGCTAAGACAAAAGAAGAGAAAAGGGA
+GCTGCGGGCACGGTGGGAGCAGCTAGAGGAGAATGGATCGCTTAATGAACTGTTGGAGCT
+TGTCAGGGAGATGGAAGCGGGCAGTTACGATTAAGCATTTAGGATGCATACCCGCCCCCC
+GGGGCGTCTATCTTGTGGCCAGTTCACCTGACCGGAGGGGGAAGGCTATTTGCACACATA
+GAGCAATTACGAGATTTTAGCCAAAAATTACCCCCCTCCGCCCAAAGTAGCAAATATTAA
+CAGAAAGGGGGCAAATTATGAGCCGTCCGAGGAAACCACCAAAAACTAAAATTAAAGTCA
+GAGATATTCTTAAATACATTGAACAATTGCCCCCGGATAATCCGCTTAAACAAGAATTGA
+CACCGGACAAGCTAATCCGGATTAAGCGATATATCGAGGAATTGCAATATCTGGATTACA
+TCATCGTGGGGTTGAAATCAGACATAGAGGCAAACGGAGAAATTGAGCTATATGAAAATG
+GTAATCAGAAAACCCGGCGTACCAATCCGGCGTTGACAACTTACATTGACACAATCAAGG
+CATACAATGCCCTATTGCGGCAAGTCTCAGAAATTTTGAGGGGGATAGAAATTGAAATTG
+CCAAAACGTGGTAGTGAAATACTACAGGTGATTGATGCCTGGCATACTCTTATACACCAG
+GCAAAGGCGGGCAACCTACAGGCAATTAAAATTTTTCTAAGTTTGAAAGCTAACAATCAA
+TCCGGTGCTGGAACGGCGCCAGGCAAGGTTGTTGACATAGATAAATACCCGCTGGAATAG
+CGGGATTGAAAGGGGGAAGCCCTCATGAAACTCTACGGCTTTTCAAATGAGCTGAGGGCG
+GCTGGTGAAGAAAATAATATGCTGCTGGAAGGGCGGGCAATTGTTTTCGACCAACCGACC
+GTACTTTATGAATTTGACGGTATCGAGTACAAGGAAATCATTGCTTCAACGGCCTTGGAT
+AAGGCTGATATGAGCGATGTTGTACTTCGATATAACCATAATGGTGAATACATCGTCTTG
+GCGCGAACTCGGAATAAGTCCCTAACGCTGGAAAAGCGGCCAGACGGGCTCTATATGCGG
+GCAACTTTACAGTCAGATATAACAAGCCACCGGGACCTATATAATGCGGTAAAATCCGGT
+TTAATTGACAAGATGAGTTTCGGTTTTGCGGTGGCTGATGATGGTGATAGTTATGACTCA
+GCCACGCATACCCGGACAATCATGAATATACGCAAACTTTTTGAGACCTCTTTAGTTGAC
+CAACCGGCGTATGACCAAACCTATGTTGAAGCCAGAAGCAGGCTTGAACAGTTAGCGGAT
+GTTGAAGAATATCGGAAAGCATTGCTCATTAGAGCAAAATTAATCAGGAGGTACTAGCAT
+GAATAAATTCAAATATATGACCGAAAGTGAAATTGAAGAATATCGTTCCCAGTTGGAAGC
+CGAACTTTTAACCAGTTCCCCGGAGCGTTTAAAGGAAATTGACAAAGAACTGACGGACAT
+CGCGGCAGCCCTGGCCAAAGACGAATATCGGCGCACCGTGGGCGCTGGCCCGAGGCAACA
+GCGCACTGCCGGCCCTATTGGTCAAATGCAAATCCTGGGCACCTACGGCATTGGTACCGG
+TATTACGAACAATACCAACACCAGGGGCAATGAACCCGTAAACGGCAATGTTTACGGCTC
+CTCGGAATACCGGCAGGCTTTCATGGGCTTCGTGTTAACCGGCGCCCGGTCAGAGATTTT
+GGAATACCGGGCCAACGCTACCACTCTAACCAGCGACATTGGAACCGTGATCCCAACAAC
+GATCGTACAGAAAGTCTACGAGAAAATGTCCGCTTACTCCATGATCTGGGACCGCATTAC
+CAAAACAAACGTCAAGGGTGGCGTGTCTGTCCCGACATCCAGCTTAAAACCAACCGCAAC
+ATGGGTTGCTGAGGGTAGCGTTTCAGATAAACAGAAAAAGCCTACCGGCAGTATCACTTT
+TAACTACTACAAGCTGCAATGCCGTGTAGCTATCTCCCTGGAAGCTTCCACGGTAAGCCT
+GGAGATGTTTGAATCAACTGTTGTAGAGAACATTTACGAGGCAATGATTATTGCAGTTGA
+ACAATCGGTTGTAACCGGCACAGGCGTGGGCCAGCCCCTGGGTATCGTAAACGACAACAC
+TATTCCTGCTGGCCAGATTATAGATGTAACTGCCGCTGAAATAAGCACCTATGGCAAATG
+GGCTGCCATTATCGGGACTATACCACTGGCTTACGAGGCAAAAGTCAATTTAACTCTTAC
+AAAAAAAGATTGGGACAAGTATATTGCCGGTATGGTTGATGCCAACGGGCAACCCATAGC
+CCGGATTAACCTGGGCCTGGCTGAAAGACCGGAGCGGCGCGTCCTGGGTTACAATGTGGT
+GCTTGTGGACGATTACCTACCCAGCTTTGACGCGGCGAATGTCGGCGACATTTTTGGGTA
+TTTTGTGGATTATAAAGATTACATCTTCAACAGTAATCTGCAGATGCTCTACAAGAAATA
+TTTCGACGAGGACACCGACGAATTTGTGCATAAGTCGACCCAACTGGGTGACGGCAAACT
+TGCAGCTCCGCACAGCGTAATTCTACTCAGAAAAGCCGTCTAAGTTCCTCCGGCTCCTTT
+TTATACTGCCCATCTTTAACGGTGGGCAGTAGAAAGGGAGCAAGGGGAGTTCCCTTTAAC
+TGCAGCGCGGTCGATCGTTGCAGGCGTACAAACCCCATAGCCATTTTTTCATAAACCTAT
+CCTTTTATTTTAAGGCGGCCACCAGGGGGCTCACTGGTACGGTGAGCCTGGCCGCCTACT
+TTCTTTTTTAAAAATAACTTTCGGGAGTTGATAATATGGCAGGTTCTACCATAAAGGGCA
+TTTCTATTGAATTCGGAGCCAACACCCAAGCCCTTACGGCAGCATTAGCAGACGTAAACC
+AGAAGAGCCGAAATCTCCAGGGGGAGCTTTCACAGGTGCAGCGTCTTTTACGCATGGACC
+CCGGTAATACAACTTTGATAGCACAGCAGCAGCAACTTTTAGGGCAGGCTGTAAACAATA
+GCCGGGAAAAGCTTGATCGCCTAAAGGCTGCCCAAGAACAGGTAAATGAGCAGTTTCGGC
+GCGGTGACATAAACGAAGCCCAGTGGCGGTCGTTTCAGCGAGAAGTGGCCGCGAGTGAGC
+AGCAATTGCAACGATTTGAGGAACAACTGCAGCAGGTTAACCAAACATCTGACAACCTTA
+CTCTGGGCGATAAATTCAAAACCAGCGTGTCCGGCGTTGCTGATAATGTTAAAAACATTA
+TCAGCCCTGCAACACTGGCGGCGGGGGCCGTGGCCGGTATCGGAATTGCAGCCGTTGGAG
+TGGTGGCACAAGGCGTAAATATGGCTTCTAGCTGGGACCAGGCCAGCAGGCAAATGGCAG
+CAGCGACTGGGTTACCAATGGAAGCAATGGGCGAATTTGAAGCACAAGCAGAAATCATGT
+TCGGTAATGCCCGGGGCAGTGTTGATGAAATCTATGCAGCCATGACACAAGTACAACAGG
+TATTCCATGGATCGGCCGAGGAAACAGGCGCTTTGGCTGACAAAGCGCTGGTGTTGCAAC
+AGGTTTTTGGCTTTGAAGTGTCTGAAAGTATAAAATCAGTCGATAGCCTAGTCAAAAACT
+TTGGCATTGATGGCAATACAGCCTTTGATATTATTACCAAAACATCACAAATGGCCGGCG
+ACAAAGCCGGGGATCTGTTGGATACTTTCAATGAGTATTCCCCACAATTCGCGGCAATGG
+GTTTCTCTGCTGAAGAATTTGCCGGGATTCTTGTCAAAGGGGCTCAAGAAGGCGCGTTTA
+ACCTGGACAAGGTCGGTGATGCCGTCAAAGAATTCAATATTCGTGCCCAGGACGGTAGTA
+AAACCACGGCAGAAGGGTTTGCCGCTATTGGCCTAAACGCTGACGAGATGGGCGCAGCTA
+TCGCTGCTGGTGGCGATAAGGCACAAGCGGCTTTTGAAGCAACCATAGCGGGACTAGCTG
+CAATAGATGATCCAATGAAACAAAACCAAGCAGGGGCGGCCCTTTTCGGTGAACAATGGA
+ACGATGTCAGATCAAAAGTTATAACTGCAATGGCTGACGGTAAAACCGCTCTGGGCGACT
+TCGCGGGGGCAACTGATGACGCAGCTGGTAAGGTTGACGGTGGTTTTGGCCAGGCGATGG
+AAAGGCTGAAAAATAAATTTGGCCTCGTCACAAAAGAGATCGGTGAAAAACTGGCCCCTG
+TTTTGAATGAAATGGCCACCTGGATAGAAGACCATATGCCTGAGATCCAAGCAACTGTTG
+AGACTGCTTTTAATGTTATGGGTAAGGTGATAGAAGGTTTAACATTGCCGATTCGGAACA
+TCATTGCCTTACTGCAAGGTGACTTTGACCAGGTGATGGAAAACACGCTTCATTTGTGGG
+GTATCTCGTGGGACGGAGTAAAATCCAAAGGACTTGAGGTTTGGAACTCTATAACAACGG
+GCGTTAAAAACTGGTGGAGCGGCATAACAAGCTGGTTGTCCTCTCTAAACCCCTGGGGGG
+CCGTTTCGGGGGCATGGAATACCTTTAAAACCAACACAATCCAGGTTTGGTCTAATCTTG
+TTACCGATGCAAAATCATGGGGTAAAAACATCGTTCAGGGCCTCTGGCAAGGCATCTCCA
+GCATGGGCACAACCCTAAGAGCCAACGTCACAGAGTTTATTAACCAGAACATACCGGAAG
+TCATTAGAAAGCTTTTAGGAATACATTCCCCGTCAACAGTGGCGTATGAAATCGGAGCAA
+AGATTGAGGATGCAGACGAAAAGGCACAATTGGCATTAATTGAAATTAGAAAGTTTATGG
+AAAGGTGGGCGGTAGCATGACTCTTGTAATATCGGCAAATAACCGCGATGAATACGCTCT
+TGTGACCGGTGATTTTCTTGGTCGCAAGCATAAAGACATGGACTATAATAACCCGGTAAA
+CCATAATGATAGTGACGTTGAGCTGGTTAATAATGTTTACAAGACACTTAAAGTTAGTGA
+CTATGTATTACTTGGCGCTGCCGGTTGCCATGACCTTGGCGAGTGGCTTAGAAAGGAAAT
+ACAAGACCGGGCAGCGCCTGACTTTGATTTAATCCAGTGCAGGCAATTGGCCGAAGAAAT
+CGTCGAGGAAATGAGGGATAAACGCACCCTTAGAATAACTTTTGACATGGAGCCCCTATA
+CTTAAACCATTTATATCAGGAAAATGGCTTTGCCTTTGTGTTGACCGGCTTTTATAAAGA
+AGGCGGAACCGGTTATGTCTCTTTTGAAAGCAACCCTGACGGCGGGACATTCACAGAAAA
+GAATTGCAGTAATAACAGAGGTTACCAGTTATTTACTCCGGCAAACAACTACAGGGAGTT
+GATGGATCAATATTTTGAGCTTCGTGACGGCATAACCCCTGTTATTACAACCGCAATGGC
+ACAGGCACTATGCTTGCACCATATCATTGTTGATCATATGCCGGAGCATGTCTCCCGTGA
+AATGGAAATATTGATTTTACAAAAACAGCCTGGGCAGAATAAGCCGTGCTTTGGTCGGAT
+AAAATTAACCGATCAGAGCCGGGATAGCGCCATAAAAACAGCGGGCCAGAGGTATGCTGA
+CATATTTTTAAAACCAATGTTACAAACCATTGTAAAAACCAAACCCCAAAAACCTTCTGG
+TTATGTTAACGTTATTAAAGACATAGCCGGTCTGGGCAAAACCATGGTCGTATTAGGTCA
+AGCCATGAAGAAAAACGACATGAAGCGCATAAATATCTGCATAGATTTATACGTTGCAGA
+AGTGGCCAAGGTTAACAATTCCTTTGCCGGACTTACCCCGCCTAAGGAATTAAAGAACTA
+CCACGGGTACTATAAAAAGCTGATGAGTCATCATACCAAAGCCGTTAAATGGCTAAAGCA
+GTTTCAAAAAACAGGGGACATTGTCTTTATAGATAGGTTAAATATTGAAATGGATAACAT
+TGAAAAAATAATAGATAAGCTAAAGCGCCCGGTTTAAACCGGGCGTTATTCAGTCTTTTT
+TAGGGATGTCACTGAAATATTTCCAAGCCCCTTGTTCATCCTGAACTAGATGCATGGACG
+CTTTGTAGGGTTGTTTATTACCAACGAGATTGACTGTTATTTCGAATGGTATTTCGGCTA
+CGTTTTTGTAAGTTTTACCGGTACCTTTTGAATCAGTCCAGCTATTAAGTAAAACTGGCT
+CTTTCACTTGGTAGCTTTCAATTGCAAGTACCGGGCCATCCTCTTTCATTTTAATAAATT
+CATCTTCAGTAATTAATGCCCGGGTATCCGGGTGAAGGTATTTGTATAATTGCTGCCACT
+GTTGATATGACATATACTCTAAAATGCTTTGGGCAACCTTTTCTGGTGGCTCAGCCTTTG
+GTTCTGGACTTTCCTTTGGCATATTGTTCTCACCACAGCCAATCAGTAAAGTTAAGACTA
+ATACTAATATGGTAAGCAAGCTTTTGGGTTTCATACTATCGCCCTCCTTTTTAATTATTT
+GGTTTATTGTATTACGTTACCAAGGCAATAACATGTCACTTAAAGTCGAATATAACTTAA
+AAATTTAAAATTATCCTAACATATCAATTAATTTTTAAGGATAATAATTTCATGTAAAAT
+AAGTGGGATTACTTCCGCTTTTTGTATTTTCGTTTGGCTGCGGTATTTTCCGCTGCGAGA
+GGAAATAAAACTGGCCATGATGGACTAGGTGATCGGCTTAAAATTACATTTAACCCCAAG
+CGAGAAGGTTGAGCTGGCCCGTAGGATCGAGGAAGCATTGGGAGGACGGCAGGGCAGCAA
+TCAATATCAACGGAAAGAGGACCCGCAAAATTTTGCGGAAGCTCAAAAAGGAGAATCCCG
+AGACATAGCTGCCAAAGCCGTGGGTATGAACCGGGAAACCTACCGTCAAGCAAAAGCAGT
+AAACATGAAATCGAGGAGGAACGGGCGCTAAAAAGAAAACAAGCTACACAATTGATAGGT
+AAGGATAAGAATGGTTTGCCAACACAAAGAACTTCGGTTGGGGAACTGAGTTCCACCACC
+GAAAAGGGCAAAACCCGCGATAAGATAGCGGAGCAGATAGACTTCCCTTTGTCGGGCAGA
+ACGCTTAGTAAAGGCATGAAAATTTATGAAGCTGCCAAAGACAGCAATAAAGACGCTCAA
+GAGTCGTTAAAGAAAATAGACAACAAAGAATCAAGTATTACCGCTGAATACAAAAAGCTT
+TTCAAAAAAGATGAAATCCCAAAATGGGCAATTAAATATAGTGACTACCATATGCCCACT
+ACATAGTTCGGGTACTGGCCCTTCATAGGTAGGGTGGCCATCCTTTCCATTCCGGCGAAT
+TTGCCGGATTGCTCTGGTACTGGCCCTTCATAGGTAGGGTGGCCATCAGTACCGGACAAT
+CTGTCGGTTACTGAAAATGTGTACTTAACCCCGGTCAAACTATCCCAAGTTGAAGGGTGC
+TGGCACGCCATAGGTAGGGTGAAAACGCACCTTGTGGAACTCAGTTCCCCAAGGTCAGGA
+TTAGGTGCTGGCACGCCATAGGTAGGGTGAAAACCCCTCAGTTGTACCCAACTTGACGAC
+AACTGAAAATAACCCGGCAATGGCCGGGTTTATCTACTGCCTGTTATTTTTTCTTGGTTA
+ATTAGCCGGTTGTCCAATCTTAGTATATCCCCCCAAACTCCCTTAAGCTGCAGTTTGACT
+TCTGATACATCCTTCTGTATTTTGCGCTGGCCCTTCTCTAAAGTATCCAGACGTTTAACA
+ATGGATGCCTGGCCTTGCTCCAAGGTGCCCATGCGTTGATCCATGTCGTCAAGGCGTTCA
+TTGATAGGCTGCAGCTTCTCGGTTAGTGCCTCATCCAGTACCCGGCGGAGCATTTTTTCA
+AGCTCACTCATTGGCGGTGGCACCCCCTTCTTTGTCGGGTATGTGTTCTAGTAGATCACC
+AGGCTGGCAGTTTAAGGCGGCACAGAGCTTATTTAAAGTGGAAAAATCCATCCTTTCAGT
+TTTTTCATGGTAAAGCAAAAAAACCGTATTTCTTGATAATCCCGTTTGCTGTGCTATTTC
+TGTCATATTAATTCTTTTAGCCCCAAGTATTTTAGATAAATGCACTTTTATCATAGGCAT
+ACCCCCTGTCTTTATAATACAGTAAATAGTTAACAATGTACAGCTAATAATAAATAATTT
+ACTGATAATAGTAAATAAAGTATTGACAATGGTACGGGTAGTGGTTAAAATTGTACTAGA
+AGCAATACAGTCCACGCTACCAGGGAGGCGATCCCTGGGGAAAATTAAAAGAGGGATTTT
+AAGATGCTTAAACTTGAGAACGGCGATTATTTGGTTTATTCGGACGGCAAATTTTATCTT
+ATTGCGGACGGTGGCAGGGAGTCAGAATAAGGAGGCTTAAATCATGGCTAGTAAAAGAAA
+AGTTATCATTGTTCCTGATTTGCTACAGGACTACATCGTACTGGGAGATGTTGTATTGGT
+TAGTTTAAGGTACGTAAAGGAGCTCATAGGAGAGAAACGAGAGGATGAAGCCCATGTCAG
+CTAGAAGAGGGGTAGTAATTGTACCAGATTTGCCGGTTGATTATATTGAACTGGAGCACG
+TCGTGCTTGTTAATGCGGAATATTACATTGGTTTATTGGAGAATTAACCTGTAGCTTTAA
+AAGGGGGTATTCGTTAATGAAAACGGTAGTTTTTTGTAACTTCAAAGGTATGGAAGGCCC
+TGCCAGTCAATTTACATGTATTGCAACTGATGATTTTATTATGATTGAAGAAAGCCTTTC
+ACAAGAGGAAAAGGAACTAATTACATTTGTGCATGGCGGCAGTTTACCTTTAGCGAAGGA
+GGCGTAA
+>NC_021184.1|provirus_4466413_4519129
+GTGAAAGTTCAGAACCCACACGATAAATTCTTCAAAAAGACCTTTGGCGATGTAGCCGTG
+GCCAAGGATTTTTTAAATAATTATTTGCCTCAAAGCATCACGGATATAGTAGACGTGGAC
+ACATTGGAGCCGCAGAAAGACAGCTTTATTAACAAAGAGCTACAGGAAAGTTTTTCGGAT
+CTCCTTTTTAAGGCCAATATCAATAAACGGGAAGGCTACCTTTATTTTCTCTTTGAACAT
+AAAAGCTATCCCAGCCGGGATGTTGCTTTTCAGCTCCTAAAATACATGGTAGAAATTTGG
+AACGCCAAGATTGAAAATACCAATCAACTGCCGGTAATTATTCCGCTGGTAATATACCAC
+GGCAAGGACGGCTGGAACATAAAACATACTTTAGGGGAAATGCTTTCGGGCTATGAGGAA
+CTGCCAAGGGATGTCCAGGCACACATTCCAAATTACAAATATCTGCTTTATGATTTTTCT
+AGGTTTACTGATAGGGAAATAAAAGGTGAAGTAAGAAACAAAATAACAGTGACGATAATG
+CGGGATATGCCGAGAGAGGATATTGGCGAAATCCTAAAGTATGTTTTTAGAGCGGCTGTC
+TATTTGCTGGAGCTTGAAGATAAACAGACAGGGATAGAATATCTTGAGACCCTAGTCAGA
+TATCTGCTCAGCGCTAGGGCTGATTTAACCAAGGATGACTTCAATGAATTGGTTAAGAAA
+ATCGAAACCATCTATCCGGAAGGGAGTGAAAGGATAATGACTTTAGCTGAACTGTTTAGG
+GAAGAAGGCATGGAGCGGGGAATAGAAGTAGGTGAAGCAAAAGCCCTTGCAAGGACTGCA
+ATAAAGTTTTTAGTTAAGAAATTTGGTTTTGTGCCAGAGGATTTAAAGCAGGGTATAACG
+AAATTAGATGTACCAACACTGGAAGTTATAATTGACGGTGTATCGGAATATAAAGACCTC
+GATGAGGTAAAAAAATATATCCAGTAACAAAAACCTAAGAAAACCTTTATGAATAATAAG
+CTTATATTTCCTAACCCTATGGATAGTGCTGCTAATCATATCTACCAGAACTACAATGAA
+AAGGTAAGAAGCCCCCAAGCCCTTGTCCCATGCGGGTTTGCGGGGTTTTTAATATACACG
+AAACCAGGGGCTTTAGTGCTATTAACGCTAACAAAATTAAAGTAACATTCAACAAGGCTG
+TTGAAGATACTACAAAAGCAACCTTCGCAGTAAAACGTGGTACGGTTACTGAAGAAGTAG
+CAGTAACTTGGAACGAAGCAAAAACAGAAGCAACCTTAACAAAAACAGGAAATTTTACTC
+CAGCTGAGTACACTGTGACTGTTGGTGGGGTTGTAGAAGCTACCAATACTGTCACAATTG
+CAGCAGAAGAAGTTAAGAGCGTAGTTATCAATACTACTCAGTTACAAAAATCAGCTACTG
+CTCCAGTGTCAATTGATTTCATCAACCAATATGGTGAGAAAGCAACTGTCGCTGCAAATG
+ATACCAAATTGACTCTAACTGCTTACAACAAAACTGCTGGCGTTGCATTAGCTCAAGTCC
+CTGCTAAATTCCAATTTAATGCGGCTGCAGCTACTCTTAAAGATGAAGTTGTAATTACGG
+TAATGTACAAAGGTATTACCCAAACAGCTACAGCCATTGTTGTGAATGCTGCTACTGTTG
+GAAATGTAACATTGGGAGAAGCCGTGTTACCAACTGGTAAGACAATGTTCACACCGACAG
+GAACTAAAGATGTTGAATTAGCTTATACAGCTACTAATACACTTGGTGAGGCTTATAAAC
+TAACAGCCGCTGACAAAACAAGTGGAGCTGTACAATTCTTAAGTTCAGACAACACGATCT
+TAAACCCAGCGGATATCTCAATCGATACTAACAATAAAATTAAAATCGCTAAATTTGGTA
+AAGCTGGTACTGTTACATTGACAGCACTTACACCAGCTACCGGTGCATCAACTACAACTA
+CTGTCGTAGTAAATGAAGATGCTGGCGCAGCATACGGATTAACTTTAGAAAAAGCTGCAG
+CAGACTTCCCAGCTGGTTCCATAACGCCATTCTATGTAACACAAACTGTGGTTGATAAGT
+ATGGTACTGCTATTGCACAGAAAGACTTAAAAACAGCAGATTATACCGTCTCAACAAATA
+ACAGTTCAGTTGCTACTGCAGCATTTGAAATTACACCAGGTACTGACTATGGTAAAATCA
+AAATCACTCCAGCCGCTGCAGCTGTCAAAGGTAACTCAGCAACGATTACTGTAACTGTCA
+ATGCTACTGGTAATCAGGCAACATTATTAGTGACTGCTAGTGATGCAGCTGTACCATCAA
+GTGTTGACACCAAAAAGAATACAACCGTTTCAACTAACATGTTAACTGGTGCAACACAAA
+CATTGAGTTTTGATGTAAAAGACCAATACTCCACAACCTACACAGCAGGCGTAGCAGGAT
+ATACTGTTGAGTACACAACCAGTGATTCTAGTGTTATTGCAATCACTTCTAACGAAACTG
+CAAAAGATGCTATAAATACAGCTGCAGTTGATGTGAAAGCACTGAAAGCTGGTTCTGCTA
+CCATTAAGGCTACATTGAAAAAAGATAGCGTAGCAGTTGCTGAAAAGGCTTACACGATCA
+CAGCTATAGCAAATAGCTCTGCCGGACTTACTTACAGTGTAGAAGCGCCAACTCCTGCAT
+ATAAAGGATTACTTTCTAAGGATATCGTTGGCGAAACACTTGGTGATGCTGGTGCCGCAA
+CCTTAACAACAAACGCTGATAAAGAGCGTGCTATTAAATCTGGTTATGCAGCAGAAGTTG
+CTCTGTATGCAACAGATGCAAATGGCGTAAAAACCTTAGTTCCATCTAGCGCCTTAGTCG
+GAGGAGCCCCAACTATTACTCAAGCACAAAAAGCGGATGGAACAGGTGCTGCGACTGTTC
+AGGTAGCTGTATTTGAATATAATAATAAATACTACGTATATACCTCAACAGCAGCCGCTG
+CAACTGACTTTGAAGTTACTGTAAATGGTACTAAAGTTACACAAGATGTAAAAGCAAAAC
+TAGAGTTTACAATCAACGCAGATGATACTATCAAAACTATTTCACAAGATGTCACAATTT
+CAAAAGATGCTTTAAAAGCACAATCCATCGAATTTAAATCAGCTGCACCTGGAACAACCA
+CTGCAACTGATGTAACAGCAATCACTGTAGCTGACTACGCTGCATATACGACTGCGCTAA
+CTACAAAGGCTTATGTATGGGTAAAAGACCAATTTGGTGGCTACTCATTATCTGATACAG
+GTACTGAAGCTTCTGCCTTCTTATCTGTCGTAGACTTAACAGATGTAACAGGCGCAAGTA
+ACGACACAGTAGTTATTGGTGGGGCAGCTGCTGCACAAGATGGTGTAATTACTATTACTG
+ATACCGGTAGTAATACTGTAATCAATAAAAATGGCGGTGTAGTACGTATTATTGCTAAGA
+CTGGAGCTTTAACAGACTTTATCAACTTAACAATTGGGAAAGAGAACGTAAAACCAACAC
+TTGACTCAGTAGTATTAGCAAACGGTAGTGGAACTGCAGCAACATTGGACGTTAATGACA
+CTATTACATTAACATTCAGTGAAGCAATGACAACTACTGGAAATGCAACTTTTGCTATGA
+CAAACGGTGTTGTAACCTTACTTGATACCACTACATTAACATTTGGTACAGTAGGTGTTA
+ATGCTGGAACTGGAACGGTTGCATGGAGCGCAGATGGTAAAGTCGCTACATTGACTTTCA
+CTGCTGTAACAGATGCAACAACCGCTCCATCAGGTGCTGTTACTCCTGGAGCAGTTGTGT
+TAAAGGATGCTAATGGCAACCTAACTGCAACAACAGCTAGTGCTGCCGCAACAGGCACAT
+TCTAGGCTCAAGGAAATTCAATGCTCTAGAAAACACAATCTGATGGTTCTTTTGTTGAAA
+ACCGTCCAGTGCACTAACTAAACCAGAACAAAAAAAGCCCGGGTGGTCCCAAAGCGGATC
+GCCCGGTCTTTTGTTTATTGGGTTCGCTTGGCATAAGGCAAAGGGGCTGGCGTGGCCCAA
+GTGGAATATTAGTGGGCTTGGCTAGTGAATAAAGCTAGCCCGGCGGGTTGGCCTGATAGG
+GGTTATCTGGGTACCTGGTTGGCCGGGAACATAGAATGGCCGCGAGTTTTGCCCAGTTTG
+TGCAGGAATATAAATAATACTGATTACACGGCAAACCAGGGGGACGGTTCCTGCGGTTTG
+CGAGAACACAAGTGCTCGGGACAAACCAGAGGGACGGTTCTGGAAAAACACAAGGGGACG
+GTTCTGTTGTGCAGTAGATAACCGTCCGGCGCACTAACTAACCAAACAACCAAACAGCCC
+GGGAGGTCCTACACGGATCGCCCGGCTGTTTTTTATTGGGCGGGGTGCGCAGGAACGCTG
+GGTATAAAGGAAAGAGGCCAGCGTGGGGTTGAGGAGGGCGAGATTGGTAGGCAGCCCGGC
+AGGTAGGCCTGATTGGGGTTATCTGGCTACCTGGTTGGCTAGTAAATGCGGGGGATAGTT
+GAGCATGAAAAAACACCTTACAGGTAGAAATACTTGTAGGGTGTTTTTTTTTATTTCTCC
+AGGCTAGTTTTATCGGCAGCTCCGCCGGAACGTATCCACTCATCCACTTCGGAAATCTTA
+AATTTCCAAAGCCGTCCAACCTTGTGCGCTGGCATGTTACGGTGGTTAATCCACTGAAGT
+ATAGTTTCCCGGCTCACATCAAGATAGTCAGTTATAGTGGCCATTGATGACCATTTTTCT
+ATGTTGTCCATTGTTAAATCCTCCAGATTATCAGCGCACACCATGTAAGAATCCATAGCG
+GCCATGTTCTGTGTCCTTTGTAAAAGTGATTAGGTTGGCACCGGTATAATCCAAATCCGG
+GGGTTCGTTTTCAACAATAATAACTTGACCTTTATGCTGGTTATCAAGCAGATATTGGAA
+TAGGCCTGCTTTCATACTATCCGGTGCGCTCTCATCCCCTCGTTCCTTTAATGAGAGGAT
+AGGTGAATCCACAACCAATAGTCCCGGCGCATATTTCCCCTGCTCCACCAAATATTCCAT
+GAGTGTGACTGCAAGTACAGTATTTAAGAACGCCCGATACCCTTTACCAAAACTTTCCTT
+TGGTTTTCCGTTTACAACCACATCAAATTCCCTAGGGTCAAAAAATGCAGATCCAAATCC
+CTCGTACATACACAAATCCAAAATATCGTTTAGGCGTTCATCTAGCGTGCCTAAAATATT
+GCTGCTGAACTGGTTCTTTATTTTAAATTCTAACTGTGATTCATCCTCCATTTGTACGTT
+GAATAGCTCAGTCTTTATGTTAGTTTCAAATTTGTCAATAACAGTTGTTTCATTTTGGAT
+TTCGATGGCCCGGCGATATTCAGCCAATGTTTTCTTAAGTGCTGCCACCTTGGGCTTTAG
+TTCACTGTTGAGTAAATCTTCGATCCCCCATCTTTCATGATTCAAATCTGCAAGCCTTGC
+CTCAAGAGCAGAGCGCTCTTTGACGATGTCTTCATTGGCCTCCTTAAGATCGGAAAGTTG
+CAGCTGTATTCTATGCAGTTCCGCATGTGATGCCTCGATGTAACCCTTCTCAATCTCCAC
+GGGAACATTGCTTTCGCAGAACGGGCATTTTGACACTTCCTTGACATTCCCCCTGTTTAA
+CTCCCCTTCAACAATAAAGGCTAAACGTTTTACATCTGCGGCATACTGGCTCCCCAGGGC
+CTGGTACCGGTTGTAAAGGGTATTGCACTCCGCCAATTGTGCATTTACCGAAAATATTTC
+TTTCAACAACTGTTTATTGTGCTCAATGGCCCTGGCGATGGCTTTTTCGGTTTCAGCAAT
+ATCATCAAGTACTGTTTCAACCTTGGCTTGAAGATCCAAAGCACCGTAAGGAATATTTCC
+CAGCTCTTCTTTTCGGTCGGCAAAGGTTATTAGCTGTTTATGCATATAATCAACCAATGC
+TTTTCTTCGGGCCTCCGATATTTCCTTTTTCTCAAGGGGTTCTTCCTCGGCAAAATCTAT
+TCCTGTGATCAGAAAGAATAATGCACTGAGTGCTGCTGTTGCGGAGGTATTCTGTCTCGG
+AAGAATAATGGACCGCTCCTGTAAAACACTTGTTTCCTTGATAAGGAACATGTGTGAAAA
+TGTTCTCCAGGTAAGCCTTTGTTTCTCAAATCTTGAGTTTTTTATAATATCGTGTTCTTC
+CTCTATTCCAATTAGTTGGAGCCACAAATCACTGATATTATTCTTTTTACCGCTGGTTTT
+ATAGGTACCAGACATAATATCATAGGCGTCACTATGCACTTCAATTCTATTGGTATCTAG
+TTGGCGGCTTAATGTAACTTTACGACCTTCAGTTGCGATAATAAGTTTTATCCGGTCATA
+CCCGGCGGTTCTATCAAAACGAATTCTATCGCTGCCAAACAAATAGTCCAGGCATTCTAA
+GACATAACTTTTACCGGTATCAGATGGCCCGCAAATAATATTAAGACCCCGCTCAAACTC
+CAGGATGGAAGGTTCCTTGCCGCTGCCCATCACGATTAATTTTTCAATATGGAACTTAGA
+CATCATTCACACCCCTTTGCAGCCAGGTAAATGCGTTACGGTTAATCATTTCAAAAATTT
+GCCGCTCCGATTTTTGTGCTATGTAGCCCTGTGTTCGTTTAGCAAGATAGCGGTATGTTT
+CAGCATAATGATTTGTAAACCGTGAACAATAATCCTTTCCTTTTTGATTTATCGAATATA
+AAAAACCCCTTTGTGAAGACGCTACATCAATTAGGCCGGTTAGGACAAGTTGTTTAACAG
+CTTTTTTAACTAGTTCACGGCGGAGCGGGAATTCACTGTATTTGAAGGCACTGTCCCCAT
+GAAGATCGTTATCTGATATTTCAAAATCCTTACCATAGACCGTTATAAAATCAGCTGCGG
+CTATCATATCAGCTGTCTGGATTAAGCCGGTTTCTAACATTAATAAAACACGCAGTGAGA
+TCTCAAATGGGGTGTTAAATATATTATTCATTCCTTAACACCCACCCTTCAATCTCGCCA
+TCGTTTACCAGAATGTGGCAGACCCCTTTTTTCTCACTGGCTCCGACCCATTTTAGCGGC
+TCACATAGCCAGCATTTGTTAACCTGGATAACAGCTGCATGAGCCATTACACCATTCATC
+CGGGCAAAACCGTGTTTAAAATCATTATAGTAAATATCAATAATGCCATTGTATGTCTCT
+TCTTTTAAGGTTTCAAATTGATCTGGTTCCGTCATACCAAAAATATCCCTTGCATCTCTC
+CTTACGGTTTCAGCGGCATAGTAATCTTTTCTTCGCCGTTCAAAATCTTTTTTATATCTG
+GGATATCGGTCAAGTAATTCTTTTGACAAATCAGTTAATTTCTCGGCTTCTGCATAGGCT
+GCCAACAATTTTGTGACATAGGTCAACTCATGTTTTTGAATTTCTTCCGGTGGTGTTAGG
+GGAGGAGGGCGTAAACCATGGGATTTACTCAATATGGCCTTTAGTGCCTTTACTTCATCC
+ACAATGGTTGGAATTCCGCCATTTGTTTGCTTGTCCCCCGTTAGTTTATTAGGCTTCTTT
+ATTGCATACAGAAAAACCTCGGAAAGAAATCTAGCTAATTTTTCTCCCTCCGCAAGGGCC
+AAGAAATCTTTCTTTTTATTTTGTGGAATCTTAGTGTCCTGGGAGATAAGTTTAGTAAGT
+TCATGCACCAGATCAGAGGTTAAATCAGGTGTAATGGCAGGTATGACCACGTCTTCAAAG
+TAATCGTGGGCGGCGTCAATGATTAATTTGGAGCTAGCCGCTTTTTTAATTTTATTATGT
+ACTTGAGCATTAAGCCCTAATAACTGATTGGCGATTTTAGCCGTAACCACATATGGTTCA
+CCTATTTGATTTGTGATAACAACATTATCAAGAATTAGGCCCAGCAGGAGCTCCGTTACC
+TCCACTTGGCTGTCAGAACCTTTGATTACCTTTTGAACAGCTCTAGCGTATGTACCAAAA
+CACAGCCCGACCACTAGGATTCCCCCTTCCCGCAGAATTCAAGGGTCAAAAAAGGGTCAA
+AAACAGGTCAAACTGAGGGTAAATATTTTTAGGTCACAACCTGTTATCATTTTATTAATA
+AGTGTTGTTGAAAGAGGATGTTTCTACTTGGTTGATTGTTGTATGTGGGCATGGATGAAG
+GTGCCTCAAAAAAAAACTCCGAAAACAACCAGTTGATTCTGCCAGATATTAAAAATATTA
+TATCACCCTATTTTGGGTGTTACAACATTATTAACCATAATTCGAAACAATCTTATCCAG
+TGCAACTTAAACAATCACAAATACACTTAAATACTTGATGGATGAAATTATAGAAAGGAA
+GGTGTTTATGAATAAAAAACTGATTAACATTGAATGCCCCACATGCGGCAATCCAATTGT
+ATCAAAGTATGCCAATGGGGAAGTAACCGGCCTACTGTTGCATAAATGCAGCCGATGCAA
+GCGCTACTGGGATTTAAATTACACAACTGGAACAATTTCCTGGGTAGATGGGAAACCGGA
+CAAAACCCCAGCCAAAAATTTTATAGTGGATTTATCAACGGGGAAAACCCGTCCAATGTA
+TGATAAAGCTTTACTGAGACGAAAAGGAGCCTAACATAGAGCTACCTTAAGGACCAGATA
+GCTAATAATTAATTTTATTAGTTATCTGGCCTTTTTTTTGTCCATTACAAACTTAATAAT
+GCTTTGCCAATTATAGCGAGTTAGGAATCAAAGAATTACCTCAGACCGCATAATTACTGA
+TTTTTCGGTAATTATGCGGTTTTTTTATGCCCGTTTTTCGGACCCGCCCCATTGGGCCTT
+AAAAAAGGAGGAAATAAACATGATAAAAAAATTTCAAACCCAAGATGCTGAGATCACCAT
+TGAAATCACTGAGCAAGGAAAAGCGATTTATGCAGTAGGTAAAAAAAAGACCACATTTGA
+TTTAAGCAAATGTGAATCCTTTACTTACTGGTCAGTTATGGAAAGGGAAAAGTTTGTCGT
+CACGGAGGACATGCTCACCGGTGCAGATGAGATTGAGCCCTGGGTGTGGCTTGTAATTAG
+CCGGGGAGAAGATCGGCTGGAATATAACAACGACCAGGCGGAAACCCGTAGCCATCAAAG
+TTATTCCAGCCAAAACGATAAAGCTAAAGATTTAGTTTCTGATGAGGATGCCCTCGAAGA
+AGTGCTGGCCAATTTGGGCAGGGAAGCCGTAAGAAAAGCTATTAGGTCGCTTGAACCCAA
+GCAGCAAGAGTTAATCTTTGACATATATTACCGGGGCCTTTCCAAGGCGGATGTAGCCAA
+ACGTGATGGCGTTTCTAAAATGGCGATCACCAACCGAATGAACAAGATCATTAATCGGTT
+GAAAAAATATTTAATAAATCTATAAATTCGGGGGGGGTTTACTTTTTGCTCTACCATGAC
+TTGTATATAGAGGCCGTTAACAAAATTTATATTGCAAATCAAAACCGGCCTCTAATCATG
+GTAAAGGTAGGTGAAAAAAGTTGAGTAAAAACGCTTATATTGGCTCCACTACCCGGCACC
+ACATGGAAATTGGCATCAAGAAACCAAATTCCAGCCAAGTGTTGGCGGCAAGGAAGGTCA
+AACTTCGTGACCGGTTCTTAAATGCAATCTTTGGTAAAGGGCACAGCATGGTTGTGCTAG
+TGCCTGGGGAAAGCATTGGCACCATTTCCATTACAGAAATGGAGGTACATGAACTGGAAG
+AAGCGGAAAAGGAATGCGAAAAAATGAAGTCGATACAACGGGAAAAAGGCAGGTGATCTA
+AATCAATGTAATTTTATTCCCGCACCAACAAAGAGCATTAAACCAAACCATGCACCGCAA
+CCTGGTAGCTTACTACCTAGATATGGGACTTGGAAAAACATTTTTAGGTTCAGAGAAATT
+AAAGCAACTAAATGCACCCTTTAACCTCATAGTTTGCCAGAAGTCTAAAATCACGGACTG
+GGCTGAGCACTTTAAGACCTACTATGACTACGAAGTTATTATTTTCAAAAACCAGCCCAT
+CGAAGCAATTCCACCACACAGCATCATCATAATTAATTACGATCTGGTGTGGCGGCGCAA
+GCAGTTAGAGGAATTAAGGGATTTTTCGATGTTACTAGATGAGAGCCAATATATCAAAAA
+CGAAAATTCCAACCGGGCCAAGTTTATTCTTAACTTAAAACCAGACAATGTAATTTTATT
+ATCCGGCACCCCCACCGGTGGAAAGTATGAGGAACTGTGGTCGCAGCTAAGGTTGTTGGG
+GTGGGGTATAAGCAAAAAGTTATTTTACAAACAGTACACCATCACTGAAAAACTTGATGT
+TGGCGGATTCTACATTACCGTGGTCACTGGCTACAAAAACGTTGACCGGCTAAAGGACAA
+ACTTTACCAGCATGGGGCGATATTCATGAAAACTGATGAAGTGGTGGAACTACCGCAGCA
+GGTGGAGCAAATCATTAAAATCCCCAACACCCCCCAGTACAGGAAATTTAACCAAGACAG
+AGTGATTACCATTGATGACGAAATGCTGGTCGGCGATACCGCTCTTGCAAAATTGTTATA
+TCTGCGGCAATTAGCATCGATTTACAACCAACATAAACAACAAGCTTTAAAGGATTTACT
+GTCTTCCACCCATGACCGGGTAATTGTATTTTACAACTTCAAGAAGGAATACCAGCTCAT
+TAAAAGACTAGCTGAAGAACTGGAAAAACCGGCGTCCCATATTAACGGTGACGGTACAGA
+TTTAGATAACTACGATACAAAGGACAACAGCGTCACTCTAGTCCAGTATCAGGCTGGATC
+GACCGGGGTCAATCTACAAAAGGCAAACCGGGTTATTTACTACAGCCTGCCGCTGTCAGC
+AGAGCTATGGATGCAATCAAAAAAACGCATTCACCGCATCGGCCAGCCTCGCAGTTGTTT
+CTACTACTACCTGATCACAGAGAAGTCTGTGGAAGAAAAAATACTGGAAGCCCTAAAGCA
+AAGGAGGGATTTTACCTTGGAGTTATTTGAAAAGGGGGTGAAGTAGCACCAGTGACTGAG
+AAACAGCTTCAAAAGAAAGTCATTAAATATTTAAATTCCCTGCCCAATACCTGGTTTTTT
+AAGGTGTGGGGTGGCGGGTTCCAGCGAAGCGGCATACCGGATTTAATTTGCTGTATTAAC
+GGGTTGTTTGTGGCCCTTGAACTAAAGGGAACGGGCGGTAAATCTACCAAGCTCCAAGAG
+CTAAATATCAATAACATTAACGCTGCTGGTGGCATTGGCCTCATTTTATACCCCGCCGAT
+TTTAAGGAATTTAAGACCCTTGTAAAGGAGGTGAGTAACGGATGCGGTTTAGCCACAGCA
+GAGTTGAATGCTTTGAAAAATGCCGGTACCAATTCATGCTCCGATACATCCGAAACTTAA
+CTACGATTTTCCCCCCGGCAGCGGATAATCCCTTAATAGTCGGTAGCGCTCTCCACTTGG
+GATTGGAAAAAGGACCAACTGCTATGGAGGAATATTACTACAGCCAATACCCGGTGATTA
+ATGACTTTCACATCAACGAAATGATAAAACTGACCACCTTGGTGGAGAAAGCCAATGAAG
+TGCTGCAGGAGTTAACTCGGGGGAAAGTCAGCATATTCGAGTATGAGATAAACTTCCCGG
+AATTTATAGGTTATGTAGATTTAATAGTCCATAACGGTGATGGCAGTGCAGATGTTTATG
+ATTTTAAGTACAGCAACAACATTGACCATTACCTAGAATCCAAGCAGTTACATTTGTACA
+AGTATTACCTGGAGAAACAAGGGTTTGACGTGTTCAAGCTGGGGTATGTTTTTATTCCTA
+AAACCCAAATCCGGCAAAAGAAAACCGAGGATTTATACCAGTTCAGGAAACGGCTAACGG
+AAACCCTGGCGGCCATGCAAGTAAAAGTGGTGGAAGTGAACTACGACCACTCCAAGGTGG
+ATGGATTTTTCCAACGCTGCCATGAGATTCAAAACGAAAGCATTTATGAAAGAACACCGT
+CAAGGCTATGTGCCTGGTGCGAGTTTCAAAAATATTGCGAGGAGGAAATCGATTTTATGT
+TATTACCGAAAAATGAAAAGCGGGAAAGGAAGATGGATCTAAATCCGGATAAGTGGGTTT
+ACGGCGATTCCTATGTAGGAAAGTCCACTTTCATCGAGCGCTATGAAGACCTGCTGATGG
+TAAACACGGACGGCAATATTGACAACCTAACCTCCCCGGTGGTCAGGATTACGGACGAGG
+TGACTTATGAGGGCAGGCTCCGAAAAGAAAAATTAGCCTGGGAAGTCTTTTTAGCAGTCA
+TCGATGAACTGGAAAAGAAGGATAACACCTTCAAACGAGTGGCTATTGATTTGGTGGAGG
+ATTTGTACGAACACAGCCGGTTGTACATTTATAAAAAACTAGGCATTGACCATGAACAGG
+ACGCCGGGTTCGGCAAGGGTTGGGACATGGTGCGGACTGAATTTCTATCGGCTATGAAGC
+GCCTGAAGAACTTAGGCTACCAGGTAATCTTTATCTCCAAGGAACTGACCTCGGAGATTA
+CCCTGAAAAACGGTAACAAAATCACCACCATCAAGCCAAACATCAACGACAAGGTGGCCA
+ATGTACTAGCGGGAATCGTGGATTTGACAGTTCGGGCGTTTATGGATGGCGATGAAAGAT
+ATTTACAGCTGGAGAAAAAGGAAAATGTCTTTGGCGGTGGCCGGTTTAATTTCAAAGTGC
+CAGTTGTGAAATTGGATAAGGATGAATTTATTAAGGCATTAAGGGGCGCTCAGGAAGGCA
+TCAAGACTTATTCCAGGGCGGAAAGCGCCAAGGAAGCAGCAGCAGGAGAAACAACCGGGA
+ATGAAACCAAGGAAGATGGGGCTACGGCAACTGCTAAGGGAGATACCAACGGGGATGAAA
+CTAGCGAGGAAGAAACGGCGGCTACCACTACGGAGGAAACCACTGCGGCGACCGATAAAC
+CCGAAAAACCGGCTAAAAGGAGCAGGCGCTCTCGCAAGTCCGGTAACCAATTAACTAATT
+AAATTACAAGGAGGACAAATTTAATGAGTAGTGTATTTGCAAGGTTCGACAAAGAGTTTG
+ACCTGAAAGGTCTTAAAGAAGACCTGAAAAATGTGGGTACAGGCGATGGCCATTACCGGG
+AAGTTCCCTATGGCACCTATGAAGTGAAAATTGAAAAACTAGAATTGGTGGAATCCAAAA
+CTGGCAAGCCTATGGTCACCAGTTGGATGCGCATTATTGCCGGAGAGTACCAAAATTCTA
+TTTTATTCATGAATCAAGTCGTCCACACTGCCTTCGGAATTCATATGGCTAATGAATTTT
+TACGCTCCTTAGATTCTGGCATCGATGTTACTTTCGAGAATTTTACCCAGTATCACAACC
+TCATTTTGGACATCCATGAGGCCATTGACGGGAATTACGAGTATGCAGTGGAGTATGGGG
+AAACCAACAAAGGATTCAAAACCTTTAAAATTACTGAAGTTTTTGAGGCGGAGTAGGGTG
+CTGTTATTCTATGACGCAGAAGTCTATCCCCACGATTGGCTCTTTGTCATAATCGAACCT
+GCCAGCCAGCAAAAACATGTGTTCATAAACGATGCCAGGGCACTGGCGTCGTTTTATGAA
+CAGCATACTGATCATATTTGGGTTGGCTACAACAACCGGCACTATGACCAGTACATTTTA
+AAGGGTATCCTTTGTGGTTTTGATCCCCATGAAATCTCCAAGTTCATTATAGCAGAAAAG
+AAACCAGGCTGGCAGTTTAGTTCCCTCTTAAACAGGATTAAGCTGAACCAATTTGATGTC
+ATGACCACCTTACACAGCCTAAAGGAACTGGAAGGCTTTATGGGGCATGATATCCGGGAA
+ACAACAGTTAGTTTTGATACCAACCGGAAACTTACAACACGGGAAATTGATGAGTTGGTT
+AGTTACTGCACCCATGATGTGCAAGAAACCATGGAAATATTCCTTCACCGGAAGGAAGAA
+TTTGATAGTCACGTAGCTTTATTAAAGACCTTTAACCTGCCGCTGAATTATCTGAGTAAA
+ACCAAGGCGCAACTGGCGGCTGTGATTTTAAGGGCCAATAGAATAAACCGAAACGATGAG
+TTTGATTTAGTTTTACCCGACACTTTAAGGATTAAAAAATACCGCCATGTGGTGGATTGG
+TACAAGGATGCCCATAACCACAACTATGATAATTTTCTACAGACTACTGTTAGTGGTGTA
+CCCCATATTTTTGCCTGGGGAGGGTTACACGGGGCTAGGGATCAGTACCAGGATGAAGGG
+ATTTTGGTCAATGTGGATGTGGCCTCTTTCTACCCTTCACTTATGCTGGAGTATGGTTTT
+TTATCCCGGAATGTGGAAGACCCCAAACTCTACCAAGAGATTTATCAAGAGCGGTTAAAA
+CTGAAAGCGGAGAAAAACCCCATGCAGCTGCCATATAAGATTGTCTTAAATGCCACCTAC
+GGGGCCATGAAATATCAGTACAACAACCTTTATGACCCCAGGCAGGCCAATAACGTCTGC
+GTAGGCGGGCAGCTGCTGCTCTTAGATTTAATCGAAAAGCTAGAGCCGAAGTGGACGCTG
+ATTCAATCGAACACGGATGGATTAATCGGAAAAATTAAACGCCTGCGGGACTTGGACACT
+ATTAAAGATATTTGCCGGGAGTGGGAAACCCGTACCCGGATGCAGCTGGAATTTGAACTG
+TTCCGGAAAATCTACCAAAAGGATGTCAATAATTACATCATCATCCGGGTAGACGGCAGC
+TATGAATCAAAGGGAGCATATGTCAAGAAATTAAACGAAATTGACAATGACCTGCCTATA
+GTAAACTCGGCCCTTAAAGAGTATTTCATTAACGGTGTACCGGTGGAAAAAACCATCAAC
+GATTGCCGGGAACTGATGATGTTCCAGAAGGTAGTGAAGGTCACCAATAAATTCTCCCAT
+GCTCTTTATGGCAGCCAAAGGTTATCGGAAAAATGCCTCAGGGTGTTTGCTTCCAAAAAC
+GATGATCCCGGTGTTTTTAAGGTCAAGATAAATGGACGACCCCATAAAATAGCCGGTACC
+CCGGAGCACTGTTTTATCATCAACAGTGATGTGCGGGGTAAAAGGATACCTAGAAGGCTG
+GATAAAGATTGGTATGTTCAGGTGGCTAAAAAGCGGTTAGCGGATTTTTTGGGAAAGGAT
+GATCTGAAATGATGACAGTGTTTAAAAATAAAGATTTCGGTGAAGTAAGAAGTATTTTAA
+TTAATCAAGAACCTTGGTTTGTTGGTAAAGATGTGGCGGAGATTTTGGCGTATAAGGAAC
+CCCATAAAGCCATTGCCCGACATGTGGATGAGGATGACGGGATGAAACATCCCATCAGCG
+ATAACTTAGGCAGGGTACAAGAAACACTGCTGATCAATGAAAGCGGCCTGTATGCTTTAA
+TAATATCTTCAAGGCTCCCCAGGGCGAAAGCATTTAAAAGATGGATCACCTCCGAGGTGT
+TGCCAACCCTTAGAAGAACCGGCGGTTATTCTATGCGCCCCAAAGGGCCAAGCCTAAGTG
+AGATTATACGATTTCTAAAGCTGATAAGAGACGTGATGGTTGCCCAAGGATGTAATGAAA
+GAGATATTGCTGTAACGGTAAACAACATCTGCCAGCAATTTCAGATCCAGCTTCCCACAG
+AATTCATCCGGCTATCAGATCTGGAAGTGAAGTTTATGCAGTTTCTTTACAGGGATGAGC
+TTGCCAGGCAAATGAGTAGCGGTGATGCCATAGCGGTGTTTTTAGGTAGGGAAATCAGCG
+ATATTAGCGAGGAAAGGTATCAACAGCTCAAAACCATTTACTGCGACATAGAAAAAAACT
+AACCCAGGAAGCGGGCGGACCTACCAAACTAAAATCATTTTATCGACTAGTGACATTAAA
+AACCGGTGCCAGTTTGGTAGGTTGCCTCCCAAATGAACATTAAAAACAATAAAACAGCCG
+GGGGAAATTATCCATACTGACTGTATGTTGGGACATTAACCATCGTTTAAGCAGAAAATA
+TGTCGGGAAACACTGCCAAAATGAACTGTAGGTCTTCCGGCTACCCCATGCTTTTGGGAT
+ATAAACATCCCATAAATATCAGGTTTTTTATGAAAGAGGTGATGACCATTTGGACATGGT
+TAAGGGTTATATCAAAACCAAAGGTAAAAAACCCATAGAACCTTACCGCAATAAAAAATC
+ATTTTACACCTATGACTATATCCGCAAAACGGGCGGCGACTTTGCTGGTATCCTGGCCGA
+TGGCATGGTGCAAATAGATCTTGATGATGAAAAAGAAGGGAAACTTGTCAAACAGATTGT
+CACAGAAACCGGCCTTAGAAGCGCAATTCTTAAAACCGATCGGGGCATCCACTTTTACTT
+TAGGAACACCGAGGTCAAGAAAAAACAAGTGAAGCTGATGACTCCCATCGGCGTCACCGT
+AGATGTGGCCGTGGGCGAGCAAAATGCACCGATACCGATAAAAGTAAACGGAAAAACCCG
+GCGCTGGCTCAATAAAATCGATGCCATAGAAGATATCGATTTCCTCCCAGATTGGTTGCA
+GCCGCTGAAGAAAAAACACAATTTACCGGACTTTAGTTCCTTAGCCGATGGCGATGGCCG
+AAACCAGGCACTTTTTAACTATATCCTTACCCTCCAGGCCGAGGGTTTTGGCAAGGAAGC
+CATCAAAGGCATTATTCAGATTATAAACCAGCATGTGCTAAAAACCCCTCTGGGGGATAA
+GGAAGTGGAGACTATTTTAAGGGATGAAGCCTTTTTAAAGCAGACCTTTTATATAAAATC
+AAAATTCCTCCACGACCGGTTCGCCAAGTATCTAAAAACCGAGGAGCGGATTATTAAAAT
+CAATAACCAGCTCCACATTTATCGAGACGGGGTTTACAAAAACGATGCCTTGGAAATAGA
+AACGGCCATGATTAAACACCTGCCGGAGCTGAATCGGGCTAAACGCTCGGAAACACTAAC
+TTATTTAGACCTTATAGCGGAAGACAAGGAACCGGCTTCAGCAAATTATATTGGGTTTAA
+CAACGGGATTTTAGATATTGACAGCATGACCATGCATGACTTTTCAGCGGACATCGTGCT
+GCAAAATAAAATTGAATATGATTACATTCCCGGTGTTTACGATCAAATAGTAGATAAAAC
+CTTGGATAAAATTTGCTGCCAGGACAATAACTTGAGGAAGCTGTTGGAGGAACTAGTTGG
+CTATCTGTTCTTTAGAAGAAACGAACTGGGCAAATGTTTTATTCTTACCGGGGGCGGCAG
+CAATGGCAAATCCACATTCCTGGATATGATTAAAAACCTACTGGGAAATAACAATTATTC
+ATCCCTGGGTATAGATGAACTTGGAGTGCGCTTTAAAACGGCGGAGTTGTTCCACAAACT
+TGCCAATGTTGGAGATGACATCAGCAAAAAGTATATGGACGATAGTGCTATTTTCAAGAA
+GTTGGTCACCGGCGAAACAGTTAACGCTGAGCGCAAAGGTAAAGACCCTTTTGAATTCAA
+CAATTATGCCAAGCTGCTTTTTAGTACAAATAAATTGCCTAGGATCAACGATACTTCCGT
+AGGACTTATGCGCAGGCTGGTGATTATCCCCTTTAATGCGGTATTTAGCGACAAGGACAC
+CGATTTTGATCCTTTTATCAAAGACAAGCTGCTAACAAAACCAGCCATGGAATATTTGCT
+GAAACTAGGGATAGAGGGTTTAACCCGTGTGTTGGCCAGTGGGTTTACCGAGGCTCAGGC
+GGCAAAAAGGGAGAAACGGGATTACGAAGTGGTGAATAACCCTGTTCTGGCTTTTGTTAA
+TGAAGGATTAAAAATCGAAAATGAGGCAATAAAGGACGTTTATCGAAAATATGGGACTTG
+GTGTTATGAAAACGGCCTAAAACCTCTTAGCCACATAGAGTTTGGACGGGAGCTAAGTAA
+AAATGGCTACCAATCAGAGGTAAAAAGAATTGGCGGGGAGACCGTTCGGATTTATGTGAA
+GGCCGCTACAGATGTAACAAATGGGCAAAATGATTTGTAACGGTTAAAAGTCAGTTAATC
+CAACAGTTAGGAAGGATGATACAGATGTTACAGATATTCGTTTATCTTTTATAAATAAGG
+GATAAGAAAGATTATAAATTATTTATATAAAAGAAGTATATATATATTTATTTATAATAT
+CTGTAACGCTGTAAAAATATCACATTTAACGACATTGTAATTTAAGTGAGGTGTTAAGTC
+TTGAAAAATATAGTTTTTATCTGCAGTCCCTTTGCCGGGGATGTGGCAGGAAACATAGAT
+AGGGCCAGGCGCTACGGGCGGTTTGCGGTAACGAAAAAAGTGATACCTATTATCCCCCAC
+CTGATGTATCCACAGTTCCTTGATGAGGATGACCCGGCGGAAAGACAACTGGGGATTGAA
+ATGGGACTGGCACTATTGTCACATTGCCGGGAAGTGTGGGTGTTTGGGAGCCGGGTGTCA
+TCGGGGATGGCGGCGGAGATAGATCAGGCCAAGGTGCTAGGGATTCCGGTTAAGTATTTT
+ACGGTGGATTGTAAACCAGTGGGAGGGTTGACCTATGGGATTTGATGCTGTAGACTGTTT
+TGCCCATAAACGAAATAGCTGCACAGCTTTAAAGGTTAAACAGTGTGAAGGCTGCAGTTT
+TTATAAAACCAAGGAGCAGTATGAACTGGGTCAGCAGAAGGCGTTGGAGAGGATTTACAC
+CTTGGATATAGCCAAACAGAAACATATTTCAGAAACCTATTATGGCGGCAAACTGGAGGT
+GATAGCTGATGAAGGCTAAAGAATATTTATCCCAAGCCATCAGGCTTGACCACAGAATAA
+GCAGCAAGCTGGAGCAATTGGAGAACTTAAAGGCCCTGGCCATGCGGGTAACCTCAAACC
+TGACCCAGGAAAAGGTATCCGGTGGTAGAAATATCAGAGGTCCTTTTGAAAACACCATGG
+CTAAGATTATTGATTTGGAAAAAGAAATTAACCAGGAGGTTGACCAGTTTATAGAACTCA
+AACAGGAAATCATGGGCACCATTTGCCGGGTGGAAGATGTGAATTGCCAGTTGGTGCTGG
+AGAAAAGATATATCAGCGGCAAGTCCTGGGGGGATATCTCTTTGGAGCTTGGGTATAGCA
+GGAGCGGGGGTTTTTAGAATCCACGGTGAAGGATTAAAAGAAATTAACGAAATACTAAAA
+AAGTGGACTAAAATGGACTAAAGTGGACTTAGCAAGTGTGGTATAGTGTAAGGTGTAAAG
+ATATAAAAACATATTCAAGAAAAGCCCCAGGATACTGTGGGCTTTAATTTTTTAGGAGAT
+GAAACCAAATGAGAACATGCGCCTATGAAGGTTGTCGGCATGAAATAAAACCCGGCAGCC
+CTTATTGTAAATATCATGCCAGGCTGATTGAAATAGAAAATAACAGTCCGAAGTGGCTCA
+ATGACATGATCCAGGAAATGCGGGACAAAATGAACAGCGAAAAATGCGTAAAGGCAAGCA
+TGGCACCAGGCGATCATCCAGTTAAAAGTGACTAAACAACCATATGCCACGGCTACTAAC
+GAAAATAATCTAAGCTCTGACAGCAACTTGCTCTCAGGGCTTTTTCTATGGAGGTGCCAT
+TATGAAATGCATATCCTGTCGCTTTGCCAGCACCGATAAATCCGCTAGCGATAAACACTG
+GACGGCTTATGAGTGTGGTAACCCAAAGAGCGAATACCATAAATCTTTAATTAACATATC
+CGAAGACGGCAATAAACATAAACGTATCTCCTGGTCCGGCTGCCAGCACGGTGAGAGGAA
+GGTGAAACCCAATGCCACGGAAACCACCAGCGCCATGCCGCCATCCCGGTTGCCCGGAGC
+TAACGGAAGCCAGGTTCTGTCCCAAACACATGCAGGAATACAACCGGCAGTACAACCGGA
+AGGAAAGACCCAAGTATTCCAAACAGCTTTACAACAGTGCCCGGTGGCAGCGGTTAAGAA
+AGAAAGTTCTACTGGAGCATCCCCTCTGTGTAGAGTGTGAACGCCAGGGCAGGATTACTC
+CGGCAACAATAGTTGATCACGTAAAACCCCACAAAGGTAATCTGAATCTGTTTTGGGATG
+AGAACAATTTACAAGCTCTTTGTAAAAATTGTCATGACAGCAAGACCACAAAGGAAGGCC
+GCTGGGGTGATAAGAATAGGGTTTACAGTTATTAGGCAGTCTGGCAGCAGTAGAAAAAAA
+AAGCGACTTTATCCTGCTTAGAATAAATCGCTGTGGGTTCCCGTCCTGGTTAAAGATAGG
+GTCAGGATATCCTTTTCAATTTTGTATATAAGCAGCCAGTCAGGAGTAATGTGGCATTCA
+CGGTGACCACCGTAATTACCGGAAAGCGGGTGGTCAAGATATTTTTGAGGAAGTGGTTTC
+TCCTGGACAAGAATATTTAACACTTCCTCCAGCAGTTTTACATCATAGCCCCGTTTAACA
+ATAGCTTTGTAGTCCTTTTTAAAGCGGCTGGAGTATCTAATTTTCAGCATTTAGATCCTC
+CATCAAGGCATCTACGCTGTCAAAGGTTTTGCTCATATTGCGGTTGTTATTAACATCATC
+AATTGCGGCCCGTGTTTCCTCATTGGGTGTGTCAAGGCGAAGGTCAAAAGGAATGCCGCC
+GTAACGAACGGAGTAACGCAAAAACATATTCATAGCAGTGGACATGTTGAGGCCAAGCTC
+GTTAAAGATAGCCTCAGCTTTACGCTTTAATTCCTTATCGACACGAACATTTATATTGGT
+TGTACCGGCCATAATATCAACTCCTTTCTATACTTATATTGTAAAACATTGTACGCAATT
+TATCAATAAATAATACCATAATGTTTTACTTTGTAATGGAAGGTCATTCTCATGGAGGGG
+GTAGTAAATCGCTGAAAACGGGAGCAAAACGGAGCGGGCGCGGGCCTTCGCGTGGGAATT
+CGCAAAATTCCAGATGGGGGTTGTCAAGGTCTAATGCTTGACATGGCACGAAATACAGCG
+ATTTTAAGCAGGTTAAGAAGGAGGTGGCCCTTTTGGAGATTAAACGCATTCCACTGAAAC
+AGATTAACCCGGCCAAATACAATCCTCGTAAGGATTTAAAGCCTGGAGATCCGGAATACG
+AGAAATTAAAGAAATCTATTGACGAATTTGACCTGGTGGAACCTTTGGTGATGAACAAGC
+GGGGCAACATGCTCATCTCTGGCCACCAACGACTAAAAATTTTACTGGAGCGGGGAGATA
+CCGAAACGGAAGTGTCCGTGGTTGATTTGCCACCTGACCGTGAAAGGGCCTTAAACATTA
+CCCTTAATAAAATCGCCGGTCAATGGGATCTGCCCAAACTGAGCGAGCTGCTCAAGAACT
+TGGATGATGACTTAAAAGATATTACCGGCTTTGATGCCGAGGAAATAGATGAATTGCTGG
+GCTTTAAAGAAGAAGTCCAGGAGGATAACTTTGACGAGGAAGCACCGGAGCGGCCCATCA
+CTAAACCAGGGGACATCTGGCTTTTGGGCAATCACCGGCTGCTTTGTGGGGACAGCACCA
+ACCCAGCTGATGTAGAAAGACTAATGCACGGTGCCAAAGCCAACTGCGTTATTACCTCCC
+CGCCCTACGCCATGCAGCGCAAGGACGACTACGGCGGGATACCGGCAGAGGAATATCCGG
+GCTGGTTTTTTCATGTGGCCAGTAACGTTTACCGGATACTTGACGACAGCGGCTCCTTCT
+TCGTCAACATCAAGGAGCACGTTGAGGGCGGCCAGCGTTCCCTTTACGTGATGAAAACCA
+TCATTGCTTTGGTGGAAGGTGGCTGGCGGTATGTGGATCAGCTAATCTGGACGAAGCCAG
+GGCTGCCCGGTGGCTGGTCTAATCGCCTGAGAAACGACTTTGAGCCGGTGCACTTCTTCA
+CCAAGAAGGAACAGATCGACTGGATGGTGCAGCTGGTAGAGGTTGATGAGGACAGATTGG
+CAACATTACCGGCGGACCTGGTGGAAATGTACGAGGACATTTTCCACTTCACCAAAGCTA
+AGAAAATTAAATTCAAACCCAGGGCGGTAGGCAGTGAATCAGATGCCATCCGGGTCTACA
+GCAAAACCAATAAAACCAAAGGCGACTCCGGTAATATCAGCGTCAGCGGCAAATTCAAAA
+AGGGCATCGCTAGGCCAGGGAATGTGCTATCATTACCCGGCAACCAAAGTTCCGTAAAAC
+ACTCAGCCGCATTTCCAGTGAAGCTCCCGGCCTTTTTCATCAAGCTCGCTACTGATGTGG
+GGGATAACGTTTACGAACCCTTCAGCGGCTCTGGCACCACCATCATGGCCGCTGAGCAGC
+TGGGACGGAATTGCTATGCCATGGAATTGTCCCCAGGGTATTGTGATTTGGCCGTGAAAC
+GCTGGGAGCAGCTTACCAGGGAGAAGGCAGTAAGGCAGGAGGTGTAAAGATTGGAGATAC
+AAAGACTACCGCTGGAGAAATTAAATCCGGCTAAATATAACCCACGGAAAGACTTAAAGC
+CCGGAGATCCGGAATACGAAAAACTGAAAAAATCCATAGAGACCTTTGGCTATGTGGAGC
+CCATCGTGTGGAATAAACGCACTGGTCAGATCGTAGGGGGCCACCAGAGATTTAAAGTTT
+TACAGCACCAAGGGGAAACCGAGATTGAGTGTGTAGTAGTGGATCTGGATGAGCAACGGG
+AAAAGGCCCTGAACATAACGCTTAATAAAGTCACTGGTGAATGGGACCTGCCTAAACTGG
+CCGACTTAATCAGCGAACTGGATAACGGAATATTTGATATTTCCCTAACCGGCTTTGATG
+CCGCTGAGATAGAGGATTTATTTTCCAAAGTCCACGACAAGGATGTTAAAGAAGACGACT
+TCGATGTGGACGGAGCTTTGAAGGAACCGGTTATCAGTAAACCCGGTGACTTGTGGCTGC
+TGGGAAGGCACCGGCTCCTTTGTGGAGATAGCACTAAAGCGCAAACGTATGAAAAACTAA
+TGGACGGCAAAAAGGCCAATCTCATAGTCAGTGACTTGCCTTATAACGTGGACTACGAAG
+GAACGGCAGGGAAAATTAAAAACGATAATATGGGAGACAGGGAATTTTACGAATTTCTCC
+TAAAGGCCGCCACAAATATGTATGAAAATGTTGTAGACGGTGGCGTTGTCTATATTTTTC
+ATGCAGACAGGGAAACCGTTAATTTTAGAACCGCCTTTAGGGACGCTGGCTTCTTTTGTC
+ACCAAACCTGCATTTGGGTGAAAAACGCACCGGTGCTTAGTAGATGCGACTATTTATACG
+CTCATGAACCCATTTTATATCTATGGAAGCCCACAGCAGGCCATAAGTTTTACGGTGATA
+GAAAACATAGGACGGTATGGAATTTTGACCGGCCAGCCAAATCAAAACTCCATCCAACTA
+CGAAGCCAGTGGCTCTGTGTGCTTACCCTATCCAAAACAGCAGTGCTCCCAATGGCATCG
+TGCTCGACCCCTTCTCCGGCAGCTTTTCTACCGGCATTGCTTGCGAACAGCTGGATCGTA
+TTTGCTATGCTACCGAGTTGGAGGAACGCTTCGTAGATGTAGGAGTGAAAAGATACATTG
+AGCATATCGGCTCCGATAGTGATGTCTACTTAATCCGGGATGGACAGAAAATTAGATACG
+CTGACCTGCTATAAATCCCTTGCTATTCCTGTGGTTTTAAGTGATGTATAGACATACCAA
+AAACCACAGGAGGGGACCCAAGATGACCAGAAAAGAGCTTGTACACAAGCTGGCTGAGCA
+TTTAGGAATACGACCTGTCTATTTAGCTGCCCCCAGCTTTGCTTATCAAGTTGGCGAATA
+TACCGTTAACCGACAAGGCAATATCCTTGACAGCGAGGGTCAGGTGCTGGAACTGGAGGC
+GCTGCTGGCAGGCGGGAAGGAGGAACCGGAGTTGGAGATCATAACTGAGCAAAAGGAAAC
+TGCGGAAGCGAACACTTCTGTCGAAACAAAACCCACTGCTTTGGAAGTAGGGATACCTTT
+GGAAGGCTACGATGGCCGGAGTTTGCGGAACCTGCTCCACATGATTTACAGTAAGCAGCC
+GTTAATTAAAAAAGCATTAAACCTTGATGCAGATTTGGTGAGCGAGGAAGTAATAACTGC
+TTTAAACCAGCAGCCCATGACAACTCTGGAGCATTTCCAAAATGCACTGGAAGGTAAAAG
+CTGCCCCGGCATCGACTTTGATTTCAACAAGGGAACCATCACCTTCAAGCTAGGGCAAGG
+TGGAGACGACCCGGAGAAGGTAGAAGCGGCCACTCAATTGTTAGCCTTGGTGAACCTTAG
+CGCCAGGCGCTCCAAGCTAAACATTTCTGCCAAGGTCAAAGCCACCGATAATGAAAAATA
+CACATTTAGAACTTGGCTCCTGCGCTTAGGGATGATAGGCGATGACTACAGGCTAGCCCG
+CCGGGTTCTTTTGCAAAACCTCCCCGGTAACAGCGCTTTTAGAAAACAAGTCCAGGAGGG
+AGCGTAAATGACCAAACCAAGATGCAAATTGGTCGGTGAAAACGGCAACATCTTTAACCT
+AATGGGCATCGCCAGCCGCACTCTTAAAGATGCCGGGCTGGAGGAACAAGCGGCAGAAAT
+GCGAGAGAGGATTTTTAAGTCCGAAAGCTACGACAGAGCACTGCAGATAATCATGGAATA
+TGTGGATGCGGAATAAGGCTGGGGCATAAGCACCGGTCTTTTCTCTAGCTAAACAACCGC
+CTAAATATTAACTTTTAAGGAAAATAACCCTTGCTATTATGTGTGTTTAGAGTGATATAT
+AGACTACCAAAAACACACAGGGGGTTTTCCGAACATGAAAAACTTAACCTTTGGGATAGA
+AATTGAACTCACCGGGATTAGCAGGGAAGCAGCTGCCAAAGCAGTGGCGGGATACTTCGG
+CACCAGCGCCCACTACCTTGGCGGCGGCTACGACAAATGGGAAGCGCCGGACAACCAAGG
+CCGCAGCTGGTTTATTATGAACGACAGCAGCATCAGGCCGGAAACCAAGCGGCAAGGCAA
+AAGAATCGCAGCGGGATTGGACCACCGGTTGGAGCTGGTTTCCCCCATCTGCACCTACAG
+CGACATCGAAACGGTGCAGGAGATTATCAGAGCCTTAAGAAAAGCCGGAGCCTTCTGCAA
+CCGCAGTTGTGGGCTGCACGTCCATGTTGGCAAAGAAAGATTCACCGCCAAAACTTTACG
+GAATCTGGTCAACATTGTGGCCAGCAAAGAGGACTTGATTTACCAAGCTCTGCAGGTGGA
+CGAGCAGCGGAAACGCCGGTACTGCCAAAAGGTAAAGGAGAGCTTTTTGGAAGAACTGAA
+CCGGCGAAAGCCAACGGAGCTGGAGCAGCTGGCCGACCTTTGGTACCAGGGTTACAGCGG
+CAGCCGCAGCCAACATTACCACAGCAGCCGCTACCACGGGTTAAACTTACATGCTACTTT
+CAACGGCCCCACGGTGGAGTTTAGGCTTTTCAACGGAACCACCCACGCCGGGAAAGTCAA
+AGCCTACATACAGTTTTGCTTGGCGGTAAGTTACCAGGCTTTAAGCCAAAAGAACGCCAG
+CGCCAAGAAGACTGAGACCTCAAACCCCAAGTACACTTTTAGAACCTGGCTTTTGAGACT
+AGGCCTTATTGGCAAAGAATTTGAAACCGCCAGGCTTCACCTTTTAAAGAACCTGGAAGG
+CGACAGCGCCTTTAGAAACGGCAGACAGGTGGCTGGGCTTTAAAGCCCGGCTTCCCTTTC
+TGACAAATAGATGTTAATATGTGGGAAAAAGGGTGGTGAAGGCATGTATCTACGGGTAAT
+GACTTTGGATGGCAAACGGGTCAGTGTGGCCAAAGATGAACTGGGAGTGTTTGAGGAACT
+AAAGAGCTTTGCTTTTGTCCCCCACACCATGACTGTGGAAGAGTATATTAATTCCATGGT
+GCATAGCGCCTGGACCTTTTACGGCAAAGGTGTGCATGTCACCGGAGATACCCTGGCAGA
+GAAGGCTAAAAGTGCCTACCGTCAATTCGTGGACTATGGCTTTCTGATTGAAATCACCAA
+GGAAGAAGCCCTGGAGCATTTTGGCCTCACCCAAGCTGATGCAGACAAGATGAACATTCC
+GGGCCTTAGAAGTAACGAATAACGCCCGGTTTAAATAAAAAATACTTGCAAAACCCCTGT
+TTTTGAGTGATAGATAGGTTTACACCATTTAGCCCAAAAAGGGGGTTTTTTGTATGTACT
+ACTTTGCCTACGGCAGCAACCTGAACAAGGAACAGATGATGAGCCGCTGCCCGGATGCAA
+TACCGGTGGCCAGGGTAAAACTGCATGGCTACCAACTGACTTTTAACCGGGTGGCGGATA
+TCGTGGAAGAAGAACAGGCAATTACCTGGGGTGCCATTTACACCGTTTCGTCGGAAGATA
+TTAAAAAACTTGACCGCTATGAAGGCTATCCCCGCCTTTATAACAAAATGCCGGTAACGA
+TAGAGGACGACCGGGGAAACATTTACCAGGCCTTTGCTTATGTGCTGACCATCAAGGGTT
+TAAACGAACCCAGCGATGGCTACTATCACATCATTGAACAAGGCTACCGGGACTGGGGGC
+TGCCCCAAAAACCGCTGCGGGAGGCTTTAAAACGAAGCCTTTTGAGCGCCCCTGTGGGCC
+TTTAGCGTTGGGTTATAGCGGCTACATGGTTGGGGAGCAGTGACTAAGGCCAAAACAGGG
+GGCGATTCGATTGGATAAATTCTTTTCCCAAAGGCACTGCGATCGGTGCGGCGGGGATTT
+AAAGGGTGGCCGGACAATGTCCGCCTTTAATTTGGATTGCATCTGCATGGATTGCAAGGC
+CAAAGAAAAACAGGATAAGGATTACGACAAGGCGGTAAAGGCCGATATTGATGAGATAAA
+GAAGGGGAATTACAACTTTCCGGGTATTAGGAAATAAAAAACAAAAGGGCCAAGTGAGGC
+TCCTTTTTCAATTGGAGGTGAAAAGCTATGGCGACACGGGGAAGAAAACCAAAACCAACA
+GCTCTTAAAGTCCTGGAAGGAAACCCCGGCAAAAGGCCATTAAATGAAAACGAACCCAAG
+CCTGAAAACAAGGCACCCCGCTGCCCGTCATGGCTGGAGCAAGAGGCCAAAAATGAATGG
+AGGCGGATGAGTAAAACCTTAGAAGCTATGGGGCTTTTAACTCTGGTGGATAAAGCTGCC
+TTTGCCGGGTACTGTCAGGCCTACGCCCGGTGGAAAGAAGCCGAGGAGTTTTTAAGCAAA
+CACGGCACCATCTTTAAAACCCCATCCGGGTACATTCAGCAGGTGCCGCAAGTCTCCATC
+GCCCAAACTTACCTGAAGGTGATGAAAGATTTCTGCTCTGAGTTTGGGCTAACACCGGCG
+GCCAGGACGAGGATTAGTGTTGACACTGAAGCAGTAAACACGGACGATCCCATGGAAAAG
+CTGTTAAAAGTAACGAAGTAGGAGGTTTTTTTAATCGGAGGTGATGCCCTTGCTCTACAG
+CGAAGAAAAGGTAAATCACGTTGTCGATTTTATCCGGCAACTAAAACACACCAAAGGTAA
+ATGGGCAGGACAGCCTTTTGAATTAATTCCATGGGAACTTGATTTAATAAAACAAACCTT
+TGGCACCTTAAGGGAAGACGGCACCCGGCAGTACAGAACCGTGTATACAGAAATTGGAAA
+GAAAAATGGGAAATCCTCGATCGCCGCTGCCATTGCCCTGTATATGCTCTTAGCCGATGG
+GGAGCCAAACGCCGAGGTCTATGTAGCCGCTTGCGACCGGCAACAGGCCAGTATAATTTT
+CAATACCAGTGTTAATTTCGTGGAGGGTAATCAGACCCTTTCGAGGGTGACTAAAACCAT
+CATGTCCACCAAAAGAATTGTCTACCCTAGAACCGGTAGTTTTTATCAGGTGTTAAGTTC
+AGATGTAAAATCCAAGTCAGGACTTAACCCATCTTGCGTTATCCTCGATGAAATCTGGAC
+TTATCCAAACCCTGACCTGGCCAAGATGTTGACCACTGGTTCCGGTGATGCCAGGGAGCA
+GCCCCTGTTTATCTATTTAACCACGGCGGGTAACAAGCTGCAGGGCTACGGCTGGGAGAT
+GCATTGCAAGGCCAAGGATATTTTAGCCGGAAGAAGAATTGACCCCACTTTCCTGCCTAT
+CATTTATGGTCTGGAGGAAGATGACGATTGGGAAGATGAAGCCAACTGGTATAAAGCCAA
+CCCAAGCCTGGGCCATACCATTCAAATAGAGCGGGTCAGAGAACATTTCTTGCAAGCCAA
+ACAAGACCCGGCGGAGGAAGCACTTTTTAAACAGCTGCGACTAAATATGTGGCTGAAACA
+ACAGATCAAGTGGATGCCCATGGATACCTGGGCTAAATGCGCTCACCCGGTAGACCCGGA
+TATGCTCAAAGGTAGGGTTTGTTTCGGCGGGCTAGACTTATCCAGTTCCACTGACATCAC
+CGCCTTTGTGCTGGTGTTTTCACCGGTGGCTGGGGACGACAAGTATTACGTTCTCCCCTA
+CTTTTGGCTGCCGGAGGAAACCTTAGATTTACGGGTGCGCAGGGATCATGTGCCCTACGA
+CATCTGGCAGCGGCAAGGATACCTGTTAACCACCGAAGGCAATGTCATCCACTACGGTTT
+TATTGAAAAATTTATCGAAGAGCTGGGCCAGGATTACAACATCCAGGAGATTGCCTTTGA
+CCGCTGGGGTGCTGTGCAGATGGTGCAGAACCTGGAGGGTGCCGGATTTACCGTGGTTCC
+CTTCGGCCAGGGCTTTAAAGATATGTCCCCACCCACCAAAGAACTGATGAAACTGACCCT
+GGAGAGAAGAATTGCCCACGGTGGCCACCCGGTGCTGGCCTGGATGATGGATAACATCCA
+TATCCGTACCGACCCTGCCGGTAATATCAAGCCGGACAAGGCCAAATCAACAGAGAAAAT
+TGACGGTGCAGTGGCTATGATTATGGCGCTAGACCGATGCATTCGGAATGAAGGAGTGAG
+CAAAGACAAATCGGTGTATGATGAACGGGGTTTAGTGGTGTTTTAAGTCTGCGAATATAT
+TGCATATCGCAATACAAAATGGTAAAATATAAATACCAAGAAGGAGGCGATATGTGTGTC
+GAAAACTACAAGTATTTTTGCTCGTGTTGAGCCGGAAATAAAAGAACAAGCAGAAATGGT
+GTTAAATAAACTTGGCATACCTATGTCAAATGCTATTAATATTTTTTTAAGACAGGTTGT
+TTTGCAAAACGGGCTACCATTTGAAGTTAAAATTACACACAATAAACCTCTTGCAGTTAA
+GGATTTAACACCTGAAGATTTTAACAATGAAATTGAAAAAGGGTTTAATGATTTAAGGGC
+AGGCAGAGTTGTGCCTGCAGATAAGGTAGCCGAGCGAATCAATAGGGAATATGGGCATGA
+GTTATAGAATTATTTATACCGAAGAAGCGGAGCAGGATCTTATAAATGTTTACAGGTATA
+TTGCAATGGATTTATTAGTGCCAGAAATTGCGAAAAAGCAAATCGATAGAATCATGAATG
+CAATTAAAGGCCTGGATGAAATGCCCCTCAGGCATAAACTCTACCAAGACGAACCATGGC
+ACAGTAAGGGTTTGAGAGTTCTTCCAGTAGACAACTACCTCGTATTTTATATAGTAATTG
+AAGAAGAGATAGTTGCAATAGTAAGAATAATGTATGGTGGACGTAATATAGAATTGCAAT
+TGTCAAACACAAAAATTGGTGATTAAATATTAAAATCCACAATGGCATCTCAATTGAGGT
+GCTTTTTTCATGCCCAATATTAAGGAGGTGTGGCCTCTAACATGAAAATACCCATCTTAT
+CCAAGCTGTTTAAACCCAGGGCCAGTCCCAAGAACACCTTCTGGCAAAACGCCTACACCT
+TTTTCTTCGGCCCTACGCCCAGCGGCAAAACCGTCAACGAGCGCACGGCCATGACCACCT
+CAGCTGTATATGCCTGTGTGCGGGTATTGTCAGAAACCATCGCTTCACTGCCTCTGCACA
+CATACAGGCGCACCGAGCGGGGCAAGGGAAAAGCCATGGACCATAACCTCTACTACCTAC
+TCCATGACGAACCTAACCCGGAGATGACCTCATTTGTGTTCAGGGAAACACTTATGGGTC
+ATCTTTTACTTTGGGGCAACGCCTATGCCCAGATTATTCGGGACGGCAGGAGCAGGGTGA
+TTGGTCTTTATCCTTTATTGCCCGATCGCATGGAGGTAAGCCGCACAGAAAAAGGCGAGC
+TCTACTACCGCTATCAAAAGGAAGGCCGAGAATATTTGTTGCGCCGTGAAGAAGTGCTGC
+ACATTCCGGGTCTTAGCTTTGACGGCTTGGTGGGCTACTCCCCCATCGCCATGGCCAAAA
+ACGCCATCGGTATGGCCCTGGCCACCGAAGAATACGGTTCCAAGCTTTTTGCCAACGATG
+CCCGGCCCAGTGTGGTCTTAGAACACCCGGGTGTACTGAAAGACCCGGCTAAAATCAGAG
+AGAGCTGGAACCAAATCTACCGGGGCAGCGAAAACGCCCATAAGGTAGCGGTACTGGAAG
+AAGGAATGCAGGTAAAAACCTTAAGCATTCCCCCGGAACAGGCCCAGTTTTTAGAAACCC
+GCAAGTTCCAGATTGAGGAAATCTGCCGCATTTTCCGGGTACCACCCCATTTGGTGGCCA
+GCCTGGACCGGGCTACTTTCAGCAATATAGAAAGCCAAAGTATTAGTTTTATTGACAACA
+CCATTGTTCCTTGGGTTTCTCGCTTTGAACAAGCCATGCAAAAGGCTCTGTTTTCAGTTA
+GAGAAAAACAGCAATATTTAATCAAATTTAATTTGAACGGTAGGTTGCGTGGAGACGCCC
+AATCCCGTGCTGCTTATTATCAAACCATGCGGCAAAACGGCATTATGTCAGCGAATGACA
+TCCGAGAGCTAGAAGAGATGAACTTAATTCCGGATAAATTAGGCGGAAATAAATATTTAG
+TCAACGGAAATTTTGTAGATATGGCTGATGCCGGGGCTTGGAGTGAAAAATATGGAAAGG
+AGGCTACCGATGCATAGGTTTTGGAACTTCGAAGAAACAGATACCGACCGAATCCTCTAC
+CTGGACGGCTACATTGCCCCGGAGAGCTGGTTCGAGGATGAAATAAGCCCCAAAGAATTT
+AAAAATGAGTTAGAAGCAGGAATCGGTAACATCACCGTCTGGGTTAATTCTCCAGGGGGT
+GATTTTTTTGCCGCCAGTCAAATTTACACCATGCTCAAAGAATACAGCGGCCAGGTGCTG
+GTCAAGATTGATGGCATTGCCGCCAGTGCCGCAGCGGTGATTGCCATGGCCGGAGACAGG
+GTACTCATGTCCCCCACAGCCATGCTCATGATCCATAATCCGTCCACTTTTGTTTGGGGC
+GAAGAATCTGATATGCAAAAGGGCATTGAGATGCTCTCCGAAGTTAAGGAAGCCATCATT
+AACGCCTTTGAAGCCAAGACGGGATTGCCAAGAAAACAGATCGCTCAAATGATGGATGCC
+GAAACCTGGTTCAGTGCTAATAAAGCGGTGGATCTTGGTTTTGCTGATGAAATACTCTAT
+AGCGAACCGCCACCTCAGGTCACTGACTTCATGTTTGACCGGGTAACGGTAGTCAATGCA
+CTGATGCGGAAACTACCGGCGGTTAAAGCTCAATCTAAACCGGTAATCAATGAACCTTTG
+AACAGCAGTGGGGTTTCATACGAACAGCTAATCAAACGGCTGGAATTAATAAAAGGGAGG
+TAATATACCATGAGTAAAATTATTGAACTGCGGGAAAAGCGGGCTAAAGTGTGGGAGCAG
+GCCAAGGCCTTCCTGGATGAAAAGCGGGGAGAGAACGGCTTACTATCGGCTGAGGATACC
+GCCACTTATGAGAAGATGGAAGCGGAAGTGGTCAATTTAGGCAAGGAAGTTGAGCGCCTT
+GAGCGCCAGGCCACTATTGATCTTGAACTATCCAAGGCTACTAGCACAGCATTAAAAACT
+ATTCCTGGTGATGGTCCTAAAGGCCGGGCTTCCAATGAATACGATAAGGCCTTCTGGCAG
+TATATGCGCAACCGCAATAGCTATGAGGCCAGAAACGCTTTAACCATTGGCGGTGACGGC
+ACCGAAGGCGGGTATTTAGTTCCGGATGAGTTTGAACGTACCTTGATTGAAGCCCTGGAA
+GAAGAAAACATCATGCGCACCCTGGCTAAAGTAATTACCACCTCTACGGGAGATAGGAAA
+ATCCCAGTGGTAGCTTCCAAGGGTGTGGCTACCTGGGTAGATGAAGAAGGGCCGTACCAG
+GATAAAGATGATGCTTTTGACCAGGTATCCATTGGGGCCTACAAGGTGGCCACCATGATT
+AAGGTTTCCGAAGAACTATTAAACGACAGCGTCTTTAACCTGGAAAGCTACATTGCTAAA
+GAATTCGCTCGCCGCATTGGGGCCAAGGAAGAAGAAGCCTTTTTAATCGGGGATGGTGAG
+GGGAAACCCACCGGCATCTTTGACAATGACAGTGGCGGGGAGATTGGAGCAACCACTGCC
+GGGGCTACTCTTAAAGCGGATGAGGTTTTCGACCTCTTTTATTCCCTAAAAGCCCCCTAC
+CGCAAGAAGACTGTCTTTATCATGAACGATGCCACGGTGAAGGAAATCAGGAAACTAAAA
+GACGGTAACGGTGTGTACCTGTGGCAGCGTGCGACACGTTCGTAATTGAAAAGATTACGC
+ACTGCAACCAGTAGGTTGCGGGAGAACTGACAGTTCGATAGGTAAAATGATGGAGTAACG
+CCCTGAAGTACCTACCCTAATACTCCGAATGGCGTCGAGGTTATTAAGAACGGAACGGCG
+TCATGAGCTCGGTGAAGACGGCTGAGAGCACACCCTAACAGGTCAAGCTGAGGAAAACCG
+AACAATAAAAACGTCGAGTGTGTGATAGGCCGGGGGTCTACAAAACACCTATGGTCAGAA
+TATCCATCCCTAAACCGATGGATGACGAATTCTCGAAGGTAAGGGTCTAGAACAGGATTT
+AGTCGAAAGGCTAGAAATTGCCTACAGTGCAAGGTTTGTGAGGACGAGTAAGAATGTTGC
+CTATGAAAATCCTTATGCCATTACAGGTGGCATCCAGCAAACAGGCCCAGAGAGAAGACC
+TAAGGGTGTATGAATAGATAGAACTATCGGAACGTGGAAAGTGTGCAACGTGGAGGGCTT
+AATCCCTAGGAAGCGTTAGTGAGGAAACCCCACGGGATAACTTACTTTCATGCACATGAG
+AGCAGTGGCACAGTACCTAGGAAACCGTGATAATAAACGGTGGAGGGATAGCCACAAGTC
+AGTACTATCACCACAAATCTCACTTATTACAGCATAAGGTTCGAGTATGACTAAGAGAGG
+CGAAATTCCCAAGAGGGGATGATAAGCCGACTTATGACGACCAAGAGACTTAAGAAGAGG
+CAAAAACTTAGAAACAACGAGTACTACGACATCCAAGAGAAGTTTGATGACCTTTATCGA
+CGCTCGAAGCAAGGTTCGACATTCAACAATCTCGTTGAACTAATAGCCAGTGACCAAAAT
+ATCTTACTCGCATATAGGAACATCAAGAAGAACAAGGGTAGCAAAACCAGAGGTTCCAAC
+CGCACCACAATTATCGACATAGGCAAAACGAATCCTGACAGACTGCTACAGTATGTCAAG
+AACAGGCTTCAGAATTACTCGCCACAGCCGATAAGGCGGAAGGAGATAGAAAAAGAAGAT
+GGTAGGATGCGACCGCTTGGTATTCCAACTATAGAAGACCGCCTAATACAGCAGTGTATC
+AAGCAGGTATTAGAACCCATTTGTGAGGCAAAATTCTATGAGCACAGCTACGGCTTCAGA
+CCCAACAGGGGGACACACCACGCAATAGCGAGAGTGAACTTCCTAGCATATAAGTCTAAG
+CTACAATACGTAGTCGATATAGATATCAAAGGATTTTTTGACAACGTAGACCATGCCAAG
+CTCATGAAGCAGATGTGGAGTATAGGAATTCAAGACAAGAATTTGCTTTGCATTATTTCT
+AAGATGCTCAAAGCAGAAATTAAGGGAATTGGAATTCCAACCAGAGGAACACCCCAGGGG
+GGGATTCTTAGTCCACTGCTTTCGAATATTGTCCTAAACGAATTGGATTGGTGGATAGCT
+AGCCAATGGGAAACTATGCCGACGAAGCACCAATATGCGAGCAAGAGCAAGAGGGTTCGT
+GCCCTCAAGACAGCAGGATTAAAGGAAGTCTACATCGTGAGGTATGCGGATGACTTCAAA
+CTGCTATGCAGGACTAGGAAAGAAGCTGAAAAGTTGTTCTGCGCAGTTAAAAAATGGCTA
+AACGAGAGATTAAAGTTGGAGATAAGCCCGGAGAAATCAAAGATAGTGAATCTAAAGAGA
+CACTATTCTGATTTTCTTGGGGTGAGGATTAAGCTTCAGGAGAAAGGGCAACAACAAGTC
+ACAACCTCCCGAATGACAGAGAGATCGGTTCGGAAGAGTAAGGACAAGTTGAAGAACTGT
+GTTGACACTCTGCAGAGGCAGCCCACCGTAGACAACATGCAGAAACTTAATGCCTGTATA
+TTAGGCCTGCATAATTACTACTGTGTGGCAACAAACGTAAGCAGAGATTTCGACAAAATC
+GCCTTTCATGTCGACGCGAACCTTAGAAATACGAGGTCTATGACAACTCGACGAGGACAA
+CTAACCAAAGCTTTTACCCAGTTTTATGGGCATTATACTGGGCGCCCGAAGTTTATAATG
+GGCATACCCCTATTCCCCATACACTTGGTAAAGTTCAAGCCACCTCCATATTTTAACCAG
+GACAAGTGCAATTACACGCTAGAAGGGCGGAATATGATACACAAACCTCTTCAAGCCATT
+GACACATCGGTATTGCGCTATCTCATGGAGCACCCTGTGGAACAGGAAAGCACAGAGTAC
+AACGATAATAGAATATCCTTGTACGTGAGCCAACGGGGTAAATGTTTCATCACTGGCTTA
+GAGCTTACGACATTCACCGCAGAGGCTCACCGCAAAACCCCAAAAGGGAACGGCGGAACC
+GACGAATATGGAAACTTGGTTATTGTAGTCCCGGAAGTGCATAGGCTGATACATGCCTTG
+GACGAGGAGACTGTTCAGAAATGTCTGTTAGCACTGACGAACAGCAATATAAATTATAAA
+CGCCTCAATCAACTAAGGAAAATGGTTGGAAATAGTGAAATTTGTGTGGGGTAGTTATTG
+ATGGAGCGCCGTATGAGGGGAAACTCTCACGTACGGTGCGGAACGGGGGAAAAGGCAGAG
+ATGATTTCAAAGCCTTACCTATCGTTATCCTCCCTCACTGCAGGCGACCCGAACACTTTG
+TTAAACCGTCCCGTCAAGACCTCGGCTTATGTGCCCACCATTGCCGCCGGGAAAAAAGTG
+ATCGCCTTCGGTGATATGGGCTACTACTGGATTGCTGACCGTCAGGGAAGGATTTTCCAA
+AGGCTGAACGAACTCTATGCCGCCACCGGTCAAGTAGGGTTTAGGGCAGCGCAGCGGGTG
+GATGGCAAGCTGATCCTTAAAGAAGCCATTAAAATTCTCAAGGTGAAAGCGTAGGTGATG
+GTAGATGAGTAATGTTAAAAACTATCACGAACAAGGCGGGCAGAAATGGGTGGTGGGTGG
+CCAGCTGGAGATTACAGCTGGTGGTAAGCTCACCTTCAAGGGAACCGAACTAAAACCAGC
+ACTAGGCCAAACTAACAGTGAAGCCAGCACTGTTGCCGCTCTAAAAGAGGATTTCAACTC
+CCTCTTGGGGCGGCTTTTTGCTGCCGGTCTGATGGTGGTGGATAAATCAGCACTTGAAGC
+GGCCATCACCGCAGCTTTGGAACTTTTAGATAGTGCAGTGGTTGGCGAGGATGTTGGGGA
+ATATCCGCAAGCTGCCTACGATACTTTTGAGAGCGCCATTGAAGCTGCCCTAGGTGTGGT
+GGATGATACAGGTGCTACCCAAAACGAAGTTAGTACTGCGCTTGCAGCATTAACAACTGC
+GGTATCCACCTTTGAAGCAGCAGTAATCACTGTAGATAAATCTGTTCTTCGAGCGGCTAT
+TGCTGCCGCTCAAGATATACTGGATGGTGCTCAGGTGGGCTCCGAGCCTGGCCAATATCC
+GCAAGAGGCTGTTACTGCTTTTGAAACTGCCATTGGTGCAGCACAGGCAGTAGTGGAAAA
+CGCTGATGCCACCCAAACCAATGTAGACGATGCTGTGACTGCTTTAGCTACGGCGGTATC
+CACCTTTGAAGCAGCGGTCATCACGGAATAAACAGCGGGAGGTGGTGAGTGTATGGTGGT
+AACCCTGGAAGAAGTAAAACTGTATTTAAGGATAGACGGTGATGAGGAAGATACACTCAT
+CACTAATTTTATTTCTACCGCCGTGGAAATTTGCGAGGATATCTTAAGATACTCATTGTC
+GGAGTTTGAAGAAATACCGGCGGTAGTCAGGCAAGCGGTTTTGTACTGTGTGGCCAATCT
+GTATGAAAAAAGGGAAGGAACCCACTATTATCTGAAAAACGAAGGCGGCGGCATGGCTGA
+AACCGTAAATGTGATGAAACTGATACTGGCAAACCTTCGCCGGGAAAGCTGGTGATGCAG
+GTGGAGATTGGGGATTTAAGACACCGGATAACTTTCCAGAAACTTACCACTAGCGTCAAT
+GAGAACGGCTTTGAGGTAGAAACCTGGGAGGATTTCAAGACCGTATGGGCGGCAGTGAGC
+AACCTGCATGGCCGGGAGTACTTTGCTGCCGCCGCTGTCCAGGCAGAGAATACGGTGAAG
+TTTACCATTAGGTATTTAACGGGTCTGGATACCACCATGCGGATTGTTTTTCAAGGCAAA
+CAGTACAACATCACCGCTATTTACAACATCAAATATCAAAACCGGTATCTGGAAATCAAA
+GCACTGGAGGTGGTAAGCAGTGGCTAGGGTAGAGTTAGAGGGCTTGGAAGCCCTCATCAA
+TGCCGTTCAAAGGCTGGGCAGCGAAGGCAAGAAAATAGAAAACAAAGCCTTAAAAGAAGC
+CGGTGCTGTAATGCAAGAGGCCATCCAAAACGAAACTCCAGTGCGGACTGGCAAGCTAAA
+AGAAAGCATTACCGTTTCCGGTGTGAGAACCCAGGATGGGGTTAAGTATGTAGCAGTGGG
+GCCGAGTAAGGAAGCCTATTATGGCAAATTTCTGGAACTGGGAACTGTCAAAATGAGAGC
+TAAACCCTTCATGGCACCGGGCTATGAAAACGGTAAAGACCGGGCCACAGCAACCATCAA
+GGAAGAACTGCGAAGGGGGCTGGGCCTATGAGCATGAACCAAAATATAATAACGGCTTTA
+AAGGATATAGGAGTACCGGTACAATTCCAAAACTACACAGGCAAAGCCGATAGCTACATC
+ACCTTTTTCACCTACCTGGATAAACCGGAGCAGCATGCCGATGATGCGGAGTTAATTACT
+GGCCATTATGTGCAAGTTGATGTGTGGAGCAAAACCGATTACACAGATTTAGTCAAATCA
+ATCCATCAAAAGATGCTGACTGCCGGTTTTACCAAACAGAACTTTTATGACCTGTACGAA
+CAGGATTTAGGAATTTATCACAAAGCCATGCGATTTTTTAAGGAGGTGCTGTAGATGGCA
+CAAGTAGGATTAAATGATTTACACTTTGCGATTCTTACCGCTGATACCAAGGATGAGTTA
+ACCTATGAACCCACCGAAGCCTTGGTGGGAGCCATTAACGCCACTATCAACCCGGCGGTG
+AATACTCAGGAGCTTTACGCTGATGACCAGCTGTGGGAATCGGTATCGGCTTTAGGCAAA
+GTGGATGTGGAAATAGAGACGGCGGAACTACCCTTAACTATTCGAGCCAAAATCCTGGGT
+AATGAACTTAAAGACGGGGTACTGATTGAAAAAGCTACCGATGTACCGCCCCATCTTGCC
+TTAGGCTTTAAAAGCTTAAAATCCAACGGCAAGTACCGCTACATCTGGCTCTTAAAGGGT
+GTGGCCCAGCCCATGGCCGAGGACTTCTCCACCAAAAAGGATAACGTGGAACACAAAACA
+CCCAAGGTGAAATTCACCTTTATGGCCAGAGTCCATGATGGCGAGTGGAAAAGAACAGCG
+GATGAGGATAGTGCCGATTTTCTGGGAGCAGCCACCTGGTTTGAGCAAGTACCCGGCGAT
+ACAACGGTAGTGGGAGGTTAAAGCTATGGAGATTACTCTGAAAGTAGCAGATCAAAATAA
+AACCTACACCACAAACTTTATCAGCGCCCGCATGGTCAGAAGAACCATTGAAATATCCAA
+AGACATCAACTTTGAAAACATCTCCCCGGAGGAACTGGATAAATTGATGGACTACATTAC
+CGAGCTCTTTGGCGGCCAGTTTAGCCGGGATGATTTATATGATGGCTTACCATCCCAAGA
+GCTACTCCCCGCCATTACTGGCTGCATCAACGAAGTGGTGGGGCGAATGGCTGAAGTGAC
+CAAAGGTGATGAAAAAAACGCCTAGAGGGGAACGCCATGGCTCCCCAAGACTTTATGGAC
+AGTCTATACCTGGCATTACTAGAAAAGGGCTGGACATTGAATGAAATTGACAGTATGGAT
+ATCATCTACTATTTGAAACTACTGAACAAAAAGCTGGGAGAAGAAAAAGTGTATATCGAT
+GGGGTTTTATAGGAGTTTCTTGGAGTATAATCTAATTGTTAGCGTAGCATAATAATGCTA
+TAATTAAGGCATAATGTAACCAAAGGAGTTGATATTATGCCTGAAATTAGACCGATAAGA
+GATTTAAGAAACACAACTGAGATTTCTGAACTGTGTCATAAAAATGAAGAACCAATTTTC
+ATTACGAAAAATGGCTATGGCGATTTAGTAATCATGAGTATGGAAACTTATGAAAAAAAG
+CTAGCCCAAGCAGACCTCTATAAGAAATTAGCTGAAGCAGAAAGTCAAGTTGAAAACGGT
+GAGCCACTTTTAGATGCTGAAGATGTATTTGAAAAATTAAGGAAGAAATATGTCAAAGAA
+TAGTTATAGCTTAAAACTTACTCCAAAAGCTAGTAAGGATTTAGATAAAATATATAGATA
+CATTACCGAAGAACTTTATGCTGAACAAGCAGCTGTTAATCTTTTGGAGAAAATAGAAAC
+AAGTGTAATGAGATTAAAGGACTTTCCGTTTTCAGGTAATTATTTCGCTGATGAATATCT
+AAAGAAGAAGGGTTATCGAAAATTAATAATTGATAACTACATTGACTTTTATGTAGTCGA
+TGAAGAAGAAAAACAAGTAGTTGTTATGCGTTTTTTATACGGCAGACAAAAATATGAAGG
+TTTACTCTAATAGCATCTGATAAGCAGGTGCTTTTTTTATGCCCAAAGGTGGTGAGCTAA
+ATGTCAGATGTCGGGGATCTAAATGTACGGATCAACCTTGATGCCCTGGGCTTTCAAAAC
+GGGATCAGTAAAATCAATACGGAAATGAAAAAACTGCAATCGGAGTTTAAGCTGGCCGGT
+GCCCAATTGGGTAAACACGGCAGTGAGCTGGACAAATTACGGCTTAAATCCGATAACCTG
+ACCAAAGGAACGGAGCTGCAAAGGCAAAAGGTGCAAGCCTTAGAAGAAGCCCACCGGAAG
+TCTGTGGAGGCCAAAGGCAGTGATGCCAAGGCTACCCAGGAGCTGGAAATTAAGCTAAAT
+CAAGCTCGCGCCAGGCTAGTGACCATGGAGCAGAACTTGGAAGAAGTTAATAACGAGATA
+ACCCTCCAGTCATCCAGCTGGTACAAGCTGGGCAAAGAGCTGGAAGCCGCCGGACAAAAG
+ATGCAGGCTGTGGGCCAAAAGATGGAGCAGGCCGGAAAAGAACTCAGCATGAAGGTTACC
+ATGCCCCTGGTGGGTTTAGGAGCTGCTGCGGCAAAAATCGGCTCGGACTTTGAAGCCGGG
+ATGAGCGAAGTGCAGGCCATCAGCGGAGCCACCGGCACTCAATTAGAAATGCTGGAAGAA
+AAGGCCAAGGAAATGGGTGCCACCACCAAATTCAGCGCCGCCCAGTCGGCAGAAGCATTA
+AAGTACATGGCCATGGCTGGTTGGGATACTGGTCAGATGCTAGATGGTTTAGATGGCGTC
+ATGATGCTGGCTGCTGCCAGTGGCGAGAACTTGGGTACCGTTTCCGATATTGTCACCGAT
+GCCCTGACCGCCTTTGGCATGCAGGCAGGCCAGGCAGGTGAGTTTGCCGACCTTCTGGCC
+AGCACTTCTAGTAGCGCCAACACCAATGTTTCTATGTTAGGGGAGTCCTTTAAATATGTG
+GCTCCCCTTTTTGGTTCACTGGGTTATTCGGCAGAAGATGCAGCCCTGGCTCTAGGCTTA
+ATGGCTAATGCGGGTATCAAAGGGAGCGAATCAGGTACTGCACTAAGGGGTGCTATTGCT
+AACTTAGCTAATCCCACAGCCGGTATGGCCAAAGCCATAAATGAACTGGGCCTCACTATT
+ACTGATGCCAGCGGGGAAATGCTACCCTTTAAAGATGTGATGGACCAGCTAAGAACTGCC
+TTTGCCGGGCTTACCGAAGAGCAAAAAGCCCAATATGCTGCCACCATCTTTGGTAAGGAA
+GCCATGAGCGGCATGCTGGCCATTATCAACTCCAGTGAAGAAGACTACGCCAAACTGACC
+CAGGCTACCAGGGAATACAACGGTGTGGCCAAAGAAATGGCCGAAACTATGGAAGCAAAC
+CTGCAAGGGCAGCTGACAAAATTAAGATCAGCTCTGGAAGGTGTAGGCATACAAATTTTT
+GAGATCCTGCTTCCCCATCTAAATAAGCTGGTGGAGATGCTGCAATCCTTGACCGATAAA
+TTTGCCAGTCTTAGCCCCGCTACCCAGGAAACCATCGTAAAAATTGCCGTTCTTGTCGCA
+GCCATCGGGCCGCTTTTACTTATCGGCGGTAAACTTATCGGTGTTATCGGTGCTGTTGTG
+GGTGCGCTGTCCACAGTATCCGGGGCTATTGCTGTGGCCAGCACTGGAGCAGTTGCAGCA
+ACACCTGCCATTGGAGCCTTAGCCACAGCATTTACAGTTTTAACAGGGCCGGTGGGAATT
+GCGGTTGCTGCTATTGCCGGAGTTACCGCAGCAGGCGTAGCTTTATACAAACACCTAAGC
+CAGGAAGGCATCCCGGCCATTGAACTCTTTGACGATGAAGTATCGGAATCCACCCAAAAA
+GCTGTGGGTGGTTTTTTAGCGCTTAACGACCAGGCTACTTTAGCTTTAAACCAATTATCC
+TGGAGTGGTCAGGAAGTTACCAAGGAGATGGTGGACAACATTGCCGGGAACTTCTCACAG
+ATGGCTTCACAAGTACAAGCCGGACTGGATAAACACCATCAAGAATCCCTGGCGAAAATC
+CAAAACTTTGTCACCAGCAGCACAGCTTTATCTCAAGCTGAGCAGGACGAAATATTAAAC
+AACATGCAGCAGGGCTATGAAACCAGGAAACAAACCATTGCTGAAGGCGAAGCCAGGATA
+AAGGAAATCCTGGATATGGCCAGTACAGAGAAAAGAGCCCTGACCAAAGCCGAGCAGGAA
+GAAATCAATGCCATCCAAAGGCAGATGGTGGACACCGGCATCCAGGTCCTTTCCGAAAAC
+GAAATCGAAGCCAAAGCCATTATGGAACGCATGAAAGCCCAGGCCATAGAGTTAACGGCT
+TTGCAGGCGGCAGAAGTGGTTAAAAACAGCATTGAGCAAAGGGACGGGGCCATTCAAGCG
+GCCAATGAGCAGTATGATCAGGTGATCAAGGAAATCATCCGGCAGCGCGATGAAGCAGGC
+ACCATCTCTAAAGAACAGGCCGATAAATTGATTATCGAGGCCACCAGGCAAAAGGACGAG
+TCTATAGCCAAAGCCGAAGAAATGCACCTGCGGGTTGTTGCCGAAGCCCAGGCCCAAGCC
+CAGGAACACGTCAATCAAGTTGATTGGGAAACAGGAGAAATCAAGACCAAATGGCAGGTT
+ATGCGTGACGATATATTCGCCAAGGCCGGAGCAATTAAAGAAAACGTCTTTACCACCTGG
+GAGGAAATTAAGACCAACACCTCCCAGCAGTGGGAAAGTATCCGTACGACCATGAGCGAC
+AGGTGGAATGACATTAAAACCAATACCTCCGAAACGGTAGCCGCTATTAAAACCAATGTC
+AGCATCACCTGGGATGAGGTTAAGACCAAAACCTTTGAAACCTGGGACAACATCAAAACC
+AAAACTGCTGAAACTTGGCAGGCCATACAAAATAAAATCGATGAACACGGCGGCGGTATT
+AAGGGCCTTATTGGAGCCTACACCGAGGGATATAAATCCGTTTGGGACAGTGCCTTGACC
+ACCATGGAGGAAATCACCGGCATCAAATTTAGCGACATGGCCGATAAGGTAGCTGATGCT
+TTAGAGCGGGTTAAAAAGGCTATTAGCAGTGCTATCGACCGGATAAAAGAGTGGAACGAT
+ACCAAAGTCAAGGAAAAAGTATTTAGTATCACTGAAACCATTACCAGGATCATTAGAACC
+ATTACCACCGGTGGAGGTGGCGGCGGCGGTGGTGATACTTCTGCTTCCAAAGGCGGTGCG
+GCAGCTTCAAACTTTAGCGGCACCAGCTTCTTCCCTGGTGGTTTAACCATGGTAGGGGAA
+CTGGGACCAGAACTGGTGGCCTTGCCCAGGGGAAGTAGGATTTATAACGACCATGAAACA
+AAGAAAATATTGGATGGAAGTAAAGGCATTGTCCAACACATTACCCTCCTTTCCCCTACT
+CCCCTATCCCCTGCGGAAACGGCAAGAAGAATTAAAAATGCCTCTAGAGAGCTGGCTCTA
+GAATGGTAGGAGGTGTAGTATGGACAGAATAGTTATCACTAACCAAAAGGGAGAAAGCAT
+CACGTTAGGCAACCAGGCCCCATATTTCCTTGAAACCATTGACGGTGTCGGGGAAGTGCC
+GGTAGCTATTGAAAGCCAAAAAGCACCCAAACAGGATGGCTCGACTTATCTCGACAATAT
+GTTGGATAACCGGGCCATTTCTATTGAAGGCACGATTATCACGAAGATTGACCCTGCTTT
+TGTACTGGAAGCCAGAAGGAAAATGCAAAGGGTACTAAACCCAAAATTGGGGGAAGTAAC
+TATCACCTACCATCAGAGAGACCAGGTCCGGGAGATTAAAGGTCTGGCCGAAACCACTCC
+GGTATTCCCCGGTGGGCAAGGGAGTAAAGGTTTGTATTACCAAAAATTCTTACTTCACCT
+GCTCTGCCACCAACCCTTCTGGCTGGATACCTTCTATGAAAGCCGGGAGATGTCTTATCT
+CATGGGCGGGATTAAGTTTAAACTAATCCTTCCCACTGTATTCTCCTACCGGGGTTTTAA
+GAGGCGGGCGGTAAACGAAGGCGATGTGGCTACGCCGGTGGAGATAGAGTTTAAGGGACC
+GGCAACTAATCCTACAGTTAATAATCTAACCACTGGGGAATTTATCAAAGTTAACCGGGA
+ACTTGGGGAGGAAGATGTGCTCACCATCAATACCGCCTTCGGGCAGAAATATGTGAGGAT
+TAACGGGCAGAATGCTTTCCACTATATTGACTTGGACAGCGTATTTTGGCAGCTAGTACC
+GGGAGAAAACACCTTAAGCTACCGGAGCAACAACGACAGCATCAAAACCAGGGTTACCGT
+CAAGTGGAAAAACCGCTATGTTGGCCTATAGAAAGGAGTGATTTTGTGGCAGAGCTTTAC
+AGATTTTTTGATTCCGTTGATGGCGAGGACGAACGTTTTTATACCGCAGATGAGTTCGCT
+GAATACTTCCGCCAGTTTATCAGAAACGGCATCTTCAACGGCTCCGGGGACAACTTGCAG
+GTAGGAGCCGAAGGCCAGGACATGCGAACTTTTATTAAACCCGGCTATGCCTGGATTGAA
+GGCTACCTTTACAAAATCGACATTGAACCTTTGGAACTTTACCACCCGATGGCCCATGCC
+AACTACGACCGCATCGACCGGGTGGTGATTAGATTAGATAAGACTTTAGAAAACCGCTAC
+GTGAAAGCCTTTGTGTTAACTGGTACCCCAGCGGAAACGCCACAGGTACCGGAGCTGACT
+AGGGATGAGAATGTTTATGAGCTGGCTTTAGCCCAGGTGAAGATCTTGGCCGGGAAAAGC
+TTTATCGAAGCGTACCAAATTACTGATGAAAGATTAAATCCGGAAGTCTGCGGCGTGGTC
+ACCCATTTATTTGAACAGGTGGACACCACCGAGCTGTTTAACGAATGGCAGTTATACCTC
+AATGCCAGGAGAGCACACGGAGATACAGAGTTTGCCGCCTGGCTTGAATATTTGACAGAT
+AAAAAGCAAGATGCTGGTATTGAGCATGCTGCCTTTTTGGCCATGCTGCAATCAAAGTTC
+ACCGCTTTTCAAAACACCTGGACTAACTGGGTAAACGATAAGCTAACCATTCCGGATGGA
+GCCTTCTACATCCAGTGGAAAACCTGGTTCGATAGAATCCAGCAGGACTGGGATATTTGG
+TTTGACCATGAAGCCCAGCGGGTTTGGCAAGCCTGGGTAAACGAGAAGTTAACGGCACCT
+GATGGCGAATTTTACACCCAGTGGCAGGACTGGTTTGAAGAAATCCAAGACGTAACCAAC
+CTGGTGCCCAGGAGCCAATTCAAGGCCCACAAAGATCGGACTGTCAGGGAAGGTGCCCAC
+GGTCTACGCTTTGCTGCTAATCACTTGGAAGTAGAAATTAATGACGGCAAATGGCGCAGG
+CTGCAAGCACCAATCAGCACATGGGGAGGGATGTAATATGGGCAGCGCTATAAGATTGAG
+CAAGGGTGAATTGACCACTACTTTCGAGCCTTTATACCAGGTGCCCAATGATCGGGTGGT
+GATTCTAAAATCCATCATCTTAACGAACTTAACAGATACAGCGCAAACCATCAGCCTAAA
+ACTGGCCGGGGCTTATGTGATGCGGGATAAAACACTATCCGCCGGTGAATCTTACCAAGC
+ATCGGTATTTGACCAGGTTATTGTATCGGGGGAAGTTATCGAGGGCAAAGCCGGTCAACC
+GGAAGCAGTGGATTACTACATCAGCGGCAAACTGCTCCTGCCCCAGGACATCGCCAGTGA
+AACCCAGTGGATGCAAGAGCAGTGGGACGCCTGGTGGGCAGCGCACCCGGAAGTATTCGA
+AGTGGTTTGGGATGCCTGGCTGCAAAGTAAAACCCGTGAACCAGATGGGGCCTTTTATGC
+TGAGTGGAAAGAGTGGTTTGACTATATTCAAGGACTTAGCTTTGATGCCACCGACCTGGT
+GCCCTGGACTGCTTTTAGGGACCACGAGGCTGATTTTTCCGCCCATGGGGATCTGGCCAA
+TACCTACCGTTTTGGGAAAGACCACAAGGGGATTTTCACCACCATTGAATGGCACCGGCA
+AGATGGAACCCTGGCTAAACGGTCTGTGTTAAGCGGCGGCAACTCACCACGCTACGAAAA
+CCGGACGGTTACTTATTATGAGGCAGATGGAGAAACAATTAAGACTGCTGTTGTATACAA
+CCAAATATATGACGAGGCAGGAAACTGGATAGAGGAGGTAATGGCAAGTGAGTGATTTAT
+GGCTGCACGGCTTGGGGCAAACATCAATGGGAGATCCGGGGGTTATTCCCATTGAAGGGT
+TAACGCCAATTATAGCATCAGATGAGATTAAAGGGCTGGGATTGCCTTTTGCCTACCGCT
+CATTGGGAACCTTGTCCAACCGTAAAGGTGTTAACCACTACCACAATGGGAAGGTCTATG
+TACTTCACGGCCTGGGGGTGACTATTTATGATGCGACTACCGGAGAAGTGATAGCCGATA
+ATACCCACACAACTTCTTCAGCGCATATGACCCCTGACCTTGCGGCTACGGATGGTAGTT
+ATTATCTTGCGCAGGGCACAACCCTATATAAATATGCCTCTGATGGTGCTTTAATTTGGA
+AAGCAGAGAATGTTGGTTCTTCATACTGTATCGCAGTAGAAACATCTGGTGTTTATGTTG
+GAGTTAGTGCATCCTCGGCTTATTATATTAAAAAATGTAACCGAACCAATGGTCAAGTTA
+CGTGGACATCAACTAGCCTAAGTAGTAACATAGCGGCATTAGCGGTTAACAGTAATACAG
+TTATTGCGGCTGACCAAAGTTATAAGATCTATAGGTTAAATCCAAGTAACGGGAGCACGG
+TATATACTTACACCATACCTAATAACCGCTATGCCTATGCCCTAGCCATTGAGCCGGGTA
+CTAACCATTTTTACTCAATAGATAGTTACCATGTCATACGAAAACATAGCTACCAAACAG
+GCGAGCCAATTTTTGAGAAAACCAGCGCCAACACAACTACCGTATACAATCTATTCATCG
+ACAGCGAAAACAACATTTATACCGTCTCCAATCGGGAAATCACCAAGCTGGACAATCAAC
+TGGCCGGTTTTATCTGGCGAGAGGATCACAACATTAGCGGTAACCCCATTTATGGTTTCG
+GCCTTGATAAAGAGCAGGGAAAAATCTATGTGCTGCGCCAGCATTCAGCCCGCATTTTAT
+CTACCGATAAAGAGTGGTCGGATTTTATCCCGCATCAATTTGAAGGCGTAGTAAATTCCA
+TTGATGTGGATGTCAACGGCAACTTCTACGGAGCCAGTGATGACTGGACGGCAAGGAAGT
+TCAATGCGCTGGGTGAGCAGCAGTGGGTATACCGTCATAACCTTGCTTTGAACTTTGTCA
+AAGCCGATAAGAACGGTAATGTTTATATTGCCGATACCAACCGAACCTTGAAAAAACTTA
+ATCCGTACGGGGTGGAACAGTGGTCCTGCAGCATTTCCGGTACAACAGGTGCGGTAACAG
+ATTTAGTGGTAAACAGCGAAGGAGTAATCATTGTTAGCATTGCTTATTTTCATACTTCCG
+GCTCCAAGGACTATTTAGTCAAAATATCCCCGGAAGGAACTTTGTTAAAGACCATGGAGA
+TTGGTACCAGCGGTGTGTTTCGTAAACTGCATCTGTGGGATGACCGCACTGTAATGGCTT
+TTAACAAGTTGTACGACATCGACACCCTTCGGACTATACGATATTTCAGTGCGGCAAGGG
+CGATATTTGGTAGGCATGGAGATTTTCTCTTTGGTGTTTATGATGATGAAATCAGGGTAT
+TCAATAAATATTCTGGTGGGCAGATACACTCTTTTGAAGTAAGCGATATTAACATTACCA
+ACTTCTATTTGCGGGCTGTCCAAGGTTTGGACGGAGCTGTTTACGCCTGGGATAATGATA
+AGACCTTGATTAAATTCAATGAAAAAGGGGAGAAATTCTGGCGCTACAAGGCAGTGGAGA
+AGATTGCGGATATCAAGGTGGATGACGAGCACAATATTTATCTGGCCACCGGCTACTATA
+TTGAAAAACTAACCCAAACCTTTGGAATCAAGGGTTACGATAAAAATTAGAGGAGGGCTT
+TAATATGATTTATGTATTTGAAAGCGGCAGTATCGTTTACGATGAGAGTGTTTTGGCAGA
+GGCGGATAAGGCCAGGGCTGTGGCGGTGGAGCAGCTGCCGGAGCAGGAAACGCCAGTAGG
+AAAGATCGCCATTATCAAGGCGGACAAGGCAACGGAGACCGTTTGGTGGGAATATGTAGA
+TTCCCCTGCGGCTGTTGAATTTCGAGAGCTTGAAGTTCAAATCCAGGGGCTTCAGATGGC
+CTTAGCAGAACTGACAATATTGTTAGCGGGAGGTGAAGCATAATGACCTTTGATAAAAAC
+TCGGCATTGGTTAAAAACGTATGGGTTCCGCTCATACTGGCCGGAGTGTACACACATGAA
+CAGGTGCCAGCCTTGGGAAATCTAAGAGCAGTGGTGCAGCAAGTATTAGCGGAGATGGAG
+TAACACCTGGAAGGGGTGTTTTTTTAATGTTTTTTCTTTCCCCTTTATTGTGGTAAAATA
+TGGCAGGAGGTGGAAAATGGAAAGAATAACTTGTAGCGGACCAATACTAATAAAATTTGC
+ACCTTTGAAGTTGGCGAAGAGTTTTCGCAGCGGTACAATTTATATGAATTCGCTGGACTA
+CTTTAGAGGTCTAGAAGATGACAATAAAGTAAGAGGAGATCTTTTGGAAGGTACACATAG
+TCTGATTGCAAAAGATGATTTTAGCCAGGTGTTGCCTCAATTTGGTATGGATTTTCCTGA
+AGCGATTAAGAAAAAAATAATTGGGGGCATACATCTGTTAGACGAAGAGTTAAAATATTA
+TAAGGTTTTTTGTATGTATCAGTTAAATTGTGATTTTAAGAGCAGGTACATTGAGCCTAT
+CGATACCAGGGTAAATAATTTTGGAGATACTTTTGTTTTAATATTTAATCTTAAAGAATT
+TAGAAGAAGGATTGTTGCTGAATTAGAAAAAGGAACATACAATGCCCTGGGATTTGCCGG
+ACAAGGTGTGGAGTATTATCAATATGATACTTCTACTCAAAAATTAGGCCCATTAAAAAA
+GTTGGATTTATATAAGTGGCAAAATGAGTATAGGTTAATTGCTGAACCACTTGAACATAC
+ATTAGATCCGTTAATTCTTAACATTGGTGATATCTCTGATATTTCGATAATTGGCTCAAC
+AAGTAGGTTAATTGAAGAGATTCATTTTGAAGGTAAGGAGCTTTTTGTACCAGGTTATAA
+CTTATAACCACAAGAAATTGATAGAGGTGAGCCATGAAACCAATACGCATAATAACCCCG
+GCCCTGGAGCTTAAGGGAGAGGTAGACAACTATCTCTCCCTTTCCTTTTGCCGCAGCTAC
+CACTCGCCTGGCGAGTTCCAGCTGGTGACAAACCGCAAGGTGCAAAACGCCAATCAGCTC
+GAAATCAACAATCTAATCATGCTGGGGGCTGACCCGTGCAAGACCGGCATCATCCGCCAC
+AAGGAAATTAAAAGCAATGACAAAGGAGAAGAAATGCTCACCATCAAGGGTTACGCATTG
+GGGACTATCCTTCGTCAGCGCATCACCATCCCACCTGTCGGACAAGCCTACGACATCCAG
+GAAGCCAATGCGGAAACGGTCATGAAACACTATGTCCGGCGAAACTGTCTACAGATATCG
+GAGATGGAATTTCCGTTTCTTGTGATTGGTGATGACCAGCAAAGGGGAGAAAACGTTAAA
+TGGCAAACACGATACAAGAACCTGGCTGATGAGCTGGAACAGATAAGCATACTTACTAGC
+CTTGGTTGGCATATCTACCCGGACTTCAATTCAAAGAAGTGGATATTTGACATATATAAT
+AGAAGGAATTTTTCAGCCGGTCAACAAATAAACCCGCCGGTTATCTTCTCACCGGAGTTT
+GATAACATCAGAAGTCAGGAATTTATTGATAGCTTGGTGGGCTTTGGTAACTATGCAATC
+GTAGCTGGTCGAGACGAGGGAGCCAATAGAGAGATCATGATGCTGGGCAGCGATGCTACT
+GGTCTGGATCGCCACGTTATCTTTGTTGATGCCAGGGATGTTAAAGATACTGCTGACCTG
+CCAGCAAAAGGTGAAGCAAAACTGGTTGAGCATCAAAGGGTTTTATCCTTTCAAGCCGAG
+GTTTTAACCGCTGGGCCTTTTAAATATCGGGATGATTGGGATGTTGGGGATATCGTCACG
+GTGCAAAACAAAGCTTGGGACCTGACCATGGACACTCGGATTACAGAGGTGCAGGAAATC
+CATGAGGCTAGTGGCTTCAAACTGAACGTCACATTCGGCAACAACCTCCCCACCCTATCC
+CAGAAGTTAAAAACGGCCCTGGGGGAGTTCAAAACAGAAAGCACACGATAAGGACGCCTT
+TGACAGGTGTCTATTTTTTATGAAAGAAGGACGATTGCATGAAAGATATCATTCATACCC
+TGCAGCTTGCCTTTACGGCAATCGGCGGCTATATCGGCTGGTTTTTAGGTGGCTATGACG
+GTTTAGTCTTAGCTCTGGTGGCCTTTGTGGTCATTGATTATATTACTGGACTGATGGCAG
+CAGTTATTGAAAAGAAGCTTTCCAGTAGTATCGGCTTTCGGGGGATTTTCAAAAAAGTGC
+TCATATTTTCCTTGGTGGGTATAGGCCACATTATCGATTACTATCTGATTGAAAAGGGCA
+GTGCAGTCCGTACCGCTGTGATTTTCTTTTATTTGTCCAACGAAGGATTGAGCATCATCG
+AAAATGCATCCAAGGTGGGCCTGCCCATACCGGAGAAGCTGAGGGTGGTATTCACGGAAC
+TTAGAAGGGAGGATAGAAAGAATGGCTAGAATTTGTATCGACGCCGGACACGGTGGAAAT
+GATCCAGGGGCTGTATATACGGGAAGAAAGGAATCCGATGATAATTTAGCACTGGGAAAA
+GCAGTAGCGGCAGAACTAAGGCGGCACGGGGTAATTGTTGATGAAACCAGAACTGCTGAT
+GTCACTGTCAGCCTCAATGAAAGGAGCAACTTTGAAAACCGGCAGTCTTACGATTGTTTC
+ATCTCCTTCCATCGCAATGCCTTCAAGCCAGAGCAGGCCACGGGTGTGGAAACATACACC
+TATTTGAACCCAGGAGCCAAGGCCAAAGGGCTAGCAGAAAAAATCCAAACTGCATTGGTG
+GGTGTTGGCTTTACCAACCGGGGTGTTAAGGCGGCTAACTTCCATGTCCTTCGGGAAACA
+AAAGCACCGGCGGTATTGGTGGAGGTGGGTTTTATTGATAACACCGGTGACAACCAACTG
+TTTGATGTTAAAAGGGATGAGATCGTAGCGGCTATAACTAAAGCAATTCTGGAACAGGTG
+GGTATCAAATATCTGCCATCTACTCCCCCATCACCCAAGCAGCAAACCGGCCAAACATTA
+TACAGAGTAATGGCAGGCTCCTATGCTGTTAGGGAAAACGCTGAAAGGCAGGTGGAAAGG
+TTAAAGGCCGCCGGGTTTGACGCCACCATTATGATATTTACGCCTTAGGCTAAAACGCTT
+AGGGCTTCTTTTTTTCAACGCCCAAATCCTTAACTTTTCTAAGTTGAATTATAAGTAATT
+ATAACTTGATGTTATCCCAATGTAACGGTAACATGCTACCTACCAAAGGAGGGAGAGAAA
+TGCTCTTAAACCAAGCAATCGAGGGTTTTACAAAGTACATGCACCTTATTGATAGATCGC
+AGGAAACCATTCGGGGCTATGCCATAGAATTGAAAGGGTTTAACAACTTCTTGACTGTCA
+AGCATAACTGCCCGGTGTATTTGGAAGACATTGTGCTTCAGGATTTGGAGGACTACCTGT
+TCTACGAAAAGGAAAGAGGGGCAGCCTCATCTAGTAGAAGCCGCTCATTATATATTCTAA
+GAAGCTTTTACAACTACTGCTGCAGGAAGGACTTATGCGTCAAGAACATTGCCAGCTTAC
+TGGAGCCAGTGAAAATCAAACAAAAGGAACGAGAGTTTATCACCGAGGATGAGCTCGGGG
+AACTGGTAGCTGCCATTGAGCAACCAGTCATTAAAACCGTAGTCCAAGCCATGTTTTACA
+CCGGTGGCCGGATTTCAGAGATGATCCACCTGACACTTGAGGATGTGGATCTGGATGGCC
+GGGTGTTACACATCATTGACGGCAAGGGCGGCAAAGACCGGGATGTGCCCATCAATGATA
+AGCTACACCGGATTTTGACCCACTACCTAGAGCACATCCGGGACGCACATTCAAATCGCT
+TCTTTGCTTTAACCAGAACCGGCAAAGTATCGGCCAGCTATATCAACTACTGGATTCATA
+CCGCAGTAGAGGAATTGGGCTGGGACAAGAACATCAGCGCCCACGTGCTTCGGCACTCCT
+TTGGCTCCAACCTGCTGGAGAAAGGGGCCTCGGTGGTGAGCATTCAAAAGCTGCTGGGCC
+ACTCAAGCCTTAGGGTAACGTCAAGATATCTGCACCAGGACACGGATAAGCTGACTGAAG
+CGGTTAATCTTTTATAGGGAGGGATAAAACCATGGAACCTATTTACGATGAAAAGGTCAA
+ACGGATTATTGAAATGCTAAAATTTAAAACCAGGGATGAAGTGGCGGCAGAGTTGAAGTA
+CAAGAGTTACAAAAGCCTTGATATGTACATGCGCCGGAAGAACTTTGCTTTCGACAGCCA
+GCAAGGTCAGTATTTCCCCCGGAAGAACAGAATTGAAAAACCAGACCCCAAAAGCTACGC
+ACCCACCAAGGTAGCCAGCATCATCACAGCTTTTGAGATTGAGGGCATTGACCCAAGGAT
+GGTGGCCAGACAAGAGGGATTTGCTGACCACCGGGAAATGGCTGAGTACATGAAAACCAA
+GGGCTACGAGTGGAACGTCCATAAAAACAACTATGTCAAGACCGTGGGTAGGATTGATGT
+GCCGGAGCCGGTTGGTGATCCAATGCCGGAATCAATCAACCTACCAGGGCCAATTGTTCA
+ATCGGCATTATCGCCAACCGTTCAACCAACCAGCGGGGAATTACCGGAGGGGCTTGGGGA
+ATATCTGCCCTTCCTTCGCTTCCTCTATGAAAACCGGGATGAACTCTATCAGTTACTCAC
+CGGTACCAGGGACGATGGCATAATTCCAAGGTATGCTGTGCCAGGGGAAGTCAGGACTAA
+AGCCATTTACATGAGTGATGTTATTGCCAAGCTGGCCGGGGAATTTAGCAAGGAGAAGAA
+GGTTGCCTTAAGGGAAGTCATGGAAGGGGCGCTAGTGGAATACCTGATGAGGTATGGGTT
+CAAGCGGGAAGTGGAAACGCTCCTAAGAAACCAGTAA
+>NC_021184.1|provirus_4563831_4615358
+TCACTTCTTTAACCCACCCTTCCTTCGGCTAGTGATAAGGTGTATTTGGCCATCCTTTTG
+TTTTATGAAATGCTGCTTCATCTCATCTGTTAAACGCACTTTTCTATCCTCCGTGATAAA
+GGCAAACCTTATTATGTTAATATCCGTAAAATCTATGGCTTCCAATTTGTTTTTAAGATA
+TATTTTCCACCTAAGATTGAGGTCAGTGTTGTCCTGCCAATTAGCATAGAAGGTGTTATC
+AGTGTATAATTTAGTGTCTAGGCTAAGATATAATTCCGCAATAATATCAAGTAATAGTAA
+AACCCTGGTATTATTGTCACGTAAGACGTCCGGCTCCTCCATATACTCAAGGAAGTGCAA
+AGCCCTATTTCTATTAAATTCCCGCTTCACGCCTTTTTTAGAACCGGCAAAATTCTGGTA
+AAACACTTCTTTGATCATATACTCCAGATATTTAATTTGGTTGCGAATCCAGTTTTGGAA
+ATCAGGATTAGATCGCCTTTCATCATTCCTCTCCCCCAAATATTTTACTAAATACTTCCC
+AAAAACAAGTATGCTAAACTCACCTTTTGTGTTTGCAGATTTTATTTCCGGGTGCTCGAT
+AGCCCACTCTCTTAATGCAACTTCTACGGCTGGCACCAGGGTCAAATATGAGCATATATA
+ATTGCCGATCATTAGATCATAGGTAGCGCTTTCAATCACTTTCGTTAAACGGCTCAATAT
+CTTCGAGGGTTTAAACCTATATTCAATCTGATATGCTCTTTGCCATGGATTAATTACCAT
+CCTTAACACTTCTCCCTCCAGCCCTCCCCAAGCCGGATCCGGATTTTCTAAACAGCCTAA
+TAATTCCTCAACCTTTTTCCCGGAGACACAAGGGTAAGGAGGAATAGTAAGCAACTTGTC
+CTTTAGATGGTCATCAATTTTGTCGAAGGCCTCCCATAAATTCATGTTATCCCCCCTTTA
+GGTAAATATACTATTTAAAACACGCTTCACCTCTTATTACCTTGAGAACCTTAACGATTA
+AATGACCTCTGATACGTTCCGACGGGGCAGTTGTTAAAAATAAAATAACCAGCCAACTAG
+GTAAGCCGATATACCCTATCAGGCCTACCTGTTTGGATGGTTGTCCTGGTATAATGAGAT
+AGAATCCATGATAGCAAAAATATGTGTATTGGCAACAATTCTTCATGTTCTGCGCAGCTA
+TATTACTACATTGTAACTATCTCGCTTAATTTTTTTATGTTTTCTTCATCTTGAATATCA
+GTCCAGCATGAACTGATATTTTTACTTTTACTCATCTCGGCTTTTTCTTCTCCAAATGCA
+CTTTTTGTTTTTTCGTAATTTTTATCGCTGACCGTTTTTCCTATTGGATTCCTTTTCCAA
+CCACAAAAATATATCTTGCTAGCCTCCTCAATGTTCCTCCTTTTTGAAGCAGCCCTTATG
+ACATCCGTATAGTTTGGTTTCCGCTGAAACTCCTTTGGTATTTTTCGATTTAAAGCCTTA
+AAAAAATCGATTGGAGCAAATTTATGGTTGGGGTCATATTCTAATTCAAGATATGCAACT
+AATTTTTTGTAATCTTCCATGTAACACTTAACTCTATACCCTTTTTTTATTTCCAGTTCA
+AATACTTCAGGATTGATGCCAAGTGTTGTCAAATATAGCCGATAAGGTAATATGTCCGTC
+AAAAAGATACAGCTAAAATTTTTTCCATTATAATCAAAGGGGAATATTGCCCTCTTTTCT
+TTTTTTTGCTTCATATTCTTATGAAGTATTCTCAACCCACTAAATTCAAATATCCTCATA
+CTACTACCTTCTTTTTGAACCGTATTTGCTCTCTTTCTCCGATTCTCACTTTGGCCTTCC
+GCCACGCTACCCCGACTATATGTAAGCACTCAATCCGAAAGTACATGGTTACGCCTCTTG
+AAACATGCGACAATACCTCCATAAGACTTAAAACTAAAGAACGGAGGTAAAAGGGGCAAA
+AAGGAGAACGACAAACCCTTGTTAAGGAATACAATGCTAGTGGATTTTATGACAGAAAAC
+AATCATGATAATGCTTAACACAGAAGAATGAATAAAATTATCCACTTATTCCCGCAGTTG
+CACATTAATGTTAACCGTCCCCTTGTTTGATATATAAGACTATCCTTTATGTTGACTGCT
+ACGCCTTTCGTTACTGGCCGTTCTTGCCATTTCGATGCCCCTTGACTATATGGTAACATG
+CGTGGGTAGAAACAACAACACAAAAGAGCCATCCCGTTGTGTTGTGTTGCCAGCCCCCCA
+GGTAAGCCAGATAACTCCTATCCGGCCAACCTGCTTGGCTGGCTATATTCCCACCCACCC
+GGCTGGCTCACAATTCCTATATCCCCACCCACACGGCAGCCAAAAAACAGGCCAGGCGAT
+CCACGTGGGACCGCACTGGCCTTGGTTAGCTGATTGGGACTAATTGGATGACACAAAAGA
+ACTGTCCCCTTGTGCTCTTCGGGACTGACCCCTTTTGGGAGGAACTGGATGGGGCTTTTC
+GAGCCCCGTCCAGATTCCGACCCGTGCACTTCATTTTTCAGGACAGGATTCCTGTCTTGT
+AACAATTGTTCACAATTTTGAAATATATGTTCATCCCTCAGAAAAGAATGCTTAATATTC
+TTTCGTTATAATGTAGTTGTTAAATCCTAAGCACTTAAAGCAAAATGCTATTATTTAACC
+GGTCAGTTAAATTCATTCCTGTCCTTTGACAATTGAATACCACCGGGGGCACAACAATTC
+ATGCTGGCTATCTGCTGGACCGATTCCAGGGCTGAAAGGGAAAAAACGAGCATAAGGGAG
+AACAAAAAAAGAAAACAGCTGGGCGATCCGCGTAGGACCTCCCGGCTGTTAAATTCTTTA
+TCTCGCTAAACTGTTAACGCAGTGGGGGACTGTCCCCTTTTGGGAGGTTTTGGGAGCCAG
+TTAGGATTCCCGAAACCGACCCGAGCATCGACACCACTTGCCAATATTTACCTCGTTTTT
+TATACCCACAAAATCTCACCTGTGCAACGTATATTTCTATGGAAGAAACAAAAAGGTCGG
+TTAAACCTTATATACAAATGGAAAAACCGATTTATAAAATGCTTGTATGGCACTTATTAC
+CTGTTGTATTTTTCGACATATTATACTATACTTAGCTATACATATTAAATTTTAGAAATC
+TAGGTTTTTTTTGACTTAAGTTACAAATTATTGTATTCAAATTTTTCTAAACCTAGTGTT
+AAGACTTTAGCCGGGTTTAGCTGGTTGGGTAGGTTAATTTTTTTCGCTCTTTGACATTTG
+AATATTGTTCGGTGAGCACAGTGAGGACAATTACAGTGCTGGAAGGCTAGAAAAGAAGGT
+AGCCTTGGTGTTGTAGACTTCACAAAATGGTTCCGACGTCTTTGGTGCTGGTTCTGACAG
+CCAACTCAGGGGGGGGCATGACACAAAAAGAAGACAACCGGGCGATCCGCTTGGGACCTC
+CCGGCTGAAAAGCTCTTTAATGTGTTAAATTGTTAACGCAGCGAGGGACTGTCCCCTTTT
+GGGAGGAACTGGATGGGGCCGCCAGGCCTCGGCCAGATCCGACCCGTGCATTTCTTACAA
+AGAGGTGCCCCCAGAGGATTTAACCCCCGGGGGCACAGACCATTGGCACGCGTTTACAAC
+TAATAAGTTAAATGCCTGGTACGTTCTTTGTTAAATCATTTACGGCAAATCAACTACTTT
+CTGAGCATTGTTTACATTACCGGCAACGTCTGTAAGATTTGCTGTTACATCAGCAGCAAA
+AGCAGTATCATTTGCGCCATCGGTGTTTGCTACTGTTAATTCAGTATTTGCAGCGTTCCA
+GGTAAAGGTCAATGTTCCTGACACTTTTGCCGCATCTATCGCAGTCTCAACAGCAGTCTT
+GCCAGCAGCAGATAATGCTTCAGAGAATGTAACCTTAGCAGAATCACCATGCGCAATCTG
+TGCTGTTATAGCAGTTGCGACAGTCGGCAGAACACCATCAGTTACAGTAACGGTAATGTA
+GTCAGAATATGCACCTGAAGAAGCGATCACGCGGAATTTCGCACTGTCCTTGGTGAATGT
+GGTATCGCCACCAACTTCAGTTACACTAACTGCTCCACCAGCAACCGCAACAGTATCGGT
+TGCCATACCGGTCACACCGTCCATAGGAGCGAGTAAAGTTGTTTCAGTACCACTTAAGGA
+ATATCCACCGAACTGGTCAGTGACCCATACAAAAACGTCCTGAGCTCCGCTTTGGTCGGC
+ATTGTTATATCCAGCAGCATTTGCTACGGTGTACTCTTCAACATCCTTGGTTGTCGTGGC
+TTTAGCATTAGTAACGCTCGGTGTAACATTCTTGAATGTAACAGAAACTGCCTGAGAAGC
+ATCCTTGGAAATCGTTACATCTTTAGACAGAGTTTTCACGGTGTCGGCAGCATTGACAAT
+CACTGTCAACTTAGCAGTGACATCTTTGTCAGCAACAACTACGTTATTAGTATCAATGTA
+GTATTTGCCATTTACCAGCCCAGTTACAACTTGAGCATTATCAGTAGCTACGCTAACTAT
+ACTCGATACAGGAACTGTATAAGTATTGCCACTGGCATCAGTAGCCGTTACTTTGATCTC
+CTTAGCGTATCCGGCGTCAACAGCGGCTGCATCAACAGCAGCAGCTCCTGCATTATGGTA
+CAGTGTCGGGATATCACCTATGCTGTAAGTTACAGTCCCACTGTCGTTCTTAGCAACTGT
+AAAGGTGTAGGCTTTTTCTGCCACAGCCACACCGTCTTTCATCAGCTGAGCTTTAACAGT
+AGCAGTACCTTCCTTCAGCGCAGTAGCTACAACGCTTACAGTAGTAATATCCGCATCATC
+AGTTTTATTCAAGGAAACTACAGTGTTGTCAGTGGTAACGTAATGAACACTCCAGGAAGC
+GCTGTCTACTGCCGCATTACCATACTGATCTTTGCAATCGAATTGCAATGTCTGAGTTGC
+ACCGACTAACATATTGTTACTTACAGTAGTATCTTTCTTAGTGTCGATAGTTGTTGGAGT
+TGCTGCATCATTAGCTGTTACTGTCACTTGTGCTTTCTGGCCAGAAGCATTTACAGTAAT
+AGTAACGACTGAAGATGCACCCATAACCGCTGAGGCGGCAGGAGTGATTTTTACGCAATC
+TTCGTATCCAGCATCAGCAGTAAAAATAACGGTGGCACCGACAACCTGGCTGTTATCTGC
+AGTTACAGTGTAATCAGCAGCATTCAGATCCTTGGTCGCAATAGCTGTGCCATACTTGTC
+AGCAACAGTTGCCTTAATGTATATGGGAGTTATAGCTCCGGCAGCAAACGATGCTGAATT
+TTTTTCCAGAGTTATTGAGTATGGTGCACTAGTATCTTCGTTAATTGTGATGTCAATGTT
+ACTGCTTTCTCCAGAAGCCGGGCAAAGTGCTGTCAGCTTAACCGTGCCAGCTTTCAGGAA
+CGCACTGATGATAATTTTGTTGTTGGCATCAACCGAGACATTAGCAGCAGGCAGAATGGT
+TTCGTCTGAAGACTTGAAAATCACACCATTGCCTACATCACCAGTAACAAGTTTGCAATC
+TTCATTTAAGGTGTTTTTCGCGGTATAAGTTACTTCAACATTCTTAGTGCCAGTAGGGGT
+GAACATGGTTTTGCCTGTAGGCAGCTGTGCTGCACCTAATGTTACACTAGAAACGGTTGC
+TGTATTGACTACTTCTAAAGTCTTGGTAGCCTTAACACTACCGTACATAACTGTGACAAC
+AACCTGGTCTTTAAGAGTAGCACCTGCTGCATTTAATTGGAATTTGCCAACTACTTGGTT
+GATTGTAGCATTTGCGGTTGTGTCAAAAGCAGTGATAGTTAATTTTGCGTCAGAAGCGGA
+AATGGTTGATTCTGTACCATACTGATTTGTGAACTTAATTGTGAGTGGTGCAGTTGCTGA
+TTTCTGAAGAGCGTTGTTCGCAATCTCAATGGATTGAACTGTTTCAGCAGCAACGGTAGT
+GGTTGCGGTATCTTTACCAGCTTCCAAATCCAACCCAGAAACTGTTACAGTATAATCTCC
+AGCAATGAAATTGCCAGATGTTTTTTCTAAAGTTGCTACGGTTTTGTCATCATTCCATGT
+AGCAGCTTTTACATCCTCAGCAACAGTACCCCTTTTAACCGAGAAAACGGCTTTACTGGT
+ATCGGTTACGGGAGCACTGAATGTTACCGCTAACTTATTAGCGTTAATAGCACTAAAGCT
+TCTGGTTTCCTGTATATTAAAAACCCCGAAAACCCGCATGGGACAAGGGCTTGAGGGGTT
+TGTTAACTTTTCATTGTGGTCTTAATGGATATAATTATTAGCAGGTTCCATAAGGTTAGG
+AGAAATTAGATAATTATTCATAATAGATTTTCTTATAAATCACTGATATGCTACACTTTT
+TTCGTAAAGAACCTCGGGATCAATATCTGCTTGATTGCTCCACTCTATGCTATCAAAACT
+CACCCGAACCGATCTAAATAAATTCTTGTCTTTTAATTCCCTAAAAATTCCTTTGTTCAG
+ATAAGGCGTCATATCAAATAACCTTTTTTCTCCGTTTTCAAAGGTTAAAAGCAGTCTATA
+GCTCTCCAAAGGTTCAACTCCTACTACAGACACATACATAATTCATCACCTCTATTTCAA
+AGGTTCAATTTTAAACGGCAATTCGCTATTCATTGCCAACACCCAGTTTGCCAATAAATC
+TTCCTGTCTTAATTCTGCCCAAGCAAGGACAAGTTTAAGCTGTTTTTTAGGGAGACTCCC
+ATTAGTTAGTTCACAAGTATTTATATCAATTATCGCCTTATGCTTCCCATAATATGCATG
+AAAGTGAGGCGGGTTATGCTCACCAGGGGCGCAATACATTCTTATAATTATCCCATAAAA
+CATACAAATGGTCGGCATTATATCACCTTTTTCCCTACAATACTCCACATCTATTATACC
+ATAAAAACACACTCGTGGAATAAATATTTTTACTGGTTTCTTAAGAGCGTTTCCACTTCC
+CGCTTAAACCCATACTTCATCAGGTATTCCACTAACGCCCCTTCCATTACTCCCCTTAAA
+GCGACCTTCTTTTCTTTGCTAAATTCCACAGCCAGCTTGGCGACAACCTCGCTCATATAA
+ATGGCCTTAGTCCTTACCTCCCCTGGAACAGCGTAACGTGGAATGATGCCATCCTCCCTG
+GTGCCGGTGATTAGCTGATATAGTTCATCCCGGTTTTCATAGAGGAAGCGGAGGAAGGGC
+AAATATTCCCCAAGCCCTTCCGGTATTTCCCCGTTATTTAGTTGAGCAGTTGGTCCCGGT
+ATTGGCTCTGGCATTGATTGACTGACCGGCTCCGGCACATCAATCCTGCCCACCGTCTTA
+ACGTAGTTGTTTTTATGGACGTTCCACTCGTAGCCCTTGGTTTTCATATACTCAGCCATT
+TCCTTGTGGTCTTGAAAGCCCTCCTGCTTGGCCACCAGCCTGGGGTCTGCTCCTTCCATC
+TCAAAGGCGGTAATGATGCTGGCTACCTTGGTGGGTGCGTAGCTTTTGGGGTCCGGTTTT
+TCCAGTCTGTTCCGCATAGGAAAATACTGACCCTGCTGGCTGTCAAAGGCAAAATTCTTC
+CGGCGCATGTACATATCAAGGCTCTTCCAACTCTTGTACTTCAGCTCTGCCGCCACTTCA
+TCCCTGGTTTTAAACTTTAACATTTCAATAATCTGCTTAACCTTCTCATCATAAATTGGC
+TTTTTCATGGTGTTTCTCCTTCCCTACAAAAGATTAACCGCTTCAGTAAGCTTGCCCGTG
+TCCTGGTGCAGGTATCTGGATGTTACCCGAAGGCTTGAATGGCCCAGGAGTTTTTGGATA
+CTGACCACCGAGGCCCCCTTCTCCAGTAGGTTCGAGCCAAAGGAGTGCCTAAGCACATGA
+GCGCTGATGGTTTTACTCCAGCCCAACTGTTCTACCGCATCATGGATGCAGCGATTGATA
+TAACTGTCGGAAACCTTGCCGGTTCTAGCCAATGCAAAGAAGCGGTCGGAATCCGCCTTC
+CGGATGTGCTTTAGGTAATGGGTGAGAATCTGGTGGAGTTTATCATTGATGGGCACATCC
+CGATCCTTGCCGCCCTTGCCGTCAATGATGTGCAGCACTTTGCCTTCTAAATCCACGTCA
+TTCAGTTTCAAATTTATCATTTCCGAAATCCGACCGCCGGTATAAAACATGGCTTGGACT
+ACAGTTTTAATGACTGGTTGCTCAATGGCGGCTACCAATTCTCTCAGTTCATCCTCGGTG
+ATAAACTCCCGCTCCTTTTGCTTGATTTTCACCGGCTCCAAAAGGCTGGCGATGTTCTTG
+GTGCAGAGGTCTTTCTTGCAGCAGTAATTGTAAAAGCTGCGTAAAATATATAACGACCGG
+CTCCTGCTGGCTGATGCTGAGCCTCTTTCCTTTTCATAGAGCAAATAGTCCTCCAAATCC
+TGCAGCACAATATCTTCTAAATACACCGGGCAGTTGTGCTTGACAGTCAAGAAGTTATTA
+AACCCTTTCAATTCTATGGCATAGCCCCGGATGGTTTCCTGCGATCTATCAATAAGGTGC
+ATGTACTTTGCAAAACCCTCGATTGCTTGGTTTAAGAGCATTTCTCTCCCTCCTTTGGTA
+GGTAGCATATTACCGTTACATTGGGATAACATCAAGTTATAATTACCTAAAGATTTAACA
+AGAAAAGTTAAGTATTCGGGCGTTAAAAAAAAAGAAGCCCCGGACTGGTTTTCGTCCAAG
+GCTTTTATCTTCAAGGCGGCGGGTGTTTTTCCAATAATAATGCCGCCATCCTCTCAATTA
+AGGCAGCGGCATAGGCTCCGTTTACGGTTTTTCCTTCCCTGGCGTTTTGTTGCCAGTATT
+CAGGTGTATTAATTATTCCTTTGGCCACTAGAATCTTTAAGGCTTCTGCCAATTCATCCC
+TGGGCTGTTCGGTCAATGACTTCTTGAAAGTATGCCACCTGGCCCAGTTGTTTTCCCGCA
+TGGTACCGGGGCAGATTTTCCGGCTGGCGTCATAGTGCCTGACCACCCTTTCCGGTGGAA
+TGAAGTATTTGCCCATCAGGTGTTTGACCAGCTCCACCGTGTTGGCCACTGCCTTTTCGT
+AATCCCCGTCAGCGTTAATGCAAATTTCTACTCCGATGGAATTGCTGTTGGTAATGCCAT
+ATTTCCCGCCACCGTCACCGCAGTGCCAGGAAGCTTGGGAATCCTCCACCAGCTGCAGTA
+TGCTCTTATCATCCACAAAGTAGTGGGCTGAGGCTTGCCGATCTCCACCGTTAAAATATT
+TATAGTGAGCCTCCGCATCAGCTCCTGCCCGTGGATTGCCGGTATCGTGAACGACAATGT
+ACTTGATAGACTGGCCGTTCCTGCTAGAGTGGTTATATTTTATAAGCTTCTTATTTATGT
+GCAGCATGTTGTCCCTCCTTGTCTTCTTTCAGGTTCAGCAATACCGATTTCAATTTTTCC
+GGTATAGGCAACCCAACCCTGGCGGCGTTTTCCATAATGCTCAAGCCTTCATTGGACAGG
+TAGAAAAATATCACAGCGGTACGAACGGCACTGCCCTTTTCAATCAGATAGTAATCGATA
+ATGTGACCTATGCCCACCAAGGAAAATATGAGTACCTTTTTGAAAATCCCCCGAAAGCCG
+ATCTCACTGGAAAGTTTCTTTTCGATAACTGCCACCATCAGGCCGGTAATGTAGTCAATG
+GCCACAAAAGCCACTAAGGCTAATACTAAACCGTCATAGCCACCCAAGAACCAACCGATA
+TAGCCGCCAATAGCGGTAAAAGCCAGCTGCAGGGTATGAATGATATCTTTCATGCAATCG
+TCCTTCTTTCATAAAAAATAGACACCTGTCAAAGATGTCCTTATCGTGTGCTTTCTGTTT
+TGAAGTCCCCCAGGGCCGCTTTTAACTTCTGGGGGAGGGTAGGAAGGTTGTTGCCGAATG
+TGACGTTCAGTTTGAAGCCACTGGCCTCATGGATTTCCTGCACTTCAGTAATCCTGGTAT
+CCATGGTCACGTTCCAGTCCTTGTTTTGAACGGTCACAACATCCCCAACATCCCAATCCT
+GCTGATATTTAAATGGCCCAGCAGTTAAAACCTCGGCTTGAAAGGAAATGACCCGTTGAT
+GCTCAGCCAACTTTGCTTCACCTTTTGCTGGCAGGTCAGCAGTATCTTTAACATCCCTGG
+CATCAACAAAGATAACGTGGCGATCCAGACCAGTAGCATCGCTGCCCAGCATCATGATTT
+CTCTATTGGCTCCCTCGTCTCGACCAGCTACGATTGCATAGTTACCAAAGCCCACCAAGC
+TATCAATAAATTCCTGACTTCTGATATTATCAAACTCTGGTGAGAAGATAACCAGCGGGT
+TTATTTGCTGGCTGGCGGAAAAATCCCTTCCATTGTATATGTCAAATACCCACTTCCTTG
+CATTGAAGTCCGGATAGATATGCCAACCAAGGCCGGTGAGTGTGCTTATCTGTTCCAGTT
+CATCAGCCAGGTTCTTGTATCGTGTTTGCCATTTAATGATTTCTCCCCTTTGCTGGTCAT
+CACCAATCACAAGAAACGGAAATTCCATCTCCGATATCTGTAGACAGTTCCGCCGCACAT
+AGTGTTTCATGACCGTTTCCGCATTGGCTTCCAGGATGTCGTAGGCTTGCCCGACAGGTG
+GGATGGTGATGCGCTGACTAAGGATAGTCCCCAATGCGTAACCCTTGATGGTGAGCATTT
+CTTCTCCCCGTTCACCTGCCTTGATTTCTTTGTGGCGGATGATGCCTACTTTCCCGGTAT
+CTGCACCCAGCATAATCAGGTTGTTGATTTCAAGCTGCTCCGTATTTCGTACCTTCCGAT
+TCGTGACCAGCTGGAATTCGCCAGGCGAGTGGTAGCTGCGGCAAAAGGTAAAGGAGAGAT
+AGTTGTCTACCTCTCCCAATAAATCTAATCCCGGCGATAATATTCTAATCGGTTGCATAA
+AAAAACACCCCTCTCAAGGTGTTACTCCATTTCCGCTAATACCTGCTGCACTGCCGCTTT
+CAGGTTCCCCAGTGCCGGTACCTGCTCCACCGTGTAAACCCCGGCCAGTATGAGCGGCAC
+CCATACGTTTTTAACTAGTGCCGAATTTCTATCAAAAGTCATTATGCTTCACCTCCTGCT
+AACAATATTGTCAGTTCCGCCATAGCCATCTGCAGCCCTTGGATTTGAACTTCAAGCTCT
+CGAAATTCAACAGCCGCAGGGGAATCTACATATTCCCACCAAACAGTCTCCGTTGCCTTG
+TCCGCCTTGATAATGGCGATCTTTCCTACTGGCTTCTCCTGCTCCGACAGCTTTTCCACC
+GCCACAGCTCTGGCCTTATCCGCCTCTGTCAAAACACTCTCATCGTAAACGATACTGCCG
+CTTTCAAATACATAAATCATATTAAAGCCCTCCCTTAATTTTTATCGTAACCTTCGATTC
+CAAAGGTCTGGGTTAGTTTTTCAATGTAGTAGCCGGTGGCCAGGTAGATATTGTGCTCGT
+CATCCACCTTGACATCTGCAATCTTCTCCACTGCCTTATAACGCCAGAATTCCTCCCCTT
+TTTCATTGAATTTAACCAAGGTCTTATCATTATCCCAGGCGTAAACAGCTCCGTCCAAAC
+CTTGGACAGCCCGCAAATAGAAGTTGGTAATGTTAATATCGCTTACTTCAAAAGAGTGTA
+TCTGCCCACCAGAATATTTATTGAATACCCTAATGTCATCGTCATAAACACCAAAGAGAA
+AATCTCCATGCCTACCAAATATCGCCCTTGCCGTACTGAAATATCGTATAGTCCGAAGGG
+TGTCGATATCGTACAACTTGTTGAAAGCCAATACAGTGCGGTCATCCCACAGATGCAGTT
+TACGAAAAACACCACTAGTACCAATTTCTCTTTTCTCTAAAAGAGTACCCTCCGGGGATA
+TTTTGGCTAAATAGTCCTTGGAGCCGGAAGTGTAAAAATAAGTAATGCTAACAACAATTA
+CCCCTTCGCTGTTTACCACTAAATCTGTTACCGCACCTGTTGTACCAGTTATGCTGCAGG
+ACCACTGTTCCACCCCGTACGGGTTAAGTTTTTTCAAGGTTCGGTTGGTATCGGCAATAT
+AAACATTCCCATTCTTATCGGCTTTGACAAAGTTCAAGGCAAGGTTATGACGATATACCC
+ACTGCTGCTCACCCAGCGCATTGAACTTCCTTGCCGTCCAGTCATCACTGGCACCATAAA
+AGTTACCGGTTATATCCACATCAATGGAATTTACTACACCTTCAAATTGATGGGGGATAA
+AATCCGACCACTCTTTATCGGTAGATAAAATGCGGGCTGAATGCTGGCGCAGCACATAGA
+TTTTTCCCTGCTCTTTATCAAGGCCAAAACCATTAATGGGGTTACCGCTAATGTTGTGAT
+CCTCACGCCAGATAAAACCGGCCAGTTGATTATCCAGCTTGGTGATTTCCCGATTGGAGA
+CGGTATAAATGTTGTTTTCGCTGTCGATGAATATATTGTATACGGTAGTTGTGTTGGCAC
+TAGATCGTTCAAAAATTGGCTCGCCTGTTTGGTAGCTGTGTTTGCGCAGGGTATAGTAAT
+TATCTATTGAGTAAAAATGGTTAGTGCCCGGCTCAATAGCTAAAGCATAGGCATTTCTGG
+AATTAGGTATGGTGTAAGAATATACCGTGCTCCCGTTACTTGGATTTAGTCTATAAATCT
+TATAACTTTGATCAGCCACAATAACTGTATTGCTGTTCACCGCTAAAGCGTATATATAGG
+AATTTAGGCTACTTGAAGTCCACATAACATTGCCATTGTTTCGGTTGAACTTCTTCACGT
+AATAAGTTGAGGATTCAGTAACTCCAATATGAACACCAGATGTTTCTACTGCGATACAGT
+AAGGAGAACCAATATTTGGAGTTTCCCAAATTAAGGTGCCGCCTAAAGCGTATTTATATA
+GGCTCGATCCCTGAGCAAGGAAATAGCTACCATCCGTAGCTGCCAAGTCTGGGATCATAA
+GAGCACTGGAGGTTGTGTGGACATTATCGGCAATTACCTCGCCGGACTCAGCATCATAAA
+TGTTCACACCTGAGCTGTGCAGCACATAGACTTTCCCGTCATGATAATGATTGACACCCT
+TGCGGTTGGACGAGGTTCTCAGGGAGTGGTGGGCAAAAGGCAGTCCAATCCCTTTAATCT
+CATCTGATGCTATGATTGGCGTTAACCCTTCAATGGGGATAACTCCCGTATCTCCCATTG
+ATATTTGCCCCAAGCCGTGCAGCCATAAATCACTCATCTGTCATTACCTCCTTTATCCAA
+TTTCCTGCCTCGTCATATATTTGGTTGTATACAACTACAGCCCGTACTGTTTCACCGTCT
+GTCTCATAATAAGTAACTGTACGGTTTTCGTAGCGTGGTGAGTTACCGCCGCTTAGTACG
+GACCGTTTAGCCAGGGTTCCATCTTGCCGGTGCCATTCAATGGTGGTGAAAATCCCCTTG
+TGGTCTTTCCCAAAACGGTAGGTATTGGCCAGATCCCCATGGGCGGAAAAGTCAGCCTCG
+TGGTCTCTAAAAGCAGTCCAGGGCACCAGGTCAGTGGCATCAAAGCTAAGTCCTTGAATA
+TAGTCAAACCACTCTTTCCACTCGGCGTAAAACTCACCGTCTGGTTCCCTAATCTTGCTT
+TGCAGCCAGGCATCCCAGACAACTTCAAAGACTTCGGGGTGATTTGCCCACCAAGCGTCC
+CACTGCTCTTGCATCCACTGGGTTTCACTAGCTATGTCCTGGGGCAATAGCAGTTTGCCG
+CTGATATAGTAATCCACCGCTTCCGGGTGGCTGGCTTTACCCTCGATAACTTCCCACGAT
+ACAATAACCTGATCGAATACCGATGCTTGGTAGGACTCACCGGCTGATAGAATTTTATCT
+CGCATCACATAAGCCCCGGCCAGCTTTAGGCTGACGGTCTGCGCTGTATCGGTTAAATTG
+GTTAAAATGATTGATTTCAGCACTACCACCCGATCATTGGGTACCTGGTATAAAGGCTCA
+AATTCTGTGGGTAGTTCCCCTTTGGCAAGTCTGATGGCACTGCCCATATTACATCCCTCC
+CCAGGTGTTGATTACCGGTTGCGCTTCCAACCTGCGCCATTTGCCATCATTGATTTCAAC
+TTCCAGATTACCGCCCCTTAAGCGTAGGCCATGGGTTTCCTCTCTTACGGTGCGGTCCCG
+GTGGGCTTTAAACTGGCTCCATGGTACTAGATTAGTGATGTCTTGTATTTCTTCAAACCA
+ATCTTTCCACTGGGTGTAAAACTCACCGTCCGGTGCCGTTAATTTTTCGTTTACCCAGTC
+CTGCCAGACCCTCTGCGCTTCATGGTCAAACCAAATATCCCAGTCTTGCTGGATTCTATC
+GAACCAGGTTTTCCACTGGATGTAGAAGGCACCATCCGGAATGGTTAGCTTATCGTTTAC
+CCAGTTAGTCCAGTTGTTTTGGAAAGCGGTGAACTTTGATTGCAGCATAGCTAAAAAAGC
+AGCATGCTCAACACTGGCATTCTGCTTTTTATCTGTCAAATATTCAAGCCAGGCGGCAAA
+CTCTGTATCCCCGTGTGCTCTCCTGGCATTGAGGTATAACTGCCATTCGTTAAACAGCTC
+GGTGGTGTCCACCTGTTCAAATAAATGGGTGACCACGCCGCAGACGGCAGGGTTTAATCT
+TTCATCGGTTATCTGGTATGCCTCAATAAAACTTTTCCCGGCCAGTACCACTACCTGTGC
+CAGGGCCAATTCATAGATGTTTTCATTACGGGTTAGTTCCGGTACTTGGGGCGTTTCTGC
+AGCAGTACCAGTTAACACAAAGGCTTTCACATAGCGGTTTTCTAAAGTCTTATCTAATCT
+GATCACCACCCGGTCGATACGGTCGTAGTTGGCATGGGCCATGGGGTGGTAAAGTTCCAA
+AGGCTCGATGTCAATTTTGTAGAGATAACCCTCAATCCAGGCATAGCCAGGTTTAATAAA
+TGTTCTCATGTCCTGGCCTTGTGCTCCTACCTGCAAGTTGTCCCCGGAGCCGTTGAAGAT
+GCCGTTTCTGATAAACTGGCGGAAGTATTCAGCGAACTCATCGGCGGTATAATAGCGTTC
+ATCTTCGCCGTCAACTGAGTCGAAAAATCTGTAGTGTTCAGCCACAAAAACCCTCCTTTC
+TAAAGGCCCACATAGCGGTTTTTCCACTTAACGAGAACCCTGGTCTTGATACTGTCGTTG
+TTGCTGGTGTAGCTTAGTGCATTTTCTCCTGGTACCAGTTGCCAAAACACACTGTTAAGA
+TCAATGTAATGGAAGGCATTTTGCCCGTTAATCTTCACGTATTTATGCCCGAAGGCGGTA
+TTGACGGTGAGCACATCTTCCTCCTCAAGCTCACGATTAACTTTGATAAATTCCCCGGTG
+GTTAGGTTAGACACGGTGGGATTCACCGCTGGCCCTTTGAATTCAATCTCCACTGGGGTT
+GCCACATCACCGCCATTGATGGCTCTACGCTTGAATCCCCGGTAGGAAAACATGGTGGGG
+AGCATTAGCCTGAATTGAATTCCACCCATGAGATAAGACATCTCCCTGCTTTCAAAATAG
+GGGTCTAACCAAAATGGCTCATGGCAAATTAAATGTAGCAGGAACTTTTGATAATACAAA
+CCTTTGCTGCCTTGGCCGCTGGGAAAGATGGGTGTAGACTCCGCTATGCCTGTAATTTCT
+TTCACCTGATTTCCCTGGTGGTAGGTGATCGTCACTTCCCCCAGTTTTGGGTTTAGTACC
+TTCTGCATTTTCCTTCTTGCCATCAACACCGCAGCAGGATCGCCTTTGGTGATAATTGTG
+CCTTCAATGCTAACGGCCCGGTTATCCAATGTGTTATCAATAAAGGTGGAGCCATCCTGT
+TTCGGTGCCTTCTGGCTTTCAAGGGCTACCGGTACTTCGCCAACACCATCAATACTTTCT
+AGGAAATAAGGGGCTTGATTGCCTAATTTTATGCTTTCGCCGTTTTTGTTCGTGATGATA
+ACACTGTCCACAATCTCACCTCCTACCACTCAAGAGCCAGCTGCCGGGATGCATTTTTTA
+TCCGCCTAGCGGTTTCTGCCGGGGTAAGCGGTGTGGGGGAGTTAATCACGATATTTTGGG
+TAATGCCTTTATCCCCACCAAGGATCTCCTTTGTTTCGTGGTCGCTATAAATCCTACTTC
+CCCTGGGCAAGGCCACTAGCTCCGGCCCTAATTCACCCACCATAGTTAAACCACCGGGAA
+AGAAGCTGGTGCCGCTGTAGTTATCATCAGCCCCACCACCGGAAGTAACTGTGCTGATTA
+CCCGTGTGATGCGCTCCACAATGCTAAATACCTTCTCCTTAACACTGGTGGCGTTCCATT
+CCTTAATCCGGTCAATGGCACTACTGATGGCACTTTTAACCCGATCCAATGATTCGTTCA
+CTTTATCAGCCATAGCGGAAAACTTCTCGCTGGTGACTTCTTTCATGGTGGTTAATGCGC
+TGTCCCAAACGGATTTATAACCCTCGGTGTAGCTATTAATTAAACCTTTAATACCACCGC
+CATGCTCATCAATTTTATTTTGTATGGCCTGCCAAGTTTCAGCGGTTTTGGTTTTGATGT
+TGTCCCAGGTTTCATAGGTTTTAGTTTTAACCTCATCCCAGGTGGTGCTGACATTGGTTT
+TAATAGCAGCCACGGTTTCGGAGGTATTGGTTTTAATGTCATTCCACCTATCACTCATGG
+TAGAGCGGATGTTTTCCCATTGCTGGGATGTGGTAGTTTTAATTTCTTCCCAGGTGGAAA
+TCACATTTTCTTTAATGGCCTGGGCTTTGGCGAAGATGTCGTCTTTCATGGCCTGCCACT
+TGGTTTTTATCTGGCCGGTTTCCCAATCCACCTGATTAACGTGCTCTTGAGCTTGAGCCT
+TAGCTTCCTCCACTACCCGCTGGTGCATAATTTCAGCCTGTTTAACCGTGTCATCCTTTT
+GCCGGGTGGCTTCTTTGATTAAGCGATCCGCCTGATCTTTGGTGATGGTGCCTGCTTCAT
+CCCGCTGCCGGATAATTTCCTTAATTACCCGGTCGTACTGTTCATTAGCCGCTTTGATGG
+TTTTATCCTTTTGCTCAATGCTGTTTTTGACCACTTCGGCGGCTTGCTTGACACTAATCT
+CCCCGGCCTGGGCTTTCATCCGTTCCATAATGGCTTTGGCTTCGATTTCATTCTCGGAGA
+GGACTTGAATGCCGGTGTCCACCATCTGCCTTTGGATGGCATTAATTTCTTCCTGTTCAG
+ACTTGGTAAGCGCCCTTTTCTCTGCCGTAGCGGTATCCAGTATGGTTTTTATCCTGGCTT
+CCCCGTCAGCTATGGTTTGTTTTCTGTTTTCATAGCCCTGCTGCATATTGTTTAATATTT
+CATCCTGCTCCTGCTGGGATAGGGAAGTGCTACCGGCAACAAAACCCTTAATTTTAGCCA
+GGGACTCTTCATGATGTTTAGCCAACCCCGCCTGCACTTGAGAAGCCATCTGTGAGAAGT
+TACCGGCAATGTTGTCGGCCATTTCTTTGGTAACTTCTTGGCCACTCCAAGACAGCTGGT
+TTAAAGCAACGGTGGCTTCATCATTCAGTTCTAAAAACCCGCCTACCGCTTCTTTGGTTG
+CTTCAGATACTTCCTTACCAAACAGTTTAATAGCAGGGATGCTCTCCTGACTTAAGTGTT
+TATATAAAGCCACCCCTGCCACCGTTAATCCAGCAATAGCAGCTACCGCAATCCCCACCG
+GCCCGGTTAAAACTGTAAATACTGTGGCTAAGGCACCAATGGCAGGTGTTGCTGCAACTG
+CTCCGGTGGTGGCCACAGCAATAGCCCCGGATACTGTAGATAGTACTCCTGCTACAGAGC
+CGATAACTCCGATAAGCTTGCCACCAATAAGTAATAGCGGGCCAATGGCTGCAGCCAAAC
+CCGCTACTACAAGAATAGTCGTCTTAGCCCCATCGCTTAGTTCGCTGAATCTTTGGACGA
+GGGGAGTAATCCCTTCCAGTGCTTTGGAGATCACCGGCAGCAAGGCATCTCCAAAAGCAC
+TGGCTGTTAATTGTAGTTGGTTTTTGAATAATTGTATCTTGGAAGCTGTGGTGCCAAAGC
+GCAGTTCCGCTTCTTTGTTAAGGGCATTGTTTTCTACCCAAGCCTCACTACCCAGTTCCA
+AGCTTTCCCTGAACAGGTCACCTGCACCGGATGCCCGCAGTAATGCGTCACGAACCCGGA
+TTTCCGATAGGCCCAGATCCTCTAAGACTGCAAATACATTGCCGCCGCTTTTTGCTGTTT
+TATCTAAACCCTCAATAAATGAGATGATCGCCCCGGCTGCATCTTTTTCAAAAGCTTGTT
+GGAATTGACTAGCTGACATACCCGACACTTGGGCGAATTGTTCTAACTTTTGACCTCCGG
+AAGCTACGGCATTAGCCATGTCTACCATGACTCGGGAGATAGCGGAACCGCCGGATTCAG
+CCTCAATACCAACTGAACTTAAAGCACCGGCAAAGGAAAGAATCTGGGCTTCGGTTAAGC
+CGACCTGACTCCCGGCACCGGCGATACGCAGCCCCATCTCCACGATTTCGGCCTCGGTGG
+TGGCCAGGTTATTGCCTAAGGCCACAATGGTGGCACCCAAACGGTCAAACTCGGTTTGCG
+GCATTTGGGTAATGTTGGCGAGCCTGGCCAGCGCAGTTGCCGCCTGGTCGCTACTCATGT
+TTGTGGTTACGCCCAGCTTGGCCATTACATCGGAAAATCTTAAAATGTTTTCTTTTTTAA
+TGCCTAGTTGTCCGGCGGCTTCACCGATGCCGTAGAGTTCTGTAGTAGCAATCGGCACAG
+TTTTAGCCATGGTTTCAAAGCCCTGTTTAAGTTCTTGCAGTTCCTGTTCGGTGGCATCTA
+CCGTCTTGATAACCCCGGTAAAAGCTGTTTCTAAATCAATGGAGGCCTTGGTCGCTAATG
+CTCCAAGACCCACCAGGGGTGCCGTAACCTTGGTGCTCAGTTCCTTACCCGCTGCTTCCA
+TCTTTTTACCGACAGCCTGCAGTTTCTCCCCGGCAGCCTCCAGTTCCTTGCCCAGTTTGC
+CCCAGCTAGAGGATTGCAGGGTTAATTGGTTATTGACATCTTTTAGATTCTGTTCCATGG
+TCACCAGCCTGGCACGGGCTTGGTTTAATCTGATTTCTAATTCCTGCGTGACCCTGGCAT
+CAGCACCTTTGGTTTCAACCGCCTTCCGGTGGGCTTCCTCCAAGGTTTGCACCCTTTGCC
+TTTGCAGCTCTGTTTCCTTGGTCATGTGTTCGGATTTAAGGCGTAGTTTATCTAATTCAC
+TGCCGTGTTGACCAAGTTGGGCACTGGCTAGTTTAAACTCCGATTGCAGTTTTCGCATTT
+CAGTGCCTAATTTACTGATTCCTTCTTGGAAGCCTTGGGAATCTAGGAATATCCGGACAC
+TAAGATCACCAACACTTGCCATCTGTCTCACCACCTAAAAATAACGCCGTCAATAGGCGC
+TACAATATACTGTCGATATATACTTTTTCAGTTCCTCGTTTTCGGTTAAGCAACTTCAAG
+TAATAAATGATGTCCGTGGAATCAATCTCACCCATAGTCCAGCCCTGTTCTAAAAGAGCC
+AAATACAGCCGGTCAATAAACTCTTGGGGCTCCATGGCGTTTCCCGCTATTCGTTTTTTC
+CTGCTGTGGCCTCTCCCATCGCTCCCACCACTTCATTGATACAACGGGTAATGGTGGGGA
+TTAAATCCTTGGAAGCCAGGCCGTCATAAAGTTCATCACGGGTAAATTGACTGCCGAATA
+GATCCACGATGTAATCCATTAATTTGTCCAGTTCCTCGGGGGCAATATTGTCGAAATTTA
+TCTCTTGTGATACGGCAATGGTTGTTCTCACCATCCGGGCGCTAATAAAGCCAGCGGTGT
+AGGTTTTGTCCTTGCCATTAGTTTTAAGTACAATCTCCAAGGTTTAACCCTCCTCCGTAA
+TTATCGCCGCTTCAAAGGCAGATACCGCTACGGCTAAAGTGGCCAGTGCCGCATCGACCT
+GGGCTTGGGTAGCGTTTTCATCATCCACCACGGCTTGAGCGGCATCGATAGCGTCGCTGA
+AGGTGTCGTAGGCTTCCTGGGGGTATTCTCCGATGCCAGTACCTACAGTTGCACCAGCTA
+ATAAATCTTCGGCTTCACCAATAGTGGCAATGAGGGCAGACTTATCAACCACTACTGGAC
+TGGTATCACCCGGTACCCTACTGAACCAACTTTCAAATCCAGTGAAACCCTGCCCGTCTT
+CGTCTGCTGTGTGCTTCCACTCACCGTCATGCACTCTGGCCATAAAGGTAAACTTCACTT
+TAGGGGTTTTGTGTTCTACGTTGTCCTTTTTAGTGGAGAAGTCCTCGGCCATGGGCTGGG
+CTACTCCTTTTAAGAGCCAGACATAGCGGTACTTGCCGTTGGACTTAAGACTCTTGAAAC
+CTAAAGCAATATGAGGCGGAACGTCGGTAGCCTTTTCAATGAGCACCCCGTTTTTCAACT
+CATTGCCTAAAAGTTTGGCCCGGATAGTTAAGGGTAGTTCCGCCGTTTCTATTTCCACAT
+CCACCTTGCCTAAAGCCGATACCGATTCCCACAGCTGGTCATCAGCGTAAAGCTCCTGAG
+TATTCACCGCCGGGTTGATAGTGGCGTTAATGGCTCCCACCAAGGCTTCGGTGGGTTCAT
+AGGTTAACTCATCTTTAGTATCTGCGGTAAGAATAGCAAAGTGTAAATCATTTAATCCTA
+CTTGTGCCATCTACAGCACCTCCTTAAAAAATCGCATGGCTTTGTGATAAATTCCTAAAT
+CCTGTTCGTACAGGTCATAAAAGTTCTGTTTGGTAAAACCGGCAGTCAGCATCTTTTGAT
+GGATTGATTTGACTAAATCTGTGTAATCGGTTTTGCTCCACACATCAACTTGCACATAAT
+GGCCAGTAATTAACTCCGCATCATCGGCATGCTGCTCCGGTTTATCCAGGTAGGTGAAAA
+AGGTGATGTAGCTATCGGCTTTGCCTGTGTAGTTTTGGAATTGTACCGGTACTCCTATAT
+CCTTTAAAGCCGTTATTATATTTTGGTTCATGCTCATAGGCCCAGCCCCCTTCGCAGTTC
+TTCCTTGATGGTTGCTGTGGCCCGGTCTTTACCGTTTTCATAGCCCGGTGCCATGAAGGG
+TTTAGCTCTCATTTTGACAGTTCCCAGTTCCAGAAATTTGCCATAATAGGCTTCCTTACT
+CGGCCCCACTGCTACATACTTAACCCCATCCTGGGTTCTCACACCGGAAACGGTAATGCT
+TTCTTTTAGCTTGCCAGTCCGCACTGGAGTTTCGTTTTGGATGGCCTCTTGCATTACAGC
+ACCGGCTTCTTTTAAGGCTTTGTTTTCTATTTTCTTGCCCTCGCTGCCCAGCCTTTGAAC
+GGCATTGATGAGGGCTTCCAAGCCCTCTAACTCTACCCTAGCCACTGCTTACCACCTCCA
+GTGCTTTGATTTCCAGATACCGGTTTTGATATTTGATGTTGTCAATAGCGGTGATGTTGT
+ACTGTTTGCCTTGAAAAACAATCCGCATGGTGGTATCCAGACCCGTTAAATACCTAATGG
+TAAACTTCACCGTATTCTCTGCCTGGACAGCGGCGGCAGCAAAGTACTCCCGGCCATGCA
+GGTTGCTCACTGCCGCCCATACGGTCTTGAAATCCTCCCAGGTTTCTACCTCAAAGCCGT
+TCTCATTGACGCTAGTGGTAAGTTTCTGGAAAGTTATCCGGTGTCTTAAATCCCCAATCT
+CCACCTGCATCACCAGCTTTCCCGGCGAAGGTTTGCCAGTATCAGTTTCATCACATTTAC
+GGTTTCAGCCATGCCGCCGCCTTCGTTTTTAAGATAATAGTGGGTTCCTTCCCTTTTTTC
+ATACAGATTGGCCACACAGTACAAAACCGCTTGCCTGACTACCGCCGGTATTTCTTCAAA
+CTCCGACAAGGGGTATCTTAAGATATCCTCGCAAATTTCCACGGCGGTAGAAATAAAATT
+AGTGATGAGTGTATCTTCCTCATCACCGTCTATCCTTAAATACAGTTTTACTTCTTCCAG
+GGTTACCACCATACACTCACCACCTCCCGCTGTTTATTCCGTGATGACCGCTGCTTCAAA
+GGTGGATACCGCCGTAGCTAAAGCAGTCACAGCATCGTCTACATTGGTTTGGGTGGCATC
+AGCGTTTTCCACTACTGCCTGTGCTGCACCAATGGCAGTTTCAAAAGCAGTAACAGCCTC
+TTGCGGATATTGGCCAGGCTCGGAGCCCACCTGAGCACCATCCAGTATATCTTGAGCGGC
+AGCAATAGCCGCTCGAAGAACAGATTTATCTACAGTGATTACTGCTGCTTCAAAGGTGGA
+TACCGCAGTTGTTAATGCTGCAAGCGCAGTACTAACTTCGTTTTGGGTAGCACCTGTATC
+ATCCACCACACCTAGGGCAGCTTCAATGGCGCTCTCAAAAGTATCGTAGGCAGCTTGCGG
+ATATTCCCCAACATCCTCGCCAACCACTGCACTATCTAAAAGTTCCAAAGCTGCGGTGAT
+GGCCGCTTCAAGTGCTGATTTATCCACCACCATCAGACCGGCAGCAAAAAGCCGCCCCAA
+GAGGGAGTTGAAATCCTCTTTTAGAGCGGCAACAGTGCTGGCTTCACTGTTAGTTTGGCC
+TAGTGCTGGTTTTAGTTCGGTTCCCTTGAAGGTGAGCTTACCACCAGCTGTAATCTCCAG
+CTGGCCACCCACCACCCATTTCTGCCCGCCTTGTTCGTGATAGTTTTTAACATTACTCAT
+CTACCATCACCTACGCTTTCACCTTGAGAATTTTAATGGCTTCTTTAAGGATCAGCTTGC
+CATCCACCCGCTGCGCTGCCCTAAACCCTACTTGACCGGTGGCGGCATAGAGTTCGTTCA
+GCCTTTGAAAAATCCTTCCCTGACGGTCAGCAATCCAGTAGTAGCCCATATCACCGAAGG
+CGATCACTTTTTCCCCAGCGGCAATGGTGGGCACATAAGCCGAGGTCTTGACGGGACGGT
+TTAACAAAGTGTCCGGGTCGCCTGCAGTGAGGGAGGGCTGCCACAGGTACACACCGTTAC
+CGTCTTTTAGTTTCCTGATTTCCTTCACCGTGGCATCGTTCATGATAAAGACAGCCTTCT
+TGCGGTAGGGGGCTTTTAGGGAATAAAAGAGGTCGAAAACCTCATCCGCTTTAAGAGTAG
+CCCCGGCAGTGGTTGCTCCAATCTCCCCGCCACTGTCATTGTCAAAGATGCCGGTGGGTT
+TCCCCTCACCATCCCCGATTAAAAAGGCTTCTTCTTCCTTGGCCCCAATGCGGCGAGCGA
+ATTCTTTAGCAATGTAGCTTTCCAGGTTAAAGACGCTGTCGTTTAATAGTTCTTCGGAAA
+CCTTAATCATGGTGGCCACCTTGTAGGCCCCAATGGATACCTGGTCAAAAGCATCATCTT
+TATCCTGATACGGCCCTTCTTCATCTACCCAGGTGGCCACCCCCTTGGAAGCTACCACCG
+GGATTTTCCGGTCACCGGTAGAGGTGGTAATTACTTTAGCCAGTGTACGCATGATGTTTT
+CTTCTTCCAAGGCTTCAATCAAGGTGCGTTCGAACTCATCAGGCACCAAATATCCACCCT
+CAGTGCCGTCACCGCCAATGGTTAAAGCGTTTCTGGCCTCATAGCTATTGCGGTTGCGCA
+TATACTGCCAGAAAGCCTTATCGTATTCATTGGAAGCCCGGCCTTTAGGCTCATCACCAG
+GAATAGTTTTTAATGCTGTGCTGGTGGCCTTGGAAAGCTCAAGGTCAATGGCGGTTTGAC
+GTTCCAGGCGTTCAATCTCTTTACCTAAATTGACAACTTCGGTTTCCATTTTCTCATAAG
+TGGCGGTATCCTCAGCAGAGAGAAGACCGTTTTCACCACGCTTTTCATCCAGGAAGGCCT
+TGGCTTGTTCCCACACTTTAGTCCGCTTTTCCCGCAGTTCGATAATTTTACTCATGGTAT
+ATTACCTCCCTTTTATTAGTTCCAGCCGTTTAATTAGCTGTTCGTATGGAATGCCATCGT
+TGTTTACTGGTTTAGGTTGAGCCTTGACCGGTGGTAGTTTCCGCATCAGTGCATTGACCA
+CTGTTACCCGGTCAAACATGAAGTCAGTGACTTGGGCTGGCGGCTCACTGTAAAGGATCT
+CGTCAGCAAAACCAAGCTCCACCGCTTTATTGGCGCTCATCCAGGTTTCAGCGTCCATCA
+TCTTAGCGATCTGCTTCCTGGGTAGTCTGGCCTTGGCTTCAAAGGCATTAATGATGGCTT
+CCTTCACCTCGGACAGCATCTCGATTCCCTTTTGCATGTCAGATTCTTCGCCCCAAACAA
+AAGTGGCTGGATTGTGGATCATAAGCATAGAAGTGGGGGACATACAAACCATATCGCCCG
+CCATGGCAATTACCGCTGCAGCGCTGGCGGCAATACCGTCAATTTTAATCAGCACTTGGC
+CGCTGTATTCTTTGAGCATGGTGTAGATTTGGCTGGCTGCAAAAAAGTCCCCGCCTGGTG
+AGTTGATATAAACTGTGATGTCACCGGTTGCTGCTTCCAGCTCTTTTTTAAATTCCTTGG
+GGCTTACTTCATCTTCAAACCAACTCTCCGGGGCAATATAGCCATCCAGGTAGAGGGTTC
+TCTCGCCTTCGTTTTTAATCCAGTTCCAGAATTTATTCATCTGTGTCCTCCTTTCTGTAT
+TTTTCAGTCCAAGCCCCGGCATCAGCCATGTCCACGAAATTTCCGTTGACTAAATATTTA
+TTTCCGCCTAGCTCATCCGGGATTAGGTTCATGGATTCTAGCTCTCGAATGTCGTTCGCT
+GACATGATGCCATTTTGCCGCATGGTCTGGTAAAAGGCGGCCCGTGATTGAGCATCTCCC
+CTGAGCCTGCCGTTAAGGTTGAACTTGACCAGATATTGCTGTTTTTCTCCACCAAGGAAC
+AAGGCCTTTTGCATGGCCTGTTCAAAGCGGGCCACCCAAGGAACAATGGTGTTGTCGATA
+AAACTGATGCTTTGGCTTTCAATGTTGCTAAAGGTTGCCCGCTCTAAATTAGCCACTAGG
+TGAGGGGGTACCCTGAATATCCGACATATTTCCTCAATCTGAAACTTCCTGGTCTCCAAA
+AACTGTGCTTGCTCCGGTGGCATACTCAGGGTCTTGACGCTCATACCTTCTTCCAGCACC
+GCTACCTTGTGAGCATTTTCGCTGCCCCTGTAAATCTGGTTCCAGCTGTCACGGATTTTA
+GCCGGGTCTTTTAATATGCCGGGATGTTCTAATACCACACTTGGCCGGGCATCGTTGGCA
+AAAAGTTTGGAGCCGTATTCTTCTGTGGCCAGTGCCATTCCGATGGCATTCTTGGCCATG
+GCAATCGGGGAATAGCCCACCAAGCCATCAAAGCTAAGGCCCGGAATGTGCAGCACTTCT
+TCCCGGCGCAGTAAATACTCCCGGCCTTCTTTTTGGTAACGGTAGTACAGCTCTCCTTGT
+TCTGTGCGGCCAACATCCATGCGATCCGGCAGCAGGGGATATAAACCGATGACCCTACCC
+CGGCCATCCCTGATAATCTGAGCGTAAGCATTGCCCCAAAGTAAAAGATGACCCATCAGT
+GTTTCTCTGAACACAAATGAAGTCATCTCGGGGTTGGGCTCATCATGGAGCAGGTAATAT
+AAATTGTGATCCATGGCTTTTTCCTTCCCTTGGCCTGTGCGCCGGTAAACGTGGAGGGGT
+AGGGAGGCTATGGTTTCCGAGAGTACCCGCACACAGGCATAAACTGCTGATGTGGCCATA
+GCTGTGCGCTCGTTGACGGTTTTACCGCTAGGTGTGGGGCCAAAGAAAAAAGCCTGGGTA
+TTTTGCCAGAAGCTGTTCCTAGGACTGGCTCTGGACTTAAACAGGTTTGATAGAATAGGT
+ATTTTCAGAATCTCACCCCCCTTAAAATGAGCATGAAAAAAGCACCTCGGTTGAGATGCC
+CTCATGAACCTTAATATTTAAATTTTTGTGCTTGACAGTTGCAGTTCTATATTACGCCCA
+CCATACATTATCCTCACTACTGCAACCAGTTTTTCTTCTTCAACTACCACATAAAACACC
+AGGTAATTATCTACCGGAAGGACCCTCAAACCCCTACTGTGCCAAGGTTCTTTTTGGTAA
+AGTTTATGCCTGAGGGGCATTTCATCCAGGCCATTAATCGCATCCATGATTCTGTCTGTT
+TGATTTTTTGCGGTTTCCGGCACAGATAAATTTATGGCAATGTATCTGTAGATATTTATA
+AGATCCTGTTCGGATTCTTCTGTATAGATGATCCTATAGCCCATGGCCATATTCCTTACC
+CATACGTTCGGCTACCTTATCCGCAGATACAACCCTGCCTGCTTTCAAATCACCTAGTCC
+CTTTTCAATTTCATGGTTAAATTCTTCAGGCGTTAAATCCCCAAATGCAAGGGGTCTGTT
+ATGTGTAATCTTAACTTCAAAGGGCAGCCCGTTTTGTAAAACAACCTGCCTTAAAAAAAT
+ATTGATGGCGTTTGACATGGGTATGCCAAGTTTATTCAACACCATTTCCGCCTGTTCTTT
+TATTTCCGGCTCAACCCGAGCAAAAATACTTGTGGTTTTGGACATGCATACCGCCTCCTT
+TATGATATTTATATTTTACCATTTTGTATTGCGATATGCAATATATCTGCAAGCCTAGAA
+CACCACCAGCCCTCTCTCATCATAGACCGATTTATCCTTTTCCACCCCTTCATTCCGGAT
+ACACCGGTCTAGCGCCATAATCATAGCCACCGCACCGTCAATCTTCTCTGTTGATTTGGC
+TTTGTCCGGCTTGATATTACCGGCAGGGTCGGTGCGAATGTGAATGTTATCCATCATCCA
+AGATAAAACCGGGTGGCCGCCATGAGCGATTCTTTTCTCCAGGGTCAGTTTCATCAGTTC
+TTTGGTGGGTGGGGACATATCTTTAAAGCCCTGGCCGAAGGGAACCACGATAAATCCGGC
+ACCCTCTAAGTTCTGCACCATCTGCACAGCACCCCAGCGGTCAAAGGCAATCTCCTGGAT
+GTTGTAATCCTGGCCCAGCTCTTCGATAAATTTTTCAATAAAGCCGTAGTGGATGACATT
+ACCCTCGGTGGTTAAAAGGTATCCCTGGTTTTGCCAAATATCGTAGGGTACATGATCCCG
+GCGCACTCTAAGGTCTAAGGTTTCCTCCGGCAGCCAAAAGTAGGGGAGAATGTAATACTT
+GTCGTCCCCATCCACCGGTGGAAACACCAGCACAAAGGCGGTGATGTCAGTGGAACTGGA
+TAAGTCTAGCCCGCCGAAACAAACCCTGCCTTTAAGCTTTTCTGGGTCTACCGGGAAAGC
+GCATTTTTCCCAGGTGTCCATGGGCATCCACTTTATCTGCTGTTTCAGCCACATATTAAG
+CCGCAGCTGTTTGAATAATGCTTCCTCCGCTGGTTCTTGTTTGGCTTGCAAGAAATGTTC
+TCTGACCCGCTCTATTTGAATGGTATGGCCCAGGCTTGGGTTGGCTTTATACCAGTTGGC
+TTCATCTTCCCAATCGTCATCTTCCTCCAGACCATAAATGATAGGCAGGAAAGTGGGGTC
+AATTCTTCTTCCGGCTAAAATATCCTTGGCCTTGCAATGCATCTCCCAGCCGTAGCCCTG
+CAGCTTGTTACCCGCCGTGGTTAAATAGATAAACAGGGGCTGCTCCCTGGCATCACCGGA
+ACCAGTGGTCAACATCTTGGCCAGGTCAGGGTTTGGATAAGTCCAGATTTCATCGAGGAT
+AACGCAAGATGGGTTAAGTCCTGACTTGGATTTTACATCTGAACTTAACACCTGATAAAA
+ACTACCGGTTCTAGGGTAGACAATTCTTTTGGTGGACATGATGGTTTTAGTCACCCTCGA
+AAGGGTCTGATTACCCTCCACGAAATTAACACTGGTATTGAAAATTATACTGGCCTGTTG
+CCGGTCGCAAGCGGCTACATAGACCTCAGCGTTTGGCTCTCCGTCCGCTAGAAGCATATA
+TAGGGCAATGGCAGCGGCGATCGAGGATTTCCCATTTTTCTTTCCAATTTCTGTATACAC
+GGTTCTATACTGCCGGGTGCCGTCTTCCCTTAAGGTGCCAAAGGTTTGTTTTATTAAATC
+AAGTTCCCATGGAATTAGCTCAAAAGGCTGTCCTGCCCATTTACCTTTGGTGTGTTTTAG
+TTGCCGGATAAAATCGACAACGTGCTTTACCTTTTCTTCGCTGTAGAGCAAGGGCATCAC
+CTCCGATTAAAAAAACCTCCTACTTCGTTACTGTTAACAGCTTTTCCATGGGGTCGTCCG
+TGTTTACCGCTTCAGTGTCAACACTAATCCTCGTCCTAGCCGCCGGTGTTAAACCAAACT
+CGCTGCAGAAATCCTTCATCACTTTCAGGTAAGTTTGGGCGATGGAGACTTGCGGCACCT
+GCTGAATGTACCCGGATGGGGTTTTAAAGATGGTGCCGTGTTTGCTTAAAAACTCCTCGG
+CTTCTTTCCACCGGGCGTAGGCCTGACAGTACCCGGCAAAGGCAGCTTTATCCACCAGAG
+TTAAAAGCCCCATAGCTTCTAAGGTTTTACTCATCCGCCTCCATTCATTTTTGGCCTCTT
+GCTCCAGCCATGACGGGCAGCGGGGTGCCTTGTTTTCAGGCTTGGGTTCGTTTTCATTTA
+ATGGCCTTTTGCCGGGGTTTCCTTCCAGGACTTTAAGTGCGGTGGGTTTGGGTTTTCTTC
+CCCGTGTCGCCATAGCTTTTCACCTCCAATTGAAAAAGGAGCCTCACTTGGCCCCTTTGT
+TTTCTATTTATTTTCTAATCCCCGGAAAATTGTAATTCCCCTTCTTTATCTCATCAATAT
+CGGCCTGTACCGCCTTCTCGTAATCCCTGTCCTGCTTTTCTTTGGCCTTGCAATCCAAGC
+AGATGCAGTCCTGGTTGAACATGGACATTGTCCGGCCACCCTTTAAATCCCCGCCGCACC
+GATCGCAGTGCCTTTGGGAAAAGAATTTATCCAATCGAATCGCCCCCTGTTTTGGCCTTA
+TTTACCGCTGTCCGACCTGCCCCCTCTACAGCCGCCATAACCCTTCGCTGTGGCCCACGG
+GAACTCTCAGGCGACTTCGTTTTAATGCCTCCCGCAGTGGTTTTTGGGGCAGTCCCCAGT
+CCCGGTAGCCTTGTTCAATGATGTGATAGTAGCCATCGCTGGGTTCGTTTAAACCCTTGA
+TGGTCAGCACATAAGCAAAGGCCTGGTAAATGTTTCCCAGGTTGTCCTCTACCGTTACCG
+GCATTTTGTTATAAAGGCGGGGATAGCCTTCATAGCGGTCAAGTTTTTTAATATCTTCCG
+ACGAAACGGTGTAAATGGCACCCCAGGTAATTGCCTGTTCTTCTTCCACGATATCCGCCA
+CCCGGTTAAAAGTCAGTTGGTAGCCATGCAGTTTTACCCTGGCCACCGGTATTGCATCCG
+GGCAGCGGCTCATCATCTGTTCCTTGTTCAGGTTGCTGCCGTAGGCAAAGTAGTACATAC
+AAAAAACCCCCTTTTTTGGCTAAATGGTGTAAACCTATCTATCACTCAAAAACAGGGGTT
+TTGCAAGTATTTTTTATTTAAACCGGGCGTTATTCATCACTTCTAAGGCCCGGAATGTTC
+ATCTTGTCTGCATCAGCTTGGGTGAGGCCAAAATGCTCCAAGGCTTCTTCCTTGGTGATT
+TCAATCAGAAAGCCATAGTCCACGAATTGGCGAAAGGCACTTTTGGCCTTTTCCGCCAGG
+GTATCTCCGGTGACATGCACACCTTTGCCGTAGAAAGTCCAGGCACTATTAGCCATTTCT
+TGAATATATTCTCCCACAGTCATGGTGTGGGGGACAAAAGCAAAGCTCTTTAGTTCCTCA
+AACACTCCCAGTTCATCTTTGGCCACACTGACCCGTTTGCCATCCAAAGTCATTACCCGT
+AGATACATGCCTTCACCACCCTTTTTCCCACATATTAACATCTATTTATCAGAAAGGGAA
+GCCGGGCTTTAAAGCCCAGCCACCTGTCTGCCGTTTCTAAAGGCGCTGTCGCCTTCCAGG
+TTCTTTAAAAGGTGAAGCCTGGCGGTTTCAAATTCTTTGCCGATAAGGCCTAGTCTCAAA
+AGCCAGGTTCTAAAAGTGTACTTGGGGTTTGAGGTCTCAGTCTTCTTGGCGCTGGCGTTC
+TTTTGGCTTAAAGCCTGGTAACTTACCGCCAAGCAAAACTGTATGTAGGCTTTGACTTTC
+CCGGCGTGGGTGGTTCCGTTGAAAAGCCTAAACTCTACCGTGGGGCCGTTGAAAGTAGCA
+TGTAAGTTTAACCCGTGGTAGCGGCTGCTGTGGTAATGTTGGCTGCGGCTGCCGCTGTAA
+CCCTGGTACCAAAGGTCGGCCAGCTGCTCCAGCTCCGTTGGCTTTCGCCGGTTCAGTTCT
+GCCAAAAAGCTTTCCTTTACCTTTTGGCAGTACCGGCGTTTCCGCTGCTCGTCCACCTGC
+AGAGCTTGGTAAATCAAGTCCTCTTTGCTGGCCACAATGTTGACCAGATTCCGTAAAGTT
+TTGGCGGTGAATCTTTCTTTGCCAATGTGCAGGTGTATCCCGCAGCTCTTATTAGCGAAG
+GCCCCGACCTTTCTTAAGGTTCTGATGATCTCCTGCACCGTTTCGATGTCGCCGTAGGTG
+CAGATGGGGGAGACTAGCTCCACTCGGTGGTCTAATCCCGCTGCGATTCTTTTGCCTTGC
+CGCTTGGTTTCCGGCCTGATGCTGCTGTCGTTCATAATAAACCAGCTGCGGCCTTGGTTG
+TCCGGCGCTTCCCATTTGTCGTAGCCGCCGCCAAGGTAGTGGGCGCTGGTGCCGAAGTAT
+CCCGCCACTGCTTTGGCCGCCGCTTCCCTGGAAATCCCCGTTAGCTCAATTTCTATCCCG
+AAGGTTAAGTTTTTCATGTTTGGAAAACCCCCTGTGTGTTTTTGGTAGTCTATATATCAC
+TCTAAACACACATAATAGCAAGGGTTATTTTCCTTAAAAGTTAATATTTAGGCGGTTGTT
+TAGCCAGAGAAAAGACCGGTGCTTATGCCCCAGCCTTATTCCGCATCCACATATTCCATG
+ATTATCTGCAGTGCTCTGTCGTAGCTTTCGGACTTAAAAATCCGCTCTCGCATTTCTGCC
+GCTTGTTCCTCCAGCCCGGCATCTTTAAGTGTGCGGCTGGCGATGCCCATTAGGTTAAAG
+ATGTTGCCGTTTTCACCGACCAATTTGCATCTTGGTTTGGTCATTTACGCTCCCTCCTGG
+ACTTGTTTTCTAAAAGCGCTGTTACCGGGGAGGTTTTGCAAAAGAACCCGGCGGGCTAGC
+CTGTAGTCATCGCCTATCATCCCTAAGCGCAGGAGCCAAGTACGGAAAGTATACTTCTCA
+TTGTCGGTGGCCTTGACCTTGGCCGCTACATTCCGCTGCAGCCGCCTGACATTGATGTTT
+ATCAATTCTAAAAGCTGGGTGGCGGCTTCTACCTTCTCCGAGTCATCTCCATCCCGCCCC
+AGCTTGAAAGTAATGGCTCCCTTGTTGAAATCAAAGTCAATACCGGGGCAGCTTTTGCCT
+GCCAGTGCATTTTGGAAATGCTCCAGAGTTGTCATGGGCTGCTGGTTTAAAGCGTTAATA
+ACTTCCTTGCTCACCAAATCGGTATCAAGGTTTAACGCCTTTTTAATTAACGGCTGCTTA
+CTGTAAATCATGTGGAGCAGGTTCCGCAAACTCCGGCCATCGTAGCCTTCCAAAGGTATC
+CCTACTTCCAAAGCAGTGGGTTTTGTTTCGACAGAAGTGTTCGCTTCCGCAGTTTCCTTT
+TGCTCAGTTACGATCTCCAACTCCGGTTCCTCCTTCCCGCCTGCCAGCAGCGCCTCCAGT
+TCCAGCACCTGACCCTCGCTGTCAAGGATATTGCCTTGTCGGTTAACGGTATATTCGCCA
+ACTTGATAAGCAAAGCTGGGGGCAGCTAAATAGACAGGTCGTATTCCTAAATGCTCAGCC
+AGCTTGTGTACAAGCTCTTTTCTGGTCATCTTGGGTCCCCTCCTGTGATTTTTGGTATGT
+CTATACATCACTTAAAACCACAGGAATAGCAAGGGATTTATAGCAGGTCAGCGTATCTAA
+TTTTCTGGCCATCCCGGATTAAATAGACATCATTATCGGAGCCAGTGTGCTCAATGTATC
+TTTTCACTCCTACATCTACGAAGCGTTCCTCCAACTCGGTAGCATAGCAAATACGATCCA
+GCTGTTCGCAAGCAATCCCTGTTGAAAAGCTGCCGGAGAAGGGGTCGAGCACGATGCCAT
+TGGGAGCACTGCTGTTTTGGATGGGGTAAGCGCACAGAGCCACTGGCTTCGTAGTTGGAT
+GGAGTTTTGATTTGGCTGGCCGGTCAAAATTCCATACCGTCCTATGTTTTCTATCACCGT
+AAAACTTATGGCCTGCTGTGGGCTTCCATAGATATAAAATGGGTTCATGAGCGTATAAAT
+AGTCGCATCTACTAAGCACCGGTGCGTTTTTCACCCAAATGCAGGTTTGGTGACAAAAGA
+AGCCAGCGTCCCTAAAGGCGGTTCTAAAATTAACGGTTTCCCTGTCTGCATGAAAAATAT
+AGGCAACGCCACCGTCTATAACATTTTCATACATATTTGTGGCGGCCTTTAGGAGAAATT
+CGTAAAATTCCCTGTCTCCCATATTATCGTTTTTAATTTTCCCTGCCGTTCCTTCGTAGT
+CCACGTTATAAGGCAAGTCACTGACTATGAGATTGGCCTTCTTCCCATCCAACAATTTCT
+CGTAAGTTTCAACTTTGGTACTGTCCCCGCAGAACAGCCGGTGCCTTCCCAGCAGCCACA
+AGTCACCGGGTTTACTGATGACCGGTTCCTTCAAAGCTCCGTCCACATCGAAGTCATCTT
+CTTTGACATCCTTATCGTGTACCTTGGAAAATAAATCCTCTATCTCAGCGGCATCAAAGC
+CGGTAATGCTCACATCAAATATTCCGTTATCCAGTTCGCTGATTAAGTCGGCCAGTTTAG
+GCAGGTCCCATTCACCAGTGACTTTATTAAGCGTTATGTTCAGGGCCTTTTCCCGCTGCT
+CATCCAGATCCACTACTACACACTCAATCTCGGTTTCCCCTTGGTGCTGTAAAACTTTAA
+ATCTCTGGTGGCCCCCTACGATCTGACCAGTGCGTTTATTCCACACGATGGGCTCCACAT
+AGCCAAAGGTCTCCATGGATTTTTTAAGCTTCTCGTATTCCGGATCTCCGGGCTTTAAGT
+CTTTCCGTGGGTTATATTTGGCCGGGTTTAATTTCTCCAGCGGTAGTTTTTGTATCTCCA
+ATCCTTACACCTCCTGCCTTACTGCCTTCTCCCCGGTGAACTGCTCCCAGCGTTTAACGG
+CCAAATCACAATACCCTGGGGACAATTCCATGGCATAACAGTTTCTACCCAGCTGCTCAG
+CGGCCATGATGGTGGTGCCAGAGCCGCTGAAGGGTTCGTAAACGTTATCCCCCACATTGG
+TAGTGAGCTTGATGAAAAAGGCCGGTAGCTTCACTGGAAATGCGGCTGAGTGTTTTACGG
+AACTTTGATTGCCGGGTATCTGCAGCACATTGCCTGGCCTGGCAATGCCTTTTTTGAATT
+TACCGCTGACGCTGATGTTGCCGGAGTCGCCTTTGGATTTATTGTTTTTGCTATAGACCC
+GGATTAAATCAGACTGTTTCCCTACCGCCCTGGGTTTGAATTTAATTTTCTTAGCTTTGG
+TGAAGTGGAAAATGTCCTCGTACATTTCCACCAGGTCCGCCGGTAATGTTGCCAATCTAC
+CCTCATCAACATCTACCAGCTGCACCATCCAGTCGATCTGTTCCTTCTTGGCGAAAAAGT
+GTACCGGTTCAAAGTCATTTCTCAAGCGGTTAGACCAGCCACCGGGCAGCCCTGGCTTCG
+TCCAGATTAGCTGATCCACATACCGCCAGCCACCTTCCACCAAAGCAATGATGGTTTTCA
+TCACGTAAAGGGAACGCTGGCCGCCCTCAACGTGTTCCTTGATATTGACGAAGAAGGAGC
+CGCTGTCGTCAAGTATCCGGTAAACATTACTGGCCACATGAAAAAACCAGACCGGATATT
+CCTCTGCCGGTATCCCGCCGTAGTCGTCCTTGCGCTGCATGGCGTAGGGCGGGGAGGTAA
+TAACGCAGTTGGCTTTTTCTCCGTTCATCAGTTTTTCAACATCGGCAATATTTGTGCTAT
+CACCACAAAGTAACCGGTGATTGCCTAAGAGCCAGATGTCCCCTGGTTTAGTGATGGGCT
+GCTCCGGTGCTTCCTCGTCAAAGTTATCCTCCTGGACTTCTTCTTTAAAGCCCAGCAATT
+CATCTATTTCCTCGGCATCAAAGCCGGTAATATCTTTTAAGTCATCATCCAAGTTCTTGA
+GCAGCTCGCTCAGTTTGGGCAGATCCCATTGACCGGCGATTTTATTAAGGGTAATGTTTA
+AGGCCCTTTCACGGTCAGGTGGCAAATCAACCACGGATACTTCCGTTTCGGTATCTCCCC
+GCTCCAGTAAAATTTTTAGTCGTTGGTGGCCAGAGATGAGCACGTTGCCCCGCTTGTTCA
+TCACCAAAGGTTCCACCAGGTCAAATTCGTCAATAGATTTCTTTAATTTCTCGTATTCAG
+CATCCCCCGGCTTTAAGTCCTTACGAGGATTGTATTTGGCCGGGTTAATCTGGTCTAACG
+GGATGCGCTGAATCTCCAAAAGGGCCACCTCCTTCTTAACCTGCTTAAAATCGCTGTATT
+TCGTGCCATGTCAAGCATTAGACCTTGACAACCCCCATCTGGAATTTTGCGAATTCCCAC
+GCGAAGGCCCGCGCCCGCTCTGGAGCCGCTTAGCTGCAGGGTTTGAGGACCCCCTACCCT
+AATTTATCCACAGCGTTATCTACAGGTCAGGCTGGTAATTATACTAATAACTGTAAATCT
+TGTTTTTATCTCCCCAGCGGCCTTCTTTGGTGGTCTTGCTGTCATGACAATTTTTACAAA
+GAGCTTGTAAATTGTTCTCATCCCAAAACAGATTCAGATTGCCTTTGTGGGGTTTTACGT
+GATCAACTATTGTTGCCGGAGTAATCCTGCCCTGACGTTCACACTCTACACAGAGGGGAT
+GCGCCAGCAAAACTTTCTTCCTTAACCGCTGCCAGCGGGCACTGTTGTAAAGCTGTTTAG
+AATACTTGGGTCGCTCTTTCCGGTTGTACCGCCAGTTGTATTCCTGCATGTGTTTGGGGC
+AGAACCGAGCATCGGTCAGCTCCGGGCAACCGGGATGGCGGCAGGGTGCTAGTGGCTTCC
+TTGGCAATGGACTTCACCTTCCTCTCACCGTGCTGACACCCGGACCAGGAGATCCGTTTA
+TGTTTGTCACCGTTTACGGAAATGTTAATTAAGGATTTATGGTACTCGCTCTTTGGATTG
+CCACACTCGTAAGCCGTCCAATGTTTATCACTGGCGGATTCATCAATGGTGGCAAAGCGG
+CAGGATATACATTTCATAATGGCACCTCCATAGAAAAAGCCCTGAGAGCAAGTGTGCTGT
+CAGAGCCTGGTTATTTCCGTTAATAGTCGTGGTGGTATTCTACGGTGAGTTTAGTCACCT
+TTCATTATTATTCAGTCCTGTTTTTTGGGCATAGAAAAACCACAAGCTTTGTTGCCTGTG
+GTTTTAATTTTATTTATTTTTGCCTACGTTCATAGTTTTCCAAATTGCCATTGGGTGCTG
+TTTTATATTCTCCAGCGTCTTCCCAGAAAACAATAGCTCCGGCTGGTAGCTTCCCCTGGA
+GAACTGCTGTAAATATTCTTTATGCCTTGATGTTAAAACAATACTGTTTACTAGAAATTC
+CTTGACTTCTGATTTGGTTTTGTCCAATTCAAACCGTTCACTTTTAACCAGCATGGGATA
+TAAATCCTGATGGACTGTTCTCATTTTTAGCTGGTCCATCCGGTTAGGAGAAAAACTTAA
+TTTTGCCGCTTCTCCTGAAATGGAACCATAAAAAACTACAGCTTTACAATAGCTGACATA
+GTCCTTTTCAGAAAGAATACCATACTTTTTCACATTGTATAAATCGTAAAAATCCCTTGC
+CGCCAGACGGTTAAACAGAGCCGCTGTTTTGGAAGCCAAAAGTTCAATGCCATCTAAAGT
+TTTCACTTCTCCTCTGGCCCCAAATAAATCTGTATTTATTCTTCTCATTACGGGCGGCCA
+AATATGATGTCTTAAAGAATAGTTTATCTCAATTTTTATATTATCAAAATTACCTGCGTT
+GTTTTGAAAACGAGCTACAATTGATTCCAGAGCAAAATAGTCTTTTGATTTTTTGGATAT
+ATCATAACCTTGTCTCTCTAAATGTGCATATAACAATTCTTTTACTTTAATCCGTTCTTC
+AAGTACCTTCTCCCGGCTATCATAGGAGTGAAAATCTAGATCTATATCTACAGATAATCT
+GGGCAAAGCAAAGATAGTAAGGTTTAAGGCAGTCCCACCTTTTAGGACTAATCGGTCTTT
+TAAAAATGCATTGCTATTTATAAATTCTAGTATAACAATTAACCGGTGAACCTTCTCTAT
+TACGTCTTTGTGAAACCCTGTTTTTTCAGAAAGTTTCAGGTAGTATTTCCGATCTGGACT
+AAACAAATATATCATCCCTAACTTCAAGAGTTTTTGGCACTATCAGGGCCCATCTTTTTA
+TAAGCACACCGCTACCATTTTGTGCTTCTTCACTTAAATACTTTTTTGTATTTCCGGTCT
+TTTTTTCTATCAGACTTAATAAACCATCTGTTATTCCTAAAGATTGCTGGTGGCGCTCCA
+GGAAGTAGCCTGCCTTTTTATAAAGTATCTGTTTATTATACATTTCTAAATAATTTGCCA
+GCTTTGTTTCATCCAGAACCGTACATATTTTTAATATCTCATCTAATTCATGGACCCCGC
+CACAGTAATCCGGCCTGTCTAGAGAGTCAACAACTGTTCTTTCTAGATCTGTCAGTTTAA
+CCTTGTCATTTAAACGATAATGAGTAACACCCTCTTTAATGCCTTTACCCACATATTTGT
+ATAAAACTCCTTCAAATTCAAAATCGGATATCTTTTGTTCTGAGGACACATAAACTACAA
+AACTTACCTGGTGGGATAATCCATGGACCTCAAAGGCAGAGTGGTATGTCAAATAAGCAC
+TGTCATTTATTTTACTACCCACCAAATATCGATTAGCCGGCGCATCTCTGTTTTCTAAAT
+TTACAGCACAATACAAATCTCGGCGTACTCGCTTGACAAGGCCATTTTTTACATATGAAT
+TTAATAACACCTTGGCGTTTTCTATGCTCCCTACAACTTTTTGGGCATCCTTAAGGTTAA
+ATACTTCCATCTTTAAGAAATCTTCATAATACTTCATGTTAATTGAATCACCCAGTTCCT
+TGTTTTGCCTTTAAGTTAATATTAGTATTAACCTTCTAGGTAAATTTGATACCATTATAC
+TTTAAGTTCTTTATTTTTTCAATAGGTTAATATATATATTAACTTTCTAGGCAAAAAAGA
+AACTAAAATGTTTACAGTTCGACTAGTTTCAGGCATAGAAAAAGCCCCGAGGGTTTAATC
+CCACTAGGGCTTGCTATCAAGAATGCTGCGTTTCCCCGGAGTCGTTGGGCGATCTATCCT
+AAGGGCCTATTCAAACAGCATCTGGTGCTCTTGATATTTTTCCATGCCTTTACAGGTATA
+ATATAACACATGTCGGGGGTGGATTCTACTGGATTTTACTCCATTTTACTGTATTTTACT
+ACCCTCTTTTTTTATTCTGTTGACTTCTTTCAGGGCTCTACTATGGATCTTAAAGATTGA
+GCTGTCCCGGTAATTCAGGCTACTGGAAATCTCATCCCAGCCTTTGCCGTTGATATACCG
+CATCTCCAGTATTATTTGACCGATAGGGTCATCCACCTGGCTGATGGTGTTCATAATTTC
+AGCTTTGATGGCAATTGACCGGGCAAGGTCCTCTTTGATTTCTTTCTCTAAATCCACAAT
+TTTAACCACCGTATTTTCCATCTGGCCTTTTTTATTATTGCCACCGGCCACCTTTTCCAC
+TGTCAGGTTAGCCGACACCTTCATGGACAGTTCCCGCAGTGTTTGCAGCTGCTCTAGCTT
+GGTGTTAACCCGCTGGTCAAGCCATAGGGCTTGCGATAAATATTCCTTGGCATTCATGCT
+CTTTCACCCCCGTAATATTTTTCAAAAATATGTTTCTGCCTCTCCGCATCCAAACCACGA
+ATCCGCTCCAATGCCTTTTTTTGACCCAACTCAAACTGCTCCTTGGTTTTATAGAAACTG
+CAGCCTTCACACTTTTTTACTTTTAAGGCCGTGCAGCTGTTTCGTTTGTAAGCAAAACAA
+CCGGTACGCATGATTACTCCACCTCCTGATAAATCCTGGCCTTCACTGCTTCGATTAGTG
+CATTTTGGGTTTTATCTTTTCTTTTCAAAGCGTTCATAACATCTTCATCAATGGTGCCTT
+CAGTGATGATGTGGTGAATAACAACCGTATCCTGCTGGCCTTGCCGCCACAGCCGGGCAT
+TGGTTTGCTGGTAAAGTTCCAGGCTCCAAGTTAAACCAAACCAGATTAAAGTGCTGCCGC
+CTGCTTGCAGGTTTAGCCCATGGCCAGCGGAGGCGGGGTGGATAACAGCCACCGGGATTT
+CACCTTCATTCCACCGTTTTATGGAAGTGGTGTCATCCAGCTTTGTAGCCTTAAACCGCT
+TTAGTATCCGCTGTAGGTCATGCTTGAACCAGTAAGCAATTAATACCGGTTTGCCGTTAG
+CCGCTTCGATTAAATCCTCCAGTGCATCCAGCTTACGGTCGTGTATCTGCACCACGGCAC
+CGTCTTCATCGTATACAGCCCCGTTGGCCATCTGAAGAAGTTTACCGGACAGGGCTGCAG
+CGTTAACGGCATCAATCTCTTTGCCTTTTAGCGGCAGCACTAGTTCCTGCTGCAAGGTAC
+GGTAGTAATCCGCCTCTTTGTCCGATAGCTTGACGGTTACTTCGTTCATCACCAATTCCG
+GTAACTTCAGGTAGTCGGTATTCTTCATGGATATCGTGATGTCGGAGATGCGCCGGTAGA
+TGGCATATTCAGCACCGGGCTTTGGTTTATAGCTGAATACAATCTGCTGATTCCTTTTAT
+CCGGTACAAAGTAGTCCTCTCTATATCTTCCAATAAAGCGGCCCAGCCTGTGGCCCATAT
+CCAGAAGCCGGAATTCCGCCCATAAATCCATTAAGCCGTTAGCCGATGGTGTGCCGGTAA
+GGCCCACAATTCTTTTTACTTTTGGCCGCACTTTCATCAGGCTTTTAAACCGTTTGGCCT
+GGTGGGATTTAAAGGAACTTAGCTCATCTACCACCACCATGTCGTAATCGAAAGGCAGCC
+CGCTTTTATTAACTAACCAGTCCACATTTTCCCGGTTGATGATATAGATATCGGCTGCTT
+GCAGTAATGCCGTTTTGCGCTGTGCCTCTGTGCCAATGGCCACTGCAAACCGCAGCATAT
+TTAGATGCTGCCATTTAATTATTTCCTCCACCCACACAGCCCCCACCCGTAGAGGGCAAA
+TTACAAGCACTTTTCTGATTTCAAAGTAATCAAACAGCAGGTAGAATAAGGCCGTTAGGG
+TGATTACCGTCTTGCCTAAACCGCAATCAAGGAATATAGCGGCCTGGGGATGGTTTAATA
+TAAAATGGGTAGTATACTTCTGATAATCATGTGGTCTGTATTTCATTTAAAATCACCCCA
+ATCTGCCGCTGCTCGTCCAATACGTATACCTTAAATCCTAGCCGCCTCAGCTTTTCGTGT
+CTTTTTACCTGCAGGGGCCGTGGTTTTATGCCATAGCCCTTGATCTCAACGAAGGCTATT
+TTGCCTTCTGGTAATAACACCAAGCGGTCAGGCATACCGGCAAGACCTGGACTGATAAAC
+TTTGGCGCTATACCTCCCGCCGCTTTAACTGCTTTGACTAGCTTTTGTTCAATATGTTTT
+TCACTCATATTCCCCCTCCTTAGCGTCAGGGATTAGTGGGGGTGTGAAGGTCGTGATGGT
+CAATTACATAACTTTATATATATAGTTTTATTTATTTTTTTTTTGCTATAGGAAACTCTA
+TGACAAGACCTACATCGACCTTCACACCTAGGAAAATAGCCTATTCTAGAAGAAAATCAG
+ACCTTAACCTTAATCCCTTGACAATAACTCCTGCTCTTGTCCTTTGCCTTTCAAAATCTT
+CCATTTCAAGCGCCGCGTAGAAATCGGTGGTGCTCCTGGTATACTCACCTGTCCTCATGC
+AAAAGGCCCGGTACTCGCTGTATAGTTCACCTGATTTTTCAGTGAAGGTTCTATCCAGCT
+CACAGCATTCCTCAAGGAAGTGGGCTAGCCAATCGTTGTTTTCCTTGTAGGCGGAAATGG
+CATCCTTCACTTTTTCCGGTAGCTCGATCTGGTAATCATCCATAATCACTTTTTTGGCAC
+CTTCGATTATCCAGCTAAGTATGGCCCCGCCCGCTTGCTCGAACAGGTAATCGCCGTAGT
+TTTTAATATCGGCGCTGCCTTCAATCTTGGCAGTAAAGGGGATAACGATTAGCCGCCTCC
+AGGTACCGGTGTCCAGGGCTCCCACCCTTGGCAAGTGGTTGGTGTATAACACCAAGGTGT
+GGCTGGGAATATAGCTGAATGGGTCTTTGTATTTCTTTTCCGCATAGATTTCATCAGTGG
+AGCAAAGCTGTTTGACGTTGGAGGTATTTAGCCGCATGCCTTCTTCCATCTCCGCTGCAA
+TTAAGAGCCTTTTTCCCTTGGCCTCAGCCAGTTCTGGCTTTACATTTCTCCGGCAGCCAA
+CGGTCAATATATCGGCGGAAATATTGCCACTATAGGTGCCCAGCACTCTGGAGATTGCGT
+TCCAGAAGGTAGATTTACCATTGCGGCCTTCCCCGTGGGCGATAATTAAGGCCTCCACGT
+AGACCTTGCCAATGGCGGCCAGTCCCACTACCTTTTGCACGTAGTCAATTAGTGACTTAT
+CATTTAGGAAAAAGGTATTTAAAGCATCCTTCCATTTATCCATACCTGCAGTACCCGGTT
+CCACCGCAGTTTCTTTGGTAATAAAGTGACCAGGATCATGTTTCATTCTGGCCCCGGTTC
+TTAAGTCATAGGTGGCCTTGGGTGTGTTTAGTAAAAATTCATTGGTATCAAGAGCACTTT
+GGTTAATCTCCAGCATGGGCTGAGCTTCTTTTAATGATGCCGCTATATACTTTGAATTCC
+GGCGCTTGATGGCATATTTCCTATACGCATCGGCGGCTTCAAACTTTTCATAGGCATGGG
+ACTGTACATCATTAAAATCAGCTATTGCCTTTTTGGGACCCTTGTCGGCTAATATGTCAA
+GTGCACCGTTTTTCTCCATCTCATCCATGGCTTTTTTCATTTCAGCCCTGGCTTCTTTCA
+GTTGCCTGGTGGTAAGTTCCTGGGCTATGGCCTGGGCTTTGGGCTTTGATTCCTCCCAAA
+AGCTGCCGTTGTAGACAATGAAATCTGTAGCCGGGGAGTACCTGAGTTTGTCCTCATATT
+CCCTGGCTAAAACAACTGCTTGGCCTACATCCGAAAAATCTGATGGCTTTAAAACACTGT
+CTGAATTGTAGACCTCCGGTGGGATATACCCGGCCTGGGCAGCTACCTTTTCCCCGAAGC
+TGACAGCACTGTTCCAAATAATTTGCAGTTCCTTTTCCTCAAGCGGTGGATTGCATTTTT
+CCGCCAGGGCTAGAAACTTGGAGTGGGCTTCTTCGGTGTTGCCAAAACGCTTGATGATTC
+TCCCGGCATAACGGGACATGGTGTTGTTGCGCTGCCCTTGGGGTATTTCATCCTGGCTCT
+CGTCCCAGTCGGTAAAACTGCTGTCCTCCAGGAATTCTTTGATGTTGATGTCCCCTTCGA
+AAAGCTCCACATTACCGTTATCCGAGCCGAAGATAAACCTGGCACTGTCAAGGGCGTTGC
+TATCGAAAAAGGGAAACCTTGATGCCACGGCAAGCTTTAAGGCGGCGTATTCTTTCGGAT
+CAGTAATTACCGGAATAGCAAAATACACGTGGAACCTGGGCCGGGGTAATTTATCGCCTT
+TTTGCTTCATGTGGTTTCGGCTATAAGATACGACAAAGGGAACCCCTGGGAAGGCCGTGG
+CAACATCATCGGGGGTAACCCAATCCTTGGGATCATCCGAGTGGTCGTTATCGCAATCGA
+ATACGTTATTATCAGCCTTGATGAAATTGGCGTTGCTGCGGTAGTTGCCCTTATACTTCG
+CACTTACGTGGTCAAACTTGATGGCTTCGATGAAGGAGGCCTTGTCTTTGATTACCACCT
+TGTTTGGGTACAGGCAGTTGGCCAGGTTCCCCGTGCAATTTGCTGTGTAAAGGGTAAATT
+CAATCATTCTAAGACCTCCTTCCCGCCCCATTTGTTAGACAACACATTGAGTCACCTCCA
+GGAAATCTTCCCAAGCAGTGATGGGATAACTGTTAACGGTGCCAAACCTTTCATCATTCG
+TTTCGCACGTCCTTATTTCAATAGCACGGGAGCGGCAGTATGCAGATAAGCGTTTGCCGA
+TCCTTTGGCACTGTTTTAAATTCCAGCCCATATTAAAAGTCCTGTTATATTTGGCCACGG
+TATAAAACTTAAGCGATGAATTAAGGGCGATTTCAAGGGTTTCATTTTCCTCAACCAAGG
+CAAATATCTTTCTTTCAGCTTCAATGGCTTTTTGCTGGGCGATCTGCAGTGCCCGCTCCA
+TAATTTTTTCAGGGGAGTTCCAGGCTTCCTCGATGGCGATGAAGTGTTCCCTAAACTTTT
+TCCCTATTTCATTTCTTTGGATCATGCAGATTTCTTTTGCCATGGATATTGTTAGGGAAT
+GATCAGTTTTTGGTTTACCGGGAAGTCCATCCGATCTAACCGTCAAAAATGACGAATAGT
+CTTTTCCTTCTTTAAAACCGTATTCTGTCATTCGGCTAAACCATTTGGCATACTCGGTTC
+CTATTTCCAAAGCCTTGTGAAGTTCACGTCCATTAACCGTAGGGGTATCATTTTTATAAT
+CAATTGCAATTAAATCGTGCATCTCCCAACCTCCTCACCTTTACTGTCAAAGTACCTAAT
+AGGCATACCCCGCCGTTCCGCTTTAGCGATTTCAGCAGCCATGCCGCTACTGATGTGGCT
+ACCAAATACCCAAAGTTCGTCACATTTTCCAAGCAGGATTAGAGCAAACCAAAGGCCCAG
+TTCCCGCTGCTGCCTGTCCCCATCGTCCATAAACTGCGGGTAGTGCAGGTGCGGGGCCAG
+GGGAATGCACCCCAGGCTGACCGCCAATCTGCAATAGCCTCTGGCTCGTTCGATGTTCCT
+TTCCATATCCCCGGCAAAAGGTGATGCTATATACACCAGTGGCCGATAAATCTTGACTGC
+TTTCAAGGCTTCATATGGTGTCGGGTCGGAGTAACCCTCACTGTTGCGCCAGTCCATCTA
+TCTCCCTCCAATCTGACCCGGCTGCACTCCGAGCAAAATACTTCAGTGCCATACAGGTCG
+CTATCACCGGTGCCCAATATCTCAGCGAGGTCAACTTCTACTTCACGCCCACAACCGGGG
+CAGATGCAAAACACATTGTCATCATGGATTTCCACAGCAATTTCCACTTCATCACTAAGC
+TGCGCTTTTACATAAAACATAGGTTTTCTGCCTCCTTTACTTTTCACAGGACAGTAAGCA
+GTGGTTTGGCAACTGACCTTCTAATATACACAGGACATTTTTGATGGTTTTGAGTACCCA
+TAAGCGGAGAAATAATTCGAACCCCCGCCTGTTACCTGATGTTGCTGGCAACATGATTTT
+GTTGTATCGTTAATAAAAATTAATTTATACTGTTGCCAACAACATGAGGCTCCTTACTAT
+CTAAAGGACAGGTACCAGCCAAAATCCGTAGTTAATCTTTCTGGTAAAAATCACATTCGA
+AGCCCTCCGCCCGAAGTAACAGCCCCTTGGCCCAAGGCGGAATTTGGCTCATTTGTTCGC
+ACACCGTCCGAACTGACATTTGCTGTTCAGCTTCGATGACGATTTCGTCATGGATGTGCA
+TCACGATAGGCAAATGCCGCAGGTTCTGCATGGCATAACACAGAAGGTCACGGCTGATTG
+CCTGAATAATGTTTTCAACAATTTTCGCACCGTATGTTTCCAGCCGCTCCCACTTCTTAG
+CCGCACCAATACCTTCATAAGTCACACTGTCGGAGCCAAAGTGGTTAGTACCAATGCGAG
+GTTTCACATAGGCCAGCCGTCTGCCAGAAGGCAAGGTGATAAACAGCATTCCGCTTTGAT
+AAGCAAAACGGATACCGTGAGTTTCTGTGGTGGTGCGTTCCCGAACTGCGGTTAATGCCG
+CCCGGTCAACGTCCCACCAAAAGCGGACAATGTTGGGGTTGGCTGCTCTCCAGGCATCAA
+CCAGTGGTTTTAGTTCTTCCTCTGTAAGTCCCATTTCCAAAGCACCCATGGCCTTTATTG
+CACCCACCGAGCCGCCGTAGCCGCAGTTATGAACCAAACACAGCCGCCGTCCGTTCCATA
+CTGCAAACCGGTGCCGCCTGCCGCAGTTCACCAGGTCATATACCCGTTTTACCCCGGCGG
+GGGTAGGGGATAATGCCTGGACAGCACTATTTGGACGATAAACCCCGGCCCAATGAAGGC
+CGCCACTTTTACCGCTTTCCACCCAGCCCTGATTAGTTAAAACCAGGTGGTCTGGGGTGC
+ATATCACACCATCAACGTTTACGGTCTCCCGCTGGCCTTTGTGAACTAAACCTCCATGGG
+TTACCCACCCTTGGCCATCCCAAACTTTATGTTCTGTGGTAACTTCCTCTATGGGTACAA
+GTCCTGTATCCGTCAACACCAGTTGCCCTTTCGCTATACAGGCCAAATCCGCAATTTTAC
+CTTTTTGCCTGAGTGGGTCTTTTTTATCTGTAATAGGCACACCAAACATCTGACTAGCGG
+TAGCGATGTATAAATCCTTTTTAGCAGCGTAGGCATCTAGCACCCACCGCTCCCCGGCAA
+GCCAGGCCAACACTACCCGCTCGATTGATGAGAAATCCGCCACGATGAATTTATAACCGA
+GTTTGGGAATGAAGGCGGTTCTAATTAATTCCGACAGCACTTCCGGCACCGAATCATAGA
+GCATCTCCAAAGCGGTAAAATTACCGGAGCGCACAAGGCTCCTGGCTTGTGCCAAACCAG
+GCATGTCGTTCCTCGGTAAATTTTGTGGCTGTAAAAGCCTGCCTGACCATCGCCCGGTTC
+GATTGGCACCATAGAATTGAAATATTCCACGAGTGCGATTATCTAGACAGGCCACGTTTT
+CCATGGCCTGATACTTTTTCACTGATGATTTAGCCAGCTGCTGGCGAAGTTGCAGCACTT
+CATCCAGGGGTTTAGGTGCTGTTTCCAATAGCTCCGCCACAGCTTTTTTGCCCAGGGTAT
+CTGTCTCAAGCCCATGGTCAGCTAACCATTCTTTTAGCTGTTGTACGGAATTGGGATTAT
+CAAGGTCTGTCAGCTCGCCCATTCTCCCTAATAGTTCAGAGCGGGTACGCTCATCGGCTT
+TAATGGCTTGCTGGACAAGGGTCATATCCAAAGCCACACCCCGGTCGTTTATCTCCTGAT
+CCAGGTGGAATTCGTCCCAAATGTTCTCCGGCACGGGAAACTTGGCTAACCTTTCCTGAA
+TGGCTATTTCCACCTCCACATCCCGGCGGTTATAGGCTTTGAACTGTTCCCACTTAGCCG
+GGTCATGGATGGGCAGATTCCTTGTCCGCTTACCGTTAGCAATAGTTGGTTTACACGGGG
+TGCAGAAGTAGCGGATTAAATCTTTCCCTTCCGTTAATTTTTGTTTTTCCAATCCCAGCA
+CCGCACCCACTCCTTCTAAAGAAAGGGGCAGTCCCATATAGGCCGACCAAACCATGGTGC
+AGCGCCAGGGCCTTGGATCGAGATATTGAAGTCCCAACCAGCGGGATAAACAGATGCGTT
+CAAACTGACTGTTAAAGGCCCACTTGGTAACACCAGGGTCAGTTAATGCATGTATTATTT
+CATCCGGCAACTTCTCACCGGCGGTAAAATCCACTACCTGAACCTCACCGCCATCCACGC
+TGTAGCCAAACAGGAGTATTTCAAAATCGTGTGATTCGGCGTATTTATAAACACCGGTCT
+TTTTAAGGTCTGCACTGGAAAATGTCTCAATATCGATTCCGAGCGTTTTCATTGGATTCT
+CCTTTACAGGTGTGGGGCAGCGAGGCAAAACCCCGCCACCCCTGCAGTCACTAGGAAAGG
+AAATCATCATCGTCAGCAGTGGCGAAGTCGTCCTCTGCCCTGGACTTGCCGCCGAGCGGT
+TCGCCGTCACGGATTTTCTGCAGATTATTGAGCCCACATGCGATCCCGCGATTTCCCGAA
+CTATTGTAGGCATAAAAATTGATACTGGCCCGGCCATAAACACCGCTGTAAACCTCGGAG
+CGCTCCAGGATGGGCTGACGGTCGGCATCCACAATGCCCGGTGCAGTGGTGGAATTGGCA
+TTGACGAAATAGGCATTGGCGTATGCCGGATCATCGGGTCTTTCGGTATCGCCGTCCCTA
+AGCGGTGTCTTAATAGCGGAAAGAGGTGGTACCGTTTTACCGTTACCCTTCAGCTTTGCT
+TCCCCCTCACGGTAGGCAGCTTCGATGGCAGCTTTAATCTTGGCCACCGTTTTGGTGTCG
+CTCTTTGGGACAATCAAAGATACCGAGAACTTTGGGGTGCCGCCGTTAATTGACTTGGCC
+TCCCACACATTTGCGTAGGACCAACGAGTATTAGGTCCGGTAATAACTTTCATAGGGTTT
+TTAAACATATGATTTTCCTCCTTAATTTTCACTAAAGTCCTGTTGTGCTGTATTGATAGC
+CGGGCGTTTATCATCCACCGGCACTAAAGTCGGTTTTCCAGGTGGTTTTTCAACCAATCC
+ACCTAGCAGTTCAGTAAATCTGGCTTTGCCGAGGGTTTTTTCCATGACAGTGATGCCCTT
+CAATTTTTGTTCATATGGGTCATAACCCGCTGCCTGTACCGCCTGGGCTACCGCATCTTC
+ACTAATGTACTTGCGAACACTTCTACCTGCGACCAGTTTCCAGCCGTTCCACTCCTTACC
+GCCCAGGGCCGCTTGCAAAGCGTAAGTCTTGATGTCACCCGCCCAGGATATGAGTTCATC
+GATTCTGCCCAGGATGGCTTCCACTTCATCGTCTTCCAATAGTGGTGGCAGCTTGAAGTC
+AAAACGAGCAAATTCCATGTTGTGTTCAGCCCTGGCCCGGCACTCGTGCTTGGCCTTACA
+GAACTGACACCACTCGCCACACAGGAACTCCCCGCCACCGGCGTAGGCCAGTTCAGCGAT
+TGGCTTTAGCTCTTCCTCTGCCCAGCGGTAGAGGTCTTCCTTGGTCATGATGTAGGTGCT
+GATGTTGTCCCTGCGGGGCTGGTAGATGGTCATGGATACCGTTTCGATATCAAACAGACA
+ATCAAATATCTCCAGTGCCCCCAGCCCGTACAGCATCATTTGCGGGTTTCTTTCGGCTTC
+CACCAGCACCCCTTGACCATGCTTGTAATCAATGATGTGGAGCACCTTATCGGCGATAAC
+CAGGGCATCCCCGGTGCCAAAGCCGCCCTCTGCATATCTGGAGTAGTCCAGCCGCTGTTC
+AATGAGGACAACTGGATCGGTGCAGGTATACTTGGCCGCTTCCACCAACTCCATGATGTA
+GGCTGCGTAACCATCCGCACATTCCTCCATCTCTTGGCTGTAGTAACTTAAGTCAGCAGT
+TGGGTCTTTTGCCTCCATGCCCAAGGCCTTTTTCAACTTGTATTCACACAGGATATGAGC
+GGCTGTACCCTCGGCGGCGTAATCGCTGCCCCTGTCCTCGTAGTTCTGGCACAGCCGGGC
+TGACGGCGGACATTTTAACCACCTGGGGGAAGCTGAAGCCGAAAGCAGTGCGTGTTTACC
+CATCGCCCAGCACCTCAGCTTCCGCTAAGAGGGTCTTATAATTTGCCGGGTCAACCTCCG
+AAAGCCTGGCTGCCCCGTGCTTTTCAATGAGCATTTTAACTTCTCTTGTAAAACCGCTTC
+TGGATTTCTCCGCCAGAACTGCCCGGACAGTTTCCAGGGTGATAGGTTTTTCCTCCGGTG
+CTGATTCTGGTTGGGGTGCTACTTCGCCGCCAAATAAGTCATTAAGTGAATCTGCTACAC
+TAATTAGCGATTGGGCTGCATTCCTTAGCTCCGTTACTGCTTGCGAAAAATCACTCATCC
+TGTTCACCCACATCCCTTCCTTCCTCTTTAATGGCGTCCTGGTGCTGAAGCGTTAACAGC
+TTCCTTGCTAAACGCCGGGATACGATACTGATGGCGCTTAGGATGCCAGCCAGTTCTTCA
+TCTAGCTCCGGGTCCCTAAGATTCGTTTGCATATTGCCACCTCCATTTCTAAGGGCCTTT
+TTATCCCCTCACCATACACAGGACATTTTTGATGGTTTTGAGTACTAAAAACTGCCCTTC
+AATATCCACAGGACATTTGGGGGCAGTTTGAGTACCTTTTTATCTATAATTTTTTAGGCG
+CTGGTGAAGCTGACCGAAAATCTTGGCCTTGCGCTTGTTTACCGTCCTTTGGGAAAGTCC
+AACCTTATCGGCAATCTGCCGCTCCGACATTCCGTCACCATACAATTCAGCAATTCTTTT
+ATTTTGCGGATCTAGTTCATCAAGGGCTGCCGCTAGTTCCTCAAATAAAAGCTTTTCCGC
+TACCAATTCGGCAACATCAAAGGAACCGGGTATCTCGTAACCATCCTCTGAGAATTTTTC
+TAGTGACAAAACGCTACCGATGCGCTGTTTATCACACTGACTGCAATCCTCCATACAACG
+CTTTGTTTTACCCTTGCCATCACTAATCAAGCATCTTTTTTCCCGTTCCTGACGTTTCAG
+CTCTGCCCACACTGGTCGCCTATCGGTCCTATAAACACCCTCCGTCACCGTAATTTTCTT
+GCCATCAATTGTCAGGTAATACTCCTTGTTTGACTTCTGGTTGTCACCTTTTGGCATAAA
+AAAGCCCCTTTCCCGGTGAGAAAAGGGCATAGGAATTAGCCAAAAAACTCACCGTTTTTT
+TAAACGGGAGCCGTTTGGCTGCACCAAATTTATTGTGGAATTGCTTCCTTCACCTCTACT
+ATCGTCCATAAACAGGGTGCTGTGGCGGACACTTCATGCCCGCTTTTTTAGGGGCAAAAC
+AGGTTTTTTGGGCAAAAAAAAAAGAGCCATACACAAATCCTTGTTTGGATTCATATATGG
+CTCTTAGGAATTTAGGAATAAAAAAACCGGACACCACGTGTCCGCTTTGCTAAAAAATAT
+TTTTATAATGGCGCATCGTTTTCTTGTAAAAAGGCTCTGATATCATCCATTTTCTTGGCG
+TATAGGTGGTTTAGCGCAAATTTATAATAAACATGGCTTTCGTTAGTGTAGTTTAATGAA
+TATGGAGATCTTTCGATGATATGACTACTGATTTCCGGCGGGAGATGCAAGCTGAGGCAA
+ATTGAAACTAATGAATTAATAGAACCCTGCCCCTCACCATTGACGATCCGCCGGATGGTG
+CGTTCATCAATTAGCGTCCTTTCCTCAAGTTCTTTATATGTCACGCCCCTCCATTTCTTT
+ACCATTTTGAGGCAGGCGGTATAGCTATTTGGCAATTCACTATACATACGAGCATTTTCC
+GCTAACACATCGGCTAACAATGCTTTCCTTTTTTCCGGTTTAGCATGCTGGTAGCCTTTC
+CCGTAAACGATATCAAAACTTATGACAGCGGCTTCATCCCTATTTAGAAAACATTCCCGG
+TGGTATCTTTCCCGAACACCAGCTCTAACTGATAGGTCAAATACTAAACAACATTCTTCC
+ATATGTGTCCTGGCATAATCCGTTAGTTCGGTCTCCCCGAATAAATTCTGTGCTACATAT
+TTGGGATGGTTTAATACAAAATGGGCATCTACATACAGGTAGCTGCCGTCTTTCACCAGG
+GGGATTAATTCCGGATTGGTTATACTCTGAATTGCCGCATCTTCAGCACCGATGGAGAAG
+GTCTGATTCTTTAGAAGTGCACCCTTTTTAAAGCTGTGGGGTTTAACGTAGCGCCCGTCT
+ATGTAGGTGAAAGTACCAATGGCTTCTTCATACCCGGCGTTAATCATGCGGATTTTGGCA
+GCCTGGCGAGAGACGCAGAAGAAGATGCCCAGTGCTTCGATGACCGGTTCCATCACATCT
+ATTAGTTCAGTAGTTCCCAGTTCCCTTTGAAATTGCTTGATAAGTTCAAAGGCCTTGGTT
+TTAAACGTTCCCAGGGGCATTTGAATTCTAGGGGCTAAGGAGTTAGCCTGCCACTCCATC
+CAGTCGGTGGCATCCTTTTCACCGTCCTTGATGCCGCCAACTGTTTCACACCTAATTCTA
+CTGGCGCTGGCGTTATATAGGCGTTCTAGTTCAAAGGCTTTCCTGTGCTTGTCCCAGTGG
+ACACATTCATGGACGATAGTATTATTGACGGCACCCAAATTGCGCATGAAATATGCCTTG
+GGGTCAACGAATATCGTCTTGGCCCTGACTGATGTTTTTATTAACTGGTCTACTTCCGAA
+TCATAAAATTCCGCCTCAGCATCGTGAAAATATATCTGGCCGAAGATGGATAAATCCTCG
+GTGATGTCCCGTACTTCTACCCTGAGCCCCATTCGCTCAGCCAATTTTGATGGGTCAAGC
+GGCATGGGGGTTTTTAAGGCCTCCGGATAATATTTGCTCAGGAAGTCAACAGCTACCTTG
+TCCAAGTCCTCTTTATAAATGTATGGAACCAAAGCATCGGAAAGGGGTTTGGGCATCTTT
+CCCTTTTGATATGGGATAATGCTTCTGATCTGAAAATCATCCAGGTTACAGGCTAGATCC
+CCGGTGCATCGGATGGAAAGCCATTGATTGCAGATATCGTAATCATCATAATGGTAGTCG
+CCCTCTGTAACTTCAATTTCAGCATCCACCACGACATCAAATTCTATTTTCAGATCCGGG
+AGGTCGTAAACCGTCACGAATTTAATTACCATATCCGACATGGCAACCCCGCCAACTTCA
+TGAACATTACGCAGATATAAATCTAAACTCTCCCAATTTTGCTCGACATATTCTTCTGCT
+GCAGGATAAAGGTCATCAAGAAACCGGCTTTTTACATAATCGGTAAAAGAGCGATCGCCC
+GCCACGTCATAGCCCCCCTTCCCCCATAGGTAAATTATAGCACATATTGTCGCATGCTCA
+ACCTGATATTTGCATTTGTAAATTTTAATTGCGCTATAACTCTTTTTGTGTTAGTCTTTA
+TAGGCAGCTAAGTGAGGTGGCAACATGAGGACAAGTTATAAGAAACTATGGAAGCTCTTG
+ATAGATAGGGATATGTTAAAGAAGGATTTGCGGGAGACTGCCGGAATCAGTACAGCATCC
+ATGGCCAAGCTGGGCAAAGGTGAAAATGTGACCACTGACGTCTTGGTTAAAATATGTAAG
+GCTCTGGACTGTGATATTTCTGATATCGTGGAGATTGTGGAGGAATAA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_000913.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_000913.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,144 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_000913.3|provirus_563848_584430_520 563848 564480 633 -1 0.368 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_521 564815 565978 1164 -1 0.467 11 GGAG/GAGG GENOMAD.133037.VP 1.252e-16 85 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_563848_584430_522 566098 566361 264 -1 0.496 11 GGA/GAG/AGG GENOMAD.095346.VP 5.936e-50 171 0 0 1 2561 Caudoviricetes NA NA PF09588;K01143;COG5377;TIGR03033 Phage-related protein, predicted endonuclease
+NC_000913.3|provirus_563848_584430_523 566684 566779 96 1 0.521 11 AGGAG GENOMAD.086130.VV 3.579e-13 62 0 0 0 2561 Caudoviricetes NA NA PF08222;TIGR00373;COG4519 CodY helix-turn-helix domain
+NC_000913.3|provirus_563848_584430_524 566842 567141 300 1 0.500 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_525 567138 568004 867 1 0.551 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_526 568315 568647 333 1 0.411 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_527 568902 570428 1527 1 0.356 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_528 570893 571444 552 1 0.424 11 GGAG/GAGG GENOMAD.189584.CP 1.606e-07 53 0 0 0 1 NA NA NA PF01161;COG1881;TIGR00481 Phosphatidylethanolamine-binding protein
+NC_000913.3|provirus_563848_584430_529 571454 572251 798 1 0.362 11 AGxAGG/AGGxGG GENOMAD.166602.PC 1.614e-10 64 0 0 0 1 NA NA NA PF06719;PF12833;TIGR02297;K18991;COG2207 4-hydroxyphenylacetate catabolism regulatory protein HpaA
+NC_000913.3|provirus_563848_584430_530 572466 572921 456 1 0.504 11 GGAGG GENOMAD.022699.VV 2.722e-81 265 0 0 0 2561 Caudoviricetes NA NA PF05772 NinB protein
+NC_000913.3|provirus_563848_584430_531 572921 573091 171 1 0.485 11 AGGAGG GENOMAD.177576.VP 2.504e-28 107 0 0 0 2561 Caudoviricetes NA NA PF05322 NINE Protein
+NC_000913.3|provirus_563848_584430_532 573084 573374 291 1 0.533 11 AGGAGG GENOMAD.038211.VV 1.658e-20 87 0 0 0 2561 Caudoviricetes NA NA PF07102 Putative nuclease YbcO
+NC_000913.3|provirus_563848_584430_533 573371 573733 363 1 0.532 11 AGxAGG/AGGxGG GENOMAD.154527.VP 2.554e-18 82 0 0 0 2561 Caudoviricetes NA NA PF05866;K01160;COG4570 Holliday junction resolvase RusA (prophage-encoded endonuclease)
+NC_000913.3|provirus_563848_584430_534 573733 573870 138 1 0.478 11 GGA/GAG/AGG GENOMAD.073918.VV 4.945e-10 54 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_563848_584430_535 573956 574339 384 1 0.430 11 GGAG/GAGG GENOMAD.054312.VV 3.04e-60 203 0 0 0 2561 Caudoviricetes NA NA PF06576 Phage antitermination protein Q
+NC_000913.3|provirus_563848_584430_536 574481 574699 219 1 0.447 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_537 574737 575717 981 -1 0.550 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_538 575758 576825 1068 -1 0.444 11 GGA/GAG/AGG GENOMAD.042052.CC 7.284e-09 60 0 0 0 1 NA NA NA PF00267;K10940;COG3203 Outer membrane protein (porin)
+NC_000913.3|provirus_563848_584430_539 577398 577613 216 1 0.477 11 GGAG/GAGG GENOMAD.208385.VP 5.344e-28 107 0 0 1 2561 Caudoviricetes NA NA PF04971 Bacteriophage P21 holin S
+NC_000913.3|provirus_563848_584430_540 577613 578110 498 1 0.476 11 GGAG/GAGG GENOMAD.171676.VP 2.772e-28 113 0 0 1 2561 Caudoviricetes NA NA PF00959;COG3772 Phage-related lysozyme (muramidase), GH24 family
+NC_000913.3|provirus_563848_584430_541 578107 578568 462 1 0.513 11 GGxGG GENOMAD.219285.VP 5.677e-41 149 0 0 0 2561 Caudoviricetes NA NA PF03245 Bacteriophage Rz lysis protein
+NC_000913.3|provirus_563848_584430_542 578600 578893 294 -1 0.422 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_543 579184 579594 411 -1 0.314 11 GGA/GAG/AGG GENOMAD.227189.VP 1.298e-32 124 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_563848_584430_544 579880 580086 207 1 0.396 11 GGAG/GAGG GENOMAD.227340.VP 5.416e-34 124 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_545 580834 581379 546 1 0.526 11 GGA/GAG/AGG GENOMAD.161251.VP 7.238e-77 254 0 0 1 2561 Caudoviricetes NA NA PF07471;K22014;COG4220 Phage DNA packaging protein, Nu1 subunit of terminase
+NC_000913.3|provirus_563848_584430_546 581354 582097 744 1 0.508 11 None GENOMAD.167268.VP 1.572e-44 164 0 0 1 2561 Caudoviricetes NA NA PF02413 Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_563848_584430_547 582152 582583 432 -1 0.412 11 3Base/5BMM NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_563848_584430_548 582875 583060 186 1 0.495 11 GGA/GAG/AGG GENOMAD.178075.VP 3.901e-19 81 0 0 1 2561 Caudoviricetes NA NA PF02413 Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_563848_584430_549 583681 584430 750 1 0.317 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1105 1196867 1197532 666 -1 0.350 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1106 1197533 1198228 696 -1 0.310 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1107 1198695 1199588 894 1 0.368 11 GGAG/GAGG GENOMAD.088167.PP 1.632e-150 473 0 0 0 1 NA NA NA PF10463;COG2856 Peptidase U49
+NC_000913.3|provirus_1196867_1213107_1108 1199679 1200806 1128 -1 0.447 11 GGA/GAG/AGG GENOMAD.195357.VP 1.34e-89 301 0 0 0 2561 Caudoviricetes NA NA PF09003;K21039 Bacteriophage lambda integrase, Arm DNA-binding domain
+NC_000913.3|provirus_1196867_1213107_1109 1200787 1201032 246 -1 0.435 11 GGA/GAG/AGG GENOMAD.095038.VV 1.817e-43 152 0 0 0 2561 Caudoviricetes NA NA PF07825 Excisionase-like protein
+NC_000913.3|provirus_1196867_1213107_1110 1201497 1201838 342 1 0.386 11 AGGA GENOMAD.226053.VP 1.147e-47 166 0 0 0 2561 Caudoviricetes NA NA PF11080;K18840 Endoribonuclease GhoS
+NC_000913.3|provirus_1196867_1213107_1111 1201776 1202084 309 -1 0.469 11 GGAG/GAGG GENOMAD.226995.VP 1.008e-59 200 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1112 1202259 1202933 675 -1 0.441 11 3Base/5BMM NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1113 1203024 1203224 201 1 0.428 11 GGAGG GENOMAD.218084.VP 6.055e-32 118 0 0 0 2561 Caudoviricetes NA NA PF15943;COG4197 NA
+NC_000913.3|provirus_1196867_1213107_1114 1203268 1203825 558 1 0.496 11 GGAG/GAGG GENOMAD.058510.VV 7.507e-87 283 0 0 1 2561 Caudoviricetes NA NA PF06892 Phage regulatory protein CII (CP76)
+NC_000913.3|provirus_1196867_1213107_1115 1203822 1204160 339 1 0.499 11 GGAG/GAGG GENOMAD.102216.VV 1.096e-55 189 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1116 1204170 1205537 1368 1 0.543 11 GGAG/GAGG GENOMAD.159591.VP 5.958e-37 149 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1117 1205549 1205731 183 1 0.601 11 GGAG/GAGG GENOMAD.088953.VV 9.423e-11 57 0 0 0 2561 Caudoviricetes NA NA PF10003 NA
+NC_000913.3|provirus_1196867_1213107_1118 1205731 1206204 474 1 0.563 11 GGAGG GENOMAD.031947.VV 1.897e-07 52 0 0 1 2561 Caudoviricetes NA NA PF04860;TIGR01537 phage portal protein, HK97 family
+NC_000913.3|provirus_1196867_1213107_1119 1206173 1206922 750 1 0.576 11 None GENOMAD.110264.VV 3.24e-56 198 0 0 1 2561 Caudoviricetes NA NA PF04865;COG3948 Phage-related baseplate assembly protein
+NC_000913.3|provirus_1196867_1213107_1120 1206913 1207497 585 1 0.573 11 GGA/GAG/AGG GENOMAD.113504.VP 5.104e-87 284 0 0 1 2561 Caudoviricetes NA NA PF10076;COG3778 Uncharacterized protein YmfQ in lambdoid prophage, DUF2313 family
+NC_000913.3|provirus_1196867_1213107_1121 1207501 1208130 630 1 0.503 11 GGAG/GAGG GENOMAD.044962.VV 2.458e-85 280 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1122 1208171 1208545 375 1 0.437 11 None GENOMAD.045203.VV 3.842e-40 145 0 0 1 2561 Caudoviricetes NA NA PF02413 Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_1196867_1213107_1123 1208517 1209119 603 -1 0.476 11 GGAG/GAGG GENOMAD.140378.VP 8.011e-41 151 0 0 1 2561 Caudoviricetes NA NA PF02413 NA
+NC_000913.3|provirus_1196867_1213107_1124 1209119 1209655 537 -1 0.453 11 AGxAGG/AGGxGG GENOMAD.191048.VP 2.151e-63 215 0 0 0 2561 Caudoviricetes NA NA COG4675 Microcystin-dependent protein (function unknown)
+NC_000913.3|provirus_1196867_1213107_1125 1209685 1210239 555 1 0.488 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1126 1210346 1211179 834 1 0.384 11 None GENOMAD.030786.VV 1.161e-05 49 0 0 0 2561 Caudoviricetes NA NA PF13395 HNH endonuclease
+NC_000913.3|provirus_1196867_1213107_1127 1211413 1211577 165 1 0.467 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1196867_1213107_1128 1212703 1213107 405 -1 0.368 11 AGGA/GGAG/GAGG GENOMAD.227190.VP 2.116e-26 106 0 0 0 2561 Caudoviricetes NA NA PF07166;COG5562 Prophage-encoded protein YbcV, DUF1398 family
+NC_000913.3|provirus_1412000_1434224_1320 1412000 1413235 1236 -1 0.428 11 None GENOMAD.159447.VP 2.063e-29 125 0 0 1 2561 Caudoviricetes NA NA PF12167;K14059;TIGR01634;COG4385 phage tail protein, P2 protein I family
+NC_000913.3|provirus_1412000_1434224_1321 1413237 1413452 216 -1 0.454 11 GGAG/GAGG GENOMAD.114098.VV 1.562e-32 120 0 0 0 2561 Caudoviricetes NA NA PF06806 Putative excisionase (DUF1233)
+NC_000913.3|provirus_1412000_1434224_1322 1413531 1413740 210 -1 0.352 11 GGAGG GENOMAD.223267.VP 1.749e-30 114 0 0 0 1 NA NA NA PF06688;K19780 NA
+NC_000913.3|provirus_1412000_1434224_1323 1413984 1414793 810 -1 0.472 11 AGGA GENOMAD.127355.VP 2.712e-58 205 0 0 0 2561 Caudoviricetes NA NA PF03837;TIGR00616;COG3723 recombinase, phage RecT family
+NC_000913.3|provirus_1412000_1434224_1324 1414786 1417386 2601 -1 0.494 11 GGAG/GAGG GENOMAD.084315.VV 4.036e-74 272 0 0 0 2561 Caudoviricetes NA NA PF06630;K10906 Enterobacterial exodeoxyribonuclease VIII
+NC_000913.3|provirus_1412000_1434224_1325 1417488 1417763 276 -1 0.391 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1326 1417838 1418008 171 -1 0.374 11 GGAG/GAGG GENOMAD.110847.VV 1.628e-32 119 0 0 0 1 NA NA NA PF04181 NA
+NC_000913.3|provirus_1412000_1434224_1327 1418008 1418229 222 -1 0.410 11 GGAG/GAGG GENOMAD.074955.VV 1.258e-35 129 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1328 1418548 1419159 612 1 0.395 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1329 1419156 1419311 156 -1 0.481 11 GGA/GAG/AGG GENOMAD.222124.VP 1.495e-23 93 0 0 0 2561 Caudoviricetes NA NA PF07151 NA
+NC_000913.3|provirus_1412000_1434224_1330 1419322 1419456 135 -1 0.474 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1331 1419765 1420241 477 -1 0.419 11 AGGAG/GGAGG GENOMAD.115833.VV 4.047e-72 239 0 0 0 2561 Caudoviricetes NA NA PF00376;COG5606;TIGR00673;K10123 MerR family regulatory protein
+NC_000913.3|provirus_1412000_1434224_1332 1420365 1420661 297 1 0.434 11 GGAG/GAGG GENOMAD.054651.VV 1.154e-09 56 0 0 0 2561 Caudoviricetes NA NA PF15943;COG4197 DNA-binding transcriptional regulator YdaS, prophage-encoded, Cro superfamily
+NC_000913.3|provirus_1412000_1434224_1333 1420684 1421106 423 1 0.508 11 GGAG/GAGG GENOMAD.072359.VV 8.614e-72 237 0 0 0 2561 Caudoviricetes NA NA PF06254 Putative bacterial toxin ydaT
+NC_000913.3|provirus_1412000_1434224_1334 1421119 1421976 858 1 0.479 11 None GENOMAD.195765.VP 5.5e-122 390 0 0 0 2561 Caudoviricetes NA NA PF07120;COG3756 Uncharacterized conserved protein YdaU, DUF1376 family
+NC_000913.3|provirus_1412000_1434224_1335 1421983 1422729 747 1 0.527 11 AGxAGG/AGGxGG GENOMAD.047125.VV 5.612e-10 62 0 0 1 2561 Caudoviricetes NA NA PF16463;COG5437;TIGR02126 Phage tail tube protein family
+NC_000913.3|provirus_1412000_1434224_1336 1422752 1423312 561 1 0.488 11 GGAG/GAGG GENOMAD.144793.VV 5.225e-30 119 0 0 0 1 NA NA NA PF07789 NA
+NC_000913.3|provirus_1412000_1434224_1337 1423345 1423644 300 1 0.533 11 GGA/GAG/AGG GENOMAD.219285.VP 4.845e-42 149 0 0 0 2561 Caudoviricetes NA NA PF03245 Bacteriophage Rz lysis protein
+NC_000913.3|provirus_1412000_1434224_1338 1423815 1425239 1425 1 0.382 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1339 1425377 1425640 264 1 0.481 11 GGA/GAG/AGG GENOMAD.159709.VV 5.097e-06 45 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1340 1425621 1425980 360 1 0.472 11 None GENOMAD.109865.VV 7.702e-05 43 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1341 1426454 1427482 1029 1 0.468 11 AGGAG GENOMAD.120741.VP 1.03e-151 479 0 0 1 2561 Caudoviricetes NA NA COG5281 Phage-related minor tail protein
+NC_000913.3|provirus_1412000_1434224_1342 1427482 1427613 132 1 0.553 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1343 1427746 1428726 981 -1 0.555 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1344 1429049 1432411 3363 1 0.533 11 None GENOMAD.020617.VV 5.058e-116 406 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1345 1432411 1432986 576 1 0.481 11 GGAG/GAGG GENOMAD.167268.VP 3.58e-55 192 0 0 1 2561 Caudoviricetes NA NA PF02413 Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_1412000_1434224_1346 1433084 1433674 591 -1 0.448 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1412000_1434224_1347 1433991 1434224 234 -1 0.359 11 AGGA GENOMAD.221767.PV 3.984e-26 102 0 0 0 1 NA NA NA PF10965 Biofilm development protein YmgB/AriR
+NC_000913.3|provirus_1627517_1653915_1513 1627517 1628263 747 1 0.506 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1514 1628352 1629038 687 1 0.501 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1515 1629215 1629418 204 1 0.520 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1516 1629453 1630913 1461 -1 0.494 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1517 1631002 1632285 1284 -1 0.469 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1518 1633072 1633305 234 1 0.355 11 AGGA GENOMAD.221767.PV 3.984e-26 102 0 0 0 1 NA NA NA PF10965 Biofilm development protein YmgB/AriR
+NC_000913.3|provirus_1627517_1653915_1519 1633622 1634212 591 1 0.448 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1520 1634310 1634885 576 -1 0.479 11 GGAG/GAGG GENOMAD.167268.VP 3.58e-55 192 0 0 1 2561 Caudoviricetes NA NA PF02413 Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_1627517_1653915_1521 1634885 1635847 963 -1 0.526 11 None GENOMAD.211480.VP 3.667e-69 239 0 0 0 2561 Caudoviricetes NA NA COG5301 Phage-related tail fibre protein
+NC_000913.3|provirus_1627517_1653915_1522 1635798 1636367 570 -1 0.537 11 GGA/GAG/AGG GENOMAD.161251.VP 1.255e-74 248 0 0 1 2561 Caudoviricetes NA NA PF07471;K22014;COG4220 Phage DNA packaging protein, Nu1 subunit of terminase
+NC_000913.3|provirus_1627517_1653915_1523 1637047 1637457 411 1 0.316 11 GGA/GAG/AGG GENOMAD.227189.VP 1.298e-32 124 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1524 1637609 1637782 174 -1 0.299 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1525 1638455 1638667 213 -1 0.404 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1526 1639030 1639527 498 -1 0.458 11 GGA/GAG/AGG GENOMAD.062288.VV 1.369e-70 235 0 0 0 2561 Caudoviricetes NA NA PF10721 NA
+NC_000913.3|provirus_1627517_1653915_1527 1639524 1640057 534 -1 0.506 11 None GENOMAD.171676.VP 8.945e-29 115 0 0 1 2561 Caudoviricetes NA NA PF00959;COG3772 Phage-related lysozyme (muramidase), GH24 family
+NC_000913.3|provirus_1627517_1653915_1528 1640054 1640365 312 -1 0.439 11 AGGAG GENOMAD.225519.VP 1.173e-50 174 0 0 0 1 NA NA NA PF07041 NA
+NC_000913.3|provirus_1627517_1653915_1529 1640370 1640576 207 -1 0.473 11 AGGA GENOMAD.208385.VP 5.126e-27 104 0 0 1 2561 Caudoviricetes NA NA PF04971 Bacteriophage P21 holin S
+NC_000913.3|provirus_1627517_1653915_1530 1640618 1640737 120 1 0.342 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1531 1641339 1641554 216 -1 0.356 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1532 1641855 1642067 213 1 0.484 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1533 1642489 1643241 753 -1 0.481 11 GGAG/GAGG GENOMAD.136613.VP 1.109e-26 112 0 0 0 2561 Caudoviricetes NA NA PF03589;TIGR02642 Antitermination protein
+NC_000913.3|provirus_1627517_1653915_1534 1643255 1644304 1050 -1 0.521 11 GGAGG GENOMAD.196019.VP 1.481e-50 186 0 0 0 2561 Caudoviricetes NA NA PF06147 dATP/dGTP pyrophosphohydrolase
+NC_000913.3|provirus_1627517_1653915_1535 1644651 1644902 252 -1 0.409 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1536 1645119 1645274 156 -1 0.519 11 AGGAG GENOMAD.136858.PV 7.473e-23 91 0 0 0 2561 Caudoviricetes NA NA PF01848;K18919 Hok/gef family
+NC_000913.3|provirus_1627517_1653915_1537 1645346 1645633 288 -1 0.469 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1538 1645633 1645872 240 -1 0.471 11 GGAG/GAGG GENOMAD.151401.PV 4.39e-26 102 0 0 0 1 NA NA NA PF04221;TIGR02384;COG3077;K07473 addiction module antitoxin, RelB/DinJ family
+NC_000913.3|provirus_1627517_1653915_1539 1646405 1646737 333 1 0.429 11 AGGAG GENOMAD.078672.PP 6.68e-60 201 0 0 0 1 NA NA NA PF14282 FlxA-like protein
+NC_000913.3|provirus_1627517_1653915_1540 1647122 1647349 228 -1 0.421 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1541 1647346 1647636 291 -1 0.505 11 GGxGG GENOMAD.150946.VV 3.745e-51 175 0 0 0 1 NA NA NA PF06254 Putative bacterial toxin ydaT
+NC_000913.3|provirus_1627517_1653915_1542 1647620 1647850 231 -1 0.459 11 GGA/GAG/AGG GENOMAD.108381.VV 1.622e-34 126 0 0 0 2561 Caudoviricetes NA NA K22302 NA
+NC_000913.3|provirus_1627517_1653915_1543 1647934 1648341 408 1 0.436 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1544 1648508 1648663 156 1 0.481 11 GGAG/GAGG GENOMAD.222124.VP 6.689e-24 94 0 0 0 2561 Caudoviricetes NA NA PF07151 NA
+NC_000913.3|provirus_1627517_1653915_1545 1648665 1648793 129 1 0.465 11 GGA/GAG/AGG GENOMAD.136713.VV 1.3e-20 84 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1546 1648823 1649041 219 1 0.479 11 GGAG/GAGG GENOMAD.180239.VV 1.159e-43 152 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1547 1649045 1649209 165 -1 0.509 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1548 1649609 1649797 189 1 0.360 11 GGAG/GAGG GENOMAD.189052.VV 3.595e-35 127 0 0 0 2561 Caudoviricetes NA NA PF05358;K22304 DicB protein
+NC_000913.3|provirus_1627517_1653915_1549 1649794 1649985 192 1 0.432 11 AGGA GENOMAD.094923.VV 7.175e-29 109 0 0 0 2561 Caudoviricetes NA NA PF07358 NA
+NC_000913.3|provirus_1627517_1653915_1550 1650078 1650998 921 1 0.497 11 GGAG/GAGG GENOMAD.075680.VV 3.9e-07 54 0 0 0 2561 Caudoviricetes NA NA K10906 NA
+NC_000913.3|provirus_1627517_1653915_1551 1650995 1651537 543 1 0.541 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1552 1651512 1652708 1197 1 0.422 11 None GENOMAD.099267.VV 1.899e-19 94 0 0 0 2561 Caudoviricetes NA NA PF00589;TIGR02224;COG4973;K03733 tyrosine recombinase XerC
+NC_000913.3|provirus_1627517_1653915_1553 1652728 1652838 111 -1 0.414 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_1627517_1653915_1554 1652896 1653915 1020 -1 0.449 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2313 2461306 2462646 1341 1 0.498 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2314 2463012 2464070 1059 1 0.355 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2315 2464252 2465007 756 -1 0.519 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2316 2465301 2466233 933 1 0.486 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2317 2466545 2467702 1158 1 0.478 11 GGA/GAG/AGG GENOMAD.064492.VV 0.0007762 44 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2318 2468214 2469134 921 1 0.395 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2319 2469131 2470462 1332 1 0.276 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2320 2470803 2471105 303 1 0.545 11 GGA/GAG/AGG GENOMAD.167268.VP 2.711e-17 78 0 0 1 2561 Caudoviricetes NA NA PF02413 Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_2461306_2476510_2321 2471077 2471517 441 -1 0.454 11 GGAG/GAGG GENOMAD.045203.VV 2.366e-80 262 0 0 1 2561 Caudoviricetes NA NA PF02413 Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_2461306_2476510_2322 2471544 2472146 603 -1 0.509 11 GGAG/GAGG GENOMAD.044962.VV 4.611e-91 296 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2323 2472112 2472387 276 -1 0.518 11 GGxGG GENOMAD.178309.VP 1.935e-09 55 0 0 0 2561 Caudoviricetes NA NA PF05869;TIGR01712 phage N-6-adenine-methyltransferase
+NC_000913.3|provirus_2461306_2476510_2324 2472387 2472881 495 -1 0.545 11 AGGA GENOMAD.225234.VP 1.741e-67 226 0 0 0 2561 Caudoviricetes NA NA PF06069 PerC transcriptional activator
+NC_000913.3|provirus_2461306_2476510_2325 2472878 2473246 369 -1 0.556 11 GGA/GAG/AGG GENOMAD.086968.VV 4.891e-69 228 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2326 2473604 2473966 363 1 0.501 11 AGGAG GENOMAD.056235.VV 4.359e-53 182 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2327 2474032 2474856 825 1 0.457 11 GGAG/GAGG GENOMAD.052651.VV 8.505e-66 227 0 0 0 2561 Caudoviricetes NA NA PF10065;COG5532 Uncharacterized conserved protein YfdQ, DUF2303 family
+NC_000913.3|provirus_2461306_2476510_2328 2474984 2475520 537 1 0.462 11 GGAG/GAGG GENOMAD.172054.VC 5.137e-36 136 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2329 2475511 2475873 363 1 0.471 11 GGAG/GAGG GENOMAD.067358.VV 4.901e-68 225 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2330 2475873 2476178 306 1 0.428 11 GGAGG GENOMAD.222350.VP 2.161e-43 153 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_000913.3|provirus_2461306_2476510_2331 2476310 2476510 201 1 0.438 11 GGAG/GAGG GENOMAD.195460.VP 1.864e-28 108 0 0 0 2561 Caudoviricetes NA NA COG2452 NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_002737.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_002737.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,172 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_002737.2|provirus_529627_569283_517 529627 531042 1416 -1 0.322 11 GGAG/GAGG GENOMAD.022372.VV 6.087e-23 106 0 0 1 2561 Caudoviricetes NA NA PF04708;COG1961;K14060 Site-specific DNA recombinase related to the DNA invertase Pin
+NC_002737.2|provirus_529627_569283_518 531163 531528 366 -1 0.333 11 GGAG/GAGG GENOMAD.142683.VV 5.916e-18 81 0 0 0 2561 Caudoviricetes NA NA PF11446;TIGR04165;COG4888 Cys-rich peptide, TIGR04165 family
+NC_002737.2|provirus_529627_569283_519 531555 532316 762 -1 0.329 11 AGGA GENOMAD.108504.VP 7.914e-35 136 0 0 0 2561 Caudoviricetes NA NA PF05866;PF00717;COG4570;TIGR02754 Endodeoxyribonuclease RusA; Peptidase S24-like
+NC_002737.2|provirus_529627_569283_520 532500 532730 231 1 0.372 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_529627_569283_521 532799 532936 138 1 0.326 11 GGAG/GAGG GENOMAD.061610.VV 0.0002144 38 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_522 532938 533063 126 1 0.302 11 AGGAG GENOMAD.129654.VV 6.909e-19 79 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_523 533060 533287 228 1 0.320 11 GGA/GAG/AGG GENOMAD.108243.VV 1.543e-34 126 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_524 533287 534606 1320 1 0.385 11 GGAG/GAGG GENOMAD.010825.VV 1.953e-201 628 0 0 0 2561 Caudoviricetes NA NA PF13175;TIGR00634;COG4717;K03546 DNA repair protein RecN
+NC_002737.2|provirus_529627_569283_525 534621 535712 1092 1 0.444 11 GGAG/GAGG GENOMAD.141036.VV 6.091e-73 252 0 0 1 2561 Caudoviricetes NA NA PF13479;TIGR01618;K04484;COG0468 phage nucleotide-binding protein
+NC_002737.2|provirus_529627_569283_526 535752 536174 423 1 0.383 11 AGGA/GGAG/GAGG GENOMAD.092954.VV 1.157e-35 133 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_527 536176 536910 735 1 0.351 11 AGGA GENOMAD.014438.VV 4.323e-50 180 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_528 536932 537567 636 1 0.410 11 AGGAG GENOMAD.005320.VV 5.429e-31 123 0 0 0 2561 Caudoviricetes NA NA PF05037 NA
+NC_002737.2|provirus_529627_569283_529 537567 539150 1584 1 0.411 11 GGAGG GENOMAD.030980.VV 1.795e-05 50 0 0 0 2561 Caudoviricetes NA NA PF04851;PF17338;K17677;TIGR00614;COG1061 Type III restriction enzyme, res subunit; Gene product 88
+NC_002737.2|provirus_529627_569283_530 539160 539789 630 1 0.314 11 AGGAG GENOMAD.116271.VP 3.678e-24 103 0 0 0 2561 Caudoviricetes NA NA PF07768 PVL ORF-50-like family
+NC_002737.2|provirus_529627_569283_531 539779 542052 2274 1 0.395 11 GGA/GAG/AGG GENOMAD.168744.VP 3.155e-85 303 0 0 0 2561 Caudoviricetes NA NA K07505 NA
+NC_002737.2|provirus_529627_569283_532 542330 542548 219 1 0.292 11 GGAG/GAGG GENOMAD.004447.VV 1.326e-12 63 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_533 542541 542936 396 1 0.419 11 GGA/GAG/AGG GENOMAD.028440.VV 8.304e-68 225 0 0 0 2561 Caudoviricetes NA NA PF05866;COG4570;K01160 Holliday junction resolvase RusA (prophage-encoded endonuclease)
+NC_002737.2|provirus_529627_569283_534 542933 543154 222 1 0.365 11 AGxAGG/AGGxGG GENOMAD.053518.VV 3.344e-41 145 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_535 543157 543429 273 1 0.418 11 GGAGG GENOMAD.072347.VV 1.269e-43 153 0 0 0 2561 Caudoviricetes NA NA TIGR02209 NA
+NC_002737.2|provirus_529627_569283_536 543431 544066 636 1 0.358 11 GGAGG GENOMAD.138295.VP 1.141e-77 258 0 0 0 2561 Caudoviricetes NA NA TIGR02987;COG0827 NA
+NC_002737.2|provirus_529627_569283_537 544339 544773 435 1 0.418 11 GGAGG GENOMAD.111673.VV 1.324e-85 277 0 0 0 2561 Caudoviricetes NA NA PF05263;TIGR01637 phage transcriptional regulator, ArpU family
+NC_002737.2|provirus_529627_569283_538 545083 546249 1167 1 0.373 11 AGGA GENOMAD.038338.VV 1.175e-46 176 0 0 0 2561 Caudoviricetes NA NA COG3392 NA
+NC_002737.2|provirus_529627_569283_539 546592 547068 477 1 0.449 11 AGGA GENOMAD.003239.VV 1.762e-30 119 0 0 1 2561 Caudoviricetes NA NA PF05133;TIGR01538 phage portal protein, SPP1 family
+NC_002737.2|provirus_529627_569283_540 547151 548362 1212 1 0.412 11 GGA/GAG/AGG GENOMAD.064889.VV 5.208e-172 541 0 0 1 2561 Caudoviricetes NA NA PF04466;PF17288;TIGR01547;COG1783;K06909 phage terminase, large subunit, PBSX family
+NC_002737.2|provirus_529627_569283_541 548376 549878 1503 1 0.409 11 AGGAG GENOMAD.003916.VV 9.779e-91 310 0 0 1 2561 Caudoviricetes NA NA PF05133;TIGR01542 phage portal protein, putative, A118 family
+NC_002737.2|provirus_529627_569283_542 549883 551376 1494 1 0.396 11 GGAG/GAGG GENOMAD.063181.VV 1.974e-184 582 0 0 1 2561 Caudoviricetes NA NA PF06152;TIGR01641 Phage minor capsid protein 2
+NC_002737.2|provirus_529627_569283_543 551376 551603 228 1 0.303 11 GGAGG GENOMAD.148778.VV 3.696e-41 145 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_529627_569283_544 551690 551956 267 1 0.363 11 AGGAG GENOMAD.076597.VV 2.091e-45 158 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_545 552088 552696 609 1 0.399 11 AGGAG GENOMAD.041104.VV 8.665e-41 151 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_546 552700 553518 819 1 0.435 11 AGGA GENOMAD.013974.VV 8.477e-55 195 0 0 1 2561 Caudoviricetes NA NA PF20036;TIGR04387 major capsid protein, N4-gp56 family
+NC_002737.2|provirus_529627_569283_547 553572 553988 417 1 0.396 11 GGA/GAG/AGG GENOMAD.034545.VV 3.007e-49 172 0 0 0 2561 Caudoviricetes NA NA PF11436 NA
+NC_002737.2|provirus_529627_569283_548 553978 554310 333 1 0.393 11 None GENOMAD.114565.VV 2.724e-37 136 0 0 1 2561 Caudoviricetes NA NA PF10665 Minor capsid protein
+NC_002737.2|provirus_529627_569283_549 554310 554666 357 1 0.440 11 GGAGG GENOMAD.008261.VV 1.315e-48 169 0 0 1 2561 Caudoviricetes NA NA PF11114 Minor capsid protein
+NC_002737.2|provirus_529627_569283_550 554663 555061 399 1 0.363 11 GGA/GAG/AGG GENOMAD.034546.VV 2.354e-24 100 0 0 1 2561 Caudoviricetes NA NA PF12691 Bacteriophage minor capsid protein
+NC_002737.2|provirus_529627_569283_551 555061 555531 471 1 0.425 11 AGxAGG/AGGxGG GENOMAD.028171.VV 1.557e-56 194 0 0 1 2561 Caudoviricetes NA NA PF16461;COG5437 Lambda phage tail tube protein, TTP
+NC_002737.2|provirus_529627_569283_552 555584 556018 435 1 0.393 11 AGGAG GENOMAD.064813.VV 7.473e-34 128 0 0 1 2561 Caudoviricetes NA NA PF10666 Phage tail assembly chaperone protein Gp14 ()A118
+NC_002737.2|provirus_529627_569283_553 556022 556603 582 1 0.376 11 AGGAG GENOMAD.013935.VV 5.591e-51 180 0 0 0 2561 Caudoviricetes NA NA PF06854 Bacteriophage Gp15 protein
+NC_002737.2|provirus_529627_569283_554 556593 559853 3261 1 0.431 11 AGGAG GENOMAD.002456.VV 1.364e-297 940 0 0 1 2561 Caudoviricetes NA NA COG3941 NA
+NC_002737.2|provirus_529627_569283_555 559850 560566 717 1 0.389 11 GGA/GAG/AGG GENOMAD.006390.VV 2.824e-80 267 0 0 0 2561 Caudoviricetes NA NA PF20195;COG4722;TIGR01633 Phage-related protein
+NC_002737.2|provirus_529627_569283_556 560563 562707 2145 1 0.422 11 None GENOMAD.049306.VV 0.0 1000 0 0 0 2561 Caudoviricetes NA NA COG4926 Phage-related protein
+NC_002737.2|provirus_529627_569283_557 562704 563717 1014 1 0.438 11 GGAGG GENOMAD.093524.VV 3.153e-136 434 0 0 0 2561 Caudoviricetes NA NA PF07212 Hyaluronidase protein (HylP)
+NC_002737.2|provirus_529627_569283_558 563732 565618 1887 1 0.449 11 AGGAG GENOMAD.033709.VV 0.0 1088 0 0 0 2561 Caudoviricetes NA NA PF07902 gp58-like protein
+NC_002737.2|provirus_529627_569283_559 565630 566061 432 1 0.354 11 AGGAG GENOMAD.073534.VV 4.564e-80 261 0 0 0 2561 Caudoviricetes NA NA PF07761 NA
+NC_002737.2|provirus_529627_569283_560 566064 566681 618 1 0.430 11 AGGAG GENOMAD.024672.VV 8.84e-112 356 0 0 0 2561 Caudoviricetes NA NA PF07104 NA
+NC_002737.2|provirus_529627_569283_561 566691 566966 276 1 0.348 11 GGAG/GAGG GENOMAD.039653.VV 9.653e-09 53 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_562 566963 567190 228 1 0.390 11 AGGAG GENOMAD.126098.VV 2.718e-14 68 0 0 0 2561 Caudoviricetes NA NA COG5546 NA
+NC_002737.2|provirus_529627_569283_563 567199 567309 111 1 0.387 11 AGGAG GENOMAD.102275.VV 5.331e-12 59 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_564 567306 568508 1203 1 0.446 11 AGGAG GENOMAD.133734.VP 7.911e-45 171 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_529627_569283_565 568576 569283 708 -1 0.284 11 AGGAG GENOMAD.223462.VP 3.741e-24 104 0 0 0 2561 Caudoviricetes NA NA PF02876;PF01123;K11040 Staphylococcal/Streptococcal toxin, beta-grasp domain; Staphylococcal/Streptococcal toxin, OB-fold domain
+NC_002737.2|provirus_777501_820593_756 777501 778541 1041 1 0.404 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_777501_820593_757 778635 779774 1140 -1 0.389 11 GGAG/GAGG GENOMAD.111131.VV 7.217e-08 57 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_758 780028 780837 810 -1 0.344 11 AGGAG GENOMAD.221704.VP 7.412e-31 125 0 0 0 2561 Caudoviricetes NA NA PF02452;COG3692;K18841 Uncharacterized protein YifN, PemK superfamily
+NC_002737.2|provirus_777501_820593_759 780850 781596 747 -1 0.395 11 AGGAG GENOMAD.179094.VV 4.977e-08 56 0 0 0 2561 Caudoviricetes NA NA PF08667;COG1974;K18830;TIGR02612 SOS-response transcriptional repressor LexA (RecA-mediated autopeptidase)
+NC_002737.2|provirus_777501_820593_760 781786 781944 159 1 0.358 11 AGGAG GENOMAD.097925.VV 1.016e-27 105 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_761 781978 782145 168 1 0.256 11 AGGAG GENOMAD.116752.VV 1.286e-19 82 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_762 782123 782962 840 -1 0.295 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_777501_820593_763 783080 783307 228 -1 0.346 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_777501_820593_764 783381 783587 207 1 0.382 11 AGGAG GENOMAD.223061.VP 0.0006542 38 0 0 0 2561 Caudoviricetes NA NA PF06892;COG5606;TIGR00673;K07727 Predicted DNA-binding protein, XRE-type HTH domain
+NC_002737.2|provirus_777501_820593_765 783627 784355 729 1 0.401 11 GGA/GAG/AGG GENOMAD.133073.VP 1.055e-36 141 0 0 0 2561 Caudoviricetes NA NA PF03374;COG3645 Phage antirepressor protein YoqD, KilAC domain
+NC_002737.2|provirus_777501_820593_766 784387 784653 267 1 0.356 11 GGAG/GAGG GENOMAD.133830.VV 1.414e-41 147 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_767 784588 785394 807 -1 0.369 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_777501_820593_768 785536 785772 237 -1 0.350 11 None GENOMAD.153962.VV 1.274e-45 158 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_769 785983 786222 240 1 0.363 11 None GENOMAD.050216.VV 1.824e-42 149 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_770 786224 786409 186 1 0.371 11 AGGAG GENOMAD.105558.VV 2.903e-29 110 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_771 786509 786748 240 1 0.342 11 GGA/GAG/AGG GENOMAD.136142.VP 7.591e-36 130 0 0 0 2561 Caudoviricetes NA NA PF13730;TIGR00373;COG4738;K07721 transcription factor E
+NC_002737.2|provirus_777501_820593_772 786892 787278 387 1 0.367 11 AGGAG GENOMAD.198321.CP 4.29e-06 47 0 0 0 2561 Caudoviricetes NA NA PF07261;COG3611;TIGR04548;K02086 Replication initiation and membrane attachment protein DnaB
+NC_002737.2|provirus_777501_820593_773 787259 787492 234 1 0.355 11 None GENOMAD.100896.VV 1.121e-38 138 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_774 787489 787629 141 1 0.404 11 AGGAG GENOMAD.079484.VV 1.722e-06 44 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_775 787638 787844 207 1 0.435 11 AGGAG GENOMAD.114751.VV 3.555e-38 136 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_776 787900 788229 330 1 0.333 11 GGAG/GAGG GENOMAD.040347.VV 1.569e-42 151 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_777 788232 789023 792 1 0.398 11 GGAGG GENOMAD.177891.VP 2.824e-31 126 0 0 0 2561 Caudoviricetes NA NA PF03837;TIGR01913;COG3723 phage recombination protein Bet
+NC_002737.2|provirus_777501_820593_778 789033 789698 666 1 0.399 11 AGGAG GENOMAD.012371.VV 4.137e-128 404 0 0 0 2561 Caudoviricetes NA NA PF07083 NA
+NC_002737.2|provirus_777501_820593_779 789702 790061 360 1 0.408 11 None GENOMAD.012371.VV 7.592e-55 187 0 0 0 2561 Caudoviricetes NA NA PF07083 NA
+NC_002737.2|provirus_777501_820593_780 790257 790595 339 1 0.354 11 GGA/GAG/AGG GENOMAD.060064.VV 3.644e-11 61 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_781 790592 791104 513 1 0.382 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_777501_820593_782 791091 791285 195 1 0.385 11 GGA/GAG/AGG GENOMAD.100776.VV 1.514e-29 111 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_783 791282 791527 246 1 0.374 11 GGAG/GAGG GENOMAD.105486.VP 3.33e-22 91 0 0 0 2561 Caudoviricetes NA NA PF09643;TIGR01671 phage uncharacterized protein TIGR01671
+NC_002737.2|provirus_777501_820593_784 791579 792040 462 1 0.383 11 AGGAG GENOMAD.003865.VV 3.718e-37 138 0 0 1 2561 Caudoviricetes NA NA PF11753;PF07852 Protein of unknwon function (DUF3310)
+NC_002737.2|provirus_777501_820593_785 792037 792207 171 1 0.333 11 GGAG/GAGG GENOMAD.094280.VV 2.018e-30 113 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_786 792490 792930 441 1 0.399 11 None GENOMAD.111673.VV 9.888e-90 289 0 0 0 2561 Caudoviricetes NA NA PF05263;TIGR01637 phage transcriptional regulator, ArpU family
+NC_002737.2|provirus_777501_820593_787 793076 793279 204 1 0.338 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_777501_820593_788 793245 794159 915 1 0.286 11 GGAG/GAGG GENOMAD.141545.VV 2.021e-203 626 0 0 0 1 NA NA NA PF20505 Intracellular sensor of Lambda phage, Abi component
+NC_002737.2|provirus_777501_820593_789 794178 794639 462 1 0.266 11 GGAG/GAGG GENOMAD.146805.VV 3.296e-80 262 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_777501_820593_790 794667 795149 483 1 0.393 11 None GENOMAD.168355.VP 1.714e-11 64 0 0 1 2561 Caudoviricetes NA NA PF03592;COG3728;K07474 Phage terminase, small subunit
+NC_002737.2|provirus_777501_820593_791 795127 796416 1290 1 0.384 11 None GENOMAD.100877.VP 2.658e-56 206 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_792 796428 796790 363 1 0.413 11 AGGA GENOMAD.033166.VV 2.201e-68 226 0 0 1 2561 Caudoviricetes NA NA PF05133;TIGR01538 phage portal protein, SPP1 family
+NC_002737.2|provirus_777501_820593_793 796902 797930 1029 1 0.421 11 None GENOMAD.100877.VP 9.441e-55 198 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_794 797911 799536 1626 1 0.381 11 GGAG/GAGG GENOMAD.004769.VV 9.122e-66 238 0 0 1 2561 Caudoviricetes NA NA PF04233;COG5585;TIGR01641 NAD+--asparagine ADP-ribosyltransferase
+NC_002737.2|provirus_777501_820593_795 799527 799706 180 1 0.344 11 AGGAG GENOMAD.137178.VV 6.881e-35 126 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_796 799766 800035 270 1 0.363 11 AGGAG GENOMAD.076597.VV 2.432e-44 155 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_797 800125 800295 171 1 0.357 11 None GENOMAD.179672.VV 0.0001663 39 0 0 0 2561 Caudoviricetes NA NA PF16777;COG4453;TIGR04563 Transcriptional regulator, RHH-like, CopG
+NC_002737.2|provirus_777501_820593_798 800424 800672 249 1 0.349 11 AGGAG GENOMAD.106940.VV 2.117e-42 149 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_799 800674 801420 747 1 0.386 11 GGA/GAG/AGG GENOMAD.024598.VV 2.917e-13 72 0 0 0 2561 Caudoviricetes NA NA COG3617 Prophage antirepressor
+NC_002737.2|provirus_777501_820593_800 801532 802065 534 1 0.419 11 AGGAG GENOMAD.010937.VV 1.418e-32 126 0 0 0 2561 Caudoviricetes NA NA PF14265 NA
+NC_002737.2|provirus_777501_820593_801 802075 802455 381 1 0.365 11 AGGAG GENOMAD.010435.VV 1.932e-15 74 0 0 0 2561 Caudoviricetes NA NA PF02924 NA
+NC_002737.2|provirus_777501_820593_802 802458 803507 1050 1 0.416 11 AGGAG GENOMAD.004151.VV 1.227e-66 233 0 0 1 2561 Caudoviricetes NA NA PF03864 Phage major capsid protein E
+NC_002737.2|provirus_777501_820593_803 803519 803785 267 1 0.378 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_777501_820593_804 803797 804150 354 1 0.379 11 GGAGG GENOMAD.020971.VV 2.807e-56 191 0 0 0 2561 Caudoviricetes NA NA PF11436;TIGR01560 NA
+NC_002737.2|provirus_777501_820593_805 804147 804455 309 1 0.392 11 AGxAGG/AGGxGG GENOMAD.042575.VV 1.017e-43 154 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_806 804436 804801 366 1 0.385 11 GGA/GAG/AGG GENOMAD.011013.VV 8.24e-39 141 0 0 1 2561 Caudoviricetes NA NA PF11114;TIGR01725;COG5005 phage protein, HK97 gp10 family
+NC_002737.2|provirus_777501_820593_807 804798 805187 390 1 0.369 11 GGAGG GENOMAD.023411.VV 1.013e-64 216 0 0 1 2561 Caudoviricetes NA NA PF16807 NA
+NC_002737.2|provirus_777501_820593_808 805197 805850 654 1 0.381 11 AGGAG GENOMAD.018762.VV 2.107e-36 139 0 0 1 2561 Caudoviricetes NA NA TIGR02126;COG5437 phage major tail protein, TP901-1 family
+NC_002737.2|provirus_777501_820593_809 805910 806263 354 1 0.381 11 AGGAG GENOMAD.019874.VV 2.516e-25 102 0 0 1 2561 Caudoviricetes NA NA PF12363 Phage tail assembly chaperone protein, TAC
+NC_002737.2|provirus_777501_820593_810 806305 806634 330 1 0.345 11 None GENOMAD.025799.VV 5.349e-22 92 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_811 806649 810284 3636 1 0.436 11 AGGAG GENOMAD.013432.VV 0.0 1205 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_812 810317 811096 780 1 0.354 11 AGGA GENOMAD.016670.VV 7.839e-14 74 0 0 0 2561 Caudoviricetes NA NA PF20195;TIGR01633;COG4722 putative phage tail component, N-terminal domain
+NC_002737.2|provirus_777501_820593_813 811093 813141 2049 1 0.421 11 GGAG/GAGG GENOMAD.130674.VP 5.583e-216 683 0 0 0 2561 Caudoviricetes NA NA COG4926 Phage-related protein
+NC_002737.2|provirus_777501_820593_814 813141 814259 1119 1 0.417 11 GGAGG GENOMAD.093524.VV 4.112e-132 424 0 0 0 2561 Caudoviricetes NA NA PF07212 Hyaluronidase protein (HylP)
+NC_002737.2|provirus_777501_820593_815 814272 816182 1911 1 0.428 11 AGGAG GENOMAD.033709.VV 1.037e-307 946 0 0 0 2561 Caudoviricetes NA NA PF07902 gp58-like protein
+NC_002737.2|provirus_777501_820593_816 816196 816357 162 1 0.321 11 AGGAG GENOMAD.181912.VC 1.836e-15 70 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_817 816360 816971 612 1 0.420 11 AGxAGG/AGGxGG GENOMAD.024672.VV 4.154e-119 377 0 0 0 2561 Caudoviricetes NA NA PF07104 NA
+NC_002737.2|provirus_777501_820593_818 816982 817278 297 1 0.377 11 GGAG/GAGG GENOMAD.084276.VV 2.759e-55 187 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_819 817275 817460 186 1 0.376 11 AGGAG GENOMAD.004934.VV 1.248e-22 91 0 0 1 2561 Caudoviricetes NA NA PF16945 Putative lactococcus lactis phage r1t holin
+NC_002737.2|provirus_777501_820593_820 817464 817571 108 1 0.352 11 GGAG/GAGG GENOMAD.102275.VV 1.131e-11 58 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_777501_820593_821 817572 818906 1335 1 0.383 11 AGGAG GENOMAD.006162.VV 6.011e-104 346 0 0 0 2561 Caudoviricetes NA NA K07273;COG3757 Lyzozyme M1 (1,4-beta-N-acetylmuramidase), GH25 family
+NC_002737.2|provirus_777501_820593_822 819180 819857 678 1 0.296 11 None GENOMAD.223611.VP 2.952e-108 347 0 0 0 2561 Caudoviricetes NA NA PF02876;PF01123;K11040 Staphylococcal/Streptococcal toxin, beta-grasp domain; Staphylococcal/Streptococcal toxin, OB-fold domain
+NC_002737.2|provirus_777501_820593_823 819883 820593 711 1 0.301 11 AGGAG GENOMAD.224010.VP 3.442e-49 177 0 0 0 1 NA NA NA PF02876 Staphylococcal/Streptococcal toxin, beta-grasp domain
+NC_002737.2|provirus_1186916_1222544_1181 1186916 1188778 1863 -1 0.405 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1182 1189309 1189491 183 -1 0.415 11 AGGAG GENOMAD.222241.VP 3.425e-27 104 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1183 1189729 1190529 801 1 0.367 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1184 1190749 1191234 486 1 0.270 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1185 1191304 1192509 1206 -1 0.440 11 AGGAG GENOMAD.133734.VP 8.732e-41 159 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1186 1192506 1192616 111 -1 0.387 11 AGGAG GENOMAD.102275.VV 5.331e-12 59 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1187 1192625 1192852 228 -1 0.395 11 AGGAG GENOMAD.126098.VV 2.718e-14 68 0 0 0 2561 Caudoviricetes NA NA COG5546 NA
+NC_002737.2|provirus_1186916_1222544_1188 1192849 1193124 276 -1 0.351 11 GGAG/GAGG GENOMAD.039653.VV 9.653e-09 53 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1189 1193134 1193751 618 -1 0.429 11 AGGAG GENOMAD.024672.VV 3.618e-113 360 0 0 0 2561 Caudoviricetes NA NA PF07104 NA
+NC_002737.2|provirus_1186916_1222544_1190 1193754 1194185 432 -1 0.370 11 AGGAG GENOMAD.073534.VV 1.119e-78 257 0 0 0 2561 Caudoviricetes NA NA PF07761 NA
+NC_002737.2|provirus_1186916_1222544_1191 1194197 1195981 1785 -1 0.406 11 AGGAG GENOMAD.033709.VV 3.341e-135 444 0 0 0 2561 Caudoviricetes NA NA PF07902 gp58-like protein
+NC_002737.2|provirus_1186916_1222544_1192 1195996 1197108 1113 -1 0.399 11 GGAGG GENOMAD.093524.VV 3.001e-116 378 0 0 0 2561 Caudoviricetes NA NA PF07212 Hyaluronidase protein (HylP)
+NC_002737.2|provirus_1186916_1222544_1193 1197108 1199066 1959 -1 0.393 11 GGAGG GENOMAD.010194.VV 2.301e-123 412 0 0 1 2561 Caudoviricetes NA NA PF06605;COG4926 Phage-related protein
+NC_002737.2|provirus_1186916_1222544_1194 1199063 1199758 696 -1 0.375 11 GGAG/GAGG GENOMAD.004911.VV 4.418e-12 68 0 0 0 2561 Caudoviricetes NA NA PF20195;COG4722;TIGR01633 Phage-related protein
+NC_002737.2|provirus_1186916_1222544_1195 1199755 1202112 2358 -1 0.416 11 AGGAG GENOMAD.003531.VV 1.119e-145 483 0 0 0 2561 Caudoviricetes NA NA COG5412 Phage-related protein
+NC_002737.2|provirus_1186916_1222544_1196 1202112 1202483 372 -1 0.368 11 None GENOMAD.024158.VV 1.493e-41 149 0 0 0 2561 Caudoviricetes NA NA PF17318 NA
+NC_002737.2|provirus_1186916_1222544_1197 1202498 1202761 264 -1 0.322 11 GGA/GAG/AGG GENOMAD.021224.VV 2.203e-21 89 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1198 1202772 1203365 594 -1 0.375 11 AGGAG GENOMAD.073691.VV 9.405e-47 168 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1199 1203377 1203712 336 -1 0.354 11 AGxAGG/AGGxGG GENOMAD.019860.VV 4.248e-41 147 0 0 1 2561 Caudoviricetes NA NA PF16807 NA
+NC_002737.2|provirus_1186916_1222544_1200 1203713 1203949 237 -1 0.392 11 GGA/GAG/AGG GENOMAD.017784.VV 2.629e-38 137 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1201 1203942 1204280 339 -1 0.375 11 AGGAG/GGAGG GENOMAD.018809.VV 1.338e-53 183 0 0 1 2561 Caudoviricetes NA NA PF10665 Minor capsid protein
+NC_002737.2|provirus_1186916_1222544_1202 1204240 1204662 423 -1 0.404 11 AGGAG GENOMAD.076853.VV 1.373e-58 199 0 0 1 2561 Caudoviricetes NA NA PF09355 Phage protein Gp19/Gp15/Gp42
+NC_002737.2|provirus_1186916_1222544_1203 1204672 1204872 201 -1 0.403 11 AGGAG GENOMAD.069443.VV 8.097e-08 49 0 0 1 2561 Caudoviricetes NA NA PF09124 T4 recombination endonuclease VII, dimerisation
+NC_002737.2|provirus_1186916_1222544_1204 1204872 1205783 912 -1 0.402 11 AGGAG GENOMAD.013457.VV 1.303e-93 309 0 0 1 2561 Caudoviricetes NA NA PF05065;TIGR01554;COG4653 Phage capsid family
+NC_002737.2|provirus_1186916_1222544_1205 1205808 1206269 462 -1 0.398 11 AGGA GENOMAD.083647.VV 5.39e-33 126 0 0 0 2561 Caudoviricetes NA NA PF14265 NA
+NC_002737.2|provirus_1186916_1222544_1206 1206350 1207765 1416 -1 0.397 11 AGGA GENOMAD.003419.VV 3.618e-228 707 0 0 1 2561 Caudoviricetes NA NA PF20441;PF03354;COG4626;TIGR01547;K17677 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_002737.2|provirus_1186916_1222544_1207 1207875 1208141 267 -1 0.363 11 AGGAG GENOMAD.076597.VV 5.163e-44 154 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1208 1208134 1208313 180 -1 0.317 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1209 1208363 1208587 225 -1 0.387 11 None GENOMAD.193246.VV 2.324e-45 157 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1210 1208593 1210086 1494 -1 0.364 11 GGAGG GENOMAD.003531.VV 5.059e-87 299 0 0 0 2561 Caudoviricetes NA NA COG5412 Phage-related protein
+NC_002737.2|provirus_1186916_1222544_1211 1210079 1211347 1269 -1 0.414 11 AGGAG GENOMAD.076853.VV 1.22e-50 189 0 0 1 2561 Caudoviricetes NA NA PF09355 Phage protein Gp19/Gp15/Gp42
+NC_002737.2|provirus_1186916_1222544_1212 1211344 1211700 357 -1 0.314 11 GGAGG GENOMAD.072475.VV 3.993e-61 205 0 0 0 2561 Caudoviricetes NA NA PF12855;COG4338 ECL1/2/3 zinc binding proteins
+NC_002737.2|provirus_1186916_1222544_1213 1211849 1212193 345 -1 0.432 11 GGA/GAG/AGG GENOMAD.108097.VV 8.959e-27 106 0 0 0 2561 Caudoviricetes NA NA PF13395 HNH endonuclease
+NC_002737.2|provirus_1186916_1222544_1214 1212302 1212721 420 -1 0.362 11 AGGAG GENOMAD.024790.VV 1.124e-76 251 0 0 0 2561 Caudoviricetes NA NA PF07374;TIGR01636;COG2739 phage transcriptional activator, RinA family
+NC_002737.2|provirus_1186916_1222544_1215 1212989 1213624 636 -1 0.360 11 GGAGG GENOMAD.138295.VP 1.141e-77 258 0 0 0 2561 Caudoviricetes NA NA TIGR02987;COG0827 NA
+NC_002737.2|provirus_1186916_1222544_1216 1213626 1213895 270 -1 0.393 11 GGA/GAG/AGG GENOMAD.072347.VV 2.986e-42 149 0 0 0 2561 Caudoviricetes NA NA TIGR02209 NA
+NC_002737.2|provirus_1186916_1222544_1217 1213979 1214491 513 -1 0.378 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1218 1214488 1214880 393 -1 0.361 11 None GENOMAD.060064.VV 5.451e-14 70 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1219 1215006 1215803 798 -1 0.397 11 GGAG/GAGG GENOMAD.161534.VP 1.003e-148 466 0 0 0 2561 Caudoviricetes NA NA PF12684;TIGR01896 PDDEXK-like domain of unknown function (DUF3799)
+NC_002737.2|provirus_1186916_1222544_1220 1215796 1215996 201 -1 0.318 11 GGAG/GAGG GENOMAD.148606.VV 1.297e-39 140 0 0 0 1 NA NA NA PF06289 NA
+NC_002737.2|provirus_1186916_1222544_1221 1215993 1216982 990 -1 0.399 11 GGAG/GAGG GENOMAD.091877.VP 1.608e-51 188 0 0 0 2561 Caudoviricetes NA NA PF03837;COG3723;K07455;TIGR00616 Recombinational DNA repair protein RecT
+NC_002737.2|provirus_1186916_1222544_1222 1216982 1217314 333 -1 0.315 11 GGAG/GAGG GENOMAD.040347.VV 3.314e-43 153 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1223 1217370 1217576 207 -1 0.406 11 AGGAG GENOMAD.114751.VV 1.769e-37 134 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1224 1217585 1217725 141 -1 0.404 11 AGGAG GENOMAD.079484.VV 1.722e-06 44 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1225 1217722 1217955 234 -1 0.359 11 None GENOMAD.100896.VV 1.121e-38 138 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1226 1217936 1218322 387 -1 0.370 11 AGGAG GENOMAD.198321.CP 4.29e-06 47 0 0 0 2561 Caudoviricetes NA NA PF07261;COG3611;TIGR04548;K02086 Replication initiation and membrane attachment protein DnaB
+NC_002737.2|provirus_1186916_1222544_1227 1218448 1218702 255 -1 0.396 11 4Base/6BMM GENOMAD.136142.VP 2.402e-34 126 0 0 0 2561 Caudoviricetes NA NA PF13730;TIGR00373;COG4738;K07721 transcription factor E
+NC_002737.2|provirus_1186916_1222544_1228 1218811 1218996 186 -1 0.382 11 AGGAG GENOMAD.105558.VV 1.448e-28 108 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1229 1218998 1219309 312 -1 0.353 11 GGAG/GAGG GENOMAD.050216.VV 2.881e-57 193 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1230 1219407 1219538 132 -1 0.341 11 AGGA GENOMAD.114759.VV 3.069e-20 83 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_002737.2|provirus_1186916_1222544_1231 1219579 1219791 213 -1 0.347 11 AGGAG GENOMAD.225776.VP 0.0003177 39 0 0 0 1 NA NA NA PF05339;TIGR00673;COG3620;K22299 cyanase
+NC_002737.2|provirus_1186916_1222544_1232 1219993 1220748 756 1 0.368 11 AGGAG GENOMAD.091877.VP 8.865e-44 162 0 0 0 2561 Caudoviricetes NA NA PF03837;COG3723;K07455;TIGR00616 Recombinational DNA repair protein RecT
+NC_002737.2|provirus_1186916_1222544_1233 1220760 1221278 519 1 0.326 11 AGGAG GENOMAD.064488.VV 1.26e-91 296 0 0 0 2561 Caudoviricetes NA NA PF08797 HIRAN domain
+NC_002737.2|provirus_1186916_1222544_1234 1221402 1222544 1143 1 0.354 11 GGAG/GAGG GENOMAD.111131.VV 8.486e-09 60 0 0 0 2561 Caudoviricetes NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_003450.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_003450.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_008261.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_008261.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,113 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_008261.1|provirus_1070550_1127691_877 1070550 1072190 1641 1 0.238 11 GGA/GAG/AGG GENOMAD.082048.VV 1.889e-05 50 0 0 0 12031 Mimiviridae NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_878 1072272 1072892 621 1 0.337 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_879 1073139 1074983 1845 1 0.246 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_880 1075096 1076289 1194 1 0.258 11 AGGAG GENOMAD.076874.VV 1.378e-16 85 0 0 0 2561 Caudoviricetes NA NA PF01041;K07806;TIGR03588;COG0399 UDP-4-amino-4,6-dideoxy-N-acetyl-beta-L-altrosamine transaminase
+NC_008261.1|provirus_1070550_1127691_881 1076295 1076897 603 1 0.227 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_882 1076920 1077945 1026 1 0.217 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_883 1077932 1079059 1128 1 0.243 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_884 1079063 1080139 1077 1 0.194 11 GGA/GAG/AGG GENOMAD.216304.PC 1.438e-24 109 0 0 0 1 NA NA NA PF14897;K19419;COG4745;TIGR03663 EpsG family
+NC_008261.1|provirus_1070550_1127691_885 1080176 1081549 1374 1 0.191 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_886 1081573 1082385 813 1 0.232 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_887 1082401 1083114 714 1 0.230 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_888 1083114 1083731 618 1 0.235 11 AGGAG/GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_889 1083893 1084318 426 1 0.312 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_890 1084498 1084986 489 1 0.266 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_891 1085277 1087037 1761 1 0.293 11 AGGA GENOMAD.152449.VC 1.254e-06 54 0 0 0 1 NA NA NA PF13597;PF01638;K21636;TIGR02487;COG1328 anaerobic ribonucleoside-triphosphate reductase
+NC_008261.1|provirus_1070550_1127691_892 1087034 1087492 459 1 0.307 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_893 1087687 1088409 723 1 0.245 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_894 1088615 1088833 219 -1 0.187 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_895 1089077 1090141 1065 -1 0.241 11 GGAG/GAGG GENOMAD.225071.VP 1.1e-06 53 0 0 0 1 NA NA NA PF00589;PF13102;TIGR02225;COG4973;K14059 tyrosine recombinase XerD
+NC_008261.1|provirus_1070550_1127691_896 1090234 1090698 465 -1 0.282 11 AGxAGG/AGGxGG GENOMAD.123021.VV 2.145e-26 107 0 0 0 2561 Caudoviricetes NA NA PF06114;COG2856 IrrE N-terminal-like domain
+NC_008261.1|provirus_1070550_1127691_897 1090714 1091217 504 -1 0.270 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_898 1091369 1091605 237 1 0.241 11 GGAGG GENOMAD.069056.VV 3.217e-21 88 0 0 1 2561 Caudoviricetes NA NA PF06892;TIGR00673;COG1974;K07727 cyanase
+NC_008261.1|provirus_1070550_1127691_899 1091617 1092348 732 1 0.294 11 AGGAGG GENOMAD.119058.VP 1.071e-22 100 0 0 0 2561 Caudoviricetes NA NA PF10552 ORF6C domain
+NC_008261.1|provirus_1070550_1127691_900 1092374 1092628 255 1 0.239 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_901 1092597 1093268 672 -1 0.226 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_902 1093445 1093747 303 1 0.323 11 AGGAGG GENOMAD.061044.VV 4.551e-51 175 0 0 1 2561 Caudoviricetes NA NA PF13411;COG4220;TIGR02054 Phage DNA packaging protein, Nu1 subunit of terminase
+NC_008261.1|provirus_1070550_1127691_903 1093749 1093928 180 1 0.233 11 AGGAGG GENOMAD.164182.VV 2.491e-15 70 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_904 1093939 1094121 183 1 0.268 11 GGA/GAG/AGG GENOMAD.117872.VV 7.847e-06 43 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_905 1094118 1094225 108 1 0.269 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_906 1094418 1094603 186 1 0.339 11 AGGAGG GENOMAD.172161.VC 4.982e-10 55 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_907 1094603 1095514 912 1 0.305 11 AGGAGG GENOMAD.142278.VP 1.844e-07 55 0 0 1 2561 Caudoviricetes NA NA PF09588;COG5377;TIGR03033 Phage-related protein, predicted endonuclease
+NC_008261.1|provirus_1070550_1127691_908 1095516 1096385 870 1 0.313 11 AGGAGG GENOMAD.098980.VP 5.121e-35 138 0 0 0 2561 Caudoviricetes NA NA PF03837;COG3723;K07455;TIGR00616 Recombinational DNA repair protein RecT
+NC_008261.1|provirus_1070550_1127691_909 1096403 1097116 714 1 0.312 11 AGGAGG GENOMAD.178290.VP 7.894e-26 109 0 0 1 2561 Caudoviricetes NA NA PF04492;TIGR01714;COG2188 Bacteriophage replication protein O
+NC_008261.1|provirus_1070550_1127691_910 1097117 1097290 174 1 0.299 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_911 1097284 1097670 387 1 0.333 11 GGAGG GENOMAD.194141.VP 1.905e-16 77 0 0 0 2561 Caudoviricetes NA NA PF05866;COG4570 Endodeoxyribonuclease RusA
+NC_008261.1|provirus_1070550_1127691_912 1097820 1098467 648 1 0.267 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_913 1099026 1099499 474 1 0.274 11 AGGAGG GENOMAD.062141.VV 1.203e-15 76 0 0 0 2561 Caudoviricetes NA NA PF05263;TIGR01636 phage transcriptional activator, RinA family
+NC_008261.1|provirus_1070550_1127691_914 1099982 1101157 1176 1 0.225 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_915 1101226 1101693 468 1 0.333 11 AGxAGG/AGGxGG GENOMAD.026460.VV 4.147e-28 112 0 0 1 2561 Caudoviricetes NA NA PF03592;COG3728;K07474 Phage terminase, small subunit
+NC_008261.1|provirus_1070550_1127691_916 1101686 1103050 1365 1 0.304 11 AGGA GENOMAD.017640.VV 7.419e-95 320 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_917 1103106 1103873 768 1 0.217 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_918 1103919 1105439 1521 1 0.300 11 AGGAGG GENOMAD.016130.VV 7.684e-228 708 0 0 1 2561 Caudoviricetes NA NA PF05133;TIGR01542 phage portal protein, putative, A118 family
+NC_008261.1|provirus_1070550_1127691_919 1105423 1107060 1638 1 0.299 11 GGAG/GAGG GENOMAD.015690.VV 1.626e-76 270 0 0 1 2561 Caudoviricetes NA NA PF06152;TIGR01641 Phage minor capsid protein 2
+NC_008261.1|provirus_1070550_1127691_920 1107073 1107297 225 1 0.262 11 GGAG/GAGG GENOMAD.093339.VV 2.906e-13 65 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_921 1107325 1107942 618 1 0.235 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_922 1108036 1108641 606 1 0.345 11 GGAGG GENOMAD.041104.VV 1.371e-23 101 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_923 1108666 1109571 906 1 0.305 11 AGGAG GENOMAD.075076.VV 1.757e-79 268 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_924 1109586 1109855 270 1 0.263 11 AGGAG GENOMAD.050526.VV 1.494e-18 81 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_925 1109891 1110253 363 1 0.267 11 AGGA GENOMAD.020431.VV 1.927e-29 114 0 0 0 2561 Caudoviricetes NA NA PF11436 Putative DnaT-like ssDNA binding protein
+NC_008261.1|provirus_1070550_1127691_926 1110257 1110583 327 1 0.315 11 AGGAGG GENOMAD.024076.VV 1.104e-53 183 0 0 1 2561 Caudoviricetes NA NA PF10665 Minor capsid protein
+NC_008261.1|provirus_1070550_1127691_927 1110583 1110966 384 1 0.271 11 GGAG/GAGG GENOMAD.019595.VV 1.238e-61 207 0 0 1 2561 Caudoviricetes NA NA PF11114 Minor capsid protein
+NC_008261.1|provirus_1070550_1127691_928 1110966 1111352 387 1 0.300 11 AGGA/GGAG/GAGG GENOMAD.028696.VV 6.269e-45 159 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_929 1111362 1111820 459 1 0.353 11 GGA/GAG/AGG GENOMAD.019307.VV 5.136e-50 175 0 0 1 2561 Caudoviricetes NA NA PF16461;COG5437 Predicted secreted protein
+NC_008261.1|provirus_1070550_1127691_930 1111833 1112201 369 1 0.263 11 AGGAGG GENOMAD.052890.VV 8.683e-47 164 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_931 1112161 1112523 363 1 0.314 11 3Base/5BMM GENOMAD.015650.VV 9.786e-61 204 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_932 1112564 1115776 3213 1 0.311 11 AGxAGG/AGGxGG GENOMAD.171590.VP 0.0 1638 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_933 1115780 1116133 354 1 0.319 11 None GENOMAD.012935.VV 2.528e-49 171 0 0 0 2561 Caudoviricetes NA NA PF20458 NA
+NC_008261.1|provirus_1070550_1127691_934 1116156 1116422 267 1 0.292 11 AGxAGG/AGGxGG GENOMAD.163907.VV 7.646e-48 165 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_935 1116489 1116869 381 1 0.226 11 GGAG/GAGG GENOMAD.016019.VV 6.313e-44 156 0 0 0 2561 Caudoviricetes NA NA PF07761 NA
+NC_008261.1|provirus_1070550_1127691_936 1116905 1122013 5109 1 0.296 11 AGxAGG/AGGxGG GENOMAD.141397.VP 0.0 2111 0 0 1 2561 Caudoviricetes NA NA PF06605;PF00149;TIGR01665;K01517;COG4926 phage minor structural protein, N-terminal region
+NC_008261.1|provirus_1070550_1127691_937 1122032 1122280 249 1 0.217 11 AGGAGG GENOMAD.113645.VV 4.861e-34 125 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_938 1122294 1122710 417 1 0.276 11 AGGA GENOMAD.112625.VV 0.0002838 42 0 0 1 1 NA NA NA PF05105;TIGR01593;COG4824 toxin secretion/phage lysis holin
+NC_008261.1|provirus_1070550_1127691_939 1122751 1123167 417 1 0.281 11 AGxAGG/AGGxGG GENOMAD.224084.VP 7.697e-31 119 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_940 1123253 1124281 1029 1 0.290 11 AGxAGG/AGGxGG GENOMAD.169358.VC 0.0003137 45 0 0 0 2561 Caudoviricetes NA NA PF06725;PF18348;COG3584;K11060;TIGR04211 3D (Asp-Asp-Asp) domain
+NC_008261.1|provirus_1070550_1127691_941 1124699 1125361 663 1 0.186 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_942 1125585 1126673 1089 1 0.234 11 GGAG/GAGG GENOMAD.129207.VV 1.696e-28 121 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_943 1126618 1126959 342 1 0.266 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1070550_1127691_944 1126966 1127691 726 1 0.247 11 AGxAGG/AGGxGG GENOMAD.129093.VV 5.379e-18 86 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1520 1784095 1784580 486 -1 0.302 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1521 1784747 1785049 303 -1 0.261 11 AGGAGG GENOMAD.099786.VV 1.61e-22 93 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1522 1785241 1786269 1029 -1 0.287 11 AGxAGG/AGGxGG GENOMAD.169358.VC 1.801e-05 49 0 0 0 2561 Caudoviricetes NA NA PF06725;PF18348;COG3584;K11060;TIGR04211 3D (Asp-Asp-Asp) domain
+NC_008261.1|provirus_1784095_1821197_1523 1786323 1786805 483 -1 0.271 11 AGxAGG/AGGxGG GENOMAD.222318.VP 5.723e-61 207 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1524 1786826 1787059 234 -1 0.226 11 GGA/GAG/AGG GENOMAD.080405.VV 7.991e-27 104 0 0 0 2561 Caudoviricetes NA NA PF10779 Haemolysin XhlA
+NC_008261.1|provirus_1784095_1821197_1525 1787141 1787326 186 -1 0.290 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1526 1787345 1789843 2499 -1 0.279 11 AGGAG GENOMAD.033703.VV 5.052e-243 769 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1527 1789859 1791739 1881 -1 0.297 11 AGGAG GENOMAD.082024.VV 7.094e-68 247 0 0 0 2561 Caudoviricetes NA NA PF10651;PF15425 BppU N-terminal domain
+NC_008261.1|provirus_1784095_1821197_1528 1791790 1794849 3060 -1 0.307 11 None GENOMAD.004842.VV 2.175e-102 362 0 0 1 2561 Caudoviricetes NA NA PF06605;PF18994;COG4926;TIGR01665 Phage-related protein
+NC_008261.1|provirus_1784095_1821197_1529 1794854 1795564 711 -1 0.249 11 GGAGG GENOMAD.055476.VV 7.973e-38 144 0 0 0 2561 Caudoviricetes NA NA PF20195;COG4722;TIGR01633 Phage-related protein
+NC_008261.1|provirus_1784095_1821197_1530 1795557 1798811 3255 -1 0.299 11 AGGAGG GENOMAD.104282.VP 3.823e-53 208 0 0 0 2561 Caudoviricetes NA NA COG5412 Phage-related protein
+NC_008261.1|provirus_1784095_1821197_1531 1798847 1799200 354 -1 0.218 11 None GENOMAD.080513.VV 1.378e-06 48 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1532 1799362 1799679 318 -1 0.270 11 GGA/GAG/AGG GENOMAD.080540.VV 1.741e-55 188 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1533 1799682 1800284 603 -1 0.315 11 AGxAGG/AGGxGG GENOMAD.013991.VV 4.274e-39 146 0 0 1 2561 Caudoviricetes NA NA PF04630;TIGR01603 phage major tail protein, phi13 family
+NC_008261.1|provirus_1784095_1821197_1534 1800301 1800648 348 -1 0.261 11 AGxAGG/AGGxGG GENOMAD.056191.VV 7.661e-29 112 0 0 0 2561 Caudoviricetes NA NA PF05657 NA
+NC_008261.1|provirus_1784095_1821197_1535 1800657 1801094 438 -1 0.304 11 GGAG/GAGG GENOMAD.072939.VV 1.155e-20 90 0 0 1 2561 Caudoviricetes NA NA TIGR01725;COG5005 phage protein, HK97 gp10 family
+NC_008261.1|provirus_1784095_1821197_1536 1801094 1801423 330 -1 0.276 11 None GENOMAD.078312.VV 2.185e-15 73 0 0 1 2561 Caudoviricetes NA NA PF05521;TIGR01563;COG5614 phage head-tail adaptor, putative, SPP1 family
+NC_008261.1|provirus_1784095_1821197_1537 1801416 1801694 279 -1 0.262 11 GGA/GAG/AGG GENOMAD.034954.VV 1.311e-13 67 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR01560 Phage gp6-like head-tail connector protein
+NC_008261.1|provirus_1784095_1821197_1538 1801706 1802890 1185 -1 0.295 11 AGGAGG GENOMAD.014413.VV 7.217e-42 162 0 0 1 2561 Caudoviricetes NA NA PF05065;TIGR01554;COG4653 phage major capsid protein, HK97 family
+NC_008261.1|provirus_1784095_1821197_1539 1802931 1803536 606 -1 0.289 11 AGxAGG/AGGxGG GENOMAD.126260.VV 7.801e-51 180 0 0 1 2561 Caudoviricetes NA NA PF04586;COG3740;K06904;TIGR01543 Phage head maturation protease
+NC_008261.1|provirus_1784095_1821197_1540 1803526 1804773 1248 -1 0.272 11 GGAG/GAGG GENOMAD.126260.VV 8.756e-55 201 0 0 1 2561 Caudoviricetes NA NA PF04586;COG3740;K06904;TIGR01543 Phage head maturation protease
+NC_008261.1|provirus_1784095_1821197_1541 1804774 1806513 1740 -1 0.303 11 AGGA GENOMAD.166487.VP 8.866e-49 188 0 0 1 2561 Caudoviricetes NA NA PF20441;COG4626 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_008261.1|provirus_1784095_1821197_1542 1806506 1807018 513 -1 0.271 11 GGA/GAG/AGG GENOMAD.136127.VP 7.834e-17 80 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_008261.1|provirus_1784095_1821197_1543 1807521 1808342 822 -1 0.246 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1544 1808517 1809065 549 -1 0.270 11 GGAG/GAGG GENOMAD.027124.VV 1.276e-14 74 0 0 0 2561 Caudoviricetes NA NA PF07104 NA
+NC_008261.1|provirus_1784095_1821197_1545 1809160 1809513 354 -1 0.263 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1546 1809572 1809778 207 -1 0.304 11 GGAG/GAGG GENOMAD.117627.VV 5.796e-41 144 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1547 1809920 1810381 462 -1 0.264 11 GGAG/GAGG GENOMAD.062141.VV 1.839e-18 84 0 0 0 2561 Caudoviricetes NA NA PF05263;TIGR01636 phage transcriptional activator, RinA family
+NC_008261.1|provirus_1784095_1821197_1548 1810917 1811306 390 -1 0.295 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1549 1811321 1811467 147 -1 0.272 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1550 1811479 1812762 1284 -1 0.296 11 GGA/GAG/AGG GENOMAD.068048.VV 6.568e-15 80 0 0 1 2561 Caudoviricetes NA NA PF20307;TIGR03600;K02314;COG0305 phage replicative helicase, DnaB family, HK022 subfamily
+NC_008261.1|provirus_1784095_1821197_1551 1812773 1813513 741 -1 0.266 11 GGAG/GAGG GENOMAD.096239.VV 9.382e-28 115 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1552 1813541 1813699 159 -1 0.270 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1553 1813702 1813881 180 -1 0.267 11 AGGAGG GENOMAD.148814.VV 1.3e-07 48 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1554 1813907 1814137 231 -1 0.277 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1555 1814143 1814640 498 -1 0.295 11 AGGAG GENOMAD.142555.VV 5.332e-20 89 0 0 1 2561 Caudoviricetes NA NA PF06892;TIGR02612;K22299;COG3620 Phage regulatory protein CII (CP76)
+NC_008261.1|provirus_1784095_1821197_1556 1814690 1814878 189 -1 0.243 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1557 1815028 1815372 345 1 0.278 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1558 1815423 1817012 1590 1 0.228 11 GGAGG GENOMAD.219971.CV 7.902e-13 74 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1559 1817080 1817934 855 1 0.237 11 AGGAG GENOMAD.170359.VC 3.605e-08 57 0 0 0 1 NA NA NA PF02086;TIGR00571;COG0338;K06223 DNA adenine methylase (dam)
+NC_008261.1|provirus_1784095_1821197_1560 1818046 1818543 498 1 0.267 11 GGxGG GENOMAD.123021.VV 2.082e-10 61 0 0 0 2561 Caudoviricetes NA NA PF06114;COG2856 IrrE N-terminal-like domain
+NC_008261.1|provirus_1784095_1821197_1561 1818556 1820064 1509 1 0.250 11 GGAGG GENOMAD.169508.VP 2.109e-24 111 0 0 1 2561 Caudoviricetes NA NA PF04708;PF13262;COG1961;K14060 Site-specific DNA recombinase related to the DNA invertase Pin
+NC_008261.1|provirus_1784095_1821197_1562 1820078 1820416 339 -1 0.301 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_008261.1|provirus_1784095_1821197_1563 1820820 1821197 378 -1 0.257 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_009012.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_009012.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,223 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_009012.1|provirus_1938476_1983993_1694 1938476 1938967 492 -1 0.404 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1695 1938931 1940499 1569 -1 0.392 11 AGGAGG GENOMAD.097162.VV 2.214e-10 66 0 0 1 2561 Caudoviricetes NA NA PF20307;TIGR03600;COG0305;K18947 phage replicative helicase, DnaB family, HK022 subfamily
+NC_009012.1|provirus_1938476_1983993_1696 1940561 1940779 219 -1 0.416 11 AGGAGG GENOMAD.180442.VC 1.734e-24 97 0 0 0 2561 Caudoviricetes NA NA PF20612 SHOCT domain
+NC_009012.1|provirus_1938476_1983993_1697 1940837 1941841 1005 -1 0.450 11 AGGAGG GENOMAD.215835.VV 1.253e-44 168 0 0 0 2561 Caudoviricetes NA NA PF01510;COG5632;K11066 N-acetylmuramoyl-L-alanine amidase CwlA
+NC_009012.1|provirus_1938476_1983993_1698 1941838 1942257 420 -1 0.464 11 GGAGG GENOMAD.083633.VV 5.263e-08 53 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1699 1942344 1944812 2469 -1 0.465 11 AGxAGG/AGGxGG GENOMAD.116546.VV 0.0 1051 0 0 1 2561 Caudoviricetes NA NA PF06605;TIGR01665;COG4926 phage minor structural protein, N-terminal region
+NC_009012.1|provirus_1938476_1983993_1700 1944809 1945384 576 -1 0.472 11 GGA/GAG/AGG GENOMAD.066153.VV 1.508e-90 294 0 0 1 2561 Caudoviricetes NA NA PF06605;TIGR01665;COG4926 phage minor structural protein, N-terminal region
+NC_009012.1|provirus_1938476_1983993_1701 1945394 1945588 195 -1 0.446 11 GGAG/GAGG GENOMAD.089015.VV 2.452e-32 119 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1702 1945599 1948121 2523 -1 0.450 11 GGAGG GENOMAD.116546.VV 0.0 1208 0 0 1 2561 Caudoviricetes NA NA PF06605;TIGR01665;COG4926 phage minor structural protein, N-terminal region
+NC_009012.1|provirus_1938476_1983993_1703 1948126 1948899 774 -1 0.433 11 GGAGG GENOMAD.116614.VV 3.551e-139 438 0 0 0 2561 Caudoviricetes NA NA PF20195;COG4722;TIGR01633 Phage-related protein
+NC_009012.1|provirus_1938476_1983993_1704 1948913 1951201 2289 -1 0.504 11 AGGAGG GENOMAD.036973.VV 4.796e-161 527 0 0 0 2561 Caudoviricetes NA NA K02334;COG4722 Phage-related protein
+NC_009012.1|provirus_1938476_1983993_1705 1951335 1951607 273 1 0.502 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1706 1951604 1952008 405 1 0.504 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1707 1952057 1952248 192 -1 0.453 11 None GENOMAD.223693.VP 2.475e-24 96 0 0 1 2561 Caudoviricetes NA NA PF09550;TIGR02216 Phage tail assembly chaperone protein, TAC
+NC_009012.1|provirus_1938476_1983993_1708 1952245 1952628 384 -1 0.448 11 AGGAGG GENOMAD.166825.VP 3.751e-66 220 0 0 1 2561 Caudoviricetes NA NA PF11836 Phage tail tube protein, GTA-gp10
+NC_009012.1|provirus_1938476_1983993_1709 1952631 1953227 597 -1 0.513 11 AGGAGG GENOMAD.005050.VV 1.417e-111 355 0 0 1 2561 Caudoviricetes NA NA PF04630;TIGR01603 phage major tail protein, phi13 family
+NC_009012.1|provirus_1938476_1983993_1710 1953233 1953577 345 -1 0.429 11 AGGAG/GGAGG GENOMAD.077616.VV 1.204e-39 143 0 0 0 2561 Caudoviricetes NA NA PF05657 NA
+NC_009012.1|provirus_1938476_1983993_1711 1953574 1954005 432 -1 0.465 11 AGGAGG GENOMAD.032585.VV 5.7e-53 183 0 0 1 2561 Caudoviricetes NA NA PF11114;COG5005;TIGR01725 Mu-like prophage protein gpG
+NC_009012.1|provirus_1938476_1983993_1712 1954022 1954357 336 -1 0.440 11 GGA/GAG/AGG GENOMAD.040271.VV 1.154e-54 186 0 0 1 2561 Caudoviricetes NA NA PF05521;COG5614;TIGR01563 Bacteriophage head-tail adaptor
+NC_009012.1|provirus_1938476_1983993_1713 1954360 1954668 309 -1 0.472 11 GGAGG GENOMAD.028909.VV 6.135e-49 169 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR01560 Phage gp6-like head-tail connector protein
+NC_009012.1|provirus_1938476_1983993_1714 1954690 1955892 1203 -1 0.482 11 AGGAGG GENOMAD.168658.VV 4.012e-34 139 0 0 1 2561 Caudoviricetes NA NA PF05065;PF04586;PF12518;COG4653;TIGR01554;K06904 Predicted phage phi-C31 gp36 major capsid-like protein
+NC_009012.1|provirus_1938476_1983993_1715 1955943 1956671 729 -1 0.439 11 GGAGG GENOMAD.028909.VV 1.82e-27 114 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR01560 Phage gp6-like head-tail connector protein
+NC_009012.1|provirus_1938476_1983993_1716 1956610 1957932 1323 -1 0.485 11 AGGAG GENOMAD.179073.VP 1.831e-53 198 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1717 1958009 1959793 1785 -1 0.324 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1718 1959867 1961096 1230 -1 0.462 11 None GENOMAD.181434.VP 5.613e-61 219 0 0 1 2561 Caudoviricetes NA NA PF20441 Terminase large subunit, endonuclease domain
+NC_009012.1|provirus_1938476_1983993_1719 1961099 1961434 336 -1 0.458 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1720 1961573 1961767 195 -1 0.385 11 GGAG/GAGG GENOMAD.140940.VV 2.57e-10 56 0 0 0 2561 Caudoviricetes NA NA PF16468 NA
+NC_009012.1|provirus_1938476_1983993_1721 1961771 1962238 468 -1 0.464 11 AGGAGG GENOMAD.191984.VP 6.704e-12 65 0 0 0 2561 Caudoviricetes NA NA PF07128 NA
+NC_009012.1|provirus_1938476_1983993_1722 1962300 1963199 900 -1 0.504 11 AGGAG GENOMAD.105515.VV 0.0005042 44 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1723 1963341 1963571 231 -1 0.463 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1724 1963597 1964289 693 -1 0.440 11 GGAGG GENOMAD.105515.VV 6.371e-26 109 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1725 1964406 1965659 1254 -1 0.440 11 GGAGG GENOMAD.208446.VP 2.08e-27 119 0 0 0 2561 Caudoviricetes NA NA PF01555;COG4725;K13581 N6-adenosine-specific RNA methylase IME4
+NC_009012.1|provirus_1938476_1983993_1726 1965665 1966963 1299 -1 0.464 11 AGGAG GENOMAD.005053.VV 4.044e-23 106 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1727 1966938 1967120 183 -1 0.350 11 AGGAGG GENOMAD.195270.VP 2e-32 119 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1728 1967120 1967671 552 -1 0.502 11 GGAG/GAGG GENOMAD.098194.VV 4.683e-91 295 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_009012.1|provirus_1938476_1983993_1729 1967792 1968151 360 -1 0.478 11 AGGAGG GENOMAD.127444.VV 9.611e-12 63 0 0 0 2561 Caudoviricetes NA NA PF13395 HNH endonuclease
+NC_009012.1|provirus_1938476_1983993_1730 1968273 1968515 243 -1 0.399 11 AGGAG GENOMAD.212426.VP 6.855e-15 70 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1731 1968659 1969657 999 -1 0.379 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1732 1969697 1970107 411 -1 0.309 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1733 1970346 1970801 456 -1 0.436 11 GGAGG GENOMAD.056402.VV 3.108e-38 141 0 0 0 2561 Caudoviricetes NA NA PF05263;TIGR01636 phage transcriptional activator, RinA family
+NC_009012.1|provirus_1938476_1983993_1734 1970893 1971195 303 -1 0.452 11 GGAGG GENOMAD.138066.VP 1.61e-22 93 0 0 0 2561 Caudoviricetes NA NA PF03838;COG3331;TIGR00648 Penicillin-binding protein-related factor A, putative recombinase
+NC_009012.1|provirus_1938476_1983993_1735 1971496 1974051 2556 -1 0.449 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1736 1974048 1974473 426 -1 0.465 11 AGxAGG/AGGxGG GENOMAD.179451.VC 2.953e-05 45 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1737 1974489 1975286 798 -1 0.396 11 GGAGG GENOMAD.153366.VP 4.288e-20 93 0 0 0 2561 Caudoviricetes NA NA PF03374;COG3645 Phage antirepressor protein YoqD, KilAC domain
+NC_009012.1|provirus_1938476_1983993_1738 1975291 1977213 1923 -1 0.440 11 AGGAG GENOMAD.140318.VC 1.003e-23 110 0 0 0 2561 Caudoviricetes NA NA PF00476;COG0749;TIGR00593 DNA polymerase I - 3'-5' exonuclease and polymerase domains
+NC_009012.1|provirus_1938476_1983993_1739 1977271 1978023 753 -1 0.467 11 GGAGG GENOMAD.211539.VV 6.84e-47 171 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1740 1978145 1978585 441 -1 0.469 11 AGGAG GENOMAD.026103.VV 4.552e-65 218 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1741 1978551 1979909 1359 -1 0.444 11 None GENOMAD.003266.VV 2.422e-23 107 0 0 0 2561 Caudoviricetes NA NA PF00176;K14440;COG1061;TIGR04095 Superfamily II DNA or RNA helicase
+NC_009012.1|provirus_1938476_1983993_1742 1979876 1980058 183 -1 0.454 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1743 1980282 1982201 1920 -1 0.369 11 GGAGG GENOMAD.213960.VV 1.039e-08 61 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1744 1982360 1982566 207 1 0.343 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_1938476_1983993_1745 1983046 1983993 948 -1 0.397 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1786 2022140 2023468 1329 -1 0.340 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1787 2023413 2024702 1290 -1 0.350 11 AGxAGG/AGGxGG GENOMAD.022372.VV 2.322e-18 91 0 0 1 2561 Caudoviricetes NA NA PF04708;COG1961;K14060 Site-specific DNA recombinase related to the DNA invertase Pin
+NC_009012.1|provirus_2022140_2067593_1788 2024803 2025474 672 -1 0.368 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1789 2025494 2025979 486 -1 0.340 11 AGGAGG GENOMAD.170412.VP 4.718e-05 45 0 0 1 2561 Caudoviricetes NA NA PF03354;COG4626 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_009012.1|provirus_2022140_2067593_1790 2025972 2026382 411 -1 0.353 11 GGAGG GENOMAD.083633.VV 5.663e-05 44 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1791 2026399 2028087 1689 -1 0.325 11 GGAG/GAGG GENOMAD.068767.VV 1.613e-200 632 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1792 2028099 2029256 1158 -1 0.335 11 AGxAGG/AGGxGG GENOMAD.222380.VP 5.366e-06 51 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1793 2029269 2031173 1905 -1 0.332 11 GGxGG GENOMAD.004340.VV 1.903e-153 499 0 0 1 2561 Caudoviricetes NA NA PF06605;PF18994;COG4926;TIGR01665 Phage-related protein
+NC_009012.1|provirus_2022140_2067593_1794 2031173 2031877 705 -1 0.296 11 GGxGG GENOMAD.004006.VV 7.585e-128 404 0 0 0 2561 Caudoviricetes NA NA PF20195;COG4722;TIGR01633 Phage-related protein
+NC_009012.1|provirus_2022140_2067593_1795 2031877 2034156 2280 -1 0.357 11 GGAGG GENOMAD.089120.VP 5.755e-58 220 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1796 2034172 2034297 126 -1 0.333 11 4Base/6BMM GENOMAD.202970.VV 1.546e-18 78 0 0 1 1 NA NA NA PF09550;TIGR02216 NA
+NC_009012.1|provirus_2022140_2067593_1797 2034366 2034689 324 -1 0.306 11 AGGAG GENOMAD.136836.VV 3.52e-41 147 0 0 0 2561 Caudoviricetes NA NA PF16478 Phage tail tube protein, GTA-gp10
+NC_009012.1|provirus_2022140_2067593_1798 2034818 2035258 441 -1 0.306 11 GGA/GAG/AGG GENOMAD.053493.CC 5.322e-30 117 0 0 0 1 NA NA NA PF14101 NA
+NC_009012.1|provirus_2022140_2067593_1799 2035656 2036699 1044 -1 0.345 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1800 2036776 2036883 108 -1 0.204 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1801 2037023 2037595 573 -1 0.356 11 GGA/GAG/AGG GENOMAD.013991.VV 6.347e-57 197 0 0 1 2561 Caudoviricetes NA NA PF04630;TIGR01603 phage major tail protein, phi13 family
+NC_009012.1|provirus_2022140_2067593_1802 2037598 2037927 330 -1 0.294 11 GGA/GAG/AGG GENOMAD.018077.VV 2.114e-47 165 0 0 0 2561 Caudoviricetes NA NA PF05657 NA
+NC_009012.1|provirus_2022140_2067593_1803 2037924 2038316 393 -1 0.356 11 GGAGG GENOMAD.066487.VV 1.944e-66 221 0 0 1 2561 Caudoviricetes NA NA TIGR01725;COG5005 phage protein, HK97 gp10 family
+NC_009012.1|provirus_2022140_2067593_1804 2038309 2038635 327 -1 0.318 11 GGA/GAG/AGG GENOMAD.124210.VP 2.543e-21 90 0 0 1 2561 Caudoviricetes NA NA PF05521;COG5614;TIGR01563 Bacteriophage head-tail adaptor
+NC_009012.1|provirus_2022140_2067593_1805 2038632 2039231 600 -1 0.330 11 AGGAG GENOMAD.158311.VV 2.792e-34 132 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR02215 phage conserved hypothetical protein, phiE125 gp8 family
+NC_009012.1|provirus_2022140_2067593_1806 2039246 2039686 441 -1 0.329 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1807 2039699 2040988 1290 -1 0.367 11 AGGA GENOMAD.093418.VV 2.924e-30 128 0 0 1 2561 Caudoviricetes NA NA PF05065;TIGR01554;COG4653 phage major capsid protein, HK97 family
+NC_009012.1|provirus_2022140_2067593_1808 2041016 2041759 744 -1 0.344 11 AGGA GENOMAD.158277.VP 2.322e-25 108 0 0 0 2561 Caudoviricetes NA NA PF00574;PF19602;K01358;TIGR00493;COG3904 ATP-dependent Clp endopeptidase, proteolytic subunit ClpP
+NC_009012.1|provirus_2022140_2067593_1809 2041764 2043023 1260 -1 0.352 11 AGGAGG GENOMAD.179073.VP 1.345e-39 156 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1810 2043035 2045584 2550 -1 0.349 11 AGGAGG GENOMAD.181434.VP 3.417e-57 219 0 0 1 2561 Caudoviricetes NA NA PF20441 Terminase large subunit, endonuclease domain
+NC_009012.1|provirus_2022140_2067593_1811 2045577 2046059 483 -1 0.400 11 AGGAGG GENOMAD.168120.VP 3.555e-12 66 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_009012.1|provirus_2022140_2067593_1812 2046118 2046333 216 -1 0.329 11 4Base/6BMM GENOMAD.225559.VP 4.489e-15 70 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1813 2046326 2047078 753 -1 0.325 11 GGAGG GENOMAD.105515.VV 2.253e-07 54 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1814 2047192 2047503 312 -1 0.356 11 GGAGG GENOMAD.224340.VP 3.569e-39 141 0 0 0 1 NA NA NA PF19854 NA
+NC_009012.1|provirus_2022140_2067593_1815 2047574 2048053 480 -1 0.327 11 GGxGG GENOMAD.191984.VP 1.926e-08 55 0 0 0 2561 Caudoviricetes NA NA PF07128 NA
+NC_009012.1|provirus_2022140_2067593_1816 2048198 2049121 924 -1 0.379 11 GGA/GAG/AGG GENOMAD.105515.VV 2.991e-05 48 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1817 2049221 2050672 1452 -1 0.390 11 GGA/GAG/AGG GENOMAD.136632.VV 1.346e-08 60 0 0 0 2561 Caudoviricetes NA NA PF00145;TIGR00675;K00558;COG0270 DNA-methyltransferase (dcm)
+NC_009012.1|provirus_2022140_2067593_1818 2050674 2051909 1236 -1 0.358 11 GGAGG GENOMAD.038338.VV 2.311e-33 137 0 0 0 2561 Caudoviricetes NA NA COG3392 NA
+NC_009012.1|provirus_2022140_2067593_1819 2051914 2052339 426 -1 0.350 11 AGGAGG GENOMAD.133740.VV 1.401e-16 78 0 0 0 2561 Caudoviricetes NA NA PF07750;COG5352;K13583;TIGR00721 GcrA cell cycle regulator
+NC_009012.1|provirus_2022140_2067593_1820 2052752 2053132 381 -1 0.404 11 GGAGG GENOMAD.208831.VV 4.697e-14 70 0 0 0 2561 Caudoviricetes NA NA PF13395 HNH endonuclease
+NC_009012.1|provirus_2022140_2067593_1821 2053313 2053558 246 -1 0.260 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1822 2053627 2054031 405 -1 0.304 11 AGGAGG GENOMAD.159035.VP 6.65e-39 142 0 0 0 2561 Caudoviricetes NA NA PF07374;TIGR01636;COG2739 phage transcriptional activator, RinA family
+NC_009012.1|provirus_2022140_2067593_1823 2054033 2054335 303 -1 0.340 11 AGxAGG/AGGxGG GENOMAD.212426.VP 1.787e-21 90 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1824 2054533 2056407 1875 -1 0.297 11 AGxAGG/AGGxGG GENOMAD.024099.VV 3.13e-70 254 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1825 2056608 2058299 1692 -1 0.303 11 GGAG/GAGG GENOMAD.102034.VP 2.393e-111 373 0 0 0 2561 Caudoviricetes NA NA TIGR01636 NA
+NC_009012.1|provirus_2022140_2067593_1826 2058302 2058760 459 -1 0.316 11 AGGAGG GENOMAD.031678.VV 2.327e-33 127 0 0 0 2561 Caudoviricetes NA NA PF05037 NA
+NC_009012.1|provirus_2022140_2067593_1827 2058779 2060209 1431 -1 0.311 11 GGA/GAG/AGG GENOMAD.016341.VV 4.675e-134 435 0 0 1 2561 Caudoviricetes NA NA PF13479;PF12684;TIGR01618;K07465;COG1468 phage nucleotide-binding protein
+NC_009012.1|provirus_2022140_2067593_1828 2060293 2060658 366 -1 0.314 11 AGGAG GENOMAD.010330.VV 1.124e-51 178 0 0 0 2561 Caudoviricetes NA NA PF03838;COG3331;TIGR00648 Recombination protein U
+NC_009012.1|provirus_2022140_2067593_1829 2060655 2061833 1179 -1 0.314 11 GGA/GAG/AGG GENOMAD.014802.VV 1.234e-10 66 0 0 0 2561 Caudoviricetes NA NA PF00176;K20093;COG1061;TIGR04095 Superfamily II DNA or RNA helicase
+NC_009012.1|provirus_2022140_2067593_1830 2061823 2061912 90 -1 0.367 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1831 2061942 2062706 765 -1 0.319 11 GGAGG GENOMAD.171549.VP 1.527e-13 73 0 0 0 2561 Caudoviricetes NA NA COG3617 Prophage antirepressor
+NC_009012.1|provirus_2022140_2067593_1832 2062722 2062973 252 -1 0.286 11 AGGAGG GENOMAD.222352.VV 3.867e-07 48 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1833 2062994 2063317 324 -1 0.340 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1834 2063536 2063763 228 -1 0.272 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1835 2063973 2064683 711 -1 0.336 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1836 2064700 2065068 369 -1 0.271 11 GGAGG GENOMAD.213960.VV 6.573e-66 219 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1837 2065083 2065463 381 -1 0.333 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1838 2065520 2066308 789 -1 0.324 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1839 2066610 2067026 417 -1 0.312 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2022140_2067593_1840 2067186 2067593 408 1 0.350 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2581 2931283 2932395 1113 -1 0.436 11 AGGAGG GENOMAD.016861.VV 8.63e-05 47 0 0 0 2561 Caudoviricetes NA NA PF13671;COG2019;TIGR01359;K13829 AAA domain
+NC_009012.1|provirus_2931283_2970170_2582 2932453 2932875 423 -1 0.350 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2583 2932954 2933160 207 1 0.406 11 GGxGG GENOMAD.087773.VV 6.92e-17 75 0 0 0 2561 Caudoviricetes NA NA PF14083 PGDYG protein
+NC_009012.1|provirus_2931283_2970170_2584 2933136 2933600 465 -1 0.353 11 AGxAGG/AGGxGG GENOMAD.170160.VC 7.688e-09 56 0 0 0 2561 Caudoviricetes NA NA PF18184 SMODS and SLOG-associating 2TM effector domain 3
+NC_009012.1|provirus_2931283_2970170_2585 2933630 2934070 441 -1 0.401 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2586 2934086 2934514 429 -1 0.408 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2587 2934642 2934881 240 1 0.358 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2588 2934900 2935646 747 1 0.383 11 AGxAGG/AGGxGG GENOMAD.132419.VP 5.435e-24 104 0 0 0 2561 Caudoviricetes NA NA PF03374;COG3645 Phage antirepressor protein YoqD, KilAC domain
+NC_009012.1|provirus_2931283_2970170_2589 2935649 2935867 219 1 0.507 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2590 2935963 2936175 213 1 0.460 11 AGxAGG/AGGxGG GENOMAD.209016.VC 1.289e-41 146 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2591 2936162 2936335 174 1 0.477 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2592 2936351 2936569 219 1 0.411 11 GGA/GAG/AGG GENOMAD.088748.VV 2.403e-36 131 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2593 2936562 2937113 552 1 0.404 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2594 2937114 2938019 906 1 0.429 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2595 2938109 2938396 288 1 0.444 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2596 2938386 2938574 189 1 0.450 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2597 2938591 2939673 1083 1 0.437 11 GGAGG GENOMAD.021533.VV 5.011e-133 426 0 0 1 2561 Caudoviricetes NA NA TIGR01714 phage replisome organizer, putative, N-terminal region
+NC_009012.1|provirus_2931283_2970170_2598 2939670 2940506 837 1 0.458 11 GGAGG GENOMAD.034827.VV 1.47e-07 55 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2599 2940508 2940882 375 1 0.477 11 GGAG/GAGG GENOMAD.151656.VP 2.586e-44 157 0 0 1 2561 Caudoviricetes NA NA PF17288;K06909;TIGR01547;COG1783 phage terminase, large subunit, PBSX family
+NC_009012.1|provirus_2931283_2970170_2600 2940930 2941352 423 1 0.414 11 AGxAGG/AGGxGG GENOMAD.221128.VP 8.436e-64 214 0 0 0 2561 Caudoviricetes NA NA PF05263;TIGR01636;COG2739 phage transcriptional activator, RinA family
+NC_009012.1|provirus_2931283_2970170_2601 2941501 2941743 243 1 0.374 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2602 2941811 2942653 843 1 0.323 11 GGAG/GAGG GENOMAD.178342.VP 1.96e-33 133 0 0 0 2561 Caudoviricetes NA NA PF02086;PF06576;PF06147;K21507;TIGR00571;COG0338 DNA adenine methylase (dam)
+NC_009012.1|provirus_2931283_2970170_2603 2942646 2943926 1281 1 0.304 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2604 2944119 2944964 846 1 0.301 11 AGGAGG GENOMAD.225783.VP 6.425e-63 219 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2605 2945034 2945183 150 1 0.280 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2606 2945216 2945665 450 1 0.413 11 GGA/GAG/AGG GENOMAD.026460.VV 5.098e-23 97 0 0 1 2561 Caudoviricetes NA NA PF03592;COG3728;K07474 Phage terminase, small subunit
+NC_009012.1|provirus_2931283_2970170_2607 2945652 2946899 1248 1 0.421 11 AGxAG GENOMAD.141197.VP 5.699e-78 269 0 0 1 2561 Caudoviricetes NA NA PF17288;K06909;TIGR01547;COG1783 Terminase RNAseH like domain
+NC_009012.1|provirus_2931283_2970170_2608 2946915 2948348 1434 1 0.371 11 AGxAGG/AGGxGG GENOMAD.006049.VV 7.501e-107 356 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2609 2948345 2948494 150 1 0.340 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2610 2948505 2949914 1410 1 0.362 11 AGxAGG/AGGxGG GENOMAD.003968.VV 2.731e-31 132 0 0 1 2561 Caudoviricetes NA NA PF06152;COG5585;TIGR01641 NAD+--asparagine ADP-ribosyltransferase
+NC_009012.1|provirus_2931283_2970170_2611 2949911 2950117 207 1 0.348 11 AGGAG GENOMAD.066155.VV 6.191e-11 58 0 0 0 2561 Caudoviricetes NA NA PF06372 NA
+NC_009012.1|provirus_2931283_2970170_2612 2950161 2950847 687 1 0.339 11 None GENOMAD.007545.VV 1.038e-29 120 0 0 0 2561 Caudoviricetes NA NA PF06810 Phage minor structural protein GP20
+NC_009012.1|provirus_2931283_2970170_2613 2950866 2951789 924 1 0.394 11 AGGAG GENOMAD.092843.VP 1.736e-163 511 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2614 2951802 2951948 147 1 0.388 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2615 2951926 2952327 402 1 0.443 11 AGGA/GGAG/GAGG GENOMAD.047671.VV 6.175e-72 237 0 0 0 2561 Caudoviricetes NA NA PF11436 NA
+NC_009012.1|provirus_2931283_2970170_2616 2952324 2952659 336 1 0.464 11 GGAGG GENOMAD.074010.VV 3.139e-52 179 0 0 0 2561 Caudoviricetes NA NA PF12206 NA
+NC_009012.1|provirus_2931283_2970170_2617 2952656 2953066 411 1 0.416 11 GGxGG GENOMAD.019155.VV 1.438e-72 239 0 0 1 2561 Caudoviricetes NA NA PF11114;TIGR01725 phage protein, HK97 gp10 family
+NC_009012.1|provirus_2931283_2970170_2618 2953056 2953475 420 1 0.438 11 4Base/6BMM GENOMAD.025660.VV 2.016e-70 233 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2619 2953638 2954927 1290 -1 0.420 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2620 2955379 2956425 1047 1 0.393 11 AGGAG GENOMAD.118787.VV 2.086e-155 490 0 0 1 2561 Caudoviricetes NA NA PF04984;PF17482;COG3497 Phage tail sheath protein subtilisin-like domain; Phage tail sheath C-terminal domain
+NC_009012.1|provirus_2931283_2970170_2621 2956446 2956922 477 1 0.392 11 AGGAGG GENOMAD.018728.VV 4.047e-72 239 0 0 1 2561 Caudoviricetes NA NA PF09393 Phage tail tube protein
+NC_009012.1|provirus_2931283_2970170_2622 2956939 2957352 414 1 0.377 11 GGAG/GAGG GENOMAD.009389.VV 1.083e-59 202 0 0 1 2561 Caudoviricetes NA NA PF08890;PF17482 Phage XkdN-like tail assembly chaperone protein, TAC; Phage tail sheath C-terminal domain
+NC_009012.1|provirus_2931283_2970170_2623 2957352 2957543 192 1 0.391 11 3Base/5BMM GENOMAD.059912.VV 9.647e-19 80 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2624 2957545 2959380 1836 1 0.406 11 AGxAGG/AGGxGG GENOMAD.118787.VV 2.585e-124 413 0 0 1 2561 Caudoviricetes NA NA PF04984;PF17482;COG3497 Phage tail sheath protein subtilisin-like domain; Phage tail sheath C-terminal domain
+NC_009012.1|provirus_2931283_2970170_2625 2959377 2960036 660 1 0.374 11 AGxAGG/AGGxGG GENOMAD.017357.VV 6.647e-18 85 0 0 0 2561 Caudoviricetes NA NA PF06995;COG1652 Nucleoid-associated protein YgaU, contains BON and LysM domains
+NC_009012.1|provirus_2931283_2970170_2626 2960033 2960977 945 1 0.403 11 3Base/5BMM GENOMAD.018966.VV 1.564e-77 263 0 0 1 2561 Caudoviricetes NA NA PF14594;COG4379;TIGR03361;K06905 Mu-like prophage tail protein gpP
+NC_009012.1|provirus_2931283_2970170_2627 2960974 2961207 234 1 0.427 11 GGA/GAG/AGG GENOMAD.096038.VV 2.254e-39 140 0 0 0 2561 Caudoviricetes NA NA PF10844 NA
+NC_009012.1|provirus_2931283_2970170_2628 2961204 2961599 396 1 0.376 11 GGAGG GENOMAD.016318.VV 1.625e-52 181 0 0 0 2561 Caudoviricetes NA NA PF10934;COG4381;TIGR03357 Mu-like prophage protein gp46
+NC_009012.1|provirus_2931283_2970170_2629 2961599 2962657 1059 1 0.432 11 GGAGG GENOMAD.004833.VV 7.052e-52 190 0 0 1 2561 Caudoviricetes NA NA PF04865;COG3299 Baseplate J-like protein
+NC_009012.1|provirus_2931283_2970170_2630 2962647 2963249 603 1 0.420 11 GGA/GAG/AGG GENOMAD.015577.VV 8.917e-17 81 0 0 1 2561 Caudoviricetes NA NA PF10076;COG3778;TIGR02242 Uncharacterized protein YmfQ in lambdoid prophage, DUF2313 family
+NC_009012.1|provirus_2931283_2970170_2631 2963259 2963543 285 1 0.407 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2632 2963546 2964928 1383 1 0.513 11 AGGAGG GENOMAD.087125.VV 1.015e-11 70 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2633 2964993 2965253 261 1 0.402 11 AGGA GENOMAD.213587.VP 4.024e-30 114 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2634 2965254 2965406 153 1 0.386 11 AGGAG GENOMAD.065816.VV 5.681e-11 57 0 0 0 2561 Caudoviricetes NA NA PF09693;TIGR01669 phage uncharacterized protein, XkdX family
+NC_009012.1|provirus_2931283_2970170_2635 2965495 2965785 291 1 0.354 11 AGxAGG/AGGxGG GENOMAD.171716.VV 1.182e-08 53 0 0 0 1 NA NA NA PF07439 NA
+NC_009012.1|provirus_2931283_2970170_2636 2965801 2966457 657 1 0.482 11 AGxAGG/AGGxGG GENOMAD.220135.VV 1.55e-13 72 0 0 0 2561 Caudoviricetes NA NA COG5632 N-acetylmuramoyl-L-alanine amidase CwlA
+NC_009012.1|provirus_2931283_2970170_2637 2966597 2966896 300 1 0.450 11 GGAGG GENOMAD.151236.VC 1.963e-43 153 0 0 1 1 NA NA NA PF06946 Bacteriophage A118-like holin, Hol118
+NC_009012.1|provirus_2931283_2970170_2638 2967070 2967705 636 1 0.332 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2639 2967690 2968121 432 1 0.315 11 AGGAGG GENOMAD.206152.VV 2.957e-68 227 0 0 0 1 NA NA NA PF01845;COG2337;K07171 mRNA-degrading endonuclease, toxin component of the MazEF toxin-antitoxin module
+NC_009012.1|provirus_2931283_2970170_2640 2968641 2969126 486 1 0.440 11 AGGAG/GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2641 2969366 2969530 165 1 0.352 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_2931283_2970170_2642 2969562 2970170 609 1 0.417 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2977 3339258 3339497 240 1 0.429 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2978 3339748 3340554 807 1 0.446 11 AGGAGG GENOMAD.197438.VP 4.39e-23 102 0 0 0 2561 Caudoviricetes NA NA PF09250 Bifunctional DNA primase/polymerase, N-terminal
+NC_009012.1|provirus_3339258_3389049_2979 3340946 3342793 1848 1 0.414 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2980 3342816 3344054 1239 1 0.348 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2981 3344263 3344400 138 1 0.333 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2982 3344462 3344791 330 1 0.382 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2983 3344804 3345274 471 1 0.376 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2984 3345548 3345952 405 -1 0.410 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2985 3346045 3346803 759 -1 0.451 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2986 3346803 3348287 1485 -1 0.436 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2987 3348393 3349109 717 -1 0.392 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2988 3349682 3350029 348 1 0.405 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2989 3350172 3351857 1686 1 0.419 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2990 3351870 3352448 579 1 0.304 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2991 3352630 3353019 390 1 0.415 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2992 3353012 3353149 138 1 0.406 11 GGxGG GENOMAD.223510.VP 6.369e-08 48 0 0 0 1 NA NA NA PF10122;TIGR04104;COG4530 Mu-like prophage protein Com
+NC_009012.1|provirus_3339258_3389049_2993 3353530 3354081 552 1 0.457 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2994 3354477 3356318 1842 1 0.410 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2995 3356345 3357583 1239 1 0.350 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2996 3358087 3358431 345 1 0.336 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2997 3358458 3358892 435 1 0.315 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2998 3358867 3359211 345 1 0.397 11 AGxAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_2999 3359399 3359644 246 1 0.435 11 4Base/6BMM NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3000 3360040 3360228 189 1 0.370 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3001 3360466 3361671 1206 1 0.440 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3002 3361685 3361972 288 1 0.292 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3003 3362170 3362559 390 1 0.441 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3004 3362549 3362689 141 1 0.440 11 GGAGG GENOMAD.223510.VP 2.986e-08 49 0 0 0 1 NA NA NA PF10122;TIGR04104;COG4530 Mu-like prophage protein Com
+NC_009012.1|provirus_3339258_3389049_3005 3362816 3364975 2160 1 0.468 11 AGGAGG GENOMAD.169139.VV 4.569e-22 105 0 0 0 2561 Caudoviricetes NA NA PF09250 Bifunctional DNA primase/polymerase, N-terminal
+NC_009012.1|provirus_3339258_3389049_3006 3365247 3366560 1314 1 0.453 11 GGAGG GENOMAD.093418.VV 1.24e-13 76 0 0 1 2561 Caudoviricetes NA NA PF05065;TIGR01554;COG4653 phage major capsid protein, HK97 family
+NC_009012.1|provirus_3339258_3389049_3007 3366819 3367121 303 1 0.432 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3008 3367461 3368705 1245 1 0.441 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3009 3369138 3369425 288 1 0.299 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3010 3369641 3369937 297 1 0.434 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3011 3370188 3370994 807 1 0.454 11 AGGAGG GENOMAD.197438.VP 2.102e-21 97 0 0 0 2561 Caudoviricetes NA NA PF09250 Bifunctional DNA primase/polymerase, N-terminal
+NC_009012.1|provirus_3339258_3389049_3012 3371390 3373237 1848 1 0.403 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3013 3373261 3374499 1239 1 0.351 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3014 3374708 3375235 528 1 0.358 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3015 3375248 3375718 471 1 0.374 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3016 3375991 3377127 1137 -1 0.403 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3017 3377700 3378047 348 1 0.408 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3018 3378190 3378969 780 1 0.442 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3019 3378971 3379900 930 1 0.413 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3020 3379902 3380144 243 1 0.358 11 GGxGG GENOMAD.227820.VP 6.79e-08 50 0 0 0 1 NA NA NA PF15597 Immunity protein 59
+NC_009012.1|provirus_3339258_3389049_3021 3380249 3380851 603 1 0.274 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3022 3381065 3382069 1005 1 0.392 11 3Base/5BMM NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3023 3382076 3382312 237 1 0.308 11 AGGAGG GENOMAD.218640.VC 3.123e-07 48 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3024 3382430 3382819 390 1 0.428 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3025 3382812 3382949 138 1 0.399 11 GGAGG GENOMAD.223510.VP 6.369e-08 48 0 0 0 1 NA NA NA PF10122;TIGR04104;COG4530 Mu-like prophage protein Com
+NC_009012.1|provirus_3339258_3389049_3026 3383070 3385229 2160 1 0.468 11 AGGAGG GENOMAD.169139.VV 2.257e-22 106 0 0 0 2561 Caudoviricetes NA NA PF09250 Bifunctional DNA primase/polymerase, N-terminal
+NC_009012.1|provirus_3339258_3389049_3027 3385500 3386813 1314 1 0.451 11 GGAGG GENOMAD.093418.VV 6.053e-14 77 0 0 1 2561 Caudoviricetes NA NA PF05065;TIGR01554;COG4653 phage major capsid protein, HK97 family
+NC_009012.1|provirus_3339258_3389049_3028 3387138 3387440 303 1 0.436 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_009012.1|provirus_3339258_3389049_3029 3387805 3389049 1245 1 0.449 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_012982.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_012982.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_014008.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014008.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_014168.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014168.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,99 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_014168.1|provirus_27479_67296_28 27479 28375 897 1 0.672 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_29 28372 28920 549 1 0.667 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_30 28917 29114 198 1 0.712 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_31 29111 29863 753 1 0.671 11 GGAG/GAGG GENOMAD.032144.VV 1.48e-35 138 0 0 0 2561 Caudoviricetes NA NA PF12684 NA
+NC_014168.1|provirus_27479_67296_32 29860 30516 657 1 0.658 11 GGA/GAG/AGG GENOMAD.124252.VP 2.931e-32 127 0 0 0 2561 Caudoviricetes NA NA PF03837;TIGR01913 phage recombination protein Bet
+NC_014168.1|provirus_27479_67296_33 30516 30917 402 1 0.649 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_34 30923 31276 354 1 0.638 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_35 31280 31432 153 1 0.660 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_36 31426 31845 420 1 0.662 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_37 31842 32357 516 1 0.698 11 GGAG/GAGG GENOMAD.033304.VV 2.452e-10 61 0 0 0 2561 Caudoviricetes NA NA PF13395 NA
+NC_014168.1|provirus_27479_67296_38 32357 33292 936 1 0.661 11 GGxGG GENOMAD.028141.VV 1.19e-25 111 0 0 1 2561 Caudoviricetes NA NA PF09681;TIGR01714 N-terminal phage replisome organiser (Phage_rep_org_N)
+NC_014168.1|provirus_27479_67296_39 33289 33654 366 1 0.658 11 GGAGG GENOMAD.087217.VV 8.175e-05 43 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_40 33651 34037 387 1 0.674 11 AGGAG GENOMAD.018151.VV 4.881e-23 96 0 0 0 2561 Caudoviricetes NA NA PF01870;COG1591 Holliday junction resolvase, archaeal type
+NC_014168.1|provirus_27479_67296_41 34034 34234 201 1 0.672 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_42 34231 34542 312 1 0.670 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_43 34539 34751 213 1 0.596 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_44 34748 34984 237 1 0.578 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_45 35011 35331 321 1 0.617 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_46 35328 35798 471 1 0.620 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_47 35795 36223 429 1 0.653 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_48 36220 36798 579 1 0.585 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_49 36795 37106 312 1 0.647 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_50 37103 37882 780 1 0.663 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_51 37879 38100 222 1 0.676 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_52 38249 40009 1761 1 0.681 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_53 40017 40673 657 1 0.636 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_54 40670 40990 321 1 0.632 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_55 41205 41459 255 1 0.663 11 GGAGG GENOMAD.083226.VV 1.61e-08 52 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_56 41512 41895 384 1 0.620 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_57 41892 42371 480 1 0.640 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_58 42274 42642 369 -1 0.672 11 AGGAG GENOMAD.215374.PC 1.387e-08 54 0 0 0 1 NA NA NA PF13827 NA
+NC_014168.1|provirus_27479_67296_59 42807 43085 279 1 0.674 11 AGGAG GENOMAD.014408.VV 1.177e-14 70 0 0 0 2561 Caudoviricetes NA NA PF13395;TIGR02646 HNH endonuclease
+NC_014168.1|provirus_27479_67296_60 43082 43267 186 1 0.602 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_61 43504 43767 264 1 0.655 11 AGGAG GENOMAD.047538.VV 9.427e-15 70 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_62 43751 45166 1416 1 0.663 11 AGGAG/GGAGG GENOMAD.002060.VV 1.733e-134 436 0 0 1 2561 Caudoviricetes NA NA PF20441;PF04466;COG4626;TIGR01547;K06909 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014168.1|provirus_27479_67296_63 45190 46566 1377 1 0.687 11 GGAGG GENOMAD.080886.VV 1.496e-47 181 0 0 1 2561 Caudoviricetes NA NA PF05133;TIGR01538 phage portal protein, SPP1 family
+NC_014168.1|provirus_27479_67296_64 46550 47233 684 1 0.697 11 GGAG/GAGG GENOMAD.097054.VV 4.565e-30 121 0 0 1 2561 Caudoviricetes NA NA PF04233;TIGR01641 phage putative head morphogenesis protein, SPP1 gp7 family
+NC_014168.1|provirus_27479_67296_65 47285 47761 477 1 0.644 11 GGA/GAG/AGG GENOMAD.040462.VV 2.062e-54 188 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_66 47788 48696 909 1 0.636 11 GGAG/GAGG GENOMAD.013023.VV 2.718e-53 192 0 0 1 2561 Caudoviricetes NA NA PF05065;TIGR01554;COG4653 phage major capsid protein, HK97 family
+NC_014168.1|provirus_27479_67296_67 48696 48869 174 1 0.724 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_68 48841 49308 468 1 0.686 11 GGAG/GAGG GENOMAD.062537.VV 2.534e-42 153 0 0 1 2561 Caudoviricetes NA NA PF09355 Phage protein Gp19/Gp15/Gp42
+NC_014168.1|provirus_27479_67296_69 49305 49646 342 1 0.702 11 None GENOMAD.038727.VV 1.417e-21 91 0 0 1 2561 Caudoviricetes NA NA PF12206;COG5614;TIGR01563 Minor capsid protein
+NC_014168.1|provirus_27479_67296_70 49647 49955 309 1 0.673 11 GGAGG GENOMAD.087122.VV 2.723e-10 58 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_71 49959 50357 399 1 0.714 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_72 50395 51042 648 1 0.657 11 AGGA GENOMAD.004252.VV 6.372e-16 79 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_73 51039 51371 333 1 0.658 11 GGA/GAG/AGG GENOMAD.187636.VV 2.624e-05 44 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_74 51380 51763 384 1 0.693 11 3Base/5BMM GENOMAD.056037.VV 4.163e-06 47 0 0 0 2561 Caudoviricetes NA NA PF17318;PF08765;TIGR02417 Mor transcription activator family
+NC_014168.1|provirus_27479_67296_75 51744 55466 3723 1 0.706 11 AGGAG GENOMAD.016295.VV 2.211e-48 193 0 0 0 2561 Caudoviricetes NA NA COG3953 SLT domain protein
+NC_014168.1|provirus_27479_67296_76 55466 56728 1263 1 0.678 11 GGAGG GENOMAD.053786.VV 4.118e-58 211 0 0 0 2561 Caudoviricetes NA NA COG4722 Phage-related protein
+NC_014168.1|provirus_27479_67296_77 56728 58500 1773 1 0.679 11 GGA/GAG/AGG GENOMAD.019112.VV 3.356e-155 502 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_78 58500 58751 252 1 0.675 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_79 58751 59812 1062 1 0.658 11 GGAGG GENOMAD.059914.VV 2.914e-67 235 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_80 59814 61079 1266 1 0.682 11 None GENOMAD.079434.VV 5.593e-20 96 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_81 61144 62403 1260 1 0.683 11 AGGAG GENOMAD.047467.VV 2.371e-19 94 0 0 0 2561 Caudoviricetes NA NA COG5632 N-acetylmuramoyl-L-alanine amidase CwlA
+NC_014168.1|provirus_27479_67296_82 62400 62756 357 1 0.669 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_83 62756 63031 276 1 0.656 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_84 63031 63237 207 1 0.705 11 GGxGG GENOMAD.158505.VV 1.14e-05 43 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_85 63230 63589 360 1 0.689 11 AGGAG GENOMAD.073706.VV 2.772e-08 53 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_27479_67296_86 63716 64087 372 -1 0.570 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_87 64298 64633 336 -1 0.560 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_88 64630 64902 273 -1 0.615 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_89 64902 66164 1263 -1 0.621 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_27479_67296_90 66247 67296 1050 -1 0.604 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1152 1141631 1141948 318 -1 0.736 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1153 1142010 1142369 360 -1 0.742 11 GGA/GAG/AGG GENOMAD.082050.VV 3.69e-22 93 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1154 1142366 1142698 333 -1 0.685 11 GGA/GAG/AGG GENOMAD.076859.VV 2.776e-13 67 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1155 1142709 1143020 312 -1 0.740 11 AGGAGG GENOMAD.103239.VV 2.089e-13 67 0 0 1 2561 Caudoviricetes NA NA PF10665;TIGR01563;COG5614 Minor capsid protein
+NC_014168.1|provirus_1141631_1162952_1156 1143056 1143292 237 1 0.633 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1157 1143298 1143807 510 -1 0.716 11 GGAG/GAGG GENOMAD.028700.VV 2.384e-22 96 0 0 0 2561 Caudoviricetes NA NA TIGR02215 phage conserved hypothetical protein, phiE125 gp8 family
+NC_014168.1|provirus_1141631_1162952_1158 1143813 1144004 192 -1 0.609 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1159 1144022 1145302 1281 -1 0.680 11 AGGAG GENOMAD.098207.VP 2.112e-87 297 0 0 1 2561 Caudoviricetes NA NA PF06673;TIGR01554;COG1659 Lactococcus lactis bacteriophage major capsid protein
+NC_014168.1|provirus_1141631_1162952_1160 1145299 1145991 693 -1 0.700 11 AGGAG GENOMAD.207278.VV 3.963e-19 89 0 0 1 2561 Caudoviricetes NA NA PF04586;COG3740;K06904;TIGR01543 Phage head maturation protease
+NC_014168.1|provirus_1141631_1162952_1161 1145948 1147249 1302 -1 0.707 11 GGAG/GAGG GENOMAD.138175.VV 2.9e-86 294 0 0 1 2561 Caudoviricetes NA NA PF04860;TIGR01537;COG4695 phage portal protein, HK97 family
+NC_014168.1|provirus_1141631_1162952_1162 1147274 1148770 1497 -1 0.707 11 GGAGG GENOMAD.037086.VV 2.935e-120 396 0 0 1 2561 Caudoviricetes NA NA PF20441;PF03354;COG4626;TIGR01547 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014168.1|provirus_1141631_1162952_1163 1148787 1149077 291 -1 0.735 11 GGAG/GAGG GENOMAD.064187.VV 3.239e-06 46 0 0 1 2561 Caudoviricetes NA NA TIGR01558 NA
+NC_014168.1|provirus_1141631_1162952_1164 1149335 1149841 507 1 0.677 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1165 1150029 1150580 552 1 0.661 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1166 1150720 1151001 282 -1 0.645 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1167 1151045 1151320 276 -1 0.703 11 None GENOMAD.041582.VV 4.527e-16 74 0 0 0 2561 Caudoviricetes NA NA PF13395;TIGR02646 TIGR02646 family protein
+NC_014168.1|provirus_1141631_1162952_1168 1151326 1152444 1119 -1 0.718 11 GGAGG GENOMAD.064801.VV 2.016e-15 81 0 0 0 2561 Caudoviricetes NA NA PF00145;TIGR00675;COG0270;K15336 DNA-methyltransferase (dcm)
+NC_014168.1|provirus_1141631_1162952_1169 1152853 1153509 657 -1 0.702 11 AGGAG GENOMAD.066690.VV 1.852e-101 327 0 0 0 2561 Caudoviricetes NA NA PF10122;COG5349;TIGR01206 Uncharacterized conserved protein, DUF983 family
+NC_014168.1|provirus_1141631_1162952_1170 1153506 1153754 249 -1 0.683 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1171 1153751 1154008 258 -1 0.698 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1172 1154012 1154389 378 -1 0.675 11 GGAG/GAGG GENOMAD.063447.VV 9.173e-15 72 0 0 0 2561 Caudoviricetes NA NA PF11417 NA
+NC_014168.1|provirus_1141631_1162952_1173 1154389 1155183 795 -1 0.659 11 AGGAG GENOMAD.049678.VV 1.151e-06 52 0 0 1 2561 Caudoviricetes NA NA PF09681;TIGR01714 phage replisome organizer, putative, N-terminal region
+NC_014168.1|provirus_1141631_1162952_1174 1155187 1155612 426 -1 0.732 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1175 1155609 1155995 387 -1 0.700 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1176 1156014 1156796 783 -1 0.706 11 GGAGG GENOMAD.021092.VV 7.29e-40 151 0 0 0 2561 Caudoviricetes NA NA PF12684;TIGR00372;COG1468;K07465 CRISPR-associated protein Cas4
+NC_014168.1|provirus_1141631_1162952_1177 1156793 1157083 291 -1 0.698 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1178 1157080 1157307 228 -1 0.693 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1179 1157304 1157678 375 -1 0.739 11 GGAG/GAGG GENOMAD.067886.VV 1.484e-08 54 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1180 1157757 1158599 843 -1 0.706 11 AGGA GENOMAD.161352.VP 5.904e-23 102 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1181 1158605 1159525 921 -1 0.701 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1182 1159522 1159776 255 -1 0.729 11 GGA/GAG/AGG GENOMAD.222641.VP 1.01e-05 44 0 0 0 1 NA NA NA PF08667;COG5606;TIGR02612;K07727 Predicted DNA-binding protein, XRE-type HTH domain
+NC_014168.1|provirus_1141631_1162952_1183 1159861 1160289 429 1 0.713 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1184 1160403 1161263 861 1 0.700 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1185 1161230 1161493 264 1 0.746 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014168.1|provirus_1141631_1162952_1186 1161597 1162952 1356 1 0.684 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_014211.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014211.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_014212.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014212.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,120 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_014212.1|provirus_1170297_1209132_1203 1170297 1171460 1164 -1 0.588 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1204 1171538 1171798 261 -1 0.452 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1205 1171872 1173071 1200 -1 0.613 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1206 1173072 1173524 453 -1 0.587 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1207 1173812 1174465 654 -1 0.567 11 GGAGG GENOMAD.212789.VC 7.003e-10 61 0 0 0 1 NA NA NA PF08667;TIGR00673;COG1974;K22299 cyanase
+NC_014212.1|provirus_1170297_1209132_1208 1174604 1174783 180 1 0.517 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1209 1174780 1175010 231 1 0.623 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1210 1175054 1175242 189 1 0.614 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1211 1175242 1175514 273 1 0.648 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1212 1175507 1175629 123 1 0.618 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1213 1175629 1175847 219 1 0.689 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1214 1175875 1176492 618 1 0.544 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1215 1176556 1178289 1734 1 0.577 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1216 1178289 1178624 336 1 0.610 11 None GENOMAD.004598.VV 3.185e-12 64 0 0 0 2561 Caudoviricetes NA NA PF18743;COG1591 REase_AHJR-like
+NC_014212.1|provirus_1170297_1209132_1217 1178621 1181314 2694 1 0.628 11 GGAG/GAGG GENOMAD.106709.VV 1.101e-06 55 0 0 0 2561 Caudoviricetes NA NA PF16793 RepB DNA-primase from phage plasmid
+NC_014212.1|provirus_1170297_1209132_1218 1181304 1181546 243 1 0.424 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1219 1181649 1182485 837 1 0.568 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1220 1182591 1183058 468 1 0.645 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1221 1183055 1183510 456 1 0.596 11 GGAGG GENOMAD.172137.VP 1.504e-54 188 0 0 1 2561 Caudoviricetes NA NA PF07141;COG3728;TIGR02036 Putative bacteriophage terminase small subunit
+NC_014212.1|provirus_1170297_1209132_1222 1183500 1184804 1305 1 0.611 11 AGGA/GGAG/GAGG GENOMAD.190694.VP 5.526e-100 334 0 0 1 2561 Caudoviricetes NA NA PF04466;PF17288;TIGR01547;COG1783;K06909 phage terminase, large subunit, PBSX family
+NC_014212.1|provirus_1170297_1209132_1223 1184801 1186228 1428 1 0.680 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1224 1186209 1187081 873 1 0.667 11 None GENOMAD.064248.VV 1.444e-15 80 0 0 1 2561 Caudoviricetes NA NA PF04233;TIGR01641 phage putative head morphogenesis protein, SPP1 gp7 family
+NC_014212.1|provirus_1170297_1209132_1225 1187022 1187201 180 -1 0.578 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1226 1187232 1188875 1644 1 0.609 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1227 1188995 1189195 201 1 0.627 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1228 1189265 1190137 873 1 0.649 11 GGA/GAG/AGG GENOMAD.063287.VV 0.0001126 46 0 0 1 2561 Caudoviricetes NA NA PF04586;TIGR01543;COG3740;K06904 phage prohead protease, HK97 family
+NC_014212.1|provirus_1170297_1209132_1229 1190337 1190996 660 -1 0.620 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1230 1191039 1192691 1653 1 0.683 11 None GENOMAD.196129.VP 5.652e-07 55 0 0 1 2561 Caudoviricetes NA NA PF05125;TIGR01551;COG4653 phage major capsid protein, P2 family
+NC_014212.1|provirus_1170297_1209132_1231 1192702 1192935 234 1 0.662 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1232 1192937 1193491 555 1 0.686 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1233 1193488 1193814 327 1 0.670 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1234 1193804 1194343 540 1 0.704 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1235 1194336 1194770 435 1 0.674 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1236 1194779 1195567 789 1 0.646 11 AGGAGG GENOMAD.154545.VV 0.0001874 45 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1237 1195567 1196052 486 1 0.693 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1238 1196182 1199919 3738 1 0.622 11 AGxAGG/AGGxGG GENOMAD.183233.VP 3.13e-19 97 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1239 1199916 1200356 441 1 0.599 11 4Base/6BMM NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1240 1200353 1201429 1077 1 0.550 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1241 1201432 1203336 1905 1 0.602 11 None GENOMAD.084202.VV 0.0003846 46 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1242 1203346 1203888 543 1 0.645 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1243 1203979 1204518 540 1 0.696 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1244 1204529 1204840 312 1 0.580 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1245 1204843 1206681 1839 1 0.591 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1246 1206689 1207249 561 1 0.667 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1247 1207242 1207553 312 1 0.647 11 GGAG/GAGG GENOMAD.103334.VV 2.089e-13 67 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1248 1207563 1208354 792 1 0.635 11 GGAGG GENOMAD.024392.VV 1.495e-72 246 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1249 1208354 1208902 549 1 0.608 11 None GENOMAD.052331.VV 1.732e-50 178 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1170297_1209132_1250 1208917 1209132 216 1 0.579 11 GGAGG GENOMAD.199026.VV 1.153e-06 46 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1776 1746722 1747702 981 -1 0.630 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1777 1747716 1748285 570 -1 0.400 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1778 1748294 1749001 708 -1 0.552 11 AGxAGG/AGGxGG GENOMAD.190987.VC 3.906e-07 53 0 0 0 2561 Caudoviricetes NA NA PF00717;COG1974;TIGR00498 SOS-response transcriptional repressor LexA (RecA-mediated autopeptidase)
+NC_014212.1|provirus_1746722_1764354_1779 1749082 1749270 189 1 0.582 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1780 1749263 1749469 207 1 0.614 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1781 1749504 1749674 171 1 0.614 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1782 1749664 1749942 279 1 0.609 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1783 1749935 1750057 123 1 0.650 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1784 1750057 1750149 93 1 0.613 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1785 1750146 1750445 300 1 0.623 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1786 1750442 1750786 345 1 0.600 11 4Base/6BMM GENOMAD.138277.VP 0.0001458 42 0 0 0 9913 Herelleviridae NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1787 1750786 1751118 333 1 0.583 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1788 1751069 1752535 1467 1 0.571 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1789 1752532 1752741 210 1 0.595 11 GGA/GAG/AGG GENOMAD.127419.VV 5.309e-06 44 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1790 1752729 1753061 333 1 0.616 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1791 1753134 1753376 243 1 0.626 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1792 1753373 1753642 270 1 0.507 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1793 1753645 1753848 204 1 0.539 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1794 1753930 1754400 471 1 0.590 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1795 1754397 1754762 366 1 0.653 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1796 1755173 1755850 678 1 0.599 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1797 1755852 1756052 201 1 0.622 11 GGAG/GAGG GENOMAD.187456.VV 2.238e-19 82 0 0 0 4181 Sphaerolipoviridae NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1798 1756052 1756789 738 1 0.608 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1799 1756850 1757281 432 1 0.586 11 None GENOMAD.226936.VP 5.158e-29 114 0 0 0 4181 Sphaerolipoviridae NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1800 1757291 1757752 462 1 0.576 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1801 1757761 1758645 885 1 0.631 11 AGGA GENOMAD.175220.VV 1.243e-35 140 0 0 0 4181 Sphaerolipoviridae NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1802 1758645 1758887 243 1 0.551 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1803 1758899 1759534 636 1 0.616 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1804 1759531 1759830 300 1 0.573 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1805 1759827 1760003 177 1 0.582 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1806 1759994 1760500 507 1 0.649 11 GGA/GAG/AGG GENOMAD.201673.VV 2.522e-06 49 0 0 0 4181 Sphaerolipoviridae NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1807 1760511 1760699 189 1 0.587 11 GGAGG GENOMAD.131894.VV 1.707e-06 45 0 0 1 1 NA NA NA PF04531;TIGR01598;COG5546 NA
+NC_014212.1|provirus_1746722_1764354_1808 1760702 1760875 174 1 0.569 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1809 1760863 1761318 456 1 0.581 11 GGAG/GAGG GENOMAD.199413.VV 4.785e-15 74 0 0 0 4181 Sphaerolipoviridae NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1810 1761318 1762367 1050 1 0.577 11 4Base/6BMM GENOMAD.107709.VV 1.275e-125 404 0 0 0 4181 Sphaerolipoviridae NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1811 1762357 1763370 1014 1 0.537 11 AGGAG GENOMAD.109373.VV 8.278e-11 66 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1812 1763367 1763630 264 1 0.610 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1746722_1764354_1813 1763605 1764354 750 1 0.620 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1936 1893193 1893432 240 1 0.600 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1937 1893580 1893810 231 1 0.567 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1938 1893803 1894078 276 1 0.641 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1939 1894071 1894289 219 1 0.603 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1940 1894299 1894694 396 1 0.667 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1941 1894780 1895259 480 1 0.635 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1942 1895256 1895957 702 1 0.660 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1943 1895947 1896387 441 1 0.639 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1944 1896444 1896692 249 1 0.586 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1945 1896702 1897043 342 1 0.617 11 AGGAG GENOMAD.188989.VV 8.584e-67 221 0 0 0 1 NA NA NA PF10711 Hypothetical protein (DUF2513)
+NC_014212.1|provirus_1893193_1914973_1946 1897045 1897365 321 1 0.604 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1947 1897376 1897837 462 1 0.632 11 GGA/GAG/AGG GENOMAD.102149.VV 7.093e-30 117 0 0 1 1 NA NA NA PF11985 Bacteriophage Mu, Gp27
+NC_014212.1|provirus_1893193_1914973_1948 1897824 1899107 1284 1 0.639 11 GGA/GAG/AGG GENOMAD.025283.VV 5.515e-85 290 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1949 1899107 1900642 1536 1 0.645 11 AGGAG GENOMAD.116653.VV 5.637e-33 138 0 0 0 2561 Caudoviricetes NA NA PF06074;COG4383 Mu-like prophage protein gp29
+NC_014212.1|provirus_1893193_1914973_1950 1900644 1901816 1173 1 0.660 11 GGAG/GAGG GENOMAD.169564.VP 1.859e-13 75 0 0 0 2561 Caudoviricetes NA NA COG2369 Uncharacterized conserved protein, contains phage Mu gpF-like domain
+NC_014212.1|provirus_1893193_1914973_1951 1901828 1903027 1200 -1 0.613 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1952 1903028 1903480 453 -1 0.587 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1953 1903664 1904203 540 1 0.667 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1954 1904257 1904703 447 1 0.691 11 None GENOMAD.191448.VP 4.904e-23 97 0 0 1 2561 Caudoviricetes NA NA PF05069;TIGR01635;COG5005 phage virion morphogenesis (putative tail completion) protein
+NC_014212.1|provirus_1893193_1914973_1955 1904784 1905284 501 1 0.679 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1956 1905295 1905507 213 1 0.648 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1957 1905504 1906925 1422 1 0.675 11 AGGAGG GENOMAD.041181.VV 9.292e-41 161 0 0 1 2561 Caudoviricetes NA NA PF10758;COG3497 Phage tail sheath protein FI
+NC_014212.1|provirus_1893193_1914973_1958 1906936 1907367 432 1 0.595 11 AGGAGG GENOMAD.115837.VV 7.589e-83 269 0 0 0 2561 Caudoviricetes NA NA PF10772 Bacteriophage HP1, Orf24
+NC_014212.1|provirus_1893193_1914973_1959 1907426 1907800 375 1 0.629 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1960 1907805 1907936 132 -1 0.712 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1961 1907951 1910032 2082 1 0.691 11 GGAGG GENOMAD.113463.VP 1.273e-12 74 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1962 1910032 1910610 579 1 0.646 11 AGGAGG GENOMAD.163406.VV 9.335e-105 335 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1963 1910607 1911272 666 1 0.715 11 GGA/GAG/AGG GENOMAD.068883.VV 3.569e-104 335 0 0 0 2561 Caudoviricetes NA NA TIGR03361;COG3500 type VI secretion system Vgr family protein
+NC_014212.1|provirus_1893193_1914973_1964 1911274 1911750 477 1 0.671 11 AGGAGG GENOMAD.068883.VV 1.244e-15 76 0 0 0 2561 Caudoviricetes NA NA TIGR03361;COG3500 type VI secretion system Vgr family protein
+NC_014212.1|provirus_1893193_1914973_1965 1911750 1912124 375 1 0.651 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014212.1|provirus_1893193_1914973_1966 1912117 1913199 1083 1 0.664 11 GGAGG GENOMAD.106861.VV 2.93e-22 102 0 0 1 2561 Caudoviricetes NA NA PF04865;COG3299 Baseplate J-like protein
+NC_014212.1|provirus_1893193_1914973_1967 1913200 1913811 612 1 0.667 11 GGAGG GENOMAD.067612.VV 1.972e-93 303 0 0 1 2561 Caudoviricetes NA NA PF10076;COG4385;TIGR01634 Bacteriophage P2-related tail formation protein
+NC_014212.1|provirus_1893193_1914973_1968 1913819 1914973 1155 1 0.602 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_014363.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014363.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_014364.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014364.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,170 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_014364.1|provirus_2121424_2157334_1980 2121424 2123298 1875 -1 0.279 11 AATAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1981 2123295 2124836 1542 -1 0.291 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1982 2124849 2126519 1671 -1 0.313 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1983 2126533 2127723 1191 -1 0.296 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1984 2128349 2128567 219 1 0.425 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1985 2128620 2128988 369 1 0.512 11 AAAAAA GENOMAD.048210.VV 0.0001851 42 0 0 0 2561 Caudoviricetes NA NA PF05263;TIGR01636;COG1737;K03481 phage transcriptional activator, RinA family
+NC_014364.1|provirus_2121424_2157334_1986 2129017 2129205 189 1 0.439 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1987 2129348 2129836 489 1 0.462 11 AAAA GENOMAD.053051.VV 1.914e-10 61 0 0 0 2561 Caudoviricetes NA NA PF10772;PF02086;TIGR00571;COG0338 Bacteriophage HP1, Orf24; D12 class N6 adenine-specific DNA methyltransferase
+NC_014364.1|provirus_2121424_2157334_1988 2130317 2130664 348 1 0.483 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1989 2130715 2131533 819 1 0.548 11 AACAA GENOMAD.177891.VP 2.239e-15 79 0 0 0 2561 Caudoviricetes NA NA PF03837;TIGR01913;COG3723 phage recombination protein Bet
+NC_014364.1|provirus_2121424_2157334_1990 2131552 2132241 690 1 0.470 11 AAA GENOMAD.183319.VP 1.282e-26 111 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1991 2132238 2132714 477 1 0.564 11 None GENOMAD.111167.VV 2.064e-79 260 0 0 0 2561 Caudoviricetes NA NA PF16784 Putative HNHc nuclease
+NC_014364.1|provirus_2121424_2157334_1992 2132711 2133103 393 1 0.506 11 None GENOMAD.002027.VV 4.172e-17 79 0 0 1 2561 Caudoviricetes NA NA PF05766 Bacteriophage Lambda NinG protein
+NC_014364.1|provirus_2121424_2157334_1993 2133113 2133715 603 1 0.557 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1994 2133728 2134816 1089 1 0.573 11 None GENOMAD.018355.VV 8.801e-10 63 0 0 1 2561 Caudoviricetes NA NA PF09681;TIGR01714 phage replisome organizer, putative, N-terminal region
+NC_014364.1|provirus_2121424_2157334_1995 2134821 2135222 402 1 0.537 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1996 2135206 2135424 219 1 0.438 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1997 2135387 2135821 435 -1 0.522 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1998 2135946 2136674 729 1 0.442 11 AAAAAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_1999 2137384 2137893 510 1 0.539 11 AAA GENOMAD.170837.VV 9.661e-13 68 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_014364.1|provirus_2121424_2157334_2000 2137890 2139611 1722 1 0.564 11 None GENOMAD.194580.VP 1.811e-50 193 0 0 1 2561 Caudoviricetes NA NA PF03354;PF05521;PF20441;COG4626;TIGR01563 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014364.1|provirus_2121424_2157334_2001 2139608 2140849 1242 1 0.576 11 None GENOMAD.120555.VV 2.308e-46 176 0 0 1 2561 Caudoviricetes NA NA K21511 NA
+NC_014364.1|provirus_2121424_2157334_2002 2140839 2141672 834 1 0.574 11 None GENOMAD.096083.VP 2.363e-26 112 0 0 0 2561 Caudoviricetes NA NA PF00574;K01358;TIGR00493;COG0740 ATP-dependent Clp endopeptidase, proteolytic subunit ClpP
+NC_014364.1|provirus_2121424_2157334_2003 2141673 2142872 1200 1 0.563 11 None GENOMAD.080602.VV 1.495e-11 69 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR02215 phage conserved hypothetical protein, phiE125 gp8 family
+NC_014364.1|provirus_2121424_2157334_2004 2142889 2143311 423 1 0.582 11 None GENOMAD.129880.VV 8.259e-56 191 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2005 2143390 2143947 558 1 0.570 11 None GENOMAD.080176.VV 6.661e-14 72 0 0 0 2561 Caudoviricetes NA NA PF11436;TIGR02215 phage conserved hypothetical protein, phiE125 gp8 family
+NC_014364.1|provirus_2121424_2157334_2006 2143917 2144369 453 1 0.574 11 None GENOMAD.060383.VV 2.955e-10 60 0 0 1 1 NA NA NA PF04883;TIGR01725;COG5005 phage protein, HK97 gp10 family
+NC_014364.1|provirus_2121424_2157334_2007 2144347 2144745 399 1 0.534 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2008 2144749 2145444 696 1 0.519 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2009 2145447 2145848 402 1 0.530 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2010 2145869 2146144 276 1 0.554 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2011 2146125 2148398 2274 1 0.563 11 None GENOMAD.009561.VV 4.996e-38 157 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2012 2148401 2151679 3279 1 0.526 11 None GENOMAD.109300.VV 0.0 2070 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2013 2151676 2152287 612 1 0.547 11 None GENOMAD.007262.VV 1.557e-22 98 0 0 1 1 NA NA NA PF16778 Phage tail assembly chaperone protein
+NC_014364.1|provirus_2121424_2157334_2014 2152292 2152525 234 1 0.483 11 AAAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2015 2152527 2152997 471 1 0.507 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2016 2152994 2153242 249 1 0.478 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2017 2153244 2153633 390 1 0.538 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2018 2153947 2154315 369 1 0.360 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2019 2154472 2154795 324 1 0.349 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2020 2155168 2155953 786 1 0.392 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2121424_2157334_2021 2156093 2157334 1242 -1 0.475 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2174 2329685 2330950 1266 1 0.534 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2175 2331412 2331927 516 -1 0.260 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2176 2331924 2332307 384 -1 0.333 11 AATAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2177 2332404 2333627 1224 -1 0.283 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2178 2333802 2334419 618 -1 0.278 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2179 2334416 2335450 1035 -1 0.266 11 AAAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2180 2335637 2336704 1068 -1 0.370 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2181 2336829 2337170 342 -1 0.450 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2182 2337251 2337481 231 1 0.407 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2183 2337478 2337723 246 1 0.504 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2184 2337961 2338164 204 1 0.534 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2185 2338728 2339270 543 1 0.492 11 None GENOMAD.112664.VP 5.227e-63 214 0 0 0 2561 Caudoviricetes NA NA PF11195 NA
+NC_014364.1|provirus_2329685_2350621_2186 2339267 2339521 255 1 0.486 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2187 2339518 2340633 1116 1 0.544 11 None GENOMAD.090362.VV 6.936e-21 98 0 0 1 2561 Caudoviricetes NA NA PF13479;TIGR01618;COG2087 phage nucleotide-binding protein
+NC_014364.1|provirus_2329685_2350621_2188 2340648 2341298 651 1 0.498 11 None GENOMAD.025041.VV 1.179e-20 93 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2189 2341303 2341941 639 1 0.535 11 None GENOMAD.067346.VV 8.792e-124 391 0 0 0 2561 Caudoviricetes NA NA PF06023;TIGR00372;COG4343 CRISPR-associated protein Cas4
+NC_014364.1|provirus_2329685_2350621_2190 2341938 2342411 474 1 0.527 11 None GENOMAD.111167.VV 1.217e-84 275 0 0 0 2561 Caudoviricetes NA NA PF16784 Putative HNHc nuclease
+NC_014364.1|provirus_2329685_2350621_2191 2342625 2342858 234 1 0.500 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2192 2342868 2343407 540 1 0.554 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2193 2343420 2344475 1056 1 0.536 11 None GENOMAD.018355.VV 3.86e-05 48 0 0 1 2561 Caudoviricetes NA NA PF09681;TIGR01714 phage replisome organizer, putative, N-terminal region
+NC_014364.1|provirus_2329685_2350621_2194 2344481 2344894 414 1 0.551 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2195 2344878 2345096 219 1 0.438 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2196 2345093 2345284 192 1 0.505 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2197 2345287 2345487 201 1 0.542 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2198 2345630 2346916 1287 1 0.431 11 AAAA GENOMAD.185015.VV 0.0001092 47 0 0 0 2561 Caudoviricetes NA NA PF18692;PF14466;TIGR03066;COG3187;K03668 Gemmata obscuriglobus paralogous family TIGR03066
+NC_014364.1|provirus_2329685_2350621_2199 2347200 2348180 981 1 0.448 11 AAAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2329685_2350621_2200 2348796 2349302 507 1 0.550 11 AAA GENOMAD.170837.VV 4.939e-10 60 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_014364.1|provirus_2329685_2350621_2201 2349299 2350621 1323 1 0.550 11 None GENOMAD.194580.VP 1.831e-53 198 0 0 1 2561 Caudoviricetes NA NA PF03354;PF05521;PF20441;COG4626;TIGR01563 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014364.1|provirus_2666253_2703772_2490 2666253 2667515 1263 1 0.469 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2491 2667512 2667952 441 -1 0.458 11 None GENOMAD.167054.PV 6.452e-08 53 0 0 0 1 NA NA NA PF06892;TIGR02612;COG3655 mobile mystery protein A
+NC_014364.1|provirus_2666253_2703772_2492 2667949 2668332 384 -1 0.474 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2493 2668604 2668852 249 -1 0.414 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2494 2668815 2669231 417 -1 0.465 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2495 2669290 2669850 561 -1 0.381 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2496 2670024 2670449 426 -1 0.528 11 AAAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2497 2670476 2670724 249 -1 0.518 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2498 2670721 2670822 102 -1 0.539 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2499 2670819 2671190 372 -1 0.527 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2500 2671197 2671430 234 -1 0.487 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2501 2671435 2672046 612 -1 0.560 11 None GENOMAD.007262.VV 7.521e-22 96 0 0 1 1 NA NA NA PF16778 Phage tail assembly chaperone protein
+NC_014364.1|provirus_2666253_2703772_2502 2672043 2675357 3315 -1 0.506 11 None GENOMAD.109300.VV 0.0 2147 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2503 2675360 2677537 2178 -1 0.555 11 None GENOMAD.040051.VV 1.304e-19 97 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2504 2677518 2677793 276 -1 0.558 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2505 2677814 2678215 402 -1 0.520 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2506 2678218 2678973 756 -1 0.511 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2507 2678912 2679310 399 -1 0.526 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2508 2679288 2679713 426 -1 0.561 11 None GENOMAD.060383.VV 4.591e-11 62 0 0 1 1 NA NA NA PF04883;TIGR01725;COG5005 phage protein, HK97 gp10 family
+NC_014364.1|provirus_2666253_2703772_2509 2679710 2680267 558 -1 0.534 11 None GENOMAD.080176.VV 1.118e-18 86 0 0 0 2561 Caudoviricetes NA NA PF11436;TIGR02215 phage conserved hypothetical protein, phiE125 gp8 family
+NC_014364.1|provirus_2666253_2703772_2510 2680271 2680684 414 -1 0.534 11 None GENOMAD.210649.VV 1.155e-06 49 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2511 2680638 2681888 1251 -1 0.552 11 None GENOMAD.090434.VV 2.489e-32 134 0 0 1 2561 Caudoviricetes NA NA PF05065;TIGR01554;COG4653 phage major capsid protein, HK97 family
+NC_014364.1|provirus_2666253_2703772_2512 2681903 2682610 708 -1 0.556 11 None GENOMAD.126169.VV 1.014e-33 132 0 0 1 2561 Caudoviricetes NA NA PF04586;K06904;COG3740;TIGR01543 Phage head maturation protease
+NC_014364.1|provirus_2666253_2703772_2513 2682607 2684223 1617 -1 0.557 11 None GENOMAD.179073.VP 3.772e-33 139 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2514 2684220 2685944 1725 -1 0.556 11 None GENOMAD.194580.VP 1.898e-51 196 0 0 1 2561 Caudoviricetes NA NA PF03354;PF05521;PF20441;COG4626;TIGR01563 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014364.1|provirus_2666253_2703772_2515 2685941 2686450 510 -1 0.561 11 AAA GENOMAD.170837.VV 2.224e-11 64 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_014364.1|provirus_2666253_2703772_2516 2686454 2686852 399 -1 0.549 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2517 2687097 2687804 708 -1 0.381 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2518 2687794 2688030 237 -1 0.359 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2519 2688024 2688701 678 -1 0.412 11 None GENOMAD.222821.VP 3.109e-116 370 0 0 0 2561 Caudoviricetes NA NA TIGR03116 CRISPR type IV/AFERR-associated protein Csf3
+NC_014364.1|provirus_2666253_2703772_2520 2688698 2689639 942 -1 0.429 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2521 2689612 2689965 354 -1 0.387 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2522 2689910 2690650 741 -1 0.406 11 None GENOMAD.222446.VP 5.477e-146 457 0 0 0 1 NA NA NA TIGR03114 CRISPR type AFERR-associated protein Csf1
+NC_014364.1|provirus_2666253_2703772_2523 2690719 2690904 186 -1 0.425 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2524 2690927 2691118 192 -1 0.490 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2525 2691115 2691333 219 -1 0.425 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2526 2691317 2691718 402 -1 0.557 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2527 2691723 2692811 1089 -1 0.567 11 None GENOMAD.018355.VV 8.801e-10 63 0 0 1 2561 Caudoviricetes NA NA PF09681;TIGR01714 phage replisome organizer, putative, N-terminal region
+NC_014364.1|provirus_2666253_2703772_2528 2692824 2693420 597 -1 0.554 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2529 2693430 2693843 414 -1 0.500 11 None GENOMAD.002027.VV 5.448e-17 79 0 0 1 2561 Caudoviricetes NA NA PF05766 Bacteriophage Lambda NinG protein
+NC_014364.1|provirus_2666253_2703772_2530 2693840 2696353 2514 -1 0.494 11 None GENOMAD.126436.VP 5.738e-126 427 0 0 0 2561 Caudoviricetes NA NA PF13872 NA
+NC_014364.1|provirus_2666253_2703772_2531 2696356 2696832 477 -1 0.570 11 None GENOMAD.111167.VV 6.951e-83 270 0 0 0 2561 Caudoviricetes NA NA PF16784 Putative HNHc nuclease
+NC_014364.1|provirus_2666253_2703772_2532 2696829 2697434 606 -1 0.464 11 AAA GENOMAD.176983.VP 4.38e-16 79 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2533 2697453 2698265 813 -1 0.534 11 AACAA GENOMAD.177891.VP 4.712e-16 81 0 0 0 2561 Caudoviricetes NA NA PF03837;TIGR01913;COG3723 phage recombination protein Bet
+NC_014364.1|provirus_2666253_2703772_2534 2698316 2699071 756 -1 0.516 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2535 2699141 2699344 204 -1 0.554 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2536 2699404 2700138 735 -1 0.509 11 None GENOMAD.014438.VV 2.838e-34 134 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2537 2700139 2700486 348 -1 0.517 11 AAAA GENOMAD.100208.VV 1.289e-06 48 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2538 2700598 2700861 264 -1 0.379 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2539 2700891 2701232 342 1 0.456 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2540 2701372 2701794 423 -1 0.492 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2541 2701796 2702014 219 -1 0.457 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2542 2702096 2702443 348 1 0.405 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2543 2702566 2703069 504 1 0.357 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2544 2703117 2703407 291 1 0.392 11 None GENOMAD.219421.VC 7.977e-05 42 0 0 0 9067 Straboviridae NA NA NA NA
+NC_014364.1|provirus_2666253_2703772_2545 2703410 2703772 363 1 0.377 11 AAAA GENOMAD.227798.VP 1.946e-45 160 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2796 2976748 2977998 1251 1 0.455 11 None GENOMAD.225071.VP 8.645e-08 57 0 0 0 1 NA NA NA PF00589;PF13102;TIGR02225;COG4973;K14059 tyrosine recombinase XerD
+NC_014364.1|provirus_2976748_3014759_2797 2978103 2978576 474 -1 0.432 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2798 2978601 2978786 186 1 0.441 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2799 2978805 2979119 315 1 0.410 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2800 2979484 2979939 456 -1 0.355 11 AATAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2801 2980070 2980450 381 -1 0.454 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2802 2981023 2981250 228 1 0.544 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2803 2981859 2982401 543 1 0.488 11 None GENOMAD.112664.VP 2.835e-61 209 0 0 0 2561 Caudoviricetes NA NA PF11195 NA
+NC_014364.1|provirus_2976748_3014759_2804 2982398 2982652 255 1 0.467 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2805 2982649 2983740 1092 1 0.552 11 None GENOMAD.032961.VV 1.703e-27 118 0 0 1 2561 Caudoviricetes NA NA PF13479;TIGR01618;COG2087;K04484 phage nucleotide-binding protein
+NC_014364.1|provirus_2976748_3014759_2806 2983755 2984405 651 1 0.498 11 None GENOMAD.025041.VV 1.179e-20 93 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2807 2984410 2985048 639 1 0.546 11 None GENOMAD.067346.VV 1.619e-125 396 0 0 0 2561 Caudoviricetes NA NA PF06023;TIGR00372;COG4343 CRISPR-associated protein Cas4
+NC_014364.1|provirus_2976748_3014759_2808 2985045 2985518 474 1 0.540 11 None GENOMAD.111167.VV 7.301e-82 267 0 0 0 2561 Caudoviricetes NA NA PF16784 Putative HNHc nuclease
+NC_014364.1|provirus_2976748_3014759_2809 2985528 2985974 447 1 0.506 11 None GENOMAD.002027.VV 2.633e-21 92 0 0 1 2561 Caudoviricetes NA NA PF05766 Bacteriophage Lambda NinG protein
+NC_014364.1|provirus_2976748_3014759_2810 2985984 2986526 543 1 0.562 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2811 2986554 2987651 1098 1 0.533 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2812 2987656 2988057 402 1 0.545 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2813 2988041 2988259 219 1 0.447 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2814 2988256 2988462 207 1 0.507 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2815 2988462 2989181 720 1 0.528 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2816 2989159 2990028 870 1 0.553 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2817 2990048 2990725 678 1 0.527 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2818 2990697 2990873 177 1 0.525 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2819 2990900 2991442 543 1 0.499 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2820 2991609 2991938 330 1 0.521 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2821 2991948 2993630 1683 1 0.551 11 None GENOMAD.060970.VV 1.975e-99 338 0 0 1 2561 Caudoviricetes NA NA PF12236 Bacteriophage head to tail connecting protein
+NC_014364.1|provirus_2976748_3014759_2822 2993627 2993929 303 1 0.545 11 None GENOMAD.118268.VV 1.689e-06 47 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2823 2993926 2994732 807 1 0.545 11 None GENOMAD.072294.VV 2.192e-115 370 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2824 2994744 2995730 987 1 0.532 11 None GENOMAD.004790.VV 4.85e-58 207 0 0 1 2561 Caudoviricetes NA NA PF19307 Phage capsid-like protein
+NC_014364.1|provirus_2976748_3014759_2825 2995745 2996119 375 1 0.565 11 None GENOMAD.013948.VV 1.528e-25 103 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2826 2996128 2996442 315 1 0.556 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2827 2996452 2997045 594 1 0.532 11 None GENOMAD.061091.VV 8.908e-15 75 0 0 1 2561 Caudoviricetes NA NA PF17212 Tail tubular protein
+NC_014364.1|provirus_2976748_3014759_2828 2997042 2998754 1713 1 0.537 11 None GENOMAD.063463.VV 3.739e-12 72 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2829 2998751 2999638 888 1 0.484 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2830 2999654 3001600 1947 1 0.500 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2831 3001597 3007842 6246 1 0.505 11 None GENOMAD.224557.VP 0.0001899 49 0 0 0 2561 Caudoviricetes NA NA PF18819 Phage MuF-C-terminal domain
+NC_014364.1|provirus_2976748_3014759_2832 3007790 3011446 3657 1 0.470 11 AAA GENOMAD.113444.VC 1.137e-11 72 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2833 3011443 3012054 612 1 0.554 11 None GENOMAD.007262.VV 3.024e-24 103 0 0 1 1 NA NA NA PF16778 Phage tail assembly chaperone protein
+NC_014364.1|provirus_2976748_3014759_2834 3012059 3012292 234 1 0.487 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2835 3012298 3012777 480 1 0.479 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2836 3012774 3012995 222 1 0.419 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2837 3013047 3013463 417 1 0.540 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_014364.1|provirus_2976748_3014759_2838 3013650 3014759 1110 1 0.259 11 AAA NA NA NA 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_015761.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_015761.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,112 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_015761.1|provirus_847397_862760_745 847397 847636 240 -1 0.438 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_847397_862760_746 847705 848118 414 1 0.611 11 None GENOMAD.138177.VP 1.107e-17 81 0 0 1 2561 Caudoviricetes NA NA PF04717;PF18715;COG4540;TIGR01644 Phage P2 baseplate assembly protein gpV
+NC_015761.1|provirus_847397_862760_747 848177 848536 360 1 0.553 11 GGAGG GENOMAD.121581.VP 1.359e-07 51 0 0 1 2561 Caudoviricetes NA NA PF04965;COG3628;K06903;TIGR03357 Phage baseplate assembly protein W
+NC_015761.1|provirus_847397_862760_748 848523 849431 909 1 0.590 11 AGGAG GENOMAD.105501.VV 2.367e-122 392 0 0 1 2561 Caudoviricetes NA NA PF03434;COG3948 Phage-related baseplate assembly protein
+NC_015761.1|provirus_847397_862760_749 849424 850029 606 1 0.578 11 GGxGG GENOMAD.114503.VV 2.832e-71 239 0 0 1 2561 Caudoviricetes NA NA PF09684;COG4385;TIGR01634 Bacteriophage P2-related tail formation protein
+NC_015761.1|provirus_847397_862760_750 850026 850943 918 1 0.548 11 GGA/GAG/AGG GENOMAD.118528.VP 8.226e-145 457 0 0 1 2561 Caudoviricetes NA NA PF12571;COG5301 Phage-related tail fibre protein
+NC_015761.1|provirus_847397_862760_751 851338 852495 1158 1 0.306 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_847397_862760_752 852717 853181 465 -1 0.447 11 AGGA GENOMAD.168001.VP 6.793e-48 169 0 0 1 2561 Caudoviricetes NA NA PF16778 Phage tail assembly chaperone protein
+NC_015761.1|provirus_847397_862760_753 853514 853768 255 -1 0.424 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_847397_862760_754 853798 854055 258 1 0.508 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_847397_862760_755 854436 854621 186 1 0.586 11 AGGAG GENOMAD.120968.VV 2.238e-24 96 0 0 1 2561 Caudoviricetes NA NA COG3497 Phage tail sheath protein FI
+NC_015761.1|provirus_847397_862760_756 854942 855244 303 1 0.558 11 AGGA GENOMAD.135969.VP 5.864e-25 100 0 0 1 2561 Caudoviricetes NA NA PF10109 Phage tail assembly chaperone proteins, E, or 41 or 14
+NC_015761.1|provirus_847397_862760_757 855371 856519 1149 1 0.586 11 None GENOMAD.130201.VP 2.372e-43 166 0 0 1 2561 Caudoviricetes NA NA COG5283 Phage-related tail protein
+NC_015761.1|provirus_847397_862760_758 856462 858486 2025 1 0.583 11 None GENOMAD.145447.VP 1.422e-33 142 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_847397_862760_759 858446 858832 387 1 0.535 11 None GENOMAD.116424.VV 2.281e-14 71 0 0 0 2561 Caudoviricetes NA NA PF06995;K06906;COG3499 Phage protein U
+NC_015761.1|provirus_847397_862760_760 858829 859881 1053 1 0.531 11 GGAGG GENOMAD.209614.VP 3.524e-49 182 0 0 1 2561 Caudoviricetes NA NA PF05954;K06905;COG3500;TIGR03361 Phage protein D
+NC_015761.1|provirus_847397_862760_761 859972 860190 219 1 0.461 11 GGAG/GAGG GENOMAD.222803.VP 3.752e-10 56 0 0 0 2561 Caudoviricetes NA NA PF04606;TIGR04165;COG1326 Ogr/Delta-like zinc finger
+NC_015761.1|provirus_847397_862760_762 860426 862111 1686 -1 0.537 11 AGxAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_847397_862760_763 862383 862760 378 1 0.508 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_886 1007223 1008242 1020 -1 0.473 11 GGAG/GAGG GENOMAD.212993.VP 2.024e-35 141 0 0 0 2561 Caudoviricetes NA NA PF14659;K21039 Phage integrase, N-terminal SAM-like domain
+NC_015761.1|provirus_1007223_1045009_887 1008243 1008467 225 -1 0.502 11 GGAG/GAGG GENOMAD.151670.VV 1.037e-08 52 0 0 0 2561 Caudoviricetes NA NA PF13986 NA
+NC_015761.1|provirus_1007223_1045009_888 1008909 1009049 141 1 0.532 11 GGAG/GAGG GENOMAD.224144.VP 3.211e-14 66 0 0 0 2561 Caudoviricetes NA NA PF10798;K21975 Biofilm development protein YmgB/AriR
+NC_015761.1|provirus_1007223_1045009_889 1009155 1009961 807 -1 0.337 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_890 1009958 1010806 849 -1 0.418 11 GGAG/GAGG GENOMAD.212816.VV 1.518e-152 478 0 0 0 2561 Caudoviricetes NA NA PF20613;TIGR03843 HipA-like kinase
+NC_015761.1|provirus_1007223_1045009_891 1010978 1011445 468 -1 0.476 11 AGGA GENOMAD.091484.VV 0.0004177 42 0 0 0 2561 Caudoviricetes NA NA PF13411;COG3415;K22302;TIGR00721 Transposase
+NC_015761.1|provirus_1007223_1045009_892 1011459 1011686 228 1 0.425 11 AGGAGG GENOMAD.151341.VV 0.0001753 40 0 0 1 2561 Caudoviricetes NA NA PF11242;TIGR00673;COG5606;K18830 cyanase
+NC_015761.1|provirus_1007223_1045009_893 1011706 1012026 321 1 0.539 11 GGAG/GAGG GENOMAD.069430.VV 6.718e-58 195 0 0 1 2561 Caudoviricetes NA NA PF18010;TIGR00721;COG4220 Cry35Ab1 HTH C-terminal domain
+NC_015761.1|provirus_1007223_1045009_894 1012118 1013023 906 1 0.475 11 AGGAG GENOMAD.208204.VP 3.298e-81 273 0 0 0 2561 Caudoviricetes NA NA PF04492;TIGR01610 phage replication protein O, N-terminal domain
+NC_015761.1|provirus_1007223_1045009_895 1013020 1013712 693 1 0.551 11 GGAG/GAGG GENOMAD.194512.VV 1.29e-76 256 0 0 1 2561 Caudoviricetes NA NA PF06992 NA
+NC_015761.1|provirus_1007223_1045009_896 1013726 1013983 258 1 0.488 11 AGGAG GENOMAD.072808.VV 9.932e-44 153 0 0 0 2561 Caudoviricetes NA NA PF15944 NA
+NC_015761.1|provirus_1007223_1045009_897 1013980 1014891 912 1 0.498 11 GGAGG GENOMAD.068933.VV 1.147e-200 618 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_898 1014993 1015319 327 1 0.462 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_899 1015319 1015426 108 1 0.454 11 AGGA/GGAG/GAGG GENOMAD.226031.VP 2.127e-06 43 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_900 1015606 1016037 432 -1 0.389 11 GGA/GAG/AGG GENOMAD.213484.VP 5.7e-53 183 0 0 0 2561 Caudoviricetes NA NA PF05509;COG4877 Plasmid stability protein
+NC_015761.1|provirus_1007223_1045009_901 1016160 1016327 168 1 0.411 11 AGxAGG/AGGxGG GENOMAD.168832.VV 8.581e-31 114 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_902 1016314 1017228 915 1 0.462 11 GGA/GAG/AGG GENOMAD.222649.VP 4.345e-08 57 0 0 0 2561 Caudoviricetes NA NA PF10548;PF10547;COG3617 Prophage antirepressor
+NC_015761.1|provirus_1007223_1045009_903 1017301 1018047 747 1 0.475 11 AGGA GENOMAD.167364.VP 3.729e-134 423 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_904 1018233 1018466 234 1 0.462 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_905 1018866 1019468 603 1 0.526 11 GGAG/GAGG GENOMAD.040195.VV 1.554e-77 257 0 0 0 2561 Caudoviricetes NA NA PF07105 NA
+NC_015761.1|provirus_1007223_1045009_906 1019857 1020528 672 1 0.512 11 GGA/GAG/AGG GENOMAD.058019.VV 7.177e-33 129 0 0 0 2561 Caudoviricetes NA NA PF06323 Phage antitermination protein Q
+NC_015761.1|provirus_1007223_1045009_907 1020797 1021369 573 1 0.471 11 GGAG/GAGG GENOMAD.209828.VP 1.159e-20 92 0 0 0 2561 Caudoviricetes NA NA PF10543;COG3646 ORF6N domain
+NC_015761.1|provirus_1007223_1045009_908 1021511 1022011 501 -1 0.465 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_909 1022022 1022201 180 -1 0.472 11 GGAG/GAGG GENOMAD.175300.VV 1.174e-29 111 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_910 1023134 1023559 426 1 0.352 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_911 1023588 1024331 744 1 0.423 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_912 1024569 1024958 390 1 0.482 11 GGAG/GAGG GENOMAD.222896.VP 4.488e-57 194 0 0 1 2561 Caudoviricetes NA NA PF16931 Putative phage holin
+NC_015761.1|provirus_1007223_1045009_913 1024945 1025226 282 1 0.514 11 GGAGG GENOMAD.214895.VP 1.105e-15 73 0 0 1 2561 Caudoviricetes NA NA PF05449 Putative 3TM holin, Phage_holin_3
+NC_015761.1|provirus_1007223_1045009_914 1025226 1025840 615 1 0.528 11 GGAG/GAGG GENOMAD.021660.VV 3.743e-21 94 0 0 0 2561 Caudoviricetes NA NA COG3179;K18950 Predicted chitinase
+NC_015761.1|provirus_1007223_1045009_915 1025837 1026379 543 1 0.534 11 None GENOMAD.108518.VV 1.733e-31 123 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_916 1026641 1027171 531 1 0.448 11 GGA/GAG/AGG GENOMAD.068419.VV 7.247e-49 173 0 0 0 2561 Caudoviricetes NA NA PF10549 ORF11CD3 domain
+NC_015761.1|provirus_1007223_1045009_917 1027137 1027496 360 1 0.506 11 GGA/GAG/AGG GENOMAD.062288.VV 1.85e-37 137 0 0 0 2561 Caudoviricetes NA NA PF10721 NA
+NC_015761.1|provirus_1007223_1045009_918 1027571 1027981 411 1 0.353 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_919 1028070 1028375 306 1 0.392 11 GGAG/GAGG GENOMAD.210890.VV 1.177e-49 171 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_920 1028478 1028828 351 1 0.510 11 AGGA GENOMAD.179073.VP 2.39e-17 79 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_921 1028913 1029170 258 1 0.523 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_922 1029172 1030284 1113 1 0.524 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_923 1030383 1030499 117 1 0.436 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_924 1030656 1031234 579 1 0.402 11 AGGA GENOMAD.222575.VP 5.62e-21 93 0 0 0 2561 Caudoviricetes NA NA PF06416 Effector protein NleG
+NC_015761.1|provirus_1007223_1045009_925 1031568 1033916 2349 -1 0.456 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_926 1034271 1035401 1131 -1 0.546 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_927 1035640 1035837 198 1 0.510 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_928 1036394 1036723 330 -1 0.476 11 AGGA GENOMAD.182552.PC 9.486e-56 189 0 0 0 1 NA NA NA PF15781;COG3668;TIGR00053;K06218 Plasmid stabilization system protein ParE
+NC_015761.1|provirus_1007223_1045009_929 1036749 1036979 231 -1 0.450 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_930 1037060 1037353 294 -1 0.476 11 GGA/GAG/AGG GENOMAD.221919.VP 3.483e-21 89 0 0 0 2561 Caudoviricetes NA NA PF00589 Phage integrase family
+NC_015761.1|provirus_1007223_1045009_931 1038122 1038700 579 1 0.402 11 AGGA GENOMAD.222575.VP 5.62e-21 93 0 0 0 2561 Caudoviricetes NA NA PF06416 Effector protein NleG
+NC_015761.1|provirus_1007223_1045009_932 1039093 1039440 348 1 0.534 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_933 1039590 1040444 855 1 0.385 11 4Base/6BMM GENOMAD.120636.VV 2.17e-58 206 0 0 0 2561 Caudoviricetes NA NA PF09612;TIGR02192 protein YibB
+NC_015761.1|provirus_1007223_1045009_934 1040507 1040737 231 -1 0.320 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_935 1040933 1043740 2808 -1 0.577 11 AGGAGG GENOMAD.054026.VV 1.896e-05 51 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_1007223_1045009_936 1044602 1045009 408 1 0.451 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2808 3084741 3084959 219 -1 0.507 11 GGAG/GAGG GENOMAD.223866.VP 4.224e-09 53 0 0 0 2561 Caudoviricetes NA NA PF04606;TIGR02098 Ogr/Delta-like zinc finger
+NC_015761.1|provirus_3084741_3115735_2809 3085026 3086195 1170 -1 0.548 11 GGAGG GENOMAD.209614.VP 1.088e-49 185 0 0 1 2561 Caudoviricetes NA NA PF05954;K06905;COG3500;TIGR03361 Phage protein D
+NC_015761.1|provirus_3084741_3115735_2810 3086192 3086677 486 -1 0.543 11 GGAG/GAGG GENOMAD.116424.VV 2.262e-19 87 0 0 0 2561 Caudoviricetes NA NA PF06995;K06906;COG3499 Phage protein U
+NC_015761.1|provirus_3084741_3115735_2811 3086692 3089133 2442 -1 0.566 11 GGA/GAG/AGG GENOMAD.130201.VP 4.265e-179 582 0 0 1 2561 Caudoviricetes NA NA COG5283 Phage-related tail protein
+NC_015761.1|provirus_3084741_3115735_2812 3089278 3089613 336 -1 0.571 11 GGA/GAG/AGG GENOMAD.135969.VP 1.933e-25 102 0 0 1 2561 Caudoviricetes NA NA PF10109 Phage tail assembly chaperone proteins, E, or 41 or 14
+NC_015761.1|provirus_3084741_3115735_2813 3089676 3090194 519 -1 0.586 11 AGGAG/GGAGG GENOMAD.222086.VV 9.473e-26 106 0 0 1 2561 Caudoviricetes NA NA PF04985;K06908;TIGR01611;COG3498 phage contractile tail tube protein, P2 family
+NC_015761.1|provirus_3084741_3115735_2814 3090210 3091397 1188 -1 0.549 11 GGAG/GAGG GENOMAD.102019.VV 3.796e-60 216 0 0 1 2561 Caudoviricetes NA NA PF10758;COG3497 Phage tail sheath protein FI
+NC_015761.1|provirus_3084741_3115735_2815 3091532 3092080 549 -1 0.475 11 AGGA GENOMAD.209102.VP 2.721e-113 359 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2816 3092093 3094069 1977 -1 0.518 11 GGA/GAG/AGG GENOMAD.151930.VP 1.701e-178 573 0 0 1 2561 Caudoviricetes NA NA PF12571;COG5301 Phage-related tail fibre protein
+NC_015761.1|provirus_3084741_3115735_2817 3094080 3094610 531 -1 0.539 11 GGxGG GENOMAD.114503.VV 2.848e-76 252 0 0 1 2561 Caudoviricetes NA NA PF09684;COG4385;TIGR01634 Bacteriophage P2-related tail formation protein
+NC_015761.1|provirus_3084741_3115735_2818 3094603 3095511 909 -1 0.554 11 GGA/GAG/AGG GENOMAD.105501.VV 5.746e-121 388 0 0 1 2561 Caudoviricetes NA NA PF03434;COG3948 Phage-related baseplate assembly protein
+NC_015761.1|provirus_3084741_3115735_2819 3095518 3095865 348 -1 0.549 11 GGAGG GENOMAD.121581.VP 1.186e-07 51 0 0 1 2561 Caudoviricetes NA NA PF04965;COG3628;K06903;TIGR03357 Phage baseplate assembly protein W
+NC_015761.1|provirus_3084741_3115735_2820 3095862 3096503 642 -1 0.615 11 AGGA/GGAG/GAGG GENOMAD.166314.VP 7.564e-57 198 0 0 1 2561 Caudoviricetes NA NA K22111;TIGR01644;COG4540 phage baseplate assembly protein V
+NC_015761.1|provirus_3084741_3115735_2821 3096572 3097021 450 -1 0.596 11 GGA/GAG/AGG GENOMAD.134219.VP 5.44e-48 169 0 0 1 2561 Caudoviricetes NA NA PF05069;TIGR01635;COG5005 phage virion morphogenesis (putative tail completion) protein
+NC_015761.1|provirus_3084741_3115735_2822 3097014 3097481 468 -1 0.568 11 AGGA GENOMAD.125799.VP 3.104e-65 219 0 0 1 2561 Caudoviricetes NA NA PF06891 P2 phage tail completion protein R (GpR)
+NC_015761.1|provirus_3084741_3115735_2823 3097444 3097602 159 -1 0.572 11 GGA/GAG/AGG GENOMAD.116277.VV 5.069e-27 103 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2824 3097589 3098002 414 -1 0.594 11 GGxGG GENOMAD.191084.VP 1.984e-28 112 0 0 0 2561 Caudoviricetes NA NA PF10828;TIGR03495 phage lysis regulatory protein, LysB family
+NC_015761.1|provirus_3084741_3115735_2825 3097999 3098496 498 -1 0.572 11 AGxAGG/AGGxGG GENOMAD.123113.VP 0.0005094 42 0 0 0 2561 Caudoviricetes NA NA PF19846 NA
+NC_015761.1|provirus_3084741_3115735_2826 3098483 3098779 297 -1 0.549 11 GGAG/GAGG GENOMAD.177230.VP 7.699e-37 134 0 0 1 2561 Caudoviricetes NA NA PF04550;TIGR01594 Phage holin family 2
+NC_015761.1|provirus_3084741_3115735_2827 3098783 3098971 189 -1 0.571 11 GGA/GAG/AGG GENOMAD.159179.VP 4.593e-18 78 0 0 1 2561 Caudoviricetes NA NA COG5004;K06370 P2-like prophage tail protein X
+NC_015761.1|provirus_3084741_3115735_2828 3098986 3099492 507 -1 0.586 11 GGAG/GAGG GENOMAD.119083.VV 9.468e-51 178 0 0 0 2561 Caudoviricetes NA NA PF05926 Phage head completion protein (GPL)
+NC_015761.1|provirus_3084741_3115735_2829 3099586 3100335 750 -1 0.615 11 GGAG/GAGG GENOMAD.034571.VV 3.734e-44 163 0 0 1 2561 Caudoviricetes NA NA PF05944 Phage small terminase subunit
+NC_015761.1|provirus_3084741_3115735_2830 3100339 3101406 1068 -1 0.529 11 AGGA GENOMAD.125799.VP 2.236e-60 215 0 0 1 2561 Caudoviricetes NA NA PF06891 P2 phage tail completion protein R (GpR)
+NC_015761.1|provirus_3084741_3115735_2831 3101482 3102336 855 -1 0.538 11 AGGA GENOMAD.042716.VV 2.893e-146 460 0 0 0 2561 Caudoviricetes NA NA COG4388 Mu-like prophage I protein
+NC_015761.1|provirus_3084741_3115735_2832 3102502 3104271 1770 1 0.572 11 GGAG/GAGG GENOMAD.151636.VP 8.559e-104 352 0 0 0 2561 Caudoviricetes NA NA COG5484 Uncharacterized protein YjcR, contains N-terminal HTH domain
+NC_015761.1|provirus_3084741_3115735_2833 3104271 3105317 1047 1 0.538 11 GGAG/GAGG GENOMAD.073411.VV 2.533e-07 55 0 0 1 2561 Caudoviricetes NA NA PF04860;TIGR01540;COG4695 phage portal protein, PBSX family
+NC_015761.1|provirus_3084741_3115735_2834 3105395 3106399 1005 1 0.375 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2835 3106779 3107327 549 -1 0.341 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2836 3107438 3108169 732 -1 0.455 11 AGGA GENOMAD.226160.VP 4.122e-139 437 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2837 3108252 3108692 441 -1 0.454 11 GGAGG GENOMAD.137104.VV 8.416e-25 102 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2838 3108810 3111029 2220 -1 0.516 11 None GENOMAD.182861.VP 4.397e-89 314 0 0 1 2561 Caudoviricetes NA NA PF05840 Bacteriophage replication gene A protein (GPA)
+NC_015761.1|provirus_3084741_3115735_2839 3111152 3111673 522 -1 0.481 11 None GENOMAD.170058.VV 8.762e-113 357 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2840 3111670 3111894 225 -1 0.573 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2841 3111894 3112121 228 -1 0.509 11 AGGAG GENOMAD.071646.VV 8.539e-33 121 0 0 0 2561 Caudoviricetes NA NA PF10809 NA
+NC_015761.1|provirus_3084741_3115735_2842 3112191 3112391 201 -1 0.403 11 GGA/GAG/AGG GENOMAD.167874.VV 2.606e-40 142 0 0 0 1 NA NA NA NA NA
+NC_015761.1|provirus_3084741_3115735_2843 3112378 3112605 228 -1 0.482 11 GGAG/GAGG GENOMAD.087231.VV 3.1e-35 128 0 0 0 2561 Caudoviricetes NA NA PF10893 Bacteriophage 186, Fil
+NC_015761.1|provirus_3084741_3115735_2844 3112613 3113122 510 -1 0.539 11 GGAG/GAGG GENOMAD.170830.VP 4.59e-76 251 0 0 1 2561 Caudoviricetes NA NA PF06892 Phage regulatory protein CII (CP76)
+NC_015761.1|provirus_3084741_3115735_2845 3113153 3113416 264 -1 0.530 11 GGA/GAG/AGG GENOMAD.120542.VV 1.195e-50 173 0 0 0 1 NA NA NA PF07618;COG3311;TIGR02405 Putative transcription regulator (DUF1323)
+NC_015761.1|provirus_3084741_3115735_2846 3113547 3114125 579 1 0.454 11 GGA/GAG/AGG GENOMAD.069724.VV 5.35e-42 154 0 0 0 2561 Caudoviricetes NA NA PF16452 Bacteriophage CI repressor C-terminal domain
+NC_015761.1|provirus_3084741_3115735_2847 3114125 3115162 1038 1 0.489 11 GGAG/GAGG GENOMAD.212346.VP 5.632e-52 190 0 0 1 2561 Caudoviricetes NA NA PF16452;PF06892;COG1974 Bacteriophage CI repressor C-terminal domain; Phage regulatory protein CII (CP76)
+NC_015761.1|provirus_3084741_3115735_2848 3115400 3115735 336 -1 0.473 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_017033.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_017033.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,163 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_017033.1|provirus_1052334_1094910_930 1052334 1052537 204 -1 0.647 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_931 1053148 1054167 1020 -1 0.611 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_932 1054169 1054387 219 -1 0.594 11 GGAG/GAGG GENOMAD.180717.VC 2.645e-13 65 0 0 0 2561 Caudoviricetes NA NA PF13986 NA
+NC_017033.1|provirus_1052334_1094910_933 1054387 1054635 249 -1 0.554 11 GGAGG GENOMAD.104567.VV 3.707e-07 48 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_934 1054637 1054864 228 -1 0.548 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_935 1054857 1055138 282 -1 0.681 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_936 1055135 1055392 258 -1 0.593 11 GGA/GAG/AGG GENOMAD.178404.VP 6.067e-41 145 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_937 1055389 1056072 684 -1 0.611 11 GGAGG GENOMAD.171154.VP 4.943e-50 179 0 0 0 2561 Caudoviricetes NA NA PF13986;PF05551 NA
+NC_017033.1|provirus_1052334_1094910_938 1056069 1056419 351 -1 0.661 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_939 1056446 1056697 252 -1 0.579 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_940 1056715 1057194 480 -1 0.652 11 None GENOMAD.061727.VV 9.654e-06 47 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_941 1057194 1057496 303 -1 0.571 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_942 1057582 1057857 276 -1 0.620 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_943 1057854 1057982 129 -1 0.636 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_944 1058637 1059326 690 1 0.528 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_945 1059393 1059671 279 1 0.591 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_946 1060095 1060526 432 -1 0.544 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_947 1061139 1061330 192 1 0.542 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_948 1061475 1061768 294 1 0.595 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_949 1061876 1062043 168 -1 0.595 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_950 1062409 1062666 258 1 0.469 11 GGAG/GAGG GENOMAD.209492.VC 7.51e-09 53 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_951 1062672 1063235 564 1 0.426 11 AGGA GENOMAD.193207.VC 1.694e-10 62 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_952 1063880 1064236 357 -1 0.594 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_953 1064740 1065435 696 -1 0.593 11 None GENOMAD.223691.VP 7.797e-07 52 0 0 0 2561 Caudoviricetes NA NA PF16452;COG1974;K22300;TIGR02612 SOS-response transcriptional repressor LexA (RecA-mediated autopeptidase)
+NC_017033.1|provirus_1052334_1094910_954 1065731 1065943 213 1 0.606 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_955 1066043 1066552 510 -1 0.573 11 GGA/GAG/AGG GENOMAD.177794.VC 4.267e-34 130 0 0 0 2561 Caudoviricetes NA NA PF09639 YjcQ protein
+NC_017033.1|provirus_1052334_1094910_956 1066578 1067204 627 1 0.614 11 None GENOMAD.120202.VV 1.214e-07 54 0 0 1 1 NA NA NA PF06892 NA
+NC_017033.1|provirus_1052334_1094910_957 1067201 1068190 990 1 0.614 11 GGAGG GENOMAD.105893.VV 9.514e-13 72 0 0 0 2561 Caudoviricetes NA NA PF07120;COG3756 Uncharacterized conserved protein YdaU, DUF1376 family
+NC_017033.1|provirus_1052334_1094910_958 1068177 1068839 663 1 0.621 11 AGGAG GENOMAD.073619.VV 0.0005392 43 0 0 0 1 NA NA NA PF11417 Loader and inhibitor of phage G40P
+NC_017033.1|provirus_1052334_1094910_959 1068836 1069036 201 1 0.652 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_960 1069033 1069539 507 1 0.641 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_961 1069536 1069925 390 1 0.672 11 GGAGG GENOMAD.022482.VV 2.349e-31 120 0 0 0 2561 Caudoviricetes NA NA PF16786 Recombination enhancement, RecA-dependent nuclease
+NC_017033.1|provirus_1052334_1094910_962 1069922 1070419 498 1 0.542 11 GGAGG GENOMAD.159849.VP 2.603e-19 87 0 0 0 2561 Caudoviricetes NA NA PF07102;PF13264 Putative nuclease YbcO
+NC_017033.1|provirus_1052334_1094910_963 1070416 1070799 384 1 0.669 11 GGAG/GAGG GENOMAD.194195.VV 4.071e-16 76 0 0 0 2561 Caudoviricetes NA NA PF08774 VRR-NUC domain
+NC_017033.1|provirus_1052334_1094910_964 1070975 1071658 684 1 0.640 11 3Base/5BMM GENOMAD.069895.VV 4.278e-31 124 0 0 0 2561 Caudoviricetes NA NA PF17302;TIGR02642 Tryptophan RNA-binding attenuator protein inhibitory protein
+NC_017033.1|provirus_1052334_1094910_965 1071772 1072077 306 -1 0.565 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_966 1072058 1072372 315 -1 0.543 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_967 1072433 1072939 507 1 0.615 11 GGA/GAG/AGG GENOMAD.219399.VP 4.416e-42 153 0 0 0 2561 Caudoviricetes NA NA PF10549;COG3646;TIGR02681 Phage regulatory protein Rha
+NC_017033.1|provirus_1052334_1094910_968 1073003 1073221 219 1 0.612 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_969 1073205 1073681 477 1 0.671 11 GGAG/GAGG GENOMAD.083189.VV 3.344e-12 66 0 0 1 2561 Caudoviricetes NA NA PF00959;COG3772;K01185 Phage-related lysozyme (muramidase), GH24 family
+NC_017033.1|provirus_1052334_1094910_970 1073681 1074163 483 1 0.656 11 GGAG/GAGG GENOMAD.077452.VV 3.762e-11 63 0 0 1 2561 Caudoviricetes NA NA PF03245;K14744 Bacteriophage Rz lysis protein
+NC_017033.1|provirus_1052334_1094910_971 1074160 1074501 342 1 0.675 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_972 1074715 1075245 531 1 0.629 11 GGA/GAG/AGG GENOMAD.161251.VP 3.022e-32 125 0 0 1 2561 Caudoviricetes NA NA PF07471;K22014;COG4220 Phage DNA packaging protein, Nu1 subunit of terminase
+NC_017033.1|provirus_1052334_1094910_973 1075220 1077124 1905 1 0.637 11 AGGA GENOMAD.129396.VP 3.658e-61 227 0 0 1 2561 Caudoviricetes NA NA PF20454 Terminase large subunit gpA, endonuclease domain
+NC_017033.1|provirus_1052334_1094910_974 1077125 1077361 237 1 0.662 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_975 1077361 1078962 1602 1 0.670 11 None GENOMAD.019804.VV 6.033e-91 312 0 0 1 2561 Caudoviricetes NA NA PF05136;TIGR01539;COG5511 phage portal protein, lambda family
+NC_017033.1|provirus_1052334_1094910_976 1078962 1080191 1230 1 0.686 11 AGGAG GENOMAD.160855.VP 4.845e-09 61 0 0 0 2561 Caudoviricetes NA NA PF00574;TIGR00706;COG0740 signal peptide peptidase SppA, 36K type
+NC_017033.1|provirus_1052334_1094910_977 1080191 1080607 417 1 0.686 11 AGGAG GENOMAD.191487.VP 3.287e-14 71 0 0 0 1 NA NA NA PF02924 Bacteriophage lambda head decoration protein D
+NC_017033.1|provirus_1052334_1094910_978 1080672 1081673 1002 1 0.618 11 GGA/GAG/AGG GENOMAD.124233.VP 2.33e-71 246 0 0 1 2561 Caudoviricetes NA NA PF03864 Phage major capsid protein E
+NC_017033.1|provirus_1052334_1094910_979 1081673 1081981 309 1 0.650 11 None GENOMAD.092349.VV 3.404e-39 141 0 0 0 1 NA NA NA PF13856 ATP-binding sugar transporter from pro-phage
+NC_017033.1|provirus_1052334_1094910_980 1081978 1082574 597 1 0.657 11 GGAG/GAGG GENOMAD.066423.VV 4.833e-81 267 0 0 1 2561 Caudoviricetes NA NA PF06763 Prophage minor tail protein Z (GPZ)
+NC_017033.1|provirus_1052334_1094910_981 1082571 1083152 582 1 0.634 11 GGA/GAG/AGG GENOMAD.065270.VV 5.57e-42 154 0 0 1 2561 Caudoviricetes NA NA PF09646 Gp37 protein
+NC_017033.1|provirus_1052334_1094910_982 1083127 1083714 588 1 0.675 11 AGGAG GENOMAD.162066.VP 1.032e-44 162 0 0 1 2561 Caudoviricetes NA NA PF04717;COG4540;TIGR01644 Phage P2 baseplate assembly protein gpV
+NC_017033.1|provirus_1052334_1094910_983 1083725 1084081 357 1 0.672 11 GGA/GAG/AGG GENOMAD.099345.VV 3.147e-06 47 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_984 1084078 1084407 330 1 0.636 11 GGA/GAG/AGG GENOMAD.136378.VP 5.237e-38 138 0 0 1 2561 Caudoviricetes NA NA PF05136;PF04965;TIGR01539;K06903;COG5511 phage portal protein, lambda family
+NC_017033.1|provirus_1052334_1094910_985 1084404 1085288 885 1 0.655 11 GGA/GAG/AGG GENOMAD.105501.VV 4.427e-74 252 0 0 1 2561 Caudoviricetes NA NA PF03434;COG3948 Phage-related baseplate assembly protein
+NC_017033.1|provirus_1052334_1094910_986 1085281 1085826 546 1 0.663 11 GGA/GAG/AGG GENOMAD.114503.VV 4.33e-30 119 0 0 1 2561 Caudoviricetes NA NA PF09684;COG4385;TIGR01634 Bacteriophage P2-related tail formation protein
+NC_017033.1|provirus_1052334_1094910_987 1085826 1087793 1968 1 0.613 11 GGAG/GAGG GENOMAD.208390.VP 2.441e-59 222 0 0 1 2561 Caudoviricetes NA NA COG5301 Phage-related tail fibre protein
+NC_017033.1|provirus_1052334_1094910_988 1087794 1088279 486 1 0.646 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1052334_1094910_989 1088349 1089569 1221 1 0.649 11 GGAG/GAGG GENOMAD.218214.VV 7.277e-53 195 0 0 1 2561 Caudoviricetes NA NA PF17541;COG3497 Phage tail sheath protein FI
+NC_017033.1|provirus_1052334_1094910_990 1089579 1090082 504 1 0.647 11 AGGAG GENOMAD.099825.VV 1.006e-10 62 0 0 1 2561 Caudoviricetes NA NA PF04985;K06908;COG3498;TIGR01611 Phage tail tube protein FII
+NC_017033.1|provirus_1052334_1094910_991 1090092 1090415 324 1 0.623 11 AGGAG GENOMAD.073828.VV 1.34e-19 85 0 0 1 2561 Caudoviricetes NA NA PF10109 Phage tail assembly chaperone proteins, E, or 41 or 14
+NC_017033.1|provirus_1052334_1094910_992 1090522 1092840 2319 1 0.658 11 GGA/GAG/AGG GENOMAD.141796.VV 3.591e-106 366 0 0 1 11124 Peduoviridae NA NA COG3941 Phage tail tape-measure protein, controls tail length
+NC_017033.1|provirus_1052334_1094910_993 1092844 1093686 843 1 0.637 11 None GENOMAD.124222.VP 1.683e-115 371 0 0 0 2561 Caudoviricetes NA NA K06906;COG3499 Phage protein U
+NC_017033.1|provirus_1052334_1094910_994 1093661 1093867 207 1 0.614 11 GGA/GAG/AGG GENOMAD.159179.VP 5.502e-12 61 0 0 1 2561 Caudoviricetes NA NA COG5004;K06370 P2-like prophage tail protein X
+NC_017033.1|provirus_1052334_1094910_995 1093858 1094910 1053 1 0.633 11 GGAG/GAGG GENOMAD.158351.VP 2.572e-37 147 0 0 1 2561 Caudoviricetes NA NA PF05954;K06905;COG3500;TIGR03361 Phage protein D
+NC_017033.1|provirus_1557694_1600481_1419 1557694 1557981 288 -1 0.594 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1420 1557981 1558169 189 -1 0.598 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1421 1558169 1558477 309 -1 0.511 11 GGAG/GAGG GENOMAD.060822.VV 8.986e-06 45 0 0 0 10823 Zobellviridae NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1422 1558474 1558842 369 -1 0.547 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1423 1558835 1559113 279 -1 0.692 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1424 1559113 1559442 330 -1 0.542 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1425 1559439 1561094 1656 -1 0.650 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1426 1561091 1561423 333 -1 0.604 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1427 1561433 1561660 228 -1 0.623 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1428 1561663 1563417 1755 -1 0.613 11 GGAGG GENOMAD.151126.VP 2.362e-52 199 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1429 1563414 1564154 741 -1 0.592 11 AGGAG GENOMAD.119436.VP 4.501e-07 53 0 0 0 2561 Caudoviricetes NA NA PF03837;TIGR00616;K07455;COG3723 recombinase, phage RecT family
+NC_017033.1|provirus_1557694_1600481_1430 1564207 1564491 285 -1 0.614 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1431 1564488 1564682 195 -1 0.579 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1432 1564679 1564894 216 -1 0.560 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1433 1564891 1565016 126 -1 0.619 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1434 1565064 1565897 834 -1 0.625 11 GGAG/GAGG GENOMAD.115107.VV 1.94e-45 168 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1435 1566063 1566449 387 -1 0.618 11 AGGAG GENOMAD.094188.VV 1.81e-25 103 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1436 1566860 1567096 237 1 0.624 11 AGGAGG GENOMAD.189851.VV 5.539e-09 53 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1437 1567124 1567516 393 -1 0.555 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1438 1567963 1568715 753 -1 0.463 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1439 1568715 1569317 603 -1 0.580 11 GGA/GAG/AGG GENOMAD.205774.CP 1.338e-70 237 0 0 0 1 NA NA NA PF08000;PF20612 Bacterial PH domain; SHOCT domain
+NC_017033.1|provirus_1557694_1600481_1440 1569343 1569669 327 -1 0.557 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1441 1569750 1569992 243 1 0.560 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1442 1570044 1570337 294 -1 0.565 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1443 1570557 1570766 210 1 0.581 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1444 1570759 1571061 303 1 0.644 11 GGAG/GAGG GENOMAD.045996.VV 6.818e-47 163 0 0 0 2561 Caudoviricetes NA NA PF09012;TIGR02702;COG1777 FeoC like transcriptional regulator
+NC_017033.1|provirus_1557694_1600481_1445 1571058 1571933 876 1 0.604 11 None GENOMAD.208559.VP 0.0002331 45 0 0 0 2561 Caudoviricetes NA NA PF13730;COG5529;TIGR01610 Pyocin large subunit
+NC_017033.1|provirus_1557694_1600481_1446 1571920 1572411 492 1 0.673 11 GGA/GAG/AGG GENOMAD.166457.VP 3.827e-75 248 0 0 1 2561 Caudoviricetes NA NA PF06992 Replication protein P
+NC_017033.1|provirus_1557694_1600481_1447 1572408 1572614 207 1 0.628 11 GGAG/GAGG GENOMAD.063929.VV 1.765e-08 51 0 0 0 2561 Caudoviricetes NA NA PF05810;COG4068 Predicted nucleic acid-binding protein, contains Zn-ribbon domain
+NC_017033.1|provirus_1557694_1600481_1448 1572611 1572808 198 1 0.535 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1449 1572805 1572999 195 1 0.651 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1450 1572996 1573445 450 1 0.631 11 GGAG/GAGG GENOMAD.061349.VV 2.093e-91 294 0 0 0 2561 Caudoviricetes NA NA PF05772 NinB protein
+NC_017033.1|provirus_1557694_1600481_1451 1573594 1573941 348 1 0.609 11 GGAG/GAGG GENOMAD.036842.VV 1.144e-24 100 0 0 0 2561 Caudoviricetes NA NA PF07102 Putative nuclease YbcO
+NC_017033.1|provirus_1557694_1600481_1452 1573938 1574111 174 1 0.672 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1453 1574111 1574446 336 1 0.631 11 GGAGG GENOMAD.040593.VV 7.087e-28 109 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1454 1574449 1575066 618 1 0.638 11 GGA/GAG/AGG GENOMAD.069895.VV 4.385e-31 123 0 0 0 2561 Caudoviricetes NA NA PF17302;TIGR02642 Tryptophan RNA-binding attenuator protein inhibitory protein
+NC_017033.1|provirus_1557694_1600481_1455 1575159 1575422 264 -1 0.462 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1456 1575504 1576007 504 1 0.631 11 None GENOMAD.044304.VV 3.936e-34 130 0 0 0 5262 Schitoviridae NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1457 1575998 1576297 300 1 0.623 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1458 1576294 1576560 267 1 0.596 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1459 1576756 1577097 342 1 0.591 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1460 1577111 1577446 336 1 0.652 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1461 1577458 1577721 264 1 0.633 11 AGxAGG/AGGxGG GENOMAD.077615.VV 2.28e-06 46 0 0 0 7278 Salasmaviridae NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1462 1577734 1578405 672 1 0.613 11 GGAG/GAGG GENOMAD.076022.VV 5.673e-65 222 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1463 1578350 1579906 1557 1 0.615 11 AGxAGG/AGGxGG GENOMAD.013124.VV 7.041e-150 483 0 0 1 377 Drexlerviridae NA NA PF13262;COG5410 NA
+NC_017033.1|provirus_1557694_1600481_1464 1579903 1581441 1539 1 0.640 11 AGGA/GGAG/GAGG GENOMAD.003432.VV 5.04e-57 211 0 0 1 2561 Caudoviricetes NA NA PF06381;K09961;TIGR01555;COG3567 phage-related protein, HI1409 family
+NC_017033.1|provirus_1557694_1600481_1465 1581398 1582051 654 1 0.636 11 3Base/5BMM GENOMAD.083949.VV 7.556e-40 149 0 0 1 2561 Caudoviricetes NA NA PF04233;COG2369;TIGR01641 Uncharacterized conserved protein, contains phage Mu gpF-like domain
+NC_017033.1|provirus_1557694_1600481_1466 1582189 1582368 180 1 0.517 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1467 1582429 1583739 1311 1 0.652 11 None GENOMAD.099067.VP 2.252e-113 373 0 0 0 2561 Caudoviricetes NA NA PF09979;K09960;COG3566 NA
+NC_017033.1|provirus_1557694_1600481_1468 1583749 1584243 495 1 0.657 11 AGGAG GENOMAD.033203.VV 1.156e-46 166 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1469 1584321 1585328 1008 1 0.626 11 GGAG/GAGG GENOMAD.085797.VV 1.048e-165 519 0 0 0 2561 Caudoviricetes NA NA PF09950;COG4834 Encapsulating protein for peroxidase
+NC_017033.1|provirus_1557694_1600481_1470 1585339 1585563 225 1 0.649 11 AGGAG GENOMAD.170487.VV 4.114e-10 56 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1471 1585541 1585936 396 1 0.634 11 GGAG/GAGG GENOMAD.005453.VV 5.437e-56 191 0 0 1 2561 Caudoviricetes NA NA PF11863;COG4386 Mu-like prophage tail sheath protein gpL
+NC_017033.1|provirus_1557694_1600481_1472 1585933 1586475 543 1 0.641 11 GGxGG GENOMAD.008778.VV 5.955e-53 185 0 0 1 2561 Caudoviricetes NA NA PF05069;COG5005;TIGR01635 NA
+NC_017033.1|provirus_1557694_1600481_1473 1586475 1586858 384 1 0.630 11 GGAGG GENOMAD.040078.VV 2.69e-45 160 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1474 1586851 1587405 555 1 0.632 11 GGAGG GENOMAD.023692.VV 7.854e-43 156 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1475 1587409 1588893 1485 1 0.640 11 GGAG/GAGG GENOMAD.005453.VV 4.878e-99 334 0 0 1 2561 Caudoviricetes NA NA PF11863;COG4386 Mu-like prophage tail sheath protein gpL
+NC_017033.1|provirus_1557694_1600481_1476 1588902 1589342 441 1 0.603 11 GGAG/GAGG GENOMAD.017010.VV 3.75e-67 224 0 0 0 2561 Caudoviricetes NA NA PF11681 Bacteriophage KPP10, Structural protein ORF10
+NC_017033.1|provirus_1557694_1600481_1477 1589353 1589742 390 1 0.633 11 GGAG/GAGG GENOMAD.055746.VV 7.707e-27 107 0 0 1 2561 Caudoviricetes NA NA PF10876 Phage tail assembly chaperone protein, TAC
+NC_017033.1|provirus_1557694_1600481_1478 1589936 1592188 2253 1 0.603 11 GGA/GAG/AGG GENOMAD.015777.VV 2.615e-80 288 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1479 1592185 1592805 621 1 0.589 11 GGA/GAG/AGG GENOMAD.017318.VV 4.715e-50 178 0 0 0 2561 Caudoviricetes NA NA COG3499 NA
+NC_017033.1|provirus_1557694_1600481_1480 1592809 1593123 315 1 0.571 11 GGAGG GENOMAD.105312.VV 3.054e-41 147 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1481 1593120 1594067 948 1 0.593 11 None GENOMAD.123309.VP 2.371e-34 137 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1482 1594067 1594726 660 1 0.621 11 None GENOMAD.006053.VV 1.581e-30 122 0 0 1 2561 Caudoviricetes NA NA PF18352;COG4540;TIGR01644 Phage protein Gp138 N-terminal domain
+NC_017033.1|provirus_1557694_1600481_1483 1594729 1595076 348 1 0.575 11 GGA/GAG/AGG GENOMAD.009002.VV 2.079e-42 151 0 0 1 2561 Caudoviricetes NA NA PF10934;COG3628 Phage baseplate assembly protein W
+NC_017033.1|provirus_1557694_1600481_1484 1595073 1596251 1179 1 0.611 11 GGAGG GENOMAD.005285.VV 1.352e-45 173 0 0 0 2561 Caudoviricetes NA NA PF03434;COG3299 Uncharacterized phage protein gp47/JayE
+NC_017033.1|provirus_1557694_1600481_1485 1596248 1596832 585 1 0.581 11 GGxGG GENOMAD.008482.VV 3.01e-67 227 0 0 1 2561 Caudoviricetes NA NA PF11041;TIGR02242 Bacteriophage Mu-like, Gp48
+NC_017033.1|provirus_1557694_1600481_1486 1596899 1598707 1809 1 0.603 11 GGAG/GAGG GENOMAD.051520.VV 3.018e-18 92 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1487 1598708 1599193 486 1 0.652 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1488 1599313 1599489 177 1 0.548 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_1557694_1600481_1489 1599510 1600481 972 -1 0.571 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1926 2089294 2090280 987 -1 0.612 11 GGA/GAG/AGG GENOMAD.147153.VV 7.117e-20 94 0 0 0 2561 Caudoviricetes NA NA PF07120;COG3756 Uncharacterized conserved protein YdaU, DUF1376 family
+NC_017033.1|provirus_2089294_2107522_1927 2090277 2090723 447 -1 0.649 11 GGA/GAG/AGG GENOMAD.220574.VP 9.96e-24 99 0 0 1 2561 Caudoviricetes NA NA PF06892 Phage regulatory protein CII (CP76)
+NC_017033.1|provirus_2089294_2107522_1928 2090810 2091313 504 1 0.597 11 None GENOMAD.226021.VP 3.576e-86 280 0 0 0 2561 Caudoviricetes NA NA PF14205 NA
+NC_017033.1|provirus_2089294_2107522_1929 2091539 2092288 750 1 0.575 11 GGA/GAG/AGG GENOMAD.179157.VV 8.047e-05 46 0 0 0 1 NA NA NA PF18090;TIGR00673;K22300;COG5606 cyanase
+NC_017033.1|provirus_2089294_2107522_1930 2092428 2093327 900 1 0.390 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1931 2093272 2093736 465 1 0.443 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1932 2094023 2094286 264 1 0.549 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1933 2094513 2095400 888 1 0.418 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1934 2096207 2096452 246 1 0.610 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1935 2096599 2096730 132 1 0.568 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1936 2096727 2097047 321 1 0.626 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1937 2097044 2097382 339 1 0.540 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1938 2097379 2097660 282 1 0.621 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1939 2097713 2098534 822 1 0.584 11 AGGAG GENOMAD.192631.VV 3.816e-31 126 0 0 0 2561 Caudoviricetes NA NA PF03837;TIGR01913 RecT family
+NC_017033.1|provirus_2089294_2107522_1940 2098531 2100282 1752 1 0.619 11 GGAGG GENOMAD.151126.VP 1.22e-60 224 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1941 2100285 2100512 228 1 0.623 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1942 2100522 2100854 333 1 0.568 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1943 2100851 2101072 222 1 0.622 11 GGAG/GAGG GENOMAD.224342.VP 6.345e-06 44 0 0 0 2561 Caudoviricetes NA NA PF09035;COG3311 Predicted DNA-binding transcriptional regulator AlpA
+NC_017033.1|provirus_2089294_2107522_1944 2101069 2101995 927 -1 0.592 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1945 2102598 2104394 1797 -1 0.681 11 GGAG/GAGG GENOMAD.005687.VV 3.84e-08 59 0 0 0 2561 Caudoviricetes NA NA COG5519;K02334 NA
+NC_017033.1|provirus_2089294_2107522_1946 2104375 2105307 933 -1 0.681 11 GGAGG GENOMAD.166800.VP 1.166e-23 105 0 0 0 2561 Caudoviricetes NA NA COG4643 Uncharacterized domain associated with phage/plasmid primase
+NC_017033.1|provirus_2089294_2107522_1947 2105304 2105672 369 -1 0.629 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1948 2105669 2106016 348 -1 0.655 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1949 2106013 2106468 456 -1 0.623 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_017033.1|provirus_2089294_2107522_1950 2106551 2107522 972 -1 0.631 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_017095.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_017095.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_018014.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_018014.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_018068.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_018068.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,86 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_018068.1|provirus_1361108_1399802_1216 1361108 1361524 417 -1 0.372 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1217 1361850 1362134 285 1 0.456 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1218 1362138 1362350 213 1 0.465 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1219 1362514 1363338 825 1 0.421 11 AGGAG(G)/GGAGG GENOMAD.133073.VP 4.745e-26 111 0 0 0 2561 Caudoviricetes NA NA PF03374;COG3645 Phage antirepressor protein YoqD, KilAC domain
+NC_018068.1|provirus_1361108_1399802_1220 1363335 1364579 1245 1 0.426 11 3Base/5BMM GENOMAD.014802.VV 5.219e-14 77 0 0 0 2561 Caudoviricetes NA NA PF00176;K20093;COG1061;TIGR04095 Superfamily II DNA or RNA helicase
+NC_018068.1|provirus_1361108_1399802_1221 1364572 1364856 285 1 0.456 11 AGGA GENOMAD.062524.VV 5.888e-30 114 0 0 0 2561 Caudoviricetes NA NA PF03838;COG3331;TIGR00648;K03552 Penicillin-binding protein-related factor A, putative recombinase
+NC_018068.1|provirus_1361108_1399802_1222 1364853 1366520 1668 1 0.430 11 3Base/5BMM GENOMAD.016341.VV 2.768e-209 657 0 0 1 2561 Caudoviricetes NA NA PF13479;PF12684;TIGR01618;K07465;COG1468 phage nucleotide-binding protein
+NC_018068.1|provirus_1361108_1399802_1223 1366538 1366987 450 1 0.389 11 AGGAG/GGAGG GENOMAD.031678.VV 6.602e-29 114 0 0 0 2561 Caudoviricetes NA NA PF05037 NA
+NC_018068.1|provirus_1361108_1399802_1224 1367256 1368950 1695 1 0.433 11 GGAG/GAGG GENOMAD.102034.VP 2.969e-108 364 0 0 0 2561 Caudoviricetes NA NA TIGR01636 NA
+NC_018068.1|provirus_1361108_1399802_1225 1369137 1371011 1875 1 0.415 11 GGAGG GENOMAD.024099.VV 5.474e-55 208 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1226 1371524 1371904 381 1 0.428 11 GGAGG GENOMAD.192072.VP 2.313e-13 68 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1227 1372021 1372473 453 1 0.406 11 AGGAGG GENOMAD.076519.VV 2.465e-40 147 0 0 0 2561 Caudoviricetes NA NA PF05263;TIGR01636;COG2739;K01994 phage transcriptional activator, RinA family
+NC_018068.1|provirus_1361108_1399802_1228 1372631 1372819 189 1 0.402 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1229 1372954 1373160 207 1 0.469 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1230 1373168 1373524 357 1 0.473 11 AGxAGG/AGGxGG GENOMAD.045242.VV 1.014e-10 60 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1231 1373710 1374237 528 1 0.460 11 AGxAGG/AGGxGG GENOMAD.098194.VV 3.009e-58 200 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_018068.1|provirus_1361108_1399802_1232 1374300 1375553 1254 1 0.433 11 GGAG/GAGG GENOMAD.038338.VV 1.076e-29 126 0 0 0 2561 Caudoviricetes NA NA COG3392 NA
+NC_018068.1|provirus_1361108_1399802_1233 1375834 1376358 525 1 0.375 11 None GENOMAD.133508.VP 1.117e-12 68 0 0 0 2561 Caudoviricetes NA NA PF13392 HNH endonuclease
+NC_018068.1|provirus_1361108_1399802_1234 1376401 1376586 186 1 0.489 11 GGA/GAG/AGG GENOMAD.209016.VC 3.22e-07 47 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1235 1376590 1377405 816 1 0.433 11 AGxAGG/AGGxGG GENOMAD.105515.VV 4.177e-12 69 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1236 1377405 1377644 240 1 0.442 11 AGGAGG GENOMAD.225559.VP 1.638e-13 66 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1237 1377747 1377998 252 -1 0.413 11 AGGAGG GENOMAD.197050.CP 0.0001087 41 0 0 0 1 NA NA NA PF19124 NA
+NC_018068.1|provirus_1361108_1399802_1238 1378174 1378383 210 1 0.348 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1239 1378503 1380050 1548 1 0.468 11 GGA/GAG/AGG GENOMAD.190509.VP 4.55e-66 238 0 0 1 2561 Caudoviricetes NA NA PF03354;COG4626 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_018068.1|provirus_1361108_1399802_1240 1380176 1381339 1164 1 0.456 11 None GENOMAD.179073.VP 5.583e-45 171 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1241 1381339 1382406 1068 1 0.465 11 GGA/GAG/AGG GENOMAD.158277.VP 6.708e-34 137 0 0 0 2561 Caudoviricetes NA NA PF00574;PF19602;K01358;TIGR00493;COG3904 ATP-dependent Clp endopeptidase, proteolytic subunit ClpP
+NC_018068.1|provirus_1361108_1399802_1242 1382396 1383670 1275 1 0.469 11 AGGAG GENOMAD.092606.VV 1.506e-40 159 0 0 1 2561 Caudoviricetes NA NA PF05065;COG4653;TIGR01554 Predicted phage phi-C31 gp36 major capsid-like protein
+NC_018068.1|provirus_1361108_1399802_1243 1383704 1384180 477 1 0.486 11 AGGAGG GENOMAD.077304.VV 2.485e-35 133 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1244 1384255 1384848 594 1 0.468 11 AGGA GENOMAD.067701.VV 2.482e-44 161 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR02215 phage conserved hypothetical protein, phiE125 gp8 family
+NC_018068.1|provirus_1361108_1399802_1245 1384864 1385193 330 1 0.412 11 GGxGG GENOMAD.027939.VV 2.94e-20 87 0 0 1 2561 Caudoviricetes NA NA PF05521;COG5614;TIGR01563 Bacteriophage head-tail adaptor
+NC_018068.1|provirus_1361108_1399802_1246 1385186 1385599 414 1 0.435 11 GGAG/GAGG GENOMAD.018908.VV 5.448e-17 79 0 0 1 2561 Caudoviricetes NA NA PF04883;TIGR01725;COG5005 Bacteriophage HK97-gp10, putative tail-component
+NC_018068.1|provirus_1361108_1399802_1247 1385599 1386033 435 1 0.414 11 GGA/GAG/AGG GENOMAD.029331.VV 3.675e-58 198 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1248 1386037 1387104 1068 1 0.463 11 AGGAGG GENOMAD.014203.VV 9.347e-74 254 0 0 1 2561 Caudoviricetes NA NA PF04984;PF17482;COG4386 Mu-like prophage tail sheath protein gpL
+NC_018068.1|provirus_1361108_1399802_1249 1387116 1387544 429 1 0.471 11 GGAGG GENOMAD.008035.VV 8.025e-49 171 0 0 1 2561 Caudoviricetes NA NA PF09393 Phage tail tube protein
+NC_018068.1|provirus_1361108_1399802_1250 1387599 1388000 402 1 0.443 11 GGAGG GENOMAD.020710.VV 1.165e-40 147 0 0 1 2561 Caudoviricetes NA NA PF08890 Phage XkdN-like tail assembly chaperone protein, TAC
+NC_018068.1|provirus_1361108_1399802_1251 1388204 1390375 2172 1 0.472 11 GGA/GAG/AGG GENOMAD.117212.VP 4.285e-62 232 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1252 1390388 1390792 405 1 0.432 11 AGxAGG/AGGxGG GENOMAD.025221.VV 2.91e-72 238 0 0 0 2561 Caudoviricetes NA NA PF06995;COG1652 Nucleoid-associated protein YgaU, contains BON and LysM domains
+NC_018068.1|provirus_1361108_1399802_1253 1390789 1391781 993 1 0.438 11 GGA/GAG/AGG GENOMAD.020668.VV 8.021e-51 186 0 0 1 2561 Caudoviricetes NA NA PF05954;COG4379;K06905;TIGR03361 Mu-like prophage tail protein gpP
+NC_018068.1|provirus_1361108_1399802_1254 1391791 1392159 369 1 0.439 11 GGAG/GAGG GENOMAD.046601.VV 4.306e-46 162 0 0 0 2561 Caudoviricetes NA NA PF10844 NA
+NC_018068.1|provirus_1361108_1399802_1255 1392156 1392587 432 1 0.431 11 GGA/GAG/AGG GENOMAD.015505.VV 4.579e-47 166 0 0 0 2561 Caudoviricetes NA NA PF10934;COG4381 Mu-like prophage protein gp46
+NC_018068.1|provirus_1361108_1399802_1256 1392580 1393653 1074 1 0.465 11 GGAG/GAGG GENOMAD.110264.VV 3.326e-30 126 0 0 1 2561 Caudoviricetes NA NA PF04865;COG3948 Phage-related baseplate assembly protein
+NC_018068.1|provirus_1361108_1399802_1257 1393646 1394167 522 1 0.423 11 GGxGG GENOMAD.018612.VV 1.342e-21 94 0 0 1 2561 Caudoviricetes NA NA PF10076;COG3778;TIGR02242 Uncharacterized protein YmfQ in lambdoid prophage, DUF2313 family
+NC_018068.1|provirus_1361108_1399802_1258 1394168 1394734 567 1 0.497 11 GGAGG GENOMAD.069954.VV 8.47e-44 159 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1259 1394734 1395069 336 1 0.476 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1260 1395078 1396721 1644 1 0.485 11 GGA/GAG/AGG GENOMAD.140563.VP 5.937e-15 81 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1261 1396735 1397073 339 1 0.416 11 AGxAGG/AGGxGG GENOMAD.213587.VP 1.005e-16 77 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1262 1397074 1397211 138 1 0.348 11 AGGAGG GENOMAD.042441.VV 4.212e-05 40 0 0 0 2561 Caudoviricetes NA NA PF09693;TIGR01669 phage uncharacterized protein, XkdX family
+NC_018068.1|provirus_1361108_1399802_1263 1397268 1397507 240 1 0.475 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1264 1397695 1398015 321 1 0.442 11 AGGAGG GENOMAD.130222.VV 2.136e-14 70 0 0 0 2561 Caudoviricetes NA NA COG3105 NA
+NC_018068.1|provirus_1361108_1399802_1265 1397993 1398478 486 1 0.440 11 GGA/GAG/AGG GENOMAD.151608.VV 2.569e-36 136 0 0 0 2561 Caudoviricetes NA NA PF19988 NA
+NC_018068.1|provirus_1361108_1399802_1266 1398599 1399372 774 1 0.464 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_1361108_1399802_1267 1399389 1399802 414 1 0.415 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1928 2072558 2072734 177 1 0.429 11 AGGAGG GENOMAD.222548.VP 1.604e-05 42 0 0 0 1 NA NA NA PF06806;COG3311;TIGR01764 Predicted DNA-binding transcriptional regulator AlpA
+NC_018068.1|provirus_2072558_2098541_1929 2072878 2073066 189 1 0.386 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1930 2073461 2073664 204 1 0.446 11 4Base/6BMM NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1931 2073775 2073921 147 1 0.388 11 AGGAG(G)/GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1932 2073908 2074774 867 1 0.468 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1933 2074771 2077260 2490 1 0.472 11 AGGAG/GGAGG GENOMAD.021366.VV 4.949e-07 56 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1934 2077248 2077511 264 1 0.383 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1935 2078510 2078722 213 1 0.418 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1936 2078760 2078948 189 1 0.381 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1937 2078967 2079275 309 1 0.463 11 None GENOMAD.037442.VV 3.636e-15 72 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1938 2081715 2081849 135 1 0.222 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1939 2081855 2081998 144 1 0.250 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1940 2082018 2082221 204 1 0.353 11 AGGAG/GGAGG GENOMAD.220824.VP 3.347e-09 53 0 0 0 2561 Caudoviricetes NA NA PF18903 NA
+NC_018068.1|provirus_2072558_2098541_1941 2082224 2082352 129 1 0.271 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1942 2082428 2082634 207 1 0.329 11 GGAG/GAGG GENOMAD.207723.VP 1.947e-14 68 0 0 1 2561 Caudoviricetes NA NA PF10960 BhlA holin family
+NC_018068.1|provirus_2072558_2098541_1943 2082649 2083065 417 1 0.336 11 AGGAG GENOMAD.126365.VV 7.377e-48 168 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1944 2083107 2083994 888 1 0.370 11 AGxAGG/AGGxGG GENOMAD.136497.VV 4.06e-55 197 0 0 0 2561 Caudoviricetes NA NA PF17236 Phage capsid-like protein
+NC_018068.1|provirus_2072558_2098541_1945 2084087 2084278 192 1 0.344 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1946 2084442 2085254 813 1 0.332 11 None GENOMAD.225339.VP 2.875e-113 364 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1947 2085426 2086922 1497 1 0.279 11 AGGA GENOMAD.225126.VP 2.658e-245 758 0 0 0 2561 Caudoviricetes NA NA PF06862;TIGR01587;COG4098;K17677 CRISPR-associated helicase Cas3
+NC_018068.1|provirus_2072558_2098541_1948 2087352 2087744 393 1 0.308 11 AGGAG GENOMAD.142024.VV 3.756e-43 154 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1949 2087741 2089312 1572 1 0.344 11 3Base/5BMM GENOMAD.180947.VP 4.422e-38 154 0 0 1 2561 Caudoviricetes NA NA PF04466;COG5323;TIGR01547;K21523 Large terminase phage packaging protein
+NC_018068.1|provirus_2072558_2098541_1950 2089329 2090789 1461 1 0.332 11 GGA/GAG/AGG GENOMAD.003260.VV 2.398e-204 639 0 0 1 2561 Caudoviricetes NA NA PF05133;TIGR01538;COG3567 phage portal protein, SPP1 family
+NC_018068.1|provirus_2072558_2098541_1951 2091361 2091654 294 -1 0.344 11 AGGAGG GENOMAD.213863.VC 0.00091 39 0 0 0 1 NA NA NA PF05810;COG4068;TIGR01206;K21463 Predicted nucleic acid-binding protein, contains Zn-ribbon domain
+NC_018068.1|provirus_2072558_2098541_1952 2091691 2092041 351 -1 0.325 11 AGGAG GENOMAD.223401.VP 5.93e-32 121 0 0 0 2561 Caudoviricetes NA NA PF09851 NA
+NC_018068.1|provirus_2072558_2098541_1953 2092685 2093926 1242 1 0.465 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1954 2094078 2094944 867 -1 0.330 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1955 2095132 2095350 219 1 0.311 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1956 2095375 2095635 261 1 0.257 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1957 2095704 2096051 348 1 0.307 11 AGGAGG GENOMAD.220167.VP 1.032e-41 149 0 0 0 2561 Caudoviricetes NA NA PF20449 NA
+NC_018068.1|provirus_2072558_2098541_1958 2096068 2097186 1119 1 0.344 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1959 2097227 2097439 213 -1 0.315 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018068.1|provirus_2072558_2098541_1960 2097555 2098541 987 -1 0.330 11 GGA/GAG/AGG GENOMAD.214049.VP 0.0005959 44 0 0 0 2561 Caudoviricetes NA NA PF00589;TIGR02224;COG4973;K03733 tyrosine recombinase XerC
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_018515.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_018515.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,75 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_018515.1|provirus_3418112_3436097_3127 3418112 3418687 576 -1 0.474 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3128 3418979 3419323 345 -1 0.412 11 GGAGG GENOMAD.178485.VV 8.068e-52 178 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3129 3419421 3420176 756 -1 0.463 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3130 3420203 3420451 249 -1 0.434 11 AGGA GENOMAD.042597.VV 2.985e-31 117 0 0 0 2561 Caudoviricetes NA NA PF10779 Haemolysin XhlA
+NC_018515.1|provirus_3418112_3436097_3131 3420532 3420702 171 -1 0.316 11 AGGAGG GENOMAD.019319.VV 0.0001663 39 0 0 0 2561 Caudoviricetes NA NA PF09693;TIGR01669 phage uncharacterized protein, XkdX family
+NC_018515.1|provirus_3418112_3436097_3132 3420716 3421015 300 -1 0.360 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3133 3421030 3422109 1080 -1 0.488 11 AGGAG GENOMAD.010477.VV 1.931e-16 84 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3134 3422122 3422733 612 -1 0.431 11 AGxAGG/AGGxGG GENOMAD.018612.VV 2.241e-57 199 0 0 1 2561 Caudoviricetes NA NA PF10076;COG3778;TIGR02242 Uncharacterized protein YmfQ in lambdoid prophage, DUF2313 family
+NC_018515.1|provirus_3418112_3436097_3135 3422739 3423455 717 -1 0.480 11 GGAGG GENOMAD.072355.VV 1.988e-75 253 0 0 0 5262 Schitoviridae NA NA PF18454 Major tropism determinant N-terminal domain
+NC_018515.1|provirus_3418112_3436097_3136 3423468 3424490 1023 -1 0.475 11 AGGAGG GENOMAD.072355.VV 2.41e-07 55 0 0 0 5262 Schitoviridae NA NA PF18454 Major tropism determinant N-terminal domain
+NC_018515.1|provirus_3418112_3436097_3137 3424494 3424907 414 -1 0.435 11 GGxGG GENOMAD.105081.VV 2.709e-66 221 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3138 3424912 3425949 1038 -1 0.480 11 AGGAGG GENOMAD.004833.VV 1.671e-45 171 0 0 1 2561 Caudoviricetes NA NA PF04865;COG3299 Baseplate J-like protein
+NC_018515.1|provirus_3418112_3436097_3139 3425949 3426350 402 -1 0.440 11 AGxAGG/AGGxGG GENOMAD.016318.VV 3.473e-37 137 0 0 0 2561 Caudoviricetes NA NA PF10934;COG4381;TIGR03357 Mu-like prophage protein gp46
+NC_018515.1|provirus_3418112_3436097_3140 3426347 3426703 357 -1 0.457 11 GGA/GAG/AGG GENOMAD.020599.VV 1.753e-21 91 0 0 0 2561 Caudoviricetes NA NA PF10844 NA
+NC_018515.1|provirus_3418112_3436097_3141 3426703 3427689 987 -1 0.443 11 AGGAGG GENOMAD.018966.VV 5.985e-106 346 0 0 1 2561 Caudoviricetes NA NA PF14594;COG4379;TIGR03361;K06905 Mu-like prophage tail protein gpP
+NC_018515.1|provirus_3418112_3436097_3142 3427706 3428368 663 -1 0.448 11 AGxAGG/AGGxGG GENOMAD.015578.VV 2.506e-23 101 0 0 0 2561 Caudoviricetes NA NA PF06995;COG1652 Nucleoid-associated protein YgaU, contains BON and LysM domains
+NC_018515.1|provirus_3418112_3436097_3143 3428368 3430056 1689 -1 0.436 11 AGGAGG GENOMAD.032671.VV 1.142e-122 406 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3144 3430684 3431106 423 -1 0.437 11 GGAGG GENOMAD.001212.VV 8.9e-47 165 0 0 1 2561 Caudoviricetes NA NA PF08890 Phage XkdN-like tail assembly chaperone protein, TAC
+NC_018515.1|provirus_3418112_3436097_3145 3431161 3431628 468 -1 0.459 11 GGA/GAG/AGG GENOMAD.011307.VV 3.196e-73 242 0 0 1 2561 Caudoviricetes NA NA PF09393 Phage tail tube protein
+NC_018515.1|provirus_3418112_3436097_3146 3431632 3432948 1317 -1 0.455 11 GGAGG GENOMAD.013578.VV 4.449e-94 317 0 0 1 2561 Caudoviricetes NA NA PF17481;PF04984;PF17482;COG4386 Mu-like prophage tail sheath protein gpL
+NC_018515.1|provirus_3418112_3436097_3147 3432950 3433132 183 -1 0.388 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3148 3433125 3433544 420 -1 0.448 11 AGGAG GENOMAD.023771.VV 1.411e-24 101 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3149 3434218 3434688 471 -1 0.410 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3150 3435000 3435596 597 1 0.405 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_3418112_3436097_3151 3435618 3436097 480 1 0.352 11 AGGAG GENOMAD.123021.VV 8.264e-31 120 0 0 0 2561 Caudoviricetes NA NA PF06114;COG2856 IrrE N-terminal-like domain
+NC_018515.1|provirus_4659544_4694673_4266 4659544 4659789 246 -1 0.398 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4267 4659786 4660568 783 -1 0.415 11 AGGAGG GENOMAD.053051.VV 3.635e-13 72 0 0 0 2561 Caudoviricetes NA NA PF10772;PF02086;TIGR00571;COG0338 Bacteriophage HP1, Orf24; D12 class N6 adenine-specific DNA methyltransferase
+NC_018515.1|provirus_4659544_4694673_4268 4660808 4661533 726 1 0.310 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4269 4661559 4662848 1290 -1 0.354 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4270 4662851 4663681 831 -1 0.357 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4271 4663834 4664334 501 -1 0.435 11 AGGAGG GENOMAD.220913.VP 9.323e-12 65 0 0 1 2561 Caudoviricetes NA NA PF09682;TIGR01673 Bacteriophage holin of superfamily 6 (Holin_LLH)
+NC_018515.1|provirus_4659544_4694673_4272 4664379 4665224 846 -1 0.488 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4273 4665235 4665600 366 -1 0.413 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4274 4665683 4665937 255 -1 0.412 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4275 4666125 4666301 177 -1 0.429 11 GGAGG GENOMAD.202651.VV 1.242e-28 108 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4276 4666298 4666576 279 -1 0.423 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4277 4666573 4667667 1095 -1 0.525 11 GGAG/GAGG GENOMAD.135924.VV 5.173e-50 185 0 0 0 4312 Hafunaviridae NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4278 4667682 4669058 1377 -1 0.439 11 GGAG/GAGG GENOMAD.007293.VV 1.173e-76 267 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4279 4669065 4670156 1092 -1 0.412 11 GGxGG GENOMAD.006687.VV 4.266e-78 267 0 0 1 2561 Caudoviricetes NA NA PF14594;COG4926;TIGR01665 Siphovirus ReqiPepy6 Gp37-like protein
+NC_018515.1|provirus_4659544_4694673_4280 4670159 4671022 864 -1 0.403 11 AGxAGG/AGGxGG GENOMAD.009232.VV 5.496e-87 289 0 0 0 2561 Caudoviricetes NA NA PF16774;COG4722;TIGR01633 Phage-related protein
+NC_018515.1|provirus_4659544_4694673_4281 4671033 4673771 2739 -1 0.449 11 None GENOMAD.110013.VP 2.08e-93 332 0 0 1 2561 Caudoviricetes NA NA COG5280 Phage-related minor tail protein
+NC_018515.1|provirus_4659544_4694673_4282 4673768 4673995 228 -1 0.430 11 None GENOMAD.095592.VV 3.087e-06 45 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4283 4674073 4674399 327 -1 0.404 11 GGAGG GENOMAD.044337.VV 2.719e-52 179 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4284 4674442 4675005 564 -1 0.502 11 GGA/GAG/AGG GENOMAD.009652.VV 1.45e-80 265 0 0 1 2561 Caudoviricetes NA NA TIGR01537 NA
+NC_018515.1|provirus_4659544_4694673_4285 4675011 4675370 360 -1 0.444 11 AGGAGG GENOMAD.058243.VV 1.023e-51 178 0 0 1 2561 Caudoviricetes NA NA PF11367 NA
+NC_018515.1|provirus_4659544_4694673_4286 4675367 4675792 426 -1 0.465 11 GGxGG GENOMAD.072075.VV 6.875e-16 76 0 0 1 2561 Caudoviricetes NA NA PF11114;TIGR01725;COG5005 phage protein, HK97 gp10 family
+NC_018515.1|provirus_4659544_4694673_4287 4675793 4676104 312 -1 0.458 11 GGA/GAG/AGG GENOMAD.008635.VV 1.997e-29 113 0 0 1 2561 Caudoviricetes NA NA PF05521;TIGR01563;COG5614 phage head-tail adaptor, putative, SPP1 family
+NC_018515.1|provirus_4659544_4694673_4288 4676101 4676370 270 -1 0.393 11 GGAG/GAGG GENOMAD.053459.VV 1.209e-43 153 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4289 4676371 4676568 198 -1 0.455 11 GGxGG GENOMAD.188189.VV 3.555e-29 110 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4290 4676592 4677815 1224 -1 0.483 11 AGGAGG GENOMAD.088359.VV 4.366e-19 93 0 0 1 2561 Caudoviricetes NA NA PF05065;PF18316;PF17078;TIGR01554;COG4653 phage major capsid protein, HK97 family
+NC_018515.1|provirus_4659544_4694673_4291 4677854 4678474 621 -1 0.470 11 AGGAGG GENOMAD.116539.VV 2.017e-19 89 0 0 1 2561 Caudoviricetes NA NA PF04586;PF05065;K06904;COG3740;TIGR01543 Phage head maturation protease
+NC_018515.1|provirus_4659544_4694673_4292 4678428 4679657 1230 -1 0.460 11 GGAG/GAGG GENOMAD.003590.VV 9.884e-09 60 0 0 1 2561 Caudoviricetes NA NA PF04860;TIGR01537;COG4695 phage portal protein, HK97 family
+NC_018515.1|provirus_4659544_4694673_4293 4679878 4681632 1755 -1 0.471 11 AGxAGG/AGGxGG GENOMAD.194580.VP 2.855e-27 121 0 0 1 2561 Caudoviricetes NA NA PF03354;PF05521;PF20441;COG4626;TIGR01563 Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_018515.1|provirus_4659544_4694673_4294 4681625 4682008 384 -1 0.464 11 GGAGG GENOMAD.092852.VV 8.987e-49 170 0 0 1 2561 Caudoviricetes NA NA TIGR01558 NA
+NC_018515.1|provirus_4659544_4694673_4295 4682094 4682456 363 -1 0.394 11 AGGA/GGAG/GAGG GENOMAD.080571.VV 4.962e-76 248 0 0 0 11831 Demerecviridae NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4296 4683479 4684264 786 1 0.359 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4297 4684476 4685324 849 1 0.269 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4298 4685564 4686076 513 -1 0.454 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4299 4686432 4686794 363 -1 0.501 11 AGGAG(G)/GGAGG GENOMAD.151656.VP 8.696e-38 138 0 0 1 2561 Caudoviricetes NA NA PF17288;K06909;TIGR01547;COG1783 phage terminase, large subunit, PBSX family
+NC_018515.1|provirus_4659544_4694673_4300 4686791 4687312 522 -1 0.454 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4301 4687336 4688310 975 -1 0.463 11 AGGAGG GENOMAD.017981.VV 2.221e-42 161 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4302 4688325 4688492 168 -1 0.494 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4303 4688511 4689254 744 -1 0.440 11 GGA/GAG/AGG GENOMAD.129273.VC 1.957e-41 155 0 0 0 2561 Caudoviricetes NA NA PF12706;TIGR02651;COG1234;K06167 ribonuclease Z
+NC_018515.1|provirus_4659544_4694673_4304 4689256 4690083 828 -1 0.447 11 AGGAGG GENOMAD.121864.VP 4.873e-26 111 0 0 0 2561 Caudoviricetes NA NA PF03837;COG3723;K07455;TIGR00616 Recombinational DNA repair protein RecT
+NC_018515.1|provirus_4659544_4694673_4305 4690183 4690290 108 -1 0.426 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4306 4690287 4692251 1965 -1 0.439 11 GGA/GAG/AGG GENOMAD.182234.VP 4.932e-58 218 0 0 0 2561 Caudoviricetes NA NA PF13175;TIGR00634;COG1195;K03546 DNA repair protein RecN
+NC_018515.1|provirus_4659544_4694673_4307 4692248 4692634 387 -1 0.429 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4308 4692650 4692922 273 -1 0.502 11 None GENOMAD.199250.VV 1.281e-05 44 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4309 4692957 4693220 264 -1 0.432 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4310 4693210 4693476 267 -1 0.449 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4311 4693491 4693604 114 -1 0.465 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4312 4693681 4693836 156 -1 0.436 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_018515.1|provirus_4659544_4694673_4313 4693815 4694144 330 -1 0.415 11 None GENOMAD.169643.VC 1.05e-06 48 0 0 1 1 NA NA NA PF11242;TIGR02612;COG4197;K22299 mobile mystery protein A
+NC_018515.1|provirus_4659544_4694673_4314 4694266 4694673 408 1 0.395 11 AGGAGG GENOMAD.053307.VV 0.0005741 41 0 0 0 2561 Caudoviricetes NA NA PF13744;COG3655;TIGR02612;K18830 DNA-binding transcriptional regulator, XRE family
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_019897.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_019897.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_019904.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_019904.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_019936.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_019936.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,50 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_019936.1|provirus_2347508_2361929_2122 2347508 2347720 213 -1 0.521 11 GGAG/GAGG GENOMAD.221461.VP 1.082e-35 129 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2123 2347848 2349110 1263 1 0.571 11 GGA/GAG/AGG GENOMAD.223897.VP 6.327e-42 163 0 0 0 8016 Inoviridae NA NA PF05155 Phage X family
+NC_019936.1|provirus_2347508_2361929_2124 2349110 2349256 147 1 0.510 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2125 2349354 2349698 345 1 0.528 11 GGAG/GAGG GENOMAD.215295.VP 5.435e-24 98 0 0 0 8016 Inoviridae NA NA PF17426 Putative Gamma DNA binding protein G5P
+NC_019936.1|provirus_2347508_2361929_2126 2349942 2350088 147 1 0.565 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2127 2350223 2351734 1512 1 0.511 11 GGAGG GENOMAD.222416.VP 9.094e-24 109 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2128 2351737 2352003 267 1 0.532 11 GGAGG GENOMAD.197598.VP 3.988e-31 117 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2129 2352007 2353200 1194 1 0.550 11 None GENOMAD.056690.VV 1.152e-05 50 0 0 1 8016 Inoviridae NA NA PF05707;COG4128;K10954 Zona occludens toxin, predicted ATPase
+NC_019936.1|provirus_2347508_2361929_2130 2353258 2353545 288 -1 0.587 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2131 2353940 2354152 213 -1 0.521 11 GGAG/GAGG GENOMAD.221461.VP 1.082e-35 129 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2132 2354280 2355542 1263 1 0.571 11 GGA/GAG/AGG GENOMAD.223897.VP 6.327e-42 163 0 0 0 8016 Inoviridae NA NA PF05155 Phage X family
+NC_019936.1|provirus_2347508_2361929_2133 2355542 2355688 147 1 0.510 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2134 2355786 2356130 345 1 0.528 11 GGAG/GAGG GENOMAD.215295.VP 5.435e-24 98 0 0 0 8016 Inoviridae NA NA PF17426 Putative Gamma DNA binding protein G5P
+NC_019936.1|provirus_2347508_2361929_2135 2356374 2356520 147 1 0.565 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2136 2356655 2358166 1512 1 0.511 11 GGAGG GENOMAD.222416.VP 9.094e-24 109 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2137 2358169 2358435 267 1 0.532 11 GGAGG GENOMAD.197598.VP 3.988e-31 117 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2138 2358439 2359632 1194 1 0.550 11 None GENOMAD.056690.VV 1.152e-05 50 0 0 1 8016 Inoviridae NA NA PF05707;COG4128;K10954 Zona occludens toxin, predicted ATPase
+NC_019936.1|provirus_2347508_2361929_2139 2359690 2359977 288 -1 0.587 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2140 2360944 2361303 360 1 0.511 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2141 2361300 2361584 285 1 0.586 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_2347508_2361929_2142 2361642 2361929 288 -1 0.587 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2952 3233292 3234299 1008 -1 0.619 11 None GENOMAD.212346.VP 4.357e-26 113 0 0 1 2561 Caudoviricetes NA NA PF16452;PF06892;COG1974 Bacteriophage CI repressor C-terminal domain; Phage regulatory protein CII (CP76)
+NC_019936.1|provirus_3233292_3242961_2953 3234281 3235558 1278 -1 0.596 11 GGAG/GAGG GENOMAD.226808.VP 8.692e-257 787 0 0 0 8016 Inoviridae NA NA PF02486 Replication initiation factor
+NC_019936.1|provirus_3233292_3242961_2954 3235706 3236890 1185 -1 0.617 11 AGGAG GENOMAD.090645.VV 1.347e-06 53 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2955 3236903 3237229 327 -1 0.572 11 AGGAG GENOMAD.224290.VP 3.685e-65 216 0 0 0 1 NA NA NA PF10734 NA
+NC_019936.1|provirus_3233292_3242961_2956 3237229 3238722 1494 -1 0.586 11 GGxGG GENOMAD.222416.VP 3.831e-276 847 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2957 3238725 3238853 129 -1 0.558 11 3Base/5BMM NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2958 3238873 3239082 210 -1 0.638 11 GGAG/GAGG GENOMAD.224287.VP 6.332e-33 121 0 0 1 1 NA NA NA PF05356 Inovirus Coat protein B
+NC_019936.1|provirus_3233292_3242961_2959 3239093 3239308 216 -1 0.597 11 AGxAGG/AGGxGG GENOMAD.225528.VP 1.222e-42 149 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2960 3239305 3239484 180 -1 0.672 11 GGAGG GENOMAD.226094.VP 6.522e-28 106 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2961 3239500 3239859 360 -1 0.611 11 GGAG/GAGG GENOMAD.225482.VP 6.187e-49 170 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2962 3240152 3240922 771 -1 0.641 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2963 3240938 3241081 144 -1 0.660 11 GGxGG GENOMAD.213484.VP 1.701e-13 64 0 0 0 2561 Caudoviricetes NA NA PF05509;COG4877 Plasmid stability protein
+NC_019936.1|provirus_3233292_3242961_2964 3241086 3241229 144 -1 0.611 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2965 3241226 3241441 216 -1 0.616 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_3233292_3242961_2966 3241921 3242961 1041 1 0.386 11 AGGA/GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_4295725_4304306_3986 4295725 4295985 261 -1 0.567 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_4295725_4304306_3987 4296137 4296352 216 1 0.574 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_4295725_4304306_3988 4296349 4296930 582 1 0.662 11 AGGAG GENOMAD.226428.VP 0.0008059 42 0 0 0 8016 Inoviridae NA NA PF17525 NA
+NC_019936.1|provirus_4295725_4304306_3989 4297106 4297477 372 1 0.597 11 GGAG/GAGG GENOMAD.225482.VP 2.427e-28 111 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_4295725_4304306_3990 4297493 4297672 180 1 0.644 11 GGAGG GENOMAD.226094.VP 7.27e-27 103 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_4295725_4304306_3991 4297669 4297884 216 1 0.588 11 AGxAGG/AGGxGG GENOMAD.225528.VP 1.222e-42 149 0 0 0 1 NA NA NA NA NA
+NC_019936.1|provirus_4295725_4304306_3992 4297895 4298104 210 1 0.657 11 GGAG/GAGG GENOMAD.224287.VP 5.695e-34 124 0 0 1 1 NA NA NA PF05356 Inovirus Coat protein B
+NC_019936.1|provirus_4295725_4304306_3993 4298256 4299749 1494 1 0.583 11 GGxGG GENOMAD.222416.VP 3.831e-276 847 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_4295725_4304306_3994 4299749 4300075 327 1 0.566 11 AGGAG GENOMAD.224290.VP 3.685e-65 216 0 0 0 1 NA NA NA PF10734 NA
+NC_019936.1|provirus_4295725_4304306_3995 4300088 4301272 1185 1 0.619 11 AGGAG GENOMAD.090645.VV 5.588e-06 51 0 0 0 8016 Inoviridae NA NA NA NA
+NC_019936.1|provirus_4295725_4304306_3996 4301420 4302700 1281 1 0.596 11 GGAG/GAGG GENOMAD.226808.VP 9.102e-257 787 0 0 0 8016 Inoviridae NA NA PF02486 Replication initiation factor
+NC_019936.1|provirus_4295725_4304306_3997 4302682 4303740 1059 1 0.590 11 AGGA/GGAG/GAGG GENOMAD.212346.VP 6.393e-29 122 0 0 1 2561 Caudoviricetes NA NA PF16452;PF06892;COG1974 Bacteriophage CI repressor C-terminal domain; Phage regulatory protein CII (CP76)
+NC_019936.1|provirus_4295725_4304306_3998 4303989 4304306 318 1 0.613 11 AGGAG GENOMAD.200462.VV 1.519e-09 56 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_genes/NC_021184.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_021184.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,144 @@
+gene start end length strand gc_content genetic_code rbs_motif marker evalue bitscore uscg plasmid_hallmark virus_hallmark taxid taxname annotation_conjscan annotation_amr annotation_accessions annotation_description
+NC_021184.1|provirus_19778_35564_13 19778 21046 1269 1 0.465 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_14 21861 23045 1185 -1 0.483 11 AGGAG GENOMAD.016861.VV 4.71e-05 48 0 0 0 2561 Caudoviricetes NA NA PF13671;COG2019;TIGR01359;K13829 AAA domain
+NC_021184.1|provirus_19778_35564_15 23045 23500 456 -1 0.342 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_16 23641 23904 264 1 0.481 11 AGxAGG/AGGxGG GENOMAD.221988.VV 2.546e-05 43 0 0 0 1 NA NA NA PF06806;COG3311;TIGR01764 Predicted DNA-binding transcriptional regulator AlpA
+NC_021184.1|provirus_19778_35564_17 23960 24580 621 1 0.435 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_18 24568 25845 1278 1 0.462 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_19 26129 26368 240 1 0.412 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_20 26390 26560 171 1 0.532 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_21 26565 26771 207 1 0.449 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_22 26935 27291 357 1 0.409 11 AGxAGG/AGGxGG GENOMAD.096257.VV 5.932e-08 52 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_19778_35564_23 27269 27457 189 1 0.434 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_24 27482 28054 573 1 0.447 11 AGxAGG/AGGxGG GENOMAD.103011.VV 5.601e-31 122 0 0 1 2561 Caudoviricetes NA NA PF04586;COG3740;K06904;TIGR01543 Phage head maturation protease
+NC_021184.1|provirus_19778_35564_25 28056 29300 1245 1 0.491 11 AGGAGG GENOMAD.113164.VP 4.496e-51 190 0 0 1 2561 Caudoviricetes NA NA PF05521;COG5614;TIGR01563 Bacteriophage head-tail adaptor
+NC_021184.1|provirus_19778_35564_26 29533 31557 2025 1 0.486 11 GGAG/GAGG GENOMAD.110013.VP 2.142e-73 265 0 0 1 2561 Caudoviricetes NA NA COG5280 Phage-related minor tail protein
+NC_021184.1|provirus_19778_35564_27 31554 32714 1161 1 0.414 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_28 32727 33191 465 -1 0.391 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_29 33713 34003 291 1 0.405 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_30 34327 34608 282 -1 0.465 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_31 34601 34831 231 -1 0.390 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_32 35121 35261 141 1 0.411 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_33 35242 35364 123 1 0.398 11 AGGAG/GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_19778_35564_34 35394 35564 171 1 0.380 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4217 4466413 4467399 987 1 0.396 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4218 4467522 4470317 2796 1 0.406 11 None GENOMAD.104116.VV 8.672e-09 62 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4219 4471023 4471277 255 -1 0.451 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4220 4471243 4473018 1776 -1 0.420 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4221 4473008 4473463 456 -1 0.384 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4222 4473456 4474466 1011 -1 0.409 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4223 4474820 4475086 267 1 0.416 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4224 4475312 4475857 546 1 0.419 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4225 4475973 4476248 276 1 0.457 11 GGA/GAG/AGG GENOMAD.222700.VP 1.456e-50 173 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4226 4476302 4477498 1197 1 0.426 11 3Base/5BMM GENOMAD.014802.VV 5.286e-15 80 0 0 0 2561 Caudoviricetes NA NA PF00176;K20093;COG1061;TIGR04095 Superfamily II DNA or RNA helicase
+NC_021184.1|provirus_4466413_4519129_4227 4477794 4479494 1701 1 0.453 11 AGGAGG GENOMAD.016341.VV 2.929e-155 501 0 0 1 2561 Caudoviricetes NA NA PF13479;PF12684;TIGR01618;K07465;COG1468 phage nucleotide-binding protein
+NC_021184.1|provirus_4466413_4519129_4228 4479516 4479968 453 1 0.413 11 AGGAGG GENOMAD.031678.VV 1.272e-30 119 0 0 0 2561 Caudoviricetes NA NA PF05037 NA
+NC_021184.1|provirus_4466413_4519129_4229 4479970 4481664 1695 1 0.436 11 AGxAGG/AGGxGG GENOMAD.102034.VP 2.19e-113 379 0 0 0 2561 Caudoviricetes NA NA TIGR01636 NA
+NC_021184.1|provirus_4466413_4519129_4230 4481661 4482314 654 1 0.428 11 AGGA GENOMAD.171549.VP 2.774e-19 89 0 0 0 2561 Caudoviricetes NA NA COG3617 Prophage antirepressor
+NC_021184.1|provirus_4466413_4519129_4231 4482602 4484512 1911 1 0.425 11 GGAG/GAGG GENOMAD.024099.VV 5.934e-52 199 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4232 4484713 4485057 345 1 0.507 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4233 4485047 4485271 225 1 0.418 11 GGAGG GENOMAD.212426.VP 2.242e-30 114 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4234 4485261 4485629 369 1 0.455 11 GGAGG GENOMAD.159035.VP 2.564e-27 108 0 0 0 2561 Caudoviricetes NA NA PF07374;TIGR01636;COG2739 phage transcriptional activator, RinA family
+NC_021184.1|provirus_4466413_4519129_4235 4485801 4486007 207 1 0.435 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4236 4486094 4486492 399 1 0.501 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4237 4486710 4486982 273 -1 0.410 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4238 4486969 4487244 276 -1 0.435 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4239 4487505 4488899 1395 1 0.507 11 AGGAGG GENOMAD.005053.VV 3.055e-18 91 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4240 4488903 4490126 1224 1 0.455 11 AGGAGG GENOMAD.038338.VV 3.758e-27 118 0 0 0 2561 Caudoviricetes NA NA COG3392 NA
+NC_021184.1|provirus_4466413_4519129_4241 4490195 4490959 765 1 0.492 11 AGGAGG GENOMAD.105515.VV 3.381e-15 78 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4242 4490960 4491148 189 1 0.471 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4243 4491287 4492195 909 1 0.528 11 AGxAGG/AGGxGG GENOMAD.105515.VV 1.222e-10 65 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4244 4492256 4492594 339 1 0.475 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4245 4492686 4493117 432 1 0.509 11 AGxAGG/AGGxGG GENOMAD.191984.VP 5.92e-08 53 0 0 0 2561 Caudoviricetes NA NA PF07128 NA
+NC_021184.1|provirus_4466413_4519129_4246 4493183 4493389 207 1 0.444 11 AGxAGG/AGGxGG GENOMAD.225559.VP 7.754e-16 72 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4247 4493440 4493913 474 1 0.502 11 GGAGG GENOMAD.168120.VP 1.382e-13 70 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_021184.1|provirus_4466413_4519129_4248 4493942 4495498 1557 1 0.489 11 GGAGG GENOMAD.181434.VP 5.884e-56 208 0 0 1 2561 Caudoviricetes NA NA PF20441 Terminase large subunit, endonuclease domain
+NC_021184.1|provirus_4466413_4519129_4249 4495568 4495879 312 1 0.356 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4250 4495869 4496198 330 1 0.348 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4251 4496274 4497509 1236 1 0.493 11 AGGAG(G)/GGAGG GENOMAD.179073.VP 1.101e-41 162 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4252 4497502 4498215 714 1 0.475 11 AGGAGG GENOMAD.028909.VV 1.007e-19 91 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR01560 Phage gp6-like head-tail connector protein
+NC_021184.1|provirus_4466413_4519129_4253 4498222 4499157 936 1 0.495 11 GGAGG GENOMAD.168658.VV 2.457e-20 95 0 0 1 2561 Caudoviricetes NA NA PF05065;PF04586;PF12518;COG4653;TIGR01554;K06904 Predicted phage phi-C31 gp36 major capsid-like protein
+NC_021184.1|provirus_4466413_4519129_4254 4499866 4501686 1821 1 0.440 11 3Base/5BMM GENOMAD.036196.VV 0.0007312 45 0 0 0 2561 Caudoviricetes NA NA PF01824 MatK/TrnK amino terminal region
+NC_021184.1|provirus_4466413_4519129_4255 4501705 4502046 342 1 0.523 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4256 4502057 4502743 687 1 0.504 11 GGA/GAG/AGG GENOMAD.111513.VV 1.908e-15 78 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4257 4502765 4503067 303 1 0.439 11 GGAGG GENOMAD.041843.VV 4.112e-13 66 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR01560 Phage gp6-like head-tail connector protein
+NC_021184.1|provirus_4466413_4519129_4258 4503067 4503399 333 1 0.477 11 GGA/GAG/AGG GENOMAD.142742.VP 1.864e-17 79 0 0 1 2561 Caudoviricetes NA NA PF05521;COG5614;TIGR01563 Bacteriophage head-tail adaptor
+NC_021184.1|provirus_4466413_4519129_4259 4503392 4503763 372 1 0.503 11 GGAGG GENOMAD.137411.VP 1.962e-22 94 0 0 1 2561 Caudoviricetes NA NA PF11114;TIGR01725;COG5005 phage protein, HK97 gp10 family
+NC_021184.1|provirus_4466413_4519129_4260 4503760 4504086 327 1 0.407 11 AGxAGG/AGGxGG GENOMAD.018077.VV 6.075e-44 155 0 0 0 2561 Caudoviricetes NA NA PF05657 NA
+NC_021184.1|provirus_4466413_4519129_4261 4504087 4504653 567 1 0.487 11 AGGAGG GENOMAD.003250.VV 2.873e-56 195 0 0 1 2561 Caudoviricetes NA NA PF04630;TIGR01603 phage major tail protein, phi13 family
+NC_021184.1|provirus_4466413_4519129_4262 4504658 4504957 300 1 0.453 11 GGAGG GENOMAD.063000.VV 7.958e-45 157 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4263 4504969 4505124 156 1 0.378 11 GGAG/GAGG GENOMAD.108553.VV 1.339e-24 96 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4264 4505209 4505475 267 1 0.333 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4265 4505462 4505782 321 1 0.293 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4266 4505833 4509261 3429 1 0.498 11 AGxAGG/AGGxGG GENOMAD.181727.VP 1.385e-58 226 0 0 1 2561 Caudoviricetes NA NA COG5280 Phage-related minor tail protein
+NC_021184.1|provirus_4466413_4519129_4267 4509272 4510123 852 1 0.472 11 AGGAGG GENOMAD.008827.VV 2.998e-171 532 0 0 0 2561 Caudoviricetes NA NA PF20195;COG4722;TIGR01633 Phage-related protein
+NC_021184.1|provirus_4466413_4519129_4268 4510138 4511208 1071 1 0.486 11 AGGAG GENOMAD.007754.VV 4.216e-63 223 0 0 1 2561 Caudoviricetes NA NA PF08931 Receptor-binding protein of phage tail base-plate Siphoviridae, head
+NC_021184.1|provirus_4466413_4519129_4269 4511210 4512007 798 1 0.501 11 GGAGG GENOMAD.078804.VV 2.471e-67 231 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4270 4512000 4513862 1863 1 0.436 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4271 4513877 4514155 279 1 0.502 11 AGGAGG GENOMAD.169028.VV 1.692e-49 170 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4272 4514155 4514295 141 1 0.468 11 GGAGG GENOMAD.166984.VP 1.613e-13 64 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4273 4514369 4515079 711 1 0.332 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4274 4515106 4516203 1098 1 0.476 11 GGAG/GAGG GENOMAD.006687.VV 1.779e-36 145 0 0 1 2561 Caudoviricetes NA NA PF14594;COG4926;TIGR01665 Siphovirus ReqiPepy6 Gp37-like protein
+NC_021184.1|provirus_4466413_4519129_4275 4516251 4516661 411 1 0.448 11 AGxAGG/AGGxGG GENOMAD.083633.VV 1.122e-06 49 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4276 4516654 4517340 687 1 0.483 11 GGAGG GENOMAD.058849.VV 0.0002819 44 0 0 0 2561 Caudoviricetes NA NA PF01520;COG0860;TIGR02883 N-acetylmuramoyl-L-alanine amidase
+NC_021184.1|provirus_4466413_4519129_4277 4517472 4518329 858 1 0.480 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4466413_4519129_4278 4518344 4519129 786 1 0.485 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4319 4563831 4564775 945 -1 0.388 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4320 4565036 4565629 594 -1 0.325 11 AGxAGG/AGGxGG GENOMAD.221500.PV 0.0001909 44 0 0 0 1 NA NA NA PF19503 NA
+NC_021184.1|provirus_4563831_4615358_4321 4567530 4570109 2580 -1 0.437 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4322 4570230 4570469 240 -1 0.358 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4323 4570482 4570748 267 -1 0.382 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4324 4570820 4571578 759 -1 0.484 11 AGGAG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4325 4571594 4572604 1011 -1 0.459 11 3Base/5BMM NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4326 4572601 4573257 657 -1 0.492 11 AGGAGG GENOMAD.055867.VV 1.36e-18 87 0 0 0 2561 Caudoviricetes NA NA COG5632 N-acetylmuramoyl-L-alanine amidase CwlA
+NC_021184.1|provirus_4563831_4615358_4327 4573241 4573663 423 -1 0.449 11 AGxAGG/AGGxGG GENOMAD.083633.VV 1.257e-06 49 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4328 4573711 4574808 1098 -1 0.476 11 AGGA/GGAG/GAGG GENOMAD.006687.VV 8.567e-33 134 0 0 1 2561 Caudoviricetes NA NA PF14594;COG4926;TIGR01665 Siphovirus ReqiPepy6 Gp37-like protein
+NC_021184.1|provirus_4563831_4615358_4329 4574832 4574972 141 -1 0.504 11 AGGAGG GENOMAD.166984.VP 1.819e-12 61 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4330 4574972 4575250 279 -1 0.477 11 GGAGG GENOMAD.169028.VV 3.079e-51 175 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4331 4575265 4577127 1863 -1 0.430 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4332 4577120 4577917 798 -1 0.490 11 GGAGG GENOMAD.078804.VV 1.766e-71 243 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4333 4577919 4578995 1077 -1 0.476 11 AGGAGG GENOMAD.007754.VV 1.197e-59 213 0 0 1 2561 Caudoviricetes NA NA PF08931 Receptor-binding protein of phage tail base-plate Siphoviridae, head
+NC_021184.1|provirus_4563831_4615358_4334 4579010 4579861 852 -1 0.465 11 AGGAGG GENOMAD.008827.VV 2.146e-166 518 0 0 0 2561 Caudoviricetes NA NA PF20195;COG4722;TIGR01633 Phage-related protein
+NC_021184.1|provirus_4563831_4615358_4335 4579873 4583292 3420 -1 0.488 11 AGxAGG/AGGxGG GENOMAD.207179.VP 1.909e-93 337 0 0 1 2561 Caudoviricetes NA NA PF05521;COG5283;TIGR01563 Phage-related tail protein
+NC_021184.1|provirus_4563831_4615358_4336 4583330 4583485 156 -1 0.410 11 GGA/GAG/AGG GENOMAD.108553.VV 1.339e-24 96 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4337 4583497 4583790 294 -1 0.459 11 AGGAGG GENOMAD.063000.VV 3.242e-45 158 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4338 4583794 4584600 807 -1 0.496 11 AGGAGG GENOMAD.003250.VV 3.053e-56 199 0 0 1 2561 Caudoviricetes NA NA PF04630;TIGR01603 phage major tail protein, phi13 family
+NC_021184.1|provirus_4563831_4615358_4339 4584601 4584927 327 -1 0.407 11 AGxAGG/AGGxGG GENOMAD.018077.VV 6.075e-44 155 0 0 0 2561 Caudoviricetes NA NA PF05657 NA
+NC_021184.1|provirus_4563831_4615358_4340 4584924 4585295 372 -1 0.508 11 GGAGG GENOMAD.137411.VP 1.962e-22 94 0 0 1 2561 Caudoviricetes NA NA PF11114;TIGR01725;COG5005 phage protein, HK97 gp10 family
+NC_021184.1|provirus_4563831_4615358_4341 4585288 4585620 333 -1 0.477 11 GGA/GAG/AGG GENOMAD.142742.VP 1.686e-18 82 0 0 1 2561 Caudoviricetes NA NA PF05521;COG5614;TIGR01563 Bacteriophage head-tail adaptor
+NC_021184.1|provirus_4563831_4615358_4342 4585620 4585922 303 -1 0.439 11 GGAGG GENOMAD.041843.VV 4.112e-13 66 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR01560 Phage gp6-like head-tail connector protein
+NC_021184.1|provirus_4563831_4615358_4343 4585944 4586630 687 -1 0.505 11 GGA/GAG/AGG GENOMAD.111513.VV 1.908e-15 78 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4344 4586641 4587825 1185 -1 0.499 11 GGAGG GENOMAD.168658.VV 3.396e-31 130 0 0 1 2561 Caudoviricetes NA NA PF05065;PF04586;PF12518;COG4653;TIGR01554;K06904 Predicted phage phi-C31 gp36 major capsid-like protein
+NC_021184.1|provirus_4563831_4615358_4345 4587832 4588530 699 -1 0.478 11 AGGAGG GENOMAD.028909.VV 1.64e-23 102 0 0 1 2561 Caudoviricetes NA NA PF05135;TIGR01560 Phage gp6-like head-tail connector protein
+NC_021184.1|provirus_4563831_4615358_4346 4588523 4589815 1293 -1 0.497 11 None GENOMAD.179073.VP 7.993e-40 157 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4347 4589828 4590154 327 -1 0.401 11 AGGA NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4348 4590144 4590455 312 -1 0.426 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4349 4590525 4592081 1557 -1 0.482 11 GGAGG GENOMAD.181434.VP 1.249e-57 213 0 0 1 2561 Caudoviricetes NA NA PF20441 Terminase large subunit, endonuclease domain
+NC_021184.1|provirus_4563831_4615358_4350 4592110 4592583 474 -1 0.511 11 GGAGG GENOMAD.168120.VP 1.382e-13 70 0 0 1 2561 Caudoviricetes NA NA PF05119;COG3747;TIGR01558 Phage terminase, small subunit
+NC_021184.1|provirus_4563831_4615358_4351 4592638 4592844 207 -1 0.473 11 AGxAGG/AGGxGG GENOMAD.225559.VP 7.754e-16 72 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4352 4592896 4593348 453 -1 0.510 11 AGxAGG/AGGxGG GENOMAD.191984.VP 7.214e-08 53 0 0 0 2561 Caudoviricetes NA NA PF07128 NA
+NC_021184.1|provirus_4563831_4615358_4353 4593440 4593778 339 -1 0.475 11 GGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4354 4593839 4594747 909 -1 0.530 11 AGxAGG/AGGxGG GENOMAD.105515.VV 1.222e-10 65 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4355 4594886 4595074 189 -1 0.476 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4356 4595075 4595839 765 -1 0.498 11 AGGAGG GENOMAD.105515.VV 7.138e-14 74 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4357 4595908 4597131 1224 -1 0.462 11 AGGAGG GENOMAD.038338.VV 3.932e-28 121 0 0 0 2561 Caudoviricetes NA NA COG3392 NA
+NC_021184.1|provirus_4563831_4615358_4358 4597135 4598529 1395 -1 0.491 11 AGGAGG GENOMAD.005053.VV 3.988e-20 97 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4359 4598987 4599307 321 -1 0.505 11 GGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4360 4599480 4600436 957 -1 0.357 11 GGA/GAG/AGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4361 4600429 4601187 759 -1 0.362 11 None NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4362 4601556 4601987 432 -1 0.444 11 GGxGG GENOMAD.159035.VP 1.815e-23 98 0 0 0 2561 Caudoviricetes NA NA PF07374;TIGR01636;COG2739 phage transcriptional activator, RinA family
+NC_021184.1|provirus_4563831_4615358_4363 4601984 4602181 198 -1 0.424 11 AGGAGG GENOMAD.212426.VP 2.201e-26 102 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4364 4602184 4603536 1353 -1 0.474 11 None GENOMAD.116250.VP 4.087e-30 128 0 0 0 2561 Caudoviricetes NA NA PF00270;COG1111;TIGR04095;K17677 ERCC4-related helicase
+NC_021184.1|provirus_4563831_4615358_4365 4603517 4603798 282 -1 0.454 11 AGGAGG GENOMAD.004000.VV 3.23e-20 86 0 0 0 2561 Caudoviricetes NA NA COG1591 NA
+NC_021184.1|provirus_4563831_4615358_4366 4603951 4606197 2247 -1 0.477 11 AGGAGG GENOMAD.016441.VV 9.643e-11 68 0 0 0 2561 Caudoviricetes NA NA TIGR01613 phage/plasmid primase, P4 family, C-terminal domain
+NC_021184.1|provirus_4563831_4615358_4367 4606225 4606872 648 -1 0.414 11 AGGAGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4368 4606860 4607267 408 -1 0.529 11 GGAGG GENOMAD.220271.VP 0.0002632 42 0 0 0 2561 Caudoviricetes NA NA PF09152;COG3613;TIGR03646 Nucleoside 2-deoxyribosyltransferase
+NC_021184.1|provirus_4563831_4615358_4369 4607213 4607470 258 -1 0.496 11 AGGAGG GENOMAD.159187.VV 1.664e-38 138 0 0 0 2561 Caudoviricetes NA NA PF14205;TIGR02098;COG1996 MJ0042 family finger-like domain
+NC_021184.1|provirus_4563831_4615358_4370 4607722 4610022 2301 -1 0.501 11 AGGAG GENOMAD.038590.VV 7.582e-125 421 0 0 0 2561 Caudoviricetes NA NA PF00476;PF13482;K02334;COG0749;TIGR01388 DNA polymerase I - 3'-5' exonuclease and polymerase domains
+NC_021184.1|provirus_4563831_4615358_4371 4610081 4610638 558 -1 0.518 11 AGGAGG GENOMAD.039702.VV 2.165e-40 149 0 0 0 2561 Caudoviricetes NA NA PF10991 NA
+NC_021184.1|provirus_4563831_4615358_4372 4610652 4611773 1122 -1 0.529 11 GGAG/GAGG GENOMAD.136786.VV 3.244e-49 183 0 0 0 2561 Caudoviricetes NA NA PF10926;TIGR01896;COG2887;K07465 CRISPR-associated exonuclease Csa1
+NC_021184.1|provirus_4563831_4615358_4373 4611766 4612083 318 -1 0.494 11 GGAG/GAGG GENOMAD.222352.VV 4.487e-22 92 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4374 4612061 4612222 162 -1 0.506 11 GGAGG GENOMAD.116519.VV 3.339e-10 55 0 0 0 2561 Caudoviricetes NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4375 4612350 4612847 498 -1 0.448 11 GGA/GAG/AGG GENOMAD.204246.VV 1.065e-07 53 0 0 0 2561 Caudoviricetes NA NA PF03333;K01994;TIGR03879 Adhesin biosynthesis transcription regulatory protein
+NC_021184.1|provirus_4563831_4615358_4376 4613153 4615015 1863 -1 0.444 11 AGxAGG/AGGxGG NA NA NA 0 0 0 1 NA NA NA NA NA
+NC_021184.1|provirus_4563831_4615358_4377 4615155 4615358 204 1 0.422 11 GGAG/GAGG NA NA NA 0 0 0 1 NA NA NA NA NA
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_000913.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_000913.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_000913.3|provirus_1412000_1434224 22225 Provirus 1412000-1434224 28 11 0.9653 NA 4 27.1536 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_000913.3|provirus_2461306_2476510 15205 Provirus 2461306-2476510 19 11 0.9611 NA 2 18.3692 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_000913.3|provirus_1196867_1213107 16241 Provirus 1196867-1213107 24 11 0.9605 NA 6 22.4142 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_000913.3|provirus_563848_584430 20583 Provirus 563848-584430 30 11 0.9007 NA 6 14.4709 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_000913.3|provirus_1627517_1653915 26399 Provirus 1627517-1653915 42 11 0.8949 NA 4 21.7953 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_002737.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_002737.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_002737.2|provirus_529627_569283 39657 Provirus 529627-569283 49 11 0.9801 NA 13 76.8805 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_002737.2|provirus_777501_820593 43093 Provirus 777501-820593 68 11 0.9796 NA 10 90.5047 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_002737.2|provirus_1186916_1222544 35629 Provirus 1186916-1222544 54 11 0.9770 NA 8 73.4096 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_003450.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_003450.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_008261.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_008261.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_008261.1|provirus_1784095_1821197 37103 Provirus 1784095-1821197 44 11 0.9669 NA 13 47.9680 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_008261.1|provirus_1070550_1127691 57142 Provirus 1070550-1127691 68 11 0.9536 NA 12 61.5635 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_009012.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_009012.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_009012.1|provirus_2931283_2970170 38888 Provirus 2931283-2970170 62 11 0.9595 NA 14 62.6553 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_009012.1|provirus_1938476_1983993 45518 Provirus 1938476-1983993 52 11 0.9466 NA 14 58.8179 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_009012.1|provirus_2022140_2067593 45454 Provirus 2022140-2067593 55 11 0.9296 NA 12 56.7329 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_009012.1|provirus_3339258_3389049 49792 Provirus 3339258-3389049 53 11 0.9122 NA 2 13.1702 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_012982.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_012982.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_014008.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014008.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_014168.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014168.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_014168.1|provirus_27479_67296 39818 Provirus 27479-67296 63 11 0.9641 NA 7 44.2001 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014168.1|provirus_1141631_1162952 21322 Provirus 1141631-1162952 35 11 0.9457 NA 7 27.6971 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_014211.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014211.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_014212.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014212.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_014212.1|provirus_1746722_1764354 17633 Provirus 1746722-1764354 38 11 0.9025 NA 1 16.7440 Viruses;Varidnaviria;Helvetiavirae;Dividoviricota;Laserviricetes;Halopanivirales;Sphaerolipoviridae
+NC_014212.1|provirus_1893193_1914973 21781 Provirus 1893193-1914973 33 11 0.8895 NA 5 22.1216 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014212.1|provirus_1170297_1209132 38836 Provirus 1170297-1209132 48 11 0.8869 NA 5 21.9558 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_014363.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014363.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_014364.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014364.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_014364.1|provirus_2666253_2703772 37520 Provirus 2666253-2703772 56 11 0.9674 NA 8 31.3276 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014364.1|provirus_2976748_3014759 38012 Provirus 2976748-3014759 43 11 0.9540 NA 6 25.4448 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014364.1|provirus_2121424_2157334 35911 Provirus 2121424-2157334 42 11 0.9330 NA 8 27.2215 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014364.1|provirus_2329685_2350621 20937 Provirus 2329685-2350621 28 11 0.8720 NA 4 13.7214 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_015761.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_015761.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_015761.1|provirus_3084741_3115735 30995 Provirus 3084741-3115735 41 11 0.9788 NA 20 51.6697 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_015761.1|provirus_1007223_1045009 37787 Provirus 1007223-1045009 51 11 0.9585 NA 5 39.7532 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_015761.1|provirus_847397_862760 15364 Provirus 847397-862760 19 11 0.9561 NA 10 16.7146 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_017033.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_017033.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_017033.1|provirus_1557694_1600481 42788 Provirus 1557694-1600481 71 11 0.9788 NA 11 61.4099 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_017033.1|provirus_1052334_1094910 42577 Provirus 1052334-1094910 66 11 0.9602 NA 20 58.7796 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_017033.1|provirus_2089294_2107522 18229 Provirus 2089294-2107522 25 11 0.9392 NA 1 11.4432 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_017095.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_017095.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_018014.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_018014.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_018068.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_018068.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_018068.1|provirus_1361108_1399802 38695 Provirus 1361108-1399802 52 11 0.9631 NA 13 58.9401 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_018068.1|provirus_2072558_2098541 25984 Provirus 2072558-2098541 33 11 0.9473 NA 3 21.6083 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_018515.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_018515.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_018515.1|provirus_3418112_3436097 17986 Provirus 3418112-3436097 25 11 0.9523 NA 6 32.1738 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_018515.1|provirus_4659544_4694673 35130 Provirus 4659544-4694673 49 11 0.9431 NA 14 45.8652 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_019897.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_019897.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_019904.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_019904.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_019936.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_019936.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_019936.1|provirus_4295725_4304306 8582 Provirus 4295725-4304306 13 11 0.9664 NA 2 10.7145 Viruses;Monodnaviria;Loebvirae;Hofneiviricota;Faserviricetes;Tubulavirales;Inoviridae
+NC_019936.1|provirus_2347508_2361929 14422 Provirus 2347508-2361929 21 11 0.9596 NA 2 12.9957 Viruses;Monodnaviria;Loebvirae;Hofneiviricota;Faserviricetes;Tubulavirales;Inoviridae
+NC_019936.1|provirus_3233292_3242961 9670 Provirus 3233292-3242961 15 11 0.9092 NA 2 8.9242 Viruses;Monodnaviria;Loebvirae;Hofneiviricota;Faserviricetes;Tubulavirales;Inoviridae
diff -r 000000000000 -r 315c2ed31af1 test-data/genomad_virus_summary/NC_021184.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_021184.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name length topology coordinates n_genes genetic_code virus_score fdr n_hallmarks marker_enrichment taxonomy
+NC_021184.1|provirus_4563831_4615358 51528 Provirus 4563831-4615358 59 11 0.9554 NA 11 60.5769 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_021184.1|provirus_4466413_4519129 52717 Provirus 4466413-4519129 62 11 0.9421 NA 12 58.6292 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_021184.1|provirus_19778_35564 15787 Provirus 19778-35564 22 11 0.9155 NA 3 8.5756 Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
diff -r 000000000000 -r 315c2ed31af1 test-data/gtdbtk.bac120.summary
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/gtdbtk.bac120.summary Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,23 @@
+user_genome classification closest_genome_reference closest_genome_reference_radius closest_genome_taxonomy closest_genome_ani closest_genome_af closest_placement_reference closest_placement_radius closest_placement_taxonomy closest_placement_ani closest_placement_af pplacer_taxonomy classification_method note other_related_references(genome_id,species_name,radius,ANI,AF) msa_percent translation_table red_value warnings
+NC_000913.fasta d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli GCF_003697165.2 95.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli 96.74 0.856 GCF_000026225.1 95.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii 91.54 0.56 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__ taxonomic classification defined by topology and ANI N/A GCF_000194175.1, s__Escherichia coli_F, 95.0, 95.46, 0.89; GCF_002965065.1, s__Escherichia sp002965065, 95.0, 94.52, 0.691; GCF_004211955.1, s__Escherichia sp004211955, 95.0, 93.12, 0.774; GCF_005843885.1, s__Escherichia sp005843885, 95.0, 92.76, 0.782; GCF_011881725.1, s__Escherichia coli_E, 95.0, 92.37, 0.807; GCF_029876145.1, s__Escherichia ruysiae, 95.0, 92.28, 0.788; GCF_014836715.1, s__Escherichia whittamii, 95.0, 91.78, 0.782; GCF_002900365.1, s__Escherichia marmotae, 95.0, 90.92, 0.738; GCF_000759775.1, s__Escherichia albertii, 95.0, 90.18, 0.68 98.47 11 N/A N/A
+NC_002737.fasta d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes GCF_002055535.1 95.0 d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes 99.7 0.968 GCF_002055535.1 95.0 d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes 99.7 0.968 d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_900459225.1, s__Streptococcus dysgalactiae, 95.0, 88.16, 0.456; GCF_900636575.1, s__Streptococcus canis, 95.0, 86.81, 0.468 98.31 11 N/A N/A
+NC_003450.fasta d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Corynebacterium;s__Corynebacterium glutamicum GCF_000011325.1 95.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Corynebacterium;s__Corynebacterium glutamicum 100.0 1.0 GCF_000011325.1 95.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Corynebacterium;s__Corynebacterium glutamicum 100.0 1.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Corynebacterium;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_002355155.1, s__Corynebacterium suranareeae, 95.0, 86.55, 0.531; GCF_001643015.1, s__Corynebacterium crudilactis, 95.0, 84.07, 0.363; GCF_001277995.1, s__Corynebacterium deserti, 95.0, 83.77, 0.275 96.43 11 N/A N/A
+NC_008261.fasta d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens GCF_000013285.1 95.0 d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens 100.0 1.0 GCF_000013285.1 95.0 d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens 100.0 1.0 d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_029258205.1, s__Sarcina sp029258205, 95.0, 92.75, 0.744; GCF_029267215.1, s__Sarcina sp029267215, 95.0, 84.03, 0.29 94.4 11 N/A N/A
+NC_009012.fasta d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum GCF_000015865.1 95.0 d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum 100.0 1.0 GCF_000015865.1 95.0 d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum 100.0 1.0 d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_000521465.1, s__Hungateiclostridium straminisolvens, 95.0, 84.49, 0.429; GCF_004102745.1, s__Hungateiclostridium mesophilum, 95.0, 81.39, 0.257 94.22 11 N/A N/A
+NC_012982.fasta d__Bacteria;p__Pseudomonadota;c__Alphaproteobacteria;o__Caulobacterales;f__Hyphomonadaceae;g__Hirschia;s__Hirschia baltica GCF_000023785.1 95.0 d__Bacteria;p__Pseudomonadota;c__Alphaproteobacteria;o__Caulobacterales;f__Hyphomonadaceae;g__Hirschia;s__Hirschia baltica 100.0 1.0 GCF_000023785.1 95.0 d__Bacteria;p__Pseudomonadota;c__Alphaproteobacteria;o__Caulobacterales;f__Hyphomonadaceae;g__Hirschia;s__Hirschia baltica 100.0 1.0 d__Bacteria;p__Pseudomonadota;c__Alphaproteobacteria;o__Caulobacterales;f__Hyphomonadaceae;g__Hirschia;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments N/A 98.25 11 N/A N/A
+NC_014008.fasta d__Bacteria;p__Verrucomicrobiota;c__Verrucomicrobiae;o__Opitutales;f__Coraliomargaritaceae;g__Coraliomargarita;s__Coraliomargarita akajimensis GCF_000025905.1 95.0 d__Bacteria;p__Verrucomicrobiota;c__Verrucomicrobiae;o__Opitutales;f__Coraliomargaritaceae;g__Coraliomargarita;s__Coraliomargarita akajimensis 100.0 1.0 GCF_000025905.1 95.0 d__Bacteria;p__Verrucomicrobiota;c__Verrucomicrobiae;o__Opitutales;f__Coraliomargaritaceae;g__Coraliomargarita;s__Coraliomargarita akajimensis 100.0 1.0 d__Bacteria;p__Verrucomicrobiota;c__Verrucomicrobiae;o__Opitutales;f__Coraliomargaritaceae;g__;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments N/A 90.76 11 N/A N/A
+NC_014168.fasta d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus GCF_000092825.1 95.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus 100.0 1.0 GCF_000092825.1 95.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus 100.0 1.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_000185725.2, s__Segniliparus rugosus, 95.0, 80.18, 0.178 96.56 11 N/A N/A
+NC_014211.fasta d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Streptosporangiales;f__Streptosporangiaceae;g__Nocardiopsis;s__Nocardiopsis dassonvillei GCF_000092985.1 95.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Streptosporangiales;f__Streptosporangiaceae;g__Nocardiopsis;s__Nocardiopsis dassonvillei 100.0 1.0 GCF_000092985.1 95.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Streptosporangiales;f__Streptosporangiaceae;g__Nocardiopsis;s__Nocardiopsis dassonvillei 100.0 1.0 d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Streptosporangiales;f__Streptosporangiaceae;g__Nocardiopsis;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_012396365.1, s__Nocardiopsis alborubida, 95.0, 94.89, 0.822; GCA_000340945.1, s__Nocardiopsis synnemataformans, 95.0, 94.67, 0.838; GCA_002529455.1, s__Nocardiopsis fusca, 95.0, 93.48, 0.743; GCF_000341065.1, s__Nocardiopsis halotolerans, 95.0, 89.3, 0.575; GCF_001905145.1, s__Nocardiopsis sp001905145, 95.0, 89.08, 0.554; GCF_008638415.1, s__Nocardiopsis sinuspersici, 95.0, 88.61, 0.531; GCF_008638365.1, s__Nocardiopsis quinghaiensis, 95.0, 88.23, 0.498; GCF_009830945.1, s__Nocardiopsis sp009830945, 95.0, 87.99, 0.442; GCA_937957845.1, s__Nocardiopsis sp937957845, 95.0, 87.38, 0.277; GCF_026642255.1, s__Nocardiopsis nanhaiensis_A, 95.0, 86.06, 0.436; GCF_030271535.1, s__Nocardiopsis sp030271535, 95.0, 84.81, 0.338; GCF_013410755.1, s__Nocardiopsis aegyptia, 95.0, 84.69, 0.277; GCF_018316655.1, s__Nocardiopsis changdeensis, 95.0, 84.65, 0.301; GCF_000341125.1, s__Nocardiopsis lucentensis, 95.0, 84.45, 0.226; GCF_001279585.1, s__Nocardiopsis sp001279585, 95.0, 84.4, 0.267; GCA_018388625.1, s__Nocardiopsis eucommiae, 95.0, 84.39, 0.264; GCF_014201115.1, s__Nocardiopsis metallicus, 95.0, 84.3, 0.268; GCF_003634495.1, s__Nocardiopsis sp003634495, 95.0, 84.18, 0.288; GCF_030766825.1, s__Nocardiopsis sp030766825, 95.0, 84.18, 0.286; GCF_000341085.1, 
s__Nocardiopsis ganjiahuensis, 95.0, 84.16, 0.28; GCF_030555055.1, s__Nocardiopsis sp030555055, 95.0, 84.06, 0.267; GCF_024134545.1, s__Nocardiopsis exhalans, 95.08, 84.04, 0.267; GCF_900141985.1, s__Nocardiopsis flavescens, 95.0, 83.82, 0.272; GCF_003386285.1, s__Nocardiopsis sp003386285, 95.0, 83.73, 0.264; GCF_014651695.1, s__Nocardiopsis terrae, 95.0, 83.6, 0.27; GCF_014203695.1, s__Nocardiopsis algeriensis, 95.0, 83.59, 0.238; GCF_020741345.1, s__Nocardiopsis listeri_A, 95.0, 83.53, 0.202; GCF_000341225.1, s__Nocardiopsis alba, 95.0, 83.47, 0.217; GCF_018207095.1, s__Nocardiopsis sp018207095, 95.0, 83.32, 0.229; GCF_028882275.1, s__Nocardiopsis sp028882275, 95.0, 83.25, 0.266; GCF_900143625.1, s__Nocardiopsis sp900143625, 95.0, 83.09, 0.229; GCF_000515115.1, s__Nocardiopsis sp000515115, 95.0, 83.02, 0.181; GCF_014892575.1, s__Nocardiopsis coralli, 95.0, 82.85, 0.213; GCF_000341265.1, s__Nocardiopsis prasina, 95.0, 82.63, 0.245; GCF_001942255.1, s__Nocardiopsis sp001942255, 95.0, 82.61, 0.248; GCF_000341005.1, s__Nocardiopsis alkaliphila, 95.0, 82.53, 0.186; GCF_001570765.1, s__Nocardiopsis listeri, 95.0, 82.26, 0.198; GCF_000341025.1, s__Nocardiopsis salina, 95.0, 82.22, 0.158; GCF_000341145.1, s__Nocardiopsis xinjiangensis, 95.0, 81.14, 0.168 26.24 11 N/A N/A
+NC_014212.fasta d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Allomeiothermus;s__Allomeiothermus silvanus GCF_000092125.1 95.0 d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Allomeiothermus;s__Allomeiothermus silvanus 100.0 0.999 GCF_000092125.1 95.0 d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Allomeiothermus;s__Allomeiothermus silvanus 100.0 0.999 d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Allomeiothermus;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_003226535.1, s__Allomeiothermus sp003226535, 95.0, 87.73, 0.485 93.82 11 N/A N/A
+NC_014363.fasta d__Bacteria;p__Actinomycetota;c__Coriobacteriia;o__Coriobacteriales;f__Atopobiaceae;g__Olsenella;s__Olsenella uli GCF_000143845.1 95.0 d__Bacteria;p__Actinomycetota;c__Coriobacteriia;o__Coriobacteriales;f__Atopobiaceae;g__Olsenella;s__Olsenella uli 100.0 1.0 GCF_000143845.1 95.0 d__Bacteria;p__Actinomycetota;c__Coriobacteriia;o__Coriobacteriales;f__Atopobiaceae;g__Olsenella;s__Olsenella uli 100.0 1.0 d__Bacteria;p__Actinomycetota;c__Coriobacteriia;o__Coriobacteriales;f__Atopobiaceae;g__;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments N/A 95.47 11 N/A N/A
+NC_014364.fasta d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae GCF_000143985.1 95.0 d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae 100.0 1.0 GCF_000143985.1 95.0 d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae 100.0 1.0 d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_000378205.1, s__Sediminispirochaeta bajacaliforniensis, 95.0, 94.41, 0.82 88.42 11 N/A N/A
+NC_015761.fasta d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori GCF_000252995.1 95.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori 100.0 1.0 GCF_000252995.1 95.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori 100.0 1.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_000006945.2, s__Salmonella enterica, 95.0, 90.34, 0.758; GCA_900478215.1, s__Salmonella houtenae, 95.0, 90.05, 0.755; GCF_008692785.1, s__Salmonella diarizonae, 95.0, 89.91, 0.746; GCF_008692845.1, s__Salmonella arizonae, 95.0, 89.51, 0.704 97.58 11 N/A N/A
+NC_017033.fasta d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia GCF_000242255.2 95.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia 100.0 1.0 GCF_000242255.2 95.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia 100.0 1.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments N/A 98.45 11 N/A N/A
+NC_017095.fasta d__Bacteria;p__Thermotogota;c__Thermotogae;o__Thermotogales;f__Fervidobacteriaceae;g__Fervidobacterium;s__Fervidobacterium pennivorans GCF_000235405.2 95.0 d__Bacteria;p__Thermotogota;c__Thermotogae;o__Thermotogales;f__Fervidobacteriaceae;g__Fervidobacterium;s__Fervidobacterium pennivorans 100.0 1.0 GCF_000235405.2 95.0 d__Bacteria;p__Thermotogota;c__Thermotogae;o__Thermotogales;f__Fervidobacteriaceae;g__Fervidobacterium;s__Fervidobacterium pennivorans 100.0 1.0 d__Bacteria;p__Thermotogota;c__Thermotogae;o__Thermotogales;f__Fervidobacteriaceae;g__Fervidobacterium;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_001644665.1, s__Fervidobacterium pennivorans_A, 95.0, 92.25, 0.827 90.82 11 N/A N/A
+NC_018014.fasta d__Bacteria;p__Acidobacteriota;c__Terriglobia;o__Terriglobales;f__Acidobacteriaceae;g__Terriglobus;s__Terriglobus roseus GCF_000265425.1 95.0 d__Bacteria;p__Acidobacteriota;c__Terriglobia;o__Terriglobales;f__Acidobacteriaceae;g__Terriglobus;s__Terriglobus roseus 100.0 1.0 GCF_000265425.1 95.0 d__Bacteria;p__Acidobacteriota;c__Terriglobia;o__Terriglobales;f__Acidobacteriaceae;g__Terriglobus;s__Terriglobus roseus 100.0 1.0 d__Bacteria;p__Acidobacteriota;c__Terriglobia;o__Terriglobales;f__Acidobacteriaceae;g__Terriglobus;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_900105625.1, s__Terriglobus roseus_B, 95.0, 82.2, 0.254 94.06 11 N/A N/A
+NC_018068.fasta d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus GCF_000255115.2 95.0 d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus 100.0 1.0 GCF_000255115.2 95.0 d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus 100.0 1.0 d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_002196705.1, s__Desulfosporosinus sp002196705, 95.0, 81.15, 0.156 93.92 11 N/A N/A
+NC_018515.fasta d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei GCF_000231385.2 95.0 d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei 100.0 1.0 GCF_000231385.2 95.0 d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei 100.0 1.0 d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_900100785.1, s__Desulfosporosinus hippei, 95.0, 94.11, 0.765; GCF_000765145.1, s__Desulfosporosinus sp000765145, 95.0, 92.48, 0.692 94.5 11 N/A N/A
+NC_019897.fasta d__Bacteria;p__Bacillota;c__Bacilli;o__Paenibacillales;f__Paenibacillaceae;g__Thermobacillus;s__Thermobacillus xylanilyticus GCF_907165215.1 95.0 d__Bacteria;p__Bacillota;c__Bacilli;o__Paenibacillales;f__Paenibacillaceae;g__Thermobacillus;s__Thermobacillus xylanilyticus 97.81 0.815 GCF_907165215.1 95.0 d__Bacteria;p__Bacillota;c__Bacilli;o__Paenibacillales;f__Paenibacillaceae;g__Thermobacillus;s__Thermobacillus xylanilyticus 97.81 0.815 d__Bacteria;p__Bacillota;c__Bacilli;o__Paenibacillales;f__Paenibacillaceae;g__Thermobacillus;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_002159085.1, s__Thermobacillus sp002159085, 95.0, 85.65, 0.466 95.97 11 N/A N/A
+NC_019904.fasta d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Cytophagales;f__Cyclobacteriaceae;g__Echinicola;s__Echinicola vietnamensis GCF_000325705.1 95.0 d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Cytophagales;f__Cyclobacteriaceae;g__Echinicola;s__Echinicola vietnamensis 100.0 1.0 GCF_000325705.1 95.0 d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Cytophagales;f__Cyclobacteriaceae;g__Echinicola;s__Echinicola vietnamensis 100.0 1.0 d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Cytophagales;f__Cyclobacteriaceae;g__Echinicola;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_005281475.1, s__Echinicola rosea, 95.0, 83.28, 0.288; GCF_006575665.1, s__Echinicola soli, 95.0, 81.29, 0.203; GCF_003260975.1, s__Echinicola strongylocentroti, 95.0, 80.38, 0.164 96.96 11 N/A N/A
+NC_019936.fasta d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE GCF_000327065.1 95.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE 100.0 1.0 GCF_000327065.1 95.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE 100.0 1.0 d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments GCF_003696315.1, s__Stutzerimonas songnenensis, 95.0, 93.2, 0.909; GCF_000661915.1, s__Stutzerimonas decontaminans, 95.0, 91.33, 0.803; GCF_900114065.1, s__Stutzerimonas kunmingensis, 96.6, 90.17, 0.753; GCF_024397475.1, s__Stutzerimonas xanthomarina_A, 97.0, 90.15, 0.746; GCA_007713455.1, s__Stutzerimonas sp007713455, 95.0, 90.03, 0.748; GCF_014764705.1, s__Stutzerimonas sp002692525, 96.82, 90.01, 0.736; GCA_003530955.1, s__Stutzerimonas sp003530955, 96.79, 89.98, 0.727; GCF_002929225.1, s__Stutzerimonas stutzeri_U, 97.04, 89.97, 0.743; GCF_000935215.1, s__Stutzerimonas stutzeri_AD, 96.98, 89.84, 0.723; GCF_000495915.1, s__Stutzerimonas chloritidismutans, 96.78, 89.84, 0.717; GCA_018823765.1, s__Stutzerimonas sp018823765, 97.02, 89.77, 0.71; GCA_003488145.1, s__Stutzerimonas sp003488145, 96.59, 89.74, 0.666; GCF_000341615.1, s__Stutzerimonas stutzeri_G, 95.0, 89.32, 0.697; GCF_002890795.1, s__Stutzerimonas stutzeri_AA, 95.0, 89.28, 0.735; GCF_024448335.1, s__Stutzerimonas frequens, 95.0, 88.75, 0.714; GCF_015291885.1, s__Stutzerimonas stutzeri_AC, 95.0, 88.59, 0.662; GCF_000219605.1, s__Stutzerimonas stutzeri, 95.0, 88.34, 0.673; GCF_002909485.1, s__Stutzerimonas stutzeri_AH, 95.0, 88.19, 0.688; GCF_000307775.2, s__Stutzerimonas stutzeri_B, 95.0, 86.95, 
0.549; GCF_002890915.1, s__Stutzerimonas stutzeri_AF, 95.0, 85.91, 0.472; GCF_025966695.1, s__Stutzerimonas sp025966695, 95.0, 85.39, 0.44; GCA_000263395.1, s__Stutzerimonas stutzeri_C, 95.0, 85.38, 0.392; GCF_024448505.1, s__Stutzerimonas degradans, 96.08, 85.26, 0.426; GCF_021432765.1, s__Stutzerimonas phenolilytica, 95.0, 85.11, 0.435; GCF_015070855.1, s__Stutzerimonas lopnurensis, 95.0, 85.07, 0.41; GCF_021726475.1, s__Stutzerimonas oligotrophica, 95.0, 84.76, 0.419; GCF_000818015.1, s__Stutzerimonas balearica, 95.0, 83.88, 0.33; GCF_003696285.1, s__Stutzerimonas nitrititolerans, 95.0, 82.51, 0.26; GCF_018138085.1, s__Stutzerimonas stutzeri_AI, 95.0, 82.03, 0.245; GCF_005876855.1, s__Stutzerimonas nosocomialis, 95.0, 81.99, 0.242; GCF_019090095.1, s__Stutzerimonas stutzeri_AN, 95.0, 81.91, 0.245; GCF_013522825.1, s__Stutzerimonas stutzeri_AK, 95.0, 81.91, 0.2; GCA_002339675.1, s__Stutzerimonas stutzeri_O, 95.0, 81.89, 0.253; GCF_019355055.1, s__Stutzerimonas sp004331835, 95.0, 81.83, 0.222; GCF_024448955.1, s__Stutzerimonas stutzeri_AQ, 95.0, 81.79, 0.232; GCF_024448695.1, s__Stutzerimonas stutzeri_T, 95.0, 81.71, 0.242; GCF_022810315.1, s__Stutzerimonas marianensis, 95.0, 81.66, 0.218; GCF_024448935.1, s__Stutzerimonas stutzeri_AO, 95.0, 81.57, 0.177; GCF_009789555.1, s__Stutzerimonas stutzeri_R, 95.0, 81.41, 0.22; GCA_022448005.1, s__Stutzerimonas sp022448005, 95.0, 81.35, 0.194; GCF_003325755.1, s__Stutzerimonas sp003325755, 95.0, 81.28, 0.206; GCA_004010935.1, s__Stutzerimonas sp004010935, 95.0, 81.27, 0.216; GCA_002387205.1, s__Stutzerimonas stutzeri_N, 95.0, 81.26, 0.195; GCF_024448985.1, s__Stutzerimonas stutzeri_AP, 95.0, 81.22, 0.203; GCF_000425625.1, s__Stutzerimonas azotifigens, 95.0, 81.18, 0.187; GCF_000756775.1, s__Stutzerimonas saudiphocaensis, 95.0, 81.13, 0.219; GCF_000952685.1, s__Stutzerimonas stutzeri_E, 95.0, 81.08, 0.216; GCF_000235745.1, s__Stutzerimonas stutzeri_H, 95.0, 81.07, 0.199; GCF_013522725.1, s__Stutzerimonas azotifigens_A, 
95.0, 80.99, 0.203; GCA_900766265.1, s__Stutzerimonas sp900766265, 95.0, 80.94, 0.196; GCF_024448895.1, s__Stutzerimonas stutzeri_Q, 95.0, 80.91, 0.193; GCF_900129835.1, s__Stutzerimonas xanthomarina, 95.0, 80.89, 0.2; GCF_002890895.1, s__Stutzerimonas stutzeri_AB, 95.0, 80.87, 0.198; GCF_019880365.1, s__Stutzerimonas stutzeri_P, 95.0, 80.81, 0.187; GCA_002345575.1, s__Stutzerimonas stutzeri_S, 95.0, 80.74, 0.191; GCF_013620795.1, s__Stutzerimonas sp013620795, 95.0, 80.74, 0.187; GCF_024448715.1, s__Stutzerimonas stutzeri_AR, 95.0, 80.6, 0.18; GCF_000590475.1, s__Stutzerimonas stutzeri_D, 95.0, 80.4, 0.167; GCF_003696365.1, s__Stutzerimonas zhaodongensis, 95.0, 79.95, 0.152 97.72 11 N/A N/A
+NC_021184.fasta d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae GCF_000233715.2 95.0 d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae 100.0 1.0 GCF_000233715.2 95.0 d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae 100.0 1.0 d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__ taxonomic classification defined by topology and ANI topological placement and ANI have congruent species assignments N/A 95.73 11 N/A N/A
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_000913.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_000913.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,50 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_000913.3|provirus_1196867_1213107,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;92.80
+NC_000913.3|provirus_1196867_1213107,RS_GCF_000026225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii,blast,96.90,iPHoP-RF;92.40
+NC_000913.3|provirus_1196867_1213107,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;93.40
+NC_000913.3|provirus_1196867_1213107,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;96.40
+NC_000913.3|provirus_1196867_1213107,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;93.70
+NC_000913.3|provirus_1196867_1213107,RS_GCF_004211955.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp004211955,iPHoP-RF,96.40,None
+NC_000913.3|provirus_1196867_1213107,RS_GCF_005843885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp005843885,iPHoP-RF,96.40,None
+NC_000913.3|provirus_1196867_1213107,RS_GCF_011881725.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_E,iPHoP-RF,96.40,None
+NC_000913.3|provirus_1196867_1213107,RS_GCF_002965065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp002965065,iPHoP-RF,96.10,None
+NC_000913.3|provirus_1196867_1213107,RS_GCF_014836715.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia whittamii,iPHoP-RF,95.10,None
+NC_000913.3|provirus_1412000_1434224,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;93.70
+NC_000913.3|provirus_1412000_1434224,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;93.10
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002075345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter;s__Citrobacter braakii,blast,96.90,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;95.40
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002925905.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Klebsiella;s__Klebsiella michiganensis,blast,96.90,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;95.40
+NC_000913.3|provirus_1412000_1434224,RS_GCF_005843885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp005843885,iPHoP-RF,96.10,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002965065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp002965065,iPHoP-RF,95.40,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_014836715.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia whittamii,iPHoP-RF,95.40,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_000026225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii,iPHoP-RF,95.10,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_011881725.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_E,iPHoP-RF,95.10,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002042885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter;s__Citrobacter portucalensis,blast,94.90,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_004211955.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp004211955,iPHoP-RF,92.40,None
+NC_000913.3|provirus_1627517_1653915,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;95.10
+NC_000913.3|provirus_1627517_1653915,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;96.10
+NC_000913.3|provirus_1627517_1653915,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;96.70
+NC_000913.3|provirus_1627517_1653915,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;96.10
+NC_000913.3|provirus_1627517_1653915,RS_GCF_011881725.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_E,blast,96.90,iPHoP-RF;96.10
+NC_000913.3|provirus_1627517_1653915,RS_GCF_000026225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii,iPHoP-RF,96.40,None
+NC_000913.3|provirus_1627517_1653915,RS_GCF_004211955.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp004211955,iPHoP-RF,96.10,None
+NC_000913.3|provirus_1627517_1653915,RS_GCF_005843885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp005843885,iPHoP-RF,96.10,None
+NC_000913.3|provirus_1627517_1653915,RS_GCF_002965065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp002965065,iPHoP-RF,95.70,None
+NC_000913.3|provirus_1627517_1653915,RS_GCF_014836715.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia whittamii,iPHoP-RF,95.70,None
+NC_000913.3|provirus_2461306_2476510,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;93.10
+NC_000913.3|provirus_2461306_2476510,RS_GCF_000026225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii,blast,96.90,iPHoP-RF;94.40
+NC_000913.3|provirus_2461306_2476510,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;94.10
+NC_000913.3|provirus_2461306_2476510,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;93.40
+NC_000913.3|provirus_2461306_2476510,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;92.80
+NC_000913.3|provirus_2461306_2476510,RS_GCF_011881725.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_E,blast,96.90,iPHoP-RF;96.40
+NC_000913.3|provirus_2461306_2476510,RS_GCF_002965065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp002965065,iPHoP-RF,95.10,None
+NC_000913.3|provirus_2461306_2476510,RS_GCF_004211955.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp004211955,iPHoP-RF,95.10,None
+NC_000913.3|provirus_2461306_2476510,RS_GCF_005843885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp005843885,iPHoP-RF,93.70,None
+NC_000913.3|provirus_2461306_2476510,RS_GCF_014836715.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia whittamii,iPHoP-RF,93.40,None
+NC_000913.3|provirus_563848_584430,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;88.20
+NC_000913.3|provirus_563848_584430,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;89.20
+NC_000913.3|provirus_563848_584430,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;88.50
+NC_000913.3|provirus_563848_584430,RS_GCF_002925905.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Klebsiella;s__Klebsiella michiganensis,blast,96.90,None
+NC_000913.3|provirus_563848_584430,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;87.00
+NC_000913.3|provirus_563848_584430,RS_GCF_002075345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter;s__Citrobacter braakii,blast,96.50,None
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_002737.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_002737.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,133 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000186445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus agalactiae,CRISPR,97.80,blast;91.00 iPHoP-RF;88.90
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900459225.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus dysgalactiae,iPHoP-RF,97.10,blast;96.90
+NC_002737.2|provirus_1186916_1222544,RS_GCF_002055535.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes,blast,96.90,iPHoP-RF;96.40
+NC_002737.2|provirus_1186916_1222544,RS_GCF_022354845.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_AA,CRISPR,96.80,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900459405.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis,CRISPR,96.80,iPHoP-RF;89.50
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900636575.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus canis,iPHoP-RF,96.70,blast;96.60
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000425025.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus castoreus,iPHoP-RF,94.70,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_001598035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halotolerans,iPHoP-RF,93.70,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000154985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus infantarius,iPHoP-RF,93.40,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900475675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus lutetiensis,iPHoP-RF,93.10,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000187265.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equinus,iPHoP-RF,92.80,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900101445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equinus_B,iPHoP-RF,92.80,None
+NC_002737.2|provirus_1186916_1222544,GB_GCA_000283635.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus macedonicus,iPHoP-RF,92.40,None
+NC_002737.2|provirus_1186916_1222544,GB_GCA_934196125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp934196125,iPHoP-RF,92.40,None
+NC_002737.2|provirus_1186916_1222544,GB_GCA_900637675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equi,iPHoP-RF,92.10,blast;62.80
+NC_002737.2|provirus_1186916_1222544,RS_GCF_004843545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pasteurianus,iPHoP-RF,91.80,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_003337175.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus_B,iPHoP-RF,91.40,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_009870755.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halichoeri,iPHoP-RF,91.10,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_002000985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus,iPHoP-RF,90.80,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000188015.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ictaluri,iPHoP-RF,90.50,blast;62.80
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000188055.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus urinalis,iPHoP-RF,90.50,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000960035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus oralis_G,CRISPR,98.60,iPHoP-RF;97.10
+NC_002737.2|provirus_529627_569283,RS_GCF_002055535.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes,CRISPR,98.60,blast;97.50 iPHoP-RF;96.10
+NC_002737.2|provirus_529627_569283,RS_GCF_002093545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus oralis_C,CRISPR,98.60,iPHoP-RF;96.10
+NC_002737.2|provirus_529627_569283,RS_GCF_900636575.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus canis,CRISPR,98.40,iPHoP-RF;97.10 blast;96.70
+NC_002737.2|provirus_529627_569283,RS_GCF_001937065.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp001937065,CRISPR,98.20,iPHoP-RF;96.70
+NC_002737.2|provirus_529627_569283,RS_GCF_902729355.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp902729355,CRISPR,98.10,iPHoP-RF;95.40
+NC_002737.2|provirus_529627_569283,RS_GCF_000186445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus agalactiae,CRISPR,97.60,iPHoP-RF;91.40 blast;67.70
+NC_002737.2|provirus_529627_569283,RS_GCF_000188035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pseudoporcinus,CRISPR,97.60,iPHoP-RF;96.40
+NC_002737.2|provirus_529627_569283,RS_GCF_000220065.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp000220065,iPHoP-RF,97.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000379985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus caballi,iPHoP-RF,97.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000380105.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus orisratti,iPHoP-RF,97.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000380125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ovis,iPHoP-RF,97.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_900459225.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus dysgalactiae,blast,96.90,iPHoP-RF;93.10
+NC_002737.2|provirus_529627_569283,RS_GCF_000423745.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus plurextorum,iPHoP-RF,96.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_002953735.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pluranimalium,iPHoP-RF,96.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_006739205.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus mutans,iPHoP-RF,96.70,None
+NC_002737.2|provirus_529627_569283,GB_GCA_945876895.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp945876895,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000425025.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus castoreus,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_002000985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_002355215.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus troglodytae,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_003337175.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus_B,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_900475415.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus porcinus,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,GB_GCA_900637675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equi,iPHoP-RF,96.10,blast;78.70
+NC_002737.2|provirus_529627_569283,GB_GCA_934196125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp934196125,iPHoP-RF,96.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000420785.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyovaginalis,iPHoP-RF,96.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_004843545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pasteurianus,iPHoP-RF,96.10,None
+NC_002737.2|provirus_529627_569283,GB_GCA_000283635.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus macedonicus,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000423765.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus porci,iPHoP-RF,95.70,blast;72.00
+NC_002737.2|provirus_529627_569283,RS_GCF_003686955.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hillyeri,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_011039275.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis_A,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_012277075.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus alactolyticus,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_900459405.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_901542335.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus porcinus_A,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000187995.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus macacae,iPHoP-RF,95.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000380145.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus thoraltensis,iPHoP-RF,95.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_012396585.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ovuberis,iPHoP-RF,95.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_016908655.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus saliviloxodontae,iPHoP-RF,95.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000188055.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus urinalis,iPHoP-RF,95.10,blast;66.30
+NC_002737.2|provirus_529627_569283,RS_GCF_001598035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halotolerans,iPHoP-RF,95.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_009870755.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halichoeri,iPHoP-RF,95.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_024814375.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp024814375,iPHoP-RF,95.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_011421425.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus catagoni,iPHoP-RF,94.70,blast;66.30
+NC_002737.2|provirus_529627_569283,RS_GCF_000380085.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus merionis,iPHoP-RF,93.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000785785.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus uberis_A,iPHoP-RF,93.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_003674745.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus iniae,iPHoP-RF,93.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_900475595.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus uberis,iPHoP-RF,93.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_019794555.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_AB,iPHoP-RF,91.10,None
+NC_002737.2|provirus_777501_820593,MGYG000003717,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__,CRISPR,98.40,iPHoP-RF;96.70
+NC_002737.2|provirus_777501_820593,RS_GCF_004843545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pasteurianus,CRISPR,98.40,iPHoP-RF;94.10
+NC_002737.2|provirus_777501_820593,GB_GCA_000283635.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus macedonicus,CRISPR,98.30,iPHoP-RF;88.50
+NC_002737.2|provirus_777501_820593,RS_GCF_000186445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus agalactiae,CRISPR,98.30,iPHoP-RF;80.30 blast;76.70
+NC_002737.2|provirus_777501_820593,RS_GCF_002055535.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes,blast,98.00,iPHoP-RF;93.70
+NC_002737.2|provirus_777501_820593,RS_GCF_900636575.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus canis,CRISPR,98.00,blast;96.50 iPHoP-RF;95.40
+NC_002737.2|provirus_777501_820593,RS_GCF_010120595.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus thermophilus,CRISPR,97.90,iPHoP-RF;96.10
+NC_002737.2|provirus_777501_820593,RS_GCF_000220065.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp000220065,iPHoP-RF,97.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_001697145.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus anginosus_C,iPHoP-RF,97.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_009717815.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus parasanguinis_F,iPHoP-RF,97.10,blast;83.70
+NC_002737.2|provirus_777501_820593,RS_GCF_016648925.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp900766505,iPHoP-RF,97.10,blast;83.70
+NC_002737.2|provirus_777501_820593,RS_GCF_900636475.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus anginosus,iPHoP-RF,97.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_902167705.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus constellatus_A,iPHoP-RF,97.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_943193075.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus parasanguinis_E,iPHoP-RF,97.10,blast;83.70
+NC_002737.2|provirus_777501_820593,RS_GCF_900459225.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus dysgalactiae,blast,96.90,iPHoP-RF;95.10
+NC_002737.2|provirus_777501_820593,RS_GCF_000380125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ovis,iPHoP-RF,96.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000423765.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus porci,iPHoP-RF,96.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_001598035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halotolerans,iPHoP-RF,96.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_023109675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus parasanguinis_I,iPHoP-RF,96.70,blast;83.70
+NC_002737.2|provirus_777501_820593,RS_GCF_023167545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus constellatus,iPHoP-RF,96.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000423745.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus plurextorum,iPHoP-RF,96.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_003686955.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hillyeri,iPHoP-RF,96.40,blast;70.10
+NC_002737.2|provirus_777501_820593,RS_GCF_011039275.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis_A,iPHoP-RF,96.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000380025.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus entericus,iPHoP-RF,96.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000380145.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus thoraltensis,iPHoP-RF,96.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_900475675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus lutetiensis,iPHoP-RF,96.10,blast;68.90
+NC_002737.2|provirus_777501_820593,RS_GCF_000154985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus infantarius,iPHoP-RF,95.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000420785.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyovaginalis,iPHoP-RF,95.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000425025.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus castoreus,iPHoP-RF,95.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_002000985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus,iPHoP-RF,95.40,blast;68.90
+NC_002737.2|provirus_777501_820593,GB_GCA_000440235.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_F,iPHoP-RF,95.10,None
+NC_002737.2|provirus_777501_820593,GB_GCA_934196125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp934196125,iPHoP-RF,95.10,None
+NC_002737.2|provirus_777501_820593,GB_GCA_002831545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_P,iPHoP-RF,94.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000785515.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus salivarius,iPHoP-RF,94.70,blast;68.90
+NC_002737.2|provirus_777501_820593,RS_GCF_003337175.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus_B,iPHoP-RF,94.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_900101445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equinus_B,iPHoP-RF,94.70,None
+NC_002737.2|provirus_777501_820593,GB_GCA_945876895.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp945876895,iPHoP-RF,94.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_002760245.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_I,iPHoP-RF,94.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_002953735.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pluranimalium,iPHoP-RF,94.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000380105.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus orisratti,iPHoP-RF,94.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_902702775.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_W,iPHoP-RF,94.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_902729355.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp902729355,iPHoP-RF,94.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000376985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus henryi,iPHoP-RF,93.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_012396585.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ovuberis,iPHoP-RF,93.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_016743335.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_Y,iPHoP-RF,93.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_900459405.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis,iPHoP-RF,93.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000294495.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis,iPHoP-RF,93.40,blast;65.20
+NC_002737.2|provirus_777501_820593,RS_GCF_000380085.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus merionis,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_001302265.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus phocae,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_016908655.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus saliviloxodontae,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_019794555.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_AB,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_021654455.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus parasuis,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,GB_GCA_900637675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equi,iPHoP-RF,93.10,blast;70.70
+NC_002737.2|provirus_777501_820593,RS_GCF_000440115.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_L,iPHoP-RF,93.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_003595525.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus respiraculi,iPHoP-RF,93.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_015594605.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp015594605,iPHoP-RF,92.80,blast;68.90
+NC_002737.2|provirus_777501_820593,RS_GCF_000188055.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus urinalis,iPHoP-RF,92.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_012277075.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus alactolyticus,iPHoP-RF,92.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_001578805.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp001578805,iPHoP-RF,91.80,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000785785.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus uberis_A,iPHoP-RF,91.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_022354845.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_AA,iPHoP-RF,91.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_900475595.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus uberis,iPHoP-RF,91.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_003674745.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus iniae,iPHoP-RF,90.80,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000188035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pseudoporcinus,iPHoP-RF,90.50,None
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_008261.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_008261.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_008261.1|provirus_1070550_1127691,RS_GCF_000013285.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens,blast,97.50,iPHoP-RF;76.60 CRISPR;50.20
+NC_008261.1|provirus_1784095_1821197,RS_GCF_000013285.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens,blast,96.90,CRISPR;93.40 iPHoP-RF;85.40
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_009012.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_009012.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_009012.1|provirus_1938476_1983993,RS_GCF_000015865.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum,blast,94.90,iPHoP-RF;71.30
+NC_009012.1|provirus_2022140_2067593,RS_GCF_000015865.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum,blast,93.90,None
+NC_009012.1|provirus_2931283_2970170,RS_GCF_000015865.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum,blast,91.80,None
+NC_009012.1|provirus_3339258_3389049,RS_GCF_000015865.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum,blast,95.50,iPHoP-RF;69.10
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_014168.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_014168.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_014168.1|provirus_1141631_1162952,RS_GCF_000092825.1,d__Bacteria;p__Actinomycetota;c__Actinomycetia;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus,blast,95.70,iPHoP-RF;68.00
+NC_014168.1|provirus_27479_67296,RS_GCF_000092825.1,d__Bacteria;p__Actinomycetota;c__Actinomycetia;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus,blast,96.00,iPHoP-RF;79.30
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_014212.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_014212.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,9 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_014212.1|provirus_1170297_1209132,RS_GCF_000092125.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Meiothermus_B;s__Meiothermus_B silvanus,blast,95.50,iPHoP-RF;80.80
+NC_014212.1|provirus_1170297_1209132,RS_GCF_003226535.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Meiothermus_B;s__Meiothermus_B sp003226535,blast,92.20,iPHoP-RF;72.60
+NC_014212.1|provirus_1170297_1209132,RS_GCF_000430045.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Calidithermus;s__Calidithermus chliarophilus,blast,90.90,CRISPR;76.20 iPHoP-RF;73.70
+NC_014212.1|provirus_1746722_1764354,RS_GCF_000092125.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Meiothermus_B;s__Meiothermus_B silvanus,blast,95.20,iPHoP-RF;86.00
+NC_014212.1|provirus_1893193_1914973,RS_GCF_000092125.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Meiothermus_B;s__Meiothermus_B silvanus,blast,94.80,iPHoP-RF;66.00
+NC_014212.1|provirus_1893193_1914973,RS_GCF_003574095.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Calidithermus;s__Calidithermus roseus,blast,91.00,None
+NC_014212.1|provirus_1893193_1914973,RS_GCF_000430045.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Calidithermus;s__Calidithermus chliarophilus,blast,90.80,iPHoP-RF;57.10
+NC_014212.1|provirus_1893193_1914973,RS_GCF_000373205.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Calidithermus;s__Calidithermus timidus,blast,90.40,None
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_014364.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_014364.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,7 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_014364.1|provirus_2121424_2157334,RS_GCF_000143985.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae,blast,96.20,CRISPR;95.40 iPHoP-RF;68.40
+NC_014364.1|provirus_2121424_2157334,RS_GCF_000378205.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta bajacaliforniensis,CRISPR,93.40,blast;91.30 iPHoP-RF;63.50
+NC_014364.1|provirus_2329685_2350621,RS_GCF_000143985.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae,blast,95.70,iPHoP-RF;65.10
+NC_014364.1|provirus_2329685_2350621,RS_GCF_000378205.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta bajacaliforniensis,blast,92.10,iPHoP-RF;52.80
+NC_014364.1|provirus_2666253_2703772,RS_GCF_000143985.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae,blast,96.20,CRISPR;74.20 iPHoP-RF;72.60
+NC_014364.1|provirus_2976748_3014759,RS_GCF_000143985.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae,blast,96.20,iPHoP-RF;69.80
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_015761.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_015761.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,21 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_015761.1|provirus_1007223_1045009,GB_GCA_900446925.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter_B;s__Citrobacter_B koseri,blast,96.90,iPHoP-RF;83.30
+NC_015761.1|provirus_1007223_1045009,GB_GCA_900478215.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella houtenae,blast,96.90,iPHoP-RF;90.80
+NC_015761.1|provirus_1007223_1045009,RS_GCF_000006945.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella enterica,blast,96.90,iPHoP-RF;88.50
+NC_015761.1|provirus_1007223_1045009,RS_GCF_000252995.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori,blast,96.90,iPHoP-RF;91.10
+NC_015761.1|provirus_1007223_1045009,RS_GCF_008692785.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella diarizonae,blast,96.90,iPHoP-RF;93.40
+NC_015761.1|provirus_1007223_1045009,RS_GCF_008692845.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella arizonae,blast,96.90,iPHoP-RF;90.50
+NC_015761.1|provirus_1007223_1045009,RS_GCF_006874705.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Leclercia;s__Leclercia adecarboxylata_C,blast,91.00,None
+NC_015761.1|provirus_3084741_3115735,RS_GCF_000006945.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella enterica,CRISPR,98.50,blast;96.80 iPHoP-RF;89.80
+NC_015761.1|provirus_3084741_3115735,RS_GCF_008692785.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella diarizonae,CRISPR,98.10,iPHoP-RF;90.80
+NC_015761.1|provirus_3084741_3115735,RS_GCF_000252995.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori,blast,96.90,iPHoP-RF;90.10
+NC_015761.1|provirus_3084741_3115735,RS_GCF_002918555.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter_C;s__Citrobacter_C amalonaticus_A,blast,93.20,None
+NC_015761.1|provirus_3084741_3115735,GB_GCA_900446925.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter_B;s__Citrobacter_B koseri,iPHoP-RF,92.10,CRISPR;67.50
+NC_015761.1|provirus_847397_862760,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;88.90
+NC_015761.1|provirus_847397_862760,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.30,iPHoP-RF;86.70
+NC_015761.1|provirus_847397_862760,RS_GCF_001729745.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Enterobacter;s__Enterobacter hormaechei_A,blast,96.20,iPHoP-RF;73.00
+NC_015761.1|provirus_847397_862760,RS_GCF_000252995.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori,blast,93.90,iPHoP-RF;71.50
+NC_015761.1|provirus_847397_862760,GB_GCA_900478215.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella houtenae,blast,91.90,iPHoP-RF;73.70
+NC_015761.1|provirus_847397_862760,RS_GCF_000006945.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella enterica,blast,91.70,iPHoP-RF;88.50
+NC_015761.1|provirus_847397_862760,RS_GCF_008692845.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella arizonae,blast,91.70,iPHoP-RF;84.50
+NC_015761.1|provirus_847397_862760,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,90.00,iPHoP-RF;87.00
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_017033.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_017033.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_017033.1|provirus_1052334_1094910,RS_GCF_000242255.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia,blast,98.40,None
+NC_017033.1|provirus_1557694_1600481,RS_GCF_000242255.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia,blast,98.40,iPHoP-RF;64.30
+NC_017033.1|provirus_2089294_2107522,RS_GCF_000242255.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia,blast,95.20,None
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_018068.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_018068.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,13 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_018068.1|provirus_1361108_1399802,RS_GCF_000255115.2,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus,blast,96.40,iPHoP-RF;53.60
+NC_018068.1|provirus_1361108_1399802,RS_GCF_001707885.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp001707885,iPHoP-RF,95.40,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_001936615.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus metallidurans,iPHoP-RF,95.40,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_000224515.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp000224515,iPHoP-RF,95.10,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_000960765.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp000960765,iPHoP-RF,93.40,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_004766055.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp004766055,iPHoP-RF,93.10,None
+NC_018068.1|provirus_1361108_1399802,3300011997_21,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__,iPHoP-RF,92.10,None
+NC_018068.1|provirus_1361108_1399802,GB_GCA_002404215.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp002404215,iPHoP-RF,91.80,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_001029285.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acididurans,blast,91.80,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_002196705.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp002196705,blast,91.20,iPHoP-RF;78.30
+NC_018068.1|provirus_1361108_1399802,GB_GCA_900290375.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus infrequens,blast,90.30,iPHoP-RF;73.50
+NC_018068.1|provirus_2072558_2098541,RS_GCF_000255115.2,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus,blast,93.60,iPHoP-RF;69.50
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_018515.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_018515.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,22 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_018515.1|provirus_3418112_3436097,RS_GCF_000231385.2,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei,blast,95.90,iPHoP-RF;79.80
+NC_018515.1|provirus_3418112_3436097,RS_GCF_004766055.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp004766055,iPHoP-RF,95.70,None
+NC_018515.1|provirus_3418112_3436097,GB_GCA_002404215.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp002404215,iPHoP-RF,95.10,None
+NC_018515.1|provirus_3418112_3436097,3300011997_21,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__,iPHoP-RF,94.70,None
+NC_018515.1|provirus_3418112_3436097,GB_GCA_021779415.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp021779415,iPHoP-RF,92.80,None
+NC_018515.1|provirus_3418112_3436097,RS_GCF_023897015.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus nitroreducens,blast,91.80,iPHoP-RF;73.20
+NC_018515.1|provirus_3418112_3436097,GB_GCA_003132105.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp003132105,iPHoP-RF,91.40,None
+NC_018515.1|provirus_3418112_3436097,RS_GCF_020595055.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp020595055,blast,91.40,iPHoP-RF;74.10
+NC_018515.1|provirus_3418112_3436097,RS_GCF_000235605.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus orientis,blast,90.70,iPHoP-RF;73.00
+NC_018515.1|provirus_3418112_3436097,RS_GCF_900100785.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus hippei,blast,90.30,iPHoP-RF;71.70
+NC_018515.1|provirus_4659544_4694673,RS_GCF_000231385.2,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei,blast,96.40,iPHoP-RF;77.30
+NC_018515.1|provirus_4659544_4694673,RS_GCF_023897015.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus nitroreducens,blast,95.70,iPHoP-RF;86.00
+NC_018515.1|provirus_4659544_4694673,GB_GCA_002404215.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp002404215,iPHoP-RF,94.40,None
+NC_018515.1|provirus_4659544_4694673,GB_GCA_900290375.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus infrequens,iPHoP-RF,94.40,None
+NC_018515.1|provirus_4659544_4694673,3300011997_21,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__,iPHoP-RF,94.10,None
+NC_018515.1|provirus_4659544_4694673,RS_GCF_900100785.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus hippei,blast,93.30,iPHoP-RF;73.50
+NC_018515.1|provirus_4659544_4694673,GB_GCA_003132105.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp003132105,iPHoP-RF,92.40,None
+NC_018515.1|provirus_4659544_4694673,GB_GCA_016278585.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp016278585,iPHoP-RF,92.10,None
+NC_018515.1|provirus_4659544_4694673,RS_GCF_001707885.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp001707885,blast,90.80,iPHoP-RF;85.70
+NC_018515.1|provirus_4659544_4694673,RS_GCF_000244895.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus youngiae,blast,90.40,iPHoP-RF;83.30
+NC_018515.1|provirus_4659544_4694673,RS_GCF_001029285.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acididurans,blast,90.40,iPHoP-RF;85.70
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_019936.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_019936.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,45 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_019936.1|provirus_2347508_2361929,RS_GCF_015291885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AC,CRISPR,97.40,blast;95.00 iPHoP-RF;87.30
+NC_019936.1|provirus_2347508_2361929,RS_GCF_003640395.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas urumqiensis,CRISPR,96.90,iPHoP-RF;51.70
+NC_019936.1|provirus_2347508_2361929,RS_GCF_000219605.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri,blast,96.10,CRISPR;90.50 iPHoP-RF;84.20
+NC_019936.1|provirus_2347508_2361929,RS_GCF_000327065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE,blast,95.90,iPHoP-RF;69.30
+NC_019936.1|provirus_2347508_2361929,RS_GCF_002929225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_U,blast,94.10,iPHoP-RF;89.50
+NC_019936.1|provirus_2347508_2361929,RS_GCF_003935375.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas xanthomarina_A,blast,94.10,iPHoP-RF;86.70 CRISPR;82.70
+NC_019936.1|provirus_2347508_2361929,GB_GCA_007713455.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp007713455,blast,93.10,iPHoP-RF;77.10
+NC_019936.1|provirus_2347508_2361929,RS_GCF_021432085.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis_A,blast,93.00,iPHoP-RF;89.20
+NC_019936.1|provirus_2347508_2361929,RS_GCF_000341615.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_G,blast,91.80,iPHoP-RF;75.00
+NC_019936.1|provirus_2347508_2361929,RS_GCF_003696285.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas nitrititolerans,blast,90.60,iPHoP-RF;51.50
+NC_019936.1|provirus_2347508_2361929,RS_GCF_015070855.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas lopnurensis,blast,90.10,iPHoP-RF;73.50
+NC_019936.1|provirus_3233292_3242961,RS_GCF_003696285.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas nitrititolerans,blast,96.90,iPHoP-RF;70.40
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000219605.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri,blast,96.80,iPHoP-RF;95.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000495915.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas chloritidismutans,blast,96.80,iPHoP-RF;88.90
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000818015.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas balearica,blast,96.80,iPHoP-RF;65.30
+NC_019936.1|provirus_3233292_3242961,RS_GCF_002929225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_U,blast,96.80,iPHoP-RF;92.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_003935375.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas xanthomarina_A,blast,96.80,iPHoP-RF;88.90
+NC_019936.1|provirus_3233292_3242961,RS_GCF_900114065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis,blast,96.80,iPHoP-RF;92.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_002890795.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AA,iPHoP-RF,96.70,blast;91.70
+NC_019936.1|provirus_3233292_3242961,RS_GCF_015291885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AC,blast,96.70,iPHoP-RF;93.70
+NC_019936.1|provirus_3233292_3242961,RS_GCF_021432085.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis_A,blast,96.70,iPHoP-RF;93.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_003696315.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas songnenensis,blast,96.20,iPHoP-RF;94.70
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000327065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE,blast,95.70,iPHoP-RF;94.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_002909485.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AH,blast,94.30,iPHoP-RF;91.80
+NC_019936.1|provirus_3233292_3242961,RS_GCF_014764705.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp002692525,iPHoP-RF,92.40,None
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000661915.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_A,iPHoP-RF,92.10,blast;91.90
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000935215.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AD,iPHoP-RF,91.10,None
+NC_019936.1|provirus_4295725_4304306,RS_GCF_003696285.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas nitrititolerans,blast,96.90,iPHoP-RF;85.40
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000219605.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri,blast,96.80,iPHoP-RF;96.10
+NC_019936.1|provirus_4295725_4304306,RS_GCF_015291885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AC,blast,96.60,iPHoP-RF;96.10
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000818015.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas balearica,blast,96.20,iPHoP-RF;85.70
+NC_019936.1|provirus_4295725_4304306,RS_GCF_002909485.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AH,iPHoP-RF,95.70,blast;92.80
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000495915.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas chloritidismutans,iPHoP-RF,94.10,blast;89.90
+NC_019936.1|provirus_4295725_4304306,RS_GCF_002929225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_U,iPHoP-RF,94.10,blast;89.90
+NC_019936.1|provirus_4295725_4304306,RS_GCF_003935375.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas xanthomarina_A,iPHoP-RF,94.10,blast;90.30
+NC_019936.1|provirus_4295725_4304306,RS_GCF_003696315.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas songnenensis,blast,93.90,iPHoP-RF;86.30
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000327065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE,blast,93.80,iPHoP-RF;85.70
+NC_019936.1|provirus_4295725_4304306,RS_GCF_014764705.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp002692525,iPHoP-RF,93.70,None
+NC_019936.1|provirus_4295725_4304306,RS_GCF_900114065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis,iPHoP-RF,93.70,blast;91.00
+NC_019936.1|provirus_4295725_4304306,GB_GCA_003488145.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp003488145,iPHoP-RF,93.40,None
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000935215.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AD,iPHoP-RF,92.40,blast;90.60
+NC_019936.1|provirus_4295725_4304306,RS_GCF_021432085.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis_A,iPHoP-RF,92.40,blast;89.90
+NC_019936.1|provirus_4295725_4304306,GB_GCA_007713455.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp007713455,iPHoP-RF,91.80,None
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000661915.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_A,blast,91.70,iPHoP-RF;83.10
diff -r 000000000000 -r 315c2ed31af1 test-data/iphop_host_prediction_to_genome/NC_021184.fasta.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_021184.fasta.csv Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,9 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_021184.1|provirus_19778_35564,RS_GCF_000233715.2,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae,blast,95.50,iPHoP-RF;84.20
+NC_021184.1|provirus_19778_35564,RS_GCF_008124625.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum thermosapovorans,iPHoP-RF,93.40,blast;90.30
+NC_021184.1|provirus_19778_35564,GB_GCA_016841645.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum geothermicum_B,blast,90.90,iPHoP-RF;74.80
+NC_021184.1|provirus_19778_35564,GB_GCA_016841205.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum geothermicum_A,blast,90.60,iPHoP-RF;70.90
+NC_021184.1|provirus_19778_35564,GB_GCA_016841905.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum geothermicum_C,blast,90.40,iPHoP-RF;51.20
+NC_021184.1|provirus_19778_35564,RS_GCF_009932395.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum syntrophicum,blast,90.30,iPHoP-RF;83.30
+NC_021184.1|provirus_4466413_4519129,RS_GCF_000233715.2,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae,blast,98.40,iPHoP-RF;68.90
+NC_021184.1|provirus_4563831_4615358,RS_GCF_000233715.2,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae,blast,98.20,iPHoP-RF;76.80
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_000913.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_000913.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
+NC_000913.3|provirus_1196867_1213107_23 NC_000913.3|provirus_1196867_1213107 K00031 "IDH1, IDH2, icd; isocitrate dehydrogenase [EC:1.1.1.42]" PF00180.20 Isocitrate/isopropylmalate dehydrogenase
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_002737.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_002737.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
+NC_002737.2|provirus_777501_820593_1 NC_002737.2|provirus_777501_820593 K01710 "E4.2.1.46, rfbB, rffG; dTDP-glucose 4,6-dehydratase [EC:4.2.1.46]" PF16363.5 "GDP-mannose 4,6 dehydratase"
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_003450.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_008261.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_008261.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_009012.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_009012.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
+NC_009012.1|provirus_2022140_2067593_32 NC_009012.1|provirus_2022140_2067593 K00558 "DNMT1, dcm; DNA (cytosine-5)-methyltransferase 1 [EC:2.1.1.37]" PF00145.17 C-5 cytosine-specific DNA methylase
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_012982.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_014008.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_014168.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_014168.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
+NC_014168.1|provirus_1141631_1162952_17 NC_014168.1|provirus_1141631_1162952 K00558 "DNMT1, dcm; DNA (cytosine-5)-methyltransferase 1 [EC:2.1.1.37]" PF00145.17 C-5 cytosine-specific DNA methylase
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_014211.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_014212.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_014212.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_014363.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_014364.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_014364.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
+NC_014364.1|provirus_2666253_2703772_28 NC_014364.1|provirus_2666253_2703772 K00390 cysH; phosphoadenosine phosphosulfate reductase [EC:1.8.4.8 1.8.4.10] PF01507.19 Phosphoadenosine phosphosulfate reductase family
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_015761.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_015761.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_017033.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_017033.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
+NC_017033.1|provirus_1557694_1600481_7 NC_017033.1|provirus_1557694_1600481 K00558 "DNMT1, dcm; DNA (cytosine-5)-methyltransferase 1 [EC:2.1.1.37]" PF00145.17 C-5 cytosine-specific DNA methylase
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_017095.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_018014.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_018068.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_018068.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_018515.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_018515.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
+NC_018515.1|provirus_4659544_4694673_38 NC_018515.1|provirus_4659544_4694673 K06167 "phnP; phosphoribosyl 1,2-cyclic phosphate phosphodiesterase [EC:3.1.4.55]" PF00753.27 Metallo-beta-lactamase superfamily
+NC_018515.1|provirus_3418112_3436097_1 NC_018515.1|provirus_3418112_3436097 K00106 XDH; xanthine dehydrogenase/oxidase [EC:1.17.1.4 1.17.3.2] PF02738.18 Molybdopterin-binding domain of aldehyde dehydrogenase
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_019897.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_019904.fasta.tabular
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_019936.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_019936.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name
diff -r 000000000000 -r 315c2ed31af1 test-data/vibrant_amg_individuals/NC_021184.fasta.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_021184.fasta.tabular Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein scaffold AMG KO AMG KO name Pfam Pfam name