changeset 0:315c2ed31af1 draft

planemo upload for repository https://github.com/Helmholtz-UFZ/ufz-galaxy-tools/blob/main/tools/phi-toolkit commit 45c746567f48e6c9bcc19ba4e94e87348df3ac7a
author ufz
date Wed, 04 Jun 2025 17:36:40 +0000
parents
children 3a7f73d638ba
files phitk.xml report.Rmd test-data/abricate_results/NC_000913.fasta.tabular test-data/abricate_results/NC_002737.fasta.tabular test-data/abricate_results/NC_008261.fasta.tabular test-data/abricate_results/NC_009012.fasta.tabular test-data/abricate_results/NC_014168.fasta.tabular test-data/abricate_results/NC_014212.fasta.tabular test-data/abricate_results/NC_014364.fasta.tabular test-data/abricate_results/NC_015761.fasta.tabular test-data/abricate_results/NC_017033.fasta.tabular test-data/abricate_results/NC_018068.fasta.tabular test-data/abricate_results/NC_018515.fasta.tabular test-data/abricate_results/NC_019936.fasta.tabular test-data/abricate_results/NC_021184.fasta.tabular test-data/checkm2.Quality_report.tabular test-data/checkv_quality_summary/NC_000913.fasta.tabular test-data/checkv_quality_summary/NC_002737.fasta.tabular test-data/checkv_quality_summary/NC_003450.fasta.tabular test-data/checkv_quality_summary/NC_008261.fasta.tabular test-data/checkv_quality_summary/NC_009012.fasta.tabular test-data/checkv_quality_summary/NC_012982.fasta.tabular test-data/checkv_quality_summary/NC_014008.fasta.tabular test-data/checkv_quality_summary/NC_014168.fasta.tabular test-data/checkv_quality_summary/NC_014211.fasta.tabular test-data/checkv_quality_summary/NC_014212.fasta.tabular test-data/checkv_quality_summary/NC_014363.fasta.tabular test-data/checkv_quality_summary/NC_014364.fasta.tabular test-data/checkv_quality_summary/NC_015761.fasta.tabular test-data/checkv_quality_summary/NC_017033.fasta.tabular test-data/checkv_quality_summary/NC_017095.fasta.tabular test-data/checkv_quality_summary/NC_018014.fasta.tabular test-data/checkv_quality_summary/NC_018068.fasta.tabular test-data/checkv_quality_summary/NC_018515.fasta.tabular test-data/checkv_quality_summary/NC_019897.fasta.tabular test-data/checkv_quality_summary/NC_019904.fasta.tabular test-data/checkv_quality_summary/NC_019936.fasta.tabular test-data/checkv_quality_summary/NC_021184.fasta.tabular 
test-data/defense_finder_systems/NC_000913.fasta.tabular test-data/defense_finder_systems/NC_002737.fasta.tabular test-data/defense_finder_systems/NC_003450.fasta.tabular test-data/defense_finder_systems/NC_008261.fasta.tabular test-data/defense_finder_systems/NC_009012.fasta.tabular test-data/defense_finder_systems/NC_012982.fasta.tabular test-data/defense_finder_systems/NC_014008.fasta.tabular test-data/defense_finder_systems/NC_014168.fasta.tabular test-data/defense_finder_systems/NC_014211.fasta.tabular test-data/defense_finder_systems/NC_014212.fasta.tabular test-data/defense_finder_systems/NC_014363.fasta.tabular test-data/defense_finder_systems/NC_014364.fasta.tabular test-data/defense_finder_systems/NC_015761.fasta.tabular test-data/defense_finder_systems/NC_017033.fasta.tabular test-data/defense_finder_systems/NC_017095.fasta.tabular test-data/defense_finder_systems/NC_018014.fasta.tabular test-data/defense_finder_systems/NC_018068.fasta.tabular test-data/defense_finder_systems/NC_018515.fasta.tabular test-data/defense_finder_systems/NC_019897.fasta.tabular test-data/defense_finder_systems/NC_019904.fasta.tabular test-data/defense_finder_systems/NC_019936.fasta.tabular test-data/defense_finder_systems/NC_021184.fasta.tabular test-data/drep_compare/NC_000913.fasta.csv test-data/drep_compare/NC_002737.fasta.csv test-data/drep_compare/NC_008261.fasta.csv test-data/drep_compare/NC_009012.fasta.csv test-data/drep_compare/NC_014168.fasta.csv test-data/drep_compare/NC_014212.fasta.csv test-data/drep_compare/NC_014364.fasta.csv test-data/drep_compare/NC_015761.fasta.csv test-data/drep_compare/NC_017033.fasta.csv test-data/drep_compare/NC_018068.fasta.csv test-data/drep_compare/NC_018515.fasta.csv test-data/drep_compare/NC_019936.fasta.csv test-data/drep_compare/NC_021184.fasta.csv test-data/drep_compare_clustering_dendrogram/NC_000913.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_002737.fasta.pdf 
test-data/drep_compare_clustering_dendrogram/NC_008261.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_009012.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_014168.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_014212.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_014364.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_015761.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_017033.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_018068.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_018515.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_019936.fasta.pdf test-data/drep_compare_clustering_dendrogram/NC_021184.fasta.pdf test-data/genomad_virus_fasta/NC_000913.fasta.fasta test-data/genomad_virus_fasta/NC_002737.fasta.fasta test-data/genomad_virus_fasta/NC_003450.fasta.fasta test-data/genomad_virus_fasta/NC_008261.fasta.fasta test-data/genomad_virus_fasta/NC_009012.fasta.fasta test-data/genomad_virus_fasta/NC_012982.fasta.fasta test-data/genomad_virus_fasta/NC_014008.fasta.fasta test-data/genomad_virus_fasta/NC_014168.fasta.fasta test-data/genomad_virus_fasta/NC_014211.fasta.fasta test-data/genomad_virus_fasta/NC_014212.fasta.fasta test-data/genomad_virus_fasta/NC_014363.fasta.fasta test-data/genomad_virus_fasta/NC_014364.fasta.fasta test-data/genomad_virus_fasta/NC_015761.fasta.fasta test-data/genomad_virus_fasta/NC_017033.fasta.fasta test-data/genomad_virus_fasta/NC_017095.fasta.fasta test-data/genomad_virus_fasta/NC_018014.fasta.fasta test-data/genomad_virus_fasta/NC_018068.fasta.fasta test-data/genomad_virus_fasta/NC_018515.fasta.fasta test-data/genomad_virus_fasta/NC_019897.fasta.fasta test-data/genomad_virus_fasta/NC_019904.fasta.fasta test-data/genomad_virus_fasta/NC_019936.fasta.fasta test-data/genomad_virus_fasta/NC_021184.fasta.fasta test-data/genomad_virus_genes/NC_000913.fasta.tabular test-data/genomad_virus_genes/NC_002737.fasta.tabular 
test-data/genomad_virus_genes/NC_003450.fasta.tabular test-data/genomad_virus_genes/NC_008261.fasta.tabular test-data/genomad_virus_genes/NC_009012.fasta.tabular test-data/genomad_virus_genes/NC_012982.fasta.tabular test-data/genomad_virus_genes/NC_014008.fasta.tabular test-data/genomad_virus_genes/NC_014168.fasta.tabular test-data/genomad_virus_genes/NC_014211.fasta.tabular test-data/genomad_virus_genes/NC_014212.fasta.tabular test-data/genomad_virus_genes/NC_014363.fasta.tabular test-data/genomad_virus_genes/NC_014364.fasta.tabular test-data/genomad_virus_genes/NC_015761.fasta.tabular test-data/genomad_virus_genes/NC_017033.fasta.tabular test-data/genomad_virus_genes/NC_017095.fasta.tabular test-data/genomad_virus_genes/NC_018014.fasta.tabular test-data/genomad_virus_genes/NC_018068.fasta.tabular test-data/genomad_virus_genes/NC_018515.fasta.tabular test-data/genomad_virus_genes/NC_019897.fasta.tabular test-data/genomad_virus_genes/NC_019904.fasta.tabular test-data/genomad_virus_genes/NC_019936.fasta.tabular test-data/genomad_virus_genes/NC_021184.fasta.tabular test-data/genomad_virus_summary/NC_000913.fasta.tabular test-data/genomad_virus_summary/NC_002737.fasta.tabular test-data/genomad_virus_summary/NC_003450.fasta.tabular test-data/genomad_virus_summary/NC_008261.fasta.tabular test-data/genomad_virus_summary/NC_009012.fasta.tabular test-data/genomad_virus_summary/NC_012982.fasta.tabular test-data/genomad_virus_summary/NC_014008.fasta.tabular test-data/genomad_virus_summary/NC_014168.fasta.tabular test-data/genomad_virus_summary/NC_014211.fasta.tabular test-data/genomad_virus_summary/NC_014212.fasta.tabular test-data/genomad_virus_summary/NC_014363.fasta.tabular test-data/genomad_virus_summary/NC_014364.fasta.tabular test-data/genomad_virus_summary/NC_015761.fasta.tabular test-data/genomad_virus_summary/NC_017033.fasta.tabular test-data/genomad_virus_summary/NC_017095.fasta.tabular test-data/genomad_virus_summary/NC_018014.fasta.tabular 
test-data/genomad_virus_summary/NC_018068.fasta.tabular test-data/genomad_virus_summary/NC_018515.fasta.tabular test-data/genomad_virus_summary/NC_019897.fasta.tabular test-data/genomad_virus_summary/NC_019904.fasta.tabular test-data/genomad_virus_summary/NC_019936.fasta.tabular test-data/genomad_virus_summary/NC_021184.fasta.tabular test-data/gtdbtk.bac120.summary test-data/iphop_host_prediction_to_genome/NC_000913.fasta.csv test-data/iphop_host_prediction_to_genome/NC_002737.fasta.csv test-data/iphop_host_prediction_to_genome/NC_008261.fasta.csv test-data/iphop_host_prediction_to_genome/NC_009012.fasta.csv test-data/iphop_host_prediction_to_genome/NC_014168.fasta.csv test-data/iphop_host_prediction_to_genome/NC_014212.fasta.csv test-data/iphop_host_prediction_to_genome/NC_014364.fasta.csv test-data/iphop_host_prediction_to_genome/NC_015761.fasta.csv test-data/iphop_host_prediction_to_genome/NC_017033.fasta.csv test-data/iphop_host_prediction_to_genome/NC_018068.fasta.csv test-data/iphop_host_prediction_to_genome/NC_018515.fasta.csv test-data/iphop_host_prediction_to_genome/NC_019936.fasta.csv test-data/iphop_host_prediction_to_genome/NC_021184.fasta.csv test-data/vibrant_amg_individuals/NC_000913.fasta.tabular test-data/vibrant_amg_individuals/NC_002737.fasta.tabular test-data/vibrant_amg_individuals/NC_003450.fasta.tabular test-data/vibrant_amg_individuals/NC_008261.fasta.tabular test-data/vibrant_amg_individuals/NC_009012.fasta.tabular test-data/vibrant_amg_individuals/NC_012982.fasta.tabular test-data/vibrant_amg_individuals/NC_014008.fasta.tabular test-data/vibrant_amg_individuals/NC_014168.fasta.tabular test-data/vibrant_amg_individuals/NC_014211.fasta.tabular test-data/vibrant_amg_individuals/NC_014212.fasta.tabular test-data/vibrant_amg_individuals/NC_014363.fasta.tabular test-data/vibrant_amg_individuals/NC_014364.fasta.tabular test-data/vibrant_amg_individuals/NC_015761.fasta.tabular test-data/vibrant_amg_individuals/NC_017033.fasta.tabular 
test-data/vibrant_amg_individuals/NC_017095.fasta.tabular test-data/vibrant_amg_individuals/NC_018014.fasta.tabular test-data/vibrant_amg_individuals/NC_018068.fasta.tabular test-data/vibrant_amg_individuals/NC_018515.fasta.tabular test-data/vibrant_amg_individuals/NC_019897.fasta.tabular test-data/vibrant_amg_individuals/NC_019904.fasta.tabular test-data/vibrant_amg_individuals/NC_019936.fasta.tabular test-data/vibrant_amg_individuals/NC_021184.fasta.tabular
diffstat 161 files changed, 24224 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/phitk.xml	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,247 @@
+<tool id="phi_toolkit_report" name="PHI toolkit report" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="20.01" license="MIT">
+    <description></description>
+    <macros>
+        <token name="@TOOL_VERSION@">0.1.0</token>
+        <token name="@VERSION_SUFFIX@">0</token>
+
+        <!-- One genome collection element downloaded from the Zenodo record.
+             The remote file name is derived from the element id so that every
+             element fetches its own genome instead of the same fixed file. -->
+        <xml name="zenodo_collection_element" tokens="id">
+            <element name="@ID@" location="https://zenodo.org/records/15594463/files/@ID@.fasta.fasta?download=1" value="genomes/@ID@.fasta.fasta" ftype="fasta"/>
+        </xml>
+
+        <!-- One collection element backed by a local test-data file named
+             FOLDER/ID.fasta.EXT; EXT is also used as the element's datatype. -->
+        <xml name="test_collection_element" tokens="id,folder,ext">
+            <element name="@ID@" value="@FOLDER@/@ID@.fasta.@EXT@" ftype="@EXT@"/>
+        </xml>
+        <!-- List collection test parameter holding the 13 base sample ids.
+             Further elements can be appended by the caller through the yield slot. -->
+        <xml name="test_collection_non_empty" tokens="name,folder,ext">
+            <param name="@NAME@">
+                <collection type="list">
+                    <expand macro="test_collection_element" id="NC_000913" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_002737" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_008261" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_009012" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_014168" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_014212" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_014364" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_015761" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_017033" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_018068" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_018515" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_019936" folder="@FOLDER@" ext="@EXT@"/>
+                    <expand macro="test_collection_element" id="NC_021184" folder="@FOLDER@" ext="@EXT@"/>
+                    <!-- extra elements supplied by the expanding macro are inserted here -->
+                    <yield/>
+                </collection>
+            </param>
+        </xml>
+        <!-- Full 22-element collection: the 13 ids of test_collection_non_empty
+             plus the nine additional ids below, injected through its yield slot. -->
+        <xml name="test_collection" tokens="name,folder,ext">
+            <expand macro="test_collection_non_empty" name="@NAME@" folder="@FOLDER@" ext="@EXT@">
+                <expand macro="test_collection_element" id="NC_003450" folder="@FOLDER@" ext="@EXT@"/>
+                <expand macro="test_collection_element" id="NC_012982" folder="@FOLDER@" ext="@EXT@"/>
+                <expand macro="test_collection_element" id="NC_014008" folder="@FOLDER@" ext="@EXT@"/>
+                <expand macro="test_collection_element" id="NC_014211" folder="@FOLDER@" ext="@EXT@"/>
+                <expand macro="test_collection_element" id="NC_014363" folder="@FOLDER@" ext="@EXT@"/>
+                <expand macro="test_collection_element" id="NC_017095" folder="@FOLDER@" ext="@EXT@"/>
+                <expand macro="test_collection_element" id="NC_018014" folder="@FOLDER@" ext="@EXT@"/>
+                <expand macro="test_collection_element" id="NC_019897" folder="@FOLDER@" ext="@EXT@"/>
+                <expand macro="test_collection_element" id="NC_019904" folder="@FOLDER@" ext="@EXT@"/>
+            </expand>
+        </xml>
+        
+    </macros>
+    <!-- TODO <xrefs>
+        <xref type="bio.tools"></xref>
+    </xrefs> -->
+    <!-- R / Bioconductor packages needed to render report.Rmd.
+         NOTE(review): report.Rmd also attaches circlize, fs and scales, which are
+         not pinned here; presumably they arrive as dependencies of the packages
+         below. Confirm against the resolved environment. -->
+    <requirements>
+        <requirement type="package" version="2.74.0">bioconductor-biostrings</requirement>
+        <requirement type="package" version="1.58.0">bioconductor-genomicranges</requirement>
+        <requirement type="package" version="1.18.0">bioconductor-gmoviz</requirement>
+        <requirement type="package" version="0.2.1">r-formattable</requirement>
+        <requirement type="package" version="1.0.1">r-here</requirement>
+        <requirement type="package" version="2.2.1">r-janitor</requirement>
+        <requirement type="package" version="1.4.0">r-kableextra</requirement>
+        <requirement type="package" version="1.3.0">r-patchwork</requirement>
+        <requirement type="package" version="2.0.0">r-tidyverse</requirement>
+        <requirement type="package" version="2.0.2">r-base64</requirement>
+        <requirement type="package" version="3.5.0">r-pdftools</requirement>
+    </requirements>
+    <command detect_errors="exit_code"><![CDATA[
+        ## Stage every input as a symlink inside ./data, using the directory and
+        ## file names that report.Rmd reads (its outdir parameter defaults to data),
+        ## then render the report and copy it to the output dataset.
+        ## Per-sample folders are named after the collection element identifier.
+       mkdir -p data/genomes &&
+        #for e in $genomes
+            ln -s '$e' 'data/genomes/${e.element_identifier}.fna' &&
+        #end for
+
+        mkdir -p data/host_analyses &&
+        mkdir -p data/virus_analyses &&
+
+        ## checkm
+        mkdir -p data/host_analyses/checkm2 &&
+        ln -s '$checkm' data/host_analyses/checkm2/quality_report.tsv &&
+
+        ## defense-finder inputs
+        mkdir -p data/host_analyses/defense-finder &&
+        #for e in $defense_finder
+            mkdir -p 'data/host_analyses/defense-finder/${e.element_identifier}/' &&
+            ln -s '$e' 'data/host_analyses/defense-finder/${e.element_identifier}/${e.element_identifier}_defense_finder_systems.tsv' &&
+        #end for
+
+        ## genomad inputs
+        mkdir -p data/host_analyses/genomad &&
+        #for e in $genomad
+            mkdir -p 'data/host_analyses/genomad/${e.element_identifier}/${e.element_identifier}_summary/' &&
+            ln -s '$e' 'data/host_analyses/genomad/${e.element_identifier}/${e.element_identifier}_summary/${e.element_identifier}_virus_summary.tsv' &&
+        #end for
+        #for e in $genomad_phages
+            mkdir -p 'data/host_analyses/genomad/${e.element_identifier}/${e.element_identifier}_summary/' &&
+            ln -s '$e' 'data/host_analyses/genomad/${e.element_identifier}/${e.element_identifier}_summary/${e.element_identifier}_virus.fna' &&
+        #end for
+        #for e in $genomad_annotations
+            mkdir -p 'data/host_analyses/genomad/${e.element_identifier}/${e.element_identifier}_summary/' &&
+            ln -s '$e' 'data/host_analyses/genomad/${e.element_identifier}/${e.element_identifier}_summary/${e.element_identifier}_virus_genes.tsv' &&
+        #end for
+
+        ## GTDBTK
+        mkdir -p data/host_analyses/gtdbtk &&
+        ln -s '$gtdb_summary' data/host_analyses/gtdbtk/gtdbtk.bac120.summary.tsv &&
+
+        ## CheckV
+        mkdir -p data/virus_analyses/checkv &&
+        #for e in $checkv
+            mkdir -p 'data/virus_analyses/checkv/${e.element_identifier}/' &&
+            ln -s '$e' 'data/virus_analyses/checkv/${e.element_identifier}/quality_summary.tsv' &&
+        #end for
+
+        ## drep compare
+        mkdir -p data/virus_analyses/drep_compare &&
+        #for e in $drep_compare
+            mkdir -p 'data/virus_analyses/drep_compare/${e.element_identifier}/data_tables' &&
+            ln -s '$e' 'data/virus_analyses/drep_compare/${e.element_identifier}/data_tables/Cdb.csv' &&
+        #end for
+        #for e in $drep_compare_clustering_dendrogram
+            ## -p is required: the sample folder only exists if the Cdb collection
+            ## contained the same element, and plain mkdir would abort the job otherwise
+            mkdir -p 'data/virus_analyses/drep_compare/${e.element_identifier}/figures/' &&
+            ln -s '$e' 'data/virus_analyses/drep_compare/${e.element_identifier}/figures/Primary_clustering_dendrogram.pdf' &&
+        #end for
+
+        ## iphop
+        mkdir -p data/virus_analyses/iphop &&
+        #for e in $iphop
+            mkdir -p 'data/virus_analyses/iphop/${e.element_identifier}/' &&
+            ln -s '$e' 'data/virus_analyses/iphop/${e.element_identifier}/Host_prediction_to_genome_m90.csv' &&
+        #end for
+
+        ## abricate
+        mkdir -p data/virus_analyses/abricate &&
+        #for e in $abricate
+            mkdir -p 'data/virus_analyses/abricate/${e.element_identifier}/' &&
+            ln -s '$e' 'data/virus_analyses/abricate/${e.element_identifier}/${e.element_identifier}_virus_vfdb.tsv' &&
+        #end for
+
+        ## vibrant
+        mkdir -p data/virus_analyses/vibrant &&
+        #for e in $vibrant
+            mkdir -p 'data/virus_analyses/vibrant/${e.element_identifier}/VIBRANT_${e.element_identifier}_virus/VIBRANT_results_${e.element_identifier}_virus/' &&
+            ln -s '$e' 'data/virus_analyses/vibrant/${e.element_identifier}/VIBRANT_${e.element_identifier}_virus/VIBRANT_results_${e.element_identifier}_virus/VIBRANT_AMG_individuals_${e.element_identifier}_virus.tsv' &&
+        #end for
+
+        ## Render in the job working directory so that the relative data path resolves
+        ## and report.html is written next to the staged inputs.
+        Rscript -e "library(rmarkdown); render('$__tool_directory__/report.Rmd', output_dir='"\$(pwd)"', output_format = 'html_document', intermediates_dir = '"\$(pwd)"', knit_root_dir='"\$(pwd)"')" &&
+        cp report.html '$report'
+    ]]></command>
+    <!-- Tool inputs. The command section places each collection element in a
+         per-sample folder named after its element identifier, so the same sample
+         must carry the same identifier in every collection. -->
+    <inputs>
+        <param type="data_collection" name="genomes" format="fasta" label="Genomes"/>
+        <param type="data" name="checkm" format="tabular" label="Checkm2 quality report"/>
+        <param type="data_collection" name="genomad" format="tabular" label="geNomad Virus Summary"/>
+        <param type="data_collection" name="genomad_phages" format="fasta" label="geNomad Virus fasta"/>
+        <param type="data_collection" name="genomad_annotations" format="tabular" label="geNomad Virus genes"/>
+        <param type="data_collection" name="defense_finder" format="tabular" label="DefenseFinder systems"/>
+        <param type="data" name="gtdb_summary" format="tsv" label="GTDB-Tk summary"/>
+        <param type="data_collection" name="checkv" format="tabular" label="CheckV Quality summary"/> 
+        <param type="data_collection" name="drep_compare" format="csv" label="drep compare Cdb.csv"/>
+        <param type="data_collection" name="drep_compare_clustering_dendrogram" format="pdf" label="drep compare clustering dendrogram"/>
+        <param type="data_collection" name="iphop" format="csv" label="iPHop Host prediction to genome"/>
+        <param type="data_collection" name="abricate" format="tabular" label="Abricate results"/> 
+        <param type="data_collection" name="vibrant" format="tabular" label="Vibrant Individual predicted virus AMGs" help="Vibrant output option 'Individual predicted virus AMGs by protein and its respective genome'"/>
+    </inputs>
+    <!-- Single output: the rendered report.html copied by the command section. -->
+    <outputs>
+        <data name="report" format="html"/>
+    </outputs>
+    <!-- One end-to-end test: genome elements reference a Zenodo location, all
+         other inputs are read from test-data. -->
+    <tests>
+        <test>
+            <!-- <expand macro="test_collection" name="genomes" folder="genomes" ext="fasta"/> -->
+            <param name="genomes">
+                <collection type="list">
+                    <expand macro="zenodo_collection_element" id="NC_000913"/>
+                    <expand macro="zenodo_collection_element" id="NC_002737"/>
+                    <expand macro="zenodo_collection_element" id="NC_008261"/>
+                    <expand macro="zenodo_collection_element" id="NC_009012"/>
+                    <expand macro="zenodo_collection_element" id="NC_014168"/>
+                    <expand macro="zenodo_collection_element" id="NC_014212"/>
+                    <expand macro="zenodo_collection_element" id="NC_014364"/>
+                    <expand macro="zenodo_collection_element" id="NC_015761"/>
+                    <expand macro="zenodo_collection_element" id="NC_017033"/>
+                    <expand macro="zenodo_collection_element" id="NC_018068"/>
+                    <expand macro="zenodo_collection_element" id="NC_018515"/>
+                    <expand macro="zenodo_collection_element" id="NC_019936"/>
+                    <expand macro="zenodo_collection_element" id="NC_021184"/>
+                    <expand macro="zenodo_collection_element" id="NC_003450"/>
+                    <expand macro="zenodo_collection_element" id="NC_012982"/>
+                    <expand macro="zenodo_collection_element" id="NC_014008"/>
+                    <expand macro="zenodo_collection_element" id="NC_014211"/>
+                    <expand macro="zenodo_collection_element" id="NC_014363"/>
+                    <expand macro="zenodo_collection_element" id="NC_017095"/>
+                    <expand macro="zenodo_collection_element" id="NC_018014"/>
+                    <expand macro="zenodo_collection_element" id="NC_019897"/>
+                    <expand macro="zenodo_collection_element" id="NC_019904"/>
+                </collection>
+            </param>
+            <param name="checkm" value="checkm2.Quality_report.tabular"/>
+            <!-- host-side collections cover all 22 samples -->
+            <expand macro="test_collection" name="genomad" folder="genomad_virus_summary" ext="tabular"/>
+            <expand macro="test_collection" name="genomad_phages" folder="genomad_virus_fasta" ext="fasta"/>
+            <expand macro="test_collection" name="genomad_annotations" folder="genomad_virus_genes" ext="tabular"/>
+            <expand macro="test_collection" name="defense_finder" folder="defense_finder_systems" ext="tabular"/>
+            <param name="gtdb_summary" value="gtdbtk.bac120.summary"/>
+            <!-- virus-side collections only cover the 13 base samples -->
+            <expand macro="test_collection_non_empty" name="checkv" folder="checkv_quality_summary" ext="tabular"/>
+            <expand macro="test_collection_non_empty" name="drep_compare" folder="drep_compare" ext="csv"/>
+            <expand macro="test_collection_non_empty" name="drep_compare_clustering_dendrogram" folder="drep_compare_clustering_dendrogram" ext="pdf"/>
+            <expand macro="test_collection_non_empty" name="iphop" folder="iphop_host_prediction_to_genome" ext="csv"/> 
+            <!-- TODO remove from test-data <expand macro="test_collection_non_empty" name="phatyp" folder="phabox_phatyp" ext="tabular"/>  -->
+            <expand macro="test_collection_non_empty" name="abricate" folder="abricate_results" ext="tabular"/> 
+            <expand macro="test_collection_non_empty" name="vibrant" folder="vibrant_amg_individuals" ext="tabular"/> 
+            <!-- smoke check only: the output must be non-trivial and contain an html tag line -->
+            <output name="report">
+                <assert_contents>
+                    <has_size min="100"/>
+                    <has_line line="&lt;html&gt;"/>
+                </assert_contents>
+            </output>
+        </test>
+    </tests>
+    <help><![CDATA[
+
+.. class:: infomark
+
+**What it does**
+
+Create a report for the PHI toolkit workflow.
+
+Usage
+.....
+
+**Input**
+
+- Genomes
+- Checkm2 quality report
+- geNomad Virus Summary
+- geNomad Virus fasta
+- geNomad Virus genes
+- DefenseFinder systems
+- GTDB-Tk summary
+- CheckV Quality summary
+- drep compare Cdb.csv
+- drep compare clustering dendrogram
+- iPHop Host prediction to genome
+- Abricate results
+- Vibrant Individual predicted virus AMGs
+
+**Output**
+
+An HTML report summarizing the results.
+    ]]></help>
+    <!-- <citations>
+        <citation type="doi"> </citation>
+    </citations> -->
+</tool>
\ No newline at end of file
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/report.Rmd	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1081 @@
+---
+title: "PHI Prophage-Host Interaction Toolkit report"
+subtitle: "Toolkit for the Detection, Comparison, and Annotation of Prophages in Bacterial Genomes."
+date: "`r format(Sys.Date(), '%B %d, %Y')`"
+output: 
+  html_document:
+    theme: flatly
+    toc: yes
+    toc_float: false
+    number_sections: yes
+    code_folding: none
+    fig_width: 12
+    fig_height: 8
+    fig_caption: true
+    df_print: paged
+editor_options: 
+  markdown: 
+    wrap: 72
+params:
+  outdir: "data"
+---
+
+
+------------------------------------------------------------------------
+
+```{r setup_env, include=FALSE}
+# Default for all later chunks: do not echo source code into the report.
+knitr::opts_chunk$set(echo = FALSE)
+
+# Print the configured data directory (the `outdir` document parameter).
+cat("params$outdir:", params$outdir, "\n")
+```
+
+```{r setup_libraries, message=FALSE, warning=FALSE, echo=FALSE, results='asis'}
+# Packages the report attaches, in attach order
+required_packages <- c(
+  "tidyverse", "janitor", "here",
+  "kableExtra", "gmoviz", "circlize",
+  "GenomicRanges", "patchwork", "fs",
+  "tools", "scales", "formattable",
+  "pdftools", "base64"
+)
+
+# Attach each package by name; the list of return values is discarded
+invisible(Map(library, required_packages, MoreArgs = list(character.only = TRUE)))
+```
+
+```{r helper_functions, echo=FALSE}
+# File that receives the debug trace
+log_file <- "debug.log"
+
+# Write one timestamped "DEBUG" line to `log_file`.
+# The first call (no global `log_initialized` flag yet, or flag FALSE) overwrites
+# the file and sets the flag in the global environment; later calls append.
+log_debug <- function(message) {
+  first_call <- !exists("log_initialized") || !log_initialized
+  entry <- paste0(Sys.time(), " - DEBUG: ", message, "\n")
+  cat(entry, file = log_file, append = !first_call)
+  if (first_call) {
+    assign("log_initialized", TRUE, envir = .GlobalEnv)
+  }
+}
+
+# Read one result file, choosing the reader from the file extension.
+#   tsv / csv -> tibble read with read_delim() and passed through clean_names
+#   fna       -> Biostrings DNAStringSet
+# Returns NULL (after logging) when the file is missing or the extension is
+# not one of the three above.
+load_file <- function(path) {
+  log_debug(paste("Attempting to load:", path))
+
+  if (!file.exists(path)) {
+    log_debug(paste("File does not exist:", path))
+    return(NULL)
+  }
+
+  extension <- tools::file_ext(path)
+
+  if (extension %in% c("tsv", "csv")) {
+    separator <- if (extension == "csv") "," else "\t"
+    tbl <- read_delim(path, delim = separator, show_col_types = FALSE) %>% clean_names
+    log_debug(paste("Loaded", nrow(tbl), "rows from", path))
+    return(tbl)
+  }
+
+  if (extension == "fna") {
+    sequences <- Biostrings::readDNAStringSet(path)
+    log_debug(paste("Loaded", length(sequences), "sequences from", path))
+    return(sequences)
+  }
+
+  log_debug(paste("Skipping", path, "- unsupported file type"))
+  NULL
+}
+
+# Build a one-row tibble describing a result file.
+#   path        file to describe
+#   loaded_data list of already loaded objects; the entry for this file is
+#               looked up under the name basename(path)
+# Columns: exists, rows (row count for tsv/csv, sequence count for fna),
+# size (bytes from file.size) and path. A missing file yields exists = FALSE
+# with NA in the other columns.
+# NOTE(review): the lookup only finds data when `loaded_data` is keyed by file
+# basename. If no entry is found, `data` is NULL, so nrow() gives NULL and
+# length() gives 0; verify how the caller names `loaded_data`.
+get_file_info <- function(path, loaded_data) {
+  log_debug(paste("Processing file info for:", path))
+  if (file.exists(path)) {
+    ext <- tools::file_ext(path)
+    if (ext %in% c("tsv", "csv", "fna")) {
+      data <- loaded_data[[basename(path)]]
+      # sequences are counted with length(), tables with nrow()
+      rows <- if(ext == "fna") length(data) else nrow(data)
+      tibble(exists = TRUE, rows = rows, size = file.size(path), path = path)
+    } else {
+      # file is present but of a type that is never loaded: no row count
+      tibble(exists = TRUE, rows = NA_integer_, size = file.size(path), path = path)
+    }
+  } else {
+    tibble(exists = FALSE, rows = NA_integer_, size = NA_real_, path = NA_character_)
+  }
+}
+
+# Gather all per-sample result files for one genome.
+#   folder              sample directory; only its basename (the genome name) is used
+#   host_analyses_dir   root of the host-side tool outputs (genomad, defense-finder)
+#   virus_analyses_dir  root of the virus-side tool outputs (checkv, iphop, drep, ...)
+# Returns a list with
+#   file_info    one row per expected file (file_type, exists, rows, size, path)
+#   virus_count  number of geNomad summary rows with virus_score > 0.5 (0 if no summary)
+#   loaded_data  the loaded objects, keyed by tool name (NULL where nothing was loaded)
+process_genome_folder <- function(folder, host_analyses_dir, virus_analyses_dir) {
+  log_debug(paste("Processing folder:", folder))
+  genome_name <- basename(folder)
+
+  paths <- list(
+    genomad = file.path(host_analyses_dir, "genomad", genome_name, paste0(genome_name, "_summary"), paste0(genome_name, "_virus_summary.tsv")),
+    genomad_phages = file.path(host_analyses_dir, "genomad", genome_name, paste0(genome_name, "_summary"), paste0(genome_name, "_virus.fna")),
+    genomad_annotations = file.path(host_analyses_dir, "genomad", genome_name, paste0(genome_name, "_summary"), paste0(genome_name, "_virus_genes.tsv")),
+    defense_finder = file.path(host_analyses_dir, "defense-finder", genome_name, paste0(genome_name, "_defense_finder_systems.tsv")),
+    checkv = file.path(virus_analyses_dir, "checkv", genome_name, "quality_summary.tsv"),
+    iphop = file.path(virus_analyses_dir, "iphop", genome_name, "Host_prediction_to_genome_m90.csv"),
+    drep = file.path(virus_analyses_dir, "drep_compare", genome_name, "data_tables", "Cdb.csv"),
+    phatyp = file.path(virus_analyses_dir, "phatyp", genome_name, "phatyp.csv"),
+    abricate = file.path(virus_analyses_dir, "abricate", genome_name, paste0(genome_name, "_virus_vfdb.tsv")),
+    vibrant = file.path(virus_analyses_dir, "vibrant", genome_name, 
+                        paste0("VIBRANT_", genome_name, "_virus"),
+                        paste0("VIBRANT_results_", genome_name, "_virus"),
+                        paste0("VIBRANT_AMG_individuals_", genome_name, "_virus.tsv"))
+  )
+
+  loaded_data <- map(paths, load_file)
+
+  # get_file_info() looks objects up by file basename, whereas `loaded_data` is
+  # keyed by tool name. Pass a basename-keyed view so that row and sequence
+  # counts are actually found (basenames are unique within one sample).
+  loaded_by_basename <- set_names(loaded_data, basename(unlist(paths, use.names = FALSE)))
+  file_info <- map_dfr(paths, ~get_file_info(.x, loaded_by_basename), .id = "file_type")
+
+  virus_count <- if(!is.null(loaded_data$genomad)) {
+    count <- sum(loaded_data$genomad$virus_score > 0.5, na.rm = TRUE)
+    log_debug(paste("Virus count:", count))
+    count
+  } else {
+    log_debug("No genomad summary found, virus count set to 0")
+    0
+  }
+
+  log_debug("Returning results from process_genome_folder")
+  list(file_info = file_info, virus_count = virus_count, loaded_data = loaded_data)
+}
+```
+
+
+```{r compile_results, message=FALSE, warning=FALSE, echo=FALSE}
+compile_results <- function() {
+  # Gather the per-genome results and the host-level summary tables.
+  #
+  # Reads `params$outdir`, runs process_genome_folder() on every sub-directory
+  # of host_analyses/genomad, and loads the GTDB-Tk and CheckM2 summaries.
+  #
+  # Returns a list with:
+  #   summary            - rows built from each genome's file_info: virus count,
+  #                        per-tool availability flags and result paths
+  #   genome_data        - process_genome_folder() results named by folder basename
+  #   host_genomes_paths - tibble (name, path) for the genomes/*.fna files
+  #   data_gtdbtk_host   - GTDB-Tk bac120 summary with clean_names() applied
+  #   data_checkm_host   - CheckM2 quality report with clean_names() applied
+  base_dir <- params$outdir
+  log_debug(paste("Base directory:", base_dir))
+
+  host_analyses_dir <- file.path(base_dir, "host_analyses")
+  virus_analyses_dir <- file.path(base_dir, "virus_analyses")
+
+  # The sub-directories of host_analyses/genomad define the genomes to process.
+  genome_folders <- list.dirs(file.path(host_analyses_dir, "genomad"),
+                              full.names = TRUE, recursive = FALSE)
+
+  log_debug("Processing genome folders")
+  genome_data <- map(genome_folders, process_genome_folder,
+                     host_analyses_dir = host_analyses_dir,
+                     virus_analyses_dir = virus_analyses_dir) %>%
+    set_names(basename(genome_folders)) %>%
+    compact()
+
+  log_debug("Creating summary dataframe")
+  summary_df <- map_dfr(genome_data, ~{
+    file_info <- .x$file_info
+    # Look up one file_info column for a given file type.
+    exists_for <- function(type) file_info$exists[file_info$file_type == type]
+    path_for <- function(type) file_info$path[file_info$file_type == type]
+    rows_for <- function(type) file_info$rows[file_info$file_type == type]
+
+    tibble(
+      Sample = basename(file_info$path[1]),
+      Virus_Count = .x$virus_count,
+      geNomad = exists_for("genomad"),
+      CheckV = exists_for("checkv"),
+      VIBRANT = exists_for("vibrant"),
+      dRep = exists_for("drep"),
+      iPHOP = exists_for("iphop"),
+      PhaTYP = exists_for("phatyp"),
+      Defense_Finder = exists_for("defense_finder"),
+      geNomad_Path = path_for("genomad"),
+      CheckV_Path = path_for("checkv"),
+      VIBRANT_Path = path_for("vibrant"),
+      dRep_Path = path_for("drep"),
+      PhaTYP_Path = path_for("phatyp"),
+      Defense_Finder_Path = path_for("defense_finder"),
+      # Row count of the geNomad phage table, or 0 when that file is absent.
+      Virus_Contigs = ifelse(exists_for("genomad_phages"),
+                            rows_for("genomad_phages"),
+                            0)
+    )
+  }) %>%
+    mutate(across(ends_with("_Path"), ~ifelse(is.na(.), "Not available", as.character(.))))
+
+  host_genomes_fasta <- list.files(
+    path = file.path(base_dir, "genomes"),
+    pattern = "\\.fna$",
+    full.names = TRUE
+  )
+
+  host_genomes_paths <- tibble(
+    name = tools::file_path_sans_ext(basename(host_genomes_fasta)),
+    path = host_genomes_fasta
+  )
+
+  data_gtdbtk_host <- read_tsv(
+    file.path(host_analyses_dir, "gtdbtk", "gtdbtk.bac120.summary.tsv"),
+    show_col_types = FALSE
+  ) %>% clean_names()
+
+  data_checkm_host <- read_tsv(
+    file.path(host_analyses_dir, "checkm2", "quality_report.tsv"),
+    show_col_types = FALSE
+  ) %>% clean_names()
+
+  log_debug("Returning summary dataframe, genome data, and host data")
+
+  # Emit the dimensions and column names of a data frame to the debug log.
+  log_frame <- function(label, df) {
+    log_debug(paste(label, "dimensions:", nrow(df), "rows,", ncol(df), "columns"))
+    log_debug(paste(label, "column names:", paste(colnames(df), collapse = ", ")))
+  }
+
+  log_frame("summary_df", summary_df)
+  log_debug(paste("genome_data length:", length(genome_data)))
+  log_debug(paste("genome_data names:", paste(names(genome_data), collapse = ", ")))
+  log_frame("host_genomes_paths", host_genomes_paths)
+  log_frame("data_gtdbtk_host", data_gtdbtk_host)
+  log_frame("data_checkm_host", data_checkm_host)
+
+  list(
+    summary = summary_df,
+    genome_data = genome_data,
+    host_genomes_paths = host_genomes_paths,
+    data_gtdbtk_host = data_gtdbtk_host,
+    data_checkm_host = data_checkm_host
+  )
+}
+```
+
+```{r run_main_function, echo=FALSE, message=FALSE, warning=FALSE}
+# Run the data collection once and expose its pieces as top-level objects
+# for the chunks that follow.
+log_debug("Starting execution of main function")
+result <- compile_results()
+
+if (is.null(result)) {
+  log_debug("Main function execution failed")
+  stop("Main function execution failed")
+}
+
+summary_df <- result$summary
+genome_data <- result$genome_data
+host_genomes_paths <- result$host_genomes_paths
+data_gtdbtk_host <- result$data_gtdbtk_host
+data_checkm_host <- result$data_checkm_host
+log_debug("Data extracted successfully")
+
+# Remove the trailing file extension from genome names in the GTDB-Tk and
+# CheckM2 tables so they can be matched against sample names.
+data_gtdbtk_host <- data_gtdbtk_host %>%
+  mutate(user_genome = str_remove(user_genome, "\\.[^.]+$"))
+
+data_checkm_host <- data_checkm_host %>%
+  mutate(name = str_remove(name, "\\.[^.]+$"))
+
+# Strip the geNomad summary suffix from Sample. The dot is escaped and the
+# pattern anchored so only a literal trailing "_virus_summary.tsv" is removed.
+result$summary <- result$summary %>%
+  mutate(Sample = str_remove(Sample, "_virus_summary\\.tsv$"))
+```
+
+# Summary {.tabset .tabset-fade}
+
+## Overview Table
+
+This table provides sample-by-sample information on detected viruses and key host genome statistics. It includes taxonomy, virus count, genome quality classification, CheckM2 metrics (completeness and contamination), and genome assembly statistics such as size and N50.
+
+```{r render_table, message=FALSE, warning=FALSE, echo=FALSE, results='asis'}
+# Inputs for the overview table: the per-sample summary plus the CheckM2 and
+# GTDB-Tk columns that get joined onto it.
+data <- result$summary
+
+log_debug("Assigning checkm2 host data")
+checkm_host_data <- select(
+  clean_names(data_checkm_host),
+  name, completeness, contamination, contig_n50, genome_size
+)
+
+log_debug("Assigning GTDB-Tk host data")
+gtdbtk_data <- select(data_gtdbtk_host, user_genome, classification)
+
+log_debug("Defining color-blind friendly palette")
+# Named palette; entries are looked up with `$` throughout the report.
+cb_friendly_colors <- as.list(c(
+  green = "#009E73",
+  blue = "#0072B2",
+  orange = "#E69F00",
+  red = "#D55E00",
+  grey = "#999999"
+))
+
+log_debug("Defining function to color cells")
+color_cell <- function(values, color_true = cb_friendly_colors$green,
+                       color_false = cb_friendly_colors$red) {
+  # Render logical values as bold white "Yes"/"No" cells on a coloured
+  # background: `color_true` for TRUE, `color_false` for FALSE.
+  badge <- function(label, fill) {
+    cell_spec(label, color = "white", bold = TRUE, background = fill)
+  }
+  ifelse(values, badge("Yes", color_true), badge("No", color_false))
+}
+
+log_debug("Defining function to create bar plot")
+create_bar_plot <- function(values, max_value, color = cb_friendly_colors$grey) {
+  # Turn each value into an HTML snippet: a 10px-high bar whose width is the
+  # value clamped to [0, max_value] as a percentage of max_value, followed by
+  # the raw value printed with one decimal and a "%" sign.
+  # NA or non-numeric entries become "N/A".
+  render_one <- function(value) {
+    usable <- !is.na(value) && is.numeric(value)
+    if (!usable) {
+      return("N/A")
+    }
+    clamped <- min(max(value, 0), max_value)
+    sprintf('<div style="background-color: %s; width: %f%%; height: 10px;"></div>%.1f%%',
+            color, clamped / max_value * 100, value)
+  }
+  sapply(values, render_one)
+}
+
+log_debug("Defining function to format large numbers")
+format_large_number <- function(x) {
+  # Abbreviate each number with a K / M / G suffix (one decimal place).
+  # Values below 1000 are returned as-is; NA or non-numeric entries give "N/A".
+  abbreviate_one <- function(value) {
+    if (is.na(value) || !is.numeric(value)) return("N/A")
+    if (value < 1000) return(as.character(value))
+    if (value < 1e6) return(paste0(round(value / 1e3, 1), "K"))
+    if (value < 1e9) return(paste0(round(value / 1e6, 1), "M"))
+    paste0(round(value / 1e9, 1), "G")
+  }
+  sapply(x, abbreviate_one)
+}
+
+log_debug("Defining function to extract last known taxonomy level")
+extract_last_known_taxonomy <- function(classification) {
+  # Find the most specific named rank in a semicolon-separated lineage such as
+  # "d__Bacteria;p__...;g__Escherichia;s__".
+  #
+  # classification: a single lineage string (may be NA or "").
+  # Returns list(level = <one-letter rank prefix>, name = <taxon name>), or
+  # list(level = "Unknown", name = "Unknown") when no named rank is present.
+  unknown <- list(level = "Unknown", name = "Unknown")
+  if (is.na(classification) || classification == "") {
+    return(unknown)
+  }
+
+  parts <- trimws(strsplit(classification, ";", fixed = TRUE)[[1]])
+  # Walk from the most specific rank back towards the domain.
+  for (part in rev(parts)) {
+    # Entries without a "<rank>__" prefix (e.g. "Unclassified Bacteria") are
+    # not taxa; skipping them keeps them from being reported as a rank.
+    if (!grepl("^[a-z]__", part)) {
+      next
+    }
+    taxon <- sub("^[a-z]__", "", part)
+    if (taxon != "") {
+      return(list(level = sub("__.*$", "", part), name = taxon))
+    }
+  }
+  unknown
+}
+
+log_debug("Defining function to format taxonomy")
+format_taxonomy <- function(classification) {
+  # Produce the HTML label for a lineage string: "Unknown" when nothing is
+  # resolved, the italicised name for species-level hits, and the italicised
+  # name (underscores turned into spaces) followed by " sp." for anything else.
+  taxon <- extract_last_known_taxonomy(classification)
+  rank <- taxon$level
+
+  if (rank == "Unknown") {
+    return("Unknown")
+  }
+  if (rank == "s") {
+    return(paste0("<i>", taxon$name, "</i>"))
+  }
+  paste0("<i>", str_replace_all(taxon$name, "_", " "), "</i> sp.")
+}
+
+log_debug("Defining function to calculate quality score and determine genome quality class")
+calculate_quality_score_and_class <- function(completeness, contamination) {
+  # Score a genome as completeness - 5 * contamination and assign a draft
+  # quality class:
+  #   High-quality draft   : completeness > 90 and contamination < 5
+  #   Medium-quality draft : completeness >= 50 and contamination < 10
+  #   Low-quality draft    : everything else
+  #
+  # Returns list(score, class, numeric_score); score and class are coloured
+  # HTML cells. If either input is NA the cells are grey "N/A"/"Unknown" and
+  # numeric_score is NA.
+  badge <- function(text, fill) {
+    cell_spec(text, color = "white", bold = TRUE, background = fill)
+  }
+
+  if (is.na(completeness) || is.na(contamination)) {
+    grey <- cb_friendly_colors$grey
+    return(list(
+      score = badge("N/A", grey),
+      class = badge("Unknown", grey),
+      numeric_score = NA
+    ))
+  }
+
+  quality_score <- completeness - (5 * contamination)
+
+  tier <- if (completeness > 90 && contamination < 5) {
+    list(label = "High-quality draft", fill = cb_friendly_colors$green)
+  } else if (completeness >= 50 && contamination < 10) {
+    list(label = "Medium-quality draft", fill = cb_friendly_colors$blue)
+  } else {
+    list(label = "Low-quality draft", fill = cb_friendly_colors$red)
+  }
+
+  list(
+    score = badge(sprintf("%.1f", quality_score), tier$fill),
+    class = badge(tier$label, tier$fill),
+    numeric_score = quality_score
+  )
+}
+
+log_debug("Preparing the data")
+
+# Build the overview table: join CheckM2 and GTDB-Tk columns onto the
+# per-sample summary by sample name, derive the formatted display columns,
+# then keep only the columns that are rendered.
+table_data <- data %>%
+  #mutate(Sample = basename(Sample) %>% trim_sample_name()) %>%
+  mutate(Sample = basename(Sample)) %>%
+  left_join(checkm_host_data, by = c("Sample" = "name")) %>%
+  left_join(gtdbtk_data, by = c("Sample" = "user_genome")) %>%
+  mutate(
+    # One list(score, class, numeric_score) per row.
+    quality_data = pmap(list(as.numeric(completeness),
+                             as.numeric(contamination)),
+                        calculate_quality_score_and_class),
+    Quality_Score = map_chr(quality_data, ~.$score),
+    Genome_Quality = map_chr(quality_data, ~.$class),
+    Quality_Score_Numeric = map_dbl(quality_data, ~.$numeric_score),
+    # Capture the numeric count before Virus_Count is replaced by an HTML cell.
+    Virus_Count_Numeric = as.numeric(Virus_Count),
+    # Background: red for 0 viruses, blue for exactly 1, green for more than 1.
+    Virus_Count = cell_spec(
+      Virus_Count,
+      color = "white",
+      bold = TRUE,
+      background = case_when(
+        Virus_Count == 0 ~ cb_friendly_colors$red,
+        Virus_Count == 1 ~ cb_friendly_colors$blue,
+        Virus_Count > 1 ~ cb_friendly_colors$green
+      )
+    ),
+    Completeness_Numeric = as.numeric(completeness),
+    # Both bars are scaled against a maximum of 100.
+    Completeness = create_bar_plot(as.numeric(completeness), 100),
+    Contamination = create_bar_plot(as.numeric(contamination), 100),
+    `N50 (contigs)` = format_large_number(as.numeric(contig_n50)),
+    `Genome size (bp)` = format_large_number(as.numeric(genome_size)),
+    `GTDB Taxonomy` = sapply(classification, format_taxonomy)
+  ) %>%
+  mutate(`#` = row_number()) %>%
+  # The *_Numeric helper columns and quality_data are dropped here.
+  select(`#`, Sample, `GTDB Taxonomy`, Virus_Count,
+         Quality_Score, Genome_Quality, Completeness, Contamination,
+         `Genome size (bp)`, `N50 (contigs)`)
+
+log_debug("Creating the table")
+# table_data has 10 columns:
+#   1 #, 2 Sample, 3 GTDB Taxonomy, 4 Virus_Count,
+#   5 Quality_Score, 6 Genome_Quality, 7 Completeness, 8 Contamination,
+#   9 Genome size (bp), 10 N50 (contigs)
+# The column_spec() indices below follow that layout so the widths line up
+# with the header groups and the right border sits on the last column.
+kbl(table_data, escape = FALSE,
+    align = c("c", "l", "l", "c", rep("c", 2), rep("r", 2), rep("r", 2))) %>%
+  kable_paper(full_width = TRUE) %>%
+  column_spec(1, bold = TRUE, width = "2em") %>%
+  column_spec(2:3, bold = TRUE) %>%
+  column_spec(5:6, width = "5em") %>%
+  column_spec(7:8, width = "60px") %>%
+  column_spec(9:10, width = "4em") %>%
+  add_header_above(c(" " = 4, "Host Genome Quality" = 2, "CheckM Metrics" = 2,
+                     "Statistics" = 2)) %>%
+  kable_styling(bootstrap_options = c("striped", "hover", "condensed", "responsive"),
+                font_size = 9,
+                html_font = "Arial",
+                position = "left") %>%
+  row_spec(0, bold = TRUE, color = "white", background = "#333333") %>%
+  row_spec(0, extra_css = "border-bottom: 2px solid #000000;") %>%
+  column_spec(ncol(table_data), extra_css = "border-right: 2px solid #000000;") %>%
+  scroll_box(width = "100%", height = "100%",
+             extra_css = "overflow-x: auto; border: 1px solid #ccc; border-radius: 4px;")
+```
+
+## Tools Documentation
+
+The following tools are utilized in this workflow. Each tool name below is a link to its respective documentation.
+
+**Host-analyses**
+
+- [**CheckM2 v1.1.0**](https://github.com/chklovski/CheckM2): Assesses the quality of the host. Most useful when working with assembled genomes.
+
+- [**GTDB-Tk v2.3.2**](https://ecogenomics.github.io/GTDBTk/index.html): Assigns a taxonomy to the host genome.
+
+- [**Defense-Finder v2.0.0, models 2.0.2**](https://github.com/mdmparis/defense-finder): Detects known anti-phage systems in the host.
+
+- [**geNomad v1.7.1**](https://portal.nersc.gov/genomad/): Predicts and annotates proviruses.
+
+**Virus-analyses**
+
+- [**CheckV v1.0.1**](https://pypi.org/project/checkv/): Evaluates the quality of viral genomes.
+
+- [**dRep v3.4.5**](https://drep.readthedocs.io/en/latest/): Compares viral genomes within the same host.
+
+- [**Abricate v1.0.1**](https://github.com/tseemann/abricate): Identifies virulence genes in the prophage genomes with the [VFDB database](https://www.mgc.ac.cn/VFs/).
+
+- [**iPHOP v1.3.3**](https://bitbucket.org/srouxjgi/iphop/src/main/): Predicts other potential hosts of viral genomes.
+
+- [**VIBRANT v1.2.1**](https://github.com/AnantharamanLab/VIBRANT): Used to identify Auxiliary Metabolic Genes in the prophages.
+
+## Workflow
+
+The workflow begins with the input of bacterial genomes by the user. These are processed by the **host-analyses** tools. Prophage prediction is performed by **geNomad** only. Afterward, prophages identified by **geNomad** are processed by the **virus-analyses** tools.
+
+If more than one prophage is recovered in the same sample, **dRep** is used to compare and determine if the viruses are identical or different within the same host.
+
+*PLACEHOLDER FOR PIPELINE*
+
+## R Session Info
+
+Information about the R session used to render this markdown document.
+
+```{r}
+# Print the details of the R session that rendered this report.
+sessionInfo()
+```
+
+
+# Results {.tabset .tabset-fade}
+
+```{r}
+# Build combined_unique: every sample name that appears in either the CheckM2
+# host table or the per-sample summary, de-duplicated and sorted.
+combined_unique <- bind_rows(
+  dplyr::rename(select(checkm_host_data, name), Sample = name),
+  select(data, Sample)
+)
+combined_unique <- arrange(distinct(combined_unique, Sample), Sample)
+
+log_debug(paste("combined_unique samples:", paste(combined_unique$Sample, collapse = ", ")))
+```
+
+
+
+```{r main_workflow, fig.width=6, fig.height=6, out.height="100%", out.width='100%', dpi=300, fig.align='center', warning=FALSE, message=FALSE, results='asis'}
+# Process proviruses data
+process_proviruses <- function(data_genomad) {
+  # Convert the provirus rows of a geNomad summary into a GRanges object.
+  #
+  # data_genomad: table with seq_name, topology, coordinates ("start-end"),
+  #               length, virus_score and n_hallmarks columns.
+  # Returns a GRanges with one range per provirus and metadata columns
+  # length, score, n_hallmarks and n_hallmarks_pos (half the start-end span).
+  #
+  # Contigs are relabelled "c1", "c2", ... by factor() order of the
+  # provirus-bearing contig names.
+  # NOTE(review): plot_genome_ideogram() numbers contigs by their order in the
+  # FASTA file - confirm both schemes agree for multi-contig genomes.
+  provirus_tbl <- data_genomad %>%
+    dplyr::filter(topology == "Provirus") %>%
+    dplyr::mutate(
+      contig = sub("\\|provirus_.*", "", seq_name),   # text before "|provirus"
+      contig = paste0("c", as.numeric(factor(contig)))
+    ) %>%
+    dplyr::select(seq_name, coordinates, length, contig, virus_score, n_hallmarks) %>%
+    tidyr::separate(coordinates, into = c("start", "end"), sep = "-") %>%
+    dplyr::mutate(start = as.integer(start), end = as.integer(end))
+
+  gr <- GRanges(seqnames = provirus_tbl$contig,
+                ranges = IRanges(start = provirus_tbl$start,
+                                 end = provirus_tbl$end))
+  gr$length <- width(ranges(gr))
+  gr$score <- as.numeric(provirus_tbl$virus_score)
+  gr$n_hallmarks <- as.numeric(provirus_tbl$n_hallmarks)
+  gr$n_hallmarks_pos <- abs(start(gr) - end(gr)) / 2
+
+  gr
+}
+
+plot_genome_ideogram <- function(genome_current, proviruses_gr_features) {
+  # Draw a circular ideogram of a host genome and overlay its proviruses.
+  #
+  # genome_current:         genome name; the FASTA is read from
+  #                         <params$outdir>/genomes/<genome_current>.fna
+  # proviruses_gr_features: GRanges of provirus regions whose seqnames use the
+  #                         "c1", "c2", ... contig labels and which carries a
+  #                         `length` metadata column.
+  # Called for its plotting side effect. When there are no provirus ranges
+  # only the bare ideogram is drawn.
+  fasta_file_path <- file.path(params$outdir, "genomes", paste0(genome_current, ".fna"))
+  genome_ideogram <- getIdeogramData(fasta_file = fasta_file_path)
+
+  # Relabel the sequences c1, c2, c3, ... in the order they appear.
+  new_seqlevels <- paste0("c", seq_along(seqlevels(genome_ideogram)))
+  names(new_seqlevels) <- seqlevels(genome_ideogram)
+  genome_ideogram <- GenomeInfoDb::renameSeqlevels(genome_ideogram, new_seqlevels)
+  colours <- rep("#a58bc5", length(seqlevels(genome_ideogram)))
+
+  par(mar = c(2, 2, 2, 2))  # minimal margins around the plot
+
+  gmovizInitialise(genome_ideogram,
+                   sector_colours = colours,
+                   sector_border_colours = colours,
+                   sector_labels = FALSE
+  )
+
+  # Nothing to overlay or label: stop after the bare ideogram.
+  if (length(proviruses_gr_features) == 0) {
+    return(invisible(NULL))
+  }
+
+  # seq_along() rather than 1:length(): the latter yields c(1, 0) when empty.
+  for (i in seq_along(proviruses_gr_features)) {
+    feature <- proviruses_gr_features[i]
+    sector <- as.character(seqnames(feature))
+    region <- data.frame(start = as.numeric(start(feature)),
+                         end = as.numeric(end(feature)))
+    circos.genomicRect(seqnames = sector,
+                       region,
+                       ytop = .5,
+                       ybottom = 0,
+                       track.index = 1,
+                       sector.index = sector,
+                       border = "#e9d27d",
+                       col = "#e9d27d")
+  }
+
+  # Label every provirus with its contig and size (mb above 1e6 bp, else kb).
+  size_bp <- as.numeric(proviruses_gr_features$length)
+  size_label <- ifelse(size_bp > 1000000,
+                       paste0(round(size_bp / 1000000, 2), "mb"),
+                       paste0(round(size_bp / 1000, 2), "kb"))
+  labels <- paste0(as.character(seqnames(proviruses_gr_features)), " (", size_label, ")")
+  circos.labels(sectors = as.character(seqnames(proviruses_gr_features)),
+                x = as.numeric(start(proviruses_gr_features)),
+                labels,
+                facing = "clockwise")
+}
+
+process_sample <- function(sample, combined_unique, host_genomes_paths, genome_data) {
+  # Emit the full report section (markdown, HTML tables and plots) for one sample.
+  #
+  # sample:             sample / genome name; must be a name of `genome_data`.
+  # combined_unique:    not used in the body; kept for caller compatibility.
+  # host_genomes_paths: table with `name` and `path` columns for the host FASTAs.
+  # genome_data:        named list whose entries carry a `loaded_data` list of
+  #                     per-tool tables (entries may be NULL).
+  #
+  # Also reads the top-level objects `data_gtdbtk_host` and `data_checkm_host`.
+  # Output is written with cat(); any error is logged and printed instead of
+  # being propagated. Optional tool tables that are NULL or empty are skipped.
+
+  # Print a table with the styling shared by every table in this section.
+  emit_table <- function(tbl) {
+    tbl %>%
+      kbl() %>%
+      kable_styling(bootstrap_options = c("striped", "hover", "condensed", "responsive")) %>%
+      kable_paper("striped", full_width = TRUE) %>%
+      scroll_box(width = "100%", height = "100%") %>%
+      cat()
+  }
+
+  # TRUE only for a non-NULL table with at least one row.
+  has_rows <- function(tbl) !is.null(tbl) && nrow(tbl) > 0
+
+  tryCatch({
+    log_debug(paste("Starting to process sample:", sample))
+
+    # Check if sample exists in genome_data
+    if (!(sample %in% names(genome_data))) {
+      log_debug(paste("Sample", sample, "not found in genome_data"))
+      cat(paste("Error: Sample", sample, "not found in genome_data\n\n"))
+      return()
+    }
+
+    cat(paste("## ", sample, "{.tabset .tabset-fade} \n\n"))
+
+    host_genome_path <- host_genomes_paths$path[host_genomes_paths$name == sample]
+    if (length(host_genome_path) == 0) {
+      log_debug(paste("Host genome path not found for sample:", sample))
+      cat(paste("Error: Host genome path not found for sample", sample, "\n\n"))
+      return()
+    }
+
+    host_genome_ideogram <- tryCatch({
+      getIdeogramData(fasta_file = host_genome_path)
+    }, error = function(e) {
+      log_debug(paste("Error loading host genome ideogram for sample", sample, ":", conditionMessage(e)))
+      NULL
+    })
+
+    if (is.null(host_genome_ideogram)) {
+      cat(paste("Error: Unable to load host genome ideogram for sample", sample, "\n\n"))
+      return()
+    }
+
+    sample_data <- genome_data[[sample]]$loaded_data
+    genomad_summary <- sample_data$genomad
+    genomad_annotation <- sample_data$genomad_annotations
+    checkv_data <- sample_data$checkv
+    defense_finder_data <- sample_data$defense_finder
+    abricate_data <- sample_data$abricate
+    iphop_data <- sample_data$iphop
+    vibrant_data <- sample_data$vibrant
+
+    cat("### Host Genome\n\n")
+
+    cat("**GTDB-Tk taxonomy**: \n\n")
+    data_gtdbtk_host %>% filter(user_genome == sample) %>%
+      select(classification) %>%
+      emit_table()
+
+    # Cat checkm summary for this genome
+    cat("**CheckM2 Summary**:\n\n")
+    checkm_summary <- data_checkm_host %>% filter(`name` == sample)
+    checkm_summary %>% clean_names %>%
+      select(total_contigs, contig_n50, completeness, contamination) %>%
+      emit_table()
+
+    # Display defense-finder as a table
+    if (has_rows(defense_finder_data)) {
+      cat("**Defense-Finder Systems**:\n\n")
+
+      defense_finder_data %>%
+        select(sys_id, type, subtype, sys_beg, sys_end, protein_in_syst, genes_count, name_of_profiles_in_sys) %>%
+        emit_table()
+    } else {
+      cat("No Defense-Finder systems detected.\n\n")
+    }
+
+    # Everything below needs geNomad hits; stop quietly when there are none.
+    if (!has_rows(genomad_summary)) {
+      log_debug(paste("No geNomad summary data found for sample:", sample))
+      return()
+    }
+
+    if (length(seqlevels(host_genome_ideogram)) == 1) {
+      host_genome_size <- sum(width(host_genome_ideogram))
+    } else {
+      virus_containing_contigs <- unique(sub("\\|.*", "", genomad_summary$seq_name))
+      virus_containing_contigs <- paste0("c_", as.numeric(factor(virus_containing_contigs)))
+      filtered_host_genome <- subset_and_update_ideogram(host_genome_ideogram, virus_containing_contigs)
+      host_genome_size <- sum(width(filtered_host_genome))
+    }
+
+    # Process proviruses
+    proviruses_gr_features <- process_proviruses(genomad_summary)
+
+    cat("**Genomad and CheckV Summary**:\n\n")
+    genomad_table <- genomad_summary %>%
+      select(seq_name, taxonomy, topology, coordinates, length)
+    # CheckV columns are added only when CheckV results were loaded.
+    if (!is.null(checkv_data)) {
+      genomad_table <- genomad_table %>%
+        left_join(
+          checkv_data %>% select(contig_id, gene_count, viral_genes, checkv_quality, miuvig_quality),
+          by = c("seq_name" = "contig_id")) %>%
+        select(seq_name, length, gene_count, viral_genes, checkv_quality, miuvig_quality, taxonomy, topology, coordinates)
+    }
+    emit_table(genomad_table)
+
+    cat("**Host Genome Ideogram with Phages**:\n\n")
+    plot_genome_ideogram(sample, proviruses_gr_features)
+    cat('In this circular plot, **"c"** indicates the contig, and the number that follows (e.g., **c1**) represents the contig number.  
+If multiple contigs are present in the genome, each will be shown with a distinct label (e.g., **c1**, **c2**, etc.).\n\n')
+    cat("\n\n")
+
+    # Process phage genomes
+    cat("### Prophages {.tabset .tabset-fade} \n\n")
+    cat("**Select prophage to show: ** \n\n")
+    for (i in seq_len(nrow(genomad_summary))) {
+      log_debug(paste("Processing phage", i, "of", nrow(genomad_summary), "for sample", sample))
+      process_phage(genomad_summary[i, ], genomad_summary, genomad_annotation, checkv_data, host_genome_size)
+    }
+
+    # Plot dREP if applicable
+    if (nrow(genomad_summary) > 1) {
+      cat("### vOTUs\n\n")
+      plot_drep(sample, genomad_summary)
+    }
+
+    # Creating table with Abricate data
+    if (has_rows(abricate_data)) {
+      cat("### Virulence Genes {.tabset .tabset-fade} \n\n")
+      cat("Screening of virulence genes present in the prophage contigs. \n\n")
+      abricate_data %>% select(-number_file) %>%
+        emit_table()
+      cat("\n\n")
+    }
+
+    # Creating table with iPHOP
+    if (has_rows(iphop_data)) {
+      cat("### Prophage-Host Prediction {.tabset .tabset-fade} \n\n")
+      cat("Prediction of potential hosts for the prophage contigs. \n\n")
+      emit_table(iphop_data)
+      cat("\n\n")
+    }
+
+    # Creating table with VIBRANT AMGs
+    if (has_rows(vibrant_data)) {
+      cat("### AMG Predictions {.tabset .tabset-fade} \n\n")
+      cat("Prediction of auxiliary metabolic genes in the prophage contigs. \n\n")
+      emit_table(vibrant_data)
+      cat("\n\n")
+    }
+
+  log_debug(paste("Finished processing sample:", sample))
+  }, error = function(e) {
+    log_debug(paste("Error in process_sample for", sample, ":", conditionMessage(e)))
+    cat(paste("Error processing sample", sample, ":", conditionMessage(e), "\n\n"))
+  })
+}
+
+process_phage <- function(virus, genomad_summary, genomad_annotation, checkv_data, host_genome_size) {
+  # Emit the report sub-section for a single prophage: heading, zoomed circos
+  # plot and the geNomad gene annotation table.
+  #
+  # virus:              one row of the geNomad summary; seq_name is expected in
+  #                     the form "<contig>|provirus_<start>_<end>".
+  # genomad_summary:    full geNomad summary for the sample (passed to the plot).
+  # genomad_annotation: geNomad gene table with gene, strand, length, marker,
+  #                     annotation_accessions and annotation_description columns.
+  # checkv_data:        CheckV table (passed to the plot).
+  # host_genome_size:   host genome size in bp (passed to the plot).
+  cat(paste("#### Phage ID:", virus$seq_name, " {.tabset .tabset-fade} \n\n"))
+
+  # Provirus coordinates are parsed from the sequence name.
+  provirus_start <- as.numeric(sub(".*provirus_(\\d+)_\\d+", "\\1", virus$seq_name))
+  provirus_end <- as.numeric(sub(".*provirus_\\d+_(\\d+)", "\\1", virus$seq_name))
+  virus_length <- provirus_end - provirus_start + 1
+
+  current_contig_base <- sub("\\|provirus_.*", "", virus$seq_name)
+  current_provirus_range <- sub(".*\\|provirus_", "", virus$seq_name)
+  # Genes of this provirus are named "<contig>|provirus_<range>_<n>". The key is
+  # matched literally (fixed = TRUE) so regex metacharacters in contig names,
+  # such as "." or "(", cannot widen or break the match.
+  gene_key <- paste0(current_contig_base, "|provirus_", current_provirus_range, "_")
+  current_annotations <- genomad_annotation[grepl(gene_key, genomad_annotation$gene, fixed = TRUE), ] %>%
+    mutate(arrow_pos = ifelse(strand == -1, "start", "end"))
+
+  cat("\n\n**Phage–Host Genome Ideogram:**\n\n")
+
+  plot_phage_circos(virus, genomad_summary, current_annotations, virus_length, host_genome_size, provirus_start, provirus_end, checkv_data)
+
+  cat("\n\n")
+  cat("\n\n**Genes Annotation (geNomad):**\n\n")
+
+  current_annotations %>%
+    select(gene, length, marker, annotation_accessions, annotation_description) %>%
+    kbl() %>%
+    kable_styling(bootstrap_options = c("striped", "hover", "condensed", "responsive")) %>%
+    kable_paper() %>%
+    cat()
+  cat("\n\n")
+}
+
+plot_phage_circos <- function(virus, genomad_summary, current_annotations, virus_length, host_genome_size, provirus_start, provirus_end, checkv_data) {
+  tryCatch({
+    log_debug("Starting plot_phage_circos function")
+    log_debug(paste("Current virus:", virus$seq_name))
+    log_debug(paste("Virus length:", virus_length))
+    log_debug(paste("Host genome size:", host_genome_size))
+    log_debug(paste("Provirus start:", provirus_start))
+    log_debug(paste("Provirus end:", provirus_end))
+    
+    # Check for NA or invalid values in input parameters
+    if (is.na(virus_length) || virus_length <= 0) {
+      log_debug("Error: Invalid virus length")
+      return(NULL)
+    }
+    if (is.na(host_genome_size) || host_genome_size <= 0) {
+      log_debug("Error: Invalid host genome size")
+      return(NULL)
+    }
+    if (is.na(provirus_start) || provirus_start < 0) {
+      log_debug("Error: Invalid provirus start position")
+      return(NULL)
+    }
+    if (is.na(provirus_end) || provirus_end <= provirus_start) {
+      log_debug("Error: Invalid provirus end position")
+      return(NULL)
+    }
+    
+    # Extract contig information
+    current_contig <- sub("\\|.*", "", virus$seq_name)
+    log_debug(paste("Current contig:", current_contig))
+    
+    contig_viruses <- genomad_summary[grepl(paste0("^", current_contig), genomad_summary$seq_name), ]
+    if (nrow(contig_viruses) == 0) {
+      log_debug("Error: No viruses found for the current contig")
+      return(NULL)
+    }
+    
+    contig_length <- max(as.numeric(sub(".*_(\\d+)$", "\\1", contig_viruses$seq_name)))
+    if (is.na(contig_length) || contig_length <= 0) {
+      contig_length <- virus_length  # Use virus length as fallback if contig length is invalid
+      log_debug(paste("Using virus length as contig length:", contig_length))
+    } else {
+      log_debug(paste("Contig length:", contig_length))
+    }
+    
+    if (provirus_end > contig_length) {
+      log_debug("Error: Provirus end position exceeds contig length")
+      return(NULL)
+    }
+    
+    log_debug("Clearing circos")
+    circos.clear()
+    
+    log_debug("Setting circos parameters")
+    circos.par(start.degree = 180, gap.degree = 10, track.margin = c(0.01, 0.01))
+    
+    main_color <- "#a58bc5"
+    zoom_color <- "#e9d27d"
+    
+    zoom_start <- (provirus_start / contig_length) * 100
+    zoom_end <- (provirus_end / contig_length) * 100
+    
+    log_debug(paste("Zoom start:", zoom_start))
+    log_debug(paste("Zoom end:", zoom_end))
+    
+    log_debug("Initializing circos")
+    circos.initialize(factors = c("Zoom", "Main"), xlim = c(0, 100))
+    
+    format_genome_labels <- function(x) {
+      ifelse(x >= 1e6, paste0(round(x / 1e6, 2), " Mb"),
+             ifelse(x >= 1e3, paste0(round(x / 1e3, 2), " Kb"),
+                    paste0(x, " bp")))
+    }
+    
+    log_debug("Adding link")
+    tryCatch({
+      circos.link("Main", c(zoom_start, zoom_end), "Zoom", c(0, 100),
+                  rou1 = 0.8,
+                  rou2 = 0.97,
+                  h.ratio = 0.55, # width?
+                  lty = 2,
+                  lwd = 0.5,
+                  h2 = 1,
+                  col = "grey99", border = "grey80")
+    }, error = function(e) {
+      log_debug(paste("Error in circos.link:", e$message))
+    })
+    
+    log_debug("Adding zoom track")
+    circos.track(factors = "Zoom", ylim = c(0, 1), track.height = 0.15,
+                 panel.fun = function(x, y) {
+                   circos.rect(0, 0, 100, 1, col = zoom_color, border = NA)
+                   axis_labels <- seq(0, virus_length, length.out = 6)
+                   axis_positions <- seq(0, 100, length.out = 6)
+                   circos.axis(h = "top", major.at = axis_positions,
+                               labels = format_genome_labels(axis_labels),
+                               labels.cex = 0.7, direction = "outside")
+
+                   for (i in 1:nrow(current_annotations)) {
+                     gene_start <- current_annotations$start[i]
+                     gene_end <- current_annotations$end[i]
+                     arrow_start <- (gene_start - provirus_start) / virus_length * 100
+                     arrow_end <- (gene_end - provirus_start) / virus_length * 100
+
+                     circos.arrow(arrow_start, arrow_end, y1 = 0, y2 = 1,
+                                  arrow.head.width = 0.75, arrow.head.length = cm_x(0.1),
+                                  arrow.position = current_annotations$arrow_pos[i],
+                                  col = ifelse(is.na(current_annotations$annotation_description[i]), "grey", "#7fbfff"),
+                                  border = ifelse(is.na(current_annotations$annotation_description[i]), "grey20", "darkblue"))
+                   }
+                 }, bg.border = NA)
+
+    log_debug("Adding main track")
+    circos.track(factors = "Main", ylim = c(0, 1), track.height = 0.1,
+                 panel.fun = function(x, y) {
+                   circos.rect(xleft = 0, ybottom = 0, xright = 100, ytop = 1, col = main_color, border = NA)
+
+                   for (i in 1:nrow(contig_viruses)) {
+                     virus_start <- as.numeric(sub(".*provirus_(\\d+)_\\d+", "\\1", contig_viruses$seq_name[i]))
+                     virus_end <- as.numeric(sub(".*provirus_\\d+_(\\d+)", "\\1", contig_viruses$seq_name[i]))
+
+                     virus_start_percent <- (virus_start / contig_length) * 100
+                     virus_end_percent <- (virus_end / contig_length) * 100
+
+                     rect_color <- if (contig_viruses$seq_name[i] == virus$seq_name) zoom_color else adjustcolor(zoom_color, alpha.f = 0.7)
+
+                     circos.rect(xleft = virus_start_percent, ybottom = 0,
+                                 xright = virus_end_percent, ytop = 1,
+                                 col = rect_color, border = NA)
+                   }
+
+                   axis_labels <- seq(0, contig_length, length.out = 6)
+                   axis_positions <- seq(0, 100, length.out = 6)
+                   circos.axis(h = "top", major.at = axis_positions,
+                               labels = format_genome_labels(axis_labels),
+                               labels.cex = 0.7, direction = "outside")
+                 }, bg.border = NA)
+    
+    log_debug("Locating phage positions")
+    phage_positions <- sapply(1:nrow(contig_viruses), function(i) {
+      virus_start <- as.numeric(sub(".*provirus_(\\d+)_\\d+", "\\1", contig_viruses$seq_name[i]))
+      virus_end <- as.numeric(sub(".*provirus_\\d+_(\\d+)", "\\1", contig_viruses$seq_name[i]))
+      ((virus_start + virus_end) / 2 / contig_length) * 100
+    })
+    
+    log_debug("Annotating names on phage positions")
+    
+    # Extract start and end positions from sequence names
+    start_positions <- as.numeric(sub(".*provirus_([0-9]+)_.*", "\\1", contig_viruses$seq_name))
+    end_positions <- as.numeric(sub(".*provirus_[0-9]+_([0-9]+)", "\\1", contig_viruses$seq_name))
+    
+    # Create phage labels with the desired format
+    phage_labels <- paste0(round(contig_viruses$length / 1e3, 2), " Kb")
+    
+    # Apply labels to circos plot
+    circos.labels(
+      sectors = "Main",
+      x = phage_positions,
+      labels = phage_labels,
+      facing = "reverse.clockwise",
+      niceFacing = TRUE,
+      col = "black",
+      cex = 0.6,
+      side = "inside",
+      connection_height = 0.02,
+      line_col = "gray"
+    )
+    
+    center_x <- 50
+    virus_name <- virus$seq_name
+    taxonomy <- virus$taxonomy
+    
+    log_debug("Adding taxonomy and virus name to the plot")
+    circos.text(x = center_x, y = -0.2, labels = taxonomy,
+                sector.index = "Zoom", track.index = 1,
+                facing = "bending.inside", niceFacing = TRUE,
+                adj = c(0.5, 0.7), cex = 0.8)
+  
+    checkv_info <- checkv_data[checkv_data$contig_id == virus$seq_name, ]
+    if (nrow(checkv_info) > 0) {
+      checkv_quality <- checkv_info$checkv_quality
+      gene_count <- checkv_info$gene_count
+      viral_genes <- checkv_info$viral_genes
+      host_genes <- checkv_info$host_genes
+      miuvig_quality <- checkv_info$miuvig_quality
+      completeness <- checkv_info$completeness
+      completeness_method <- checkv_info$completeness_method
+      contamination <- checkv_info$contamination
+      
+      circos.text(
+        x = center_x, y = -0.5, 
+        labels = paste("CheckV Quality:", checkv_quality, " - miuvig Quality:", miuvig_quality),
+        sector.index = "Zoom", track.index = 2,
+        facing = "bending.inside", niceFacing = TRUE,
+        adj = c(0.5, 0), cex = 0.7
+      )
+      
+      circos.text(
+        x = center_x, y = -1.5, 
+        labels = paste("Gene Count:", gene_count, " - Viral Genes:", viral_genes, " - Host Genes:", host_genes),
+        sector.index = "Zoom", track.index = 2,
+        facing = "bending.inside", niceFacing = TRUE,
+        adj = c(0.5, 0), cex = 0.7
+      )
+      
+      circos.text(
+        x = center_x, y = -2.5, 
+        labels = paste("Completeness:", completeness, " - Contamination:", contamination),
+        sector.index = "Zoom", track.index = 2,
+        facing = "bending.inside", niceFacing = TRUE,
+        adj = c(0.5, 0), cex = 0.7
+      )
+    }
+    
+    log_debug("Adding legend")
+    # Add legend
+    legend("topright", 
+           legend = c("Annotated gene", "Unknown gene"),
+           fill = c("#7fbfff", "grey"),
+           border = c("darkblue", "grey20"),
+           cex = 0.8,
+           bty = "n")
+    
+    log_debug("Clearing circos")
+    circos.clear()
+    log_debug("Finished plot_phage_circos function successfully")
+  }, error = function(e) {
+    log_debug(paste("Error in plot_phage_circos:", e$message))
+    circos.clear()
+  })
+}
+
+# Render the dRep clustering section of the report for one sample.
+#
+# Reads the dRep cluster table (Cdb.csv) for `sample`, prepends the geNomad
+# sequence names as a `seq_name` column, prints the table as HTML and, when the
+# primary clustering dendrogram PDF exists, converts it to PNG and embeds it
+# inline as a base64 data URI.
+#
+# Args:
+#   sample:          sample identifier; used as a directory name below
+#                    <params$outdir>/virus_analyses/drep_compare.
+#   genomad_summary: object with a `seq_name` column/element.
+#                    NOTE(review): assumed to have one entry per Cdb.csv row,
+#                    in the same order -- confirm against the caller.
+#
+# Returns: NULL (invisibly); the function is called for its cat() output.
+plot_drep <- function(sample, genomad_summary) {
+  drep_dir <- file.path(params$outdir, "virus_analyses", "drep_compare", sample)
+  drep_file_path <- file.path(drep_dir, "data_tables", "Cdb.csv")
+
+  # A missing cluster table should be reported in the document, not abort the
+  # whole knit (the plot file further down is already guarded the same way).
+  if (!file.exists(drep_file_path)) {
+    cat("**No dRep clustering table found.**\n\n")
+    return(invisible(NULL))
+  }
+
+  drep_data <- read_csv(drep_file_path) %>% clean_names()
+  # Name the prepended column explicitly; an unnamed argument would show up in
+  # the rendered table under the header "genomad_summary$seq_name".
+  drep_data <- cbind(seq_name = genomad_summary$seq_name, drep_data)
+
+  cat("When more than 1 phage is detected in the host genome, we perform a clustering step using the tool dRep.\n\n")
+  cat("A threshold of 0.95 was applied to the ANI similarity index to define clusters of virus operational taxonomic units (vOTUs).")
+
+  cat("\n\n**Final cluster designations**\n\n")
+  drep_data %>%
+    kbl() %>%
+    kable_styling(bootstrap_options = c("striped", "hover", "condensed", "responsive")) %>%
+    kable_paper("striped", full_width = TRUE) %>%
+    cat()
+
+  # dRep writes the dendrogram as PDF; HTML output needs a raster image, so the
+  # PNG is written next to the PDF and then inlined.
+  plot_path <- file.path(drep_dir, "figures", "Primary_clustering_dendrogram.pdf")
+  png_path <- file.path(drep_dir, "figures", "Primary_clustering_dendrogram.png")
+
+  if (file.exists(plot_path)) {
+    pdftools::pdf_convert(plot_path, format = "png", filenames = png_path, verbose = FALSE, dpi = 150)
+    base64_str <- base64enc::dataURI(file = png_path, mime = "image/png")
+    cat("**Primary clustering plot**\n\n")
+    cat(sprintf(
+      '<div style="text-align: center;"><img src="%s" style="max-width: 100%%; height: auto; border:1px solid #ddd; border-radius:4px; box-shadow: 0 2px 5px rgba(0,0,0,0.1); margin: 1em 0;"></div>', base64_str
+    ))
+    # Terminate the HTML block so following markdown is not glued onto it.
+    cat("\n\n")
+  } else {
+    cat("**No dRep clustering plot found.**\n\n")
+  }
+
+  invisible(NULL)
+}
+
+# Restrict an ideogram to a chosen set of contigs.
+#
+# Keeps only the elements of `ideogram` whose seqnames occur in `contigs`, then
+# resets the seqlevels of the result to `contigs` and subsets its seqinfo to
+# the same names.
+#
+# Args:
+#   ideogram: object supporting seqnames()/seqlevels()/seqinfo()
+#             (presumably a GRanges -- confirm against the caller).
+#   contigs:  names of the contigs to keep.
+#
+# Returns: the filtered object.
+subset_and_update_ideogram <- function(ideogram, contigs) {
+  on_selected_contig <- seqnames(ideogram) %in% contigs
+  kept <- ideogram[on_selected_contig]
+  seqlevels(kept) <- contigs
+  seqinfo(kept) <- seqinfo(kept)[contigs]
+  return(kept)
+}
+
+# Render the per-sample report sections.
+#
+# Calls process_sample() for every row of the global `combined_unique` table,
+# or for a single row when `test_mode` is TRUE. Also reads the globals
+# `host_genomes_paths` and `genome_data`, which are passed through unchanged.
+#
+# Args:
+#   test_mode:  if TRUE, process one sample only.
+#   test_index: row of `combined_unique` used in test mode. Clamped to the
+#               available rows, so a table with fewer rows than `test_index`
+#               falls back to its last sample instead of selecting NA.
+#
+# Returns: NULL (invisibly); the function is called for its printed output.
+render_all_samples <- function(test_mode = FALSE, test_index = 6) {
+  n_samples <- nrow(combined_unique)
+
+  # Same message in both modes when there is nothing to render.
+  if (n_samples == 0) {
+    print("No samples can be further analysed.")
+    return(invisible(NULL))
+  }
+
+  cat("**Select sample to show:** \n\n\n")
+
+  sample_rows <- if (test_mode) {
+    max(1, min(test_index, n_samples))
+  } else {
+    seq_len(n_samples)
+  }
+
+  for (i in sample_rows) {
+    current_sample <- combined_unique$Sample[i]
+    process_sample(current_sample, combined_unique, host_genomes_paths, genome_data)
+  }
+
+  invisible(NULL)
+}
+
+# Execute the main function.
+# test_mode = TRUE processes one sample only; FALSE renders every sample.
+render_all_samples(test_mode = FALSE)
+```
+
+# Citation
+
+Cite this work: XXXXX
+
+
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_000913.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
+NC_000913.fasta	NC_000913.3|provirus_2461306_2476510	6550	6912	+	gtrA	1-363/363	===============	0/0	100.00	88.70	vfdb	NP_706257	(gtrA) bactoprenol-linked glucose translocase/flippase [LPS (VF0124)] [Shigella flexneri 2a str. 301]	
+NC_000913.fasta	NC_000913.3|provirus_2461306_2476510	6909	7813	+	gtrB	1-905/930	===============	0/0	97.31	80.66	vfdb	NP_706258	(gtrB) bactoprenol glucosyl transferase [LPS (VF0124)] [Shigella flexneri 2a str. 301]	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_002737.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,8 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
+NC_002737.fasta	NC_002737.2|provirus_1186916_1222544	2808	3614	+	mf3	1-807/807	===============	0/0	100.00	100.00	vfdb	NP_269520	(mf3) deoxyribonuclease [DNase (VF0252)] [Streptococcus pyogenes M1 GAS]	
+NC_002737.fasta	NC_002737.2|provirus_1186916_1222544	9081	10193	-	hylP	1-1113/1113	===============	0/0	100.00	100.00	vfdb	NP_269528	(hylP) hyaluronidase phage associated [Hyaluronidase (VF0246)] [Streptococcus pyogenes M1 GAS]	
+NC_002737.fasta	NC_002737.2|provirus_529627_569283	33078	34091	+	hylP	1-1014/1014	===============	0/0	100.00	100.00	vfdb	NP_268936	(hylP) hyaluronidase phage associated [Hyaluronidase (VF0246)] [Streptococcus pyogenes M1 GAS]	
+NC_002737.fasta	NC_002737.2|provirus_529627_569283	38950	39657	-	spec	1-708/708	===============	0/0	100.00	100.00	vfdb	NP_268943	(spec) streptococcal exotoxin C precursor phage associated [Spes (VF0248)] [Streptococcus pyogenes M1 GAS]	
+NC_002737.fasta	NC_002737.2|provirus_777501_820593	35641	36759	+	hylP	1-1119/1119	===============	0/0	100.00	100.00	vfdb	NP_269179	(hylP) hyaluronidase phage associated [Hyaluronidase (VF0246)] [Streptococcus pyogenes M1 GAS]	
+NC_002737.fasta	NC_002737.2|provirus_777501_820593	41680	42357	+	spei	1-678/678	===============	0/0	100.00	99.85	vfdb	NP_269185	(spei) streptococcal exotoxin I precursor [Spes (VF0248)] [Streptococcus pyogenes M1 GAS]	
+NC_002737.fasta	NC_002737.2|provirus_777501_820593	42383	43093	+	speh	1-711/711	===============	0/0	100.00	100.00	vfdb	NP_269186	(speh) streptococcal exotoxin H precursor [Spes (VF0248)] [Streptococcus pyogenes M1 GAS]	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_008261.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_009012.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_014168.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_014212.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_014364.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_015761.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
+NC_015761.fasta	NC_015761.1|provirus_1007223_1045009	24347	26694	-	sopA	1-2348/2349	===============	0/0	99.96	89.91	vfdb	NP_461011	(sopA) type III secretion system effector SopA E3 ubiquitin ligase [TTSS(SPI-1 encode) (VF0116)] [Salmonella enterica subsp. enterica serovar Typhimurium str. LT2]	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_017033.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_018068.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_018515.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_019936.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/abricate_results/NC_021184.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+#FILE	SEQUENCE	START	END	STRAND	GENE	COVERAGE	COVERAGE_MAP	GAPS	%COVERAGE	%IDENTITY	DATABASE	ACCESSION	PRODUCT	RESISTANCE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkm2.Quality_report.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,23 @@
+Name	Completeness	Contamination	Completeness_Model_Used	Translation_Table_Used	Coding_Density	Contig_N50	Average_Gene_Length	Genome_Size	GC_Content	Total_Coding_Sequences	Total_Contigs	Max_Contig_Length	Additional_Notes
+NC_000913.fasta	100.0	0.13	Neural Network (Specific Model)	11	0.876	4641652	314.20629775410976	4641652	0.51	4319	1	4641652	None
+NC_002737.fasta	99.99	0.48	Neural Network (Specific Model)	11	0.856	1852433	298.1390765765766	1852433	0.39	1776	1	1852433	None
+NC_003450.fasta	100.0	0.29	Neural Network (Specific Model)	11	0.872	3309401	313.8808205796158	3309401	0.54	3071	1	3309401	None
+NC_008261.fasta	100.0	0.14	Neural Network (Specific Model)	11	0.837	3256683	316.0170197985412	3256683	0.28	2879	1	3256683	None
+NC_009012.fasta	100.0	1.09	Neural Network (Specific Model)	11	0.849	3843301	320.7092407298411	3843301	0.39	3398	1	3843301	None
+NC_012982.fasta	100.0	0.05	Neural Network (Specific Model)	11	0.897	3455622	328.879173290938	3455622	0.45	3145	1	3455622	None
+NC_014008.fasta	100.0	0.02	Neural Network (Specific Model)	11	0.902	3750771	358.93038779402417	3750771	0.54	3146	1	3750771	None
+NC_014168.fasta	99.99	0.03	Neural Network (Specific Model)	11	0.907	3157527	311.3860162601626	3157527	0.67	3075	1	3157527	None
+NC_014211.fasta	14.07	0.01	Neural Network (Specific Model)	11	0.836	775354	308.61626248216834	775354	0.72	701	1	775354	None
+NC_014212.fasta	99.99	0.16	Neural Network (Specific Model)	11	0.904	3249394	303.41267387944356	3249394	0.62	3235	1	3249394	None
+NC_014363.fasta	99.7	0.35	Neural Network (Specific Model)	11	0.874	2051896	337.48281690140846	2051896	0.65	1775	1	2051896	None
+NC_014364.fasta	99.98	1.88	Neural Network (Specific Model)	11	0.931	4653970	337.5459421641791	4653970	0.49	4288	1	4653970	None
+NC_015761.fasta	100.0	0.14	Neural Network (Specific Model)	11	0.871	4460105	320.1726352185725	4460105	0.51	4049	1	4460105	None
+NC_017033.fasta	99.99	0.04	Neural Network (Specific Model)	11	0.872	3603458	329.2016938519448	3603458	0.63	3188	1	3603458	None
+NC_017095.fasta	99.95	2.67	Neural Network (Specific Model)	11	0.916	2166381	329.75584286424663	2166381	0.39	2011	1	2166381	None
+NC_018014.fasta	99.99	9.38	Neural Network (Specific Model)	11	0.891	5227858	357.07764759935674	5227858	0.6	4353	1	5227858	None
+NC_018068.fasta	99.99	0.42	Neural Network (Specific Model)	11	0.824	4926837	296.0867001528718	4926837	0.42	4579	1	4926837	None
+NC_018515.fasta	100.0	1.83	Neural Network (Specific Model)	11	0.834	4873567	302.3391304347826	4873567	0.42	4485	1	4873567	None
+NC_019897.fasta	99.95	0.34	Neural Network (Specific Model)	11	0.874	4206343	318.1461139896373	4206343	0.61	3860	1	4206343	None
+NC_019904.fasta	100.0	0.23	Neural Network (Specific Model)	11	0.869	5608040	351.0986827898942	5608040	0.45	4631	1	5608040	None
+NC_019936.fasta	100.0	0.13	Neural Network (Specific Model)	11	0.896	4575057	320.7199437543942	4575057	0.63	4267	1	4575057	None
+NC_021184.fasta	100.0	3.04	Neural Network (Specific Model)	11	0.823	4855529	289.67620906527867	4855529	0.45	4611	1	4855529	None
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_000913.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_000913.3|provirus_563848_584430	20583	Yes	9846	32	13	6	Low-quality	Genome-fragment	16.3	HMM-based (lower-bound)	52.16	1.0	low-confidence Provirus
+NC_000913.3|provirus_1196867_1213107	16241	No	NA	24	9	2	Low-quality	Genome-fragment	42.32	AAI-based (high-confidence)	0.0	1.0	
+NC_000913.3|provirus_1412000_1434224	22225	No	NA	27	13	1	Low-quality	Genome-fragment	34.35	HMM-based (lower-bound)	0.0	1.0	
+NC_000913.3|provirus_1627517_1653915	26399	Yes	17700	41	10	9	Low-quality	Genome-fragment	36.3	AAI-based (high-confidence)	32.95	1.0	low-confidence Provirus
+NC_000913.3|provirus_2461306_2476510	15205	No	NA	20	12	1	Low-quality	Genome-fragment	30.84	AAI-based (high-confidence)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_002737.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_002737.2|provirus_529627_569283	39657	No	NA	46	41	0	High-quality	High-quality	96.74	AAI-based (high-confidence)	0.0	1.0	
+NC_002737.2|provirus_777501_820593	43093	No	NA	65	42	1	High-quality	High-quality	96.04	AAI-based (high-confidence)	0.0	1.0	
+NC_002737.2|provirus_1186916_1222544	35629	No	NA	52	39	1	High-quality	High-quality	100.0	AAI-based (high-confidence)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_008261.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_008261.1|provirus_1070550_1127691	57142	Yes	43960	68	25	10	High-quality	High-quality	100.0	AAI-based (high-confidence)	23.07	1.0	
+NC_008261.1|provirus_1784095_1821197	37103	No	NA	44	21	1	Medium-quality	Genome-fragment	63.2	HMM-based (lower-bound)	0.0	1.01	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_009012.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_009012.1|provirus_1938476_1983993	45518	No	NA	52	23	2	Medium-quality	Genome-fragment	68.64	AAI-based (high-confidence)	0.0	1.0	
+NC_009012.1|provirus_2022140_2067593	45454	No	NA	54	21	0	Medium-quality	Genome-fragment	87.05	AAI-based (high-confidence)	0.0	1.0	
+NC_009012.1|provirus_2931283_2970170	38888	No	NA	62	28	3	Medium-quality	Genome-fragment	83.53	AAI-based (medium-confidence)	0.0	1.01	
+NC_009012.1|provirus_3339258_3389049	49792	No	NA	53	6	2	Medium-quality	Genome-fragment	74.06	HMM-based (lower-bound)	0.0	1.51	high kmer_freq may indicate large duplication
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_014168.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_014168.1|provirus_27479_67296	39818	No	NA	60	29	0	Medium-quality	Genome-fragment	88.69	AAI-based (high-confidence)	0.0	1.0	
+NC_014168.1|provirus_1141631_1162952	21322	No	NA	36	19	0	Medium-quality	Genome-fragment	51.44	AAI-based (medium-confidence)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_014212.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_014212.1|provirus_1170297_1209132	38836	No	NA	48	10	1	Medium-quality	Genome-fragment	62.91	AAI-based (medium-confidence)	0.0	1.0	
+NC_014212.1|provirus_1746722_1764354	17633	No	NA	38	3	0	Medium-quality	Genome-fragment	89.95	AAI-based (medium-confidence)	0.0	1.01	
+NC_014212.1|provirus_1893193_1914973	21781	No	NA	32	6	0	Medium-quality	Genome-fragment	65.66	AAI-based (medium-confidence)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_014364.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_014364.1|provirus_2121424_2157334	35911	Yes	29611	44	12	3	Medium-quality	Genome-fragment	63.36	AAI-based (medium-confidence)	17.54	1.0	
+NC_014364.1|provirus_2329685_2350621	20937	No	NA	29	6	1	Low-quality	Genome-fragment	22.17	HMM-based (lower-bound)	0.0	1.01	
+NC_014364.1|provirus_2666253_2703772	37520	No	NA	56	15	0	Medium-quality	Genome-fragment	73.62	AAI-based (high-confidence)	0.0	1.0	
+NC_014364.1|provirus_2976748_3014759	38012	No	NA	44	12	0	Medium-quality	Genome-fragment	69.42	HMM-based (lower-bound)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_015761.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_015761.1|provirus_847397_862760	15364	No	NA	19	11	1	Low-quality	Genome-fragment	44.56	AAI-based (high-confidence)	0.0	1.0	
+NC_015761.1|provirus_1007223_1045009	37787	No	NA	52	17	0	Medium-quality	Genome-fragment	54.82	HMM-based (lower-bound)	0.0	1.03	
+NC_015761.1|provirus_3084741_3115735	30995	No	NA	41	32	0	High-quality	High-quality	97.62	AAI-based (high-confidence)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_017033.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_017033.1|provirus_1052334_1094910	42577	No	NA	66	28	3	High-quality	High-quality	100.0	AAI-based (medium-confidence)	0.0	1.0	
+NC_017033.1|provirus_1557694_1600481	42788	No	NA	71	28	0	Medium-quality	Genome-fragment	89.2	AAI-based (medium-confidence)	0.0	1.01	
+NC_017033.1|provirus_2089294_2107522	18229	No	NA	25	3	0	Low-quality	Genome-fragment	29.18	HMM-based (lower-bound)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_018068.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_018068.1|provirus_1361108_1399802	38695	No	NA	52	24	0	Medium-quality	Genome-fragment	85.96	AAI-based (high-confidence)	0.0	1.0	
+NC_018068.1|provirus_2072558_2098541	25984	No	NA	36	4	1	High-quality	High-quality	100.0	AAI-based (medium-confidence)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_018515.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_018515.1|provirus_3418112_3436097	17986	No	NA	25	18	2	Low-quality	Genome-fragment	37.3	AAI-based (medium-confidence)	0.0	1.0	
+NC_018515.1|provirus_4659544_4694673	35130	No	NA	49	20	0	Medium-quality	Genome-fragment	66.0	HMM-based (lower-bound)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_019936.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_019936.1|provirus_2347508_2361929	14422	No	NA	24	2	0	High-quality	High-quality	100.0	AAI-based (high-confidence)	0.0	1.93	high kmer_freq may indicate large duplication; contig >1.5x longer than expected genome length
+NC_019936.1|provirus_3233292_3242961	9670	No	NA	14	2	0	High-quality	High-quality	100.0	AAI-based (high-confidence)	0.0	1.0	
+NC_019936.1|provirus_4295725_4304306	8582	No	NA	13	2	0	High-quality	High-quality	100.0	AAI-based (medium-confidence)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/checkv_quality_summary/NC_021184.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+contig_id	contig_length	provirus	proviral_length	gene_count	viral_genes	host_genes	checkv_quality	miuvig_quality	completeness	completeness_method	contamination	kmer_freq	warnings
+NC_021184.1|provirus_19778_35564	15787	No	NA	22	5	1	Low-quality	Genome-fragment	40.5	AAI-based (medium-confidence)	0.0	1.0	
+NC_021184.1|provirus_4466413_4519129	52717	No	NA	62	22	3	High-quality	High-quality	100.0	AAI-based (medium-confidence)	0.0	1.0	
+NC_021184.1|provirus_4563831_4615358	51528	No	NA	59	23	4	High-quality	High-quality	100.0	AAI-based (high-confidence)	0.0	1.0	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_000913.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,10 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_000913.3_Lit_3	Lit	Lit	Defense	NC_000913.3_1111	NC_000913.3_1111	NC_000913.3_1111	1	Lit__Lit
+NC_000913.3_RM_Type_IV_9	RM	RM_Type_IV	Defense	NC_000913.3_1130	NC_000913.3_1130	NC_000913.3_1130	1	RM_Type_IV__Type_IV_05
+NC_000913.3_Hachiman_1	Hachiman	Hachiman	Defense	NC_000913.3_2589	NC_000913.3_2590	NC_000913.3_2589,NC_000913.3_2590	2	Hachiman__HamA_2,Hachiman__HamB
+NC_000913.3_RnlAB_6	RnlAB	RnlAB	Defense	NC_000913.3_2591	NC_000913.3_2592	NC_000913.3_2591,NC_000913.3_2592	2	RnlAB__RnlA,RnlAB__RnlB
+NC_000913.3_CAS_Class1-Subtype-I-E_11	Cas	CAS_Class1-Subtype-I-E	Defense	NC_000913.3_2706	NC_000913.3_2713	NC_000913.3_2706,NC_000913.3_2707,NC_000913.3_2708,NC_000913.3_2709,NC_000913.3_2710,NC_000913.3_2711,NC_000913.3_2712,NC_000913.3_2713	8	cas1_I-E_1,cas2_I-E_2,cas3_I_5,cas5_I-E_3,cas6e_I_II_III_IV_V_VI_1,cas7_I-E_2,cas8e_I-E_1,cse2gr11_I-E_1
+NC_000913.3_MazEF_4	MazEF	MazEF	Defense	NC_000913.3_2734	NC_000913.3_2735	NC_000913.3_2734,NC_000913.3_2735	2	MazEF__MazE,MazEF__MazF
+NC_000913.3_MazEF_5	MazEF	MazEF	Defense	NC_000913.3_4140	NC_000913.3_4141	NC_000913.3_4140,NC_000913.3_4141	2	MazEF__MazE,MazEF__MazF
+NC_000913.3_RM_Type_IV_10	RM	RM_Type_IV	Defense	NC_000913.3_4262	NC_000913.3_4263	NC_000913.3_4262,NC_000913.3_4263	2	RM_Type_IV__FAM_1,RM_Type_IV__FAM_2
+NC_000913.3_RM_Type_I_8	RM	RM_Type_I	Defense	NC_000913.3_4265	NC_000913.3_4267	NC_000913.3_4265,NC_000913.3_4266,NC_000913.3_4267	3	RM__Type_I_MTases_FAM_2,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_52
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_002737.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_002737.2_AbiAlpha_1	AbiAlpha	AbiAlpha	Defense	NC_002737.2_745	NC_002737.2_745	NC_002737.2_745	1	AbiAlpha__AbiAlpha
+NC_002737.2_VP1853_2	VP1853	VP1853	Defense	NC_002737.2_750	NC_002737.2_750	NC_002737.2_750	1	VP1853__VP1853
+NC_002737.2_CAS_Class2-Subtype-II-A_7	Cas	CAS_Class2-Subtype-II-A	Defense	NC_002737.2_832	NC_002737.2_835	NC_002737.2_832,NC_002737.2_833,NC_002737.2_834,NC_002737.2_835	4	cas1_I_II_III_IV_V_VI_5,cas2_I_II_III_IV_V_VI_6,cas9_II-A_II-B_II-C_3,csn2_II-A_4
+NC_002737.2_CAS_Class1-Subtype-I-C_5	Cas	CAS_Class1-Subtype-I-C	Defense	NC_002737.2_1263	NC_002737.2_1269	NC_002737.2_1263,NC_002737.2_1264,NC_002737.2_1265,NC_002737.2_1266,NC_002737.2_1267,NC_002737.2_1268,NC_002737.2_1269	7	cas1_I_II_III_IV_V_VI_6,cas2_I_II_III_IV_V_VI_5,cas3_I_5,cas4_I_II_III_IV_V_VI_4,cas5_I-C_11,cas7_I-C_13,cas8c_I-C_1
+NC_002737.2_RM_Type_I_4	RM	RM_Type_I	Defense	NC_002737.2_1533	NC_002737.2_1535	NC_002737.2_1533,NC_002737.2_1534,NC_002737.2_1535	3	RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_51
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_003450.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_003450.3_RM_Type_IIG_2_7	RM	RM_Type_IIG_2	Defense	NC_003450.3_730	NC_003450.3_730	NC_003450.3_730	1	RM_Type_IIG__Type_IIG_FAM_0.einsi_trimmed
+NC_003450.3_Uzume_1	Uzume	Uzume	Defense	NC_003450.3_1364	NC_003450.3_1364	NC_003450.3_1364	1	Uzume__UzuA
+NC_003450.3_RM_Type_II_4	RM	RM_Type_II	Defense	NC_003450.3_1762	NC_003450.3_1764	NC_003450.3_1762,NC_003450.3_1763,NC_003450.3_1764	3	RM_Type_II__Type_II_MTases_FAM_0,RM_Type_II__Type_II_REase29,RM_Type_II__Type_II_REase38
+NC_003450.3_Wadjet_I_3	Wadjet	Wadjet_I	Defense	NC_003450.3_2782	NC_003450.3_2785	NC_003450.3_2782,NC_003450.3_2783,NC_003450.3_2784,NC_003450.3_2785	4	Wadjet__JetA_I,Wadjet__JetB_I,Wadjet__JetC_I,Wadjet__JetD_I
+NC_003450.3_RM_Type_IIG_6	RM	RM_Type_IIG	Defense	NC_003450.3_3041	NC_003450.3_3041	NC_003450.3_3041	1	RM_Type_IIG__Type_IIG_FAM_2.einsi_trimmed
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_008261.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,8 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_008261.1_RM_Type_II_5	RM	RM_Type_II	Defense	NC_008261.1_127	NC_008261.1_128	NC_008261.1_127,NC_008261.1_128	2	RM_Type_II__Type_II_MTases_FAM_0,RM_Type_II__Type_II_REase18
+NC_008261.1_RM_Type_III_7	RM	RM_Type_III	Defense	NC_008261.1_340	NC_008261.1_341	NC_008261.1_340,NC_008261.1_341	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_008261.1_RM_Type_IV_8	RM	RM_Type_IV	Defense	NC_008261.1_962	NC_008261.1_963	NC_008261.1_962,NC_008261.1_963	2	RM_Type_IV__FAM_1,RM_Type_IV__FAM_2
+NC_008261.1_DRT_2_1	DRT	DRT_2	Defense	NC_008261.1_983	NC_008261.1_983	NC_008261.1_983	1	DRT2__DRT2
+NC_008261.1_RM_Type_II_6	RM	RM_Type_II	Defense	NC_008261.1_985	NC_008261.1_987	NC_008261.1_985,NC_008261.1_986,NC_008261.1_987	3	RM_Type_II__Type_II_MTases_FAM_0,RM_Type_II__Type_II_MTases_FAM_22,RM_Type_II__Type_II_REase34
+NC_008261.1_PD-Lambda-5_2	PD-Lambda-5	PD-Lambda-5	Defense	NC_008261.1_1563	NC_008261.1_1564	NC_008261.1_1563,NC_008261.1_1564	2	PD-Lambda-5__PD-Lambda-5_A,PD-Lambda-5__PD-Lambda-5_B
+NC_008261.1_RM_Type_I_4	RM	RM_Type_I	Defense	NC_008261.1_2512	NC_008261.1_2515	NC_008261.1_2512,NC_008261.1_2514,NC_008261.1_2515	3	RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_51
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_009012.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,14 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_009012.1_RM_Type_III_8	RM	RM_Type_III	Defense	NC_009012.1_532	NC_009012.1_533	NC_009012.1_532,NC_009012.1_533	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_009012.1_SEFIR_3	SEFIR	SEFIR	Defense	NC_009012.1_1184	NC_009012.1_1184	NC_009012.1_1184	1	SEFIR__bSEFIR
+NC_009012.1_RloC_2	RloC	RloC	Defense	NC_009012.1_1211	NC_009012.1_1211	NC_009012.1_1211	1	RloC__RloC
+NC_009012.1_RM_Type_II_4	RM	RM_Type_II	Defense	NC_009012.1_1577	NC_009012.1_1579	NC_009012.1_1577,NC_009012.1_1578,NC_009012.1_1579	3	RM_Type_II__Type_II_MTases_FAM_38,RM_Type_II__Type_II_MTases_FAM_4,RM_Type_II__Type_II_REase32
+NC_009012.1_AbiU_1	AbiU	AbiU	Defense	NC_009012.1_1698	NC_009012.1_1698	NC_009012.1_1698	1	AbiU__AbiU
+NC_009012.1_RM_Type_II_5	RM	RM_Type_II	Defense	NC_009012.1_1826	NC_009012.1_1827	NC_009012.1_1826,NC_009012.1_1827	2	RM_Type_II__Type_II_MTases_FAM_16,RM_Type_II__Type_II_REase01
+NC_009012.1_CAS_Class1-Subtype-III-D_11	Cas	CAS_Class1-Subtype-III-D	Defense	NC_009012.1_2140	NC_009012.1_2149	NC_009012.1_2140,NC_009012.1_2141,NC_009012.1_2142,NC_009012.1_2143,NC_009012.1_2144,NC_009012.1_2145,NC_009012.1_2146,NC_009012.1_2147,NC_009012.1_2149	9	cas10_III-D_3,csm2gr11_III-D_6,csm2gr11_III-D_7,csm3gr7_III-A_III-D_2,csm3gr7_III_1,csm3gr7_III_1,csm3gr7_III_IV,csx10gr5_III-D_2,csx1_III_9
+NC_009012.1_CAS_Class1-Subtype-I-B_9	Cas	CAS_Class1-Subtype-I-B	Defense	NC_009012.1_2404	NC_009012.1_2411	NC_009012.1_2404,NC_009012.1_2405,NC_009012.1_2406,NC_009012.1_2407,NC_009012.1_2408,NC_009012.1_2409,NC_009012.1_2410,NC_009012.1_2411	8	cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-B_1,cas6_I_II_III_IV_V_VI_14,cas7_I-B_6,cas8b1_I-B_12
+NC_009012.1_RM_Type_II_6	RM	RM_Type_II	Defense	NC_009012.1_2429	NC_009012.1_2430	NC_009012.1_2429,NC_009012.1_2430	2	RM_Type_II__Type_II_MTases_FAM_2,RM_Type_II__Type_II_REase30
+NC_009012.1_RM_Type_II_7	RM	RM_Type_II	Defense	NC_009012.1_2587	NC_009012.1_2588	NC_009012.1_2587,NC_009012.1_2588	2	RM_Type_II__Type_II_MTases_FAM_4,RM_Type_II__Type_II_REase07
+NC_009012.1_CAS_Class1-Subtype-I-B_10	Cas	CAS_Class1-Subtype-I-B	Defense	NC_009012.1_3357	NC_009012.1_3361	NC_009012.1_3357,NC_009012.1_3358,NC_009012.1_3359,NC_009012.1_3360,NC_009012.1_3361	5	cas3_I_5,cas5_I-B_17,cas6_I_II_III_IV_V_VI_12,cas7_I-B_8,cas8b1_I-B_4
+NC_009012.1_CAS_Class1-Subtype-III-D_12	Cas	CAS_Class1-Subtype-III-D	Defense	NC_009012.1_3361	NC_009012.1_3378	NC_009012.1_3361,NC_009012.1_3365,NC_009012.1_3366,NC_009012.1_3367,NC_009012.1_3368,NC_009012.1_3369,NC_009012.1_3370,NC_009012.1_3372,NC_009012.1_3375,NC_009012.1_3376,NC_009012.1_3377,NC_009012.1_3378	12	cas10_III-D_3,cas1_I_II_III_IV_V_VI_10,cas2_I_II_III_IV_V_VI_3,cas4_I_II_III_IV_V_VI_1,cas6_I_II_III_IV_V_VI_12,csm3gr7_III-D_2,csm3gr7_III-D_3,csm3gr7_III_1,csx10gr5_III-D_3,csx19_III-D_11,csx1_III_21,csx1_III_9
+NC_009012.1_CAS_Class1-Subtype-III-D_12	Cas	CAS_Class1-Subtype-III-D	Defense	NC_009012.1_3361	NC_009012.1_3378	NC_009012.1_3361,NC_009012.1_3365,NC_009012.1_3366,NC_009012.1_3367,NC_009012.1_3368,NC_009012.1_3369,NC_009012.1_3370,NC_009012.1_3372,NC_009012.1_3375,NC_009012.1_3376,NC_009012.1_3377,NC_009012.1_3378	12	cas10_III-D_3,cas1_I_II_III_IV_V_VI_10,cas2_I_II_III_IV_V_VI_3,cas4_I_II_III_IV_V_VI_1,cas6_I_II_III_IV_V_VI_12,csm3gr7_III-D_2,csm3gr7_III-D_3,csm3gr7_III_1,csx10gr5_III-D_3,csx19_III-D_11,csx1_III_21,csx1_III_9
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_012982.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_012982.1_AbiC_1	AbiC	AbiC	Defense	NC_012982.1_420	NC_012982.1_420	NC_012982.1_420	1	AbiC__AbiC
+NC_012982.1_RM_Type_IIG_5	RM	RM_Type_IIG	Defense	NC_012982.1_623	NC_012982.1_623	NC_012982.1_623	1	RM_Type_IIG__Type_IIG_FAM_1.einsi_trimmed
+NC_012982.1_RM_Type_III_6	RM	RM_Type_III	Defense	NC_012982.1_1629	NC_012982.1_1630	NC_012982.1_1629,NC_012982.1_1630	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_1.einsi_trimmed
+NC_012982.1_CBASS_I_3	CBASS	CBASS_I	Defense	NC_012982.1_1825	NC_012982.1_1826	NC_012982.1_1825,NC_012982.1_1826	2	CBASS__Cyclase_II,CBASS__Phospholipase
+NC_012982.1_Rst_DUF4238_4	Rst_DUF4238	Rst_DUF4238	Defense	NC_012982.1_2416	NC_012982.1_2416	NC_012982.1_2416	1	Rst_DUF4238__DUF4238_Pers
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014008.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_014008.1_RM_Type_I_6	RM	RM_Type_I	Defense	NC_014008.1_1177	NC_014008.1_1181	NC_014008.1_1177,NC_014008.1_1180,NC_014008.1_1181	3	RM__Type_I_MTases_FAM_3,RM__Type_I_REases_FAM_1.einsi_trimmed,RM__Type_I_S_52
+NC_014008.1_Viperin_3	Viperin	Viperin	Defense	NC_014008.1_1182	NC_014008.1_1182	NC_014008.1_1182	1	Viperin__pVip
+NC_014008.1_dGTPase_4	dGTPase	dGTPase	Defense	NC_014008.1_1769	NC_014008.1_1769	NC_014008.1_1769	1	dGTPase__Sp_dGTPase
+NC_014008.1_Ceres_1	Ceres	Ceres	Defense	NC_014008.1_2641	NC_014008.1_2641	NC_014008.1_2641	1	Ceres__CrsA1
+NC_014008.1_Gao_Mza_2	Gao_Mza	Gao_Mza	Defense	NC_014008.1_2741	NC_014008.1_2744	NC_014008.1_2741,NC_014008.1_2743,NC_014008.1_2744	3	Gao_Mza__MzaB,Gao_Mza__MzaC,Gao_Mza__MzaE
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014168.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_014168.1_RM_Type_II_2	RM	RM_Type_II	Defense	NC_014168.1_1355	NC_014168.1_1356	NC_014168.1_1355,NC_014168.1_1356	2	RM_Type_II__Type_II_MTases_FAM_41,RM_Type_II__Type_II_REase25
+NC_014168.1_RM_Type_IIG_3	RM	RM_Type_IIG	Defense	NC_014168.1_1738	NC_014168.1_1738	NC_014168.1_1738	1	RM_Type_IIG__Type_IIG_FAM_2.einsi_trimmed
+NC_014168.1_DS-20_1	DS-20	DS-20	Defense	NC_014168.1_2356	NC_014168.1_2356	NC_014168.1_2356	1	DS-20__DS-20
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014211.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014212.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_014212.1_Ceres_1	Ceres	Ceres	Defense	NC_014212.1_142	NC_014212.1_142	NC_014212.1_142	1	Ceres__CrsA1
+NC_014212.1_RM_Type_III_2	RM	RM_Type_III	Defense	NC_014212.1_571	NC_014212.1_572	NC_014212.1_571,NC_014212.1_572	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_014212.1_CAS_Class1-Subtype-III-A_4	Cas	CAS_Class1-Subtype-III-A	Defense	NC_014212.1_712	NC_014212.1_723	NC_014212.1_712,NC_014212.1_713,NC_014212.1_714,NC_014212.1_715,NC_014212.1_716,NC_014212.1_719,NC_014212.1_720,NC_014212.1_721,NC_014212.1_722,NC_014212.1_723	10	cas10_III-A_1,cas1_I_II_III_IV_V_VI_1,cas2_I_II_III_IV_V_VI_8,cas6_I_II_III_IV_V_VI_22,csm2gr11_III-A_1,csm3gr7_III-A_1,csm4gr5_III-A_2,csm5gr7_III-A_2,csx1_III_21,csx1_III_21
+NC_014212.1_CAS_Class1-Subtype-I-E_3	Cas	CAS_Class1-Subtype-I-E	Defense	NC_014212.1_1246	NC_014212.1_1255	NC_014212.1_1246,NC_014212.1_1248,NC_014212.1_1249,NC_014212.1_1251,NC_014212.1_1252,NC_014212.1_1253,NC_014212.1_1254,NC_014212.1_1255	8	cas1_I-E_1,cas2_I-E_1,cas3_I_2,cas5_I-E_2,cas6e_I_II_III_IV_V_VI_2,cas7_I-E_16,cas8e_I-E_5,cse2gr11_I-E_8
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014363.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,7 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_014363.1_AbiE_1	AbiE	AbiE	Defense	NC_014363.1_207	NC_014363.1_208	NC_014363.1_207,NC_014363.1_208	2	AbiEii__AbiEi_4,AbiEii__AbiEii
+NC_014363.1_AbiE_2	AbiE	AbiE	Defense	NC_014363.1_473	NC_014363.1_474	NC_014363.1_473,NC_014363.1_474	2	AbiEii__AbiEi_4,AbiEii__AbiEii
+NC_014363.1_VP1839_3	VP1839	VP1839	Defense	NC_014363.1_1184	NC_014363.1_1184	NC_014363.1_1184	1	VP1839__VP1839
+NC_014363.1_RM_Type_II_6	RM	RM_Type_II	Defense	NC_014363.1_1186	NC_014363.1_1187	NC_014363.1_1186,NC_014363.1_1187	2	RM_Type_II__Type_II_MTases_FAM_0,RM_Type_II__Type_II_REase15
+NC_014363.1_CAS_Class2-Subtype-II-A_7	Cas	CAS_Class2-Subtype-II-A	Defense	NC_014363.1_1233	NC_014363.1_1236	NC_014363.1_1233,NC_014363.1_1234,NC_014363.1_1235,NC_014363.1_1236	4	cas1_I_II_III_IV_V_VI_5,cas2_I_II_III_IV_V_VI_6,cas9_II-A_1,csn2_II-A_3
+NC_014363.1_RM_Type_I_5	RM	RM_Type_I	Defense	NC_014363.1_1659	NC_014363.1_1664	NC_014363.1_1659,NC_014363.1_1662,NC_014363.1_1663,NC_014363.1_1664	4	RM__Type_I_MTases_FAM_2,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_04,RM__Type_I_S_04
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_014364.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,7 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_014364.1_TIR-IV_4	TIR-IV	TIR-IV	Defense	NC_014364.1_392	NC_014364.1_393	NC_014364.1_392,NC_014364.1_393	2	TIR-IV__TIR-IV_A,TIR-IV__TIR-IV_B
+NC_014364.1_SoFic_3	SoFIC	SoFic	Defense	NC_014364.1_418	NC_014364.1_418	NC_014364.1_418	1	SoFic__SoFic
+NC_014364.1_MazEF_2	MazEF	MazEF	Defense	NC_014364.1_697	NC_014364.1_698	NC_014364.1_697,NC_014364.1_698	2	MazEF__MazE,MazEF__MazF
+NC_014364.1_CAS_Class1-Subtype-I-C_5	Cas	CAS_Class1-Subtype-I-C	Defense	NC_014364.1_1062	NC_014364.1_1069	NC_014364.1_1062,NC_014364.1_1063,NC_014364.1_1064,NC_014364.1_1065,NC_014364.1_1066,NC_014364.1_1067,NC_014364.1_1068,NC_014364.1_1069	8	WYL_I_II_III_IV_V_VI_4,cas1_I_II_III_IV_V_VI_6,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-C_11,cas7_I-C_7,cas8c_I-C_4
+NC_014364.1_CAS_Class1-Subtype-IV-B_6	Cas	CAS_Class1-Subtype-IV-B	Defense	NC_014364.1_2494	NC_014364.1_2499	NC_014364.1_2494,NC_014364.1_2496,NC_014364.1_2497,NC_014364.1_2498,NC_014364.1_2499	5	csf1gr8_IV-A_5,csf2gr7_IV_1,csf3gr5_IV-B_1,csf4gr11_IV-B_4,cysH_IV-B_1
+NC_014364.1_AbiE_1	AbiE	AbiE	Defense	NC_014364.1_2619	NC_014364.1_2620	NC_014364.1_2619,NC_014364.1_2620	2	AbiEii__AbiEi_4,AbiEii__AbiEii
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_015761.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,9 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_015761.1_PrrC_6	PrrC	PrrC	Defense	NC_015761.1_263	NC_015761.1_265	NC_015761.1_263,NC_015761.1_264,NC_015761.1_265	3	PrrC__EcoprrI,PrrC__EcoprrI,RM__Type_I_REases_FAM_0.einsi_trimmed
+NC_015761.1_DarTG_2	DarTG	DarTG	Defense	NC_015761.1_279	NC_015761.1_280	NC_015761.1_279,NC_015761.1_280	2	DarTG__DarG,DarTG__DarT
+NC_015761.1_RM_Type_III_7	RM	RM_Type_III	Defense	NC_015761.1_310	NC_015761.1_311	NC_015761.1_310,NC_015761.1_311	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_015761.1_PfiAT_4	PfiAT	PfiAT	Defense	NC_015761.1_932	NC_015761.1_933	NC_015761.1_932,NC_015761.1_933	2	PfiAT__PfiA,PfiAT__PfiT
+NC_015761.1_CAS_Class1-Subtype-I-E_8	Cas	CAS_Class1-Subtype-I-E	Defense	NC_015761.1_2549	NC_015761.1_2556	NC_015761.1_2549,NC_015761.1_2550,NC_015761.1_2551,NC_015761.1_2552,NC_015761.1_2553,NC_015761.1_2554,NC_015761.1_2555,NC_015761.1_2556	8	cas1_I-E_1,cas2_I-E_2,cas3_I_5,cas5_I-E_3,cas6e_I_II_III_IV_V_VI_1,cas7_I-E_2,cas8e_I-E_1,cse2gr11_I-E_2
+NC_015761.1_dCTPdeaminase_5	dCTPdeaminase	dCTPdeaminase	Defense	NC_015761.1_3620	NC_015761.1_3620	NC_015761.1_3620	1	dCTPdeaminase__dCTPdeaminase
+NC_015761.1_Mokosh_TypeII_3	Mokosh	Mokosh_TypeII	Defense	NC_015761.1_3957	NC_015761.1_3957	NC_015761.1_3957	1	Mokosh_TypeII__MkoC
+NC_015761.1_DS-17_1	DS-17	DS-17	Defense	NC_015761.1_3965	NC_015761.1_3965	NC_015761.1_3965	1	DS-17__DS-17
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_017033.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_017033.1_PrrC_3	PrrC	PrrC	Defense	NC_017033.1_586	NC_017033.1_589	NC_017033.1_586,NC_017033.1_587,NC_017033.1_588,NC_017033.1_589	4	PrrC__EcoprrI,PrrC__PrrC,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_02
+NC_017033.1_DS-6_1	DS-6	DS-6	Defense	NC_017033.1_1067	NC_017033.1_1068	NC_017033.1_1067,NC_017033.1_1068	2	DS-6__DS-6A,DS-6__DS-6B
+NC_017033.1_Mokosh_TypeII_2	Mokosh	Mokosh_TypeII	Defense	NC_017033.1_1863	NC_017033.1_1863	NC_017033.1_1863	1	Mokosh_TypeII__MkoC
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_017095.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,8 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_017095.1_RM_Type_I_4	RM	RM_Type_I	Defense	NC_017095.1_540	NC_017095.1_543	NC_017095.1_540,NC_017095.1_541,NC_017095.1_542,NC_017095.1_543	4	RM__Type_I_MTases_FAM_0,RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_51
+NC_017095.1_CAS_Class1-Subtype-III-B_7	Cas	CAS_Class1-Subtype-III-B	Defense	NC_017095.1_1486	NC_017095.1_1502	NC_017095.1_1486,NC_017095.1_1487,NC_017095.1_1488,NC_017095.1_1489,NC_017095.1_1490,NC_017095.1_1491,NC_017095.1_1495,NC_017095.1_1497,NC_017095.1_1499,NC_017095.1_1500,NC_017095.1_1502	11	HTH_III_1,cas10_III_6,cas2_I_II_III_IV_V_VI_3,cas2_I_II_III_IV_V_VI_3,cas6_I_II_III_IV_V_VI_14,cmr1gr7_III-B_1,cmr3gr5_III-B_III-C_6,cmr4gr7_III-B_III-C_1,cmr5gr11_III-B_4,cmr6gr7_III-B_3,csx1_III_9
+NC_017095.1_CAS_Class1-Subtype-III-A_6	Cas	CAS_Class1-Subtype-III-A	Defense	NC_017095.1_1495	NC_017095.1_1512	NC_017095.1_1495,NC_017095.1_1497,NC_017095.1_1499,NC_017095.1_1500,NC_017095.1_1502,NC_017095.1_1503,NC_017095.1_1504,NC_017095.1_1505,NC_017095.1_1506,NC_017095.1_1507,NC_017095.1_1508,NC_017095.1_1509,NC_017095.1_1512	13	HTH_III_1,cas10_III-A_1,cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas2_I_II_III_IV_V_VI_3,cas6_I_II_III_IV_V_VI_14,cas6_I_II_III_IV_V_VI_19,casR_III_1,csm2gr11_III-A_15,csm3gr7_III-A_1,csm4gr5_III-A_1,csm5gr7_III-A_2,csx1_III_9
+NC_017095.1_CAS_Class1-Subtype-III-A_6	Cas	CAS_Class1-Subtype-III-A	Defense	NC_017095.1_1495	NC_017095.1_1512	NC_017095.1_1495,NC_017095.1_1497,NC_017095.1_1499,NC_017095.1_1500,NC_017095.1_1502,NC_017095.1_1503,NC_017095.1_1504,NC_017095.1_1505,NC_017095.1_1506,NC_017095.1_1507,NC_017095.1_1508,NC_017095.1_1509,NC_017095.1_1512	13	HTH_III_1,cas10_III-A_1,cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas2_I_II_III_IV_V_VI_3,cas6_I_II_III_IV_V_VI_14,cas6_I_II_III_IV_V_VI_19,casR_III_1,csm2gr11_III-A_15,csm3gr7_III-A_1,csm4gr5_III-A_1,csm5gr7_III-A_2,csx1_III_9
+NC_017095.1_Esos_1	Esos	Esos	Defense	NC_017095.1_1541	NC_017095.1_1541	NC_017095.1_1541	1	Esos__VCA0450
+NC_017095.1_VP1840_2	VP1840	VP1840	Defense	NC_017095.1_1651	NC_017095.1_1651	NC_017095.1_1651	1	VP1840__VP1840
+NC_017095.1_RM_Type_II_5	RM	RM_Type_II	Defense	NC_017095.1_1662	NC_017095.1_1664	NC_017095.1_1662,NC_017095.1_1663,NC_017095.1_1664	3	RM_Type_II__Type_II_MTases_FAM_38,RM_Type_II__Type_II_MTases_FAM_4,RM_Type_II__Type_II_REase32
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_018014.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_018014.1_DS-6_5	DS-6	DS-6	Defense	NC_018014.1_132	NC_018014.1_133	NC_018014.1_132,NC_018014.1_133	2	DS-6__DS-6A,DS-6__DS-6B
+NC_018014.1_Pycsar_6	Pycsar	Pycsar	Defense	NC_018014.1_571	NC_018014.1_573	NC_018014.1_571,NC_018014.1_572,NC_018014.1_573	3	CBASS__2TM_5,Pycsar__AG_cyclase,Pycsar__AG_cyclase
+NC_018014.1_DISARM_1_4	DISARM	DISARM_1	Defense	NC_018014.1_3050	NC_018014.1_3053	NC_018014.1_3050,NC_018014.1_3051,NC_018014.1_3052,NC_018014.1_3053	4	DISARM_1__drmMI,DISARM__drmA,DISARM__drmB,DISARM__drmC
+NC_018014.1_CBASS_III_3	CBASS	CBASS_III	Defense	NC_018014.1_3068	NC_018014.1_3071	NC_018014.1_3068,NC_018014.1_3069,NC_018014.1_3070,NC_018014.1_3071	4	CBASS__Cyclase_II,CBASS__Endonuc_big,CBASS__TRIP13,CBASS__bacHORMA_1
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_018068.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,13 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_018068.1_Hachiman_2	Hachiman	Hachiman	Defense	NC_018068.1_1171	NC_018068.1_1172	NC_018068.1_1171,NC_018068.1_1172	2	Hachiman__HamA_1,Hachiman__HamB
+NC_018068.1_RM_Type_I_10	RM	RM_Type_I	Defense	NC_018068.1_1178	NC_018068.1_1180	NC_018068.1_1178,NC_018068.1_1179,NC_018068.1_1180	3	RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_03
+NC_018068.1_RM_Type_IV_14	RM	RM_Type_IV	Defense	NC_018068.1_1186	NC_018068.1_1186	NC_018068.1_1186	1	RM_Type_IV__Type_IV_03
+NC_018068.1_RM_Type_II_11	RM	RM_Type_II	Defense	NC_018068.1_1192	NC_018068.1_1193	NC_018068.1_1192,NC_018068.1_1193	2	RM_Type_II__Type_II_MTases_FAM_7,RM_Type_II__Type_II_REase10
+NC_018068.1_CAS_Class1-Subtype-I-C_15	Cas	CAS_Class1-Subtype-I-C	Defense	NC_018068.1_1411	NC_018068.1_1418	NC_018068.1_1411,NC_018068.1_1412,NC_018068.1_1413,NC_018068.1_1414,NC_018068.1_1415,NC_018068.1_1417,NC_018068.1_1418	7	cas1_I_II_III_IV_V_VI_6,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-C_11,cas7_I-C_13,cas8c_I-C_4
+NC_018068.1_RM_Type_III_13	RM	RM_Type_III	Defense	NC_018068.1_1541	NC_018068.1_1542	NC_018068.1_1541,NC_018068.1_1542	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_018068.1_Ceres_1	Ceres	Ceres	Defense	NC_018068.1_3152	NC_018068.1_3152	NC_018068.1_3152	1	Ceres__CrsA1
+NC_018068.1_MazEF_6	MazEF	MazEF	Defense	NC_018068.1_3456	NC_018068.1_3457	NC_018068.1_3456,NC_018068.1_3457	2	MazEF__MazE,MazEF__MazF
+NC_018068.1_Rst_HelicaseDUF2290_7	Rst_HelicaseDUF2290	Rst_HelicaseDUF2290	Defense	NC_018068.1_3757	NC_018068.1_3758	NC_018068.1_3757,NC_018068.1_3758	2	Rst_HelicaseDUF2290__DUF2290,Rst_HelicaseDUF2290__Helicase
+NC_018068.1_Hachiman_3	Hachiman	Hachiman	Defense	NC_018068.1_3759	NC_018068.1_3760	NC_018068.1_3759,NC_018068.1_3760	2	Hachiman__HamA_1,Hachiman__HamB
+NC_018068.1_Septu_8	Septu	Septu	Defense	NC_018068.1_4412	NC_018068.1_4413	NC_018068.1_4412,NC_018068.1_4413	2	Septu__PtuA,Septu__PtuB
+NC_018068.1_RM_Type_II_12	RM	RM_Type_II	Defense	NC_018068.1_4429	NC_018068.1_4430	NC_018068.1_4429,NC_018068.1_4430	2	RM_Type_II__Type_II_MTases_FAM_25,RM_Type_II__Type_II_REase09
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_018515.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,10 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_018515.1_AbiAlpha_1	AbiAlpha	AbiAlpha	Defense	NC_018515.1_121	NC_018515.1_121	NC_018515.1_121	1	AbiAlpha__AbiAlpha
+NC_018515.1_VP1839_11	VP1839	VP1839	Defense	NC_018515.1_122	NC_018515.1_122	NC_018515.1_122	1	VP1839__VP1839
+NC_018515.1_CBASS_IV_7	CBASS	CBASS_IV	Defense	NC_018515.1_324	NC_018515.1_328	NC_018515.1_324,NC_018515.1_325,NC_018515.1_326,NC_018515.1_327,NC_018515.1_328	5	CBASS__2TM_type_IV,CBASS__Cyclase_SMODS,CBASS__OGG,CBASS__QueC,CBASS__TGT
+NC_018515.1_BREX_I_4	BREX	BREX_I	Defense	NC_018515.1_329	NC_018515.1_335	NC_018515.1_329,NC_018515.1_330,NC_018515.1_331,NC_018515.1_332,NC_018515.1_334,NC_018515.1_335	6	BREX__brxA_DUF1819,BREX__brxB_DUF1788,BREX__brxC,BREX__brxL,BREX__pglX1,BREX__pglZA
+NC_018515.1_Prometheus_9	Prometheus	Prometheus	Defense	NC_018515.1_337	NC_018515.1_337	NC_018515.1_337	1	Prometheus__ProA
+NC_018515.1_Azaca_2	Azaca	Azaca	Defense	NC_018515.1_349	NC_018515.1_351	NC_018515.1_349,NC_018515.1_350,NC_018515.1_351	3	Azaca__ZacA,Azaca__ZacB,Azaca__ZacC
+NC_018515.1_Wadjet_III_13	Wadjet	Wadjet_III	Defense	NC_018515.1_1811	NC_018515.1_1814	NC_018515.1_1811,NC_018515.1_1812,NC_018515.1_1813,NC_018515.1_1814	4	Wadjet__JetA_III,Wadjet__JetB_III,Wadjet__JetC_III,Wadjet__JetD_III
+NC_018515.1_SpbK_10	SpbK	SpbK	Defense	NC_018515.1_2272	NC_018515.1_2272	NC_018515.1_2272	1	SpbK__SpbK
+NC_018515.1_Kiwa_8	Kiwa	Kiwa	Defense	NC_018515.1_3261	NC_018515.1_3262	NC_018515.1_3261,NC_018515.1_3262	2	Kiwa__KwaA,Kiwa__KwaB_2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_019897.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,13 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_019897.1_RM_Type_III_11	RM	RM_Type_III	Defense	NC_019897.1_86	NC_019897.1_87	NC_019897.1_86,NC_019897.1_87	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_019897.1_MazEF_3	MazEF	MazEF	Defense	NC_019897.1_128	NC_019897.1_129	NC_019897.1_128,NC_019897.1_129	2	MazEF__MazE,MazEF__MazF
+NC_019897.1_RM_Type_II_9	RM	RM_Type_II	Defense	NC_019897.1_789	NC_019897.1_790	NC_019897.1_789,NC_019897.1_790	2	RM_Type_II__Type_II_MTases_FAM_2,RM_Type_II__Type_II_REase27
+NC_019897.1_Mokosh_TypeII_4	Mokosh	Mokosh_TypeII	Defense	NC_019897.1_913	NC_019897.1_913	NC_019897.1_913	1	Mokosh_TypeII__MkoC
+NC_019897.1_Druantia_I_2	Druantia	Druantia_I	Defense	NC_019897.1_2741	NC_019897.1_2744	NC_019897.1_2741,NC_019897.1_2742,NC_019897.1_2743,NC_019897.1_2744	4	Druantia_I__DruB,Druantia_I__DruC,Druantia_I__DruD,Druantia__DruE_1
+NC_019897.1_CAS_Class1-Subtype-III-D_14	Cas	CAS_Class1-Subtype-III-D	Defense	NC_019897.1_3030	NC_019897.1_3035	NC_019897.1_3030,NC_019897.1_3031,NC_019897.1_3032,NC_019897.1_3033,NC_019897.1_3034,NC_019897.1_3035	6	cas10_III-D_3,csm3gr7_III-D_2,csm3gr7_III-D_3,csm3gr7_III_1,csx19_III-D_17,csx1_III_11
+NC_019897.1_CAS_Class1-Subtype-I-B_12	Cas	CAS_Class1-Subtype-I-B	Defense	NC_019897.1_3046	NC_019897.1_3053	NC_019897.1_3046,NC_019897.1_3047,NC_019897.1_3048,NC_019897.1_3049,NC_019897.1_3050,NC_019897.1_3051,NC_019897.1_3052,NC_019897.1_3053	8	cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas3_I_2,cas4_I_II_III_IV_V_VI_6,cas5_I-B_17,cas6_I_II_III_IV_V_VI_20,cas7b_I-B_I-C_2,cas8b1_I-B_8
+NC_019897.1_CAS_Class1-Subtype-I-C_13	Cas	CAS_Class1-Subtype-I-C	Defense	NC_019897.1_3155	NC_019897.1_3158	NC_019897.1_3155,NC_019897.1_3156,NC_019897.1_3157,NC_019897.1_3158	4	cas3_I_5,cas5_I-C_5,cas7_I-C_7,cas8c_I-C_4
+NC_019897.1_Wadjet_II_6	Wadjet	Wadjet_II	Defense	NC_019897.1_3286	NC_019897.1_3289	NC_019897.1_3286,NC_019897.1_3287,NC_019897.1_3288,NC_019897.1_3289	4	Wadjet__JetA_II,Wadjet__JetB_II,Wadjet__JetC_II,Wadjet__JetD_II
+NC_019897.1_RM_Type_I_8	RM	RM_Type_I	Defense	NC_019897.1_3326	NC_019897.1_3328	NC_019897.1_3326,NC_019897.1_3327,NC_019897.1_3328	3	RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_51
+NC_019897.1_RM_Type_II_10	RM	RM_Type_II	Defense	NC_019897.1_3527	NC_019897.1_3528	NC_019897.1_3527,NC_019897.1_3528	2	RM_Type_II__Type_II_MTases_FAM_16,RM_Type_II__Type_II_REase01
+NC_019897.1_Ceres_1	Ceres	Ceres	Defense	NC_019897.1_3704	NC_019897.1_3704	NC_019897.1_3704	1	Ceres__CrsA1
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_019904.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,18 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_019904.1_HEC-05_12	HEC-05	HEC-05	Defense	NC_019904.1_318	NC_019904.1_318	NC_019904.1_318	1	HEC-05__HEC-05
+NC_019904.1_RM_Type_I_19	RM	RM_Type_I	Defense	NC_019904.1_371	NC_019904.1_374	NC_019904.1_371,NC_019904.1_372,NC_019904.1_374	3	RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_01
+NC_019904.1_dCTPdeaminase_15	dCTPdeaminase	dCTPdeaminase	Defense	NC_019904.1_408	NC_019904.1_408	NC_019904.1_408	1	dCTPdeaminase__dCTPdeaminase
+NC_019904.1_RM_Type_I_20	RM	RM_Type_I	Defense	NC_019904.1_411	NC_019904.1_413	NC_019904.1_411,NC_019904.1_412,NC_019904.1_413	3	RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_03
+NC_019904.1_Gabija_8	Gabija	Gabija	Defense	NC_019904.1_430	NC_019904.1_431	NC_019904.1_430,NC_019904.1_431	2	Gabija__GajA,Gabija__GajB_2
+NC_019904.1_Gao_Qat_11	Gao_Qat	Gao_Qat	Defense	NC_019904.1_1323	NC_019904.1_1326	NC_019904.1_1323,NC_019904.1_1324,NC_019904.1_1325,NC_019904.1_1326	4	Gao_Qat__QatA,Gao_Qat__QatB,Gao_Qat__QatC,Gao_Qat__QatD
+NC_019904.1_SoFic_14	SoFIC	SoFic	Defense	NC_019904.1_1676	NC_019904.1_1676	NC_019904.1_1676	1	SoFic__SoFic
+NC_019904.1_Gabija_9	Gabija	Gabija	Defense	NC_019904.1_1900	NC_019904.1_1901	NC_019904.1_1900,NC_019904.1_1901	2	Gabija__GajA,Gabija__GajB_3
+NC_019904.1_RM_Type_II_22	RM	RM_Type_II	Defense	NC_019904.1_1947	NC_019904.1_1949	NC_019904.1_1947,NC_019904.1_1948,NC_019904.1_1949	3	RM_Type_II__Type_II_MTases_FAM_2,RM_Type_II__Type_II_REase06,RM_Type_II__Type_II_REase38
+NC_019904.1_Sirona_13	Sirona	Sirona	Defense	NC_019904.1_1950	NC_019904.1_1950	NC_019904.1_1950	1	Sirona__VCA0356
+NC_019904.1_CBASS_II_5	CBASS	CBASS_II	Defense	NC_019904.1_3143	NC_019904.1_3145	NC_019904.1_3143,NC_019904.1_3144,NC_019904.1_3145	3	CBASS__Cyclase_II,CBASS__E2,CBASS__Effector_2TM_Sa_NUDIX
+NC_019904.1_AbiE_2	AbiE	AbiE	Defense	NC_019904.1_3195	NC_019904.1_3196	NC_019904.1_3195,NC_019904.1_3196	2	AbiEii__AbiEi_3,AbiEii__AbiEii
+NC_019904.1_RM_Type_I_21	RM	RM_Type_I	Defense	NC_019904.1_4383	NC_019904.1_4389	NC_019904.1_4383,NC_019904.1_4387,NC_019904.1_4388,NC_019904.1_4389	4	RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_01,RM__Type_I_S_51
+NC_019904.1_AbiD_1	AbiD	AbiD	Defense	NC_019904.1_4385	NC_019904.1_4385	NC_019904.1_4385	1	AbiD__AbiD
+NC_019904.1_Cernunnos_7	Cernunnos	Cernunnos	Defense	NC_019904.1_4390	NC_019904.1_4390	NC_019904.1_4390	1	Cernunnos__VCA0410
+NC_019904.1_Gabija_10	Gabija	Gabija	Defense	NC_019904.1_4391	NC_019904.1_4392	NC_019904.1_4391,NC_019904.1_4392	2	Gabija__GajA,Gabija__GajB_1
+NC_019904.1_Ceres_6	Ceres	Ceres	Defense	NC_019904.1_4414	NC_019904.1_4414	NC_019904.1_4414	1	Ceres__CrsA1
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_019936.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,11 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_019936.1_Gabija_5	Gabija	Gabija	Defense	NC_019936.1_617	NC_019936.1_618	NC_019936.1_617,NC_019936.1_618	2	Gabija__GajA,Gabija__GajB_3
+NC_019936.1_RM_Type_I_12	RM	RM_Type_I	Defense	NC_019936.1_860	NC_019936.1_862	NC_019936.1_860,NC_019936.1_861,NC_019936.1_862	3	RM__Type_I_MTases_FAM_3,RM__Type_I_REases_FAM_1.einsi_trimmed,RM__Type_I_S_52
+NC_019936.1_Shango_6	Shango	Shango	Defense	NC_019936.1_896	NC_019936.1_898	NC_019936.1_896,NC_019936.1_897,NC_019936.1_898	3	Shango__SngA,Shango__SngB,Shango__SngC
+NC_019936.1_RM_Type_I_13	RM	RM_Type_I	Defense	NC_019936.1_1070	NC_019936.1_1072	NC_019936.1_1070,NC_019936.1_1071,NC_019936.1_1072	3	RM__Type_I_MTases_FAM_1,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_03
+NC_019936.1_RM_Type_IV_16	RM	RM_Type_IV	Defense	NC_019936.1_1377	NC_019936.1_1377	NC_019936.1_1377	1	RM_Type_IV__FAM_0
+NC_019936.1_AbiC_1	AbiC	AbiC	Defense	NC_019936.1_2817	NC_019936.1_2817	NC_019936.1_2817	1	AbiC__AbiC
+NC_019936.1_RM_Type_I_14	RM	RM_Type_I	Defense	NC_019936.1_3312	NC_019936.1_3317	NC_019936.1_3312,NC_019936.1_3313,NC_019936.1_3314,NC_019936.1_3317	4	RM__Type_I_MTases_FAM_3,RM__Type_I_REases_FAM_1.einsi_trimmed,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_52
+NC_019936.1_CBASS_III_4	CBASS	CBASS_III	Defense	NC_019936.1_3322	NC_019936.1_3325	NC_019936.1_3322,NC_019936.1_3323,NC_019936.1_3324,NC_019936.1_3325	4	CBASS__Cyclase_II,CBASS__Endonuc_big,CBASS__TRIP13,CBASS__bacHORMA_1
+NC_019936.1_RM_Type_I_15	RM	RM_Type_I	Defense	NC_019936.1_3936	NC_019936.1_3940	NC_019936.1_3936,NC_019936.1_3939,NC_019936.1_3940	3	RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_06
+NC_019936.1_dCTPdeaminase_7	dCTPdeaminase	dCTPdeaminase	Defense	NC_019936.1_4004	NC_019936.1_4004	NC_019936.1_4004	1	dCTPdeaminase__dCTPdeaminase
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/defense_finder_systems/NC_021184.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,25 @@
+sys_id	type	subtype	activity	sys_beg	sys_end	protein_in_syst	genes_count	name_of_profiles_in_sys
+NC_021184.1_SoFic_11	SoFIC	SoFic	Defense	NC_021184.1_113	NC_021184.1_113	NC_021184.1_113	1	SoFic__SoFic
+NC_021184.1_RM_Type_I_21	RM	RM_Type_I	Defense	NC_021184.1_221	NC_021184.1_224	NC_021184.1_221,NC_021184.1_223,NC_021184.1_224	3	RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_51
+NC_021184.1_RM_Type_I_22	RM	RM_Type_I	Defense	NC_021184.1_242	NC_021184.1_244	NC_021184.1_242,NC_021184.1_243,NC_021184.1_244	3	RM__Type_I_MTases_FAM_2,RM__Type_I_REases_FAM_2.einsi_trimmed,RM__Type_I_S_52
+NC_021184.1_MazEF_8	MazEF	MazEF	Defense	NC_021184.1_395	NC_021184.1_396	NC_021184.1_395,NC_021184.1_396	2	MazEF__MazE,MazEF__MazF
+NC_021184.1_CAS_Class1-Subtype-I-B_29	Cas	CAS_Class1-Subtype-I-B	Defense	NC_021184.1_509	NC_021184.1_516	NC_021184.1_509,NC_021184.1_510,NC_021184.1_511,NC_021184.1_512,NC_021184.1_513,NC_021184.1_514,NC_021184.1_515,NC_021184.1_516	8	cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas3_I_2,cas4_I_II_III_IV_V_VI_6,cas5_I-B_17,cas6_I-B_III_1,cas7b_I-B_I-C_2,cas8b1_I-B_9
+NC_021184.1_CAS_Class1-Subtype-I-B_30	Cas	CAS_Class1-Subtype-I-B	Defense	NC_021184.1_770	NC_021184.1_779	NC_021184.1_770,NC_021184.1_773,NC_021184.1_774,NC_021184.1_775,NC_021184.1_776,NC_021184.1_777,NC_021184.1_778,NC_021184.1_779	8	cas1_I_II_III_IV_V_VI_7,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-B_17,cas6_I_II_III_IV_V_VI_20,cas7_I-B_8,cas8b1_I-B_14
+NC_021184.1_Wadjet_II_17	Wadjet	Wadjet_II	Defense	NC_021184.1_925	NC_021184.1_928	NC_021184.1_925,NC_021184.1_926,NC_021184.1_927,NC_021184.1_928	4	Wadjet__JetA_II,Wadjet__JetB_II,Wadjet__JetC_II,Wadjet__JetD_II
+NC_021184.1_RM_Type_I_23	RM	RM_Type_I	Defense	NC_021184.1_963	NC_021184.1_967	NC_021184.1_963,NC_021184.1_965,NC_021184.1_967	3	RM__Type_I_MTases_FAM_0,RM__Type_I_REases_FAM_0.einsi_trimmed,RM__Type_I_S_06
+NC_021184.1_Kiwa_6	Kiwa	Kiwa	Defense	NC_021184.1_1016	NC_021184.1_1017	NC_021184.1_1016,NC_021184.1_1017	2	Kiwa__KwaA,Kiwa__KwaB
+NC_021184.1_PfiAT_10	PfiAT	PfiAT	Defense	NC_021184.1_1033	NC_021184.1_1034	NC_021184.1_1033,NC_021184.1_1034	2	PfiAT__PfiA,PfiAT__PfiT
+NC_021184.1_BREX_I_4	BREX	BREX_I	Defense	NC_021184.1_1159	NC_021184.1_1165	NC_021184.1_1159,NC_021184.1_1160,NC_021184.1_1161,NC_021184.1_1162,NC_021184.1_1165	5	BREX__brxA_DUF1819,BREX__brxB_DUF1788,BREX__brxC,BREX__pglX1,BREX__pglZA
+NC_021184.1_AbiE_1	AbiE	AbiE	Defense	NC_021184.1_1208	NC_021184.1_1209	NC_021184.1_1208,NC_021184.1_1209	2	AbiEii__AbiEi_4,AbiEii__AbiEii
+NC_021184.1_RM_Type_III_26	RM	RM_Type_III	Defense	NC_021184.1_1419	NC_021184.1_1420	NC_021184.1_1419,NC_021184.1_1420	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_021184.1_Gabija_5	Gabija	Gabija	Defense	NC_021184.1_1422	NC_021184.1_1423	NC_021184.1_1422,NC_021184.1_1423	2	Gabija__GajA,Gabija__GajB_2
+NC_021184.1_PD-T7-2_9	PD-T7-2	PD-T7-2	Defense	NC_021184.1_1424	NC_021184.1_1428	NC_021184.1_1424,NC_021184.1_1428	2	PD-T7-2__PD-T7-2_A,PD-T7-2__PD-T7-2_B
+NC_021184.1_RM_Type_IV_28	RM	RM_Type_IV	Defense	NC_021184.1_1656	NC_021184.1_1656	NC_021184.1_1656	1	RM_Type_IV__Type_IV_05
+NC_021184.1_RM_Type_II_24	RM	RM_Type_II	Defense	NC_021184.1_3394	NC_021184.1_3396	NC_021184.1_3394,NC_021184.1_3395,NC_021184.1_3396	3	RM_Type_II__Type_II_MTases_FAM_16,RM_Type_II__Type_II_REase01,RM_Type_II__Type_II_REase17
+NC_021184.1_Wadjet_I_15	Wadjet	Wadjet_I	Defense	NC_021184.1_3691	NC_021184.1_3693	NC_021184.1_3691,NC_021184.1_3692,NC_021184.1_3693	3	Wadjet__JetA_I,Wadjet__JetB_I,Wadjet__JetC_I
+NC_021184.1_Wadjet_I_16	Wadjet	Wadjet_I	Defense	NC_021184.1_3803	NC_021184.1_3806	NC_021184.1_3803,NC_021184.1_3804,NC_021184.1_3805,NC_021184.1_3806	4	Wadjet__JetA_I,Wadjet__JetB_I,Wadjet__JetC_I,Wadjet__JetD_I
+NC_021184.1_CAS_Class1-Subtype-I-C_31	Cas	CAS_Class1-Subtype-I-C	Defense	NC_021184.1_4025	NC_021184.1_4031	NC_021184.1_4025,NC_021184.1_4026,NC_021184.1_4027,NC_021184.1_4028,NC_021184.1_4029,NC_021184.1_4030,NC_021184.1_4031	7	cas1_I_II_III_IV_V_VI_6,cas2_I_II_III_IV_V_VI_3,cas3_I_5,cas4_I_II_III_IV_V_VI_6,cas5_I-C_11,cas7_I-C_7,cas8c_I-C_2
+NC_021184.1_RM_Type_III_27	RM	RM_Type_III	Defense	NC_021184.1_4091	NC_021184.1_4092	NC_021184.1_4091,NC_021184.1_4092	2	RM_Type_III__Type_III_MTases_FAM_0,RM_Type_III__Type_III_REases_FAM_0.einsi_trimmed
+NC_021184.1_Lamassu-Hypothetical_7	Lamassu-Fam	Lamassu-Hypothetical	Defense	NC_021184.1_4235	NC_021184.1_4237	NC_021184.1_4235,NC_021184.1_4236,NC_021184.1_4237	3	Lamassu-Fam__LmuA_effector_hypothetical,Lamassu-Fam__LmuB_SMC_hypothetical,Lamassu-Fam__LmuC_acc_hypothetical
+NC_021184.1_AbiH_2	AbiH	AbiH	Defense	NC_021184.1_4301	NC_021184.1_4301	NC_021184.1_4301	1	AbiH__AbiH
+NC_021184.1_RM_Type_II_25	RM	RM_Type_II	Defense	NC_021184.1_4531	NC_021184.1_4532	NC_021184.1_4531,NC_021184.1_4532	2	RM_Type_II__Type_II_MTases_FAM_27,RM_Type_II__Type_II_REase01
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_000913.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000002.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000003.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000000.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
+sequence_000001.fasta.fasta,4_0,0.010000000000000009,average,ANImf,4
+sequence_000004.fasta.fasta,5_0,0.010000000000000009,average,ANImf,5
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_002737.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000001.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000000.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_008261.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_009012.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000002.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
+sequence_000003.fasta.fasta,4_0,0.010000000000000009,average,ANImf,4
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_014168.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_014212.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000001.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_014364.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_1,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,1_2,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000003.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_015761.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000002.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_017033.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000001.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
+sequence_000000.fasta.fasta,3_0,0.010000000000000009,average,ANImf,3
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_018068.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_018515.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000000.fasta.fasta,1_0,0.010000000000000009,average,ANImf,1
+sequence_000001.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_019936.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000001.fasta.fasta,1_1,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,1_2,0.010000000000000009,average,ANImf,1
+sequence_000000.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/drep_compare/NC_021184.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+genome,secondary_cluster,threshold,cluster_method,comparison_algorithm,primary_cluster
+sequence_000001.fasta.fasta,1_1,0.010000000000000009,average,ANImf,1
+sequence_000002.fasta.fasta,1_2,0.010000000000000009,average,ANImf,1
+sequence_000000.fasta.fasta,2_0,0.010000000000000009,average,ANImf,2
Binary file test-data/drep_compare_clustering_dendrogram/NC_000913.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_002737.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_008261.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_009012.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_014168.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_014212.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_014364.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_015761.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_017033.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_018068.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_018515.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_019936.fasta.pdf has changed
Binary file test-data/drep_compare_clustering_dendrogram/NC_021184.fasta.pdf has changed
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_000913.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1685 @@
+>NC_000913.3|provirus_563848_584430
+TTATATTAATTCGTATAATTTGGCGTAGTCGATAAGCTCTACAATTGAATGCAAACCTAG
+CTTGCCATAAATATTAGATTTATGCGCACTAACTGTTTTATTGCTAAGTAATAACTTATC
+GGCAATTTCTTTATTAGATAATCCGCTAACCAGATAACGTAATATGGTCACTTCACGATT
+AGATAGCACAGTGACCGTTGAACTATTCGTACTACATTTATTGCTTTTTATATAGTTAAG
+CGTTTCGCTGGGAAAAAACGTGTATCCGGAGAGGATCATCTGAACGGCATGAAAAATATC
+ATTCTGATCATTGCATTTACTGACAAAACCGTTAGCACCAGCTTGTATCGCTCTGCCAGC
+ATAAAAGCATTCTGATTTCGATGATAAAAATAACACTTTCACTGTGCTCTGGATTTGTTT
+GATCCTTTTCAGGAAGGTAAAACCGTCTGTTCCGGGCAAGTCTATATCCATAATGATTAA
+ATCAACAGGACGGGTTCGGAGATAATCGATGGTTATGCGATAATCATCCGTTTTCAGGAC
+AATCTGCAATTCACTGTTTTTTTGCAACAGAACTTCAATAGACATTCTGATGATAGGATG
+AGTATCCATAATGATCACCGACGTTGGTTTCATAGTTACCAGTCTCATAGGAGCGGACAA
+TTTTCCGTTAGGTCGGGAAATTGTACTTTGATACATGAAAATACGGGTTTTCTTGATTCA
+GACGCGCAGCGGTGTGCGTTTGTTTGCCGCTATAGCGAAATAAATCAGAAAATCAGACGC
+GGTCGTTCACTTGTTCAGCAACCAGATCAAAAGCCATTGACTCAGCAAGGGTTGACCGTA
+TAATTCACGCGATTACACCGCATTGCGGTATCAACGCGCCCTTAGCTCAGTTGGATAGAG
+CAACGACCTTCTAAGTCGTGGGCCGCAGGTTCGAATCCTGCAGGGCGCGCCATTACAATT
+CAATCAGTTACGCCTTCTTTATATCCTCCATAATTTCAGAGTGGGACATATTTGGGACAT
+TATCACCAAAAATGTCGTCTATTTTCCTCGCATGCTCTGTCAAATGATTAGGCGCAAGGT
+GAGCATACCTACGAACCATTTCTATGGACTCCCATCCGCCCATTTCCTGAAGCACTGATA
+ATGGGACGCCTGACTGAATCAGCCAGCTTGCCCAGGTGTGTCTGAGGTCATGGAAACGGA
+AATCTTCAATTCCTGCACGACGACAAGCTGATAGCCATGATGTCTTGCTGTCGATGCGCA
+TCTTCCTGACCGCAGGCGTTGATGTTCCATCTGCTCGCTTAGCCGCCTTGGTATGTACAA
+ACACCCATTTGTGATGCTTGCCTATTTGATCACGCAACACTTTACAGGCGGTATCGTTCA
+GCGCCACACCAATGGCGCGGTTTGATTTGCTCTCTTCTGGATTCACCCAGGCAACTCGTC
+GCTGCATGTCGATTTGTTGCCATTCCAGATTTATGATGTTCGACTTTCTCAGACCAGTTG
+CCAGCGCAAACTTGACGACAGATTTCAGTGGTTCGGGGCACTCATCAATAAGGCGTTTTG
+CTTCCTCCTTTTCCAGCCATCTGACTCGCTTGTTTCTGACCGCTGGTATCTTGATGACAG
+GCGCTTTTTCCAGCCACTTCCAGTCGCGTTCTGCAGCACGGAGAATGGCCTTTATCATGG
+CAAGATGCTTTGCCTTTGTCTGAGTTGATACTGGCTTTGGTTCATAAACAGGCAGTTCTT
+TACCTTTCCTGATGGCGGCCTGAACTTTCTGTTTCCATATTTCTTTCGTCTTTCTGTTAT
+GCATTCTGCTTACAGCAGAGTAAATCTTTGCCTCCGAGATATCTTTAAGCCTTATACCCT
+CAAAATGTTCAAGCCAGAACTCAATCCGGCTTTTATCTGAATCGAGAGATTTTTTATCAG
+CTTTTTCCTCAAGCCATCTTAGGCAGGCCTCTTCAAAAGTGACATCAGGTAAATCCCCTA
+GCTTTTCTACTCGCCAGAGTTCTGCTTTTCGCTTGTCGTGCAACTCCTGAGCTTGCCGTT
+TGTCCTTTGTGCCAAGAGATTCCTTAATTCGTTTCCCGCCCGGGAGCGAATACGAGGCAT
+ACCATATTTCATTTCTGCGGAAGAGTGACATTTTCTTTCCTCTGTTATGCCATCACCCGC
+GCTCACCTGGACAGTATGCAGCGGAGACTGAAGCGCCGCAATGCAGGCTTGCCGTGTTGT
+GAGGTACCCGGATATTATCGTGAGGATGCGTCATCGCCATTGCTCCCCAAATACAAAACC
+AATTTCAGCCAGTGCCTCGTCCATTTTTTCGATGAACTCCGGCACCATCTCGTCAAAACT
+CGCCATGTACTTTTCATTCCGCTCAATCACGACATAATGCAGGCCTTCACGCTTCATGCG
+CGGGTCATAGTTGGCAAAGTACCAGGCATCTTTTCGCGTCACCCACATGCTGTACTGCAC
+CTGGGCCATGTAAGCCGATTTTATTGCCTCGAAACCACCGAGCCGGAATTTCATGAAATC
+CCGGGAGGTACGAGTATTGCCGGAAGCGTGGCCTGTATCCGGATGCAGAGTCTTATCCGT
+GGAAATCGAACGCGCATTACTGGTTGGTTACCAACTTGTACCAGAACATGCGGGCCAATG
+CGCTGGCTGACGCGGAATTACGGCGCAAGGCTGCCGATGAACTGACCTGTATGACAGCGC
+GAATTAACCGTGGTGAGACGATACCTGAACCAGTAAAACAACTTCCTGTTATGGGCGGTA
+GACCTCTAAATCGTGCACAGGCTCTGGCGAAGATCGCAGAAATTAAAGCTAAGTTCGGAC
+TGAAAGGAGCAAGTGTATGACGGGCAAAGAGGCAATTATTCATTACCTGGGGACGCATAA
+GAGCTTCTGTGCACAGGACGTTGCCGCGGTAACAGGCGCAACCGTAATCTGATCTTACCC
+AGCAATAGTGGACACGCGGCTAAGTGAGTAAACTCTCAGTCAGAGGTGACTCACATGACA
+AAAACAGTATCAACCAGTAAAAAACCCCGTAAACAGCATTCGCCTGAATTTCGCAGTGAA
+GCCCTGAAGCTTGCTGAACGCATCGGTGTTACTGCCGCAGCCCGTGAACTCAGCCTGTAT
+GAATCACAACTCTACAACTGGCGCAGTAAACAGCAAAATCAGCAGACGTCTTCTGAACGT
+GAACTGGAGATGTCTACCGAGATTGCACGTCTCAAACGCCAGCTGGCAGAACGGGATGAA
+GAGCTGGCTATCCTCCAAAAGGCCGCGACATACTTCGCGAAGCGCCTGAAATGAAGTATG
+TCTTTATTGAAAAACATCAGGCTGAGTTCAGCATCAAAGCAATGTGCCGCGTGCTCCGGG
+TGGCCCGCAGCGGCTGGTATACGTGGTGTCAGCGGCGGACAAGGATAAGCACGCGTCAGC
+AGTTCCGCCAACACTGCGACAGCGTTGTCCTCGCGGCTTTTACCCGGTCAAAACAGCGTT
+ACGGTGCCCCACGCCTGACGGATGAACTGCGTGCTCAGGGTTACCCCTTTAACGTAAAAA
+CCGTGGCGGCAAGCCTGCGCCGTCAGGGACTGAGGGCAAAGGCCTCCCGGAAGTTCAGCC
+CGGTCAGCTACCGCGCACACGGCCTGCCTGTGTCAGAAAATCTGTTGGAGCAGGATTTTT
+ACGCCAGTGGCCCGAACCAGAAGTGGGCAGGAGACATCACGTACTTACGTACAGATGAAG
+GCTGGCTGTATCTGGCAGTGGTCATTGACCTGTGGTCACGTGCCGTTATTGGCTGGTCAA
+TGTCGCCACGCATGACGGCGCAACTGGCCTGCGATGCCCTGCAGATGGCGCTGTGGCGGC
+GTAAGAGGCCCCGGAACGTTATCGTTCACACGGACCGTGGAGGCCAGTACTGTTCAGCAG
+ATTATCAGGCGCAACTGAAGCGGCATAATCTGCGTGGAAGTATGAGCGCAAAAGGTTGCT
+GCTACGATAATGCCTGCGTGGAAAGCTTCTTTCATTCGCTGAAAGTGGAATGTATCCATG
+GAGAACACTTTATCAGCCGGGAAATAATGCGGGCAACGGTGTTTAATTATATCGAATGTG
+ATTACAATCGGTGGCGGCGGCACAGTTGGTGTGGCGGCCTCAGTCCGGAACAATTTGAAA
+ACAAGAACCTCGCTTAGGCCTGTGTCCATATTACGTGGGTAGGATCAACCAGCATAAATC
+AGGCTGCGGCTAAAATGGCGCGGGCAGGAATCCTGGTCGTTGATGGTAAGGTCTGGCGAA
+CGGTGTATTACCGGTTCGCTACCAGAGAAGAATGGGAAGGAAAGGTGAGCACGAATCTGA
+TTTTTAAGGAGTGTCGCCAGAGTGCCGCGATGAAACGGGTATTGAGGGTATATAAAAGAA
+CATCAATGGGAACACAATGATGAAACAGGTGAGTTGAGTTCAAACTGTAGTACAATTCTC
+TCCAGTTTGAACAGGAAAGAATATGCTATGAACCCTTATATTTATCTTGGTGGTGCAATA
+CTTGCAGAGGTCATTGGTACAACCTTAATGAAGTTTTCAGAAGGTTTTACACGGTTATGG
+CCATCTGTTGGTACAATTATTTGTTATTGTGCATCATTCTGGTTATTAGCTCAGACGCTG
+GCTTATATTCCTACAGGGATTGCTTATGCTATCTGGTCAGGAGTCGGTATTGTCCTGATT
+AGCTTACTGTCATGGGGATTTTTCGGCCAACGGCTGGACCTGCCAGCCATTATAGGCATG
+ATGTTGATTTGTGCCGGTGTGTTGATTATTAATTTATTGTCACGAAGCACACCACATTAA
+AATAATTTGTTTCTAAACGACTAAAATATGGAGGCTCTTATATTTATATGAGCCTCGTTT
+TATGCTTTTTGTTAATGTCTTTATTTTTTATGTATTCTTTTGTGCTTTCAAGATTATGGC
+GTAAGAAAATTGCAATACGATTATTGTTGTATATTCAAGATAATGTGACCTTAATTGTCT
+TTTTAAATAAAAAATAAACAAAAATTATATCCCACCACTAAGGTTTATAAAAGCATACGT
+TAGCAGGTGTCACCATGAAAAAAGCCATAGCATATATGCGATTTTCATCACCAGGTCAGA
+TGTCTGGCGACTCATTAAACCGACAGAGAAGACTTATTGCTGAATGGTTAAAGGTAAATA
+GTGATTATTATCTTGATACCATAACATATGAAGATTTAGGATTAAGTGCATTCAAAGGAA
+AGCATGCACAATCAGGAGCTTTTTCGGAATTTTTAGATGCTATAGAGCATGGTTATATAT
+TGCCAGGAACTACATTGTTAGTTGAAAGTCTGGACAGACTTTCAAGAGAAAAAGTCGGTG
+AAGCGATTGAACGTCTGAAATTGATTTTGAATCACGGTATTGATGTTATAACTCTTTGCG
+ACAATACAGTCTATAATATTGACTCTTTGAATGAGCCATATTCATTAATAAAAGCCATAC
+TTATAGCACAAAGGGCAAATGAAGAAAGCGAGATAAAGTCAAGTCGGGTTAAATTATCAT
+GGAAGAAAAAACGGCAGGATGCACTGGAATCAGGTACGATTATGACGGCGTCTTGTCCGA
+GATGGCTCTCCTTAGATGACAAAAGAACGGCTTTTGTTCCAGACCCCGACAGGGTGAAAA
+CTATTGAGCTAATTTTTAAACTCAGGATGGAAAGGCGCTCATTGAATGCAATAGCCAAGT
+ATTTAAATGATCATGCTGTAAAGAATTTCTCAGGAAAAGAAAGTGCATGGGGACCTTCTG
+TAATTGAAAAATTATTAGCGAATAAAGCTCTGATAGGTATTTGCGTACCTTCATATCGTG
+CAAGAGGGAAAGGGATAAGTGAAATCGCTGGCTATTATCCCAGAGTCATATCAGATGATT
+TGTTTTACGCTGTACAGGAAATTCGGTTGGCACCTTTTGGTATTAGCAATAGTAGCAAGA
+ATCCTATGCTAATAAATCTACTTCGAACAGTTATGAAGTGTGAGGCTTGTGGTAATACCA
+TGATTGTTCATGCGGTATCTGGAAGTTTGCATGGCTATTATGTTTGTCCGATGAGAAGAT
+TACATCGATGTGACAGGCCATCAATAAAAAGAGATTTGGTTGATTATAATATCATTAATG
+AATTGCTTTTTAATTGTAGCAAAATTCAACCAGTTGAAAACAAGAAAGATGCTAATGAAA
+CTTTAGAGTTAAAAATTATTGAGCTTCAGATGAAAATTAATAATTTAATCGTTGCATTGT
+CTGTCGCGCCTGAAGTTACCGCTATAGCAGAGAAAATAAGACTATTAGATAAGGAATTAC
+GAAGGGCTTCGGTATCATTGAAAACTTTGAAGAGTAAAGGTGTAAATTCATTCAGTGATT
+TTTATGCTATTGACTTAACCAGTAAAAATGGACGAGAGTTATGCCGTACACTTGCCTATA
+AAACATTCGAAAAAATCATAATTAATACGGATAATAAAACCTGTGATATCTATTTTATGA
+ATGGCATTGTTTTTAAACACTATCCTTTAATGAAAGTAATATCCGCCCAGCAGGCGATAA
+GTGCTCTCAAATATATGGTTGATGGTGAGATTTATTTCTAAATAATGATCTCGGATTTTA
+AGTTATGCTATGGTGATAAAGTGCAAGACAGAATTAATTATCTTTGACGAAACTTAATGG
+GTAATTACTTTGTTTGCTCCCACAAGCGAGTTTTGTACGGCTGTATTGGGGTAGTAAATG
+AGCTATACAATCTTAATCATTTGTTAGGTGAGAACTCTTGGTCGCAGATTCAAATACTGA
+AAATACGTGACAAATTATTATGAGCAAAATGGTGTATGTCACGTATTTTGAATGGTAGGT
+TAAAAAATAACACCGACTTTCGTAGGTGTTACTAATAATAAAGCAGAGTTTTTAGATAGT
+ATCAATGTGCTTTGTGTATATTGTGGCAAATAATTGGGTTGGGGGTACAATTGTGATTGC
+TTTTGCATGAACATTGCGCCTTTATGCATAATGAGATAAAGGAATATCAAATAAAATAAC
+GATAGGTCATAACAAAGAGGTTTTTATGAAAACACTTATCGTTTCAACTGTATTGGCATT
+CATAACATTTTCTGCGCAGGCTGCAGCATTTCAGGTCACTAGTAATGAAATAAAAACAGG
+AGAGCAACTTACAACGTCTCATGTCTTTTCTGGATTTGGGTGTGAAGGTGGTAATACATC
+GCCCTCATTAACCTGGTCTGGTGTTCCTGAAGGTACCAAAAGCTTTGCCGTAACTGTATA
+TGATCCAGATGCACCTACAGGCAGTGGTTGGTGGCATTGGACTGTTGTTAATATTCCAGC
+AACAGTAACATATTTGCCCGTTGATGCAGGGAGACGTGATGGAACAAAACTGCCGACTGG
+TGCTGTTCAAGGCCGAAATGATTTTGGCTATGCTGGGTTTGGTGGCGCATGTCCTCCTAA
+AGGAGATAAACCACATCATTACCAGTTTAAAGTATGGGCTCTAAAAACTGAAAAGATTCC
+TGTAGATTCTAACTCCAGCGGAGCGTTAGTTGGTTATATGCTTAATGCTAATAAAATCGC
+AACCGCTGAGATAACACCAGTTTATGAGATAAAGTAGGGTGAGAGTATGCTGGCAAGAGG
+TAAGACTAACTTAAAGATCGAAGAAATACGGATGCATAAACATCATGAGATTCATAGGGT
+TAAGCCTCTTATGCCAGCTTTGTGTCGTATCCGTCAGGGAAAGAAAGTTATCAATTGGGA
+GACGCATACTTTAACTGTTGATAATAATCAAATAATATTATTTCCTTGTGGTTATGAATT
+TTATATTGAGAATTATCCTGAAGCAGGGCTTTATCTTGCAGAAATGCTTTACTTACCCAT
+TGATTTAATTGAGAGTTTCCAAAAACTTTATACGGTAACTGATCAAATACGTAACAAAAC
+AAGTTTCTTTTTACCTCAGAATCCTGAGTTAATATATTGTTGGGAGCAACTAAAAACATC
+TGTTTCCCGAGGCTTCTCAACTAAAATTCAGGAGCACTTAGCAATGGGCGTTCTACTTTC
+GTTAGGAGTGAATCATGTTAATCATTTACTTTTATCATATAGTAAACAATCATTGATAAG
+TCGTTGTTATAACCTGCTGCTATCCGAACCCGGCACAAAATGGACAGCAAACAAGGTTGC
+TCGATATCTCTACATTTCTGTTTCTACATTACATCGCCGTCTAGCAAGCGAGGGGGTAAG
+TTTCCAAAGTATACTGGACGATGTGAGGTTAAATAATGCGTTGTCTGCTATACAAACGAC
+GGTAAAACCTATAAGCGAGATTGCCAGAGAAAATGGTTATAAGTGTCCTTCTCGTTTTAC
+TGAAAGATTTCATAATCGTTTTAATATAACACCAAGAGAGATAAGAAAAGCTTCCAGAGA
+GTAAAAGTGTTTTAAGAAGGAGCAATTCTATCGATTTTGATTTTGGGAAATCAACACGGC
+ATAATTATGTCACCGGAGCCTGAACAACTCCGGTGACTTCTGCGCTAAACGGGGACGTTT
+ATGCGCACATACAATCCAAACTCTCTTCTCCCTTCACAGATGCAGAAATGCACCTGCAAT
+TCTTTGCATCTAGCGTTTGACCTCTGCGGAGGGGAAGCGTGAACCTCTCACAAGACGGCA
+TCAAATTACATCGCGGCAACTTCACCGCTATCGGTCGGCAGATCCAGCCTTATCTGGAGG
+AGGGCAAATGCTTTCGCATGGTGCTTAAACCGTGGCGTGAGAAACGCAGTCTTTCCCAGA
+ATGCACTCAGCCACATGTGGTACAGCGAAATCAGTGAATACCTCATCAGCAGGGGTAAAA
+CGTTCGCCACTCCAGCTTGGGTAAAAGATGCTCTCAAACACACATATCTCGGTTATGAAA
+CCAAAGACCTGGTTGATGTCGTAACCGGTGATATCACCACTATCCAGTCGTTACGCCATA
+CCTCCGATCTTGATACCGGAGAGATGTATGTCTTCCTGTGTAAGGTTGAAGCCTGGGCGA
+TGAATATTGGTTGCCACCTGACTATTCCACAGAGCTGCGAGTTCCAGCTGCTGCGCGACA
+AGCAGGAGGCGTAATGGCTACACCGCTTATTCGTGTCATGAACGGACACATCTACAGAGT
+ACCAAATCGTCGTAAGCGTAAACCTGAGCTGAAGCCATCCGAAATACCAACACTGCTCGG
+ATATACCGCCAGCTTGGTTGATAAAAAATGGTTGCGACTGGCAGCAAGGAGGAGTCATGG
+CTGATTTGAGAAAAGCAGCGCGTGGTCGGGAATGCCAGGTAAGAATCCCTGGCGTATGTA
+ATGGCAACCCTGAAACGTCTGTACTGGCACATATCCGGCTGACTGGATTGTGCGGCACCG
+GTACGAAACCGCCAGACCTGATTGCCACCATTGCATGTTCTGCCTGCCACGACGAAATCG
+ACCGCCGCACGCATTTTGTTGACGCTGGATATGCAAAAGAATGCGCGCTGGAAGGTATGG
+CGAGAACACAGGTTATCTGGCTGAAAGAGGGGGTTATTAAGGCGTGAATACCTACAGCAT
+CACATTACCCTGGCCTCCGAGCAATAATCGCTATTACCGCCATAATCGCGGGCGCACGCA
+CGTCAGCGCAGAGGGGCAGGCATACCGCGATAACGTCGCCCGAATCATTAAAAACGCAAT
+GCTGGATATCGGCCTGGCTATGCCTGTGAAAATCCGCATTGAGTGCCACATGCCGGATCG
+CCGTCGCCGTGACCTGGATAATCTGCAAAAAGCCGCTTTTGACGCACTCACTAAAGCAGG
+TTTCTGGCTGGATGATGCTCAGGTCGTTGATTACCGCGTTGTGAAGATGCCTGTTACCAA
+AGGTGGGAGGCTGGAACTGACCATCACCGAAATGGGGAATGAATGATGTTTGAGTTTAAT
+ATGGCAGAACTTCTTCGCCACCGCTGGGGGCGTCTGCGCTTATATCGTTTCCCCGGTTCT
+GTTTTGACCGATTACCGAATACTGAAGAATTACGCCAAAACCCTGACAGGAGCAGGAGTA
+TGAAGTCAGAGATAACAATCAACTAATACTGTTTTGTTGATTTTTGCTTGTAATTGGCGT
+TCTGGTCTGATTTTTGTGGAGTAAGTTGATGCGTGATATTCAGATGGTTCTTGAGCGTTG
+GGGAGCGTGGGCGGCTAATAATCATGAAGATGTGACCTGGTCGTCCATTGCCGCCGGTTT
+TAAGGGATTAATTACTTCAAAAGTAAAATCTCGCCCGCAATGTTGTGACGATGACGCGAT
+GATCATTTGCGGGTGCATGGCCCGTCTGAAAAAGAACAACAGCGATTTGCACGATTTATT
+AGTAGATTATTATGTAGTCGGTATGACATTCATGTCACTGGCAGGTAAGCATTGCTGCTC
+TGATGGTTATATCGGGAAAAGGTTACAGAAGGCTGAGGGCATAATTGAAGGGATGTTAAT
+GGCATTAGATATCCGGTTAGAGATGGATATCGTTGTTAATAACTCTAATTAATATGCCAA
+TTGTTTACTAAAAATTATTAAAAATGGGGCGTTGAGACGCCCCCAAAAATAAAGGGTAAT
+ATATAACAGAAGGTTTATATAGTTAGAAGCAAGGTTGTGCTTCTAAAGGAAGTGGCTTGA
+GGGAGCCACTTATATGTTGGGGAGGCAACGCCTCCCGCAACATATCTTTTTCGTAATCAG
+ATTAGAACTGGTAAACCAGACCTACAGCAACGATGTCATCAGTGCTTACACCGAGTGCTT
+TAGGGAAGGTGCGAATAAGCGGGGAAATTCTTCTCGGCTGACTCAGTCATTTCATTTCTT
+CATGTTTGAGCCGATTTTTTCTCCCGTAAATGCCTTGAATCAGCCTATTTAGACCGTTTC
+TTCGCCATTTAAGGCGTTATCCCCAGTTTTTAGTGAGATCTCTCCCACTGACGTATCATT
+TGGTCCGCCCGAAACAGGTTGGCCAGCGTGAATAACATCGCCAGTTGGTTATCGTTTTTC
+AGCAACCCCTTGTATCTGGCTTTCACGAAGCCGAACTGTCGCTTGATGATGCGAAATGGG
+TGCTCCACCCTGGCCCGGATGCTGGCTTTCATGTATTCGATGTTGATGGCCGTTTTGTTC
+TTGCGTGGATGCTGTTTCAAGGTTCTTACCTTGCCGGGGCGCTCGGCGATCAGCCAGTCC
+ACATCCACCTCGGCCAGCTCCTCGCGCTGTGGCGCCCCTTGGTAGCCGGCATCGGCTGAG
+ACAAATTGCTCCTCTCCATGCAGCAGATTACCCAGCTGATTGAGGTCATGCTCGTTGGCC
+GCGGTGGTGACCAGGCTGTGGGTCAGGCCACTCTTGGCATCGACACCAATGTGGGCCTTC
+ATGCCAAAGTGCCACTGATTGCCTTTCTTGGTCTGATGCATCTCCGGATCGCGTTGCTGC
+TCTTTGTTCTTGGTCGAGCTGGGTGCCTCAATGATGGTGGCATCGACCAAGGTGCCTTGA
+GTCATCATGACGCCTGCTTCGGCCAGCCAGCGATTGATGGTCTTGAACAATTGGCGGGCC
+AGTTGATGCTGCTCCAGCAGGTGGCGGAAATTCATGATGGTGGTGCGGTCCGGCAAGGCG
+CTATCCAGGGATAACCGGGCAAACAGACGCATGGAGGCGATTTCGTACAGAGCATCTTCC
+ATCGCGCCATCGCTCAGGTTGTACCAATGCTGCATGCAGTGAATGCGTAGCATGGTTTCC
+AGCGGATAAGGTCGCCGGCCATTACCAGCCTTGGGGTAAAACGGCTCGATGACTTCCACC
+ATGTTTTGCCATGGCAGAATCTGCTCCATGCGGGACAAGAAAATCTCTTTTCTGGTCTGA
+CGGCGCTTACTGCTGAATTCACTGTCGGCGAAGGTAAGTTGATGACTCATGATGAACCCT
+GTTCTATGGCTCCAGATGACAAACATGATCTCATATCAGGGACTTGTTCGCACCTTCCTT
+AGTGAAGTCATTTTTGTCAAGCAGGTTGATTTTGTAATCAACGAAAGTAGACATATTTTT
+GTTGAAGTAATAGGTTGCACCTACATCAACATATTTGACTAAGTCCTGATCGCCCCATAC
+TCCAAGATCCTTACCTTTAGATTGCAGGTAAGCAACGGACGGACGCAGACCGAAATCGAA
+CTGATATTGTGCAACAGCTTCGAAGTTTTGGGCTTTATTAGCAACGAAGTGATCAGCAAA
+TACAGTCATATTCTGGGTTTCAGAATAGGTAGTGGCCAGGTAAATGTTGTTAGCGTCATA
+TTTCAGACCTGCGGCCCAAACTTCTGCATTTTTACCGGAAGCAAATACTTCAGGAAGAAC
+TTTCCCTGCATTAACTTGAGTGTCGGTACGATCAGATTTCGCATAAGTTGCACCGATACC
+GAATCCTTCGTATTCATAGGTAGCAGAGAAACCGAAGCCATCACCGTTACCTTCAGTGTA
+GTTATCGAAATCGCTACGATCGTTTTTGCCTTGGTACTGAGCAGCAAAGTTCAGACCATC
+AACCAGACCAAAGAAGTCGTTGTTACGATAGGTTGCAACACCAGTTGCACGTTGAGTCAT
+GAACACGTCGGTTTGAGTCCAAGTGTCACCACCGAATTCTGGCAGGACGTCAGTCCACGC
+ACCGATGTCGTATGCTACACCGTAGTTACGGCCGTAATCGATGGAGCCGTAGTCACCGAA
+TTTCAGGCCAGCGAAGGCAAGACGGGTTTTATCTTTGGAGGAACCTTGAGATTCAGCGCG
+GTTGCCTTTGAATTCATATTCCCACTGACCGAAACCAGTCAGTTGATCGTTGATTTGGGT
+TTCACCTTTGAAGCCAAGACGGGCATAAGTAGTATCACCATCATCTGCATCATTAGAGGA
+GAAGTAGTGCTTAGCATTAACTTTCCCGTACAGATCCAGCTTGTTACTGTCTTTATTATA
+AATTTCAGCTGCCTGAGCAGACATCGCCATTAGTACTGATGCAGCTACAGCAGAAATTGC
+CACTGTTAATTTTTTCATCGTGAGCCCTTTTTTTGAACTATTATTAAAAAATGATGTCAC
+TGCGCGATAAATATTCATCTAATCAATGTGATTATTTCAAGATGTAAGTTTTGGTTTCTC
+GTTTGATTTGTGAAGTAGATCTCTATTTTTATCTGAACTTTTTTCTATCGAATCCTATTC
+ATGGCTCTTGGCTGAATAAAAATAAATCTATTAGCCAATTTATATTAACGGCTGTTATTT
+ATAAGTGCTCTATAATTTGAAGGTTCAATTTAAACCGGCTAAAAATAACACTGGAAATTA
+TTTTTTGGTTATTTGTTGAGATTTGCTTATGTATTTGTAGTGGTGTTTTCAATACTCGGT
+AGCATTCTCTCAAATATCATTTAGTGGTTTACGTACGTAAAAAATTGGTTATGCTGTTAA
+GAGTGGTTACTTCGTCACACAGCTTAAACCCGCCGTCGAGCGGGTTTTTCCATTTTTTGA
+GTCTCGATATTAGCTGATAACCCAATACCTGAGTTATTCACTGACTCCGAGTCTGTTACG
+TTTCGTAGTATTCCCTCAATTTACACCCGCTTTGTCTGCGAGGTGGGGTTATGAAATCCA
+TGGATAAGTTAACAACGGGTGTCGCCTATGGCACCTCAGCAGGTAGTGCCGGGTACTGGT
+TTTTACAGCTGCTAGATAAAGTCACTCCCTCACAGTGGGCAGCAATAGGTGTGCTGGGTA
+GCCTGGTATTTGGCCTGCTGACGTACCTGACAAACCTTTATTTCAAGATTAAAGAAGATA
+AGCGCAAGGCTGCGAGAGGTGAATAATGCCTCCATCATTACGAAAAGCCGTTGCTGCTGC
+TATTGGTGGCGGAGCAATTGCTATAGCATCAGTGTTAATCACTGGCCCAAGTGGTAACGA
+TGGTCTGGAAGGTGTCAGCTACATACCATACAAAGATATTGTTGGTGTATGGACTGTATG
+TCACGGACACACCGGAAAAGACATCATGCTCGGTAAAACGTATACCAAAGCAGAATGCAA
+AGCACTCTTGAATAAAGACCTTGCCACTGTCGCCAGACAAATTAACCCGTATATCAAAGT
+CGATATACCGGAAACAACGCGCGGCGCTCTTTACTCATTCGTTTACAACGTGGGTGCTGG
+CAATTTTAGAACATCGACGCTTCTTCGCAAAATAAACCAGGGCGATATCAAAGGCGCATG
+TGATCAGCTGCGTCGCTGGACATACGCTGGCGGTAAGCAATGGAAAGGCCTGATGACTCG
+TCGTGAGATTGAGCGTGAAGTCTGTTTGTGGGGGCAACAGTGAGCAGAGTAACCGCGATT
+ATATCCGCTCTGATTATCTGCATCATCGTCAGCCTGTCATGGGCGGTCAATCATTACCGT
+GATAACGCAATCGCCTACAAAGTCCAGCGCGACAAAAATGCCAGAGAACTGAAGCTAGCG
+AACGCGGCAATTACTGACATGCAGATGCGTCAGCGTGATGTTGCTGCGCTCGATGCAAAA
+TACACGAAGGAGTTAGCTGATGCGAAAGCTGAAAATGATGCTCTGCGTGATGATGTTGCC
+GCTGGTCGTCGTCGGTTGCACATCAAAGCAGTCTGTCAGTCAGTGCGTGAAGCCACCACG
+GCCTCCGGCGTGGATAATGCAGCCTCCCCCCGACTGGCAGACACCGCTGAACGGGATTAT
+TTCACCCTCAGAGAGAGGCTGATCACTATGCAAAAACAACTGGAAGGAACCCAGAAGTAT
+ATTAATGAGCAGTGCAGATAGAGCTGACCATATCGATGGGCAACTCATGCAATTATTTTG
+AGCAATACACACGCGCTTCCAGCGGAGTATAAATGCCTAAAGTAATAAAACCGAGCAATC
+CATTTACGAATGTTTGCTGGGTTTCTGTTTTAACAACATTTTCTGCGCCGCCACAAATTT
+TAGCTGCATCGACAGTTTTCTTCTGCCCAATTCCAGAAACGAAGAAATGATGGGTGATGG
+TTTCCTTTGGTGCTACTGCTGTCTGTTTGTTTTGAACAGTAAATGTCTGTTGAGCACATC
+CTGTAATAAGCAGGGCCAGCGCAGTAGCGAGTAGCATTTTTTTCATGGTGTTATTCCCGA
+TGCTTTTTGAAGTTCGCAGAATCGTATGTGTAGAAAATTAAACAAACCCTAAACAATGAG
+TTGAAATTTCATATTGTTAATATTTATTAATGTATGCCAGGTGCGATGAATCGTCATTGT
+ATTCCCGGATTAACTATGTCCACAGCCCTGACGGGGAACTTCTCTGCGGGAGTGTCCGGG
+AATAATTAAAAACGATGCACACAGGGTTTAGCGCGTACATGTATTGTATTATGCCAACAC
+CCCGGTGCTGACACGGAAGAAACCGGACGTTATGATTTAGCGTGGAAAGATTTGTGTAGT
+GTTCTGAATGCTCTCAGTAAATAGTAATGAATTATCAAAGGTATAGTAATATCTTTTATG
+TTCGTGGATATTTGTAATCCATCGGAAAACTCCTGCTTTAGCAAGATTTTCCCTGTATTG
+CTGAAATGTGATTTCTCTTGATTTCAACCTATCATAGGACGTTTCTATAAGATGCGTATT
+TCTTGAGAATTTAACATTTACAACCTTTTTAAGTCCTTTTATTAACACGGTGTTATCGTT
+TTCTAACACAATGTGAATATTATCTGTGGCTAGATAGTAAATATAATGTGAGACATTGTG
+ACGTTTTAGTTCAGAATAAAACAATTCACAGTTTAAATCTTTTCGCACTTGATCGAATAT
+TTCTTTAAAAATGGCAACCTGAGCCATTGGTAAAACCTTCCATGTGATACGAGGGCGCGT
+AGTTTGCATTATCGTTTTTATCGCTTCAATCTGGTCTGACCTCTTTGTGTTTTGTTGATG
+ATTTATGTCAAATATTAGGAATGTTTTCAATTAATAGTATTGGTTGCGTAACAAAGTGCG
+GTCCTGCTGGCATTCTGGAGGGAAATACAACCGACAGATGTATGTAAGGCCAACGTGCTC
+AAACCTTCATACAGAAAGATTTGAAGTAATATTTTAACCGCTAGATGAAGAGCAAGCGCA
+TGGAGCGACAAAATGAATAAAGAACAATCTGCTGATGATCCCTCCGTGGATCTGATTCGT
+GTAAAAAATATGCTTAATAGCACCATTTCTATGAGTTACCCTGATGTTGTAATTGCATGT
+ATAGAACATAAGGTGTCTCTGGAAGCATTCAGGGCAATTGAGGCAGCGTTGGTGAAGCAC
+GATAATAATATGAAGGATTATTCCCTGGTGGTTGACTGATCACCATAACTGCTAATCATT
+CAAACTACTTAACCTGTGACAGAGCCAACACGCAGTCTGTCACTGTCAGGAAAGTGGTAA
+AACTGCAACTCAATTACTGCAATGCCCTCGTAATTAAGTGAATTTACAATATCGTCCTGT
+TCGGAGGGAAGAACGCGGGATGTTCATTCTTCATCACTTTTAATTGATGTATATGCTCTC
+TTTTCTGACGTTAGCCTCCGACGGCAGGCTTCAATGACCCAGGCTGAGAAATTCCCGGAC
+CCTTTTTGCTCAAGAGCGATGTTAATTTGTTCAATCATTTGGTTAGGAAAGCGGATGTTG
+CGGGTTGTTGTTCTGCGGGTTCTGTTCTTAGTTGACATGAGGTTGCCCCGTATTCAGTGT
+CGCTGATTTGTATTGTCTGAAGTTGTTTTTACGTTAAGTTGATGCAGATCAATTAATACG
+ATACCTGCGTCATAATTGATTATTTGACGTGGTTTGATGGCGTAGATGCACGTTGTGACA
+TGTAGATGATAATTATTATCATTTTGTGGGTCCTTTCCGGCGATCCGACAGGTTACGGGG
+CGGCGACCTCGCGGGTTTTCGCTATTTATGAAAATTTTCCGGTTTAAGGTGTTTCCGTTC
+TTCTTCGTCGTAACTTAATGTATTTATTTAAAATACCCCCTGAAAAGAAAGGAAACGACA
+GGTGCTGAAAGCGAGCTTTTTGGCCTCTGTCGTTTCCTTTCTCTGTTTTTGTCCGTGGAA
+TGTGCAATGGAAGTCAACAAAAAGCAGCTGGCTGACATTTTCGGTGCGAGTATCCGTACC
+ATTCAGAACTGGCAGGAACAGGGAATGCCCGTTCTGCGAGGCGGTGGCAAGGGTAATGAG
+GTGCTTTATGACTCTGCCGCCGTCATAAAATGGTATGCCGAAAGGGATGCTGAAATTGAG
+AACGAAAAGCTGCGCCGGGAGGTTGAAGAACTGCTGCAGGCCAGCGAGACAGATCTCCAG
+CCAGGGACTATTGAGTACGAACGCCATCGACTTACGCGTGCGCAGGCCGATGCACAGGAG
+CTGAAAAATGCCAGAGACTCCGCTGAAGTGGTGGAAACCGCATTCTGTACTTTCGTGCTG
+TCGCGGATCGCAGGTGAAATTGCCAGTATTCTCGACGGGATCCCCCTGTCGGTGCAGCGG
+CGTTTTCCGGAACTGGAAAACCGACATGTTGATTTCCTGAAACGGGATATCATCAAAGCC
+ATGAACAAAGCAGCCGCGCTGGATGAACTGATACCGGGGTTGCTGAGTGAATATATCGAA
+CAGTCAGGTTAACAGGCTGCGGCATTTTGTCCGCGCCGGGCTTCGCTCACTGTTCAGGCC
+GGAGCCACAGACCGCCGTTGAATGGGCGGATGCTAATTACTATCTCCCGAAAGAATCCGC
+ATACCAGGAAGGGCGCTGGGAAACACTGCCCTTTCAGCGGGCCATCATGAATGCGATGGG
+CAGCGACTACATCCGTGAGGTGAATGTGGTGAAGTCTGCCCGTGTCGGTTATTCCAAAAT
+GCTGCTGGGTGTTTATGCCTACTTTATAGAGCATAAGCAGCGCAACACCCTTATTCCAGC
+TGGCTTCGTGGCTGTTTTCAACAGTGATGAGTCATCGTGGCATCTCGTTGAAGATCATCG
+GGGTAAAACGGTTTATGACGTAGCGTCAGGGGACGCGTTATTTATTTCTGAACTCGGTCC
+GTTACCGGAAAATGTTACCTGGTTATCGCCGGAAGGGGAGTTTCAGAAGTGGAACGGTAC
+AGCCTGGGTGAAAGATGCAGAAGCAGAAAAACTGTTCCGGATTCGGGAGGCGGAAGAAAC
+AAAAAACAGCCTGATGCAGGTAGCCAGTGAGCATATTGCGCCACTTCAGGATGCTGTAGA
+TCTGGAAATCGCAACGGAGGAAGAAACCTCATTGCTGGAAGCCTGGAAAAAATATCGGGT
+GTTGCTGAACCGTGTTGATACATCAACTGCACCTGATATTGAGTGGCCTACGAACCCTGT
+CAGGGAGTAATCATTGGGATTATGCCGCAGCACGTCTTAAGCAAGAACATGCTGCGGTTG
+GATGCTATTTTTTTCCTGAAGCGGAAAACATTACTACAGTACCTTGAACCTTGGTTTTAA
+CATTCTCGAAATGCTCTGAGAGTATATGTGTTAAGCCTTCTTCGGAATCTTTTGTGTTTG
+AAAAGATGCCTTTCTGATTGTAAATGCGCATCAGTTTTTGACCGAAGCTATTGTGCACAA
+CTCCATCGCCAAGAATTGTGGCTCCGTATAGAGTTCCATCGTCAGTTAAGGCCTGCGCCG
+CATTGCGTATTACACAGCTTTTTGTAGATATATTTCCAGGCAGGCAGTGAAGAAGGTAAG
+ACATGGAAATGGAATCAAATTGACCATGTAACGCCGCGGGATAAGGTTCAAAAACATCAT
+GGCTAATTTTATGTTTAATTTTTGATTCCCCAGCCCTTGTAGATGCCGCGTTCAGGCTAG
+CTTCGTTCAAATCCATTAAAGATATCAGACTACTCTCAGGTACGTGAGTAAGGTAAAACC
+CAGTTCCAACACCAATATCCAGATGGTTGTTACCTAAATGTTCCAGAAAGTGTGGAAGAA
+GGTGTTCCTTTGTAGGACATCCCCATGCAAGCCGATTTGATACTCCCAAAACCCACCAGT
+CATAAAGCTTTAGGGTAAGTGGTGTGTAAATTCTAGCCCCATCATCTGTGTTTTTTTATT
+AATTTCACCATGTTATAGTTTTATTTGTGAATTAAATCAATTATGGCAATGAATTACAAG
+GGGTTAAATGCTGCCGCAGCATAGCGATATTGAAATAGCCTGGTATGCTTCAATACAGCA
+GGAGCCGAATGGCTGGAAGACCGTCACCACACAGTTCTACATCCAGGAATTCAGTGAGTA
+TATTGCGCCACTGCAGGATGCTGTAGATCTGGAAATCGCAACGGAGGAAGAAAGATCGTT
+GCTGGAAGCCTGAAAAAAGTATCGGGTGCTGCTAAACCGTGTGGACACTTCCGTAGCACC
+AGATATCGAGTGGCTTATTCAACCATAATAAACAGTATGTATATCATAGGTTATTAATTG
+TGAGTTTTTTCGGTGTGTTATTTGTTTGTTTGATGTTATGCTTTTGCGCCCCAAAAGGTT
+GTTTAGATGTATTTTATCAATTGATTTTCAATATCGTTTAATAAAGAAAAATTAAGCAAG
+CTGGATGTTGGTTTTTTGTTAATTGAATGGTTCTAATAATGTTTTTTTACTGTTGTTGAA
+TGTGACTTGATAAGAAATGCAAGTAAAAATGATACTCTTTTTATTTTAAATTCAAACGGT
+TGACATATATATAGCAAGAGGTTTCAGGTGCGTTGTAGTGAGTTTATGTTAATAAAAAGC
+ATAGTAAGCGTTGAAAAATGTAACTTTGAAATAAGTTAGAATAAAAAACAACATACATAT
+AATAATTTAATCTTAAATGAAATTTATTAAAATTTGCAAACTATAATTTTGTGTATAAAA
+ATATAAATGCACATCATCCTGATTATGATTGTGTATTTAATTGGTTGTTATTTGACTACT
+ATCAACTTGTTTTAATTTTATGATAGGTGCAAGATGGATTATGTTTGCTCCGTAGTTTTC
+ATCTGTCAATCATTTGATTTAATTATAAACAGGAGAGTTATCTCGTTCAAAAAAAATTCA
+TTGTTTATTGTAAGCGACAAAATTAGAAGGGAGTTACCAGTATGCCCCTCTAAACTAAGA
+ATTGTTGATATAGATAAGAAAACATGTTTATCCTTTTTTATCGACGTGAATAATGAGCTG
+CCTGGCAAATTTACTCTTGATAAGAATGGCTATATTGCTGAAGAGGAACCTCCATTATCG
+CTTGTTTTTTCTCTGTTTGAAGGGATTAAAATAGCAGACTCACACTCCCTTTGGTTAAAA
+GAAAGACTATGTATATCCTTACTTGCCATGTTCAAAAAACGCGAAAGTGTAAATTCATTT
+ATACTAACAAATATAAATACATTTACCTGTAAAATTACTGGAATAATCAGTTTTAATATT
+GAGCGGCAATGGCATTTAAAAGATATTGCGGAATTGATTTATACGAGTGAAAGTTTAATA
+AAAAAAAGATTAAGGGATGAAGGAACGTCATTTACTGAAATATTGAGAGATACTAGGATG
+AGGTATGCAAAAAAACTCATAACTTCAAACTCTTATTCTATCAATGTCGTAGCCCAGAAA
+TGTGGCTATAACAGTACTTCATATTTCATATGTGCATTTAAAGATTATTATGGTGTCACG
+CCATCTCATTATTTTGAGAAAATAATCGGCGTCACAGATGGAATAAACAAAACAATTGAC
+TGA
+>NC_000913.3|provirus_1196867_1213107
+TTATATTGCATTACAACTCCCAACAGTGACATATGAACTTCCTGCTTTACTCCACGACTT
+TAATATTTCAAGGCCATGTGAAGAACATATTTCTTGCACTGCGAGTTCATCGAGTAATCC
+ATAGTAAGAAACACTTTTTGAATTTTTGTAAATGTATCCGTAAAGATGTTTTCTTCCTGT
+TTCGTATTTTTTGAAGTATGAGCTTTTATATTGATTTACAATAAGAGTCTCACCTCCTGA
+TTTTAGTAATCTCTTGATGCTAAGAACTATTTTGTCGATTGTATCCCGACAAGGAACGGC
+AGAGAGAACATTAGAGCAAAGGATGAAATCGTAACCCCCAATTATTTTGTCGACATCCTC
+GAAAGCAACTGTATTTGCATTTTTATAATATCGTGGGACATAGTCAATAATTTTAGTTTT
+AATTCCTCTAATAATTTGCTCTCTTTCAAGTTGCCTTTTCGAGTCTAGAAAAGTAACTTC
+ATCAAATTTACTGATTAATTCATCAGAATATCTAAGTTTTCCGCAGCCAAAATCAAGGGC
+GTGGCCATTTTTCTCAATGCTTCTAATATACTCGCAAAGATATCTAGAGGGCATCGTATG
+AGGTTTTGCTGCATTCTCTGAGCGAATATTAACTCCGTGCATATTATAGTTCAAAGCAAG
+TACCATTCAATTAATGTTATTTTTAGTGAAAAATTCTTTTATTTTATCGTCCGGGATTTT
+TCCGACTTGACTTTCAGTTCTGGGCTTAACTGTCAAAGCAAAGATAATACCACTCACTGA
+GAATGATAAAATTACAAAAAAGAATAAAGACAGCAAAGAACCTTCAACATGAAAAATATC
+CATTTGTTTGCAAAAAAAGATTATTAGGAAGGAAATTAATGCAATTATCGAAAATTCAAA
+AAATATCCAAAAATAGTATACTTTATTCCAGAAGAGTTCAATATAATGTTTGTCTTCAAT
+TTTTCTTACTTCAGGGTAATATAGATTGCTCATTACATTGTGAGCTTCATCTTTATTTAA
+TTTTCTGTTGACTCCAGCTCTCCGTGATAACGGTTTTATAATTAGATGCTTATCCCAAAG
+ATATCGCACCCGAAGTAGTTTGGCTGCATTGTTATGTAGGTCTAACGCACCGCTAATTAA
+ATATGCAAAAATCGCAAAAGCACAAGGTAATATACCAAAAGATAGTGCCCAATTAATAAA
+GCTCTCATGATCTTTAATAGGTGGGACATACTTGGTTGGTAATGTTATTAAAGGGATGTA
+TTCGTAAATAACTAGAAGTATGCAATATATTAGCGTATTTAAGAAAGTTGCTTTATGAAG
+TTTAGGCAACATTTCATTATAATTTTTGGGGGGTTCGAACATATTATTCACCTGAGTCAC
+GCTTTAGGATAGTGTAATGGTAATATTTAATTAAGTGTCATTATATACTTTTCAGTAGGT
+TAGTTACAATTTTTTGTATCTGTTCAGGCTGACCTAGCTTCGCTGACAGACAATATTGTG
+ATCAGTAGCACGTATCGAGGAGGAGTAGCGCTACAAATTTGACGCTGGGTGAGAATCTGA
+AATTGATAGAAATGAAATAATGAAATAATGAAATGATGAAATGATGAAATGATGAAATGA
+TGAAATGATGAAATGATGACAGAGTGTCCAGTGGGCACGGATGGTGTCTTACGACATGCT
+TACCTTAATCGTTCCCAGTGTGCCTATAGCAGATATTCTAAACATGTCGATAATTCATTA
+CGCATATAGTATCGAACATAGAAAAAACTGAAGATTCATCTTATTTTGTATATACTACCT
+AGCCCAACAATGTAGAGGTTAACGAAAAATGCGCTCACCAATTTGTCATCTTTTCTCAGC
+AATTAATTCATCACCATTTAAGATTGCACCAGAGAAGGAGCAAGATCTTAAAACGATAGT
+TGACGACAAAAAAATTATAATTTCAGTTGTGAGTGAACCTGGTTTTAATATCCGAGTCAG
+GAAGAATGAGAGTAATAATTCACATGAAATAGTTCTAACAGTAGCTTCACTTGAATATAT
+TTGGGCATTTTCCAATTTCTTTTGGGTTTTTACGCAAGAGTACTCCAAATCTCAGAAAAA
+TAATGATGAGCACTTTGATTTAACAGGAAAAAATAGGCTTAAAAAGTCTGATGAACTTCT
+TAAATGGGCAAGGAAAAACTTGCAAACAACAGGTTGCGAATCATGGCCTAAAAAATGTCC
+CAAGCCAGAAGCATATTTACAAGGAAGCGAAGACTCACAAGTTGCTAGCGAGATATTTCT
+TTGTGCTATTGCTTGGATTCTTCATCATGAAATAAGTCATGTTGTTTTACAGCATCCATT
+GGTCACTACAGCATTCTCCACTCAAGAGGAGCGTGAAGCAGATTCACATGCTACAAAATG
+GATATTAGGCAACCTGTATGAATCCGCTCCTGAATTAAAGAAACGTGCACTTGGCATTGC
+TACGGCAGTGCTTTGTATACAAAGCTTAGAAGTTGAAAATTACTTCTGTTTACAAAATAC
+ACACCCAGCTGCATATGAGCGTATATATTCGAATATTTCATGCTACCCTGTCGGAAATGA
+AGAGTTGATTGAAGCTCTATGTACAGTGATGCTTCAATATCTTTTCCATGGCAAAAATAT
+CAATGTGAATCTAGATGGGGAGTCCTTTTCATCGATTTTAGGTGATCTTCTCTGTGATAT
+TTCACGTCTTACCAGTAACTGATATGGCTGTCCGCCGCTCGCTTAAAGTGGACTTTTTAG
+TTTTTATCATGTGCGGTGAGAAATTCAATGTGGCGTTGAGATGCTTAAAGGTTCACAACG
+CTACTTTGCTCCATCCTTTACCTCGATCATCATGATAACGATCGGTTTGTTGTTGTGTTT
+TATGACCAAGTAGTTTTTGTGTGTCTAACCCCTGTTCTTTATACAGACGTTCAGATAAAG
+ACCTTTGCTCATGGAATGTCGCAGGTGAACCCTCTCCCCAGTCAATTCTTGCTAAATCTC
+TCGCTTTACTAAAATTCATCGTCAATGTATTGGCTTTAACCTGCGCTCCGCGCTCTGCTT
+GTGAAGTTGAACGAAAAAAATGCACTAAGTATGCACTGACTGCATAGTCACGGCAGCGGG
+CTACTACATCGCGTAAACTCCAGTTAATCGCATTGAGGCGAAGAGAAAGAGGAATTGCGA
+TTTTGCTCCCGGTCTTTTCCTGAATGACATGAAGATGATCATCCCAAATATCGCTAAATT
+TCATACGCGAAATATCACCTAACCGCTGACCAGTAACCAGCGCTAACAGCATGGCATTTC
+CCATGTAACGATGAGTAGCGTCTGCGATATCGAAGATTTTTTTCCATTCTTCAAGGCTCA
+GCCGTTGTCGGGTAATTTTTCTTCTTGGTTGTTTAGTGGCTAATGCTGGGTTATAGCCAG
+GAGGTACTTCTCCGTAGTGCTGCGCCTCTTTGAAAACATCAATCAGGACGGAGCGAACTA
+CTTGTGCCATTCTTGGCCGCCCAGCGGCGATATACTCATCAAGCAATTGTGCTATATCTC
+TGACATCAACGGCTGAGATCAACTTCATTCCTGCTCGTTCTCTGAGCAAGGATACTGGTT
+TAGCTTTTTGTTTATAGGTGTTGAGTCTTATATCACCACTTTTAAGCCTGTCATCCTGGA
+TCGCTTGATAGCGATCTAACCAGGTTGACGTTGTGATAGCCTTTCCTTTGCTGGTTGCGA
+TCCTGTCACTGATAGCCAGAATCTGCCGGGTTCTTTGTTCAGCCAGGCGAGTGTTGGCCT
+CAGTGGCAATAGCGATAGCTTCAGCTTCGTTTGTTCCCAAAGCATGGAATTTTCCTGTCA
+CTGGATGCTTATACCGCCAATAGACTTTATTTACCTTCCTACTATAAAGCGGATATAAGT
+TAGGGACTGAAACATTATTCTTACGCGGTCTGGCTGCCATTACTCAAAATCCGTTGCAAA
+AGTAATGAGTCATTTTTCTTGATTACAGGTGTTACCAACTCCCCAACTAACTCGGCGTCC
+TCACGCACTCGCCATAACCGGCCTTGTTTCATGGCCGGTGGACAAAATAAATTCTGCTTA
+GCATAACGACGCAATGTGGACACACTTGGAGGATTACTTCTGTATTTTTCAGCAGCCCAT
+TCTTCAAGAGTTAACATTTGAAGCATATGCGATCACCTTATTACTACACTAACTGCTTAG
+TCTCAGCATATCGACCCTGCACGGTCGGTTAGTTTCTCCACAAAACAGAGAAGAGCACCT
+GTGGCCACAGCTATCAGGATGGGTCGGGTTATTAACCCGTCATCCGGGGATACTCTTCTC
+TGTTTTGTAAAAAGGGCGGTACCAGAAAGGACTAAGGAAAAAACTGGTACCGCCAAGACT
+ACACACAGCATAAAGTTGTGGTGTCGGGTGCCCCCGGTGCCTGGCGAAGGTTGCACACCA
+GGCGGGTGGGTATCCACAGAAGGTCGATTGTCAGCCTCAACCTTAACCCGCGTGCGCTGA
+GCCGCATTCACCACAACGCTAAGGATTCTCTCTGGTTGAAAATACTTAGCTGTTATGTGC
+CTGTCTTTTCACCACTTCAGGCTCGGTGGTATGCTGGAGTTCTCACACAGCCAGCAAGCA
+AGGAAACTTAATGAACCAGTTTTATGTTCACGTTCGTCTATTTGAAGACACAGCCGAACA
+GACCAAAAAATTTGAAGAATTAATGCTTAACTTTCTGTACCAGAAAACAGTTAAAGAGTC
+TGACGATAGCTGCTGCAGACTGATTCCAGAGGGATATATCCTCAAAAGTACAATGAACTG
+CCAACAAATCCTTGATCAAACATTTTCAATTGCTAACAGTGCCGGTGTTGACGCAAATAT
+ATTTGTCTGTAAATTTGAACAAAGCGCATGCTTACTTCCGTCTGCTTCCTTAGTTGGTAA
+CGATTTCGTTCATTACGATCTTACGCCTAAGCCCATCAAGCTCGATTCTTAAAGCCTTAA
+CCATTGTGTCGTGATAAACACGGCTCACCTTCTCTCCATTGCATGGCAGAGGGGTGAGTG
+TGTTAGCCATGAAATTCATGAACTCGGTTCGACCAGGGGCTTGCGCCCCGCAAGTCTTTA
+ATGCCTGTTTTGCTAACAAAATGCGGGCCTCAGTGCCTGCATTTGGCTCTATCTGCTGCA
+AACGTTTAGCGTCTTCCAGCAACAATGCGATCACATGCTTCAAATTCTGCTCATTCATCT
+ATTCTCTCCACTGAAATCATCCGCTAACGAATCATCCCGGTCTTCGTACGTACCGGGCGG
+GCTACTTCGTGGGCGTCCTGCCTGTTTGTTGTTTCTCTTGGGTACATTATGTATCTCAAA
+GGTACATTGTCAAGTATAAAAAAACCTGCCGAAGCAGGTTCATAAACATTGATTAGGCTT
+TGATTTTGTATCTTCTTGGTTTTCCTGAGAAAATCACAGTACCAATTATAGAGCAATTAC
+CGTTGATCTTAATGTAAGGCTCAGGCCAGTTTGGGTTTAACGCTTTGAGATAACGCTGTG
+TCCCATCTTCTATCAACCTTTTGAAGGTGGTTTCACCTGTATCGTGCATCAATGCAATAA
+CGTCGTCACCGTGGCAGGCAGGTACTTCAGGATCGACAAAAATCATGTCTCCCGGGCGGT
+ACTCATCAATCATTGAATCACCTATTACCCGCAAGATATAAGTCATTTCCCCACAGGGTA
+CAGGGCAGGGATACGTTTCTGCTGTGCTCAAATCAACCTCAGAATATCCAACTTCTTTCC
+ATGCTCCGGCCTGTACCCATGATATGACAGGGACTAATGTGATTTGTTTATTAGTGATTG
+AAACATCAGGTTTTTTTGTGATGTTCGTTGTCTGGTGTTCTTGATCGAGCCATCCTACAG
+GCAGGTCGAAACATTTTTCGATGTGTCGTGCCATGCTGTCACCGATATTTTTAGTAGCAC
+CATCTCCCATAAACCTGCTGGTCTGGGTTGGCTCGCGATCAATCATAGTGGCAAAGGAAG
+AATTCCCGCCAACACCATCTCTCAGTTTTCTGGCGTTAGACCGCCGGATGTCATGGATTG
+TTTTCATAACGAAATTAAAACCCTTGTACCGTTAAGGTACAAGTATCTTGAAGGTTCATT
+TCAATCATGTAATATGTACACCGGAGGTACATATTGTATGAAAGCGTATTGGGACTCTTT
+AACCAAAGAACAGCAGGGCGAGTTGGCCGGAAAAGTTGGCTCAACACCTGGCTACTTACG
+GCTGGTTTTCAATGGCTATAAAAAAGCCAGTTTTGTGCTGGCTAAAAAACTTGAGCAATA
+CACATCAGGTGCAATTACGAAATCTGACTTAAGACCGGATATCTATCCGAAAGATTAGCA
+GAACACTTTCAATTTTTAACCACAGAACGATGAGGCTAATCGTGGGTAAGCATCACTGGA
+AAATAGAAAAACAGCCTGAGTGGTACGTGAAAGCTGTCAGAAAAACTATCGCGGCGTTGC
+CGAGTGGTTACGCTGAAGCGGCTGACTGGCTCGATGTAACAGAAAACGCTTTATTCAACC
+GCCTTCGTGCAGATGGCGATCAGATTTTCCCGCTGGGATGGGCAATGGTTTTACAGCGTG
+CTGGTGGCACTCACTTCATTGCTGATGCTGTGGCGCAGTCTGCAAATGGCGTCTTTGTGT
+CTCTTCCTGACGTCGAGGATGTGGACAACGCCGATATTAACCAGCGTCTGCTGGAAGTCA
+TTGAACAGATCGGCAGTTATTCAAAACAGATTCGTTCAGCAATCGAAGACGGTGTAGTGG
+AACCGCATGAGAAGACAGCAATTAACGACGAGCTGTATCTCTCAATTTCGAAGCTGCAGG
+AGCATGCAGCACTTGTCTACAAAATTTTTTGCATTTCAGAAAGTAATGACGCCCGCGAGT
+GTGCAGCTCCGGGCGTCGTGGCGTCGATTGCTTCTGGTTGTGGAGAAACTAACGCATGAA
+CAGTTTAACAACACACTACCGTCGCTCGCAACTGATTGCGCTTCCTGTACCGGGTGGAAA
+AGCGAAGGTGGAATATTGCTATGCAGTGAATGTACCAGGTGACAGGGAAATTGTAACCCA
+CAGCTTTGCAGAGTGGGCTGTGGGTGATTTCAACCGGCAGAAGGAGACAGTCCTTTGCGA
+CAAGTTAACCGCTGGTTCAAAGATCACTACGGAGTGCCCGTCAGAGTCATTCGTTGGGAG
+CCGGAAACACAACGGGTTATCTACCTCCGCGAAGGTTATGAGCATGAATGCTTCAGCCCG
+CTCGAACAGTTTCGTCGTAAATTCAGGGAAATAGAGGTCGGTCATGAGCACTAAATTAAC
+CGGCTATGTATGGGATGGTTGCGCTGCATCAGGCATGAAGTTATCCAGCGTGGCAATTAT
+GGCCCGCCTGGCTGATTTCAGTAATGACGAAGGTGTGTGCTGGCCATCAATTGAAACCAT
+TGCCCGTCAGATTGGCGCGGGGATGAGTACCGTCAGAACGGCTATCGCACGGCTGGAAGC
+AGAAGGCTGGTTAACGCGTAAGGCGCGTCGCCAGGGTGATGGTTCATCACCCCACTGTGC
+CGTGGTGGATGAATATCACGAGCACGCCACAGATGCGCTTTACACCACGATGCTTACCGG
+GATGGGGGCGCGACGCCAGCCACTGATGTGGGCCATTACCACCGCCGGGTACAACATTGA
+GGGGCCGTGCTACGACAAACGGCGGGAAGTCATCGAGATGCTCAACGGCTCGGTGCCAAA
+CGATGAACTGTTCGGGATCATCTATACCGTTGATGAAGGTGACGACTGGACCGACCCGCA
+GGTGCTGGAAAAAGCCAATCCAAATATTGGCGTGTCGGTTTATCGCGAATTTTTGTTAAG
+TCAGCAGCAGCGTGCGAAAAATAACGCCCGTCTGGCAAACGTCTTTAAAACAAAACACCT
+CAATATCTGGGCGTCGGCGCGTTCGGCGTATTTCAACCTGGTGAGCTGGCAGAGCTGCGA
+GGATAAATCACTGACCCTTGAGCAGTTCGAGGGGCAGCCGTGCATTCTGGCCTTTGACCT
+GGCGCGTAAGCTGGATATGAACAGCATGGCGCGACTTTATACCCGCGAGATTGACGGTAA
+AACGCATTACTACAGTGTGGCCCCGCGTTTCTGGGTACCGTATGACACGGTGTACAGCGT
+CGAGAAAAATGAAGATCGCCGGACAGCCGAACGCTTTCAGAAATGGGTGGAAATGGGCGT
+TCTGACCGTTACCGATGGTGCGGAGGTGGATTATCGCTACATCCTCGAAGAGGCCAAAGC
+GGCGAACAAAATCAGCCCGGTCAGTGAGTCACCCATCGACCCCTTCGGGGCGACCGGGCT
+GTCACATGACCTTGCTGATGAAGACCTGAACCCCGTCACCATCATTCAGAACTACACCAA
+CATGTCCGATCCGATGAAAGAGCTGGAAGCGGCGATTGAATCGGGGCGCTTTCATCATGA
+CGGCAATCCCATCATGACCTGGTGTATCGGCAACGTGGTCGGCAAAACCATTCCGGGTAA
+CGATGATGTGGTGAAGCCCGTCAAGGAGCAGGCGGAAAACAAAATCGATGGTGCAGTTGC
+GCTGATTATGGCGGTTGGCAGAGCCATGCTGTACGAGAAAGAAGACACGCTGTCTGATCA
+CATTGAGTCCTACGGGATCCGCTCGCTTTAACTGAGGTAATTATGATCATGCTGATTCTC
+GCGCCTCTGGTGGGCGTGCTGGGTGCGCTTTTGCTGGCGTATGGTGCCTGGCTGATTTAT
+CCCCCGGCGGGTTTTGTTGTTGCCGGGGCGCTGTGCCTGTTCTGGTCGTGGCTGGTGGCG
+CGATATCTCGACCGTACACAGTCGTCTGTCGGCGGAGGTAAATAGTGTTCTTTTCGGGAT
+TATTTCAACGAAAAAGTGACGCACCGGTGACCACGCCAGCAGAGCTGGCGGATGCCATCG
+GGCTGTCGTATGACACCTATACCGGAAAGCAGATCAGCAGTCAGCGGGCTATGCGACTGA
+CGGCGGTTTTTTCCTGCGTCAGAGTGCTGGCAGAGTCGGTCGGGATGTTGCCCTGCAATC
+TGTATCACCTGAACGGCAGCCTGAAGCAGAGAGCCACCGGCGAACGTCTGCATAAACTGA
+TCTCCACGCATCCCAATGGCTATATGACGCCGCAGGAGTTCTGGGAGCTGGTGGTCACCT
+GTCTGTGCCTGAGGGGAAACTTTTACGCCTACAAAGTGAAAGCATTTGGCGAAGTGGCTG
+AACTGCTGCCCGTCGATCCCGGCTGTGTGGTATATGCGCTGGGAAGGTGTCAGCGATGGC
+CTGAAGGTGACCGCCGGGAGTGTTATTCAGCGCGATGACCTGGTGCAGTACACGACAACT
+GACGATGCAACCAGCTCCGGTGGTGTCCTGCGCGTGCCGATCGCCTGCTCAAGTGCAGGT
+GCGGTCGGTAACGCTGACGACGGTACGGCATTAATCCTGGTCACGCCGGTGAATGGTCTG
+CCGTCTTCCGGTGTGGCTGACACCCTGACAGGCGGATTTGATACTGAAGAGCTGGAAACG
+TGGCGCGCCCGCGTCATTGAGCGGTATTACTGGACGCCGCAGGGCGGGGCTGACGGGGAC
+TATGTCGTCTGGGCTAAAGAAGTGCCCGGCATTACCCGCGCATGGACATACCGTCACTTG
+ATGGGAACGGGAACTGTCGGTGTGATGATTGCCAGCAGTGACCTGATTAATCCCATTCCG
+GAAGAATCAACGGAAACGGCGGCAAGACAACATATCGGGCCACTGGCCCCGGTGGCAGGC
+TCTGATTTGTATGTGTTCAGGCCGGTGGCACATACGGTGGATTTTCATATCCGCGTGACG
+CCGGACACACCAGAAATACGGGCTGCCATTACCGCGGAGTTGCGTTCGTTCCTGCTGCGT
+GATGGTTATCCGCAGGGAGAACTCAAGGTATCGCGTATCAGTGAGGCGATTTCCGGTGCG
+AACGGGGAATACAGCCATCAGTTGCTTGCACCGGTGGACAATATCTCCATTGCGAAAAAC
+GAACTGGCGGTACTGGGGACGATTTCATGGACGTGACAAACGATGATTACATCCGCCTGT
+TATCGGCACTGTTGCCGCCCGGTCCGGTGTGGTCAGCCAGCGATCCGGCGATTGCCGGTG
+CGGCACCGTCATTAACCCGTGTTCATCAGCGTGCGGATGCCCTGATGCGGGAGCTGGATC
+CGCGCACCACCACTGAACTGATAAACCGCTGGGAGCGTCTGTGCGGTCTGCCGGATGAAT
+GTATTCCGGCGGGAACGCAGACCCTTCGCCAGCGTCAGCAACGGCTGGATGCGAAGGTTA
+ACCTGGCGGGCGGCATCAACGAGGATTTTTATCTTGCACAGCTTGCTGCCCTGGGCAGAC
+CAGATGCCACCATCACGCGATACGACAAAAGCACTTTCACCTGCTCATCGGCCTGTACTG
+ACGCGGTGAATGCGCCGGAATGGCGGTATTACTGGCAGGTCAACATGCCAGCCACCACCA
+ACTCCACCTGGATGACATGTGGCGATCCCTGTGATTCCGCACTGCGTATCTGGGGTGACA
+CCGTTGTCGAGTGTGTGCTTAACAAACTCTGCCCGTCGCATACCTACGTAATTTTTAAAT
+ATCCGGAGTAATCCATGCATCGTATAGACACGAAAACCGCGCAGAAGGATAAGTTCGGCG
+CGGGTAAGAACGGTTTTACCCGTGGTAACCCCCAGACCGGCACGCCTGCCACCGATCTGG
+ATGATGACTACTTTGACATGTTGCAGGAGGAACTTTGCAGCGTGGTGGAGGCATCCGGTG
+CCAGCCTGGAGAAGGGGCGGCACGACCAGTTACTTACCGCACTTCGCGCGCTGCTGTTAA
+GCCGCAAGAATCCGTTTGGCGATATCAAATCGGATGGCACTGTGCAAACGGCTCTCGAAA
+ACCTTGGTTTGGGAGAAGGAGCAAAACTCAATGCAGCAACGGCTACATTAGGACGCACCG
+GTTTCATAGCTATACCGGTTATGATTGGTGGTATTGAGCAATCAGTAATCATTCAGTGGG
+GGTGGAATGCCGCAAAAGCATCTGCCTCTGGGGGGGATGGAAATACAGTTGTATTCCCGG
+TTGCGTTTAATAATGCCTGTGTTGCCGTTGTTGCAAATTATGACAATGTCAGCGCACCTA
+TCAATGCAGTGGCAACGGGGGGATATACAACCACTTCGTTTTTATTACGGTGCGCAGCTC
+AAACGGGTAGTTATTACTATAACTGGATTGCTATTGGGTATTAAGATGAAAATATACTGT
+TGCTTAAATACCGTTGGTTTTTTTATGGATGGCTGTGGCGTCATTCCGCCAGATTCTAAA
+GAAATAACGGCAGAACACTGGCAGTCATTATTAAAATCTCAAGCTGAAGGAGGCGTGATC
+GATTTTTCTGTTTTTCCTCCTTCTATTAAAGAGGTTATCCGTACTCATGATGATGAAGTC
+GCAGATGCGAACTTTCAAAAGCAGATGCTTATCTCTGATGCAACTGATTTTATCAATAGC
+AGACAGTGGCAGGGTAAGGCTGCATTGGGAAGACTTAAAGAAGATGAGCTGAAACAATAT
+AATTTGTGGCTGGATTATCTGGAAGCACTGGAACTGGTTGATACATCCAGTGCGCCAGAT
+ATTGAATGGCCTACGCCTCCGGCAGTTCAGGCCAGATGACATCCGGCGCGGTGCTGGTAT
+CTGTTGCCGTCACCGCGTCAATGTAATCCAGCACAGCGTTAAGTCTGGTTGTTTCTGCCT
+GCGTCAGTTTACGTCCGGCCTGCAATTTCAGTTGAATCAGACTAATGGAAGCCATTGCAG
+CATCAATCAGTGACTGGCGCTGTGCTTCTGCCGCGTCTACTGCGGCGCTATGCTGTGCTT
+CAGTATCGGTCACCCATTTCTCACCATCCCATTTATCGTATGGAGATAAAGGGGCGATAG
+TGGTTGTATTTTCAGGGTAATCACCCGGAGCTTTGATTTCTTTTGATTCTCCAGTTTTGG
+TGCTATAGACCGTTTCACCGCGATGGTCTGGCACATATTCCCATGAGTTAAAATCTGCAG
+AACGGCAGATTGCATAACCAGCCTTATGTGTACCAGGGGCATCTAAACAGGAACATGCCG
+GAATGCCGACACCAACGGCAAGATATTCATTTGAAGTGGAAATATATTCCCGTGTTTCAC
+CATCGTAGTTATAAACGGTAACATCCCCTGCCTTTGTTGCAATAAGGTCACTATTTAATA
+TTGCTTTATGCATCAGGCTGCCCTCACGATATAGTTAAATGCAATATTACGCGGACGCGT
+TTCTGAGGCTGCGGCACCTAAACCATCCACTGATTGTTTATATGTTTTAAAGGTTCCATA
+ATCCGGGGCTGGTAATCCGGCATCGTTTGTGTTTCCTCTTTTGATAATGTCAGTGCCACT
+ATTTACCCATATTTCATCAAAATAGAAATTAATCGTTGCATCAGTCACAATCGTGGATCT
+TGACGGTAATCCATGAGCATGATCCTCCGTTGCATACCCCTGAATACTTAAAATAGAGCG
+ACCTGTATCAATCCCCCGCCCGTCATCCCAGCCACGAATAAACTCACCACGTAAATCAGG
+CAATTTATTTGTCGGATAAGCCTTTGCCAGTTCCGGGTATTCTTCAGCAGAAAAAGCGGC
+ACCATTGCATTTCAGCCAGCCTGTTGGCGGAGTGGCTGAAGGCCACGGAACCGGGACACC
+AACAGGTAATGCAGAGCCTTCTCCCAAACCAACGTTTATGAAAATGAAGAAATAACAAGC
+AAATGGCATCATTCCTGCTTTTACCAGGGGGATTTAACATGCTTATTGGCTATGTACGCG
+TATCAACAAATGACCAGAACACAGATCTACAACGTAATGCGCTGAACTGTGCAGGATGCG
+AGCTGATTTTTGAAGACAAGATAAGCGGCACAAAGTCCGAAAGGCCGGGACTGAAAAAAC
+TGCTCAGGACATTATCGGCAGGTGACACTCTGGTTGTCTGGAAGCTGGATCGGCTGGGGC
+GTAGTATGCGGCATCTTGTCGTGCTGGTGGAGGAGTTGCGCGAACGAGGCATCAACTTTC
+GTAGTCTGACGGATTCAATTGATACCAGCACACCAATGGGACGCTTTTTCTTTCATGTGA
+TGGGTGCCCTGGCTGAAATGGAGCGTGAACTGATTGTTGAACGAACAAAAGCTGGACTGG
+AAACTGCTCGTGCACAGGGACGAATTGGTGGACGTCGTCCCAAACTTACACCAGAACAAT
+GGGCACAAGCTGGACGATTAATTGCAGCAGGAACTCCTCGCCAGAAGGTGGCGATTATCT
+ATGATGTTGGTGTGTCAACTTTGTATAAGAGGTTTCCTGCAGGGGATAAATAAAGTTAAA
+GACACTTTGTGTACAAAAGAAAGTAAAACAACAGCAACTTGTTGCAATTTTATCAATAAA
+AGTAGTATTGTCGTGAAAAATTGATTAAAGATTAATATTATGCATGTTTTTGATAATAAT
+GGAATTGAACTGAAAGCTGAGTGTTCGATAGGTGAAGAGGATGGTGTTTATGGTCTAATC
+CTTGAGTCGTGGGGGCCGGGTGACAGAAACAAAGATTACAATATCGCTCTTGATTATATC
+ATTGAACGGTTGGTTGATTCTGGTGTATCCCAAGTCGTAGTATATCTGGCGTCATCATCA
+GTCAGAAAACATATGCATTCTTTGGATGAAAGAAAAATCCATCCTGGTGAATATTTTACT
+TTGATTGGTAATAGCCCCCGCGATATACGCTTGAAGATGTGTGGTTATCAGGCTTATTTT
+AGTCGTACGGGGAGAAAGGAAATTCCTTCCGGCAATAGAACGAAACGAATATTGATAAAT
+GTTCCAGGTATTTATAGTGACAGTTTTTGGGCGTCTATAATACGTGGAGAACTATCAGAG
+CTTTCACAGCCTACAGATGATGAATCGCTTCTGAATATGAGGGTTAGTAAATTAATTAAG
+AAAACGTTGAGTCAACCCGAGGGCTCCAGGAAACCAGTTGAGGTAGAAAGACTACAAAAA
+GTTTATGTCCGAGACCCGATGGTAAAAGCTTGGATTTTACAGCAAAGTAAAGGTATATGT
+GAAAACTGTGGTAAAAATGCTCCGTTTTATTTAAATGATGGAAACCCATATTTGGAAGTA
+CATCATGTAATTCCCCTGTCTTCAGGTGGTGCTGATACAACAGATAACTGTGTTGCCCTT
+TGTCCGAATTGCCATAGAGAATTGCACTATAGTAAAAATGCAAAAGAACTAATCGAGATG
+CTTTACGTTAATATAAACCGATTACAGAAATAAAATTATTTATTAAAGTCACATTTAAGA
+CGTAATACCCTACAGGGTAAAAATTTTCTCTGATCTTAACTTCTGCAAATGTTAACTGCT
+ATTTTTATGCTAAAAATGGTTATCAAAACTCAAAAACACATGTTTATAATCAATGAGTTA
+TAGAAATGCTAAGGGCTAATGAGTTATATGCAAATTAGTAAAATTATGTTGCTATGTCAG
+ATAGTTACGATTTAGTCATCTAACTAATGCTGCGCCATATGGGTTGGACTGAAGCGGCTG
+ACCTGATTGTTAAAGGTATGGAAGGCGCAATCAATGCCAAGACCGTAACTTATGACTTCG
+AACGTCTGATGGAAGGCGCTAAGCTGCTGAAATGTTCAGAGTTTGGTGAAGCGATCATCG
+AAAACATGTAATCTCTCCATGTGTTAAATATTGAAACGGGCGTATAACACGCCCGTTGTT
+TTATTTATGTGGATATTATTAATAGCATATCGAGCATATTTATATGAAGCCCATTACTTG
+AGCCCATATGGGCATATTTTTATAATGCAACTATTATGTAAACATTTATTTGTTATTTTG
+CTTTCTCCTGGAGGACACTCTTGACTGCTTTTGAGTAAACTCCATAAATCCTTGTTGAAT
+GGTGCGATGTGATAAATAGTAATAGGATATTCTTTATCCTTAAGGATAATACCAGACTTA
+ACCGGTGTAAATATACTGCCAGGAGGGAGAAATATAGTAGATTGATACCAGATGATCATT
+TTCATATTACCCCATATGGCTGAAAAAGATATACCACATGTAGGTTGAATTACCGTGTCA
+ATTACTATCCACTTCATTTGTTATGTCTTATCCCACGGTATTTAATATGGTTCATTAGGA
+TGTTTATTTCTTGATTTTGCATATGAGTATATTACCCCCCCCTCAAAAAAATAAATTAAT
+TAAAATGATGGCTTATATAAAATAAAATTTAAAGCAAGGAATCTCAATGGATGTTAAACA
+AAATGAGATTTTGTGAAAGCAATAAATTATTGACTTCGTTTTAGATTTGTTTAGCTATAA
+TGTTATACATTCAAATGACTGAACATCCTGTAATTAAAACATAGCCTTTATGCTACTTTG
+TGCCAATTTGCTAAACATTATGGTTGCCTTTTTATATAACGATAATAATGAATATAAGCA
+TGACATGAGAATAAGGTTTCAATTTTTGAGTTATATAGGAATGATTTAACCTGTTCCTGG
+CTAAAATACATATAACCGGATGATGACTAAACCAAAATACATGTGCGTTAAGTATTGAAA
+CGGACGTGTGGCACGGCCGTTGTTTTTATAAATATGTTAACCGTTATAAAATAACGTATC
+AAAAGTCAAGTGATCACATTTCAAATATCAAGTTGATAGTATTAGTCTGGTGATTATTTA
+TGGGTGACAATAAAAAGACAGTATTAATCATCCATAGAGATAGTCTCTGCACTTTTATTT
+CCATTATGCTAATGCCTTACTGAATTATGAAGCATTTCTTAAGTATCCAACTTTAGCTAG
+ATTAATGGTTTATTATTTTCTACATCTTCAATATATAAAAGCGTATTATCAATGGCGTAG
+TAACTGCGTTTGTTATGATTAACATCAGTAACCCACCGGAAAACGCCCGCGCCTGCCAGT
+GTTGAACAGTATTCCCGAAATGTAGATTTTCCGCAAATATGAAGCAATGCGGCCTCTTTT
+ATTTTAGCAGGGTTCTTGGTCGTACTAACTTTTAACAGGTTCCTGGTTCCTCTTAATAAC
+AAAACCGTATCATCGTGAGTAATAATTCTGATGTTATCCGTAGCCAGATAATAAATGTAA
+TGTGCAATACGGTGATGTTTTAATTCTGAATAAAACCAGGAGAAGTTTTGCTCTTTTCTC
+ACTTGCTCAAACATCTTTTGAAAAACAACGACCTGATCCAT
+>NC_000913.3|provirus_1412000_1434224
+CTACGATAACCGCGCATTCAACATGGCTATCTGTTCGTCGTTCATGTCATCAATCCACAT
+ACCGTAAATTTCATACACCATCTGCGCAGTTTCATGCCCCATTTGGCTGGCTATAAATGC
+CGGGTTCGCTCCTGCCGTCAACAGCCAGCAGGCAAAAGTATGCCGCGTATGGTACGGATT
+ACGGCGGCGAATACCAGCACGTTTTACTGCTGCATTCCACCTTGCCCCCAAACTGCTTAC
+CGAGTAATAAGGTTTTTGTTTTCCGTTACACACCCTGGGCATGAAAACAAAATGCAGTTT
+TTGCTTTTCGGTTCTGCCGTACTCCCGATGATAAAAGGTGATTTCGCTTTTGCGATGATG
+CCCGGTCAGTTTGTATTGCTCCTTCAGTGCTTCAAGAGCAGGCTGCAGTAGTGTTACTGT
+TCGGATCCCGGCATTTGTTTTTGGGGGACCGAACATATCAAGTATCGTCAGGTTTCTTCT
+GACATTCACTATTCCCTTTTCGAGATCCACATCCTCCCACGCCAGAGCTGCCAGTTCCCC
+GTGACGAAGTCCTGAGTAAACGGCAAATTTCCACAAGTTCTGGCTCTGTCCTTTTTCACT
+TTCCATTAATGCATTGAATTCTGTTTTAGATAACGGATCAGGCTTTATTCTGTTTCGCTG
+TAATTTTTTTACTCCTTCAAATGGTTTGGTTGATATAAATCCCGACTGATACGCAAAACG
+CAACAGCGAACAGAGCAGGGCGATATAGTTATCAACTGTGCGCACGGTTCTTCCTTTTTT
+GTTGGATCTTGGATTATCCAGGTAAAGCGTTTCTCCATGCAGCAGTTCATTCCGGTAGTT
+TAAGATATCGCTATAACGAATATGTGATATCGGGGTACTTTCACAAATTATTATTCTGAG
+TGTTTTTAATTGTGATTTCGTTTTCTTCATTGTGTTTGTTGTTAACTCTGTCTCTTTAAT
+TTTTGTCCAGATATCACAAAGCTCTCCGAACGTTTTTATGACTCTCGTTGTCACCATTTT
+TGCCCCAGTGCTGGACTGGGGAAAACGTCTTAAATACTCAAATTCACCGGAGTTTATTTC
+ATGAACTATCAGCGCTCTTAAATTTCCGGCCTTTTTAATATTACTGTTTGTAATCTCCCA
+GCCTTTTAATGTTTCCCGACATCGTTTTCCTCGAAACATGAACCAGATGCGAATGTATCT
+ACCTCTAATCTCGACACCTGTTGGTAATTTAGACATATCATGAGTCTTTGATAAACTGAT
+TTATCTTTGGATAGTTGTACCAGATAATCCCTCGTTTGCTGTCTGGCTTACCTAAAGGAG
+ATACTCGTTTGAAGTGGAAGCCCTCCACCCAACAGTTCTGGCGGTATGCTTCAATTTGTC
+TGGCCCCCAGACCAGTGCGAAGCATCAGGCCGTATTCAACCATCCACTCTTCATTAAAGA
+TTACTTGTGCCATCGCATCACCTCTGGCAGGCGCCAATGTTAGACTGAAATTGACGCCCG
+ATGTTGATTATTAATAATCAGCTATGAAGTTTTAATTTGAATACAATGCAATTCTCGAGG
+ACTGAAGTTTCTCGCAATTAAAATTTATCAGTTTTACTTTCTGCTCTCTGGAAACGCCTG
+CTTCTTTTTTACCTGAGAGCATTTTTTCGCATTCTGATTTCGTTAGTTTAGATTTTGAAT
+ATCTTGTCCAGTTAGTAGGAGTGCCACCTTCCTTTTCAATAGTGGCGGTAATTTTATACA
+TGAACACCTCCATTATTATTTCCAGTGGTTCGTTTATTCCATCTTTCGAGTGCTTCTTTT
+TCACTTCCACCATAACCGGTTCGGGATTCGCATCCGTTACACTTCGCTCGGTAATATCCT
+GAAATGGCTTTCACCGTTACTGATGGACAACCACAAAATGGACATGGTTTAACATTGTCA
+TATCTCATAATTTTTCTCATAAAAAATATTTCAAGTTGGCGGTGCATTACACCGCCAGGC
+TGAATTATTCCTCTGAATTATCGATTACACTGTATTCCCCGGTTAATACAGAGGAATCTG
+CAGGATCGATTGTCAGTGGTTCCTTTTCATCCATTGATACTGCACGCTGGATCTCAATTG
+ATACGGGCAAATATTTGAACAGGCGACGAATAGCCGTTTTCTTTGCCATTTCTTCCCAGT
+GAGTTACCCACGGCCCGTTATTACCAGCTTTACTCAGGCTGCGCACCAGCTCAATCTGTT
+TGCGCGTCATAACTTCAAACTGAGTACCTCCGTCTTTCAGTCTTGCGACAGCATAGACGT
+GGGTAACCGGGGCATCTTCGTTTTCTCCCGGGCGGTGTATTAACTTTTCATCAAGGCCAA
+ATTCGAAGCTAAACTCGTCACCTTCACGGACAACACGGGCTGACAGGCTGGCGATTTGAC
+CAGAACGGCGAGCCAGATCAATCATGCCGCGATAGCCAATGATTAGCTGAACGTTCTTTT
+TACCGCTCTTTTCGTTTTTATTACCAAAAGGCAGTAAATATGCATGACCGAGGGCGCTAC
+CTGGCTCAAGTCCGAGCTGTGAACACTGTACGATCGCACTGACAAAACTCATAGTGTCAC
+AGTTTCCTAACGCCGGAACTTTACGAATTTCTGTGGTGGCGATACGGATCATACGTTCAG
+CCGTCATATGGCGTGGAAGAGCTGCTGCCAGTTGCTCTTTCATTGATGGCTGGTTAATAA
+AACTAATCACGTCGCTATTTTTAACTGCTGCTGGTGCACGGTTTCCCTGAGTTTTTTGCA
+GATCGGCTTTTGCGATTGGTGGTTGCTTAGTCATTTGCATATTCCTTAGCCCAGCGGGGC
+AGTGATAATGTCTTAATAGCTGGCCATTCATCGGTATTCAGGCAGTCAGACAGGGTTCGC
+AGATTGCGGTGATATTCCTGTTGACCTGCCAGTTTTGCTTCTTCGCCCATCATGAAAATT
+TCAACCGGATAACGTCCGCATTCAATAGTTGTGCTGGCAACCAGAAAAACGAAAGTTGGC
+TGCACTCCAAACTGTGCTTCATAACCGTCACTGTAGAATGCATCCTGAACGTGATAGCGG
+TAGTCGTAATAAGCGGTTTTGAATCGTTGAATATCCGCCGTAGTTTTCACGTCCATGATC
+CAGTGAAATTCAGGGATAATTTTGTCCGGACGGCACCGACACAAAATTCCTGTTTCAGGA
+TCTTCCCAGTAAATTGATGATTCAGCGTGTCCGGCGCTTTCAACAAGCCATTGCCCCAGC
+GGCAAAGCCATAACGCTTTGATACATGAGTTCAATTTTCCGGCCTTCTTCCGCAGTGATA
+ACCGTTTTTCCTGTGCTTGCGCATTCCATCAGAAACGCTTTCTCTTCTTCTTTTCCGGCG
+TTTGTACGGCGGTTAAATTCAGGTGCTACGATAAAGCGGTTACTGAATTCTTCCGGTTCA
+AGTACCCGGCAGTGGAAAGCAGTTCCTAAATCGAGCGTTTTTGTCTTTGTGGTGTCCACG
+GGGGCATTTTTACGCCACAAATATAGTGCCGGAGTATCAGCAATGTCATCGAGCTGAGAC
+TTACTGATACCGGGACCCGCGTGGTAATTCTCATTCGAAATTCCGTAATAAATACCTGGC
+TCTATGTCTTCTACGATTACGGGATCTGCGACTTCGCCAGTTTCATCACTGCAATCGCGA
+TGCGGATCGCTGCCAGCATTCTCATTGTGCGGATGTTCAGCGCCTTCCATTTCCTCCGGA
+TCATTTTCCTTAGCTTCAACCTGACTCTCTTCATCGAATGTTTCCTGGTATGTTGCGTCG
+CCCATCACCGCACCACAGTCAGGGCAGTTATCCCCGCCAGTCTGGCCGCAGGCATTGCAG
+GCTATTTCCGGTTCCTGTTGCACTACTGGCTCAGGTTGATTCATATCTGGGCTGGTTTTT
+TCCGTTTCTGGCTGGTTCTGGTACACACAATCGCGAGTCTGGATCCCCTTTACCCATTTC
+GGATCGTTCGGGTCGCTAATTCCGTCAACAAATTCACCACGTGATGCAGCAAGCAATTTA
+TCGTCATCGACAGGATTTTTTGATGGAATGTTTTTCCGGGCTTCATGGAGTTCTGCCCGC
+AGTTCCTGATATTTCGCATCAACAGAATTTACCTGTGACTGAGCATCCAGCGGCTGCGTG
+TCCTGATGATGTTCAGTTGCGTCCGGTTCCATTGTTTCAGCCTCTCCCTGTTCAACTGCC
+GTTGTTCCAGATGGTTGCGGTTTTTCTTCATCATCCTGTTTTCCTTCTTCTGTTACTCGC
+TGCGGCATCGGGGCAGAGGAGCGACCGCAGGCAATATCCACGATTTCCGGATCAGGGTTG
+GCATGATCGGTTTCAGTCAGTACTTTGTTCAGATATTCAGTGACGTGCGCGGGGATGACC
+TCGATCCCAATTGGTGCTTCTTTTACGGACGCAACCACGATGGCGCGGGAATAATCCAGC
+CCGCCAGGCATGGTGATGAATTTGTCGCGGAAAACAGAAAAGGGCGGTTTATTTTCAGCG
+ATAATTTCCTCAATGCGTTTAGCGTGTGCCGGATGAAGGTTATAGATGTCCAGATCCATT
+GAACGGGCCAGTACGCCAGTGGCTACGTCGCGCGCCAGTGACGTCAGATCGTGTACGAAA
+CCTTCGCCGCGATCGGTGAGGTTTCCGCCGCCAGCATTAGCACCGGAAGCCGTGCGAGTG
+ATGTGTGAAACACGATTACCCTTCATCCACTCTTTTGTCAGCAGTCCTCGATCGGTGTAG
+TCAGCGTTCAGGTATGCTTCGAAAAAAGCAGTTATCAGTCCCAGGTTTGAATTACCAGGA
+TTAGGGAAAACTTTGTCAGTGTCACGAACCAGTTTGTGGAGTTCGCGAATTTCCAGCGGG
+TCGAGCAGGCTGGTTTTGTGGGAAACAGCCAGGGCAGTAACAGCCGGTAGTTCTTCAGCC
+CGAGCAATGTGTAATGCCTGGAGTCCGTCGCGTGAAACGTGCGTTACCGGTTTTTCGCTG
+CCGTGTTGAGCAAGCCAACGAATGGGCAGTTCCTGGCCAGAAATTGGGAGTAGCATATTC
+TCCTCAATCTCAGTCATGTCTTCGCCGTTGACGTTGGTATTGCCTTGATAGTGAGCGTTG
+TCTGGTGCTGCTCCCGGTTTTAGTTCCCATGTCATGGAGTCTTTGCTGAGTTGATAGCGT
+TCACTCCAGGTAAAATCGATCTCACCTTCAGCGGGCAGGTCATTAACGACAGGAAAATTC
+GTGGCAACAGCTTTAAAATAGCTGCTCAGTTTTTTACCTGACTTAACGATCAGGTAGTCC
+AGAGTGGCACAGGTCGATTCAAAATCGTTGCTTGCCCACAGGACGACGTCAGGTTCACCG
+GATGATTTTTTCGCTTTCCGTAACAGGAAGAGTGGTTTTGTGCTCATTGTTTTTTAACCT
+CAACTCAGATTAAAATTCGTTTTGTTCAGTGAATGATCTTGCCGGATACACACTGTTCAT
+AGCCTGCGCCATACGCAGGCTATTTCTTTCAGATTTCACCTTTTAATTTCATTGCAATTA
+GAGTTGCCAGAAATTCGGCTTTTTTTTCTGCGGGCAGATTCTTTCCGATATGCACCAGGC
+ACATTTTTTTGACACCTTCATCAAGTGTTTTTACGTTGCCTGATGGACCATCGATATCAA
+CCACAGTGAATGGGGTTTCTTTATTTTCTGTTTTAATTACGTAGCCAATGCGCTTTCCTT
+CCAGATTCACCTCGTGAACAATGTCATCGGTAGTTACAACAGTGGCTTCATAATTGGTAA
+TCATGTTTTTCTCCTTAATTAAGGTTGAGCGAATACCTGCCATTTCTGGCATAAATTCAG
+TTTCGAATAGTCAATTAATTAAAGTTCATGTGCCATCTGGTCTTTTTCGGCACAAGCTTC
+ACTGCAATATTTTCTCGGTTCGTCTTTTGATAAAATCCCGTGCATGAAGTGAAGCATTCT
+TTCAATAGCTTTGCTTTCTTCAACGTCTTTTTTGCAAAGGTGGTAAGCACATTTTATTTT
+CTTAGTCATCACCATGACTCCGCCTTTACAGGTAAACCATCACGACCGAGGAAGACTTTA
+ATCATGCGGTCAGTAATGAATGTTTTTGTGGTCAGGTTACGAATATATAGTTTTCGCTTT
+TTAATATTGTTTGCCGAGGCAATATATGTCCGGCCTTCATGAAGAACATAATCGCCAGGA
+GTCACACACTGACGTGGTATTTCATCAGTTCCGAAGTGATGTGCAATCATAATTATCTCC
+ATTTTTACAAATGAACTTTGTTGATGCGGTGTCTGGTGCCTCCAGGTGACTGCAACCAGT
+TAACAATTACAGTCGGCTTTCCCACCCAAACCAATAAGGACTAACATGACTTTTAACTGT
+GCCACGTGCGCTTAGCCGCATTCACCGCATCACAAAATTCACTTTAAAAAGGGCGGACAT
+CAGCCGAACTTCAAGAAAAAAACTGATGCCGCCAGGACTACACACAGCAATGTCGTTATT
+TACAACCGGAGGCGCACTCCCACCATTTAAATTTAACAGACAAGACCGACTCTTTATGGA
+TATCGGAAATGCGCCTTCGTGTTGTGCCCGGTTTTATTTCACCACCTCCGGGCTTCGGTG
+GTCTCGGCTATACCCCTACAGCGAGAGCTTGTGTTAACATTTCAATACCCTTACAGTTGA
+GAGTTATTGATATGTTGGATGTATTTACTCCATTGTTGAAACTTTTTGCTAACGAGCCAC
+TCGAAAGACTTATGTATACGATTATCATTTTTGGTCTCACTCTCTGGCTGATACCGAAAG
+AGTTTACTGTCGCATTCAATGCTTATACTGAAATACCTTGGCTCTTTCAGATTATCGTTT
+TTGCCTTTTCTTTCGTGGTCGCCATTTCCTTCTCAAGATTGCGAGCACATATTCAAAAGC
+ATTATTCATTACTACCAGAGCAACGAGTATTGCTTCGTTTATCTGAGAAAGAAATCGCTG
+TATTTAAAGATTTCCTTAAAACAGGAAATCTTATTATCACTTCTCCTTGCCGTAACCCGG
+TTATGAAAAAATTAGAACGGAAGGGCATCATTCAACATCAGAGTGATAGCGCAAACTGTT
+CTTATTATCTCGTCACCGAAAAATACTCCCATTTTATGAAGTTATTCTGGAACAGCAGGA
+GTAGACGTTTTAATCGTTAGCTTACTGTGTGCTTCTCCAACCATCGGCGCGCACCAGTTT
+CGGTTTTAAATGTTTTGCTTTTGGTATACGTCATGGCAGTGAACGTTCCATCCTGGTTGG
+GGAACACGCCGCACACCAGGGATTCGTTGTTGCCGAGGTCGATTTTTTGCATTTTGCGAA
+TCTCACATCTTGTTGCTACGTATAGCGACTTCTGCCTGCCAGAGATCCCAGTCGTTGCTG
+CGTAAAGCCTGCACAGCCTGGTTGTAAGTGATACCGCAACAATCCATCAAATACTGAACT
+ACTTCGTAATGCACCATCTTATCTCTCCCCTTAACGCCGGGTGGCGGAACTAACTGCTGC
+ACTGCAAAATTTGAATCCCGCCGTCATGTTCATACGCCTCGGGCTGGCTACTTAACCCCT
+TACCACTGCCTGGTAACTCGAAGTATTGCCCGGCGTTCTGTGGGGCGGGGTGGGTGGTAT
+GCTGGAACTATAGGTAATGCCTAATTGATTGTCAATAGGCTATGCCTAATGTTTTGAGCG
+TAACCTAATAGGTGATGGCGACAGCAGAAAGTGATGGGGGGGTTAAATAACGGAATCCAG
+GAGTTTTCCGTCAGACCATATAAGTTTAAGTTCCAGTTTTTGTGATGTTCTGGCTTTTCC
+GTTCAGATTCAAGAGCTTTCAGATACTTACCCACTTTCATTTCCATCGCTGCTATGTAGG
+CGCGAACATCGTGGTCAACCCAATCTGGTTCTGTAGCATTTCCAGATAACAGGAAAGCTA
+CAATCGCTCTTATTTCATCAGAGGCTGCTTGATAAAGGTTGTTTATATCTAAAAGTTCAC
+TTTTTGTATCTGAATTGGTGGGGGTTGGTATGGGGTATTCGTTAAGCCCCCAATGCTCTG
+GACCAACAACATCAGAAAAGAAACGCCATAATTCTGGAAGTTTATCTTTACTTATAGAGC
+CTTTCTTAATCCAGTCATAAATTGATGGTGGTTGGACTTTAAAGTGGCGTGCGACCTCCG
+CCTTTGATTTGACGGATCCCGATGCGATTTTTTTGTTAATGGCCTGCTCTATCGCTCGGC
+CTAAGTCTTTACCACTAAGCATTGCTTAATATTCTCCTATGCGCATTACATTAGGCAATC
+CCTACCCTTACTGCATTAGGCACAGCCTATTGACAATTGCGTTAGGCGTCGCCTAATATT
+TCTGTGTGTTTTTGGAGTTCATTCGATGAAAAAAGAGAACTATTCATTCAAGCAAGCTTG
+TGCTGTTGTCGGTGGGCAATCAGCAATGGCTAGGCTTTTAGGTGTATCACCTCCAAGCGT
+AAATCAATGGATCAAAGGGGTACGTCAATTGCCTGCCGAGAGATGTCCAGCAATTGAACG
+TGCAACAAGAGGTGAGGTTCTGTGCGAAGAACTTCGTCCTGATATTGACTGGTCATATTT
+ACGACGTTCGGCATGTTGTTCGCAGAATATGTCAGTGAAGCAACTAAATGACAGTAACAA
+ATCCTCATTTGATCATACCTGAAACATCAAGAGGCAAATGATTCATGAAAATCAAGCATG
+AGCACATCGAATCAGTGTTGTTTGCCCTAGCAGCCGAAAAAGGGCAGGCATGGGTAGCCA
+ATGCAATTACTGAAGAATATCTGCGCCAGGGGGGCGGCGAATTGCCCCTGGTTCCAGGCA
+AGGACTGGAACAATCAGCAGAATATCTATCACCGTTGGTTGAAAGGTGAAACGAAAACGC
+AAAGAGAAAAAATTCAGAAGCTGATCCCAGCAATTCTGGCAATCCTTCCGCGCGAGCTGC
+GTCACCGACTCTGCATCTTCGATACCCTGGAACGCCGTGCATTACTGGCGGCGCAGGAAG
+CGTTAAGTACGGCAATTGATGCGCATGATGATGCAGTCCAAGCCGTTTACCGGAAAGCGC
+ATTTCAGCGGCGGCGGTTCTTCCGACGATTCTGTCATTGTTCATTAAGCAAAAGTTTCCA
+TGCTGTTTGTGCTTATTCTAAGCCACCGGGCAGCATCATACGGGGCAATTATGGCCGCAT
+TACCATACATGCAACTGTACATAGCTGATTACCTGGCTGACACCATGCATTTGTCAGCAG
+AGGAGCATGGTGCGTATTTGTTGCTGATGTTCAATTACTGGCAAACAGGAAAGCCAATAC
+CTAAAAACAGGCTGGCAAAAATTGCCCGTCTGACTAACGAGCGATGGGCTGATGTTGAAC
+CATCCTTGCAGGAGTTTTTTTGCGATAACGGCGAGGAATGGGTGCATCTTCGGATTGAGG
+AAGATCTGGCATCAGTCAGGGAAAAATTAACCAAAAAATCAGCCGCAGGAAAAGCATCTG
+TTCAGGCCAGAAGAAGCAGAAAGGAAGCAGATGTTCAAACAAAACAAGAGAGAAATTTAA
+CAGGTGTTCAAACAGATGTTGAAGTGGTGTTTGAACATGATGTCAACACAAAGGCAACTA
+ATAAAGATACAGATAAAGATCTAAAAACAGATCCCCCCCTAAATCCCCCCCGGGGGAATC
+GAGGTGTCAAAAAGTTTGACCCTCTGGATATTACTTTGCCGAACTGGATTTCTGTCTCGC
+TTTGGCGTGAGTGGGTTGAATTTCGCCAGGCATTGCGAAAACCGATTCGAACGGAGCAGG
+GCGCTAACGGGGCGATACGGGAGCTGGAAAAATTCCGCCAGCAGGGTTTTTCACCTGAGC
+AGGTGATTCGACACAGCATCGCCAATGAATACCAGGGCTTGTTCGCGCCGAAAGGTGTTC
+GACCTGAGACGTTACTCCGACAGGTTAACACCGTCTCGTTACCGGATAGTGCGATCCCGC
+CAGGCTTCAGGGGGTAACTGACCATGAAAAATATTGCGACAGGCGATGTTCTTGAACGTA
+TCCGCAGACTGGCCCCGTCACATGTAACCGCGCCATTCAAGACGGTAGCGGAGTGGCGCG
+AGTGGCAACTTTCCGAAGGCCAGAAACGTTGTGAGGAGATCAACCGTCAGAATCGTCAGT
+TGCGGGTGGAAAAAATTCTGAATCGCTCTGGCATCCAGCCATTGCACCGCAAATGCTCGT
+TTTCGAATTACCAGGTGCAGAACGAAGGGCAGCGATACGCGTTGAGTCAGGCGAAATCCA
+TCGCTGATGAACTGATGACCGGGTGTACAAATTTTGCGTTCAGCGGAAAACCTGGTACCG
+GGAAGAACCACTTAGCGGCAGCTATCGGGAATCGCCTGCTGAAAGACGGTCAGACAGTGA
+TTGTGGTTACCGTGGCTGATGTTATGAGTGCCCTGCACGCCAGCTATGACGATGGGCAGT
+CAGGCGAAAAATTTTTGCGGGAACTGTGCGAAGTGGATCTGCTGGTTCTTGATGAAATTG
+GCATTCAGCGCGAGACGAAAAACGAGCAGGTGGTACTGCACCAGATTGTTGATCGCCGGA
+CAGCGTCGATGCGCAGCGTGGGGATGCTGACAAACCTGAACTATGAGGCCATGAAAACAT
+TGCTCGGCGAGCGGATTATGGATCGCATGACCATGAACGGCGGGCGATGGGTGAATTTTA
+ACTGGGAGAGCTGGCGTCCGAATGTCGTCCAGCCAGGAATTGCGAAGTAATTTTTACCGG
+GAGAAAAATTTAATGGAGACTGTTTTTGACGCACTGAAAGCAATGGGAAAAGCCACATCC
+ATAGAACTTGCTGCGCGACTTGATATCAGTCGTGAAGAAGTGCTGAACGAACTATGGGAA
+CTGAAAAAGGCTGGTTTTGTTGATAAAAGCGCGTACACCTGGCGTGTGGCTGATAACAAT
+GTTCAGCAGGAACAGCCAGCGCAGGCAGAACTGCCGGAAGAAATCACCACAGCAACAGTA
+GCGAAAATCTCAGAGTGCGATTTAACCGCGACGATTGAACAACGAGGACCACAAACGGCT
+GATGAGCTGGCTACATTGTTTGGTACCACATCACGCAAAGTGGCTTCAACGCTGGCAATG
+GCAATCAGCAAAGGTCGTCTGATTCGCGTAAATCAGGGCGGTAAATTTCGTTACTGCATA
+CCGGGCGATAATTTACCAGCAGAGCCGAAAGCAGCATCGGTATCTCCGCTCTGGTTATCT
+GCATCGTCGTCTGCCTGTCATGGGGTGTTAATCATTACCGTGATAACGCCATCGCCTACA
+AAGAACAGCGCGACAAAAATGCCAGAGAACTGAAGCTGGCGAACGCGGCAATTACTGAGA
+TGCAGATGCGTCAGCGTGATGTTGCTGCGCTCGATGCAAAATACACGAAGGAGTTAGCTG
+ATGCGAAAGCTGAAAATGATGCTCTGCGTGATGATGTTGCCGCTGGTCGTCGTCGGTTGC
+ACATCAAAGCAGTCTGTCAGTCAGTGCGTGAAGCCACCACCGCCTCCGGCGTGGATAATG
+CAGCCTCCCCCCGACTGGCAGACACCGCTGAACGGGATTATTTCACCCTCCGGGAACGAC
+TGGTAATGATGCAGGCCCAACTTGAAGGTGCTCAGCAATACATAACCGAGCAGTGTTTAA
+AGTAAAATCTTAACTACAATATGATTCATTTTGATGATTGTTTCATAAGGAACAGTGAAG
+TAAGATCTAAGAGGAGTTAAATTTTATACAGTATAATCATAATATTGCAGCAAGGTGGTT
+ATAATTGAAAGAATATTTAGATATGAATACATCTCATGTAAGAGTTGTTACTCATATGTG
+TGGGTTCCTGGTTTGGCTCTATAGTCTTTCAATGTTGCCACCAATGGTTGTAGCATTGTT
+TTATAAAGAAAAAAGCCTGTTTGTTTTCTTTATAACTTTCGTTATATTTTTTTGCATTGG
+TGGCGGAGCGTGGTATACAACTAAGAAATCTGGCATTCAATTACGTACCCGTGATGGGTT
+TATTATAATTGTAATGTTTTGGATTTTGTTTTCTGTTATTAGTGCATTCCCTTTATGGAT
+TGACTCAGAACTTAATTTAACGTTCATTGATGCTCTGTTTGAAGGGGTTTCTGGAATAAC
+AACAACAGGAGCAACTGTAATTGATGATGTTAGTTCATTACCTCGGGCATATTTGTACTA
+TCGGTCACAGTTAAATTTTATAGGTGGTTTAGGAGTTATTGTTCTGGCGGTTGCTGTATT
+GCCATTATTGGGTATTGGTGGTGCAAAGCTTTATCAGTCAGAAATGCCGGGGCCATTTAA
+GGATGACAAACTCACTCCCCGCCTGGCCGATACGTCACGGACACTGTGGATAACTTATTC
+TTTATTAGGTATTGCTTGTATTGTCTGTTATAGACTTGCAGGAATGCCTTTGTTTGATGC
+TATTTGTCACGGGATTTCCACAGTTTCGCTTGGTGGTTTCTCAACTCATAGCGAGAGTAT
+CGGATATTTTAATAACTATTTGGTTGAGCTGGTGGCTGGTTCTTTTTCCCTGCTATCGGC
+TTTCAACTTCACTCTTTGGTATATTGTTATTAGCAGGAAAACGATAAAACCTTTAATCAG
+AGATATTGAACTTCGTTTCTTTCTGTTAATAGCCTTAGGGGTGATCATTGTTACCTCTTT
+CCAGGTCTGGCATATAGGTATGTATGACTTGCATGGAAGTTTTATTCATTCGTTTTTTCT
+TGCCAGCTCCATGCTCACTGATAATGGTTTAGCTACGCAGGATTATGCAAGTTGGCCCAC
+GCACACGATAGTGTTTTTGCTGTTGTCAAGTTTCTTTGGGGGATGTATAGGTTCAACTTG
+TGGTGGAATTAAGTCACTTCGATTTCTTATACTTTTCAAACAAAGCAAACACGAGATAAA
+TCAGCTTTCTCATCCCAGAGCGTTGTTGAGTGTAAATGTAGGAGGGAAGATAGTTACAGA
+TCGTGTAATGAGGTCTGTATGGAGTTTCTTTTTTCTTTATACTCTCTTCACGGTGTTTTT
+TATACTGGTGTTAAATGGTATGGGATATGATTTTCTTACATCATTTGCAACAGTGGCTGC
+ATGTATTAATAATATGGGATTAGGTTTTGGGGCTACTGCATCGTCATTCGGAGTGCTTAA
+TGACATTGCAAAATGCTTAATGTGCATAGCTATGATTCTTGGTCGCCTTGAAATTTATCC
+TGTTATTATATTGTTTTCAGGTTTTTTTTGGCGCTCCTAATATATGGCTGATTTATAATT
+GTGAGTTTAATATTATGTTGACTCACTCATTGATCCAATACCTAACTTTACCAGCAACAC
+CTCCGTCCCCAGTAGCACTGGCTGCTGGGGTGCGTTTTATTCATAAAGCAAGGCTGTATG
+AGCGAGAAATTAAAGATAGTCTATCGCCCATTACAAGAATTGTCACCGTATGCGCACAAC
+GCCAGGACGCACAGTACTGAGCAGGTGGCACAACTGGTAGAAAGTATTAAGCAATTCGGC
+TGGACTAATCCGGTGCTGATTGACGAAAAGGGCGAAATTATTGCGGGTCACGGTCGTGTT
+ATGGCGGCTGAAATGCTCAAAATGGATTCTGTTCCGGTCATTGTTCTGTCTGGCCTGACG
+GATGAGCAGAAGCAGCGATAACGATCAGTATCGCTCCCGTAATGCATTAATCCGTCGCCA
+CATTGAGAAAATGGATGCCAGTTTGCACGTCGGAACGAAGGAGTTTGATATTTCAAAGGT
+TTCCGAGGTGGATTCTGTTGATGATTTACTCATTGATAATGCCGCTCGTTATCTGCTGAA
+AGACTGGAAAGGGGTTGGTGAACTGGTTAATGGTGTTGAGGTTGCACTGGAATATACGGC
+AGAACGAGGGATCGCGCTGCTTAAGCAGAATCCAGAGTTGTACTGGCAGATCCTTGCAGA
+AGCAGCCAGCATCGCCCAGGGTAAAGAGCAGCAGAAGCAGGATACGATAAAAAAGCCATA
+GCTGCCCAGCGGTGGTTATCGGAGTTCGGGGGAGAAAGGGGGGAAAAGGCAAGATGGAAG
+CGAGAAAAACTCAGGTTGCCACCGATACCGGAACCAGAAATAGACCCGGTGCTTAAGGAG
+TTGTTGTACGCCTATTCGGTAATATCCCGTGCCCGACGTTATGCTGGAATGGCTGGGGTG
+CCTTTGCCTTTATCTCTGACAGAGATAAATGAATATTTAGCCACTCATCCGGTATTGATT
+GAGCGCGATGAATTTGAAGCAGTGATCTTTGCACTGGATGACCAGTATTTTCAGGAGCAG
+TGTGTGTAGTTGTTAATTACGTACACTCTGTTACAGAGATGTGATGGTGTCTTTAATTAA
+ATCGATGATGCTCCTGGAGAAAAGCATTGCGTGGCCTCGTAATCGCTATATCTACTATTA
+TGTCGCCTGAAACCCACTTCGCGGTGGGTTTTTTGTTGTCAGGAGTTTTAATAAATGGCA
+GAGCAAACCTCGCGTCTCGCAATAATTATTGATAGCACTGGAGCGAAAAATAATGCTGAC
+AATCTGACCTCCTCATTAGTCAAAATGACGCAGGCTGGGGAAACTGCTGCAAATAGCGCA
+GGGAAAGTGACTAAGGCAACAGAAGATGAGAAGAACGCGCTCGCAAAATTAAAAGCAGCT
+ATTGATCCAGTTGGTGCCGCAATTGATACTGTCGGTCGACGCTATTCTGAATTAAAGAAA
+TTTTTCGATAAAGGGCTTATTGATAAAGAAGAATATGAATTTCTTGTCCGTAAACTTAAT
+GAAACCACAGAGGAATTGAGCGGGGTTGCGCAAGCGCAGAGAGAAGCCGAGAAGGCCGGA
+AAACTTGCTGCCGCTCAGCAGGAAGCGCAGGCTCAGGCCTTTCAAAGAATGCTGGACAAG
+ATCGACCCTCTGGCTGCGGCGCTAAGAAATCTTGAACAACAGCATGATGAACTTAATGCT
+GCGTTTGCATCCGGGAAAATAAATGGTTCTCAGTTTGAGAATTATAGCCGAAAAATACAG
+GAAACACGGCGAGAGCTTACCGGAGAGGCTCAGGCAGAGCGAGAAGCAGCAAAAGCGCAT
+GATGAACAGGTTGTTGCTTTGCAACGTCTGATTGCTCAACTTGATCCTGTCGGAACTGCT
+TTTAATCGTCTGGTAGAACAACAGAAACAGCTCAATGAAGCAAAAGCTAAGGGGATGCTT
+TCTCCTGAAATGTATGAGGAGCTTTCTGGAAAACTTCGTGCTATGCGGAGTGAGCTTGAG
+GTTACTCAATCACAATTAAGCAAAACCGGAATGTCGGCAAAACAAACGGCTTTTGCTATG
+CGCATGTTGCCTGCACAAATGACGGATATTGTTGTTGGGTTGTCCACTGGTCAGTCGCCA
+TTTATGGTGTTAATGCAGCAGGGCGGCCATTCAGCTATGCAGGAGACAAGAATCGCCAGC
+TTACCCGTTACAGCGATACCCGCTGGCATGAAGATTCCGTGCGTAACCGCTGGTTCAGCG
+TGATGGTGGGGCCGTCTGTGCGCGTGAATGAATGGTTCAGCGCGTATGCGATGGCGGGTA
+TGGCTTACAGCCGTGTGTCGACTTTCTCCGGGGATTATCTCCGCGTAACTGACAACAAGG
+GAAGGTGCGAATAAGCAGGTCATTTCTTCCCAAGCTGACTCGCTGATTAAAATTTCGCGG
+ATCTGGGCCGATTTTTTTCCCGCAAACACATCGAATCAGCCTATTTAGGCTATTTTTTCC
+ACCATTTCTGGCGTTATTTCCGGTTTTTACTGAGATCTCTCCCACTGACGTATCATTTGG
+TCCACCCGAAACAGGTTGGCCAGGGTGAATAACATCGCCAGTTGGTTATCGTTTTTCAGC
+AGCCCCTTGTATCTGGCTTTCACGAAGCCGAACTGCCGCTTGATGATGCGAAACGGGTGC
+TCCACCCTGGCACGGATGCTGGCTTTCATGTATTCGATGTTGATGGCCGTTTTGTTCTTG
+CGCGGATTCTGCTTCAAGGTTTTTACCTTGCCGGGACGCTCGGCGATCAGCCAGTCCACA
+TCCACCTCGGCCAGCTCCTCGCGCTGTGGCGCTCCTTGGTAGCCGGCATCGGCTGAGACA
+AATTGCTCCTCTCCATGAAGCAGATTACCCAGCTGATTGAGGTCATGCTCGTTGGCCGCG
+GTGGTGACCAGGCTGTGGGTCAGGCCACTCTTGGCATCGACACCAATGTGGGCCTTCATG
+CCAAAGTGCCACTGATTGCCTTTCTTGGTCTGATGCATCTCCGGATCGCGTTGCTGCTCT
+TTGTTCTTGGTAGAGCTGGGTGCCTCAATGATGGTGGCATCCACCAAAGTGCCTTGGGTC
+ATCATGACGCCTGCTTCGGCCAGCCAGCGATTGATGGTCTTGAACAATTGACGGGCCAGT
+TGATGCTGCTCGAGCAGGTGGCGGAAATTCATGATGGTGGTGCGATCCGGCAGGGCGCTA
+TCCAGGGATAATCGGGCAAACAGGCGCATGGAGGCGATTTCGTACAGGGCATCTTCCATG
+GCACCGTCGCTCAGGTTGTACCAATGCTGCATGCAGTGAATACGCAGCATGGTCTCCAGC
+GGATAGGGCCGTCGGCCATTGCCCGCCTTGGGATAAAACGGCTCGATGACAGCGGTCATA
+TTCTGCCATGGCAGAATCTGCTCCATGCGGGAGAGGAAAATCTCTTTTCGGGTCTGACGG
+CGCTTAGTGCTGAATTCACTATCGGCGAAGGTGAGTTGATGGCTCATGATGTCCCTCTGG
+GATGCGCTCCGGATGAATATGATGATCTCATATCAGGAACTTGTTCGCACCTTCCCAAGG
+GGAAAACGCACGACGTGCTGACCGGAAGTGATGACGGTCGCCACAGCAACACGTCTCTGG
+CGTGGGGAGCTGGCGTGCAGTTTAACCCGACCGAATCCGTGGCCATTGATATTGCTTATG
+AAGGCCCCGGCAGTGGCGACTGGCGCACTGACGGTTTCATCGTGGGTGTCGGTTATAAGT
+TCTGATTAGCCAGGTAACACAGTGTTATGACAGCCCGCCGGTTCAGGCGGGCTTTTTTGT
+GGGGTGAATATGGCAGTAAAGATTTCAGGTGTACTGAAAGACGGCACAGGAAAACCGGTA
+CAGAACTGCACAATCCAGCTGAAAGCAAAACGTAACAGCACCACGGTGGTGGTGAACACG
+CTGGCCTCAGAAAATCCGGATGAAGCCGGGCGTTACAGCATGGACGTTGAGTACGGTCAG
+TACAGCGTTATTCTGTTGGTGGAAGGATTCCCGCCGTCACATGCCGGGACCATTACCGTG
+TATGAAGATTCTCAACCCGGTACGCTGAATGATTTTCTCGGTGCCATGACGGAGGATGAT
+GCCCGTCCGGAGGCACTGCGCCGTTTTGAACTGATGGTGGAAGAGGTGGCGCGTAACGCG
+TCCGCGGTGGCACAGAACACGGCAGCCGCGAAGAAGTCAGCCAGTGATGCCAGCACATCA
+GCCCGTGAGGCGGCAACCCATGCGGCTGATGCTGCGGACTCAGCACGCGCAGCCAGCACG
+TCAGCCGGACAGGCCGCGTCGTCGGCTCAGTCAGCGTCTTCCAGCGCAGGAACGGCATCA
+ACAAAGGCCACTGAAGCATCAAAAAGTGCTGCCGCTGCAGAGTCCTCAAAAAGCGCGGCG
+GCCACCAGTGCCGGTGCGGCGAAAACGTCAGAAACGAATGCTTCAGCGTCACTACAATCA
+GCAGCCACATCTGCATCCACCGCGACCACGAAGGCATCAGAAGCTGCGACCTCGGCCCGG
+GATGCGGCGGCCTCAAAAGAAGCGGCAAAATCATCAGAAACGAACGCATCATCAAGCGCC
+AGTAGTGCAGCTTCCTCGGCAACGGCGGCAGGAAATTCCGCGAAGGCGGCAAAAACGTCC
+GAGACGAACGCCAGGTCTTCTGAAACGGCAGCGGGACAGAGCGCCTCGGCTGCGGCAGGC
+TCAAAAACAGCGGCTGCGTCGTCTGCCAGTGCAGCGTCAACAAGTGCCGGGCAGGCCTCA
+GCCAGTGCCACCGCCGCCGGAAAATCGGCAGAAAGCGCCGCATCGTCTGCTTCAACAGCC
+ACAACGAAGGCTGGCGAAGCCACTGAACAGGCCAGCGCAGCAGCGAGGTCTGCTTCCGCA
+GCGAAGACATCCGAAACGAACGCGAAAGCGTCGGAAACAAGCGCAGAATCCTCAAAAACG
+GCTGCCGCATCGTCAGCCAGTTCGGCGGCGTCATCGGCATCATCGGCGTCTGCTTCAAAA
+GATGAGGCGACCAGACAAGCGTCAGCAGCGAAGAGCAGCGCCACGACGGCATCCACGAAG
+GCGACAGAGGCTGCTGGCAGTGCGACGGCGGCAGCTCAGAGCAAAAGTACGGCGGAATCC
+GCGGCAACGCGCGCCGAGACAGCAGCTAAACGGGCAGAGGATATTGCATCCGCCGTGGCG
+CTTGAGGATGCAAGTACGACGAAAAAGGGGATAGTACAGCTCAGCAGTGCGACCAACAGT
+ACGTCTGAAACGCTGGCGGCAACGCCAAAGGCAGTAAAATCAGCCTATGACAATGCAGAG
+AAACGTCTGCAGAAAGACCAGAACGGCGCTGATATACCCGATAAGGGATGCTTCCTGAAC
+AACATTAACGCGGTCAGTAAAACAGACTTTGCTGATAAGCGTGGTATGCGTTATGTGCGG
+GTTAACGCTCCTGCAGGTGCAACATCTGGAAAATATTACCCTGTTGTTGTTATGCGTTCT
+GCTGGCTCAGTAAGCGAACTGGCATCAAGAGTCATTATCACCACGGCAACGCGAACCGCA
+GGCGATCCGATGAATAACTGCGAGTTTAACGGATTTGTTATGCCTGGTGGCTGGACTGAC
+AGGGGGCGTTATGCTTATGGCATGTTCTGGCAATATCAAAACAATGAACGAGCCATTCAC
+TCAATAATGATGAGTAATAAGGGCGATGATTTGCGCTCTGTGTTCTATGTTGATGGCGCT
+GCTTTCCCTGTTTTTGCGTTTATTGAAGATGGCCTGTCAATATCCGCACCTGGTGCTGAT
+CTCGTTGTTAATGATACGACCTATAAGTTTGGGGCAACAAATCCGGCGACTGAATGTATC
+GCGGCGGACGTTATCCTTGATTTTAAGAGTGGGCGTGGTTTTTATGAGTCTCATTCGTTA
+ATCGTTAACGATAACTTGTCGTGCAAAAAACTTTTTGCCACAGACGAAATTGTAGCGCGT
+GGTGGTAATCAGATTCGAATGATAGGTGGGGAGTATGGTGCATTATGGCGTAATGATGGC
+GCTAAAACTTACCTGCTGCTTACCAATCAAGGTGATGTTTATGGTGGCTGGAATACATTA
+AGACCGTTTGCTATTGATAACGCAACCGGCGAACTGGTTATTGGAACCAAACTGTCCGCA
+AGTCTGAACGGTAATGCATTAACAGCAACAAAGCTGCAAACGCCAAGACGGGTTTCTGGT
+GTTGAGTTTGATGGTTCCAAAGATATTACTTTAACCGCCGCGCATGTGGCTGCTTTTGCC
+AGAAGGGCAACGGATACATATGCCGATGCGGATGGTGGCGTTCCATGGAATGCCGAATCT
+GGCGCTTACAATGTCACCCGCTCTGGCGACAGCTATATTCTGGTTAACTTCTATACCGGA
+GTCGGAAGTTGCCGGACCCTGCAGATGAAGGCGCATTACAGAAATGGTGGTCTGTTCTAC
+CGTTCTTCAAGAGACGGTTATGGTTTTGAGGAAGACTGGGCAGAAGTTTATACCTCGAAA
+AATCTTCCACCAGAAAGCTACCCAGTCGGCGCACCAATCCCGTGGCCATCAGATACCGTT
+CCGTCTGGTTATGCCCTGATGCAGGGGCAGGCTTTTGACAAATCTGCTTACCCGAAACTT
+GCAGCCGCTTATCCGTCAGGCGTGATCCCTGATATGCGTGGCTGGACGATTAAGGGCAAA
+CCTGCCAGTGGTCGGGCCGTATTGTCTCAGGAACAGGACGGCATTAAATCGCATACCCAC
+AGCGCCAGCGCATCCAGTACAGATTTGGGGACGAAAACCACATCGTCGTTTGATTACGGC
+ACTAAATCCACGAATAACACCGGGGCACATACACACAGTGTGAGCGGCTCTACAAACTCG
+GCTGGAGCACACACACACTCACTAGCCAACGTGAACACGGCTAGTGCTAACTCCGGTGCT
+GGTAGTGCATCAACAAGATTGTCTGTTGTGCATAATCAAAACTATGCAACATCATCTGCT
+GGCGCACATACCCACTCACTGTCCGGCACTGCTGCAAGCGCAGGTGCACACGCGCATACT
+GTCGGTATTGGTGCTCATACGCACTCCGTTGCGATTGGTTCACATGGACACACCATCACC
+GTTAACGCTGCTGGTAACGCGGAAAACACCGTCAAAAACATCGCATTTAACTATATTGTG
+AGGCTTGCATAATGGCATTCAGAATGAGTGAACAACCACGGACCATAAAAATTTATAATC
+TGCTGGCCGGAACTAATGAATTTATTGGTGAAGGTGATGCATATATTCCGCCTCATACAG
+GTCTGCCAGCAAACAGTACCGATATTGCACCGCCAGATATTCCGGCTGGCTTCGTGGCTG
+TTTTCAACAGTGATGAGTCATCGTGGCATCTCGTTGAAGATCATCGGGGTAAAACGGTTT
+ATGACGTGGCTTCCGGCAACGCGTTATTTATTTCTGAACTCGGTCCGTTACCGGAAAATG
+TTACCTGGTTATCGCCGGAAGGGGAGTTTCAGAAGTGGAACGGCACAGCCTGGGTGAAGG
+ATACGGAAGCAGAAAAACTGTTCCGGATCCGGGAGGCGGAAGAAACAAAAAACAACCTGA
+TGCAGGTAGCCAGTGAGCATATTGCGCCGCTTCAGGATGCTGCAGATCTGGAAATTGCAA
+CGGAGGAAGAAATCTCGTTGCTGGAAGCATGGAAAAAGTATCGGGTATTGCTGAACCGTG
+TTGATACGTCAACTGCACAGGATATTGAATGGCCAGCACTGCCGTAGGGTAAAACATATA
+AATTCTATAATTAGATGTATCTTTCCATTTACGGCAAGGAAGGGGGCTTGGAAGACGTAA
+AGCATCTCACACCGAGATTATTTTTTATATGTCAGGTGTCTGAAGTTTTGCTTTGGCTCT
+TAAAATGGTTTGCCGCGAGGTTTTGAATTCCCGGGCAATGGCACTTATACTTACACCTGA
+CTTAATTCGTTCGAATACCACCTGTTTCTGTTCTTCATTTAACACAGGAGGTCGACCAAA
+ACGTTTCCCTGCGCCGCGGGCTCTTACTATCCCGGAATGAGTGCGTTCAAGTAAAAGGTC
+TCGTTCAAATTCAGCGACTGCTGAAATTACTTGCATCATCATTTTTCCTGTTGGACTGGT
+CAGGTCAATGCCACCCAATGCTAAGCAATGCACTCTGATACCTGTTTCGGTCAGTTGTTC
+CACTGTTTTCCTGATATCCATTGCATTACAACCAAGGCGATCCAGTTTTGTCACAATCAA
+TTGATCACCACATTTCAGGCGAGCAAGCAACCGGTTAAAACCAGGACGCTCACTGGTTGC
+TGCTGAGCCGCTAATGTGTTCTTCGATTATTTGCTGAGGTTTGATTTTAAAACCTGCACT
+TTCGATTTCCCGGCGTTGATTTTCGGTGGTCTGATCCAGCGTTGATATCCGACAGTAAGC
+AAAAATTCGAGACATAGTGAGACTCTATACGAAATTGGTGTTCATATCATAATGCATCTC
+AGAAAATAATTATGATTATTTTTGTGCATATTTGTATGTACACGTTCGAAAATAAACGAA
+TGCGTATGCAACCCCGTAATTTTGGTGAGACCCAAAATCGATTTTGTGAAAAATGGCTTT
+AACTCGGTTTGTTTTTCGAGTTCCGGGCGGACTCAAGGAAGAAGAATAGTGTTGCGTGTT
+ATTTTAACCAGATTTCAAGTTGTTTGGTCGTGGAAAAGTGGAGCAAAATGTTGTTAAAGT
+GGAAAAATGATAAAAAAGTAAGTTTATTATATTACATTTTACCATTTAAATTTTGGTTGT
+CTTTAAGAACTGATATCGCTGTTTGTAATAATTCTTTGTTATCCAGCCATGATGTTTTCT
+TTATGTTTCCTTCAATGTAATCAAGCAATGTTCTGGTATTGATAGGTCTTCCCTGTTTTG
+CTACTTCCACTACAGCATCCCCTAGGATAATTCTTACTTCAGGAAGCTGCGCAGGGAACC
+ACTTTAGGGTGTCTTTTGATTTCAT
+>NC_000913.3|provirus_1627517_1653915
+ATGATCGTTTTAGTAACTGGAGCAACGGCAGGTTTTGGTGAATGCATTACTCGTCGTTTT
+ATTCAACAAGGGCATAAAGTTATCGCCACTGGCCGTCGCCAGGAACGGTTGCAGGAGTTA
+AAAGACGAACTGGGAGATAATCTGTATATCGCCCAACTGGACGTTCGCAACCGCGCCGCT
+ATTGAAGAGATGCTGGCATCGCTTCCTGCCGAGTGGTGCAATATTGATATCCTGGTAAAT
+AATGCCGGCCTGGCGTTGGGCATGGAGCCTGCGCATAAAGCCAGCGTTGAAGACTGGGAA
+ACGATGATTGATACCAACAACAAAGGCCTGGTATATATGACGCGCGCCGTCTTACCGGGT
+ATGGTTGAACGTAATCATGGTCATATTATTAACATTGGCTCAACGGCAGGTAGCTGGCCG
+TATGCCGGTGGTAACGTTTACGGTGCGACGAAAGCGTTTGTTCGTCAGTTTAGCCTGAAT
+CTGCGTACGGATCTGCATGGTACGGCGGTGCGCGTCACCGACATCGAACCGGGTCTGGTG
+GGTGGTACCGAGTTTTCCAATGTCCGCTTTAAAGGCGATGACGGTAAAGCAGAAAAAACC
+TATCAAAATACCGTTGCATTGACGCCAGAAGATGTCAGCGAAGCCGTCTGGTGGGTGTCA
+ACGCTGCCTGCTCACGTCAATATCAATACCCTGGAAATGATGCCGGTTACCCAAAGCTAT
+GCCGGACTGAATGTCCACCGTCAGTAATTTTTATACCCGGCGTAACTGCCGGGTTATTGC
+TTGTCACAAAAAAGTGGTAGACTCATGCAGTTAACTCACTCACAAGCAAGAACGAATGAC
+CGTCGAAACGCAACTTAATCCCACACAGCCTGTCAATCAGCAGATTTATCGTATTCTTCG
+TCGCGACATTGTCCATTGCCTGATTGCTCCAGGCACACCGTTGTCGGAAAAAGAAGTTTC
+TGTTCGTTTCAATGTGTCACGCCAGCCGGTTCGTGAAGCCTTTATTAAACTGGCGGAAAA
+CGGCCTGATTCAAATTCGTCCGCAACGTGGCAGCTACGTCAACAAAATTTCCATGGCCCA
+GGTGCGCAACGGCAGTTTTATCCGTCAGGCCATTGAGTGCGCGGTGGCGCGTCGGGCGGC
+GAGCATGATTACCGAAAGCCAGTGCTATCAACTGGAACAAAATCTTCACCAGCAACGCAT
+TGCCATTGAGCGCAAGCAACTGGATGATTTTTTTGAACTTGATGACAACTTCCATCAACT
+CCTGACGCAGATTGCCGACTGTCAACTGGCGTGGGATACCATTGAGAACCTGAAAGCGAC
+CGTTGATCGCGTGCGCTATATGAGTTTCGACCACGTTTCTCCACCAGAAATGCTGTTACG
+CCAGCATCTTGATATTTTCTCTGCCCTGCAAAAACGTGATGGCGATGCGGTAGAACGTGC
+AATGACGCAACATTTGCAGGAAATCAGCGAATCCGTGCGCCAGATCCGCCAGGAAAACAG
+CGACTGGTTTAGCGAAGAGTAATTCATTTCCTCTCATCCCATCCGGGGTGAGAGTCTTTT
+CCCCCGCCTTATGGCTCATGCATGCATCAAAAAAGATGTGAGCTTGATCAAAAACAAAAA
+ATATTTCACTCGACAGGAGTATTTATATTGCGCCCGTTACGTGGGCTTCGACTGTAAATC
+AGAAAGGAGAAAACACCTATGACGACCTACGATCGTAACCGTAACGCAATCACCACTGGC
+AGCCGTGTTATGGTTAGCGGCACCGGTCACACTGGCAAGATCCTGTCGATTGATACTGAA
+GGTCTGACCGCTGAGCAAATCCGCCGCGGAAAAACCGTAGTTGTTGAAGGTTGTGAAGAG
+AAACTGGCACCACTGGACCTGATTCGTCTCGGCATGAACTAAGCGTGTGAATGCCGCCGA
+TGGCGGCATTGCTTTTTTACTTCACGGAATATTTTGCCACGGTCGCTTTCGCGCCATGCG
+CTAATAAAGACAAGTACGTTTCCGTCACTCTTGCAGTAAACAAACTATTGTCTGGCAAAT
+CATCACCAAAGATCGCCTTAATCGCCAGCAATGACTGGACGCGCGCTTTCCCTTCGGCAC
+TACTTTGTACAGCCTTCTGAATAACAGGTAACAGTGGGTCACTGATTTCTATCGGATTTC
+CCTGTTCATCAACACCACCGACATAACGCATCCAACCCGCGACGCCCAGCGCCAGCAGAT
+CGAACTTGCTGTCATGCGCCAGATGCCAGCGAACAGAATCCAACATCCGCTGTGGCAATT
+TCTGGCTACCATCCATCGCAATCTGCCAGGTTCGATGACGTAACGCCGGGTTGCTATAGC
+GTGCAATTAATCGGTTAGCGTAATCTTGCAAATCAACGCCCTGCACTTTCAACGTCGGCG
+CTTGTTCCTGCAACATCAAGCCATACGCCGCATAACGATAATGTTCATCTTCCATACAGT
+CATTAATGTGCTGATATCCTGCAAGATACCCCAGATACGCCAGGAATGAATGACTGCCGT
+TGAGCATGCGCAACTTCATCTCTTCATAAGGCAGCACATCGCTAACCAGTTCGGCTCCCG
+CTTTTTCCCATTCCGGACGTCCGGCAACAAAGTTATCTTCTATTACCCACTGGCGGAAAG
+GTTCACAGGCAACGCCCGCAGGATCGCGCACACCGGTAAGTTGTTCGATTTTCGCCAGCG
+TATCCTCTGTCACTGCGGGCACAATACGGTCCACCATTGTTGATGGGAAAGTCACGTTAT
+CTTCGATCCATTGTGCCAGTTTTACATCAACGGCTTGTGCGTAGGAAGTGACAACGTCAC
+GCATAACATGACCGTTTTCTGGCATGTTGTCACATGACATGACGGTAAATGCGGGAAGTC
+CTGCCGCTTTACGGCGAGCCAGCGCCTCAACAATCACCCCTGTTGCTGTTTTCGGCTGGT
+GGGGATTTTGCACGTCGGCAGCTACCATCGGGTGATCGAGCATTAACTGTCCGGTCGCCG
+GAGAGTGGAAATACCCTTTTTCGGTGATTGTCAGAGAGACAATCGCGATTTGCGGTTCAC
+ACATCGCTGCCAACACGGTTTCTAAGCCATCTATCTGTACGTGCAAGGCTTTTTTAACGA
+CGCCAACGACGCGAGCCGTCCACACATCGGCCGACATTTCCGCAACGGTATAAAGATTAT
+CTTGCTGTTGTAAATCGGCAATTTGCTGTTCGCCGCCGATTAAGTTGACCTCATAATATC
+CCCAGTCACTGAAATGTTCCGTAGCAAGAATATCGGCATACACACCCTGATGCGCACGGT
+GAAATGCACCAAAGCCTAAATGAACAATTCTTGGAGCCAGGTTATTAAGATCATAAACAG
+GGAGTGTCGCTTTTGCTGATAACAAATTATTTCCCATAACAATTCCTTAAATATAAATAT
+GGCAAGCTATATGTTTTGTTATATGAATAAAAATCCCCTCTCCGGTAAGAGAAGGGATTA
+AGGGTTTACAGACTTCTGGAAGGTTGCGCAGCTCTTACAACACGCGGTTGATCTTCCGCA
+GCGTCTTCCAGCGCACTTAAATCACGGTCTTTCACCTCTGGCATTTTCAGCGCAGAGATT
+AAACCAATCACTGAATATGCCATGATCATAATGGCGATCGGATACCAGGATTCCGTCATG
+GTGCAGAAAATACCCGCCAGGATAGGACCAAAACCGGAAGCGATAAGACCACCAATTTCT
+TTAGAAATAGCCATCCGGGTAAAGCGGTTTTTACAGCCGAACATTTCTGCCATGGTAATG
+TTTTCCAGAGCAAATAATCCCAGCACCGCACAGTTATGAATCACAATCAGTGCAACCATA
+ATGGTGCTCGGGGCATAGCTTTTATCTACAATGATAGAAAGCATTGGCCATGCCAGCACA
+ATCGCGGAGGTATTCATAATAATATACGGGATCCGGCGACCAATTTTATCGGATAACCAA
+CCAAGGAACGGAATGGTCATAAAGCCGAGAATCGAACTGATCATCAATGCATCTGTTGGA
+ATTGCTTTGTTAAACAATAACGTCTGCACTAAATAGCCTGCAAGGAAAGTCTGAATTAAC
+CCGGAGTTACCCGCCTGACCAAAACGCAGCCCTGTTGCCAGCCAGAAGGATTTGCTCTGG
+AACATGCTACCAGCAGGTGCAGGTTTTGCTGTCGGTTGGTTACTGTCGTTAACCTTCTCA
+AAGACCGGGCTTTCTTTCAGATTCATACGCAACCAGATAGCAAAGACCATCACGACAACA
+CTCGCCAGGAACGGTATACGCCATCCCCACGCCAGCAGTTCCTCTTTACTGAGAATGAAG
+AACATAAAGGCCCAGATTGCCGTTGCGCTCAAGGTTCCGCAGTTAGTTCCCATAGCCACA
+AATGAGGAGATAATTCCGCGCTTACCTTTTGGCGCATATTCCGCCAGCATCGTACCGGCA
+CCGGAAATTTCCGCACCTGCACCCAACCCCTGAATAATACGCAACGTCACCAGCAAGATG
+GGTGCAAAAACACCAATCTGTGCATAGGTCGGTAACACACCAATTAAGGTGGTACAGATC
+CCCATCATGGTGATGGTAATAAAGAGCACTTTTTTACGCCCTATTCTGTCGCCCATTTTG
+CCGAAAATAAATGCTCCGACAATACGCGCCACATAACCTGCACCGTAGGTTCCCATTGCC
+AGAATTAACGCCATTGCCGTTGATGATTCAGGAAAAAATATTTCATGAAACACTAACGCT
+GCGCCGAGCGAATATAACTGGAAATCCATAATTCACAGGTGTTTTTTCCCATCCTGTGGT
+TTCCTTGGCGTTTTCTAGGTTTTTTCAGATAGTTGCATTTTTTTAAAAAGCATCCTAAGT
+TCGATCTCAGTGTCTATCTGGGGCCTATTTCTGTCCCATATATGCCCCAAAAAAACTCCC
+CAACAGATAAGTAGTTTTTTCATGGATTTATGCGTAAAATCAAGAACGGCTGGAAATCAT
+TCAATACTCACACTATCGAAAAATTTACCAGCCAATCGCAGCACGTTCTTGCATAAGGTG
+TGTCTGCGGTTTTTCAACTATTCAGATACATCACTCCCATCACATTCATTCCTCCGCATC
+AAAGGCATATAGGCTATATCACCTTGATATTTTTCTTTTTCAGATAAAAACTGTTATCTA
+TGTATACTTTTAAACCCAATCCGTGTAGAGTCTCTACATAAGATAGTTTGCAGTTGCCGC
+TTCAGCTTGCGCCATAAACCGCCTGATTTTTGCTGCCACCTGTTAGCATTCCTGTATACC
+TGAAACGACAATGTTTATCTACGAACTTTAAGAACACCCAAGATAAAAATTGTCAACTAT
+ATCATATATAACACATTACTAATTCGAGGCTATATGAACAGCATACTGATAATCACATCT
+CTCCTTATCATATTCAGCATTTTTAGTCATGCCCTAATAAAATTAGGGATTGGCATATCC
+AATAACCCAGACAAAACCGATGTATAAGTCAACATATCCTGAATCAGACATACAATATCG
+CAATGAAAATCAATAATATTTTAAGGAATATCTTCATGAAATCAAAAGACACCCTAAAGT
+GGTTCCCTGCGCAGCTTCCTGAAGTAAGAATTATCCTAGGGGATGCTGTAGTGGAAGTAG
+CAAAACAGGGAAGACCTATCAATACCAGAACATTGCTTGATTACATTGAAGGAAACATAA
+AGAAAAAATCATGGCTGGATAACAAAGAATTATTACAAACAGCGATATCAGTTCTTAAAG
+ACAACCAAAATTTAAATGGTAAAATGTAATATAATAAACTTACTTTTTTATCATTTTTCC
+ACTTTAACAACATTTTGCTCCACTTTTCCACGACCAAACAACTTGAAATCTGGTTAAAAT
+AACACGCAACACTATTCTTCTTCCTTGAGTCCGCCCGGAACTCGAAAAACAAACCGAGTT
+AAAGCCATTTTTCACAAAATCGATTTTGGGTCTCACCAAAATTACGGGGTTGCATACGCA
+TTCGTTTATTTTCGAACGTGTACATACAAATATGCACAAAAATAATCATAATTATTTTCT
+GAGATGCATTATGATATGAACACCAATTTCGTATAGAGTCTCACTATGTCTCAAATTTTT
+GCTTACTGTCGGATATCAACGCTGGATCAGACCACCGAAAATCAACGCCGGGAAATCGAA
+AGTGCAGGTTTTAAAATCAAACCTCAGCAAATAATCGAAGAACACATTAGCGGCTCAGCA
+GCAACCAGTGAGCGTCCTGGTTTTAACCGGTTGCTTGCTCGCCTGAAATGTGGTGATCAA
+TTGATTGTGACAAAACTGGATCGCCTTGGTTGTAATGCAATGGATATCAGGAAAACAGTG
+GAACAACTGACCGAAACAGGTATCAGAGTGCATTGCTTAGCATTGGGGGGCATTGACCTG
+ACCAGTCCAACAGGAAAAATGATGATGCAAGTAATTTCAGCAGTCGCTGAATTTGAACGA
+GACCTTTTACTTGAACGCACTCATTCCGGGATAGTAAGAGCCCGCGGCGCAGGGAAACGT
+TTTGGTCGACCACCTGTGTTAAATGAAGAACAGAAACAGGCGGTATTCGAACGAATTAAG
+TCAGGTGTAAGTATAAGTGCCATTGCCCGGGAATTCAAAACCTCGCGGCAAACCATTTTA
+AGAGCCAAAGCAAAACTTCAGACACCTGACATATAAAAAATAATCTCGGTGTGAGATGCT
+TTACGTCTTCCAAGCCCCCTTCCTTGCCGTAAATGGAAAGATACATCTAATTATAGAATT
+TATATGTTTTACCCTACGGCAGTGCTGGCCATTCAATATCCTGTGCAGTTGACGTATCAA
+CACGGTTCAGCAATACCCGATACTTTTTCCATGCTTCCAGCAACGAGATTTCTTCCTCCG
+TTGCAATTTCCAGATCTGCAGCATCCTGAAGCGGCGCAATATGCTCACTGGCTACCTGCA
+TCAGGTTGTTTTTTGTTTCTTCCGCCTCCCGGATCCGGAACAGTTTTTCTGCTTCCGTAT
+CCTTCACCCAGGCTGTGCCGTTCCACTTCTGAAACTCCCCTTCCGGCGATAACCAGGTAA
+CATTTTCCGGTAACGGACCGAGTTCAGAAATAAATAACGCGTCGCCGGAAGCCACGTCAT
+AAACCGTTTTACCCCGATGATCTTCAACGAGATGCCACGATGACTCATCACTGTTGAAAA
+CAGCCACGAAGCCAGCCGGAATATCTGGCGGTGCAATATCGGTACTGTTTGCTGGCAGAC
+CTGTATGAGGCGGAATATATGCATCACCTTCACCAATAAATTCATTAGTTCCGGCCAGCA
+GATTATAAATTTTTATGGTCCGTGGTTGTTCACTCATTCTGAATGCCATTATGCAAGCCT
+CACAATATAGTTAAATGCGATGTTTTTGACGGTGTTTTCCGCGTTACCAGCAGCGTTAAC
+GGTGATGGTGTGTCCATGTGAACCAATCGCAACGGAGTGCGTATGAGCACCAATACCGAC
+AGTATGTGCATGCGCGCCTGCGCTTGCAGCAGTGCCGGACAGCGAGTGGGTATGAGCACC
+ATCTGATGATGTCTTCCCTGCATTACGAGTCTGGCCACTACCGCTTGTTGTGCTCATAAT
+CCCCGCGCTTAGATTTGAAATCGCGGTATAACCATTAGGGAAAATGCTCGTGTTCGTGCC
+ACCAAATGCACCGGAACTCTTGTGTTGGTGCGCACCGGCACTATTTGCGGTCCCGCTAAT
+ACTATGGGTATGCGCCCCGGTGTTATTCGTGGATTTGGTTCCGTAATCAAACGACGATGT
+GGTTTCCGTCCCCAAATCCGTACTGGATGCGCTGGCGCTGTGGGTGTGCGATTTAATGCC
+GTCCTGTTCCTGAGATAATACGGCCCGACCACTGGCGGGCTTGCCCTTAATCGTCCAGCC
+ACGCATATCAGGGATCACGCCTGACGGATAAGCAACTGCAAGTTTCGGGTATGCAGATTT
+GTCAAAAGTCTGCCCCTGCATCAGGGCATAACCAGACGGAACGGTATCTGATGGCCACGG
+GATTGGTGCACCGACTGGATAAAACTCTGCAGGAGGATGAGCCGAGGTGTAAAGCTGCGC
+CCACGGCGACCAGTTTGCGTCGGTCGTATCCCGTCGTGAACGAATAAATGCCGGAGCATG
+AGCACCGCTTGTACCACTCCAGCCGATGAGTAACTCACCTTCGCCAACGGCTGTCATCCC
+TTTCAGGTGAATGATATTTCCATACGCTGTTGGATATCCGTTGTTATACACCTCGTATAA
+CTCAAGACCTGCTGCCCCCTGCGTATTGTCTGTCAGCGCGGTTATATTCACTCAGCAACC
+CCGGTATCAGTTCATCCAGCGCGGCTGCTTTGTTCATGGCTTTGATGATATCCCGTTTCA
+GGAAATCAACATGTCGGTTTTCCAGTTCCGGAAAACGCCGCTGCACCGACAGGGGGATCC
+CGTCGAGAATACTGGCAATTTCACCTGCGATCCGCGACAGCACGAAAGTACAGAATGCGG
+TTTCCACCACTTCAGCGGAGTCTCTGGCATTTTTCAGCTCCTGTGCGTCGGCCTGCGCAC
+GCGTAAGTCGATGGCGTTCGTACTCAATAGTCCCTGGCTGGAGATCTGTCTCGCTGGCCT
+GCCGCAGTTCTTCAACTTCCCGGCGCAGCTTTTCGTTCTCAATTTCAGCATCCCTTTCGG
+CATACCATCTTATAACGGCGGCAGAGTCATAAAGCACCTCATTACCCTTGCCACCGCCTC
+GCAGAACGGGCATTCCCTGTTCCTGCCAGTTCTGAATGGTACGGATACTCGCACCGAAAA
+TGTCAGCCAGCTGCTTTTTGTTGACTTCCATTGTTCATTCCACGGCCAAAAACAGAGAAA
+GGAAACGACAGAGGCCCAAAAGCTCGTTTTCAGCACCTGTCGTTTCCTTTCTTTTCAGGG
+GGTATTTTAAATAAAAACATTAAGTTACGACGAAGAAGAACGGAAATGCCTTAAACCGGA
+AAATTTTCATAAATAGCGAAAACCCGCGAGGTCGCCGCCCCGTAACCTGTCGGATCACCG
+GAAAGGACCCGTAAAGTGATAATGATTATCATCTACATATCACAACGTGCGTGGAGGCCA
+TCAAACCACGTCAAATAATCAATTATGACGCAGGTATCGTATTAATTGATCTGCATCAAC
+TTAACGTAAAAACAACTTCAGACAATACAAATCAGCGACACTGAATACGGGGCAACCTCA
+TGTCAACGAAGAACAGAACCCGCAGAACAACAACCCGCAACATCCGCTTTCCTAACCAAA
+TGATTGAACAAATTAACATCGCTCTTGAGCAAAAAGGGTCCGGGAATTTCTCAGCCTGGG
+TCATTGAAGCCTGCCGCCGGAGACTGTGCTCAGAAAAAAGAGTTTCTTCTGAAGCAAACA
+AAGAAAAGAGTGACATTACTGAATTGCTCAGAAAACAGGTCAGACCAGATTGAAGCAATT
+TAGATAATCGTGCAGACTACGCCCCCTCATATCACATGGAAGGTTTATCTATGGATCAGG
+TAGTCATTTTTAAACAAATATTTGATAAAGTTCGAAACGATTTAAACTATCAATGGTTTT
+ATTCTGAGCTAAAACGTCACAATGTCTCACATTACATTTACTATTTAGCCACAGAGAATG
+TTCATATTGTATTAAAAAATGATAATACAGTGTTATTAAAGGGCCTAAAAAACATTGTGT
+CTGTCAAATTTTCAAAGGATAGGCATCTTATAGAAACGACCTCTAATAAGCTGAAATCCA
+GAGAGATCACATTTCAGGAATACAGAAGAAACCTTGCTAAAGCAGGAGTTTTTCGGTGGG
+TTACAAATATCCACGAACAAAAAAGATATTACTATACCTTTGATAATTCATTACTATTTA
+CTGAAAGCATCCAGAAAACTACACAGATCTTACCACGCTAAACCATAACGTCCGGCTTCT
+CTCACTCCTGAGCCGGACTGCATTGGTTTAATAAAAACCATCAACAATTGTGATTTAGAT
+ATTCGGAACCATTCAAATATAACAAAACCCCGTAAAAACGAGGTTTATGGATAAATTTTA
+TTATTGAATACATCAGATTAAATTAATCTTGACATCATAGCTTTCAAGACCCGTCATTTT
+TTCCCGTGCGGTAAACTGAATACTGGTAACTTCTTTCCCGGTCTTTTTCTTAAGTTCAAT
+AATTTTTTTTGTTATATATTCAGAAATATCTGCTTCTGCTTTTGTTTTTAAGTTTTCAAT
+ATTCATCATTTCCTCTTTTAGTCTGTTATGACTTTCCAGTTACACAGTAAGTCGATTATA
+TGGTGCAAACGTGTAAAAGATAAGATGAAACATCGCAATAATCAACATACGATAGTCTAA
+ATTTTACACAAACAGACAAAGAGAATTTTCCTGAATTATCAATGCAATAGCATCAAATCA
+ACTCAAGAGCCTTATTGCTGCTTCCAGAATTTCTTCTGAAGTAACATGTCGATCCGCGGC
+TACATAAATGACTTTATGATCTCCGGTCAGAGATGGAAACCCTGCGGCCATTACAGTAAG
+GTGTGTTTTTTCGCCATTTGGATATTCACGCATGATGGTGTTAACTCCAGTCATCGCTGG
+CACTACCACTGCTGGTTCAGAGTTAAAAAAACTATGATTTTTTTCATGATGTTACCGTAG
+TATGTGAGTATCCATCGAATAGACACCAAGCAAAAAAGCTCCCGAAGGAGCCTTCATTTT
+CACTTTTTTAAATCCAACGACAGACGGCTGGCATTTAAGTATTGTGAAATATTATCAAAT
+GTAATCATCATTGATTTACAAAAGATACATTTTGCCCCGAAAGGATTCATGTCAGAAACA
+TCAAAAGATGATGTTCTATACTGGGAACCATGACAACACGGGCATCTAAAGTGAATATGG
+TTTGTAATATTGTCTACCTCAAAGCGCCACTACATGAACAGCGGCAGGACCTTTAGGTCC
+GTTCTCAATACCAAATTCAACTTCCTGATTCTCAGTTAATGTTTTGAAATCGTTGCTCTG
+AATTGCTGAGAAATGGACAAACACATCTTTGCTGCCATCTTTCGGCGTGATGAAACCAAA
+ACCTTTTTCAGGGTTAAACCATTTCACTAAACCAGTCATTTTGTTAGACATAATTATTAC
+CTTTTGAAGAAATTAGCCCTTGGGCAGAATGGTCCGAAAAAAAATATCAGAGAGAAAAAC
+CAACAAGGAAATCTCAAGAGGTACAAATAATAAAATTATAACAATGACTGCTTCAGATAA
+ATTTGTAACAAACCAGAACACCATTAACGCATGATTAACCACCCATAGCAAGGATTACTT
+TTGTAAAGAAAAACACAGCAATGAAAGAATAGCTTTATTTATTAATAAAACGTGTCATTC
+TGATTAAGACCTTTTATCTTACCCTTAAGATTTCAGGAATTTTGGCTCATGGAAGAGTCC
+TTTTTATTTAAATTTTACATTCCGCGATGTAAATGTTCCGATTTAATATTACCCTACATT
+TGATGCTTTTTATCTCTTAAAGATTCATAGATCTGTTGACAAGTCACTCCTGCGATGTAG
+CGTTCGTCAGCAATTTCAGCATAAAGCTGAGCTTCTGCTGCAATATCTCCGAGCATGTTG
+GTGAGCATTCCTTCGGCGGTTTTGGTTGTTTTGCCTCTGACGGCAGCGGCAAGATCTGCG
+GTATGCTTCGCTGCGTCAAGGCGTATGGCATATTTTTTTGCTTCGGCACGCAACTGGTTA
+ACACTATCAGACAGATAAGCAGCCCTGGCAGAAATTTCAGCAGATTTCTGTTGCGCATCT
+TTAACAGCCTCATCACGGGCTATAGTTCGCCCCTGTTCAATTATTCGAGCAGCAAATTGA
+GCATTTACCTCTTGTGATAATGCGGCAGCATCACGTTCCGCCCATTTTTTTTGCCATCCT
+CGGTCGCTCCAGACATTTCCGACGATAAATCCTGACAACACGAGAAAAATCACCATGAAT
+ATCTGATTCACTGTTCTATCCCCCAGCAGGTTAATGCGCTCTCCTGGTCACGACGAATAA
+CCTGACCGTAACAGTTATTTGAACGAATGCGGCAATCGCGTCCGCCATCCTTAATCCACC
+AGCGAATCGCTTCGCATGCACCTTTACGATCACCAGCATTCAGCCGCTTATAAAACGTCG
+ACGGGAAACACTTACCGGGGCCAATGTTATAGGGACAAAATGACGCGATACCCGCTTTTT
+GTGGTTCGGTCAGTGGTACTTTAATATTGCGCTCCACCCATGCCAGCGCCTTATCACGCT
+CAATGGCGTTGACCTGGTCGCATTTTTCCTTCGACAGTTTCATATTGGGAAAAACGGTTT
+TTCCATCCACCACTGTGGCACCCCGACAGATGGTCCATATGCCAGAACCATCGCGGTATG
+CCATTGTGTGGTTACCTTCTTTTTCGTCCAGAAACTGGTCAAGTATCTGAGGAGCAGATG
+CGCCAGCACCAATCAGCGCCAGAACGGCAGCCGACAGGCCGTATCTGATTTTTGTGTTCA
+TAGATATTTATGATGAGGACGCTCGTGCTTATTGGCAGGATTTTCAATCTTAAAGGAGTA
+CTGATGCTGCAGATAAGACTCAACTTTTTCTGACAATTTTTCTGCTACTTCCAGGAAGAC
+TTGCCGGACGCTCCTTCTGGCTGCTGCCTCATAAAACTCCAGCGCAGCTCCTTCAACACG
+GTCCATGGCGACATCCAGGTCAAAAATTTCACCGTCAAAGCGTTCTTTGTCCTGTAAGGC
+TACAGTTACCGTAACTTTATTCTCAAAATTACGGACTCCTTTCACAACCAGTTCATAGTC
+TTGAGTCATTGGATTACTCTCCTCTCGCAGCCTTACGCCTGTCTTCTTTAATCTTGAAAT
+AAAGATTTGTCAGATACGTCAGCAGGCCAAAAACCAGGCTACCCAGCACACCGATTGCAG
+CCCACTGTGACGGAGTTACTTTATCGAGTAACTGCAATGCCCAGAAACCAGCATTACCCG
+CCGATGTGCCATAGGCAACACCTGTTGTTAACTTATCCATTGATTTCATATCCTCACCCC
+GATGTACACGGATGGTGCAATATGTTTGAAAAGATCGGAGTCTACGGGGTAGTTTTGACA
+GCACACGTTGTTCTCAACGGCGCTAAAAAAACATACACATTAAAAATGTGGGTAATTATT
+TTGAAAGAAAGTCATATATAAAATAATAATACGAGAAATGTTTTCATATTTAGTGTACTG
+TATACGGCCATTTATACAGGAAAAGCCTATGTCAGAACGTAAAAACTCAAAATCACGCCG
+TAATTATCTCGTTAAATGTTCCTGCCCAAACTGCACCCAAGAGTCAGAACACAGTTTTTC
+AAGAGTACAAAAAGGTGCCCTTTTGATCTGCCCTCATTGCAACAAAGTATTCCAGACAAA
+TCTTAAAGCTGTAGCCTGATTGATTTTATTAGTAACAAGTATTTTTTATATTTTAATAAT
+ATATTTAAAGCAGATAATAAAAAACCCGCCTGAGCGGGTTTGAGATTGTGGTGCTTTTTG
+TGGGAGTCATCCACTTACGCACTTTGTTTTGCCATGCCAGCAGTTAGCTTCTGCTGTAAA
+ACTATTCATGCAGCAAACCTGCACTTCACCACAATGGTTAGCATACTTTTCCTGATTAAG
+ATTTTGCCAAATATGCTAGCCATTGTTTCATGTATTGGACCTCCTTACTTTTTATTAAAG
+AGATCCAATATTCACTACTCTGTCCGTATCTCTACTCAGGCATCAGCCTTCTTCGTTATC
+GTATACAGACGAGCGATGAATTTTAATCAGTAATGATGACATTTGCTGCTGCAGGACCTT
+TAGCACCACTCTCTATAGAGAAGGTAACCTTTTGACCTTCAAATAAGGTTCGATAATTAT
+CATTCTGAATCGCAGAAAAATGCACAAACACATCTTTACTACCATCAACAGGAGAAATAA
+AGCCGAAACCTTTATCAGCGTTAAACCATTTTACTAAACCAGTCATTTTATTTGACATTC
+TACATTCCTTAACTTGAGCCTTTCGGCATAAATGGTTTGCATAACAGAAACGACTTCGTA
+CTTAATTGGAGAGACTCAAAGAAGGAATAAGTGAATAACACCTGAAATGAGAACTGCTTT
+AGTAAACTACTTCGTATATCGTCTGTTCTTCAAACCGACGCAATCATTAACGCATAGTTG
+AACATATGAAGCAATGTTTATTTTAGACATCCAGCCATCTTCAACCCCATCAAAAAACTA
+TAGCTTTCTTCAGGAACGTGTGTATAGTGCGCCAAGTTATCAGTATTAAGGAATTTTTTT
+GTCCCGTAAAATGACAGGAATTGTCAAAACCTTTGACGGCAAAAGCGGCAAGGGTCTTAT
+CACCCCATCCGATGGTCGTATCGATGTCCAGCTTCATGTTTCAGCGCTCAATCTCCGCGA
+TGCAGAAGAAATTACCACCGGATTACGCGTGGAATTTTGCCGGATAAATGGTCTGCGTGG
+CCCTTCAGCTGCCAATGTTTACCTTTCATGAGCTATATTAAAGCTTTAATTTCAGGCCCC
+ATCGGATCACACATGGAGAGTTTTTATGAATAACCCCGTCTGTCTTGATGACTGGTTGAT
+TGGCTTTAAAAGCTTATGCTGTACTTTGGCCGTAATAGCTCTGCTAATAATATAATAAGC
+AGACTCATTGTGTTTAGGGACATTGTACTGGAAGAAAACATTTTAAACATCAGGCAAATA
+ACCAAGTCACCAGCTAAATAATAAGTTAACAGACATGAGTCCCGGGATGAGATTCAACAT
+TACCATTGCCCCATTTAAAGCACAAAACCCGCTCATCAGCGGGTTTTCTACTTTTTCTTA
+ACGTCGGGTATACAAAGCCCATCGTTGAAAAAATTTTATCCATATTTTTTGAAAAATGCA
+AACATCATGTCGCCATCTTCAGCAAAAATCATTTATCTCGTCACCTTCCTCAATTGCGCT
+TCCGCGTATGCTTCTTCCTGCCAGCACTTTGTTACCAGTTTACCAATGACGTCCGCATAC
+CCCTTATACCACTGATAATCGGTCAGGTCTGGTACCAGCTTCTGGACATGACGTCGTGCC
+AGCGTGGTCGGTAAACGACTAAACCGGTTTCCATTACAACGCCCACAAATCTTATATACC
+GGTACGCCATGAAACCGGGTTCTTTTTTCATCCAGAACAATCCCTTTACCCTTACACCCT
+CTGCACGCTGTGCTGGCTTCGCCCTTACCATGGCAATGCTGACATAGTTCCTTCACCCAT
+TCTTCCTTGATTACAGATTCCCCGCGTCTGTAGTGTTTCACCACTTCGCGCAATACATTA
+TAAAATCCCGTACCTGAACAATGCTCACAGCGAGCCTTACTTGCCGCAGACCTGGAGTAA
+TCAGCAAAGGCAAAACTCACGAGGTAAGGAATAATCTGTAACCGGATTTCTTCACTCAAT
+TTGTTCAATGTCGGGTTATCCAGTGCCATCGCGTAATTTAGCAGGCCTTCAATCGCAAAC
+TGAGGGTCCTGAACACCAACTTTTGCCAGAAATAAGGCCAACCCAAGTGGTGCTTTCGAC
+TGCACCATCCCCTGCGCTGCCATTACATCCGTAATTGTTAAACAACCGGTGCCTGTCGCT
+GGAGCGTCATCGCTCAATTTTGGAGATTTTGGGGAGTAATATTTTGGTAAGGCTTCAAGG
+TTCATGCTCGTTCTCCACTTACGCCAGTACGCCAATTGCCAGCGCGCGATCGATAAAACG
+AAATATCAGCTCCAGTTGGGAGCCATACTTATCTTCAAATGCCACTGTATCCGTATGCAG
+CTCGTTGTGATGCTTTCTGCACAAAGGCAACACAAAGAGATCATGTGCTTTTGTTCCCAT
+TCCGCCCTGCCCGTGACCAATCAGATGATGCGGATCGTCGGCTGGCATACCGCAGCAAGC
+ACACGGCTGTGTCTTAACCCAACGTGTGTATTTCTCCTTAACCCAGCGGCGACGTTTAGG
+CAGCTTCATGAAAGATTCCGGAGACTCTGGATCAACGGTGATGCTTACCACCGTCTTTTC
+CTGTGGTGATTTTTGTTGCTGGTGGGCGTAAGGCAACGGTGCAAGATTTTTTGTGCGTTG
+TTTCAATATGCTGGTGGCGGTCAGCTCTCCCGGTACGATGTCGCTTTCGCGGTACACCGA
+GCAGATTTTTTCCGCTGGTAATCCCAGCGAACGACGCGATACAGCCTCAGGTAGTGCATC
+CACCACCTGATTGCAGACCGCCCACCAGGATAATTCAGCCAAAGATAATTCCCGCTCCTG
+CGTACCGCTTATTGCGTGACGGATGACGTCAATCACCCATGCTGTCAGATTTTGTTGAGC
+AAGCAGCTCCAGTGATTCCGATGTCTGGTCACGCAGTTGGTTGTCGCAGTGCCAGCACAA
+CACCATTGCGCCGGTACCATAACGGTGAATGACTGTTTCAGTGTGATGGTAATCGCCATT
+AGGCCACTGGCAGGATGTAACATGACGTAATAGCCAGTCGGACAATGCGCCAACGCCGCC
+AGCAGCACGAATCACCCGTTCGTTACTAAAAAACGGCAGCAATGTTTTGTCTTCCGCCAG
+CGGCTGGCGAACGGCAGGAACGACTCCGGATGGCAGATTACGCATGCTTTTTGGTTCCGG
+TTCCACCAGCACTCGAGGATTATGAAATATCTGTATGGATTCACGGCCCGGCTTAAGGAC
+CACCAGCCCAAGCTCAGGCACCAGAACAGGTCTAAGTAATACCCGCACGTTACCTCCAGA
+TCCGTTGCTGGAAAGTGCGGGACGCACGTGGTGGGCGTTCGGAATAAGGCAGCCTGACAG
+AGATTATCCAGTGCCGATAGTCGAGACTGAGAGCTTTCTTAACCTCGAACCCGCGCCTGC
+GGTAAGAATGAATCAGCCATTCGGCCTGTTCTGCAGTGCATGGAGGGTGCTGGAACCATT
+CAGACTTGAATGCGTGAGAATACCGCCCGTGCGTGCAGGCAAGAACGGGCGAATTATCAG
+AATTGTAATATTTTGCGTTGCGTGCCATCGGTTTTCTCCGGTGGCACGGTGTTACTCAGC
+GGGAGTTCAGCCCCGCGCAAGATTGTAGATGAGTTTATTCTCCTGAAAAAGCAGAAAAGC
+CAGCTTTTATTCCGATCTCTTTCAATGCCTGTAATGAAGTGACAAACTCACCTTCGCGCA
+AGATAAATCCGTCCGTGACCCGAGCATCCACAAAATTAATTAACGCAGCCCCATTCTTTC
+GCAAACACATAATGCGGTAATGACTAACAAGATTTCCATTTTCAACGCACACAGCATAGA
+GGCCATCTTCACAAAAAATTTTACGCAGTTCTTCGATGTTCATCATCAGAATCCTTCCGG
+ATAATTAGCTCTCCCCTTTAAGGGACCATCCCTCTTATCCCTGCGCGCTACTTAAGTATT
+TTTGATTCTATTCCGGCACCGTCCAGAACTTCAAACGCGTTGAAAATAAAAACAAAAACC
+CGCCGAAGCGGGTTAAGTGCGGGTGCGTTGAGGATGCCTGCCACATCAGAGGTGGCGAGG
+GATTTCTCCCCCGCCGGGTCTCTTACTCCTCAGGTTCGTAAGCTGTGAAGACAGCGACCT
+CCGTCTGGCCGGTTCGGATTCGTACCTCGCAGAGGTCTTTCCTCGTTACCAGTGCCGTCA
+CTATGACGGTTAAACAGATGACGATCAGGGCGATTAACATCGCCTTTTGCTGCTTCATAG
+CCTGCTTCTCCTGTCAACGCAAAGCAGAAGTGTCACCTTCGGTGCGAAACAGAGATGTCA
+TGCTTTGGTTCAGAGAATGCGTTTGACCGCCTCGCTATATACTTCCGAGCGTTCTCTTTT
+CCCAACAGAAATCACGAAAACGACAACTTTCTCGTCTATAACCTGGTATACAAGGCGATA
+GCCTGAAGACCGGAGCTTAATCTTGTAACAATCAGGCATACCACGGAGCTTGTTTGCTTC
+AATCCGGGGTGACTCAAGTACTTCAACCAGCTTCTTTTTCAACTGTTCACGTACCGTCGA
+GCCCAGCTTTCGCCATTCCTTTAGTGCCCGCTCGTCAAAATCCAGAAAATACGCCATCAG
+AGTTCATCCAGCGTCACACGTACTGGCTTAGGATTACGAAGCCGTTCTTTCACTATCTCC
+ACAAGTTCAGCATCTTCATCACTCAGGAGTGTCTGTTTGAACGGCAAGCGTTCATTGTCA
+GCGATATACTCGAGCATGAGACGAAGCGCTTCAGAAGGAGTTACACCCATTTTTTCAAGC
+GCGGCGTAAGAACGCGCTTTAAGTTCATCGTCAATACGCAGGTTAATGCTACCCATGTCT
+TACACCTCTTGTAATTACAAATGTCATTACAAGTATCGCACTACAACATGCTTAGGGCAA
+GTCACGAAGGAAGTCAGAAAGTAGTCGTAAGAACGGTGATCACTGTCCGCTTTGTGCCAG
+GAGCAGCCATTGCTAAGTCCATCCTGTATTGTGCAGGTCAGCTCGTTTTTAAAGAGTCCG
+GCCATCATCTTACTGGTACAGACACCATATACTTTGTGACGGTCAGGCTACATATGCACA
+ACTCAACTTATTCATCTATTTTTTGCTTTAGCATGTCAGTGTTGCTTTCTCGTCGGCGGG
+TGAGCGGTGACCTGACCTGTCGATAAAGGAACGTAACACGTTTTATGCAACACCCGCATG
+CGGCAGAAAATTATTGCCGAACGTTTACCCCTGTCAACAAGCTTTACTTTCTGAGGCGCG
+CCAGCCCGCGAGGAAAACAATCTGAACATCAAACAATTAATGACACAAGAAATACGATTA
+AAGATTTTTTTGTGCATGCCGATAGTGCTTTTTTAAAAGGAGAAATCTATGTCTGTCACA
+ATTCAGGGAAATACCTCAACCGTTATTTCAAACAACTCCGCCCCGGAAGGAACATCAGAA
+ATAGCCAAAATCACAAGACAAATTCAGGTGCTGACTGAAAAGCTTGGGAAAATCTCATCG
+GAAGAGGGGATGACGACACAGCAGAAAAAAGAAATGGCTGCATTGGTACAGAAGCAAATT
+GAAAGCCTCTGGGCTCAACTGGAGCAGTTGTTAAGGCAGCAGGCAGAGAAAAAGAATGAA
+GACGCGACAGTTCAGCCTGATAAAAAAGAAGAGAAAAAAGACGATACAAATACCGCTGGC
+ACCATTGATATTTACGTCTAAGTGACAGCCGTATTGTGGCCCTCATCGGGCCACTTTTCG
+CCATCAGCCTTTTCTTTAAAGACATATTATCTTTGTATCATTTCTGATAGTTAACATTAC
+AAGATATAAGTAATGGACGCACTCCCAATTAGTCTATTTAAATCGCCACGAGTTTAACTG
+ACAACCCATGATCAATTATGAATTGCAACTATTTCTGTAGTCACTTTTGTGGGGACAGTC
+CACAAAACTGCCAACTTCCGCTTCTTGCTCTTAGCGGACATTAGCATAGGCTATTTACCA
+TAACGCCTCATTACGCGCACCGCCCAGACTGACTCAGCGCGTTTCTGGCATATCCCCGGT
+AAAACAAGTAACAAACCACCCGAAAATGAACACCAGAAACGCGACTTAAGAATCTACCCT
+ATGAATGGATATGCACTCAACCGAATCGATCTTGGTTTCAATCTTTTTTATCGGGATCAG
+GCTTCTTTTTAGGTAACTTCGGGGGCTTAACTTGCTGATGACTTTGCGTTCGGCGCGTAA
+GCCAGGGATGGTCAGCTTTAGGTTTAACATAGTATTTTGAGCGTAAATCAATACGGGCAT
+TATCCACTCGTTCATGGACACTCTTTTCATCATCCAGTGGTAGCCTCCATAATTGCAGGC
+ACTAGCGCCGTGAACTTTTCACGCTTATCCCTGGTGTCGATAGCCTTCCAGCGTTCAAAT
+ATCTTCACTCGATTAACGCCAAGCGCTCGCTGATCAATCGCGCCACCTTCATATGTGACA
+CGCTGAACATCGATGTTCGGGCGCTCTTTCAAAGCCCAGAATGCTTCAGTGATTAATATC
+GTCGCCTGCTCCTGTGTCATTCCTGGTCGACATATCCAGGCATCCAGAGCCTCACGAGCC
+TGTTCAGGAGTGATTTTCATTGTTCAACCGCCCCGCCCGCTTCGTCTTACGATATTCATC
+ATAAACTTTGGGATCATACTGAAGCTCCCCGCCAGATGCCTCCTGTAGACGCATCGCGCG
+ACCTTCGGGAACTAAATCCCCTTTCCAGCTATAAAGCGAAGCCAAACGAATACCTGCTGC
+TTGTGCAAGTTTTGTTTTTGAACCGAAATACAAAAGAGCGTCAGTTTTAAGCATTTAAAA
+CACCTTTATTGTTAGTCATAACTAACAAGATAGATGTTAACAAAAACATAGTCAATACGA
+TTTAGCATTAGCTAACTATGGAAACAAAAAATTTAACTATCGGCGAACGCATCAGGTATC
+GTCGGAAAAACCTCAAACACACCCAAAGGTCTCTTGCTAAAGCCCTGAAAATCTCCCATG
+TGTCTGTATCACAATGGGAACGGGGTGATAGTGAACCTACAGGGAAGAACCTTTTTGCCC
+TCAGTAAAGTATTGCAATGCTCACCAACATGGATTCTATTTGGCGATGAAGACAAGCAAC
+CAACACCACCTGTTGAGAAGCCAGTTGCCTTATCCCCCAAAGAACTAGAGCTCCTTGAGC
+TGTTTAATGCACTGCCAGAATCAGAACAGGATACCCAGCTCGCCGAAATGCGAGCTCGAG
+TAAAAAACTTCAATAAACTCTTTGAAGAATTACTAAAAGCCCGTCAGCGGACAAATAAAA
+GATAACATCATCAATGAGTTATCTTTTACCACATCAATTATGTTAGCTATAGCATACAAA
+ATCACTTGACCGATATGTTAGTCATGGCTAATCTTGTTTGCATCAACACACCGCACGGTG
+TTCTCAGCAAACAGTTCCGCTACCCCAGCGTTAAGGGGAAATGAGGTCAGCATGGATACT
+ATCGATCTTGGCAACAACGAATCTCTGGTGTACGGCGTGTTTCCAAACCAGGACGGCACG
+TTCACCGCAATGACGTATACCAAAAGCAAAACGTTTAAAACCGAAAATGGTGCCCGTCGC
+TGGCTGGAAAGAAACTCAGGTGAGTGATATGGATTTCGACACAATCATGGAAAAGGCTTA
+CGAAGAATACTTCGAAGGCCTTGCCGAAGGCGAAGAAGCTCTCAGCTTCAGTGAGTTTAA
+ACAGGCGCTTTCCAGTTCGGCAAAATCTAACGGCTGATAAGCGAAACAGCACCGCGAGGA
+ATCAGTATGCAGAAACGAGAACCCGTCATCATCGCGCCAGACTATACCGATGATGAACTT
+TATGAGTGGATGCGCCAGAAAATTAATGCAGCGCAGGATCTGAAATGGGCTAATGAAGCC
+AGGGCTAAGCAGGCTGAAAATCTGTCCGCTCTGGAGCAGGATATCACCAATCTGGAAAAA
+GCAGCGGCATTAAGCATTGCCAGAATGATTACATACCCGCGTTAGTAGCTAATCAACAAA
+GCTAAGGTTAGTAATTAAGGAGTTCTCCACGGGTGAGGTGGAGTGCGTGCGCCGGACACG
+GGTGCGCATCCGGAACTGACAGTTTACTGAAAGGATATTTCCCTGAAAAGTCAGACCATA
+ACGCGAAAGCGCATGGCGAGGTAGCTGGTTCATAGATAGCCTGTCGTTAAATTTTCGTCG
+ACCGTGCGCTTCCGGTTGTGGCAACCCGCGAAATGGCGCGGCGGTAAGTATGGCGGGGTT
+ATTCCTTCCCCGTTGAGGACACCGGGTTGTCAGGTTGACCATACGCTTAAGTGACAACCC
+CGCTGCAACGCCCTCTGTTATCAATTTTCTGGTGACGTTTGGCGGTATCAGTTTTACTCC
+GTGACTGCTCTGCCGCCCTTTTTAAAGTGAATTTTGTGATGTGGTGAATGCGGCTGAGCG
+CACGCGGAACAGTTAAAACCAAAAACAGTGTTATGGGTGGATTCTCTGTATCCGGCGTTA
+ATTGTTAACTGGTTAACGTCACCTGGAGGCACCAGGCACTGCATCACAAAATTCATTGTT
+GAGGACGCGATAATGAAAACGTTATTACCAAACGTTAATACGTCTGAAGGTTGTTTTGAA
+ATTGGTGTCACTATCAGTAACCCAGTATTTACTGAAGATGCCATTAACAAGAGAAAACAA
+GAACGGGAGCTATTAAATAAAATATGCATTGTTTCAATGCTGGCTCGTTTACGTCTGATG
+CCAAAAGGATGTGCACAATGAATTCAGCATTTGTGCTTGTTCTGACAGTTTTTCTTGTTT
+CCGGAGAGCCAGTTGATATTGCAGTCAGTGTTCACAGGACAATGCAGGAGTGTATGACTG
+CAGCAACCGAACAGAAAATTCCCGGTAACTGTTACCCGGTCGATAAAGTTATTCACCAGG
+ATAATATCGAAATCCCGGCAGGTCTTTAAAACAGTTCCGTAATAAATATCCGGTTTCATT
+CTTATATGCCAGCAATGGCAGGGATTTGTTCATCCTTAAATCTGTCATGAGGTTAAAACA
+AATGAGTAAAGTCTTTATTTGCGCCGCTATTCCTGACGAACTGGCAACAAGGGAAGAAGG
+CGCTGTGGCTGTAGCCACAGCCATTGAAGCTGGCGACGAACGCCGTGCTCGAGCAAAATT
+TCACTGGCAATTCCTGGAACATTATCCGGCTGCTCAGGACTGCGCTTATAAATTTATTGT
+CTGCGAGGATAAACCTGGCATACCCCGCCCTGCCCTCGATTCATGGGATGCTGAATATAT
+GCAGGAAAACCGCTGGGATGAGGAGTCTGCTTCTTTTGTCCCGGTTGAGACTGAATCCGA
+TCCGATGAACGTCACTTTTGACAAGCTGGCCCCTGAAGTACAGAACGCTGTCATGGTTAA
+GTTCGACACATGTGAAAACATCACCGTTGATATGGTTATTAGCGCACAGGAATTGTTGCA
+GGAAGACATGGCAACATTCGACGGACATATCGTTGAAGCGTTGATGAAAATGCCAGAAGT
+TAACGCCATGTATCCGGAGCTTAAGTTGCACGCCATTGGGTGGGTTAAGCATAAATGTAT
+TCCTGGTGCTAAATGGCCCGAAATTCAGGCAGAGATGCGCATCTGGAAAAAACGTCGCGA
+AGGTGAACGCAAGGAAACCGGAAAATACACGTCTGTTGTTGATCTCGCCCGCGCCAGAGC
+CAATCAACAGTACACTGAAAATTCAACAGGAAAAATCAGCCCGGTCATTGCTGCCATTCA
+TCGCGAATACAAGCAGACATGGAAAACACTGGATGACGAACTGGCCTATGGGCGCTGCTT
+CGCAGACAGGCAGAACTTGATGGTATGCCTGCGATCAATGCCAAACGTGTTTACCGGATC
+ATGCGCCAGAATGCGCTGTTGCTTGAGCGAAAACCTGCTGTACCGCCATCGAAACGGGCA
+CATACAGGCAGAGTGGCCGTGAAAGAAAGCAATCAGCGATGGTGCTCTGACGGGTTCGAG
+TTCTGCTGTGATAACGGAGAGAGACTGCGTGTCACGTTCGCGCTGGACTGCTGTGATCGT
+GAGGCACTGCACTGGGCGGTCACTACCGGCGGCTTCAACAGTGAAACAGTACAGGACGTC
+ATGCTGGGAGCGGTGGAACGCCGCTTCGGCAACGATCTTCCGTCGTCTCCAGTGGAGTGG
+CTGACGGATAATGGTTCATGCTACCGGGCTAATGAAACACGCCAGTTCGCCCGGATGTTG
+GGACTTGAACCGAAGAACACGGCGGTGCGGAGTCCGGAGAGTAACGGAATAGCAGAGAGC
+TTCGTGAAAACGATAAAGCGTGACTACATCAGTATCATGCCCAAACCAGACGGGTTAACG
+GCAGCAAAGAACCTTGCAGAGGCGTTCGAGCATTATAACGAATGGCATCCGCATAGTGCG
+CTGGGTTATCGCTCGCCACGGGAATATCTGCGGCAGCGGGCTTGTAATGGGTTAAGTGAT
+AACAGATGTCTGGAAATATAGGGGCAAATCCACAGGTGAACTACGCTCCTCTGTTTGTTA
+CGCAATAAAAACTGGTGTTTTCGACTATGCAAAACAGTTTCCCTCCTCACGCAATCTGGA
+AAAATTTGGTGAGGCCCGACAAGATTTAACCATAAAAGAACTGGCTGAAAAATTTCTGGC
+ACTGAAAGAAACTGAAGTCGCCAAAACATCACTCAACACATACCGTGCCGTCATCAAAAA
+TATCCTGAGCATAATCGGTGAAAAAAATCTTGCCTCATCGATTAATAAAGAAAAATTACT
+GGAGGTTCGTAAAGAGTTACTGACTGGATACCAGATCCCCAAAAGTAACTATATTGTTAC
+ACAACCAGGGAGATCGGCTGTAACTGTAAATAATTACATGACAAATCTTAACGCCGTGTT
+CCAGTTTGGTGTTGATAACGGTTACCTGGCAGATAATCCGTTTAAGGGGATCTCGCCATT
+AAAGGAATCAAGAACCATTCCGGATCCTCTTTCGCGGGAAGAATTTATCCGTCTTATCGA
+TGCGTGCAGAAATCAGCAAGCAAAAAATTTATGGTGTGTTTCTGTTTATACTGGAGTTCG
+CCCTGGTGAGCTGTGTGCACTTGGATGGGAGGACATAGATCTGAAAAATGGAACAATGAT
+GATCAGGAGAAATTTAGCAAAAGACCGTTTCACGGTACCAAAAACACAGGCGGGAACCAA
+TCGGGTCATTCATCTTATTAAGCCAGCAATCGACGCTCTCCGGAGTCAGATGACATTAAC
+GAGACTGAGCAAAGAGCATATCATTGATGTTCACTTCAGAGAGTATGGCAGAACAGAAAA
+ACAAAAATGCACCTTTGTTTTTCAACCTGAAGTGTCAGCGAGAGTAAAAAATTATGGTGA
+CCATTTTACCGTTGACTCAATAAGGCAGATGTGGGACGCAGCGATAAAACGTGCCGGACT
+CCGCCATCGAAAATCATATCAGTCGAGACATACTTATGCCTGCTGGTCGCTGACAGCTGG
+TGCTAACCCGGCATTTATAGCAAACCAGATGGGCCATGCAGATGCGCAAATGGTATTTCA
+GGTATACGGAAAATGGATGTCTGAAAACAATAATGCACAGGTAGCTTTGTTAAATACACA
+GTTAAGCGAGTTTGCCCCAACCATGCCCCATAACGAAGCAATGAAAAATTAATTTAATAT
+TTATCAAATAGTTAACACGCATGACTCTTGAAATCCATAAATTCAAGCGCAGTGCCCAGC
+CATCCCGATACTGCTGCTTTCACCAAATCCTTAGTGCTTCTTTCGTGTTTTTCTATTGTC
+ATAATGGTTATCTCTAAAAAAGAGGTAAGATGCGTACTACTTACTCGCCGTTATTGGTAT
+TATTCAGAAAAAGTGAGTAAGACTTTGCAGCAATGTTTTTGATCCTGTTCAAATAAACTA
+ATGGCATCAGCAACATGCTGGAAATCAAACGTATGGGTAATTAATTTTTCTGGTTTAATT
+AACCCTTTACTTAACCAGTCGATAACGATCGGGAATTTATTTGCATTTAAGCGTGAAGAG
+AAAATAGAGAGTTCTTTTCCGGTAATTCCTTGCTGAATCACTTCAGACGGTTCACTGGAG
+AACCCCATCAATACAATACGTGCCGCTGGAGAAGCCAGCGTTACGGCCTCTTTCAGGATA
+GAAGGATGACAAGCCGCATCGATAATTAATGTCGGCTTGATGCCTTTTTCAGTGAAAATC
+TCGCCAAGCGGTGTCTGGCTGTTATTAATCGCCCAGTCAGCCCCGCTCTCTTTCGCTTTT
+TCCAGTCGTTCATCAATGCGATCGGCAACAATCACATTTTTAACGTTATAGACGCCTTTT
+AATACCTGAACGATCGTCAGGCCGATTGGACCGGCACCATAAACCAGAACGGTATCATTT
+TCAGTCGGTTGACCATGTCCGGTTACGTTAGCCGCAATGGTAAAAGGTTCGATCATTACC
+GCATATTGATCGGCCACTGCTTCAGGAATTTTCCACGCATTTTTTGCCGGAACCACGGCA
+TATTCACTGAAACCACCGTCAGCGTGCACACCTAATACAGCCAGTGTCGTACAAACGTTC
+GGTTTACCTATAGAGCACGGATAGCAATGCCCACAGCTGACCACCGGATCGACAGCAACA
+CGTTCACCGACTCTGGCGCTTTCCACGCCTTCACCCACTGCATCAATGACGCCAAAGAAT
+TCATGACCAATGACGCGCGGATATTTCGCAAAAGGATTATGCCCACGATAAATATGGCTA
+TCTGAACCACAAATTCCGGCAAGTTTCACTTTTACTCGTACTTCACCCGCTGACGGGGTG
+GGTATTTCACGTTCGACAATCGCCAGTTGATTCGGTTTTTCAATTAATATGCTTTTCAT
+>NC_000913.3|provirus_2461306_2476510
+ATGAGCCAGAAAACCCTGTTTACAAAGTCTGCTCTCGCAGTCGCAGTGGCACTTATCTCC
+ACCCAGGCCTGGTCGGCAGGCTTTCAGTTAAACGAATTTTCTTCCTCTGGCCTGGGCCGG
+GCTTATTCAGGGGAAGGCGCAATTGCCGATGATGCAGGTAACGTCAGCCGTAACCCCGCA
+TTGATTACTATGTTTGACCGCCCGACATTTTCTGCGGGTGCGGTTTATATTGACCCGGAT
+GTAAATATCAGCGGAACGTCTCCATCTGGTCGTAGCCTGAAAGCCGATAACATCGCGCCT
+ACGGCATGGGTTCCGAACATGCACTTTGTTGCACCGATTAACGACCAATTTGGTTGGGGC
+GCTTCTATTACCTCTAACTATGGTCTGGCTACAGAGTTTAACGATACTTATGCAGGCGGC
+TCTGTCGGGGGTACAACCGACCTTGAAACCATGAACCTGAACTTAAGCGGTGCGTATCGC
+TTAAATAATGCATGGAGCTTTGGTCTTGGTTTCAACGCCGTCTACGCTCGCGCGAAAATT
+GAACGTTTCGCAGGCGATCTGGGGCAGTTGGTTGCTGGCCAAATTATGCAATCTCCTGCT
+GGCCAAACTCAGCAAGGGCAAGCATTGGCAGCTACCGCCAACGGTATTGACAGTAATACC
+AAAATCGCTCATCTGAACGGTAACCAGTGGGGCTTTGGCTGGAACGCCGGAATCCTGTAT
+GAACTGGATAAAAATAACCGCTATGCACTGACCTACCGTTCTGAAGTGAAAATTGACTTC
+AAAGGTAACTACAGCAGCGATCTTAATCGTGCGTTTAATAACTACGGTTTGCCAATTCCT
+ACCGCGACAGGTGGCGCAACGCAATCGGGTTATCTGACGCTGAACCTGCCTGAAATGTGG
+GAAGTGTCAGGTTATAACCGTGTTGATCCACAGTGGGCGATTCACTATAGCCTGGCTTAC
+ACCAGCTGGAGTCAGTTCCAGCAGCTGAAAGCGACCTCAACCAGTGGCGACACGCTGTTC
+CAGAAACATGAAGGCTTTAAAGATGCTTACCGCATCGCGTTGGGTACCACTTATTACTAC
+GATGATAACTGGACCTTCCGTACCGGTATCGCCTTTGATGACAGCCCAGTTCCTGCACAG
+AATCGTTCTATCTCCATTCCGGACCAGGACCGTTTCTGGCTGAGTGCAGGTACGACTTAC
+GCATTTAATAAAGATGCTTCAGTCGACGTTGGTGTTTCTTATATGCACGGTCAGAGCGTG
+AAAATTAACGAAGGCCCATACCAGTTCGAGTCTGAAGGTAAAGCCTGGCTGTTCGGTACT
+AACTTTAACTACGCGTTCTGATAACGCGTTCGCCTGGATAAAGTCACCTGCATAGCAGGT
+GACTTTAACTCCCCCACTTCACCGAAAGTAGTGTCCTCATTGCTTACCTCCTGAGTTTTG
+CAAACAGCCTGTTGGCAGCTTGCCCTTTCAAATCAATAAGCGGTATCCACAGACAAACCT
+GAAGGGAAAGGCATATTTTCAGGCGTTCTGCTCGTCCTTCTCAAAGAGTTTACTTTTCTG
+CATTTCCAGGATACTCCCCCCCCCTGGCTATTGTGCGCTCATACACTCAAATTAAAGATA
+GGTTCTAAATAAATGAGCGTTTTTTGATAGTCTATTTCATTAGGTAATATATATTTGTAA
+CAAATCAATCAAAATGGAATAAAATCATGCTACCATCTATTTCAATCAACAATACCAGCG
+CAGCTTACCCAGAATCCATCAATGAAAATAACAATGATGAAGTTAATGGATTAGTACAAG
+AGTTCAAAAACCTTTTTAATGGTAAGGAAGGAATAAGCACCTGTATTAAACATCTACTTG
+AGCTTATAAAAAACGCCATACGAGTAAACGACGATCCTTATAGATTTAATATTAATAATT
+CCTCAGTTACTTATATTGATATTGACTCCAATGATACAGACCATATTACTATTGGTATCG
+ACAACCAAGAACCAATAGAATTACCTGCGAACTATAAAGACAAAGAACTCGTCCGTACTA
+TCATTAATGACAACATAGTTGAGAAGACTCATGATATCAATAACAAGGAAATGATCTTCA
+GCGCATTAAAAGAAATATATGATGGAGATCCTGGTTTTATCTTCGATAAGATATCACACA
+AACTCAGACATACGGTAACGGAATTTGATGAGAGCGGGAAAAGCGAACCAACGGACTTAT
+TTACCTGGTACGGTAAAGATAAAAAAGGCGACTCTCTCGCTATTGTAATTAAAAATAAAA
+ACGGAAATGATTACTTATCTCTCGGTTACTACGATCAGGACGACTACCACATTCAAAGAG
+GAATTCGTATTAATGGTGATAGTCTCACCCAATATTGTAGTGAAAACGCCAGGAGTGCTT
+CAGCGTGGTTTGAAAGCAGTAAAGCTATCATGGCAGAATCATTTGCAACTGGTTCCGATC
+ATCAGGTTGTAAACGAGCTCAACGGGGAAAGACTGAGAGAACCAAACGACGTTTTTAAAC
+GTTATGGTCGAGCAATAAGATATGATTTTCAAGTGGACGATGCAAAATATAAATGCGACC
+ATCTAAAAGAAATAGTTTCTACTTTAGTCGGTAACAAAATTAACGTTGGCCATTCTCAAA
+AAATATATAAGCATTTTAAGGATCTCGAAGGTAAAATTGAAGAAAGGCTTCAAAATCGCC
+AGGCTGAATATCAAAATGAAATTAATCAACCATCTGCGCCAGGTGTTAATTTTGATGATA
+TTTAAAATTATTTTTCCAGTTTTTTGATTTTTCAACAGCTGAATATCGGAAATAGTCAGT
+GACGAACATCAGTATTTTTACATAATTACGTCTAGGTCATTGTCGGTTTATCTCCTTTTA
+CTTGTGGTAATTGAGGGATAACAACAAAAAAGGTGAGTTTTGCGACTCACCTTTTTTATT
+TGTTTCTTATTCAGAATCAATATCTTTTAAATCATCCTGAATCGCTTGTGCGTTCGGATT
+TTCCTGCGGTTTGAGTTCGCCGCCATTAGCGATGAAATCATGACGCTGGAAGTACGCTTC
+GCGCACCATAATATAAGGATCGGACGACTGACGCAGCAGACCATCGGAATCCAGCAGCTG
+AGCGCGGGTTTCGATCCCTTCAAGCGTCCATTTACCCACAGACATCGGCCAGGTCAGCCA
+GGAAAGAACCGGGTAAAAACCATCCGCCATATCACCACCGTCATCACGCAGCGTGAAGCT
+ACCGTAGAACGGTAACTGAACGTAAGGCCCATAACCCACGCCATAATGACCAAGCGTACT
+ACCGAAGCGGTGAGGTTCAGTCCGTTGCAGTTTCGGGTTCGCCATCCCTGCAACATCAAT
+AAAACCGCCCATCCCCAAAATGGTGTTCAGGAAAAAGCGGGTAAAGTGGACCATCCCCTG
+ATAAGGGTCGCCCTGCAAGAAGTAGTTAACCATCACCGCAGGTTCTTCAAGGTTGCCAGT
+AAAGTTGCTCAAACCGTTACGCGCCGGTTGCGGAACATAATCACGCCAGGCGACAGCGAC
+CGGTCGAACAATATACGGGTCTAATACATTGAAGTTGAAGTTGTACATGGTGCGGTTGAA
+CCCTTCTAACGGGTCAGAACGCCCTTGCTGATCTGTACCGGAACTCGCACACCCCACCAG
+AAGCGTAGTTCCCAGAGCAAGCGCCGACAGGCGAAGCTTCATAAATGTCTCCCTGTTTTT
+TTATGGCTTATGCAGTTTGCCATCCATGACGGAACGATACCGTATCCGCCTGTTTAGGTG
+TGGGCGATTGTAACAGCACGTCAACTGATGTCCAGACGCCCTGATTTGCTGATTTGATCA
+TAGCCTGGTAATCGCCGCCCTGTAGGCTACTTGATTCTATAGAAACAGAAAAAGGCAAAC
+GCAGCCTTTTCTACATTTTCAGAGTAACTCCCGTCAGTTGCGAGCAAAAAAGCCGCTACG
+CTTTAGCTATACGTGCTAATTCAAGAGAAGAGACCATGGACAACGACAAAATTGATCAAC
+ACAGCGACGAAATTGAAGTTGAGAGCGAAGAAAAAGAGCGCGGCAAAAAAATAGAAATAG
+ATGAAGACCGACTCCCCTCCCGGGCGATGGCAATTCATGAGCATATCCGCCAGGATGGTG
+AAAAAGAGCTGGAACGCGACGCAATGGCGCTACTGTGGTCAGCCATTGCGGCGGGTCTGT
+CGATGGGCGCTTCGTTACTGGCAAAAGGGATATTTCAAGTCGAACTGGAAGGTGTGCCGG
+GCAGCTTCTTGCTGGAGAATCTCGGTTATACCTTTGGTTTTATTATCGTCATTATGGCCC
+GCCAGCAATTATTTACCGAAAATACCGTGACTGCGGTACTACCCGTCATGCAAAAACCGA
+CAATGAGCAACGTCGGCTTACTTATACGGTTATGGGGCGTCGTGCTGCTGGGTAATATTC
+TCGGGACAGGTATTGCGGCGTGGGCATTTGAATATATGCCTATCTTCAATGAAGAAACTC
+GCGATGCATTTGTCAAAATCGGCATGGATGTGATGAAGAACACCCCCAGCGAGATGTTTG
+CCAACGCGATCATTTCCGGCTGGCTGATCGCCACTATGGTTTGGATGTTTCCTGCAGCGG
+GTGCGGCAAAGATTGTGGTGATTATATTGATGACCTGGCTTATTGCCCTGGGTGACACCA
+CCCATATCGTGGTCGGTTCTGTTGAAATCCTCTATCTGGTGTTTAACGGTACGCTGCACT
+GGAGCGATTTCATCTGGCCCTTCGCACTACCTACTTTAGCGGGGAACATCTGCGGCGGCA
+CCTTTATCTTCGCGTTAATGAGTCATGCACAGATTCGTAACGACATGAGCAATAAGCGTA
+AAGCAGAAGCACGCCAAAAAGCAGAACGTGCGGAAAACATTAAGAAAAATTATAAAAACC
+CGGCATAAATGGCGAGGGTTTAAGCAATCGAGCGGCAGCGTACTTACCCCGCACTCCATT
+AGCGGGTATACTCATGCCGCATTGTCCTCTTAGTTAAATGGATATAACGAGCCCCTCCTA
+AGGGCTAATTGCAGGTTCGATTCCTGCAGGGGACACCATTTATCAGTTCGCTCCCATCCG
+TACCAGTCCGCAAAATCCCCTGAATATCAAGCATTCCGTAGATTTACAGTTCGTCATGGT
+TCGCTTCAGATCGTTGACAGCCGCACTCCATGACGGGTAAAAAGTGGATAAAATAATTTT
+ACCCACCGGATTTTTACCCATGCTCACCGTTAAGCAGATTGAAGCAGCAAAGCCGAAAGA
+AAAACCATACCGCCTTCTCGATGGTAATGGCCTGTACCTTTATGTCCCTGTGTCAGGGAA
+AAAGGTATGGCAGCTTCGCTACAAGATTGACGGTAAGGAGAAAATCCTGACCGTCGGAAA
+ATATCCGCTTATGACTTTGCAGGAGGCAAGGGATAAAGCATGGACTGCGAGGAAAGACAT
+CTCGGTTGGCATCGATCCTGTAAAGGCGAAAAAGGCTTCGTCTAACAACAATTCCTTTAG
+TGCGATTTACAAGGAATGGTACGAGCACAAGAAGCAAGTATGGTCAGTAGGGTATGCAAC
+TGAACTTGCCAAAATGTTTGACGACGACATTTTACCTATCATTGGCGGCCTTGAAATTCA
+GGATATTGAGCCGATGCAACTGCTGGAAGTAATCCGCAGGTTTGAAGATCGCGGTGCAAT
+GGAACGAGCCAACAAAGCACGCAGAAGATGCGGCGAGGTTTTCCGTTACGCTATTGTCAC
+CGGAAGGGCTAAATATAACCCGGCACCTGACCTTGCTGACGCCATGAAGGGATACCGCAA
+GAAGAACTTCCCGTTTCTTCCTGCAGACCAGATCCCGGCATTCAACAAAGCACTGGCAAC
+ATTTTCAGGAAGTATCGTATCGCTCATTGCGACCAAAGTTTTACGCTACACAGCCCTAAG
+AACGAAAGAGCTTCGTTCCATGCTATGGAAGAACGTCGATTTTGAAAATAGGATTATCAC
+CATCGACGCCAGTGTGATGAAAGGACGCAAAATTCATGTGGTTCCTATGTCAGACCAGGT
+AGTTGAACTTCTCACTACGCTAAGCTCCATCACCAAACCAGTCTCAGAGTTTGTTTTTGC
+CGGGCGCAACGATAAGAAGAAGCCAATCTGCGAGAACGCGGTACTGCTTGTGATCAAACA
+AATCGGCTATGAGGGTCTGGAAAGCGGTCACGGATTCAGGCATGAATTCAGCACGATTAT
+GAACGAGCACGAATGGCCTGCTGACGCTATTGAAGTGCAACTGGCACATGCAAACGGCGG
+ATCTGTGCGTGGGATTTACAACCATGCTCAGTATCTCGATAAACGCAGAGAAATGATGCA
+ATGGTGGGCGGACTGGCTTGATGAGAAGGTGGAGTGAGCGACCTTAACAACTATCGAATA
+GCACAAAGTCTTGCAATCCAGTGCAAAGCTTTGTGTGTATAAGTTTTGTCTCATCAACCA
+CAGCAAGTATCGATCGATTAAGACTTGGATGATAGACTTCATTCCTTTGATTATTAGCTG
+ATAGAAGAAATGTTAAAGCTATTTGCAAAGTACACCTCTATTGGTGTGCTGAACACCCTT
+ATACACTGGGTGGTTTTTGGTGTTTGTATCTATGTCGCGCATACAAACCAAGCTCTTGCA
+AACTTCGCAGGTTTCGTTGTGGCTGTGAGCTTTAGCTTCTTCGCGAATGCAAAATTCACA
+TTCAAGGCATCGACTACAACGATGCGCTACATGCTATATGTTGGGTTCATGGGGACACTG
+AGTGCTACTGTTGGATGGGCTGCTGATAGATGCGCACTTCCCCCGATGATAACTCTTGTC
+ACCTTCTCCGCCATCAGCCTGGTGTGCGGTTTCGTCTATTCAAAGTTCATTGTCTTTAGG
+GATGCGAAATGAAGATATCTCTTGTAGTTCCTGTCTTCAATGAAGAAGAAGCGATACCAA
+TTTTTTATAAAACGGTACGTGAATTCGAAGAATTGAAGTCATATGAAGTGGAAATCGTTT
+TCATAAATGACGGCAGCAAAGACGCTACGGAGTCAATCATTAATGCTCTGGCTGTTTCAG
+ATCCTCTAGTTGTTCCGCTGTCATTTACACGCAACTTTGGTAAAGAACCAGCATTGTTTG
+CAGGGTTAGACCATGCAACCGGGGATGCGATAATCCCAATTGATGTTGACCTGCAAGACC
+CGATTGAGGTTATTCCTCATCTTATTGAAAAATGGCAAGCAGGTGCTGATATGGTTCTTG
+CTAAAAGATCTGACCGCTCAACTGATGGACGCCTGAAGCGAAAAACGGCTGAGTGGTTCT
+ATAAGCTCCACAATAAAATAAGCAATCCTAAAATTGAAGAGAATGTTGGTGATTTCAGGC
+TGATGAGCCGTGATGTTGTCGAAAATATTAAACTTATGCCAGAACGAAACCTTTTCATGA
+AAGGTATTCTGAGCTGGGTAGGAGGAAAGACAGATATTGTTGAATACGTGCGAGCGGAAA
+GAATTGCTGGAGATACAAAATTTAATGGATGGAAACTTTGGAATTTAGCACTTGAGGGTA
+TTACAAGCTTTTCCACATTCCCTCTTCGCATCTGGACATACATAGGGTTAGTGGTAGCCA
+GTGTAGCATTTATTTATGGGGCGTGGATGATTTTAGATACTATCATATTTGGAAATGCTG
+TTAGGGGATATCCTTCACTACTTGTTTCAATACTGTTTTTAGGTGGAATTCAGATGATTG
+GAATAGGAGTATTAGGTGAATATATTGGACGCACATACATTGAAACCAAAAAACGCCCGA
+AATACATCATCAAGAGAGTCAAAAAATGAATAAAGCAATAAAAGTATCATTGTATATATC
+TTTTGTTTTGATTATTTGCGCCTTATCTAAAAACATAATGATGTTAAATACATCTGATTT
+CGGAAGAGCCATTAAGCCATTAATTGAAGACATACCAGCATTTACATATGACTTACCTTT
+ATTGTATAAATTGAAAGGTCATATTGATTCAATTGATAGCTATGAGTATATAAGTTCATA
+TAGTTATATTTTGTATACATACGTCCTGTTTATTAGCATTTTTACTGAATATCTTGATGC
+TAGGGTGTTATCGTTATTTCTAAAAGTAATATATATTTATTCATTATATGCGATATTTAC
+TTCATATATAAAAACAGAAAGGTATGTAACTTTATTTACATTCTTTATTTTAGCTTTTCT
+TATGTGTTCTTCATCAACACTGTCAATGTTTGCATCATTCTATCAAGAGCAAATAGTTAT
+AATTTTCCTTCCATTTTTGGTGTATTCATTAACATGCAAAAACAATAAATCTATGCTTTT
+GCTATTTTTTTCGTTGCTAATAATATCTACTGCTAAAAATCAATTTATATTAACCCCACT
+AATAGTGTATTCATATTATATTTTTTTTGATAGACACAAACTAATTATTAAATCTGTAAT
+ATGCGTGGTGTGCTTGCTTGCGTCAATATTTGCAATATCTTATTCAAAAGGTGTTGTTGA
+ATTAAATAAGTACCATGCAACATACTTCGGTAGTTATCTTTATATGAAAAACAACGGGTA
+TAAAATGCCATCGTATGTTGATGATAAGTGTGTTGGGTTAGATGCCTGGGGTAATAAATT
+CGACATATCATTTGGCGCAACCCCAACAGAAGTTGGAACGGAATGTTTCGAATCTCATAA
+AGATGAAACGTTTTCGAATGCACTCTTTTTATTGGTTAGCAAACCAAGCACCATCTTCAA
+ACTTCCATTTGATGATGGTGTGATGTCTCAGTATAAAGAAAATTATTTCCATGTATATAA
+AAAACTACACGTAATATATGGAGAATCAAACATACTAACGACTATTACTAACATAAAAGA
+CAATATATTTAAAAACATTAGATTTATATCATTGTTATTATTTTTTATTGCTTCTATTTT
+TATTAGAAATAATAAAATAAAGGCATCTTTATTTGTAGTATCTCTTTTTGGAATATCTCA
+ATTTTATGTGTCATTTTTCGGGGAAGGATATAGAGATTTAAGCAAGCATTTATTTGGAAT
+GTATTTTTCGTTCGACCTTTGCTTATACATAACAGTCGTTTTTTTAATTTATAAAATAAT
+TCAAAGAAATCAAGACAATAGCGATGTAAAGCACTAAGTTTAAATTGCGCGCCAATCATG
+GCGCGCACAAGCTATAATACCAACCTAATTTCTCCTCCTCTTAGAGTGACTATATCTCCT
+GATAGAATTGCGGTATTGACTATCAAATGCCCTGATTCGTTGTTTATTGTAATATCTCCT
+CTATCTGCAGACGATAACTTAAATGCATCATTGCCCACAACAAACCCCCTCCAGAACCAA
+GTGCTGATATTATCATCAACAGTGATAGATACATATACTAACTGATTATCGTTATAAGTG
+ATTCCTGTCTTATACTTAACATAAGGACTTCCACTTTGATTCTCGATAGACACATAACAT
+CCAGGGGTTATGTTTGTATGCGTCCCGCGACTATCGCCCCATTAACGCCATACGATAAAT
+GGGATGGTGAGAAATGGGTGACGGATACCGAGGCACAGCATAGCGTCGCAGTAGATGCAG
+CAGAAGCACAGCGCCAGTCGCTGATTGATACTGCAATGGCTTCCATTAGTCTGATTCAAC
+TGAAATTACAGGCTGGGCGGAAGCTGATGCAGGCAGAGACCTCCCGACTTAACACTGTGC
+TGGATTACATTGACGCGGTGACGGCAACAGATACCAGCACCGCGCCGGATGTCATCTGGC
+CTGAACTGCCGGAGGAGTAGGCCATTCAATATCTGGCGCACTGGAAGTATCGACCAGCTC
+CAGTGCGTCCAGATAATCCAGCCACAAATTATATTGCGCCAGTTCCTCACCTTTCAGACG
+ACCAATAGCCGCTTTACCAGCCCATTGTTTACTGTTCATATAATCGTTGGCCTGATTAAT
+CAATTGCTGCTTTTTCAGTTCGGCTGCAGCAATCTGTTCCTCATGTGTTGGTGGTGGAAT
+TTCAGACCATGCAGGAAAACCATTTTCTCCAGCGATACGGATTTTTCCTTTCGGCGGTAA
+TCCGGAAAACTCAATATACACTTGCTCATCAACTTCAACAGCATCATCTGGCCATGAGCC
+AGCTTGCGTGTAATCCTCTTTCATCTCCAAGGGATAGAAAGAGTTTGTAGTCGCGGAATA
+TATGTAATTCATTTTTCACTCCATAAAGTTAAAAGAAATTAACACCCTAATGCGAAAAAT
+GAAGCACCGATACCGGGTACGCCTGCTCTGGAAATAAATTTCACCGGGTCCTGGTTATAA
+CCGGCACAAGCTATATAGCCAACATTTGCACTGCCGGGAGTGTAATCCTGAGTCGCAAAT
+ACCCGCAGACATCTATTCGGAAATGCAATCGGAAAATAGGTTACTGTGTCCTGAGACGTC
+AGCGGAACATCAATTGGCCCCCATTGAATAATTAAACCGGATGGCAATTTTTGATATCCA
+GGAACTGAAGCAGAAAGCATAAAACTACCCATATCAGGTATCTGATTCGCCCCTGTCCCT
+ACATTTCTTTTAGCCGCTTCTCCCAAACCAAGGTTTTCGAGAGCCTTTTGCACCGTGCCG
+TCCAATTTGATATCGCCAAACGGATTCTTGCGGCTTAACAGCAGCGCACGAAGCGCGGTA
+AGCAGCTGGTCATGCCGCCCCTTCTCCAGGCTGGCACCGGAGGCCTCCACAACGCTGCAA
+AGCTCCTCCTGCAACATGTCAAAGTAGTCATCATCCAGATCGGTGGCAGGCGTGCCGGTC
+TGGGGGTTACCACGGGTACGGGGGATTACCAAAGGCAGCACCTTTAAGCTCCGCAAGACG
+TTCTGACCAGTCATGCGCCAGCGCGTTGTCTTCCGCAGTGTAATACGCGGCACATTTGGC
+GTTATCACCATCAGTAAACAGATCCAGAACAAACGGGCCAAACAGGGTGTTAATTCCCCA
+GAAAATGTTGTCCGGCGTGCGCCACTGATCGCCCACTTCCTTCAGTTCATGGGCTGGTTT
+GTTCCGCAGCTCCACCAGCGCCTGGCAATATTTATTACTCATTAAGCCCCCACGTAATTC
+CCTGAGAGATACCACTCTTCACCTGATGCAGCCCGCTTACTGCTTTTCCGTAAACACCGT
+TCACGACGCGCCAGAAAATTGTTTCGTTCTGGCTGGGAGTGGCTTTCACGGAATGCCGCC
+ATCCACACCGTTGCAGCACGACGGTATAAGCCCCTGGACTCCAGTTCTTCCGCCTGGCGG
+GTCAGGCACAAAATCACCCGCGGGTCGTTAGTGCCGACATAGAAATTGCGCACAGGTCTG
+GTTTCACGAACTGGTTGTGGTTCCGGATCCTGCGCTCTCTCAGTCAGGCGCGGGAAATGT
+CTGTGTGTATCTCCTTCACAACGGTGAGCCACACGCCCACTCTGACGTAACTTGCTTGCT
+GACTGCAGAACGCGCTGCCGTGAGTAACCTGCAAAAGCATCCGCAATGTCTCCGGAAGTA
+CAGCCCGGATGGGCTTCAATGAATTTCTGAACGTCATTCAAAAGACTCATGCTCACCCCC
+TGAATCCTGCCGGGATCTGGCTGTAGTCCACATTGTCGTAACTGGCTTTGAAGTACGGGT
+CTTCGCGTTTTTCTGTGTACGTGCTGACGGACGGCGATAAGCGCAGGGAAAGCTCATCCC
+ATTTTTCCCGCAGCTTCGACGGGCTGAGCACGTTACGGCACCAGAACGGATCGCGGCTGA
+CGCGGCTGTACATCTCGCAGATTTGTTTGTGAGTACGACCATCCTGCACACACATCAGGC
+GAATTTCGTTTGCCCAGGCTGTCCAGTTCGGTTCTTTGGGACGAACCACCTCGCCGTCAC
+ATTCGGCGGCCTGCTCGTACAGGGCGATGATTTTTTTCCAGAGCCACTGTGCGCAGGTCA
+AATCATCCTGCGTTCCCCACTGGCGCTTTTTAGGGCTGAATACAACCGCATCAGGATGGC
+GAGTTAAAAAATCCTGTTCATCCGTCTGCGTGTCCGGTTGCGAAGCGTCCGGACGAGAAG
+GTTTTTTATCTGACGGATCATGTTTTGATTTTACTGACGGATCCCCGCCAGATTCTGACG
+GGTGAAAACCCGATTTTTTGCCAGATTTCGACGCATCAAATTTTGACGGGTCAGATTTTG
+ATGCGTCAGATTTTGACGGGTCAGAGTCTGACAGTTGAGAAAATGCCGCTGCCTGAAGCT
+TCGCAACGTTAAGCTGATAAACATTCGACGCATTGCGGTTATGATGAGGAGCAGCAAAAT
+GGCTAGCGAACGCAGTACTGATGTGCAGGCATTTATCGGGGAGCTGGACGGCGGCGTATT
+TGAAACCAAAATCGGCGCAGTTCTCAGTGAAGTCGCTTCCGGTGTGATGAACACGAAAAC
+CAAAGGTAAGGTCTCACTCAACCTGGAAATCGAACCATTTGATGAGAACCGTCTGAAAAT
+CAAACACAAACTCTCATATGTTCGCCCGACTAACCGTGGGAAAATTTCCGAAGAAGACAC
+CACCGAAACGCCGATGTATGTCAATCGCGGTGGTCGCCTGACTATTCTGCAGGAAGACCA
+GGGACAATTACTGACTCTTGCCGGTGAGCCTGACGGAAAACTCCGCGCAGCAGGTCATTA
+ATATCATTCTTAATTAACTAATTATTTATCTCATCACTGAATATCTTAATATAGTGAGGA
+CTTATTATGTCTCAGAACTTAGACGCAACCGCAATTAATCAAATCCATGCCCTTATTTCT
+GCTCAGGGTGTTAATGAAATTATCAGTAAGATTGGTGCCGATGCTGTGGCATTGCCTGAG
+AATTTCCGCATTCATGATCTGGAAAAATTTAATTTAAATCGCTTCCGTTTCCGTGGTGCG
+CTTTCCACTGCCAGCATCGATGACTTTACCCGTTATTCTAAAGATCTTGCAGATGAAGGC
+ACCCGCTGCTTTATCGATGCTGATAATATGCGTGCCGTCAGTGTGCTTAACCTGGGTACT
+ATTGATGAACCAGGTCACGCAGATAACACCGCCACTCTCAAACTGAAAAAGACAGCACCG
+TTCTCTGCCCTGTTGTCTGTTAACGGCGAGCGTAACTCCCAGAAATCACTGGCAGAATGG
+ATTGAAGACTGGGCCGACTACCTTGTGGGCTTTGATGCTAATGGTGACGCCATTCAGGCA
+ACAAAAGCGGCTGCGGCAATCCGTAAAATCACGATTGAAGCAAACCAGACCGCTGATTTT
+GAAGATAATGACTTCAGCGGCAAACGCTCCCTGATGGAATCTGTCGAAGCGAAGACCAAA
+GACATTATGCCAGTGGCATTTGAATTTAAATGCGTTCCGTTTGAAGGTCTGAAAGAACGT
+CCGTTTAAATTACGCCTCAGCATTATCACTGGCGATCGTCCTGTACTGGTTCTGCGCATT
+ATTCAGCTGGAAGCGGTGCAGGAAGATATGGCTAACGAATTTCGTGATCTGCTTGTTGAG
+AAATTCAAAGACAGCAAAGTAGAAACCTTTATTGGTACTTTCACCGCCTGATTTCATTAC
+TGCAAATGCCCCTGCGGGGGCATTTATGGAAACGTAATTAACTCAATAATCACCGGATGG
+TGAGGGCTTCCTTTTACCCAAACTCAGCGCGGTGCAGCGCATATACGTGGAGAACAAAAT
+GTCATTTATTAAAACTTTTTCCGGGAAGCATTTTTATTATGACAAGATAAATAAAGACGA
+CATCGTGATTAACGATATCGCGGTTTCCCTTTCAAATATCTGCCGCTTTGCCGGTCATCT
+TTCTCACTTCTACAGTGTCGCCCAACATGCGGTGCTTTGCAGCCAGCTGGTGCCGCAGGA
+ATTTGCTTTTGAAGCATTAATGCATGATGCAACAGAAGCGTATTGCCAGGACATCCCCGC
+ACCACTGAAACGCCTTCTTCCTGACTATAAACGGATGGAAGAAAAAATAGATGCAGTAAT
+CCGTGAGAAATACGGGTTACCTCCTGTTATGAGCACGCCAGTGAAATATGCCGATCTCAT
+TATGCTGGCAACCGAACGCCGTGATCTCGGGCTTGATGATGGCTCTTTCTGGCCTGTACT
+GGAAGGCATCCCGGCAACAGAGATGTTCAACGTGATTCCACTGGCACCGGGTCATGCCTA
+CGGGATGTTTATGGAACGTTTTAACGATTTATCGGAGTTACGCAAATGCGCATGAATGTT
+TTCGAAATGGAAGGGTTTCTTCGCGGGAAATGTGTACCGCGAGATCTGAAAGTGAACGAA
+ACAAATGCTGAGTACCTGGTACGTAAATTCGACGCGCTTGAAGCTAAATGTGCGGCACTG
+GAAAACAAAATAATACCAGTGTCAGCTGAACTGCCACCAGCAAATGAAAGTGTTCTGTTA
+TTTGATGCTAACGGAGAAGGCTGGCTGATTGGCTGGCGTTCTCTCTGGTACACCTGGGGA
+CAAAAAGAAACCGGAGAATGGCAGTGGACATTTCAGGTTGGGGACCTTGAAAACGTCAAT
+ATCACTCACTGGGCAGTAATGCCAAAAGCACCGGAGGCTGGAGCATAATGACCACATTTA
+CCAATAAAGAACTGATTAAAGAAATCAAAGAACGAATCAGCAGCCTAGAGGTTCGAGACG
+ATATTGAGCGCCGTGCTTATGAAATCGCACTCGTATCTCTGGAAGTAGAGCCAGATGAAC
+GCGAAGCCTATGAATTATTCATGGAAAAGCGTTTCGGTGACTTAGTAGATCGTCGGAGAG
+CAAAAAACGGCGATAACGAATACATGGCATGGGATATGACTCTCGGTTGGATCATCTGGC
+AGCAACGAGCTGGTATCCATTTTTCAACAATGTCACAACAAGAGGTGAAATAATAGAGCC
+ATACAGCCTCACACTCGATGAGGCCTGTCAGTTTCTTAAAATATCCTGATCTACCATCGC
+CGTCATAGAGCGTATTTTTATTACCTGATTTGCAGGTTCGATTCCCTATTCGGAGATAGC
+ACTCATGCAACACGAACTACAGCCTGATTCACTGGTTGATTTGAAATTCATCATGGCTGA
+TACTGGCTTTGGTAAAACCTTCATCTATGACCGGATTAAGTCAGGCGACCTGCCAAAAGC
+CAAAGTTATCCACGGGCGAGCAAGATGGTTATATCGTGACCATTGTGAATTCAAAAATAA
+GCTCTTAAGCCGCGCCAATGGGTAA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_002737.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1977 @@
+>NC_002737.2|provirus_529627_569283
+TTAAAACTTAAAAATAATATCGATGTTATCCATAGTAACCTCGACTCTATCTATCAATTG
+CTTAACTATCCTAGATTGAACATCATACGAAGATTTTCTAATGTCAAGGTTATCCATCAG
+CATTCCAAGAGAGTCTTCGTTTTTCTTGTCTAAATAATTCAATTTAATTGCTTTGTTATA
+ATCATCTTTTAAATGATTGAGTTCTTCGATGTCTTTTTTTAGTTTTGGTAGGTCAATCAA
+ATCATTAATATATAAATCGTTTAGACGATTGATTTTTTTATCGATTATCTCTATTTCTTT
+TTTTAAAGGTGTAATATCAATTATATTGTCATCTTTTTTTATTTTTTTAAGATATTCTTT
+ATCGTGTTGAAGTTTATAAAGAACATCAATAACATATTTTTCGATGTGTTTTTTTTCATA
+TCGACCAGTGTTACAAATCTTTTGGTTATTATAATTATTAACACTTCGTCTAGCCAAACT
+TTCTGTTTTATTAACACAAACGTAAGTTTGCCTTCTCGTACCATCGTTCTTAGCTCTTCC
+TGTGCATACTTTTAAAGGGGCACCACAATAACCGCATTTTGCTATGTGAGAAAGCATATA
+TTTCCCTTGAAAAGGTCTAGTATTTGTTTTCGTATCTGTCCTATGTGCTAAAGCTATTTG
+CGCTTTATTATATGTTTTTTCGTCGATAATGGCTTGATGATCACCTGAGAAAGTTTGTTC
+CCTATACTTCACTAATCCTTTATATGTTTCGTTTTCTAATATTCTTTTTACTTTTACATG
+TGTCCACGTATTCCCGACGAAATTGTCTCTCGCGTAATTTGTAATTGACATGATTGAGCA
+GCCAGAGATTATCATGTCAAACATCTGCCTGACATTAGCAGCCTCTAACTCGTTGACCGA
+CAATGTTTTTTCGTCTTTGTTGTATCTATATCCATAAGGTGGTGTTTTCCAAGCCGTTGT
+TTTTCCAGATTTTGCTCTATTCATAACACCAAACTGCATTCGCTCTTTAATCTGTTCTCT
+TTCAAACTCTGCAATAGCTGACAAGAGAGTGAGAAAGAGATTTCCCATTGCTGAAGAAGT
+GTCGATATTTTCTTTTAAGCTGACAAAATGGATATTGTTAGCAGTAAATACATCTTTGAC
+TAAGTAAAGTGTGTCTTTTACATTTCTTGATAGCCTGTCTAGTTTATAGACTAAAATAGT
+ATCAAATTTATTGTTTTTACCGTCTTCAATCAATTCTGTTATTGCCGGTCGTTCAAGTTT
+ACCGCCTGAAAAACCTGCATCAGAGTAGTTTTTGTAAATTTTCCATTCCATTGCCTCACA
+ATACTTTGTTAAAGCTTCAATCTGTCCTTGAATGGAATATCCTTCTTCGGCTTGATTTAT
+TGTTGATACTCTAGAGTAAATAGCTACTTTTCTCATTGTTTTTTACCTCATTTTTTGTTA
+AAATGAGTACAGTAAAGAGACCTACTTAAAGCAGGTTTTTACTATACTAGATTCGCCTCA
+CGCTCGCACCGACCAAAGTTGAGCGGGGGGCTTTTTTTATTTTGTCTCAAATATACAGCT
+GCACTCGTTACAGTGCCATTGCTTCTTCCCTTTTTCTCCTAAAAATCCCATAACTGTTCC
+ACCTATTAAAAGAGTTCCTGCGACGGCCTTTTTAACAGAAAATGTCTTTTTACCTTGCTG
+CATAAATCCAACATTAGTACTTTTACATTTTGGACATCTTACCGCCTCTTTTTCTTTTTT
+TATCACTTGTTTTATTTCGCTATTTAATTGGGTCTGTCGTACTGAGTTTTTCATTACTTG
+CTTTAAGCCACGGTTTTCAATCTCATTCATCTTTTCTGCATTGTTTTTTGCTTCAAAATA
+TTCTCCCAGATTTTTTGATTTTAAAAGTTGTTTTAACGTCATATCATTGTCCTCTCTAAA
+AACATTAGTTAAAATTCAATCGGTGTAAAACTACCAACAACGTCATATATTTTAATGTAT
+GTATCTTCTGCTGGTGGATAGCCAATAAAAATATCGCTATATTTTTTATTAAGTGATACT
+AATCGAAGTCCATCATGTTCAGTGTAAACTTTTTTAAAATAAGTGTTCCCGTTATGTACA
+ACAATACATAATTGTCCGCTGTATGTTGACATTCCTTTATCAACGATATAAAGCATATCT
+CCTTGCTCGTACTTTGGTAACATGCTATCGCCTCTTATGCCAATAGCATAATCATAATGT
+GGAGGTTCTTCGTCTGTATAAACTGTATAAGTATCATAGTCATCTGCTTCAAAACCTCTA
+CCAAATCCGCTTGCTGCTGCAGCAAAAGTCGTTCCTTTAACTTCAAAAATATCTTCGATA
+TCAGTTTTTTTATCACTGAAATTGATGATTTTTGTTTGTTCTTCCAATTGCTCTTTTGCT
+GTATCTAAAACAATTACTCTTCGTTGTTCTTCTAATTCGCGGTATATTCCAAGCAGTTCC
+GAACCATCTACTTCGCTATTTAAATCAATACCAAGTAAAAACTCTGTTGATATATTAAGT
+GCTTTAGCAAAATCATCTGCCCTGTTTAAAGGAAATTCTCTTGTTTTATTAAAATATCTA
+GACATCGTTGATTTTGCAATACCAACATTTCTAGCCAACTCACTCATTGACATCTTTCTT
+TCTTCTACTTTGCTCTGTATCAAAGAAATAATTTCGCTGTTTGTTCTCATGTTTTGTTAT
+CCTTAATGTTATTTAGTAATATCATTATACCATCGTTCCCAAAAAAATACAATAAAACGC
+TAAAAAACAAATAAACGTATTTTTTTTAGAAAAAATCGTTGACAATTTGGAACGTAGGTT
+TTATAATAAAGGTGTTCCAAAACGGGAACAAAAATAAAAAAAGGAGTATGTATATGACAA
+TCAATTTGAAGCGACTAAAAGCCGAGCGAATTGCTAGCGGTATGACACAATGTGAAGTTG
+CACAATCTATGGGGTGGAAAACACGAACACCATATGCAAAAAGAGAGAACGGTATTGTTT
+CAATTGGAGCTGATGAGCTTGCAAAAATTACTTTGATTTTTGGATTACCAATCGAAAAAA
+TAGCAATTTTTTTTGATAAAGACGTTCCCGTAATGGAACGATGATGCAAATAAAAAAGCC
+CTGTAAAATAGCAGTTTACGGGACAGACAGATTCTTATGAGGCAATTTTACCATGAAAAA
+CAAAAAAGAGCAATGGACCCCAAAAGTTCACTGTTTTCGAAAAGATGGTTCACAATGTGA
+GCCAGAAAATATAACAGTGCCAATTTCTTTTGCAGGTTACTATCAAATTTTATTAGAACT
+AGGAGTATAACATGAAACTATTAGATTTTATTTTTACAAAACCAAAAAAACAGGAACCGA
+TTAAACACGATACTAAGCGATTGTCATCTGAAAAGCAGTATGATGCATTCCACGCTTATA
+TGAGAAAAAAAGTATGAAACAACAACTAATTAACGACAACGAATTTTTGCGAGACGAAAA
+TCGCAGGTTAAATAATGAATTGGCGGAACATTACTTTGTAGTTACAGCTAAAGCAAATTT
+ATTAGATGTCATTATTGCTAGTGATTTTATCTTGAAAAGTACGCTAGATAAATGCATTGC
+TGAATTGGATGAAATTGATCAAATAGCCCTGTTAAAAGCATGGAACAAGGGAGAATTATA
+ATGTCAATAACAATAAACAAACTTGAAATCGAAAACGTTAAGCGTATTAAAGCGGTAAAG
+ATTGAACCATCTGCAACAGGCTTGACCATTATCGGTGGTAATAATAACCAAGGCAAAACA
+AGCGTATTAGATGCTATTGCTTGGGCACTAGGCGGTAATAAATACAAGCCTAGTCAAGCT
+ATGCGCGAAGGATCGCAAGTGCCACCTACGCTTAAAATTACCATGTCAAATGGACTTATT
+GTTGAACGGAAAGGCAAAAATGCCAGTCTTAAAGTAATTGATCCAAACGGCCAAAAAGGT
+GGTCAGCAGTTGCTAGATAGCTTTGTAGAAGAATTGGCTATTAACTTGCCGAAATTTATG
+GATAGTACACCAAAAGAGAAAGCAGATGTCTTGCTTGAAATTATTGGTGTCGGTGATCAG
+CTAGCAGAGTTAGAGCTAAAAGAAAAAGAAATATACAATCAACGTCACGCTATCGGTGTT
+ATAGCAGACCAAAAAGAAAAGTTTGCTAAGGAGATGACATATTATCCTGACGCACCTAAA
+CAACTGGTAAGTATTTCTGAGCTTATCCAACAACACCAAGCTATCTTAGCCAAAAACGGA
+GAGAATGCTCAAAAGCGTCAAAATGTAGAACGTATTCGCTATGATTATAATCAATCTATC
+TTGGAAGTTGACCGTTTACGCAAGTTATTAGCAGATGCAGAAGCTAAGACGAATAAGTTA
+AGCGAGGATTTAAAAATAGCAAATACTGACGCTATGGATTTACATGATGAATCAACAGCT
+GAAATCGAGGCGAATATTGCCGATATTGATGAAGTCAACCGCAAAGTGCGCGCTAACTTT
+GATAAAGATAAAGCTGAAGAAGATGCTAAACAGCAGCGTGAACAATATAACATATTGACT
+AATGATATTGAGTCAATTCGTCAACAAAAAAGAGACTTATTGATTAATGCAGATTTGCCG
+CTTGAAGGCTTATCAGTAGATGATGGAAAGTTACTTTACCTTGGTCAAGAGTGGGATAAC
+ATGTCAGGCAGCCAACAACTAATAGTAGCAACTGCTATTGTACGTAAACTAAAACCAGAT
+TGTGGCTTTGTTTTGATTGATAAACTCGAACAGATGGACAACATCACACTTGAACAATTT
+GGTAAACGGCTAGAGCAGGAGGGTTTGCAAGCTATTGCAACCCGTGTATCAATTGGTGAA
+GAGTGTGCCATCATTATAGAAGATGGATACTCAGTGGAAAACAAAGCTCATAACTTTAAA
+ACAGCAGAGGGTGGTAATTTTGCTGAAACAGTAGCACCGACTTGGAAAGGTGAGTTTTAG
+AAAGAGAGGTAAATATGCAAATTACAAGAGGTAAACGAGCACGTGCTCAACGTGTCATCA
+TTTATGGACCAGAAGGAATCGGTAAATCTAGTTTTGCTGCTAATTTTCCTGAACCATTGT
+TCATTGATACGGAGGGATCAACAGACAATATGGATGTGGCCCGTATGGATAAACCAACAA
+GCTACACTATGCTAAAAAATCAAATTGCATGGATTAAAGCGAATCCAACATGTTGCAAGA
+CACTGGTCATTGACACAATCGATTGGGCAGAAAGCTTAATAGTAGATGATGTCTGTGCTC
+AACATGGCAAGAAAGGTATCGAGGACTTTGGTTGGGGCAATGGTTATACCTACACAAAAG
+AGGAAGTAGGTCGATTCTTGAATATGCTCCAAGAACTGATTGAACTCGGTATCAATATTG
+TATTAACTGCCCATGCACAAATGAGAAAATTTGAACAACCTGACGAGATGGGAGCTTATG
+ACCGTTGGGAGTTGAAACTTGGTAAAAAGACAAGCTCACAGACTGCCCCCTTGGTCAAAG
+AATGGGCTGATATGGTCTTGTTTGCCAACTACAAAACAGTAGTTATGACTAGCGAATCAA
+AAAAGAAAAAGGCAACTGGTGGTCAACGTGTGCTATACACGCAACATCACCCAGCGTGGG
+ATGCAAAAAACCGTCATGGGTTACCAGACGAAATGCCTCTTGACTATGCAGTAATCGCAC
+ATCTATTCGCACAAGTACCAACTCAACCAGTGCCACAAACGCCACCAGTACAGGAAACTC
+CTGCATCACAAACCGCACATGAATCCGTACATGAGCAAGCTGAAAAAGCACCAGAACAAC
+CACCTATGCAACCGACATCTGCGCCGGTAGCCTACCCACCAAGTATGCCAAAAGCATTGA
+CTGACTTGATGTCGGCAGAGCAGGTCACTCCTGATGAGCTTGTGGCAGTAGCAAACATCC
+GAGGACACTTCCCGCCAATGACACCAATTGAAAACTTCCCGTCAGATTATTGGAATATGA
+TTGTGGCCAATTGGTTAGCTACGTTAGAAGTGATTAAAACGCAAGTGCGTACTGTCGAGC
+CACCCTTTACTGTGGAAGGCGCATAGGTTTTGGGAATTAGAAATTATAGCGAGGTATAAC
+AAACAATGAATAAAACAATCAAATTAGACTTGTCTGCCATCGGAGAAGGTGGCTTACAAG
+AAAAAGTAGACAAGGAATTGGAAAAAGTCTTTGACAATATCTTAGATCCTAATACAGAAA
+CAAAAGTAGCCCGTAAAGTAACTATTACGTTAACTATGAAACCAGACGATGCCCGTCAAA
+CTGTTTCAACAGCTATGGAAGTTAAGTCAACGCTAGCACCACAGACAGGCGTGGCTACAA
+CGGTCCTTGTTGGTCAAAAAGATGGTAAGGTTTATGCTAACGAGCTCAAAAGCGCGATGC
+CTGGTCAAACTTATTTTGACGATGAGGCAGTGCTAAGAACTGACATCGGTGAACCAATTG
+ATCACCTTGAAAAAGGTATTAATGAAGATGTTATTGATTTTAATAAGCAAAAGAAAGTAG
+GAAACTAACATGACAGAAAACATTAAAGAAGCTTTGGAATATGCAGTAAATACAGCTCAC
+GAAAAACCTAAGACTATCTTGGGTAGTGATGGTAAAGAGTATTATGATCGCAACAAATAT
+TCTTTGGTTGAACTTAAAACTAAGTATTATCCAAAAACATTGAATTTAAACACGCTTGAC
+AGTTTAATTGATTATCTTAAATCAGATATGAACAATATTAATTCCAAGCGTCTTATGGTC
+ATTGTAGAAGGCCCTCGTGAAGTTATTGTTTGCGAAGAAGATGATGACGACCTTAATCGA
+AATGTGTTAGTAACTGTGGAGGCAATTATTCCAAATGTTCAATTTGGCCACTATGATTCA
+CCTTCTGATTTTAATATTAGTCTGCAATCATTATTCGTTAACGCTGACGATCGTAACACA
+GTTATTGAATTCGCTAGTGCATTAAAAATCGAAAATGGCTCAGAAATTGTTGATGATGGC
+ATTGGTCAAACTGCCACAATTAAACAAGGTGTGGCAAGCCTTGCAAAAGCTAAGGCGCCA
+AACCCAGTTACATTACGTCCATACCGCACATTTTCTGAAGTAGAACAACCTTCAAGTGAG
+TTCATTTTCCGCATTAATCAACTTGCTAATATGGCTTTGTTTGAAGCAGATGGTGGAAAG
+TGGCGCTTAGATGCTATCAATAATATTGCTAACTACTTAAAAGAAGAACTTGCTGATCAA
+ACTAACATTACAATTTTAGCTTAATAGAAAATAGGAGAAATAAAAATGACTGAATACAAT
+AACAACTTTGACCGTGAATTGGGATGGGATGATGAAATTACACAAGACAGTGTAGGTTTT
+GTTCAATTAGTGCCTGGTGATTATCAATTCACAGTAACCAATATGGAGCGTGCTCGTCAC
+ACACCTAATCCGAAGAGTCCAGGAAAATTACCAGCGTGTAACAAGGCGGTCGTTACGATT
+CAAATAGAAACATCAGAAGGAATCGCGCAATTAACTCATAACTTATTCCTACATACTACA
+ACAGAAGGTATGCTATCAGCTTTCTTTGGAGCTATTGGTCAAAAGAAACATGGGGAACCA
+CTTAAAATGAACTGGAATACCGTCATCGGAGCTAAGGGGGTTGCTCGTATTAATAAACGT
+AAAGGCACCGGCGATTATGCTGATCGCGAATACGATAACATCAAATCTATGATTTACGCT
+GATGAAGTTGATTGGACAAAAGTATTAAATAAAGATGTCGCACAACCACAGCAAATGACA
+CATCAACAATCTGCTCAACCTACATATCAGGGACAACAGGCACAAGGCACTAATTTTGCA
+CAACAACCAGCAACGCAGTCATATCAACAAGGTCAAATGCAAACACCTCAACAACCTCAA
+GGCGGATGGGGAGGATTCTAATGCAGCTTAGACCTTACCAAGAAGAGGCAAGGTCAGCAG
+TGCAACACGAGTGGGAAGACGGCAAGAAGAGAACTCTTCTTGTCCTTCCAACTGGTTGCG
+GTAAAACTATTGTCTTTTCGAAAATTATCGAAGACCGTGTAAGGCTCGGAGAGAGAGTTT
+TGGTTCTGGCTCATAGGTCCGAACTTTTAGAACAGGCTAGTGATAAATTGATGACAGCAA
+CTGGATTAGGGACAGCATTAGAAAAAGCAGAGAATACTTCTTTAGGGTCATGGTTCAGGG
+TTGTAGTTGGATCAGTTCAAACGATGCAGAGAGAGAAGCGTTTGAGTAAGTTTCCTACAA
+ATCATTTTGACACAATTATTATTGATGAAGCCCATCATGCCATCTCTGATGGTTACCAAA
+GAGTTTTGCAACACTTTGATAGTAGCAATGTTTTGGGAGTGACAGCGACACCAGATCGCG
+GTGACAAACAAAATCTAGGTAAGTATTTCGATAGTTTAGCTTATGAATATTCCTTAGTAG
+ATGCCATCAAGTCTGGTTACTTATCTAAAATTACCGCAGTTACTATCCCGTTGACTTTGG
+ACTTATCTACAGTTAGTCAGCAAGCTGGAGATTTTAAAGCAAGTGAGATTGGGACGGCGC
+TTGACCCGTACCTAGAACAAATTGCCGATGAAATGGTGAAGCAATGCGCAAACCGTAAAA
+CAGTTGTATTTCTTCCGCTTGTTAAAACTTCCCAAAAATTTCGTGATATTCTAAACCAAA
+AAGGATTTAAAGCAGCAGAGGTCAATGGGGAATCGAAAGACCGCGCTGAAGTCCTAGAAG
+ACTTTGATAATGATAAATATAATGTACTATGCAATTCAATGCTTTTAACGGAGGGGTGGG
+ATTGCCCGACAGTCGATTGCGTAGTTGTACTGAGACCCACAAAAGTAAGAGCTCTTTATA
+GTCAAATGGTTGGTCGTGGCACACGATTAGCGCCGGGGAAAGAAAATCTACTATTATTAG
+ATTTTTTATGGCATACCGAACGCCATGAACTTTGTCGTCCTGCTCATCTAATTGCAAAGA
+CACCAGAAGTTGCTCAAAAAATGGTCGATAACATGACAGAGGAAACTGAAGTAACCTTTG
+AATTGTTAGAAGCTGAAGAAGTAGCTAGCAAAGATGTTGTCGCAGAACGAGAAGAAGCAC
+TCGCTAAGCAGTTAGCAGAAATGCGTAAGCGTAAACGTGCATTAGTTGATCCGTTGCAAT
+TTGAAATGTCTATCAATGCTGAAGACTTAGTGGACTATGTACCAGAATTCGGCTGGGAAA
+TGGCTCCTGTTTCTGATAAACAAAAGAACGCTTTAGAAAAATTTGGTATTTTTACCGACG
+ACATTGGAAATGCAGGTAAAGCTACTAAATTATTGGAGCGATTGGCCAAGAGGAGAGAAA
+CTGGCCTAACAACACCTAAACAAATCAGAATGCTAGAACGATACGGATTTAAAAACGTTG
+GAATGTGGAAATTTGAAGTAGCATCAAACATGATTAACCGCATTGCTGCTAGCGGATGGC
+GCCTACCAAAAGGCATCAATGCTCGAGAATACCAACCTGAATAGGAGACAAAAATGGGAG
+AATATTGTCACTTAAAAGAATTAGATGGACTTAGATTTGGATCATTGACAGTCATTAATA
+GAAACCGTAACAATTCTAAGGGTGGCAATGCACGATGGAATTGTCTTTGCGACTGCGGAA
+ATAAAACAGTTGTTATTGGAAGTAAATTAAGAAGTGGTTATACAAAATCATGTGGATGTG
+CACGTAAAAATGACAACGCTAAAGGTTATTCATCTACAAGACTTTACAGAATTTGGAAAG
+GCATGATGAATAGATGCTATAACCACAAAAACGATAATTACAAATATTATGGTGGAAAAG
+GTATTTCAATCTGTGATGAATGGCTAACTTTTATTAATTTTAGAACATGGTCGCTCTCTA
+ATGGATATAAAGAATCATTAACCATTGATAGAATAAATCCAAAAGGTAACTATACTCCAC
+TAAATTGCAGATGGGTAAGTATGAAAATGCAGCAAAACAATAAAACGAATAATAGGTATT
+TATCATATTTAGGTCAAGAATATACTATTGCTGAATTTTCAGAGAAGTTAAATGTTACCT
+ATTGGACTGTAATAAATCAATTGAAATTAGGTTGGAGTGTAGAAAGAATAGTAGAAGAAG
+CGAGAATGAAAAATGACAGATGATAAATTTGATTTATTACCTTTACTTGATTATATTGAT
+CCATCAAAACTATCATATCAAGACTGGGTGAATGTTGGTTTTGCCCTAAAACACGAAGGA
+TATACTGCTATGGATTGGGACATTTGGTCACAGTCTGACAGTAGATACAAAAAGGGTGAA
+TGTTTCGCTAAATGGGATAGTTTCCAAGGTAATGGACTTGGGACTGTCACTGGCGCAACT
+ATCACACAGTTAGCGAAAGAAAACGGGTGGACATCTGACTACCGTACGAGTGATGAAGCC
+CACGAGCTTGATTGGGATAGCACTATTGATCGTGACTATAAAATTATTGACAAGAACTGG
+ATCGAAGCAAAAGAAATTAGAGAACCTACTAACTGGTCACCCGTTCACGATTTGATTACT
+TACATCAACACTCTTTTTGAATCAACTGACAAAGTCGGATATGTAACAGAAACATACCCG
+ATTGAAATAGATAAGGGCATTATCTATAAACCAACAAAAGGAGCCTATGACAGGACAGCT
+GGTCAGCTTATCCAAGAATTACAAAAAAATCCTAATGACATTGGTGCTGTCCTCGGTGAC
+TATAAAGAAGAAGCTGGTGCATGGATACGATTTAACCCTTTAGATGGCAATGGTGTCAAA
+AACGACAATGTAACAGACTTTAGGTATGCCTTGGTTGAATCCGATAGTATGGAACTTGGT
+AAGCAGTATGCTTTATTTAAAGAACTAGAATTGCCAATAGCGACATTGGTCCATAGCGGT
+AAAAAATCATTACACGCTATTGTCAAAGTAGATGCTAAAGATTATCAGGAGTACCGCAAA
+CGGGTTGATTACATCTATCAAATCTGTAAGAAAAACGGCCTTGATATTGACACACAGAAT
+CGTAATCCAAGTCGTCTATCACGAATGCCAGGTATTATGCGAAATGGTCACAAGCAATTT
+TTGATTGATACAAATATTGGTAAAACCAATTATGAAGAATGGTATCAATGGATTGAAGAT
+TTAAATGATGATTTACCAGAGCCAGAAACGCTAGCTGATGAATGGGATAATTTGCCAGAG
+CTGGCTCCTGAATTAATTAAAGGAGTGTTACGCCAAGGACATAAAATGCTAATTGCAGGA
+CCATCAAAAGCCGGTAAGTCATTTGCATTGATTGAGTTATCTATTGCTTTGGCTGAGGGA
+CAGAAATGGTTAGGTTGGCAATGTGAACAAGGGAAAGTCCTCTATGTCAATTTGGAGCTA
+GACAGACCATCAGCTTTGCACCGCTTTAAAGATGTTTATGATGCGATGGGATTACCTCCC
+GCTAATGTGGCAAACATTGACATTTGGAACCTCCGTGGAAAAACAGTACCAATGGATAAA
+TTAGCACCTAAACTTATCAGACGCTCACTGAAGAAAAATTACCAAGCTGTTATTATCGAC
+CCTATTTATAAAGTTCTCACTGGCGATGAAAACAGTGCTGATCAGATGGCCCATTTTACA
+AATCAATTTGATAAGGTGGCCACTGAACTTGGATGTAGCGTAATTTATTGCCACCACCAT
+TCTAAAGGAAGTCAAGGTGGCAAAAAATCCATGGACAGGGCAAGTGGTTCTGGAGTATTT
+GCTCGTGACCCTGATGCATTGATTGACTTAGTGGAGCTTGAGTTGACTGAAGACCTTATC
+AAGGCACGCTCAGAAAAAGCAGCTGCTAAGATTTACCAACAAGCGTTGCAGGAAAAAGCT
+CTAGGATACTATCAACAGGAAGTAACGCTAGACGACCTAGAAAGTCGTTATCAGATGCAA
+CAACATTTTGACAAAGCTATCAAGGATATCATGGTTAAACAGCCATATCTTGAGGCCGTC
+AAAAAAGCCCAGCATGAGGTAGAAATTGCCACAGCGTGGCGAGTTGATGGAACGCTACGT
+GAGTTTGCGAAGTTTCAGCCAGTTAATATGTGGTTTAGTTATCCCAAGCACGAGGTGGAT
+ACAACTGGCGTGTTGGCTGATATTCAGTTGGAAGATAGTAAACCTCTTTGGAAAAAAGCT
+AAAGAAGCTAGGAAAAGTAAAGAAGAGAATCTCAAGGAACGGAACCAAAAACTTGAGACA
+GCTTATAGCGCCTTATTTGATGGTTCAACACCGGTTACAGTGCAAGAAATTCGTGAATAC
+TTGGATTTAAAATCCAATAAAAGCGTTGAAAATTATATCAAGGAACACGATGGTTACGAT
+GTCAAAAAAGGTGTTGTGTTCCAAATTTCTGATAACAAAGAAACGGAAAAGAAAGAAAAT
+AACTAGAAGAATTCTAAAGAAAAATTACGTTATTTTCTTTTCTCAAATCAGAAAAATACT
+AGTTAATTTCTTTTCTGTTTAATTTTAGAAAAACAAGAAAAATACTAGTTAATTTCTAAG
+AAAATACAGCCTATAACTCTTTCAGAGTTATTATAAAATGTTTTTCCTTCGTCAAAAGTC
+AAAGGGAAAAGGAAGAGGGGCGACTGAGCTACGCCCCCTCTGTCCTTTGTCCCATATTTG
+ACAAAGGCGCATATAAAAAACACAAATTGGAGATGAGGTAAAAATGGAAATTTACAAACA
+AAGAATGATTGAAGAATATAAACAGTTAAAAAAACGCGCAGAAAAACTATCTATTGTGCT
+AAACAGATACTACCTTGATGAGTTAGATTTTGAATTATCTTGCCCAATTGAACTTTTACA
+AACGCAATGGCATATTATGGGAGCGTATTTGAAAATTCTAGAACAAAGATTTTTGGTTGA
+AGGGATTTATTTTAATGATTGAATTTTTTTTGCCTATGGATAAAATCCCGACGACAACTC
+ATCAGCAAAAGAAAGTGACTGTCATAAATGGCAAGCCTCACTTTTACGAGCCTGAGAGTT
+TGAAAAATGCTAGGGATAAGTTTACAAGTCTTTTGGCTCAGCATGTACCACCCAGTAAGT
+TAGATGGTCCTATCCGTCTGACAGTCAAGTGGCTATTTCCCAAAATCAAGGGCAGCACAA
+ACGGACAGTACAAAACGACAAAACCAGATACCGACAACCTGCAGAAGCTGCTTAAAGACT
+GCATGACCGAATTGGGATTTTGGAATGATGATGCGCAGGTTGCTTCGGAAATTATTGAGA
+AGTTCTGGGCTGATACAGTAGGAATATACGTAAAGGTGGAAGAGTTATGAAAATTGATTA
+TATTAATTTTTTTGAACAAGTGGTTCCTGACTGGATGAGAGAGAGTAATGTCAAAATGCA
+AGAAGTTGGATTTAATACTGAAGCGTATTGGCAATGGGCAAATCAATCTATTGTTGCAAT
+CTGCGAAAAGTACGGAAATGACAGTCTGATCAATGGGCAGTTTCATCTGATTTGGGAATG
+GTTGGAGGATAAAGCAAACGGAGGTTAACGATGACTGAAGAGCAAGAACTAATAAAACCG
+CTGCTAGAAGAGATAGAGCGGAAAGATGATAGATTGTATATGCAGTCTAATGTAATTGCC
+GTCTTAATGACAGCAGTTCTTATGTTACTGATGATAAGTATAGCCTTACAAAACCACTAC
+GAGTCGCAAATCACAGGACTACGTACACAGCTAAGCAGGACACAAAAGCAGCTTAAACGT
+GCTAGCGAAGATAGAGCTAGACAGACAAAGCGAATTGCGGAACTTACGCACAACGGAGGG
+TAACATGATTAAGATCGATGAGATACATCGCATACTAGGCATCGACGAAGTTTATAAAGC
+ACCCAAACGACTTACGGACATACTCTTTGATAAAGATAGTCGTGAGGATATATTTAGACA
+GTTTTTGAAATATGAAACAGATGTATCTTACGACTGGTTTATGCAATATTTTGAGGAAGA
+ACAAGCTGACCGCAAAAATAAAAAGCAAGACTTTACTCCTAAATCGGTTAGTACACTATT
+ATCTAAAATAATAAGTGGTAATCAATACTACGAGGTAGCAGTCGGGACGGGTGGGATACT
+TATCCAAGCATGGCAAGAACAACGATTAAATGACAGTCCATTTACTTATCGTCCGAGTAA
+ATACTGGTATCACGTAGAAGAGTTATCGGACAAAGCAGTACCGTTTCTACTCTTTAATAT
+GTCTATAAGAGGGATAAATGGTGTGGTGGTGCATGGCGACTCTTTAACAAGACAAGTTAA
+AAACATTTATTTTTTGCAAAATACAAAAGACGACATGCTGAGTTTTAGTGATATTAACGT
+TATGCCAAGGACTCAAGATATTGAGCGAGAATTTAATGTCAAAGAGTGGATTGGTGATGG
+GATAGAACACATTGAAAATCCACTAATTGAATGGATATAACCAATAACGGTATCCCGCAC
+GTTCGACTCGTGCGGTTGGTATTGACCGAAATTGAAAAATAGAAACGAGGACCTCCTTAC
+ACCAAAACAAAATCTAACGCTGGTTATCGGTCACTGGCTATTATTTAAGGCGCTAATACT
+GACATCGTACGCCTGTGTCAAAATAAAAAAAGGAAGAGAGGGCTTTTCTCCACAAAACAA
+AAAGACGTCCACACGGAACGCCCCCTTGGTTAAATTTAAGCTTAAATAAATTATACCATA
+CTGGAGGCTTTCATGACGTTTTTTCCTGAGATTGATATCCAAAAAACAAAATCCAATGCC
+AAGCGTAAATTGAGAGAGTATCCACGCTGGCGAAGGATAGCTAATGACGTAGATACTCAA
+AAAGTTACAGCTACTTACTCCTTTGAGCCAAGGCAATCACATGGGGTTCCTAGCAAACCG
+GTTGAGAGACTAGCGCTAAACCGTGTGTCAGCAGAACAAGAGCTGGATGCGATTGAGCAA
+GCCGTCAGTATGATACTAGAGCCAGAGAGACGCAGGATTTTGTATGACAAATACTTAGCG
+CCTTATAAAAAGGCAGATAAGGTTATTTATACAGAATTGTGTATGTCAGAGAGCTTTTAC
+TATGATACACTTGACATTGCTTTGTTAGCTTTTGCAGAGCTGTACAGAGAGGGTGTGTTG
+CTTGTTGAGGAAGGAGTTTTTAGCTAGTTTTTATACAGTAATAAGATAGTTTATACATAT
+TTTTACATGTTATTATAGTATTATCAAAATAACAAGAAGAGATAACCTTTTAATCACTGA
+CTATTTTATTTAGTCGCCAACTTTAACTACGATCAAACTTGTTATTTTATGGTATGTGGG
+ACGTGCAGGTTCGATTCCGACTGTTCCTGTGAAAAGCTCTAAGAAGCCTACGGGCCTTAG
+GAGCGATGAAGTTAGAGAATTGCATATCGCTCTAACTCAATATGCACTAGTCATCACACC
+GTGGTGGCTTTTTATTATGTAAAAAAGGAATAAAACATGGAGTTTGTGGACAAAAAATTA
+AGTGAAATAACACCTTATAAAAATAACCCTAGAAACAATGATGAGGCTGTTGGACCAGTT
+GCTGAATCTATTAAAGAGTTTGGTTTTAAAGTGCCTATTGTCGTTGATAAAAACGGCGAA
+ATCGTAAACGGCCACACTCGTTATAAAGCAGCCCAAAAATTAGGGCTAGAAACAGTTCCT
+GTTATTGTCGCAGATGACTTATCTGAAGAGCAAATTAAAGCGTTCAGACTTGCTGACAAT
+AAAGTTGGTGAGATTGCGGTTTGGGATTTAGATTTGTTAAACGAAGAATTAAACGACATT
+TTAGACCTCGATATGTCTGCTTTTGGATTTGACGTTTTAGATAATTTAGATGATTTAATC
+GAAGATGAAAAAGATTTAGACGATTTTACAGGGACTGTGCCAGATGAGCCAAAGTCAAAA
+CTTGGTGACATTTATCAACTTGGTAGTCACAAGTTGATGTGCGGCGACAGTACAAATGGA
+GCCGATGTTAAAAAACTTATGAATGGAGAATTAGCTGATTTACTACTTACAGACCCACCA
+TACAACGTGGCTTATGAGGGTAAAACAAAAGATAGTTTAACTATAAAAAACGACAGTATG
+GATAATGACAGTTTTAGACAGTTCTTGGTTAATGCTTTTAGTTCTGCAAATGAAGTTATG
+AAGCCAGGCGCTGTTTTTTATATTTGGCATGCTGATTCAGAAGGCTATAATTTTAGAGGT
+GCTTGTTTTGATATCGGTTGGACAGTACGTCAATGCTTAATTTGGAATAAAAACTCAATG
+GTTCTCGGTCGCCAAGATTATCATTGGAAGCACGAACCTTGTCTTTATGGCTGGAAAGAT
+GGCGCTGGTCACTTGTGGGCTTCAGACAGAAAGCAAACATCAGTTATTGATTATGAGAAA
+CCTCAACGAAATGGCGTTCATCCAACAATGAAACCTGTCGGACTTTTTGATTACCAAATC
+AAAAACAACACAAAGGGAAGCGACATTGTCCTTGATTTGTTTGGTGGCTCTGGGACAACG
+TTAATTGCTTGTGAGTCAAATGGTCGTCACGCTAGATTAATGGAATATGACCCAAAATAT
+GTAGATGTCATTATAAAACGCTGGGAAGAATTAACTGGAGAAAGTGTTATACAACTAAAC
+TAAAAATCCCTTAAAACCGTTGACTTAACAGTGTTTCAGAGCTATCATGTGATCACAAAG
+ACAAAGAGGTAAATAACATGCTAGTAACAAAAGTAATTCACAAAATCTAAAATATTGAAC
+CAAGCGAAAAAGATTCGGCCTTAAAATATAGATACGCCAACGAACTTGAGTATCTCGTTT
+ACAATCTGTTTTATAGCGCAATTAAAGAAATAACTGCAAAAGATATCAAAAATAACTTTT
+TTTATCAAGATGATCAAGCCTTTATTATTAATTGGCTAGGACTATAAAATAATTTTAAAA
+GGGCGAAAGCCTTTTTTTTATATTTAAAAGTAAGGAAGTGAGGCGATGGCAAATGAAGAT
+AATTTGATACCAAACTCCAAACGAACCCCGAGCGAACTCCGAGAAATTGCAAAAAAAGGA
+GGCATAGCTTCCGGCAAAGCTAGGAGGGAAAAAGCGAATTTGAGAAAAGCTGTGGAGCTG
+GTGTTAGGATCAACTGTACCAAGCGCCTTGCTTCGAGAACAATTAGAACAATTGGATATT
+TCCCCCACAAATCAATCAGCTATTGCACTCAAGCTTGTGGAAAATGCTTTAAAGGGTGAT
+GTTAGATCTGCAGAGCTATTAGCTAAAATTACAACTACCGAGGTCAAAGATAGCCTGGAT
+AGAAAAGAACAAAGACAGCGAATTAAGGCCGCGGAGCTCGCCACAGACGAGCAACGAACG
+CGCATCGAGCTGCTTAAAGTCAAACTTGACGCAGAGAAGGGCGCTAAGCCTGATACTAGC
+TTAATGAGAGCCTTGTTAGATGCTGTGGAAGGAGGTGATTAGCCTTGGAGATTATCTTTT
+CAAATAAACAAAAAGACGTCATTAGACGCCCTTTTAACTACGAATTAGAGGTCAACGAGG
+GCACTTGACCCCTCGTAGCGGAAAGACCACAGCTGGGCATTTTCGTTATGCTAGGTATCT
+GATTGAGTCAGAAGATGAAAATCACCTTGTGACTGCTTATAATCAAGAACAAGCTTATCG
+TTTGTTTATCGACGGCGATGGTACGGGTTTGATGCATATATTTGACGGTAACTGTGAAAT
+AAAACACGACGAGCGTGGAGATCACTTGTTAATCACGACACCAAAAGGCAATAAGCGCGT
+TTATTATAAAGGCGGCGGTAAAGTTAACAGTGTTGGTGCTATTACAGGTATGTCTTTAGG
+ATCAGTAGTATTCTGCGAGATTAACTTACTGCACATGGATTTTATCCAGGAGTGTTTTAG
+GCGTACTTGGGCGGCTAAGCTACGTTATCATCTAGCAGATTTAAATCCCCCAGCACCTCA
+ACATCCAGTAATTAAAGATGTCTTTGATGTTCAGAACACGAGGTGGACTCATTGGACCAT
+GGATGATAACCCAATACTAACCGCAGAGCGTAAACAAAACATTATCAACAGTCTTAAAAA
+AAATCCATATCTATACAAACGAGATGTACTTGGACAGCGGGTCATGCCTCAGGGAGTTAT
+TTATGGCCTTTTTGACACGGAAAAAAATGTTTTGGATGCTTTGATTGGCGAACCAGTAGA
+GATGTATTTCTGTGCAGATGGAGGTCAATCAGATGCCACCTCTATGTCTTGTAATATCGT
+AACAAGAGTTAGAGATAACGGTAGGATAAGCTTCAGACTTAATCGTGTAGCTCACTACTA
+CCACAGCGGAGCTGACACTGGCCAAGTAAAAGCTATGTCAACCTACGCTTTAGAGTTAAA
+AGTTTTTATAGACTGGTGCGTTAAAAAGTATCAGATGCGCTATACAGAGGTATTTGTGGA
+TCCTGCCTGTAAATCTTTGAGAGAGGAGCTGCATAAGTTAGGAGTATTTACTCTGGGAGC
+TCCGAACAATTCTAAAGATGTATCTAGCAAAGCAAAAGGTATTGAGGTCGGTATCGAACG
+CGGCCAAAACATTATCTCAGATGGCGCTTTTTATCTTGTTAATCATAGCGAAGAAGAGTA
+TGACCACTACCACTTTTTAAAAGAGATAGGGCTGTACAGTCGTGACGACAATGGCAAACC
+TATTGATAAAGATAACCATGCCATGGACGAGTTTAGATACAGCGTCAACGTGTTTGTGCA
+TCGGTATTACAACTAAAGGAGTTGCTTAAATGGGAGTAATCCAAAAAATAAAAAATCTTG
+TTACAAGGAGTAAATACGTGATGACAACGCAGAGTCTTACAAATATAACTGATCATCCTA
+AAATAGCTATCAGTAAGCTAGAGTACGATCGTATAACAACCAATCTAAAGTATTATAAGA
+GCGATTGGGATAGTGTTTTATACTTAAACACGGACGGCGAGACTAAAAAAAGAGATCTTA
+ACCATCTACCAATTGCACGGACAGCTGCTAAAAAGATTGCCAGTCTAGTCTTTAACGAGC
+AGGCAGAGATTAAGGTTGATGATGATGCGGCTAACGAATTTATTAGTGAGACACTAAAAA
+ACGACAGGTTTAATAAAAACTTCGAGCGGTATCTGGAGAGTTGTTTAGCGTTAGGCGGAT
+TAGCTATGAGGCCTTATGTGGATGGTGATAAAGTTAGGGTAGCATTTGTTCAAGCGCCTG
+TTTTTTTGCCGCTGCAGAGTAATACGCAAGACGTTTCGAGTGCCGCCGTCGTCATTAAGT
+CCGTTAAGACAATCAACGGCAAAGAGGTCTACTATACCTTGATAGAGTTCCATGAGTGGC
+AGAGCTCTGATGATTATGTTATCTCAAATGAGTTATATCGCTCGGATGATAAAGCCAAAG
+TAGGTAGCCGAGTGCCGTTATCTGAGGTATACAAGGACTTAAAAGACGAGGCAAAAGTTA
+CAGATGTGACTAGGCCTATCTTTACTTATCTCAAGACCCCTGGAATGAATAACAAGGATA
+TTAATAGCCCACTTGGGCTATCTATCTTTGATAACGCCAAGACAACGATTGACTTTATCA
+ATACGACCTATGACGAATTTATGTGGGAAGTTAAGATGGGTCAACGTCGAGTTGCTGTGC
+CAGAGAGTTTGACCGCTTTAACTGTTCGTACCGCTGATGGCGATGTTGTTCCAAGGCCTC
+GGTTCGAGTCTGATCAAAACGTTTATATCCGTATGGGCGGCAGGGATTTAGACTCAAGCG
+CAATACAGGACCTAACAACCCCTATTAGAGCTGATGACTATATCAAGGCTATCAACGAGG
+GCTTGTCGTTGTTTGAAATGCAAATAGGCGTATCCGCTGGGTTATTTAGTTTTGATGGCA
+AAAGCATGAAGACTGCAACAGAAATCGTCTCTGAAAACTCAGACACCTACCAAATGCGTA
+ACAGTATTGTTACTTTAGTAGAGCAATCGCTAAAAGAGTTAGTTATCTCTATTTTTGAGA
+TTGCTAAAGCTTATGATTTGTACCAAAGCGAAGTTCCAAGCATGGATAACATCAGCATAA
+GTCTTGATGACGGTGTTTTTACAGATCGAGACGCTGAGTTAGACTACTGGATAAAAGTTG
+TTAATGCTGGCTTTGGCACTCGTGAGATGGCCATCCAAAAAGTGCTAAACGTGACAGAGG
+AAAAAGCCCAAGAAATAGCTGCAGAAATTAATACTGGAATCGTTGACGAAATCAATCAAC
+AGCGCACTGATACACATTTATACGGAGAGTGATTAGATGAAAAAGAAGCCTATTAAGTTA
+AATGACGAACAGCTTCTTTTGGAAGCTAGTCAGTTATCTGATATGTATCATCAGCTGACT
+CTTGATTTATTTGATCAAGTGATTGAGAGGATAAAAGCCAGAGGCTCAGCGAGCTTAGCC
+GATAATCCTTATCTTTGGCAAGCTAATAAGTTACATGACGTTGGACTGCTTAATGCAGAT
+AACATCAAGCTTATTGCAAAGTATTCTGGCATTGCGGAAGCTCAACTTCGCTATATTATC
+AAGAATGAAGGATTTAAAATTTATAAAAACACGTCTGAGCAGCTAGAAGAGGCTCTAGGT
+AGAGAGTCTGGGGTAAACAGTACTATCCAAGACGACCTATCTAACTATGCTAGACAAGCT
+ATTGATGATGTGCATAATTTGACTAACACCACCTTGCCATTTAGTGTTATAGGAGCTTAT
+CAAGGGATAATCCAAGACGCTGTTGCTGGTGTGGTGACAGGCTTAAAAACGCCTGACCAA
+GCTATCAATCAAACTGTGATTAAATGGTTTAAAAAGGGGTTTTATGGTTTTACAGATAAA
+GCTGGGAGAAAGTGGAGAGCAGACTCTTATGCTCGTACCGTTATCAATACTACGACTTGG
+CGAGTCTTTAACGAAGCCAAAGAAGCCCCTGCTAGGGAGTTTGGCATTGATACCTTCTAT
+TACTCAAAAAAAGCTACAGCTAGAGAGATGTGTGCACCTTTGCAACATCAAATTGTCACT
+ACTGGCGAAGCGAGAGAAGAAGGAGGGATAAAAATCTTAGCTTTATCTGATTACGGGCAT
+GGTGAGCCTGATGGATGCTTGGGAATCAACTGCAAGCACACTAAAACGCCGTTTGTCGTC
+GGTGTGAATAGTAAGCCAGAATTGCCAGAGCATCTAAAAAATATCACTCCTGCACAAGCT
+AAAGCTAATGCGAATGCGCAAGCTAAGCAGAGGGCAATCGAGAGATCAATACGTAAGAGT
+AAAGAGCTACTGCACGTTGCGAAGCAATTGGGTGATAAAGAGTTGATTAGGCAATATCAA
+TCGGATGTTAGAAGTAAACAAGATGCACTCAATTATCTGATAAACAACAATGCCTTTTTA
+CATCGCAATCAAGCCAGAGAAAAGCGTTACAATAATCCTTATACCAAAACTCAAAGTGAA
+GTCGAAGTTAGAAAAGAAAAAGCTAAATTAGATAAACGTAGGGATGTTGAAAGTGCTATA
+ATAGGAGTAGAAACTAGTGAAGGGATACCGCTAAAAATAACAAAGCATTTAGCCGAAAGG
+GCGGTGCTGAGAAATATAGCACCTATTGATATTGTCGATTCTATAAAAGAACCGTTGAAG
+ATAGCTCCTATTAAGTACGATAACCTTGATAGACCTTCCCAGAAATACATTGGTAAGTGT
+GTCTCGACAGTAATAAACCCGATAGACGGAAATATTGTTACAGTTCATGCTACTAGCACG
+AGAATCCGCAAAAAATATGGAGGAAATTGATGAAATTAAAAAGTATTTTAAATGATAGTC
+AAATCGATTTTGTCAAAAATGAACTTCCGGGATTACCTGTGGATATAGATGTTAATTCCG
+AAAAGTATGATGTTTTTTGTGAAGGTATAGAGACTTACTACCAGACAGAAAGCTTTGATG
+AAAAGTACAATATAACAGCTAAAGGTAAACTAGCTGAGAGTATTATTGATTTACTGACTG
+ATAAAGGTTATTGGTGACTAGTACACCAAACTACGACTTATTAAATCTAGAGCATTTAGC
+TAAAAGCTAGGTGCTTTTTTGTACTTAAAAAATAGGAGGGAACATGAATAAACGCATTAA
+GAAAAAACGTAAACTAGAAACAGCAGTTGTGATGCTTGTTGCAGAAAATGCCATGCAGGT
+TGAAGCAATTAAAAATCAAAACAAACAAATCATGGAGCTAAAATCAATCGTTCAACGAAA
+CGCTCTGGCAACAAACGAAGAGTTAGCGACTGTTAAAGCTGCTACTTTAGATAACCAATC
+AGTTATCAAGGCAATTGGTGACACGGTTGACTATATTAAGAAAAACTACAAACGGAAGTG
+GGGGAAATAAAGTTTAACCGTGTCGAATTCGACCCCTTTAGAAATCAAAGTCGTAGCAAT
+ACGGCTTTTTATTATGCCTTTATCCGCAGGCGTTAAAGAACGGAAATCAGCGACCTATCG
+CATTTATAGGAGGGAATGCACATGGAAAATGTGACAAACGAAAATGTCGACCAAGAGACT
+ACTGACTTGGAAAATAATCAACAAGAAGATAAAGCATTTACACAAGATGATCTCAACCGA
+GTGGGAACTAAAGAGCATTCTAAAGGCTATAACAAAGCAGTTAAAGACTTGGGTTTTGAT
+GATGTAGAGTCTGCCAAGGATGCACTAAAAGCCTTCCAAGAGTGGCAAGAGTCACAAAGA
+AGCGAGTCAGAAAAACAAACAGAAATCTTGAATGCTAAAGACAAAGAGCTTGAGGAAGCT
+CGGGCAAACAATAAGGCTCTTAATGCAAAGCTAGCAGCAATGTCTTTAGGTGTGAACGCT
+GAATCTATTGATGATGTGATTGCACTATCTGAGCGTCTTGTCACTGACGAGACAAGCATA
+GAGGATGCAATCAAAACGGTTTTGGGTAAGTATCCTCACTTTGGCCAAACAAAGGATAAA
+GCTCCCAAAATCACAGTGGCAGGCAACCCGTCTGCTGATAACGGACAAGGTTCGGTGTCT
+AAGGAAGACTTTGCAAAGATGTCTTACCAAGAAAAACTGGACCTAAAACTAAAAAATAAG
+AATCTTTATGACCAATTGAAAGGAAATTAAAAAATGGCAGTAGGAACAACTAAAATGGCA
+CAAATGCTAGACCCTGAGGTTCTAGCGGATATGATTGACGCAGAGGTAGGGAAAGCGATT
+CGCTTTGCTCCTCTTGCTGAAGTAGATACAACTTTAGAAGGACAACCAGGTACAACTTTA
+ACAGTGCCTAAATGGGATTACATTGGTGACGCAGAAGATGTTGCCGAGGGTGAAGCTATC
+CCAATGACTCAACTTGGCTTCAAAAAGACTACTATGACCATTAAAAAAGCCGGAAAAGGT
+GTAGAAATCACTGACGAAGCTATCTTATCTGGGTATGGGGATCCTGTAGGTCAGGCAGCA
+AAGCAAATCGTTGAGGCTATTGACCACAAAGTCGATGCAGACGTGCTTGATGCGTTAAGT
+AAATCGACTCAAACTGTGGAAGCTACTGCTACGGTTGATGGTGTATCTAAAGCGCTAGAT
+ATTTTTAATGACGAAGATGACGCAGAGACAGTCATTGTCATGAATCCGGCGGATGCCTCT
+ACCCTACGTTTAGATGCCGCGAAGGAGTGGTTAGGTGCTACCGAGGTTGGAGCAAATCGT
+GTTGTCTCTGGTGTTTATGGTGAAGTTTTAGGGGTACAAATTGTGCGTTCTCGCAAATGC
+CCTAAAGGAACTGCCTACATGGTTCGCAAAGGTGCACTACGTATCATGCTTAAACGTAAC
+ACAATGGTTGAAACAGACCGAGATATCACAAAAGCGATTAATCAAATCGTAGCTAATAAG
+CATTATGGTGTTTATCTTTATAAGGCAGAAAAAGCCGTCAAAATTACACTTAAAGATGCC
+GCAAAAAAGTAGCTAAGGCTAAGGCTGCCAAGAGAGAGGAAGATGACGCTCTCGAGTCTT
+AGCCGATGGAGGTGGTTATTATCGCTTTTTTAACGCAAAAAGAATTTGAAGATTTGGGTT
+TTGACGAGGTAGAAGATTTTGAAAAAATGGAAAAACGTGCTAGCCACGCTGTCAATCTTT
+ACTGTCGTAATCGCTATGATTACAAAGATTTAAAAAAAGAAATAGCCCTAGTGCAAAAGG
+CTGTAAAGCGGGCAATCGCTTATCAGATAGCATATTTAAATGACTCAGGAGTAATGACAG
+CAGAGGATAAACAATCCTTTGCTGGAATATCTCTAGGACGGACAAGTATTAGCTACACTG
+TCGGGCATGGCCAAGGCAGCCAACAAAAAACTCTGGCAGACAGGTTTAATCTCTGTCTAG
+ATGCAGAGAATGAGTTACTAGCTGTTGGGTTGGGATATACGGGTATTAGCTATGATCGAT
+AAAAGACTGCTTATTGACGAACTGCAGGTAAAACTTGTCAAAGATAAAGGTGATTATGGA
+GGGTTTGTCTATGACGAACCTTTTACACTCTCTCCCGTTAGGTTTGACCGTAATCTTGCA
+ACCGCAGGTAAAGATAATGCAAGGCAAGAGACTAAGCCGTCGGTTATCTTTATTTATCCT
+AAATACTGTAAGACAGTAGCCGATAGGTCATGGGTTGATGCTGTTGTCATTGATGGTGAT
+ACTGAGTACACCGTTGATAAAGTGATACCAGTCTACCACCCACTAACAAACAAAATTTTT
+TGTTTTGAAGTGGAGGTTATCTAATGGCTAAGGTAGTGGTAGAGTTGGGAGGCATCAAGC
+GTAAAGTATCTCCGCAAGCATTAGCTAAAGGAAAGCTCATCATGAACAACCAAGTCATGA
+TGTCCATGAACCCTTATGTTCCTTACAGAGACGGAGCTTTGAGAGGAAGCTCGAGAGCTA
+ACAGTGTAGGTGTAACGTGGAGCGGACCACACGCCAGAGCCCAGTTTTATGGTGGTGCTT
+ACAACAAGTACAAGTCCTTTAAATTTAAAAAGTACACAACACCAGGTACAGGCAAACGTT
+GGGATAAACGTGCGTTAGCTAATGCAACAATTGTCAAGGATTGGGAAAAATCCTTACTGA
+GAGGAATGGGATTTAAATGACAAATGACTTTGCAACTGTTTTGAGGCAATTTGTCGAAGG
+ATTAGACTTAGGCATAAAGCCCAGACTTGACTATCTAACAAGACAAGAAGATTTAGCCAT
+TTATCCAATGCCAGGTGGGAAGGTAAATAACGAGTACATGGACGGTACTCGTGAGATAAG
+CCTGCCTTTTGAGATTGCAATCAAAACTAAAAATCAGGAGTTAGCAAGCACTGTGATGTG
+GACTATTAACAGTGCTTTGTCTAACTTTGACTTAAAATTACCAAGTCTTAATCATTCGTA
+CACATTTATTAGCCTTGATGTCGAAAAGCCGTTTTTAAATGACTTAAGCGATCAAGGTTT
+TTATATTTATGTGCTGGATATTACAGCACACTTAGAAATAGAAGGGAATAACTAATGAGA
+CAAAAGAACGCCCTACGTGGGCATTTTATCGCACCTTATGTAAAAGGTGAGGAAAAGACA
+GAAGTTACAAAAGAGAAGCTTTTGGAATTGGCTAGATGGATTAAAGACATCTCAGACGAT
+ACCGACGAAAAGACAGAAGATGAGGCGTACTATGACGGAGATGGAACAGAAGAAACAACC
+GTTGTAGGAGTTAAGGGCGCGTACACTTTCGAAGGGACGTATGATCCAGAAGACAAAGCT
+CAAGCTCACATTGCAAGTCTTAAGTATAAGCTAGGAGATGAGCGAAAAGTTTGGCATTTG
+ATTGTATCGGCTGATGGGAAAACCCAGTGGCTAGGGGTTGCAACAGTGACAGAAATTATT
+GCTGGTTCTGGTGCTGCCGCCGATTTTGAAGCCTTTGGTTGCAAGATTACTTATAACTCT
+CTGCCAAAGGAAAGCAAGGAAATTATACCTAAAAAAATGAATTGAGCGTAGCGATGTGAG
+ACAAGGGTGGGCTAAACCACCCTTTTAAGGAGGAATTATGTCTGGAATTGTAGTTGACCT
+AAAGCGCACAGGGTTTCCGGTCAAAATTGGGCAGGTAGAGCTTTGGTTTGATACAAGCCA
+AGAGCGATTGATTGAGTTTTTTGATATTGAGACAGAAGTAAATCGTCGCCTCAATGAATA
+CGAAAAACAGGTTATCGAAGCCAACTTAGACAACGAAATTGAAGATAAAGGGGTTACGAA
+AGATGTTGCCCAAAGTGCTTTAGATTTGGAAGCTAAATACTTAGAAATCAATTATGATCT
+ACTATTCGGAGAAGGTACATTTGCACAGCTCTACGCGGAGTATCCCGACAAAGAAGCACT
+CGAGAATACTCTGGAAATTGTTTGCAGGGAAATCGAGGTCAAACTCAAAGAGTTAGCTAT
+CGAAAGAGAAAAAATCGTTAAGCAGAAAACGAAAAAGTACAAAAAGGAGTAGCCTATGAA
+ACTAAACGATCCATTAGTAGAGTCGTTTGAGTTTAGAGGTGAAATCTATCCTATTGATTT
+GAGCTTTAACAAGGTTTTAGATGTCTTTGATGTTATTGATGATGATTTTTTAAACGAGGC
+GGAAAAGTGTTTTTTGTGCCTTGATATTTTGCTAGATAGGACAGATTTACCTTTTACTTA
+CGCGGTGGATCTTTGGGTTTATATCAAAACCAATTTTATCGATGCAGAAAGGCCCGAGAA
+ACCTCAGCTCGACATCAAAGGGAATCCAATGCCTGTAGTAAAAGAAAAAGAGGATAACAA
+AAAAGTCATTGATTTGAGTTTAGACGCTGAGTTTATCTATGCGAGCTTTAGGCAAGCCTA
+CCAAATCAATCTTTTAAAAGAGCAAAACAGATTGTCTTGGATTGAATTCAAGGCTCTTTT
+AAATGCTCTTCCAGACGATACTGTCATGCAGCGTATCATAGCCATTAGACAGTGGGAAGA
+TGATGGTGAAGGCAGTAAAAAATACAGAGATAACATGCGTAAGCTAAAGGCTAAGTACAG
+TTTAGATGAAAGAGAGGAGGAGGACGATGGCAGCTGATGGTAAGGTAACGATACTTGTTG
+ACGTTGATGGTAAGCAGGTAAAGGTACTCAATAGTGAGTTAGATAAAGTTGCCAAGCACG
+GTGACAAAGGCAGCTCCTCTCTTAAAAAATTTGCGGTTGGTGCAGGAGTCTTTAAATTAG
+CTTCGGCTGCAGTTGATTTGGTTAGTCAATCTCTTGGCAAGGCTATCACAAGATTTGACA
+CGCTTGAAAAATATCCAAGGGTCATGAAAGCTATGGGGCATAGCGCTGAGTATGTTGCTA
+GATCAACTGATAAGTTAGCGAACGGAATTGATGGACTACCAACAACTTTAGACGAGGTTG
+TCGGAACCGCTCAACGTTTGACCTCTATTACTAAGGATATCAATAAATCAACTAATCTCA
+CACTAGCATTAAATAATGCCTTTTTAGCTTCAGGAGCTTCATCAGAGGCTGCAAGCCGAG
+GGCTGGAGCAGTATGCCCAAATGCTATCAGCTGGTAAGGTTGATATGCAAGCTTGGAAAA
+CCCTCCAAGAAACAATGCCTTATGCCTTGCAACAAACTGCGGAAGCTTTTGGATTTGCAG
+GGGCATCAGCTCAAAAGGATTTTTATGAGGCATTAAAAAACGGGCAAATAACATTTGACC
+AATTTTCTAATAAGTTGATTGAGTTAAATGATGGTGTCGGCGGTTTTGCAGAACTAGCCA
+AAGAAAATAGTAAAGGGATTGAAACCTCTTTTAACAACATCAAGAACGCTATTGCAAAAG
+GTGTGGCCAACAGCATTAAGGCTTTGGATGATTTATCTAAGGCTGCAACAGGTAAGGGCA
+TAGCTGATCATTTTGATAGTTTGAAAGTTGTTATCAATGCCTCTTTTAGCGCCATCAATG
+CAAGTATTAAAGCTAGTACATCGCTATTTAAACTTTTGTTTAGTGTTATTGGTGCTGGAA
+TATCAGTCGTCAAAGCTCTGTCGCCTGCCTTAGTTGGTGTAGCATCTGGTCTAGCTGCCA
+TGAGGGCAGTTAATGAGACTATAACAATGATTAAAGCGCTAAATAGAGCTTGGGTTATGG
+CATCTGCATCAATGAGTATTGGAGCAACAACCATTAAGACTGTGACTGCGGTACAAGCGG
+TAAGTACCACGATGACTAAAGCAGATATGGTTGCAAGACTATCTCAGTTAGGTGTCTTAA
+AAGCCAGTACCGTGATTTATGGTGTTATGACAGGCGCTATCAGTTTATCTACTGCTGCAA
+CCATAGCCAGTACTGCTGCGGTAACTGCGTTAAAAGCAGCACTTGTAGCCTTAACAGGTC
+CCGTTGGTTGGGTAGTTGGAGCTATCGGTGCTTTAGTTGCTGTCGGAGTAAGCTTATGGT
+CATGGCTAACTAAAGAGTCAGACGAGACCAAAAAGCTGAAAAAAGAGCAGGAGGGGCTAG
+TCGAAAGCAACAAACAGCTAAGAGATTCTGTCCGTGAGGGCGTGCAAGAGCGTAAGAAGG
+GCCTTGAGTCCGTCAAAGAGAGCACTGCAGCTCATCAAAAATTAGCTGACGAAATCATTA
+AGTTAGCCGCCAAAGAAAACAAAACTGCAGGCGAAAAACAAAACTTAAAAAATAAGATTG
+ATCAGCTTAATGGGTCTATTGATGGCTTAAACTTGGCCTATGACAAAAACTCCAATTCTC
+TTTCTCACAATGCAGATCAAATTAAGTCACGCATTAGTGCCATGGAAGCAGAAAGCACAT
+GGCAAACAGCACAACAAAACCTGTTAAATATTGAACAGAAACGTAGTGAGGTTAGTAAAA
+AGCTAGCTGAAAATGCCGAGCTACGTAAAAAGTGGAATGAAGAAGCTAACGTCTCCGACT
+CTGTCCGAAAAGAAAAGATTGCCGAACTCACAGAAGAAGAGGGTAAGCTTAAAAATATGC
+AGACTCAATTGCAGGAGGAGTATAACAAGACATCAGCTACTCAACAAGCTGCTGCAGACG
+CTATGGCTGCCGCTGAAGAATCAGGATCAGCAAGACAGGTTATAGCGTACGAAAATATGT
+CAGAAGCTCAACGAACTGCCATAGACAATATGCGCACTAAGTACTCTGAACTTTTAGAGA
+CAACGACATCTATTTTTGATGCTATCGAACAAAAGACTGCTCTGTCAGTGGAGCAAATGA
+ATGCCAACCTTGAAAAAAATAGAGCTGCTACTGAACAATGGGCTACGAATTTGGAAATTT
+TAGCTCAGCGTGGTGTAGACCAAGGCATCTTGGAACAGCTTAGGCGGATGGGACCTGAGG
+GGGCAACACAGACACAGGTTTTTGTGGATGCCACAGATGCCGAGCTAGCACCCTTGCAGG
+AAAACTTTAGAGCAGCCACAGAAACTGCTAAAAATGCAATGGGGAGCGTTTTAGACTCAG
+CAGGTGTGGAAATGCCAGAAAAAGTTAAAGGGATGGTCACTAATGTTTCTACGGGATTAC
+AGGCGGAACTGCAAGCTGCTAACTTTGCTCAACTTGGTCAAGAAATCCCTAATGGGGTTT
+CTCAAGGTATAAGTCAAGGGGCAGGTAAAGCAAGTGACGCAAGTGTCAAAATGGGTCAAG
+AAGTTAAACGCTCTTTCCAAGGAGAGTTGGGTATCCACTCGCCATCGCGAGTATTTACTG
+AGTACGGTGGCCATATTACTGATGGCTTGAGTAATGGTGTGACAAATGGAACGTCAAAAG
+TTATGCAAACCATGCAGAGCTTGGCTCAACAGATGTCTCAAAAAGGACAGCAGATTGTTA
+ATGACATGCGTAGCAAGTCGAACCAAATCACAGATGCTTTTAGCACGATGAGTGGTCCAA
+TGCACTCTCATGGTGTTAATGCCATGCAAGGTTTGGCCAATGGTATTTATGCAGGGTCGG
+GGGCAGCTTTAGCGGCAGCTCAAAGCATTGCGGCACGTATCACCGCAACAATTCAAAGTG
+CCTTAGATATCCACTCGCCATCTCGTGTTATGAGGGATGAGGTTGGACGTTTTATCCCTC
+AGGGTATCGCTGTAGGTATTGATGCGGATAGAAAAGTCATTGACTCATCTATGCAAAAGC
+TAAAAGAGTCAATGACGATTAATGCGACCCCAGAAATAGCCTCTGGATTTGGCGGAGGAG
+TTGCGGGGATTGCTAATCAGACCACAAATAACTCAAATAACAGTTTTACCCTTAATGTCA
+AGGTTGATGAATCCGACGGTAATAGCCGCGAGAAATATCAACGCTTATTCAGAGAATTTA
+GCTGGTATATTCAACAACAACAAGGAAGGTTAGGTGATGTTAAATGACAGCTTTTATCAA
+GTTTGATGGTAAAAAATCTTCAGATTTTGATTTGAGAATTATTAATGACGTTGAGCATGA
+CTCGTCCTTTTACGATGTTGATCAAGTTAAGGTACCTGGTCGTGATGGTGTGGTTTTAAA
+GGACAATAAAAGGCTTGAGGCTATTGAACGGTCTTACCCTTTACGTCTATATAGCAAAAG
+ACGACTCACCGAAGTAGAAACTGACATAAGCAATTGGCTGAATGTAAAAGGTTGGAAAGA
+CTTAGAGTTGTCATGGGAGCCTGATTATATCTATAAAGCAACACATATCACCCCTTTTAG
+CATAAAGGAGGTTTTAAGGAATTTCGGCAGACTGAAAATCAACTTCTTAATCCACCCTAT
+CAAATATTTAAAAACAGGTAAGCAAGAGGTGCCTCTCGTTAATGGCGGTACTCTACAAAA
+TCCCGGCAATGTTCAAGCTAAACCTATCCTAAAAATCAAAGGCACAGGCAATGGTATTTT
+AACCATTAATGACTTTGAGACAGGACTTGAAAATGTGCAGAGCGAGCTTGTTATAGATAT
+GGAAAGGCACCTAGTCTATAAAGATGTCCTATCTGCTTGGGATAATATCGTAAGAACAGA
+ACGCCACCGCATGCCGTTATTTGACGTTGGACAAAATAAAATCTCGTGGACTGGTAGCTT
+TACAATTACCGCAGTGCCAAACTGGGGGGTTAAAGTATGATACCAGTTTTGTATGAGGCT
+AAGGAAACCAAGTTTAGGACTTTTGGTCTCGGTGAGATTGCGGATGCTTATGAGGTTAAA
+GCCACTCGTGAGCGCAATGGTAATTACTCACTGTACATCAAATATCCGCTAGATGGTGTC
+TTTGCCTCAGTTTTTAAAGAGGAAATGAAGATTAAGTCTGACGCTGGTCGTAGAACCAAA
+TGGCAGACTTTTGAGATTAATCGGGTACTACGAAATAGTAAAGACCACATCGAGATTTTT
+GCGCGTCATATCTCTATGCGCACACAGGATATTGCTTTAAAACCGTTTGTAAACGGTGCG
+AGCGTAGGAGCCGAATCAGCTTTAGAAATCTGGAAGAAAAACCTTGTCGGTGATGATAAG
+TTTGACGTTAAAAGCGACATCTTAACGCTTGGTAGCTTTAACTGGGAAATTGATAAAATC
+GGCAATGCCCGTGGTGCTCTAGGAGGTGTCGCTGGCTCTATCCTAGATGTTTACGGTGGT
+GAGTACGAGTTTGACAACCGTACAATCATCTTACGCAAGCAAATGGGGCGTAAAGCTCCC
+ACGGTATTGGAGTATGGCCGTAATATCGTCAGCGTAGAGGAGGAGCGATTGCTAGATGGC
+AATTACACCTCTATCTATCCTTACGTAAGATATACGCCACAACCAAAACCGCAAGAGGAA
+CCCCCTGGTAAGCCGCATGTAGGCGAGCATAAACAACCCGAAGAACAGCTAGTGACATTG
+CCTGAATTTATCCTAGATGGTCAGTATCTCAGCTTATATGCTCAGCGCAGAATCCAAATG
+GTTGATTTATCAAGTCATTTTAACGATGACAAAAATAAAAAAGAGCCAACGATCGAAGAA
+ATCCGAAAGCTGGCTCAGAAATACCTTAAGGATAATAACGTTGGTGCACCAAAAGTCAGC
+ATTGAGGTTGATTATATTGACTTGTCACAAACGCTTGACTATCAAGATTTTAGAGTCATG
+GAAGAGGTTGAGCTTTGCGACATTGTACCACTTTATTATCCAAAGTTTGGCATCACAACT
+GAGTCTGAAAAAGTCGTTGAGATTGTCTATGACGTCTATACAGATAGCAACCATACAATA
+AAACTTGGCACGATTGGTCAGTCCATCTCTAAGAGTTTGACAGGTGGGGTCTCAGAGCGT
+ATCAATGCTTTGGAAAATAACCAAAAGGTTATCACCAACAGCCAGAAGCAGTTTGAACTC
+AATCTGCCTAAATACCTCAATGACCTCAATGGTAAACGCGTTTGGTACGAAAAACCAGAT
+GACAATATTGAGCACAAGATAGGCGACTATTGGTTTGAAAAAAATGGCAAGTATCAGCGT
+ACTTGGATTTGGGATGGCAATCAATGGGTCAAGGTACTAGATACAGAGGATTTAAACCCC
+AATCAACGAGCTTTTGATGCCGCAATAGCCGAACTCGAAAAAGCAAAAAAAGCGCAAGAA
+GAAATCAACCAGCGTACTGACAAAGAGCTTGAAGAATTTAGAGCCACCCTCAAAAACCTA
+GCTTTACCAGAAGAAGCGATTAAAAAAATCACAGAGGCTATCAAAGTTGATGACATCCCG
+TCTATTAAACAAAGCTTTGATGACCTCAAAAATAGAGTGAGTGAGACAAGCGAAGAATCT
+CGTTTAACTGCCGAAATTTTAGGAAACAACGGTAAAACCCGCTACAACAAAAATTTATTG
+GTTGGTGAGCCTAATCGCACGAAGTCTTACGACCAGGATTACATCGAGGTAGAAGCCAAC
+GACGGTGGTTTCAAGCGTGGCGAGACCTATACGATTAGCTTTAGCCAGACATGTGAGCCA
+CTCAAAAAAGTGGCTATCACGCTGACACAGGCTAACAACAAGGGAGTTAAGTTAGTGCTG
+ACACCAACTAAAGCAAAAATGGAGTCGCAGACCTTTGACCTCACTAAAGATAAAGAGGCT
+ATCAGTGTTTATCCGTTTAGCTACACAGTGCTTGTAACCAGCGACTGGTATAAATCTAAG
+CAGATAGATTTAAACGCGTCGGAGGTGAAGGAATTGGCTCTGGAGATGGATTATAAAGAG
+ATTGCAGATGCCAAAGGTGCAACTATCACAGGGGCATGGTCAGACAGTCCACAAATTATA
+TTAGACGGAGGTAAAAAATGAGTGAAAATATACCGCTGCGAGTCCAATTTAAGCGCATGA
+AAGCCGCCGAGTGGGCTCGTAGTGATGTCATCTTACTGGAGAGCGAGATAGGCTTTGAGA
+CAGACACAGGTTTTGCCAGAGCAGGTGATGGCCACAATCGATTTAGTGACCTTGGATACA
+TTAGCCCACTCGATTACAATCTACTGACTAACAAGCCAAATATCGATGGATTAGCGACAA
+AAGTCGAGACCGCTCAGAAACTACAACAAAAAGCAGATAAAGAGACCGTCTATACAAAAG
+CTGAATCGAAGCAAGAGCTTGACAAGAAATTAAATCTCAAAGGTGGCGTTATGACAGGTC
+AACTAAAATTTAAGCCAGCCGCCACTGTTGCTTATTCCTCGTCAACGGGTGGAGCGGTCA
+ATATTGACTTGTCGTCTACCAGAGGTGCTGGTGTTGTTGTCTATTCTGACAATGATACCA
+GTGATGGGCCGTTAATGAGCTTGCGGACGGGTAAAGAGACCTTTAATCAATCGGCGCTTT
+TTGTCGACTATAAGGGGACAACAAATGCTGTTAATATTGCGATGCGTCAGCCAACCACCC
+CCAATTTTTCATCGGCGCTTAATATTACTAGCGGCAATGAAAATGGTAGTGCAATGCAGC
+TACGAGGGTCAGAAAAAGCGCTAGGAACGCTAAAAATTACTCATGAGAACCCAAGTATTG
+GAGCGGATTATGATAAAAATGCGGCAGCGTTATCCATTGATATTGTCAAAAAGACAAACG
+GTGCAGGAACAGCCGCTCAGGGAATCTACATTAACTCAACCTCAGGCACGACAGGGAAGT
+TGCTTAGGATTAGAAACCTTAGTGATGATAAGTTCTACGTCAAGTCTGACGGTGGTTTTT
+ATGCCAAGGAAACTTCGCAGATTGATGGCAACCTGAAACTCAAGGACCCCACAGCGAATG
+ATCATGCGGCAACCAAAGCTTATGTAGATAAAGCAATTTCTGAGTTAAAAAAACTCATAC
+TAAAAAAATAGATTAAGGAGGATAAATGAGCAGAGACCCAACACTTATTTTAGACGAGTC
+AAACCTCGTTATTGGTAAGGATGGACGTGTGCATTACACATTTACCACAGAGGACGACAA
+CCCAAAAGTCAGACTAGCTAGCAAGTGTCTAGGCACAGCGCATTTTAATCAGCTCATGAT
+TGAGCGAGGAGACCAAGCTACTAGCTATGTTGCGCCAGTAGTAGTTGAGGGTACAGGTAA
+TCCGACTGGACTATTTAAAGACCTCAAAGAGATTAGCTTAGAGCTGACAGATACTGCTAA
+TTCCCAGCTTTGGTCAAAAATCAAGCTGACTAACCGTGGTATGTTGCAGGAATACTACGA
+CGGTAAGATCAAGACCGAGATAGTCAACTCCGCCAGAGGTGTCGCTACACGTATCAGCGA
+GGATACTGATAAAAAGCTAGCGCTCATCAATGACACCATTGATGGTATCAGGCGTGAGTA
+TCGAGATGCTGATAGGAAGCTATCCGCAAGCTATCAGGCAGGCATCGAGGGGCTAAAAGC
+CACAATGGCCAATGATAAAATCGGTTTACAAGCTGAGATTAAAGCCTCAGCACAAGGGCT
+ATCGCAAAAGTATGATGATGAGTTGCGCAAGCTATCGGCTAAGATCACAACAACCTCAAG
+CGGCACTACAGAGGCCTACGAGAGTAAGCTTGCGGGCTTACGTGCTGAGTTTACTCGCTC
+AAATCAAGGCACGAGGACAGAGCTCGAGTCACAAATTAGCGGGCTAAGAGCGGTACAGCA
+GTCAACAGCTAGCCAAATCTCTCAAGAGATTAGAGACCGTGAAGGTGCTGTCAGTCGTGT
+GCAGCAGAGTTTGGAGAGTTACCAAAGGCGGATGCAGGACGCAGAAGAAAACTATAGTAG
+CTTGACCCATACGGTTAGAGGGCTACAGAGCGACGTTGGATCTCCGACTGGTAAAATCCA
+ATCGCGCCTTACTCAACTAGCAGGACAAATTGAGCAGCGGGTTACTAGAGATGGTGTCAT
+GAGTATTATTAGTGGCGCTGGAGACAGCATTAAATTAGCTATCCAAAAGGCTGGCGGCAT
+TAATGCCAAAATGTCTGGTAATGAGATTATCTCAGCAATTAACCTCAACTCCTACGGAGT
+AACAATCGCAGGTAAACACATCGCTCTCGATGGGAATACGACGGTTAATGGCACCTTTAC
+CACAAAAATAGCCGAGGCTATCAAGATTAGGGCTGATCAGATTATTGCAGGCACGATTGA
+CGCTGCTAGGATTAGAGTGATTAACCTTAACGCAAGTAGTATCGTTGGTTTAGACGCTAA
+CTTTATCAAAGCTAAAATTGGCTATGCTATCACTGATTTGCTCGAGGGTAAGGTCATTAA
+GGCTCGTAATGGAGCGATGCTTATCGACTTAAATACAGCTAAGATGGACTTTAATAGCGA
+TGCCACAATTAATTTTAATAGCAAAAACAATGCCTTAGTACGTAAAGATGGCACACATAC
+TGCCTTTGTACATTTTAGTAATGCGACGCCCAAAGGTTATACAGGGTCAGCGTTGTATGC
+ATCGATCGGGATAACCTCATCTGGTGACGGTGTTAACTCGGCTTCTTCCGGTCGTTTTGC
+AGGGCTAAGGTCATTTAGGTACGCTACGGGATATAATCACACTGCGGCAGTCGACCAGAC
+TGAAATTTACGGTGATAATGTTTTAGTTGTGGATGATTTTAATATTACTCGGGGATTTAA
+GTTTAGACCAGACAAGATGCAAAAAATGCTTGACATGAACGACTTGTATGCGGCTGTAGT
+AGCCTTAGGCCGCTGTTGGGGGCACTTGGCTAACGTCGGCTGGAATACTGCTCATAGCAA
+TTTTACAAGTGCTGTGAATAGGGAATTGAATAACTACATCACAAAAATTTAACAGGAGAT
+AATATGCAATTAACTATTAAAAACAAAGATTTAAACACACTATATCGTGTACTAGACAAA
+ATCAAAATCACTAATATGCGTGCTAATCGTGGCCGTGCTAAGCTACTCGCAAAAGTAGTC
+GATAAAATCAACGAGTATGCAAAAGATGAGACCGACTTAATTGATATGTATGCAGCTAAG
+GATAAAGATGACAAATTTGTCATTGATGAGCACAAAAACATCAAGCTAGCAGACCCCGCT
+AAACTCGACGAGCTCAACGACCTACTCAACGAGCTAGCAGACGAAGAAATTGTGATTAAA
+GGGGGTGAGTACTCCAAGCGATTTATTGACTTTTTAAACTTTTTAGAAGAGTGTGAAGAT
+GAATTTACATCATCTGAAATCATTCTTATCGACAACATTTTGGAACAATTTGAAGAAAGT
+AAAAAAGGAGAATAACCATGAGAAATTGGAAAGTGACAGGAAAATACCCACAATTTGACA
+GCACAGGAGCAGTCGCAAGCACACATATTATTATCACTGCTGAGGATGGCTCAGTCATCT
+CTCAACCAATCAAGCAGGACTTAACCTCAACTAATGACACAGAGATTATCAAAGCTACTT
+TGGAAGAATTTAAAAAATCTGAATACGTTGAAATCGCTATGGGCGAAGCCGTGCAAAAAG
+TAGACGACCTTGAAAAAATCTCACAGGAAACCGCTAAGACCGCTAAAACAGCCCAAACAG
+CCGCAGGATTAGCTAAGGTGTCCGCAGAGCGTACACAGCGAATGATTAACTTGCAAACCA
+TCCACATGTTAACGAGCGGCGGCAAGATTGATTCTGACATTTATAAAGGCATGCTTGAGC
+TAATCGAGCCAGCCCAAAAAGGTGAGTATCAAGCCTATGATGTCTTTACGGTGGTCGACA
+GTACTAAAGAGGAAGACGGAGAGGCTGGTGAAGGTAACCTAGTCTTCGTACACGTTAACG
+AAGCATTTGAGTATGACAAACAAACCTTAGAGGAGCTAGAGTCAGAAGCCAAAGTAACAG
+TTATCAAGTACGCTGATTTGGTTAAACAAGATTAGAGGTGGTTTATGGCAACAGAGTTGA
+TATTTGGCGTTGGTGGCTTTATTTTAGCTATCGTCACGACTTACAATATTTTTAATGCAA
+AATCCATCAAGCATGCGACAGATATTACTTTGTTGCAATCTGAGGTAGAGCATTTAAAAA
+TTGTTACACGCCAAAATGCTCGGCGGCTTGAAGAGCACGCTGAGCAAAATAAAACGTTGA
+TTACAATGACAGAGCAAATTAAAAATTTAACAGATGATGTTAAAGATTTAAAAGATATGA
+TGAGAGGAGAAATCAAATGATCAATTTAAAATTACGACTACAAAACAAAGTAACCTTGAT
+GGCTATTTTGGGAGCTATCTTTTTACTGGCACAGCAATTAGGTATTAAACTACCATCAAA
+CATCGCAGATATTGCAAACACAGCTGTAACGCTTTTGGTATTGCTCGGTGTTGTCACAGA
+TCCAACCACGAAAGGCCTGTCAGATAGTGAGCAAGCATTGACTTACCATGAGCCCAAAAA
+ATAGGAGGAGCCATGCGAGCAATCACACGATTAGCGTTAATACTAGCAATCGCAATACTG
+TATGTGCCATTATCTGTGGTTGCTCTTATCTTTTATCCGTTTTTAGATAAGGAGGACAGA
+TGACCTTTTTAGATAAAATTAAACAAGGCTGTTTAGATGGCTGGGCTAAGTACAAAATCT
+TGCCATCCTTGACCGCAGCACAAGCTATCTTAGAGAGCGGGTGGGGCAAACATGCCCCAC
+ACAACGCTCTGTTTGGTATTAAGGCAGATAGCTCTTGGACTGGTAAATCATTTGATACCA
+AAACCCAAGAGGAATATCAAGCAGGTGTTGTCACGGATATTGTGGACCGATTTAGGGCGT
+ATGATAGTTGGGATGAGTCGATAGCTGATCACGGACAATTTTTAGTTGATAATCCACGCT
+ATGAGGCAGTTATTGGGGAGACTGACTATAAAAAGGCTTGTTACGCTATTAAAGCAGCTG
+GATACGCTACGGCAAGTAGCTATGTCGAACTTTTAATCCAACTGATTGAGGAAAACGACT
+TACAAAGTTGGGATAGAGAAGCTCTTAAAAATAATAAGGAGGAAACGATGACAACCGCAA
+ACGAAATTGTACAATACTGTGTTAACCTTGCTAATTCAGGCATGGGTGTTGACAAAGACG
+GTGCTCACGGGACGCAATGCTGTGACTTGCCTTGTTTTGTCGCTAAAAATTGGTTTGGTG
+TTGATCTTTGGGGCAATGCGATTGATTTATTAGACAGCGCAAGTGCGCAAGGCTGGGAAG
+TCCATCGTATGCCAACAGAGGCAAACCCAAAAGCAGGCGCTACATTTGTCCAATCAGTGC
+CGTATCATCAATTTGGACATACGGGAATTGTTATCGAGGATAGTGACGGTTACACCATGC
+GCACTGTCGAGCAAAACATTGATGGCAATCCTGATGCTTTGTATGTCGGTGCACCAGCTC
+GTTTTAACACTCGTGACTTTACTGGCGTGATAGGTTGGTTTTACCCACCATATCAAGGGG
+ATACAGTCACGCAACCAGTCAGCACCGAGCCGCAAACTTCTGACACTATCGTAGAGACAG
+CAAAAACAGGCACCTTTACCCTTGATGTTGCAGAGATCAATATCAGACGCTGGCCAAGTC
+TAGCCAGCGAGGTTGTAGGTATCTACAAGCAAGGTGATACTGTCAGCTTTGATAGCGAGG
+GCTACGCTAATGGCTATTATTGGATTAGCTATGTTGGAGGCTCAGGTATGCGTAACTACC
+TAGGTATTGGACAGACTGATAAAGATGGGAATCGCATCAGCCTTTGGGGTAAATTAAATT
+AGGAGGTAAAGCTCCGAGATAAGACAAAACCGCTCAGATTATTCTGGGCGGTTTTTTGTG
+TATGATGAATTATTTTTCAAGATAAATATCGAAATGACTAAAGTTCTTCATATTGATAAT
+TCTATTATCTTTATATTTTGCAAAAATATCTGATCTAGTCCCTTCATTTGGTGAGTCAAA
+TAAGTCTATTTGCTCATGTTTCCCATCTTTTGTGCCAATTTCGATTCTGCCGCTTACATA
+AGGAGAAGTAGCGTCATAAATTTTATAATTATCCATAAGGTATTTTCTGATTTTAAAGTC
+AATTTCCTGGAAAGTTACGATATCTTTTTCTAGAATAATTTTGTTATTTAAGTTCTGTTG
+AGATTCTCCCGAAATAAATAGATTTCCCAATAATTTATGATTTACTTTATTATTTTGAGC
+AGGCGTAATTCCTCCATAGATGTACTCACCGGTGTGAGAATTAAGAATATAAAATAATCC
+AAAAACATCTACATGATCATCTCGTTTAAATTTTTGAGAGGCCTCATAAGACATTTCGGA
+ACTAATATAATAGTCTTTCCCTCTATATTTTTGAGTATCAATGTTTAATGTGTGTGTCGT
+TGAAAAATTTACCCTGCAATTTTTATAATCATAAGGAGTTATAGTGTATGCATAAAGTAA
+ATCACTTTTAACATTCGAAATGTCTTTCTTAGAGTCACTTTTGATGATAGGTGAAATAGT
+AGAAATCAGTATGACTGTAATTATGAAAACTATTTTGATGATGTTAATCTTTTTCAT
+>NC_002737.2|provirus_777501_820593
+ATGTATAAAAATATTATCGTAACTGGTGGAGCTGGTTTCATCGGATCTAACTTTGTGCAC
+TATGTCTACAATAACCACCCAGATGTTCATGTAACTGTCCTTGATAAATTGACATATGCA
+GGTAACCGTGCTAACATTGAAGCTATTCTTGGTGATCGTGTTGAGTTAGTTGTTGGTGAT
+ATCGCTGACGCTGAATTGGTAGATAAATTGGCTGCCAAAACGGATGCTATTGTTCACTAT
+GCGGCTGAGAGCCACAACGATAACTCATTGGAAGATCCAAGTCCATTTATCCATACAAAC
+TTTATCGGAACTTACACTTTGCTTGAAGCAGCTCGTAAATACGATATCCGTTTCCACCAC
+GTGTCAACTGATGAAGTTTATGGAGATCTTCCACTTCGTGAAGACCTTCCAGGACAGGGT
+GAAGGACCAGGTGAAAAATTCACTGCTGAAACAAAATACAATCCATCATCACCTTACTCA
+TCAACTAAGGCAGCTTCTGACCTTATCGTTAAGGCATGGGTACGTTCCTTCGGTGTGAAA
+GCGACCATTTCGAACTGTTCAAATAACTATGGACCATACCAACACATCGAAAAATTCATT
+CCACGTCAAATTACAAATATCTTGGCAGGAATCAAACCAAAACTTTATGGTGAAGGTAAA
+AACGTCCGTGACTGGATTCATACTAATGATCATTCTACAGGAGTATGGGCTATTTTGACT
+AAGGGTCGTATCGGTGAAACATACCTTATTGGTGCCGACGGCGAGAAAAACAACAAGGAA
+GTTCTTGAGCTTATCCTTGAGAAAATGGGTCAACCAAAAGACGCTTATGATCACGTAACT
+GACCGTGCTGGTCACGATCTTCGTTACGCTATTGATTCTACAAAATTGCGTGAAGAACTC
+GGCTGGGAACCACAATTTACAAACTTTTCAGAAGGTTTGGAAGAAACTATTAAGTGGTAC
+ACAGAAAATGAGACATGGTGGAAAGCAGAAAAAGATGCTGTAGAAGCCAAGTATGCTAAA
+ACTCAAGAAGTGATTAAATAAAACATTAAAGAACCTTGTCATATCAACGTTTGTTGAAGA
+TATCAAGGTTTTTTCTTGTGTTTTGGGGCATTTTTGGGGCATATTTGGGGTATATTATAG
+CCGGTTTAAGATGTCGACGACTTCATTTTTCATGCTTTTCGTGACGTGGGTATAGATTTG
+TTGAGTAGTTTTCGAGTCAGCATGTCCAACTCTATCCATGATAGTTTTTAAGGGCACTTT
+GTTTTCTGCAAGGCGACTCACCAGGGTGTGACGGAAGATGTGGCTGGTGAGTTCTTTTTG
+AATCGGTTTTTCTAGTCTCTTATTTGCCGCTCTGATAGAGGTGTTGAGGGCGTTGTCTTG
+AATAGGAACACCATTTCTGGAAATGAAGATGTAGCCCATGTCCTTGTAATTAGGATTAGT
+ATTTTTTTCAAGAGCATTAATTTTCAGTATATCCTGAATAATTTCTTTTTCACGTTTGGT
+TATCAATGTTTCACGCCAACTGGAATTTGTTTTAGGGGTGGTTTTGATAGCGTTTCTATA
+GCCATTTGAGGTGTAGTCAAGAGTTCCGTGGATTTCAATGATATCATTTTTGATATTGTC
+TGGCTGTATAGCTAGAGCTTCTCCAATGCGGCAGCCATTTAAGCTCATAAATTCTGCCAG
+ATAAGCCATTTTAATCGATCCTTTACGTCTATACATTTCATCTAATAGCCTTTTGAGTTC
+ATCTTTTTCTAAAAACTTCTGGGCAACGTCTTCAAAGTCTTTGATGGTCTTAACAGGTTT
+TGCGAGTTGGGTACTAATAACTGGATTGATTGAGACATACTCTAAAGCGATAGCGTAGTC
+GAAGGTTTGTTTGAGCAGCTGCCGTGCTCGTTTACGTTTGTCATAACTACCTGGTATTTT
+GTCGATAATACTTTGCAGGTATTTCGTGGTTATCTTGGCAATCATCACTTCTGGATCAAT
+TAAGTTTCGCAATTCTCTTATTCTAAAATCAAGAGAGCGGACAGAAGTTGATTTGAGTGA
+TTTCTGATGATGTTCCCACCATTCGTTCATGACATCTAGTAGGTAGGCATCGGTTGTGGT
+AAGACTTGTTAAGATTTTAGATATTTTTTCGTCAAGATATTTTTGGGCTTCTTTTCGTAT
+TCGTGGCGTGTCTTTTTCCATAAGGACAGAAGCTCTGCACCACTTGCCAGTGTATGGGTG
+TTTGTACCGTTCTACAAAATTTACTTTTCCGCTTTTGTGTTTTTCTGACCACATTGTTTT
+TTACCTCATTTTCTGTTAAAATAGGTATAGTAAAGAGACCTACGGCAAAGCAGGTTTTTA
+CTATACTAGATTTGCCTCGCGCTCAGAGTCGCCAAACTTTGAGAGCGTGGGGCTTTTTTA
+TTTTTCTAAAACAAAAAAGAGCACTTATTCGAAAACAGGCGCTCACAGTGGAGTTGGACA
+CTCCAAAATAATGTTTCAGTGGTAGCGAGGCTACCAAGATTACACCTTAATTCTAACATA
+GTGATATTTAATTGTCAAGTTTCCCCCACTGGCCAGATAATAACTGCCTTGCGAGAGCTT
+TATCAATGTTGTCCATGATTTCTTTAGACAATGTTATTTTTCCGACAGGGTCAAGATCGT
+TAATTGGTTTAGCGATTTTTAGTTTACTGACAGAAGTGATTGAGTCCAGCTTGGCGTAGG
+ACACCTTGTCATAATTTGCATATCTTTTTTTGAGGAAGTTAATTTTGTCTAAGTCTGATT
+GTATCCATTTTCGGACGGTAATGTTTGCTACGGGGACATGAATCCCTTTAGGGTCATTCC
+TATTGTAATATTTCATCCATATATCATGATATTTATTTTCTTTTTTAATCTGAAAAAACG
+CTGGGGGAACTGGTAACGAGTGGTGTATCCGTTCTACTTCAGTTGTTAGGTTTAGCACAT
+TTTGAACTGTTTGAACTGTTTTTTCGGCATCATCCATTATGCTCGTAAAAATCTCTTTGT
+TAATTGACAGACTCTCTTTAGAGTTTTTTGATGTTAGCGGTAAGATAGTTAGCTTTCCGT
+TATTGGGATGATCTTTTTTATTCAGCACAATCCCAAAGTGCGAATCGGAAAATTCATTGC
+CGATATTTACTCCAAAATGAATAAAGACGATAGTTCCTCGTTTGTATCTCTGATATTTTT
+GAGATTTAATTAAGTTTTCTGTTTTAAAAATTTTAGCGCGCTCGAGTTCTTGTCTTGATA
+ATTTGTAAAATTTGGGATTTTTCGGATTATCAGAGATATTCAACAGAATTTTCTTGCTAC
+GGCTTAAATTTTGTTTATTCAATGCTTTACTATCCATTTCTGCTCCTGCCTATCTCTCCC
+TATAACTCCCCATAACTTCACCAATAATCCTAAAGTCGCTATCTCTATCTATCGGTATAT
+CTGGATAATCACCGCATTGATTTAAACTGTGTAAAAACGCCCCCTTGTCATTTATAAGTA
+GCTGTTTGATATAAGCGTCACCATAGTATTCAAAGACGCCTATATCGCCATCTGTAAGCT
+CTACGGATAGCTTAACAAATACATAATCCCCAGAGTGATACTTCGGTTCCATGGAATCAC
+CATAAACAGGGATAACAAAGTCTGCGTCATAATCGACTGGTAATTCAATTGTTTCTACTT
+GTACATCATTTAGATACTGACCTGTACCAGCTGAAGCTGCGTGGTCGTAGTAATTGTAGG
+TGTAGTAGGTGGCTTGTGGTTCTTCTACTGTGTTTTGTTGTTCTAATTGTGTTTCGGCAT
+AATCAAGCACGTTTAGTTGTCGCTTGTGTTCTAATTGAGAAGAAGTAGAGTTTATTTTTT
+GTAGGGTAGATGGGATGAGTTCAACTTGGGGGGCGGTGGGAGTGGGATTATCTCCAAACA
+TCATTTTCTTAGGCTCTACACCGAAGAATTTTGCTATCTCTTCAATCTCATATATTTTAG
+GAGAACGCGTCCCTTTTTCCCATTTTGATATTGTCGACTTTGTTTTTCCAACTTCTTCTG
+CCAACTGTTCCATGGTCAAATTCTTACTAAGTCTAAGTTCTTTGACCATTGCCGGAAATG
+CAATAGTGGAAGCCATATAAATTCTCCTTTTTATAGCTTATTTATCTACATTATAATTAC
+ATGTTTACAAAATGTCAACAAAAATGGCAAATAATCAAATCCAAAAAAGTTGACATTTTT
+AACACAAAATAGTTGACAAAAAGGAAACTCGGAGTTATACTATAATCAAGCTTAAGGAAT
+TAAGCAAAACGAAAGGAGGTACAAAATGAATTGGAAAAAACTAATGTTTGGCGATTTAGA
+ACACACGTTTACTAATCATGATGGCAAAGAAAAAACAAGCATCGAATTTGAAGGTGGAGT
+TTTACCAGCTCTGTTAGTGTTGGGCGGTATTGCTTGGATGATCGCTTGGTTTATTACAAA
+ATAAAAACTCCCAAGAGGGAGTGGAAAGGAGGAAAATATGATATTCATAGCAATAATTCT
+ATCTGTATTAATATCGTTTCTGGTATCACTGGTTATGATGAAATGGCATATATGGAATGC
+CAATAAATTACTGAATAAATATTTCGATATTGAACAATCAAATATAGAGAAGTTTTCAAA
+ATCTATTCTAGACAAACTGAAATAAATTTTTTTCCGAAATCTGTTAAGGAGACCTTTCCT
+TTTTCAATCTTAATATCATATTTTGTGTTTGATGTTTTGAATAAATTAAGAGTGTTAATT
+TCACTTTCAAGAGATTTGTAAATTGTTGTTTGTTTAATTGATTCATAATTTGAATCCAAT
+GGATAATGAAGATAATCAACTTTGATTAGCCCTAATCTGGTTAAATTATCAATAGAAGAA
+GCAATAATATCTGGTGAGTAATCTAACTTTGATAAGTATATATTATTTGCCTTGTTAACG
+GTTCCTGAAAGGTTTTCTTTACTGTAGTGTACTCCTATTTGTAGATTTGCAATGAGATTA
+TTTCCCTCTTGATTTATCAATAATAGATTTTGTGCATCAAGTGGTGTCATTTGTTTGATG
+ATTTGAACAAAAGCTGAGTGAAGATCCTTTTCTTTGTCCTGATTAAATGTTGAAGCTATC
+GTTCTAGCGAACATATTTCTAAGTGTTTCGTTACTTAAATATTGCTCTGACTCATTTATC
+GCAGGATATAAGATATACTCAACGGGTTCTTTTAAACTAGTTTGCGGTATTTTAGAAAAT
+TCGCAATCAATCTCATTTTTGAATTTTTCTTGATTTTCTAATTTTCTTTTTTCAATCTCA
+TAGATGTATTCATTTTCAATCTCTTTTAATTTTGCTTTTCGCTCAGTTAGGTATCCATAT
+TTTGAATACCACATGTGGTTTAGCGATGTAAAGATAGGTTTCAGACCACCTTGGGTAATA
+AACAAACCAAAAGCACTAGAAGTCATTGGCCAATATGTTTCGATATTACTAAAATCAATC
+ATACTTTTTTTGCCTCACATTTTTATTTCAATTATACCACAGAAAGGGGGTGGGGGAGAA
+AATGGAGAAAATGAAAGCACCTAGCCTAGAAGTTAATCTACGGCTAGGCGAAAAGGAAAT
+CAAGGCAGTTGTTTCTGGATCAACTCATCAATCCTCTGAGCAATCAAAGGTTGAAGTTGA
+TGAGCAAAATCTTGAGAAATAGAAATCGAAAGCTCTTCTGTTAGTTCTTGCAGATTACTA
+AAACTGTCTAATTGTGGCAATTCAGAAGGTTCAAAAGTATTTGCAAGTTTTAAAACAACT
+TGACGGAAATCGCCGTCAAACTTTATGTTAATTTTTAATGGATCCATCACATTCACCTCC
+TTTCTGCTCACATTATAGCAGATTAGAGGTACTAAAAACAGATAGAAAGGAGGTGGGGGA
+ATGCAGGAAAATGCTTTCGAGCAATTAATTGATGATAGCGGAATTAAAAAGAAAGTTATC
+GCAACTAAAATGGGTTTTACGCGCTCTGGATTTTATCAGAAACGTAAAAAACCCAAAAAA
+TCATTCGATGCGTCAGAAGTGGCAATGCTAGCGGATATTTTAGGGGTAGACCCCGGAAAA
+GTCCTGGAAGCCATTTTAATTTCATAGAAAAGTTGACAAAAATAACACAACACTGGAAAG
+GACAATATGAATCAACTAATTAACGTAACACTAAACGAAAATCAAGAACCAGTTGTCAGT
+GGTCGTGATTTGCACAAAGTACTTGAAATTAAAACACAATATACAAAATGGCTTGAGCGA
+ATGAGCGAATATGGTTTCGTTGAAAACGAAGACTTCATGGCTATTAGTCAAAAAAGACTA
+ACAGCTCAGGGCAATCAAACAGAATATACAGACCACGTTCTAAAACTAGACATGGCAAAA
+GAAATAGCTATGCTTCAACGCAATGAAAAATCTAAAGAAGTCCGTAAATACTTCATCCAG
+GTTGAAAAAGATTTCAACAGTCCTGAGAAAATCATGGCAAGGGCGTTGCTGATGGCGGAC
+AAGAAAGTGCATAAATTAGAGGCTCAGATTGAGGCAGACCGTCCAAAGGTGCTATTTGCT
+GATGCCGTAAGTGCTAGCCATACCTCTATATTGGTCGGAGAACTTGCAAAGTTACTCAAG
+CAGAATGGGGTAAATATTGGAGCGACTCGTCTCTTCACTTGGCTTCGTAAACACGGCTAT
+CTTATCAAGCGTAATGGCCGAGATTGGAATATGCCTACTCAGAAAAGCGTAGAGCTTGGA
+CTTATAAGGGTCAAGGAAACTAGCATCACCCATTCTGATGGCCATATTACAGTAAGCAAG
+ACACCTCTGGTAACCGGAAAAGGTCAGCAATACTTTATCAACAAATTTCTTAATCAGGAA
+TATCTACCAGTTTAGAAACGTAACAAAACTAACGAAGGGAGAAAATATGGAAGAGAAAAA
+ATTTTTTACTACATATGAAATGGATCTGATGAATTCAGTTGTAACTCTTCAAAAATCAAT
+CTTAACGCAAACGGAACATTTGTCAGATCAACTAACAAAAAAGCTTCATCACCTAGAAGA
+CTACAATAGTCCGATTGATGATGAAGCAATTAGATTGGCTGAGGTAACAGCAGAATTTTA
+CAAGTTGTTAATCAAGTCTCCTAGTGTTGGAGCAACTGTCAAGGAGATTGTGAGCGAGGG
+ACATAAGCGTTAAGGCCGTAAGAGCGTCATTGAGATTATCTGGATTGTAGTATTTGAGTT
+TGTGAGCTTTAGAGTTGCGATAAAGGTGAGCGATTGCAAGTAGCAAATTTTTTAATCCCT
+TATACTCACTTTGTTCGTCTAGAGTCTGCAATTTATTACCGTTGATAATCACAATGGGTT
+CTCCGGGTTTGAAACATTGATCTATCAGACTAGCTGAGTCCATTGCTGAGCCCGTTAGCA
+GACGAATACGATGAAAAACACCTTTACTTGCTTCAAATACGGCATGAAAATAGTTTTCTT
+GTAAGAGCTCTTGAGTGCAGAATTTTAAAACGTGAGGGTGTACTTTTAATTCTTTTAATC
+TACTATCAAGTGTTTCGAAGCGTTTTTTGGCCTCTGATAAAGTTTTTGAAGTAGTAGTAG
+TAACAATTTGTCCGCTATCTGATACAATCAAACCTTTTAGCGAGAGCGGAATGTTAATGG
+CGGTTCTTAACTGTTCAAAAATTGAAACTTCATTAATGTATCTTAAAGGATTACAGACGT
+ATTCAATCACAAGTTTTATATTATCTGTATTCTGTGTCCTATTTAATATATCGGACACGA
+GATTGTGCACCCGTTTGTGCTTGTTAAATCCAGAATTTTGGTCGTTTTGGGGATAACCTA
+AAACTTCGCCCATTCGGGTTATTTCAGAATGCGAAACATAGTCAGATAGTATTTTACCGA
+TTGTATCAACGAATTGGGTGTCAATATTTAACATAACAAACCTCGTTTTTATTTAAATTA
+TACCACAGAAAGGAGAACCACATGAGACCAAAACGATATCCGTATAGCGGAGAGAAAAAG
+AGAGCCTATCATAAGATAGACCCTGAACTGATAAAAACCGGTAAAGTTGATTGCATCAAT
+CTCCCTTAAGTACGCCAAGCTCTAACAATGCATTTGTCATAGCTGCGATAGTAGATTTAG
+AGGTTGACTTAGAGACATACTCCAAAATATTAACGATATGCTGAGCTTGCTTTTGTGTAA
+TAGGTGCATTCATTTGATTAAGTTCCGCAACGACAAATTCAACTAATTGGTTGTCAACAT
+TGAAATTTTGGTTGATATGTTTTGAGACAACAGAAAGGAAGAAAAAAATCATTGAAATTT
+GATGATGTCGTTAAAATCGCCGATGTCTTAGGTGTCAGCTTGGACGAATTCAGATAACAA
+AAAAAGTCCGACGGCAATCGGACTCAAAACTAGATTAATTTACTTAATTATACCACAAGA
+GAGAGGATATTAATATGCCGCAGAAATTACTTATAGAGCAGTTGATGTTAATGAAACAGC
+TTCTCATGGTGATTATAAACACTTGATTCAACAATGGGAGGGGTTGACAGTTGCTACTGC
+AAAGCAGTGGGCGACAGAAATGCGTGATCATCCAGACTTTAAACAGTTTGTATTAAATCC
+AACGCATAGAATCGTATTCATTGATTACGAAGGATTCAAACTGTTTGTACAGTGGAAATC
+TCGCAATCGTTATAAAACAAAAAAAGAGACACTGTCAGAAATGCTTGAAAATATTAAATT
+CGAAAAAAGAGTAGGAGCATAACATGAACAAATTAGAACTATTTTTATTAGTAACAACGA
+TCATCTTAGCAATCATCACTAGAGTACAACACGAAGTCATTAAAAAACATAATTCGCCAG
+AGAATAAACGCAGAATTTTTAGAGAAGTGGCTTTAGAAAACAGCAAAGGGTGGAGCGAGA
+AGCGTTCTGGAGGAAAGGTGGTCAGCTGATGCAGTACATTTTTCAAAAATACGACAAGTA
+GCTATACATCCGTTAGCAACGAATTTATAGATGATTGTGAATTATCCCTAAAATCAAAAG
+GCCTGCTTATGGTAATTCTTAGAAATAAAGAAGATTGGAGAGTATATCCAGAGGAATTGG
+CTAGAAGGTCCAGAGATAGCGTGAGAGTTGTAAGGACTTGCTTAGAAGAATTAGAGAGAG
+TCGGATATGTGAGAACTTACAGAAAATCTTTAGGGCGAGGGAAAGGCATACAATATTATA
+GATTTTGCTCAGATAAAAAGATATCCGAACAAGCATTTAAAAAAATGATTAGTGATTTTA
+CAACTTAACGTTTTACAAAGTTGTATTTTACAAAGTTGTATTTTACAAAGTTGTAAAACG
+TAACACTAATAATTACTAACTTATAAATAAATACTAAATAACAATAAATACTAACAGATA
+ATAAGCATCATCATCAACATCAGGAGGAGCTATGGACGAAAAAAAGCTTTTTGAAAATTT
+CCAATTAACTTTTGGACGGATGATATCGCCATTTGAAATCGAAGATATTCAAAAGTGGAT
+TCACGAAGATAACATGCCAATTGAAGTTGTCAACCTTGCCTTAAGAGAAGCGGTAGAAAA
+CAACAAAATCAGTTGGAAGTATATCAATAAAATCTTAGTTGATTGGTATAAATCTGGAGA
+TACGACAGTAGAAAAGGTCAGAGACAGGTTGCAACGGTTTGACGATAGTAAAAAACAACG
+AAGTGTAACTACCTCAAACGTCCCAAGCTGGTCGAATCCAGACTACAAAGAACCAGATTT
+AGAAGAATTTGCTCTAGGAAGCATGGACGGTATAGAAGATGGATCAGGAGATTTTTAATT
+TTTTTAACAAACAAATCAAAAAAGATTTTGGTAAAACGGCGAGTAAAGAGACTTTTGCTA
+AGTTTGCTAGTTACTGCGCCGAAGGAATCGAAAAAAATGGAGTTAAGCCAATTTTTAATT
+GGATAAACCTATACGCTTTTGGAACTGGTATGACAACAGCAGAAGCAGACCGGTTGAGAA
+TAGAGCGATATAAACAGGAGAATGCGTTATGACAAAACAACATAGAGAAACACTTATCTG
+GTACCGAGCAAGTCATCAAGAGCGTGAGAGATTGCTTGATTTTGGACTAGTTGATAAAGC
+ACGGTACGTGACACTATTGCGGCAATTGCGTAAGAAATATGCGATTTAGGAGGAAATATG
+ACACCAGAACAAGTAGAAAAAGCAAAAATCAGAGCTAAACAAGAACTTGAAACGTTTAGC
+ATATACCTTGACCAGGCAGTTGATGAACTCGGTGGAGTTTTAACTTCGCGAGAAGTCTTT
+TTGGCAGCGGGATTCACCTACCTTGGCGCAGGTCAGACAGATATACATGCTGCAGTCGAG
+GGATTATGTGAGCAAATCCAATGATTTTAAATTTAGTGAAGACTGGGAGAGCAACTAAAA
+CACAAAAAGAGGAAATGAAATGAACATCAAAGAAAAAATTGTAGTGCTAAGAAACACTGA
+AGACGGAAGTTTTTTAAAGAGTTTCAAAAACAAAAAAGATGTACTTGCTTATAATGTGGA
+ACTTACAGATAGCATTCAACTGGCATCATTTTTACCAGAAGAAGCTTACAACATACAAAA
+AGAAAAAATTGATAATTTGGCAGAAACGCTTGGGTGTGATGTTGTAGTTATCGAAGCATC
+ATATGACCTAAAATTTGTTGATGGCGAGGATGTTCCAGAGTTAACAAAAGAGCAAAAAGT
+TAAAAGTATGGTAAACGGAATGTTTGAGCAGGTTTTTGGAGGTGAATAGAGATGGCAAAT
+CAATTATCAACACAACAAGTTAAACGTGATATCACAACTGATCCAACTTTGCTGACAGGA
+GCTGATATTAAAAAATATTTTGATCCTCAGAACTTGCTTAGCGAAAAACAAGTAGGGCAA
+GCTCTGGCTTTGTGTAAGGGGCGCAACCTTAATCCATTTGCAAACGAAGTTTATATTGTG
+GCCTATAAAAATAATAGCGGCACAGATTTCAGTTTGATTGTATCTAAAGAGGCATTTATG
+AAACGTGCTGAACGTTGTGAAGGATATGATGGATTCGAGGCTGGCATTACTGTTATGAGA
+AATGGTGAGATGGTTGAAATTGAGGGCTCTCTAAAACTACCTGATGATGTTTTGATAGGT
+GGATGGGCCATTGTTTACCGCAAAGACCGCTCACATCGATACAAAGTTACTGTTGACTTT
+AACGAATATGTCAAACTTGACAAATATGGTAATCCACGAAGTACTTGGAAATCAATGCCA
+GGAACAATGATTAGAAAAACAGCACTTGTTCAGACACTTAGAGAGGCTTTTCCTGATGAA
+CTCGGTAATATGTACACCGATATTGACGGTGGCGATACTTTTGATGCTATTAAAGATGTG
+ACTCCTCAGGAAACACAGGAAGAAGTCAGAGCACGGAAGATGGCACAGATTGAGCAGTAC
+AAGCAAGAACAGACTCAGAAACAAACTCAAAAAGCAGACACTAGCTATCCCGTTGATGAA
+GTGTCTGAACATACTGATGATCCAGTACAAGGAGAACTACTTGATGGAGAACTGGAGTAT
+TAGGAGGAAACCATGCAAGAATTACAATTAAAAGTCACACAGGCACAAGTTGAAATTATT
+GATCGTGAAAAATTTGAACAAAACATCAACGAAGTTGTGGCAAAATACCAAAATTATGCA
+GTCACAGCTGGAACTATCAAAGATGACAAGCAAGTCCTAGCTGATCTACGCAAGCTCAAA
+AAACAGTTGTCTGATGAGCGTATCAAAGTAAAAAAGGAACTCTCAAAGCCTGCTGACGAC
+ATTGATGGATATATCAAACAGGCAAGCAAGCCACTAGATGACACGATTGACAAGATTGCA
+ACTGATGTCAAAGAATTCGAAGACCATCAAAAAGCGCTGCGATTAGATACAGTAAAGAGC
+TACTTGTCTAATAAGGCATCCGAGTATATGCTTGACCCCCGTATTTTTGACGAAAAAGCT
+ATGGAGTACACCAAAGCTGGCAATTTTATGGCGGACGGTGTAACCCTCAAAAAAGTCACC
+ATGAAATCTCTTGAGGACTTGGTTACCTTTGAATATCAAAAGGAGCAAGAGGTCGAAAAA
+GCAAAAGCTACCATCTCAGGACAATGTGCTGAGTATGGTATGACTGACCAACCTTACATC
+CGTATGCTAAAAGAGATGACGCTTGTAGAGGTGCTAGGTCAGATTAAAGCTGATTATCTC
+GCTGAAAAGCAAAAGTAGGAAATGCGAAAAGCCGAGGAGGAAAGAGAGCAACTTTTAGCA
+GCTCAGCAAACTAAAGAACAAGAACAGGCTCAGAAATCAGCAGAAATACCACAAATCGAC
+AAGGAAACAGGCGAAATCTTGGATGGTTGGCAATTATCCCAAAACAACCAAGAAACGCTC
+ACAGGAGCTGAAAACGAGTTTAAAAAGTACAATCAAAAAATGACACTTGAGGTGTACTTT
+GAAGATACGGCTGAAAAAGACCGTTTCAAGACCGGTCTAACTCAGCTAGGTTTTGATTTT
+AAAAAAAATTATCAAGTCAGCGGTTATCAAAATATAGAGCCTCTTACTCAAGCTGAATTG
+GCTCGGCGGTGCGGATGGTAAATAAAAAATAGTTTTTTAACAACCTATTGCAAAGTGAAG
+CTCAGCCTTTGCAGTATCAATATTTTCCGAGTGAGAAAGGAAAGTTGGAATATCGTCAAG
+TTAACAGGATTGATGATATAAAAAATTGCTACACTCGTCCTTGCCAATGCTCACACACAA
+TTTTAGGGCGAGTGTGGATTTTAAAAGGTGAGAAATATGGAACAAATCAAAATTACAGAA
+ACAGGAATGGTCGTTATAAGCGATAAAGCACTCAAAACTTTTGTGATTGCAGGACATTTA
+TCGGAGAGGTGGGAATTTACCTCTAAATTTAAAAAATTAGATGAGCCATCACTTGATGAA
+AACGGAGATTTGTTTGAGCCTGTATACGAGTTGATGCTTGAAGCCAGGTCGAAGGGACAA
+ATTAGCATAACATCATCATATTGTGGCAAAAATCACAAAAAAGACACAGACGAAATCATA
+AAAGTATTCTCGTTTATCGAAGATAACAAGAGAAATATTTTTGAAAACCTTGGTATTCGT
+GGGGTGCTTGAATGAGCAATCTAGTTTTATCGTTAGACATCTCAACATCTGGAACAGGGT
+GGGCCTTATTTAAAGGCTCAGACCTTATCCAGAGTGGTGTCTTAAAACATAAGAGTAAAT
+CCTACTTTGAGCGCGGACGCTATATGGCTAGCCAATTAGGACTAATCCAGTCACGAGCAT
+TAAAAAAATACGATTGCTATTTTAGTACAATCGCAGTCGAAAAAAATTCAGTTATGGGAC
+CTAACCAGCAATCCATGCTTAAAATCGGTATTGTTACAGGAATTATCTTAGGAAGATTAA
+TAGCTGATAACGTCGCCTTTATAAATGTATCAACGTGGCGTAAGCACTGGAAGTTTAGCT
+ACAAAGACCGCTCTAAAAAAGCGATGAAAGCACAATCGAAAGAAAAAGCTCTCGAATATT
+GCGGAAAAACAGTAAAAGATGATGAAGCGGATGCTATTTTGATTGGCTCATACTATGTCA
+ATCAAGGCTATCTTGATGAATTGGAGACACATGACTACTACTAAAAAACACGTTGTGAGA
+GTTTACAACAAAGGTATTACAGCGACTTACGCGATCTATGACAAAAAACTGTTTAAGGAG
+CACGAGTTCGCAACCAAAAACGAAGCGATGCGGTTTATTAGACAGCTAGAGTTAGCTAAT
+GATAAGCGAGCGACAGAATATTATTTGAGAGAGGTAGAGAAATGATACCAAATTTTAGAG
+GGTTTAACAAAAAAACTAAAAAAATGTATAGCATTGATGGCTTTAAATCAAGTGAACGCA
+AAATATACAGATGCAGCTTAGCAGATGATGAGTTTCGCTCTGGTCGCTTAGAGACATTCC
+ATTTTGTAGAGGATAATCTTGTGGAAAAGTGCAACAGACCACCTGAACGATTTTATCGAC
+AAAAACAAGTACGCAAAAGTGACAGGCGACTTATGGCAAGGCAGTGATCAAGTCATTGCT
+GAGCAGTGTTTTTTAAAAGTATTAGAGGAGATGCAAAAATGAATATAGAAGAAGCGAAAG
+AATTAGTAGATAATTCAAAATTTTATGGAAAGACTAGCAGTGTTATAAAAGCCGAGGTTC
+GCGACATTATAGACCAGTTAAACCAACCAAAACCAGAAGTACCGCAGTGTGTGGCGGATT
+GGATAGAAGAGTGCAAAGAAGAAGATTTAACTTTAAAAGGCTTGTTTTCTAACAGCGATA
+TGCCTGCAAAAATTTTTGATTGGATTTTTGGTAGTGACGAAAATTGTAGGTTAATGGCTG
+AAGCATGGATTAACGGCTACACAGTAGAAAAAGAAAAGCTCTACACTGTCGACTTACCAA
+ACGGTCAACCTTTAGTGCGCGGCATAAACACTTTGTATTTTAGTCAAAATCTAGCAACCG
+AAAATGTAAAACTCACCGAATCCGAAATCCGCAAAGATTTTGAATGGGCGTGGCAGTTTG
+CTGAAGAGGTGACTGAATGACTGAAGAGTTAGGAGTGTTATATAGCGAAAAATGGCATAA
+GTATTATTTATATAAAACTTGCAGGTATATATCTTATGTTGATAATCCACATCAGGCTAC
+TAAATGCACCCGCAAACAAGCAGAACAGTTTCCACAGTTTAAATGGGTATCGCTGACAAA
+ATTATAACCCCACGCAAGCGCTCAAGAGCCTGCGATGGCTCTGTGGGGGTGGACCGAAAT
+TAAAAAATAGAAACGAGAACCTCCTTACACCAAAACAAATCTAAAGCGGGTTATCGGTCA
+TCCGTGATTATCCAAGGCGTCGCTAATGCTTTAACACGACATCGTGCGCCTGTGTCAAAA
+AACAAAGGAAAGAGAGGACTTTTCTCCACAAAACAAAAAGACGTCCATACGGAACGCCCC
+CTTGGTTAAATTTAAGCTTAAATAAATTATACCACATTGGGGGGCTTTCATGACGTTTTT
+TCCTGAGATTGATATCCAAAAAACAAAATCCAACGCCAAGCGTAAATTGAGAGAGTATCC
+ACGCTGGCGGAGGATAGCTAATGATGTAGATACTCAAAAAGTTACAGCTACTTACTCCTT
+TGAGCCAAGACAACCGCATGGAACGCCAAGCAAGCCTGTTGAGAGACTAGCGCTCAACCG
+TGTGTCGGCAGAACAGGAGCTGGATACGATTGAGAGAGCAGTCAACGGGATATTTGATCC
+AGAGTATAGATTGATACTGATTGACAAGTATTTGCTCACATATCCAAAGACTGATTGTGA
+TATTTATACAAAACTTGGTTATGAAAAAAGCCAGTATTACAACATGCTAGATAATGCTTT
+GTTGTCGTTCTCAGAGCTATATAAAGAGGGAATGTTGCTTGTCGAAAAATTGGAAAAAAG
+CTGGAATTAATATGGAATAATTATGTACTTTATATATAATTATTCATGTTATTATAGTAC
+TATCAAAATAACAAGAAGAGATAACCTTTTAATCAATTGGCTATTTATTTAGTCGCCAAC
+TTTAACTACAATCAAACTTGTTATTTTGTAGCCTGATGGCGGTACAGCGAGTTGAGACGA
+CAACTGGGTATGCAGGTTCGATTCCGACTGTTCCTGTTGCATTTAATGCAAACTCCATAT
+TTTTATTAAAAAGCCTATTATACCTATTGTGTAAGGGCTTTTTTAATAGTATTATTAAAG
+TGATAAAAAATATGGAGATAAAATATGGAAAACAAACCCGCAAAAGCAAGTTTCTTTAAA
+TTAAGTTCTTCTAAAGAATCTAATTTAAAATTGTTTATCGAAAAGATGGAGGAAATGTTT
+GATAATTTTAGAAAAAAACAATATAGTAACATTCCAACATTAGAGATAAATGATCTTATG
+TATTATATAAATGCAATGCAGAAGGTAACAAGTGAAGAAGAATTAAATGGAACGAATCTA
+TTTTATTGGTTAGTCACCATTTCACGGGTGGACACAGAATCTCCAATTATTCTTGCGAAT
+CTTGAAAAAAATATTGATGTAAGAAAAAGGGAAATTGAACATGGGGATAATGAGGGCCTT
+GTGGTTGATACAAGATTATTATTTGATCCATTTAGACAAATTTTAGTTGTTTATAATCAA
+AGAGGTACAATTAATAATTACGACTTAAGAAGGTTTTTTTGTCAAATAATTGGAGTTAGA
+GGATTGAAGTTTGATATTATATTAAACAGTGATGCTTTCAAAAGGGTTGGTAAGCTTGAC
+GTTGTAAATTCAATTAGTTATACTGTTGCAAGCCCAACAAACTTTAAGGAGTTTCGAGAT
+GATACTCAAAGTGAAAATGCCGATTTAAAGTTTGCAAATTCTATGCTAGGAGAGTCAATG
+CAGGTTGTTATAAAGTCAAACCATCTTTCTAAAAAAAATATATTTGATAAATTTTCAGAT
+ATGTTAGTTAATGACTCAGTTAATGTAAAAAATGCTAAAGTTGAAGGTTTTACCGATGGT
+CATCCGGAATTAATAGACTTAATAAAAAATAAATTGGAATATAAGGGAACTATTTTTTAT
+GAAAATACTTTAGACGATGAGGCTGTTTATGCATTTCTGAATACCGCGTATAGCTTTCAT
+TTTAGTCATTTAAAAAGAATGTTTACTATAACTTTATAACTTATATTGAGGTATGCGATG
+AAAAAAGGAAGGTTTAAAAGAAACTGGCCGATTATACTATTTGGTATAATAGTTTTTATA
+TTTAGTTTTTATTTTAAAATTTCTCCAAAAAGTTTAAAAAATTTTACTGATATAATGTCG
+GCATCTCTATCATTTTCAGCAATTGTAACCGCAATATTCTTTGCTAGTTTTTCATTGATA
+CCAACTTCCGGTTCTAATAAATTAGTAGTGATGATGGAAGATTTAGGGACAGAGATAAAA
+ATAATGGACCGCCTATTAGTTGCTACTTTTTTATCTTTCATTAGTTCTTTATTATCTTTT
+ATTTCTCTATTCTTTAGTAAGACTGATACTGATTTAATTTCAATTTTAGTAGTTTCAAGT
+TGGTTGAGCTCAACAGTAATGATGTTCCTAAGTTCGTTCTTTGTGCTAAGAACATTAATT
+TTGTTAGTTGAAACTTATAATAATTTCAAAAATAAATAGGTCATCACATTGTGGTGGCTT
+TTTATTATGGATTGGAGGTGGTGGAAAATCGCATACGAGGAATTAACCGAAAAACAACAG
+CGTTTTGTGGATAAGTACATCACCACATTTAACGCTACTGAGTCTGCAAAACAAGCTGGA
+TATTCTGAAAAAAGCGCTTATAGCCAAGGTCAACGCTTGTTGAAAAATGTTGAAATTCAA
+AAAGCAATGAAGGAACGTTTTTTGGAGGCAAAAGATACTAAAGGAGACCGTATTCAAGAT
+GTTGCAGAAACGTTGGAACAAGATACATCGATAGCCCGTGGAGAAATCCAAATATCTGAA
+TTCAAAGAAACAGATATGCTGACAGGTCAAGTGGTTATCCACACGAAAAGAGAATATACC
+CCAAGTCACGAAGAACAGGGTAGGGCTAGGGATAGAATTTATAAAGTTAATGGAGCTTAC
+TCAGAAAAACGTGAATTAGAGCATTCTGGAACGGTGGTGTTTGCAAATGAAGACAACATC
+CCTGATTAAAGTAGATTTGCCATCAACAATCGGTATAGGTTATGGCGCTTTTTGGCGGTC
+TAGAAATTTTTATCGAGTAGTTAAAGGCAGCCGTGGATCTAAAAAATCTAAAACGACTGC
+TTTAAATTTTATCGTCAGACTGCTGAAGTACCCTTGGGCTAACTTATTGGTCATCCGTAG
+ATACTCAAACACTAACAAACAATCTACTTATACCGATTTTAAATGGGCGTGTAATCAATT
+AAAGGTTACACACCTTTTTAAGTTTAATGAGAGTTTGCCAGAAATAACTGTAAAGGCAAC
+GGGCCAAAAGATACTGTTCCGTGGACTTGATGATGAGTTAAAAATCACATCTATTACTGT
+CGATGTTGGCGCTTTGTGCTGGGCTTGGTTTGAAGAGGCTTATCAAATTGAGACCGAAGA
+TAAGTTTTCAACAGTTGTCGAATCAATCCGCGGTAGTTTAGATGCTCCTGATTTTTTTAA
+ACAGATAACAGTCACGTTTAACCCGTGGTCAGAAAGACATTGGCTTAAACGTGTCTTTTT
+TGATGAAGAAACTAAACGGGCTGATACATTTTCTGGGACTACAACATTTAGAGTAAACGA
+ATGGCTTGATGATGTCGATAAAAGACGCTACGAAGATTTGTACAAGACTAATCCAAGGCG
+GGCTAGAATCGTGTGCGATGGTGAATGGGGCGTTGCTGAAGGTCTTGTTTTTGATAACTT
+TGAAGTCGTAGATTTTGATGTTGAAAAAACAATTCAACGCGTTAAAGAGACCTCGGCCGG
+TATGGACTTTGGGTTTACTCAAGACCCTACAACTCTTATATGTGTTGCAGTTGACCTCGC
+AAACAAAGAGTTATGGCTTTACAACGAACATTATCAAAAGGCTATGTTAACAGATCATAT
+TGTCAAAATGATAAGAGATAAAAACTTGCATAGGTCTTACATCGCAGGGGATAGCGCCGA
+AAAACGCCTCATTGCAGAAATAAAAAGTAAAGGGGTGTCTGGAATTGTCCCGAGTATTAA
+AGGTAAAGGGTCAATCATGCAAGGGATTCAATTCATGCAGGGGTTTAAGATATATATTCA
+CCCATCTTGCGAACACACAATAGAAGAGTTTAATACTTACACTTTTAAGCAAGACAAAGA
+AGGTAATTGGTTAAACGAACCGATAGATAAGAATAACCACGTTATTGATGCGATTAGATA
+TGCGCTTGAAAAATACCATATCAGAAGCAACGAGTCAAATCAGTTTGAAGTTCTTAGGGC
+TGGTTTTGGTTACTAGAAAGGAAAATAATGTACACAGAATCATTTAGAGATAGTACGGGA
+AAGACTAAAACATTAGAGTTTAGGTTCCACCGTGAAGCTCGCATGAGGTATCAAGCGGAA
+AGTCTAGAAAGCTTGTTAACCGAAAAATATAAGCTACTCCGTGAAATGATTGAACACCAC
+GATAAAGTCCAAAAACCACGCATACAAGAGCTTCTAGATTATGCAGAGGGAAATAACCAC
+ACCATCAGCGAAATAGGCCGTAGGAAAGACGATGACATGGCTGATGTTCGTGCTGTGCAT
+AACTATGGTAAGTATATTTCAACGCTCAAACAGGGCTATTTGGTGGGTAATCCTATTCGT
+GTAGAGTATATTGATGGTACCGAGCAGTAGCAAGACCTATTAAAGGACCTATCTGTTAAA
+AACAATTTCCACCAGCTGAACCGCAGATTAGTAAAAGACCTATCCAAGGTTGGTCGAGCG
+TTTGAATTGATTTATCGCAGCATGGATGACAAGACAGAGGTCGTTAGACTAGATCCACGG
+GAAGTATTTGTTATCTATCAAAATAACCTAGAGCAATCAAGCTTAGCTGGTGTGCGGTAC
+TATAACAAAAATCAATTAGATGGTACTACAAAAATTGTCGAGCTTTACACCGATAATAAA
+ATCCTGAAGTTTGAATATGATGGTGATTTAACACCTATCGGAGAGACTTCCTCTCATGCG
+TTTGGTTCGGTGCCAATCACGGAGTACCTCAACACAGATGACGGCATGGGTGACTACGAG
+ACAGAGTTGTCTTTAATCGACTTGTATGATGCAGCGCAGTCTGACACAGCTAACTACATG
+CAGGATTTGTCAGACGCGATTCTGGCAATCATTGGTCGTGTATCATTCCCTGGCTATGTC
+GACACTGCCGAAAAAGCCATTGAATACTTACGTAAGATGCGTAAAGCTAGATTACTTAAC
+TTAGAGCCTCCTGTCGACCAAGACGGGCGTGAGGGATCTGTAGATGCCAAATATCTATAT
+AAACAATATGACGTACAAGGAACCGAAGCCTATAAAAATCGTATTGTGTCCGACATCCAT
+AAATTTACCAATACGCCAGACATGACAGACAGTAAGTTTGCCGGTCAACAATCTGGCGAG
+GCGTTGAAATGGAAGGTGTTTGGACTTGACCAGGAACGTGTAGATATGCAAGCTTTATTT
+GAGCAATCTCTTAAACGTAGGTACAAACTAATCGCTCGTGTAAGCCAACTGCTTAAAGAG
+ATTGATGACTTTGACATCAGCAAGCTTAAAATCACATTTACGCCAAACCTACCTAAGTCG
+CTACAAGAAAAGATTGAAGCCTTTAAAGCATTGGGTGGAGAGTTGTCGCAAGAGACAGCT
+ATGGCTATTACAGACATCGTGGAAGATGCTAAGAAAGAAATTAGCCTTATCAACAGCGAG
+TCGAAATCACGTAGTCAACTAGCGCAGAAGTTAGAAGAAACCAGTAGATTGACTGATAGG
+GAGTTAGCTCATGACCACCAGAAAGAGTAAATACTGGCGTGACCGTATCAAGAAAGAAAT
+GGATGCTAAAGAGGCAGACGATATCTCTCTTGAGCAATCCATGAAGCAATTGCACGATTA
+TCATTTCAGGAATATCGAAAAAGAAATTGAGTCGTTTTATCAACGTTATGCTGACAAAGA
+GAAAATAGACCTTTCAGAAGCCCGTAAGAGAGCTTCTGAGCTTGATATTTCTGCTTACCA
+GAAGAAAGCTAAGGAACTTGTTGCAAAGGCTGAGAAACTACGAAGAGAAGGTAAGATAGT
+AACAAGAGATGACTTTACCCACCAAGAAAATGCAGACATGTCTATTTACAACTTAGCCAT
+GAAAACGAATGCTTTGGAACTATTGCGCTTAAACATTGATTTAGAAATGCAAGAACTTGC
+CAACGGCGAACACAAGCTAACCAAGAAATTTCTTGATGAAGGCTATCGCAAAGAAACCGA
+GTTTCAAGCTGGGCTATTAGGATTATCAGTTGCTAGCCAAGCGAGTGTGAAAAGCTTAGC
+TGATGCCGTTATTAATGCTAATTTCAAAGGAGCAAAATGGTCAGATAACATTTGGGACAG
+ACAAGATAAGTTACGTAGCATCATATCTCAAAGCGTCCAAAGTGCTATCCTAAAAGGTAA
+AAATGGCTTAACTATTGCAAGGGATATCAGACGAGAATTTGATGTGTCAGCGTCTTACGC
+AAAGCGACTAGCGATAACGGAGCATGCAAGGGTTCAGATGGAAGTTGGTAGATTATCCAT
+GGCGGAGAATGGCTTTGCTATGTTTGATATATTGCCTGAGCCTAAAGCATGTGATGTTTG
+CAAGGATATAGCTAAGCATGGTCCATATCACCTTGACAAGTGGAGAATAGGGGAAAACTC
+TCCGCCGTTTCATCCGTATTGTCGTTGTGCGATTGTAGGGGTAGATGAAAGTGGTGTTGC
+AACAGACAGGCAATTGGACTATAATCGAAACATGAACAATATTGATTTGATGGCTAAAAC
+TCAATCTTTTATCATTAACAAAGATGTCCGAGTAAGTGCCAAGAAAGTTGTCGGCACAAG
+ATATGATTTTTGGGCGCAAGATAATACCAAAAAAATTAGAGATACGATTCAAAGTGTTGG
+AGAGCACTTAGACAACTTAGAAGGGTATAGCATTCCTAAAATTGTATTTGTTAAAAAAGC
+TAAGCTCCAAGGCTGGGCGGGATATGATTATAAACAAGACACTTTGTTTATAAGTGATTT
+GTTGAATTCAAAAGCCGCTGTGAGTGATATGCTGCTGGATAACTACTTTGCGGCTGTCGA
+CTTAAACGGTATTCTAGTGCATGAGTTAACCCACAAAAAACATTGGGATACTGCTAAACA
+ATTTTACAAACATAATAAAAAGCGTTATAATACACTTGAAGAGGCAAAAAATGCACTTGA
+TTCGTCTCTAGTTTCCTATATTAAAGAACAAAAGCAATCTGATTATAATTATTTATATAA
+AATAAGCGAGTATGCTGATGTTGCTAGTTTACAAGGGAAATATAACGAAGTTATAGCCGA
+GGCAATGACTGCGGGAGATAAATTATCAGATCCGCTATTGTTAGAAAAAATAAAGGAGGT
+ATTCAGATGGAAATGATGTCAAGACCGACTCAAGAAGTGCTAACGTTTTCTAAAATCATC
+CGCCGATGGATTGTAGGCGATGAAACCATTGGCGGCAAGAAAAAATTCATTTTCAGAGAT
+GATACTCCGGAAGATGTTTTAGAGCTATATCAAAAAATAAAAAATAAGTTAGATTTTGCA
+TATTAATTAAGCGCTTAGCTATTATAGTTAAGTGCTTTTCTTATGCTTAAAAACAGGAGG
+AAAACGTGAATAAACGAATCAAGAAAAAACATAAATTGGAAACAGCAGTTGTGTTGCTTA
+TCGCAGAAAATGCTATGCAGGCTGAAGCTATTAAGAATCAAAACAGACAAATTGCAGAGC
+TGAGATCGATTATACAACAAAACGCCCAAGCAATAAATAGAGAGTTTGCAGCAGTTAAAG
+GTGTGTGTCTTGATAATCAAGCAGCTATTACAAACATTGCAGTTGATATTAACTACGTCA
+AGAAAAACTACAAACGGAAGTGGGGGAAGAAATAGGCTTTTTCATATTTTTAAAAATTTT
+TTAAAAATCGCTTGACAAATGTCGACAATAGTTTTATTATACTTATGTCGGCAAAAGTGA
+GGTGATGAACTTGACTGACAAAAAGAAAATGGGGCGACCTACTAGCGACCCTAAGACTGT
+TAAATTGACTGTTAGAATTAACGAGGATACGAACAAAACTTTGGAAGAATATTGTAAGAA
+TAATAATGTTTCCAAAGCTGACGGTGTTAGAGAAGCTATTAGTCGTCTGAAATAACAAAT
+ACCGTCTAGCTCTCGGTCGGCAAACTTGCGAGCTAAACGGTATCACCACAGAAGTGTTTC
+TGCATGAAATATTATATCATGTAGAGACGCTCTTTTCAAGATACACGAAGGAGTGTTTTT
+ATTATGGCGAAAATTGATATTATTGATAATTATGAGACATTGCTAATTAGTGTCGAAGAA
+ATTAGAGCAAGTTTGGAATCCTTGCATGCCTGGCTGGATAAAGACATTGATTGGGATAGT
+CAGTGTGATTGGTACGATTTTATTTCTCAACACAGTTCCCAAATTGCGATTCTAAACTTG
+ATTATGTACCGTTTAGACAGTTTAGAAGTGGAACACAGAAGCGTTATCGAAAACACAATG
+AAAGGTAAATAATATGGAATTACAAGTATTTACTAATGAACAGTTTGGAGAAGTGCGTAC
+AGCGACAATCAACAATCAAATTTATTTCAATCTTAACGATTGTTGTCAGATTTTGGAATT
+AAGCAATCCTCGTAAAACAATTGAAAGACTTAATAAAGATGGTGTAACTACTAGTGACAT
+CATCGACAGTCTTGGTCGAACTCAACAAGCCAACTTCATCAACGAAAGCAACTTCTACAA
+GCTAGTCTTCCAATCTCGCAAGCCAGAAGCTGAAAAGTTTGCGGACTGGGTAACATCGGA
+AGTCCTACCATCAATCCGCAAACATGGCGCATATATGACCGAACAGACTTTAGAGCAGGC
+GCTGACAAGCCCAGACTTCCTCATACGGCTTGCCAATGAGTTAAAAGAGGAAAAGGAGCG
+CAGTCGTCAGTTAGAGGCTGAGAAGTCAATTTTGAGCGTTGAGAACATGGTTATGAAGCC
+AAAGGCTGATTATTTTGATGATTTGGTTGACCGCAATTTATTGACTAGTTTCCGTGAAAC
+TGCTAAACAATTAAAAGTTAAGGAACGACGATTCATTCAATTTCTACTTGATAAGAAATA
+CGTTTACAGAGACAAGAAAGGTAAGCTTATGCCGTTTGCAGATAAAAATAACGGGTTATT
+TGAAGTCAAGGAAAGTGTTAACGAAAAGACCAACTGGGCAGGAACTCAAACCTTAATAAC
+TCCAAAAGGTCGTGAAACTTTTAGACTGTTATTTATTTAATTCACTTTAAAGTCGTAGCA
+ATACGGCTTTTTATTATGTCCAAGCATTGACGACGTAAAAAGCTATGGATTTTATAGTCG
+GGGACGACTTAAAACATAGGAGGTGCCAACCATGGCAGAAGAAACACAAACAGTTGAAAC
+GGTTGAAGAGCAAGTGGTACCAGAAGCAAAACAACCGCAAGACGAAAAAAAGTACACAGA
+TGCAGATGTGGACGCTATCATCGACAAAAAGTTTGCGAAGTGGAAGTCAGAACAAGAAGC
+GGAGAAATCGGAAGCTAAAAAAATGGCTAAGATGAATGAAAAAGAGAAAGCAGACTACGA
+AAAGCAGAAGCTGTTAGACGAATTGCAAGAGCTAAAAAACGATAAGACACGCAATGAGTT
+AACAGCAGTAGCTCGTCAAATGTTTGCAGAATCTGAAATCAACGTCAACGATGACGTACT
+TGGTTTAGTTGTGACTTTGGACGCAGAACAAACAAAAGCAAATGTAACAACGCTAGCAAA
+CGCATTTGCTAAAGTTATCGCTGATGACCGCAAGGCTCTTGTACGCCAGACTACTCCGTC
+AACAGGTGGTGGATTGAGCAAACAAACCAATTACGGTGCTAACTTGGCTAGTAAGGCAGC
+ACAACAAAGCACCAAACTTTTTTAGGAGGAAATTATGAATAAACGTAAAGTAACAACATC
+TAAAGAGATTCTACACAATCTCGACTATGAAGCTATTTCAGTAACTTTGGATTCAAACAA
+AATCGGCAAGAAAGTTGTTCCAGCTGGGACAATTTTGGCAGGCAAAGATAAATCCATTTT
+TGAAGACCGCAAACAGAAAGTAGAAACCGTGACAAATGAAGAAGTCTCTACAAAAGAATA
+TGTCGATGGTATTTTACTTACAGATGTCGATTTAACAAATGGCGATGCAGTCGGTTCCTG
+TGTTTATCGTGGGACTATCAATGCAGACAAGCTTGCTGATTCATCTGTTGCGGAAAATTA
+TGATGATTTGGAAGAAGTACTACCACACATTGTCTTTATCAAAGGAGGTAAATAAACATG
+GCATTGATCCACGAAATTATCACATCGGAAAATATCAAAGGTTTTTATAACGCTAAAAAC
+GAAAATGTTGAAAATACATTGGGAGAAAAAGCATTCCCGCCAAAACAACAACTGGGCCTT
+AAGTTGTCATTTATTAAAGGTGCAGCAGGAAAACCGGTTACTCTTAAAGCGGCCGCTTTT
+GACACTAAGGTGCCTCTACGTGACCGCATGGCTGTTGAATTGATTGACGAAGAAATGCCA
+TTCTTTAAAGAGGCTATGCTTGTTAAAGAGGCTGACCGTCAACAACTCAACATGTTAGCG
+CAAACTAAAAATAACGAACTTATCGACACCATCTTGGCATCTATCTACAATGACCAGGCT
+ACGCTTATTGCAGGTGCTAAAGCACGCCTTGAAGCAATGCGCATGGAAGTGTTATCTAAA
+GGTAAAATTCATATCCAGTCTAACGGCGTGATGAAAGACATCGACTATGGATTGGCCGAA
+GATCAAACGACCAAACCAGACGCCAAATGGGATAGCGCAGGAACAGCTACACCACTTAAA
+GACATTGAAAAGGCTATCGAAAAAATGGCAGAGCGTGGTTTTGTGCCAGAAGCTATCATC
+ATGAACTCTAAGACATTTAGTTTGATTAAAAACGCAGAGAGCACCTTAGATGTCGTGAAG
+CCTATGGCACCAAATGGGGCAGCGGTTACTAAACGTGACCTAAACACATATCTTGAAGAT
+GAACTACAAATCAAAGTCATCCTAAAAGATGGCATGTTTGTTGGTGATGATGGTGAATCT
+CGTAAATACTTCCCAGATGGTTTTGCAACATTAGTACCTAACGGCAACCTTGGCTACACT
+GTATTTGGCACAACTCCAGAACAGTCAGACTTGCTTGGTGGTGAAGCGACAGATGCAAAT
+GTCTCAATTGTCGAAACTGGTATCGCAATCACAACAACCAAGACAACTGATCCAGTAAAC
+GTCCAAACCAAGGTATCTATGATTGCCTTGCCATCATTTGAACGCTTGGAAGAAGTACAT
+ATTATTAATGGCTTGCAAGATGCATAAGGAGGTGCTTTATGGCCAAAGTTATTAAGACTT
+TTAGAGATAAAGTGACGACTAATGCTTATTATGTAGGCGATGATTACAAAGGAGATCGTA
+TCGAGGAATTGACAGCCAATGGTTACTTGGCCGGAAATACTCCTAAACTGGATACTGTCG
+AAGAAGTTGACCTAGATAAACTCAAAAGCGATGAAATCAAGGCAAAACTTGACGAATTGG
+GCATTGAGCACGATTCTAAGCTTAAAAAGGCGGAATTGTTGGAGCTTTTAAAAGCTAACA
+TTTAACGGAGGTGTTTATGGCAAATGTAAACACATTTAGCATTGTAAAAAATGTCAAGCT
+CGATTTAGGCATTGAGGACGACAATCAAGACCAGTTGTTGGAGATGTTGCTAAATCGTAT
+TACAGACCACTTCAAAGCAAATTATGGCGTGTTAGAAATTGACAATGCTTTTTCTTTTGT
+CTTGGAAGATTGTCTGATTGCTCGTTTTAACCGTAGAGGTTCAGAGCGTGCCAAAACAGA
+GGAAGTGGAAGGTCATAAAACAACCTACTACGACCATTTGAATGAGTTTGAACCCTACGA
+TGCCATGATTATGGCAAAGCTTAATTTAATCAAAGACAAATCTCGTAAAGGGGGACTGTA
+CTTTTTATGAGATATGCAGATAGAGTTACATTTGTTAAAACGACGGATGAGCAATACAAT
+CCCGATTTAGGTGAGTATACGCACACAGAGGTCATAAGTATCACAAAACCTTGTTTTGTG
+ATGGACATGGGCATGGAAAAGTCCGTACAGATTTTTGGAGATTATCAAAAGGATCGTAAA
+GTTATCTACCTAAAGCAGCCTTATACAAAAGCATTTGATTATTGCGAGTATGAGGGCAGG
+AGATACAAAACGCAGGCAAATAAGCTTGGCGCTATTGTTTTTTATCTGGAAGGAGATGAC
+TCTATTGGTGGCTGATATATCTTTAAAAGTAGTTGGAACAGCTGGTTTAAAAAAGAAACT
+TGAGCTTATTATCAAAAAAGATGCCGTCAAGAAGATTGTCAGAGACAATGGGACGCAGCT
+TCAAAGGAAAATGATTAATAAAGCGGTATTTACAAAAGGCTATTCAACAGGTGCAACTAG
+ACGTTCTATTACCATGCAAATCGGCGATGGTGGATTGAGTGTCAAGGTTAAACCAGGAAC
+TCATTATGCCGGCTACCTTGAAAGAGGAACTCGCCTTATGAGCAAACAACCGTTTGTTTT
+GCCAGCTCTAAAAGAGCAAAAAGTAAAATTTAGAAAAGATTTGGAGGCGCTTGTCAAATG
+ATTAAAACTAGAGATCAGTCTATTTTTGACGAAATGTTTAAACGCATCCAGTCTTTAGGT
+TTTAAGGTTTACGATTATAAACCGATGACGGAAGTTCCATATCCATTTGTGGAAATGGAA
+TCTACTGATGCGGAATATATTCCAAATAAAGATGACATTAAAGGTTCTGTTGAACTTATG
+TTGTCTGTTTGGGGGGTGCAGAAAAAACGGAAGCAGGTGTCTGACATGGCATCTGCTATT
+TTTTCGCAAGCTTTGACAGTAGAGAGTTCTGACGTTTTCCGCTGGTCATTAAATACTCGT
+CAATCATCTATTCAAATGTTAGATGACACAACAACTGTGACACCTCTTAAACGAGCGATT
+GTCACACTTAGATTTAATTTGAGATAGGAGGTAGAAATGCCAGAATCAGAAACATTATCC
+CCTGACATTCATACCAAAAGTCACGAAGATAGTCCAAATACTGTAAAAAAACAGGAGGAA
+GTAATGGAAACACAATTAGAAGCAAAACAAGGGATTCATTCAATCTTGTTATTTCGTTTG
+TTGAAAGAAGCATCTAGTGAGGCAGCAACTAAACTTGCTTTTCAAACAGAGCATGAAGTA
+GGTAAAAGCCGTGACGTAGATGGACAAAAAACTAAAGATGGTATTATCCAGTCCGTGGGG
+GCTTTGGAGTACGACTTTAAAGCAACATCTATTTTAGCTAAAGGTGACGTACTAGCAGCT
+AAACTAGAAAAAGCCATGGAGAATGGTGAGCTTGTAGAAATTTGGGATATTGATTTAGAA
+GAAACAAGCAAAAACGGCGACAGCGACAATAAGCTTGCAAACGTTTGGGGTATTGATAAA
+AATGGAACAAACAGAGGAAACGGTAAATACCTAGCGACTTATTACCAAGGGTACATCTCA
+AGCTTCAGTGCTAAGAAAAATGCTGAGGAAAATATTGAAATTGAAATGGAATTTGCCATC
+AACGGTGTTGGCCAAAAAGGATTCGCTACATTAACAGATGCCCAAAAAGCAGCTGTACAG
+TACGCATTTAAAGATACAACGAAAGGTTAATCAACAAGGCCAGTTAATTACTGGTCTTTT
+ATTTTTAAGTTTTTAAAGGAGAAAGAATAATGCAATTGGAAATTAAAGGTAAAACTCATA
+ACGTAAAATTTGGTACACGATTTGTTGCCGAGATGGACAAAAATCATATAGCAGAACGTC
+AGGGATTTAAATTTGGAGCTGGTCTACAATCTAGCGTTCCGTTTTTAATCGACCACAGCG
+TTGTTACTCTTGCGGAAGTAATTTATACAGGTACAATCACCGAACCACCACGTCCTAGTT
+TGAATGATATTTACGACTATATTGACGAAGTTGAAGATATTGAAAAGCTTTTTGATGATG
+TTTTAGACGAACTACGTCAATCAAACGCATCAAAGTTGTTTATGGCTCAGGTGGAAAAAG
+ACCTGGCGGAAGCCAAAGCGTAACAAATATAAAAAAGAGTTATTCTTCTCAAGAAAGCTT
+TGAGATGATTGTGCTTAATTGCATTAGATACCTTGGCATGACTGACATCAATGAAATCGG
+GCGATTAACTTTGTATGAATATGATTTATTAATGACAGGCAAAGCACTAGCGGCTGTTGA
+TGAATCACATAAAGCTCACAAACAAGCTTGGATAAACCACCAAGTTACGGCAACAAAACT
+TGTTGGTGGCAAGAAAAATAAAAAAGAAGTCCCTGTTTATAAAAAATTCAAGGACTTTTT
+TGATTATGAGGAAGAAATCCGAAAAATCACTCAAGAAATTGATGAAGGTTACGACAAGAA
+AGGTATGGATTTACTTCTCAAAGCTAACCTTTAAAGAAAGGAGGTTAAATGGGAGAATCT
+TATTCTGTTGAAGCGGTTTTGACAGCTGTTGATAAAACCTTTGGCAAAACATTACAATCG
+GCAATCCGTTCAATCGATGGCTTGGAAAAGCGTTCAACCGGTTTTTCATCGGTGTCTCAA
+AAAGCTAGTTCCATGTTTAAATCCATGTTAGGAGCGAATTTAGCCGGACAAGCTATCTCA
+GCAATGACAAGGACAGTGTCATCAGGCCTTGGCTCTATGCTTGGCGAGATGAATAGTTCA
+GCGAAAGCGTGGAAAACTTTTGACGCCAATTTAGCGGACATTGGGTTTGGAAAAAAACAA
+ATTTTGGCAGCTAAAACGGCGATGCAAGACTATGCAACTAAAACAATCTACTCGGCATCA
+GATATGGCTAGCACGTATGCACAGTTAGCGGCAGTTGGTGTGAAAGATACCGGAAAGCTC
+GTAAAAGCTTTTGGCGGTTTAGCTGCATCTGCTGAAAACCCGAAGCAGGCCATGAAGTCT
+ATCAGTCAACAAATGACGCAAGCAGTAGGAAGACCAACAGTTGCATGGCAAGACTTTAGG
+ATAATGCTGGAACAGGCGCCTGCAGGGATGGCTAAAGTCGCTAAATCTATGGGTAAAAAT
+CTTGATGAACTCGTCGCCGATATCCAGGCGGGTAGGGTTAAAACCAGCGATTTTTTGGAA
+GCGGTAAAAAAAGCAGGCAATGATAAGAGTTTCCAAAAGATGGCAACTGAGTTCAAAACT
+GTTGACCAAGCCATCGACGGTATGCGAGAAGGCTTATCCAACAAATTGCAACCAGCGTTT
+GAAAAAGTGAACCAATTTGGAATTAGAGCGATCGAAGCAATCGGTAAACAACTCGATAAA
+GTTGATTTTTCTAAGTTTGCTAGTAATCTTGGGAAATTCCTTGAAGGAATTAATATCGAT
+AAAATTGTATCTAATATTTCATCGGCGATTTCATCTGTCACTTCAAAGGTTAAAGAATTT
+TGGGGCGGTTTCAAACAAACTGGAGCAATTAGTGCTTTTTCAGGAGCTTTAAAAAGTGTT
+TGGGGAGCGTTAAAAAATGTAGCTAGCGCTATGAGTGGAGGCAGTTGGAAAAACTTTGGC
+TCTATTGTAGGCGGAATTGTAAAGCATGTGTCTAATTTTGCAAAAGCTATTGCTGATGTT
+GTCGGTAAAATGGAACCTGGCAGATTGCAAAGCTGGATAGCCACTTTTGCAGCAGTCGGG
+GGAGGGTTAAAGTTATTTGAAAAGCTAACAGGACAAAGCGTTGTTGGCTCTTTTTTAGAT
+AAAATCAGTACAAAATTTGGATTATTTGGCAAAAAAGCTAAAGAAGGAACCGATCAAGCA
+GCGAATGGCTCTCGTAAAAGTGGTGGAATCATCAGCCAAATCTTTAATGGCTTGGGTAAT
+ATCGTTAAGTCTGCTGGTACAGCCATATCAACAGCTGCAAAAGGTATCGGTACAGGGATT
+AAAACCGCCTTGTCTGGGGCACCTCCTATCATTAGTTCTCTAGGAACCGCAATATCAACA
+GTTGCGCAAGGTATAGGCACTGGGCTAGCAATCGCTTTTAGAGGTTTAGGAGCTGCAATC
+GCTATGGTGCCTCCCACCACTTGGCTAGCTTTAGGAACGGCTATTTTAATGGTAGGAGCG
+GCTTTTGCCTTAGCAGGAACTCAGGCTGATGGCATTAGTCAAATTTTAAGGACTATTGGC
+GATGTTGTTGTACAAGTTTTACAACAGGTCACTGATAGTCTAGCCACTTTACTAACTATT
+ATCGCAAACGCTATTGGCTCTATGTTGCCAATTGTAGCTGGAGCTATCTCTCAGATTGTA
+GGCGCAGTAGCGGGCGGATTATCTCAGCTCATTATAGCCGTTTCAACAGGGGTATCTCTC
+GTTATAGGAGCTTTCACAGGACTTCTTGGTGGTATTTCTGGGGTTATTAACTCCATTAGC
+GCTGTTATCCAATCGCTAACTGGTGTGATTACCGCAGTATTCAATGGCATAGCTACTGTT
+ATTTCATCTGTCGGTTCGACTATCAAAGATGTATTGACGGGTCTAGGAACCGCTTTTGAA
+GGATTTGGGAATGGTGTAAAATCAGCTCTAGAAGGTGTTGGGGCAGTAATTGAATCATTT
+GGTAGTGCAGTTAGGAATGTCCTTGACGGTGTTGCAAATATCCTTGATTCTATGGGGACT
+GCGGCACTTAATGCAGGCCGTGGCGTCAAAGAGATGGCTAAAGGTATTAAGATGCTTGTT
+GATTTATCCCTTGGAGATTTGGTTGCTACATTAGCAGCTGTGGCAAGCGGTCTAGGGAAG
+ATGGCTAGCTCAGCTGGCGAAATGACAACATTAGGTTCTGCTATGAGCAAAGTAGCCAAT
+GGTATGACACGTCTAGCAACAAGTGCTACGATAGCAATTACTGGATTAACAGTCTTTGCC
+ACCACCATGGCAACTATTAAGACAGCAGTTGCAACTCTACCGCCAGTCCTAACGATGGCA
+GCGAGTGGGTTTACCACATTTACTACTCAGGCGGTGGCAGCAGTGACTGGATTGGCTGCA
+ATTAATGCTCCAATCACTATGTTTAAAGCTCAACTAATGACAATAACACCAGCTCTAGCA
+CAAGCTGGCGCTGGCTTTGCCGCGTTTGTTGCTCAATCATCAACATTTAGTACAGGTTTA
+GCATCTGCCGGTCCTACAATAGCAGCATTCAATGCTAATTTGATGAGCTTATCTGCAACA
+ACAGGAGTGCTAGTTGCATCAATAGCTGGTTTATCAGCTGTGCTTTCTGTTGTATCAGCT
+GGCTTTAGCCAAATAGGGGCTTCTGCGACAGCAACTGTTGGTCAAATACAAGCTTTTGCT
+TCTAGTACAACAGTTGTTTCGTCAGCATTTGCTAGCATGCAATCTATGATTCAATCTGCC
+ATGGCTGCAATAGTAAGCAGCATTATAACATCATTTAATCAAGCGGCCTCTCAAATGCAA
+TCAATCTTATCTCGAATGCTATCTCAGGCCAGGACATTTGGGTCTCAACTAGAGCAACAA
+ATGAGACAATCGGGACAGCGTTCAGGACAAAATCTTGCTCGGGGGCTATCTTCTCAACAA
+GGTGCTGTTATTAATGCTATTTCTAGCATGGTTAATGCTGCGGTATCAAGAGCCAACGCG
+GGAGCTGGTCCTATGCGTCAAGCTGGAGCGTACATCGGACAAGGGCTTGCGCAAGGAATG
+TATTCAGCGCTAGGAGCTGTAACAGCTGCAGCAAACGCCCTTGTAGCACAAGCCGAGAGA
+GCAGCAAGAGCCAAGGCGATGATTCATTCGCCGTCAAGGTTGTTTGCAAAACGAGTTGGT
+CAATATATCCCGCAAGGGGTAGCTATGGGTATCGACAAAAACGCTGATGTCGTTGACGAC
+TCTGTTGGCGGGTTATTTGATAGCATCAATAGCTTTGATTTTAATATCGCAGATAGACTG
+ACTAGCATTGGAGCTAAATTCCAAGGTGTTGTCAAATCAGAGAGTTCGCAATCGTTATCG
+CAGCAACAAGAGTTTGTACATACAGCTCAACCAGCGTATATAAACTTTAGTTTAGGCGGA
+AACGAATACGAAGCATTTGTAAGTGACATCACTAATCAACAAGCAAAAATTGAAAAAATC
+AGACTAAAGAGAAGCAGCTGGTAGTTGTTTCTCTTAGTTTTTTTGAAAGGAGTAAAATGT
+ACGAATTTAACGATACTATCAGAGGTACTCCGAAAGTTACTTTTAATTTAAAGACAACAA
+TTGGTGGAAAGGTATTAGAAGACGAACTCAATAATGGTTTCGGTACCTTTAGGACATTGA
+CTGTTTCTGGTCGTGATGTGGTGGACTTAGAGCATCAAACAACAAGTGTGTTAGGACGAA
+ACGGAGAGTATTTCCACAATGCCACAGTTGAAGTCAGAAAACTAGAAATAAAAGCTAAAA
+TCAGTGGAAAAGATAACAAGTCAATGCGTTTACAATATGAAAAATTAAACAAATTAATTG
+TTAGTCACAATCAAGTTTTTTTATCATTTTCAGACGAACCTGACAGAAATTATCTAGGCA
+TCTTTAAATCTAAAGATGTCCCAGAAGAAGTTTCTAACGAGCAGATTATAGGACTAACAT
+TCATCTGCTACAATCCGTTTAAAATGTCTGATGTAAAAACTAAAAAAGGAACATCTATCC
+AAAATGGTGGGTTATTTCAAACAAAGCCTATCATCACTCTCAACCTATCATCACCAACAA
+AAGAAATTAAGTTGTTGCATGTCGAAAGCCAGAAGTATATCAGATTGACTGGAACTTATA
+CCACTGACGAAATCAAGATTGATATGGCCACGGGTAAGATTACCCAGAACGGACGCAATA
+TCCTTGGCGATTTAGATATGATTAATAGTAGGTATTTTGAGCTATTACCTGGTAATAATA
+CATTACAGTGTGCCAATGCCGCCATAACCGCAGAGTTTAGAGAGGTTTATCTATGATATA
+CCTGTTTGATAAACTTGAGCGATTGGTCGCTACTGTTGGTACTGATGACTTGCTCTCATG
+GCACTTTAAGGTCAAAAACAATGATTGGGACCAGGCTAGTTTTGAGGTGCCAGTTGATTA
+TGACGTAGAGCCATTTGTCTACTTTGGTTTTTTTAACTACGACCCTCATCAAAAAGAAGA
+TGTCTTTAAGCTCTTTAAAGTCATTGATTACAACCTAGAAGATAGCAAGTTTTACAAAGG
+CTTAGACAAAGCTGAGAGTGATCTTGATACCATTGCCATTATCAAAGATAAGCGATTTAG
+ACAATCGTCCGCAGATGCTTGTATTGATGGTGCTTTAGAGGGTACGGGTTATCAAGTCGG
+CAAAGTTGAGGGAATAACAAATGTTAGAACACTTAGTTATTACTACATCAGTCCACGAGC
+GGCTCTGATTAAGATTGTGGAAGCTTTTAACTGCGAGTTCAATGTCAGGTATACCTTTAT
+TAATAACAAAATCACTAGTCGTTATATCGACCTCAAAAAGCGCTTTGGAAAGCCAACAGG
+CAAGCAATTTGAACATGGCAACAACCTACTAAAAGTCGTCTACGAGGAATCAACAGATGA
+CATTGTGACTTGTCTGATTGGCAGAGGTAAGGGTGAGGAAATCCAACACGAAGAAGCTGA
+GCCTAAAGATGTCGAGGGACACTTGCCACAGGAAGAAAGGCGGCAAGGCTACGGTCGAAG
+AATCGAATTTACTGATGTTGTCTGGTCGGTCGAAAAAGGCGACCCGATAGACAAACCAGC
+TGGTCAAAACTTTGTAGCACTAGATAGTGCAAGGGAAGAATACGGTTTGTCTCAAAATGG
+TGAGCTAAAACACCGCTGGGGTGTCTTTGTCAATGAGGAAATCGAGGATAAGACAGAACT
+CTTAAAAGCAACTTGGGAAGAATTGCAGCGTTTGTCAATCCCTATCAGAATTTACAAGGC
+AGAAATCTTAGACATTGGTCCAGAGACGTGGAAAGGCGACTCAGTAGCCATTATCTATGA
+TGAGGTAAAAATAGCTTTTGAAACTCGGGTTGATGAGATTGATATTGACAAGCTTAATTT
+TAACAGGTCAGTCGTAACACTTGGTGATTACAGCGTTGTCCAAAATCGTGAGTCACGGTC
+TCGTAAAGAGGCTGTCCAAAACATGATAGATGAATCTTTAGAGACTATCACAGACTTAGG
+GATGACATTTCAGGAATTTTTGCAAGGCATCGAAAAACGCATCGAGACTGGCAAAAAGGA
+GATGGAAGACAATTGGCGCAAAGTTAACCTTGAATTTGATAACTTTAAAAAGAAGGTTGA
+GCAAGAAGGCTTGCAATTCAACACCTTGAAAGAACAAATCAAAGAAGTTGATGAACGCAC
+CGATAAAGAGCTTGAAGAGTTCCGAGCCACCCTCAAAAACCTAGCGTTACCGGAAGAAGC
+CATCAAAAAAATCACCGAGGCTATCAAAGTTGATGACATCCCGTCTATTAAACAAAGCTT
+TGATGACCTAAAAAACAAAGTCAGTGAAACGAGCGAGACGTCCCGTCTAAACGCCGAAAT
+TTTAGGTAACAACGGTAAGACCCGCTACAACAAAAATTTGCTGGTTGGCGACCCTAACCG
+CACCAAAACCTATGATGAGGATTACATAGAAGTAGAAGCTAACGACGGTGGTTTTAAGCG
+TGGCGAGACCTACACGATTAGCTTTAGCCAGACTTGTGAGCTACTCAAAAAAGTGGCTGT
+CACGCTGACACAGGCTAACAACAAGGGAGTTAAGTTAGTGCTGACACCTACCAAGGCTAA
+GATGGAAGCACAGACGTTTGAGGTCGCTAAGGATAAACAGTCTATAGAGGTTTATCCTTT
+GAGCTACACGGCTGTTTTAACTGGCGACTGGTATAAATCTAAGCAGATAGATTTAAACGC
+GTCGGAGGTGCAGGAATTGGCCCTGGATATGAGCTATAAAGATGTTGTGGACGGTAAAGG
+AGCAACTATCACAGGGGCATGGTCAGACAGCCCACAAATTATATTAGACGGAGGTAATTA
+ATGGCTGAAAATATACCGCTACGAGTCCAATTTAAGCGGATGAAAGCCGCCGAGTGGGCA
+AGTAGTGATGTCGTCTTACTGGAGGGTGAGATTGGCTTTGAGACTGACACTGGTTTTGCT
+AAGTTTGGCGATGGTCAAAACACTTTTAGTAAGCTTAAGTACCTTACTGGTCCCAAAGGT
+CCTAAAGGAGACACTGGTCTCCAAGGTAAAACTGGAGGAACTGGTTCTCGGGGCCCTGCT
+GGCAAGCCTGGAACGACAGATTATGATCAACTCCAAAATAAACCAGATCTAGGTGCGTTT
+GCACAAAAAGAAGAAACTAATAGTAAAATCACCAAATTAGAATCAAGCAAAGCAGATAAA
+AACGCTGTTTACTTAAAAGCAGAGTCAAATGCAAAGCTAGACGAAAAATTAAATCTCAAA
+GGCGGCGTCATGACAGGACAACTACAGTTTAAACCTAATAGTGGTATTAAACCCTCATCT
+TCCGTAGGAGGAGCGATTAACATTGATATGTCTAAATCGGAAGGTGCTGCTATGGTGATG
+TATACAAATAAAGATACTACTGATGGACCATTGATGATTTTACGCTCTAACAAAGATACG
+TTTGATCAGTCAGTTCAATTTGTCGATTATAAGGGAACAACAAATGCCGTTAATATTGTG
+ATGCGTCAGCCAACCACCCCCAATTTTTCATCGGCACTTAATATAACCAGTGCTAACGAA
+GGCGGTAGTGCGATGCAAATTAGAGGCGTCGAAAAAGCATTGGGAACGCTCAAAATCACA
+CACGAAAACCCAAGCGTTGACAAAGAATACGATAAAAACGCTGCAGCGTTATCCATTGAT
+ATTGTCAAAAAACAGAAAGGCGGAAAAGGTACTGCTGCCCAAGGAATCTACATTAACTCA
+ACATCAGGCACGACAGGGAAGTTGCTTAGGATTAGAAACCTTAATGATGATAAGTTCTAC
+GTCAAGCCTGACGGTGGTTTTTATGCCAAGGAAACTTCGCAGATTGATGGCAACCTGAAA
+CTCAAGGATCCCATAGCGAATGATCATGCGGCAACCAAAGCTTATGTTGATGGTGAAGTC
+GAAAAATTAAAAGCACTCTTAGCGGCTAAGCAAATGTAAAAAGGAGGATAAATGAGTAGA
+GATCCAACGTTGACATTAGACGAGTCAAATCTCGTTATTGGTAAGGATGGACGTGTGCAT
+TATACATTTACTGCTAGTCAAGACAACCAAACAGTTAGACTAGCCAGCAACTGCTTAGGC
+ACAGCGCACTTTAATCAGCTCATGATTGAGCGAGGGGATAAAGCGACTGGCTATGTGGCG
+CCTGTGGTTGTTGAGGGTAGCGGTGAGTTGACAGGTGTGTTTAAAAGTCTTGAGGAGATG
+CTTAGTAGCTTGAGATCTATTAATTTAGAGCTGACAGACACCAAAGACTCTAAGCTTTGG
+TCAAAAATCAAGTTGACTAACCGTGGCATGTTGCAGGAGTACTATGACGGTAAGATCAAG
+ACTGAGATAGTCAACTCCGCACAAGGTGTGGCTACTCGTATCACAGAGGAGACTGGCAAA
+AAGCTAGCACTTATCAATGAGTCTATCAACGGTATAAGGCGAGAGTATCAAAACGCTGAT
+AAAAAGCTATCAGCTAGCTATCAGCTGGGCATAGATGGTCTCAAAGCCACCATGCGTAGT
+GATAAAATCGGCTTACAAGCTGAGATACAAACAACCGCTCAAGGCTTGTATCAAAGGTAT
+GATAACGAGATACGCAAGCTGTCCGCTAAAATAACCACTACCTCGTCAGGCACTACAGAG
+GCCTATGAAAGCAAGCTCGATGGCTTACGAGCTGAGTTTACTCATAGTAATCAAGGTATG
+CGCGTAGAGCTGGAGTCAAAAATCAGTGGGTTGCAATCAACGCAACAAGCAACTGCCAGG
+CAAATCTCACAAGAGATAAGTAACCGCGAAGGTGCTGTCAGTCGTGTACAACAGGGCCTA
+GACAGTTACCAACGACGATTACAGTCCGCAGAGGGTAATTACAATAGTTTGAGAGAGACT
+GTAGCGGGTTATGAGCGCAGGATATCCAATCAGGATAACACTATCTCCTCTAACTTTACA
+CAGCTAAAAAGCTTGATAAATCAGTCTGTGACCTTAGGAAAAATACAGTCCCTCTTGCGG
+CAATCTGGCGACAGTATCATGCTTGCGATTAAAGACAAAATCCCGCAAAGTAAAATGTCT
+GGCAGCGATATTATCTCAGCGATTAACTTGAATTCCCGCGGTGTGCAAATAGCTGGTAAA
+AACATCGCTCTTGATGGCAATACGACGGTTAATGGAGCTTTTGGGGCTAAGTTAGGGGAG
+TTTATCAAGCTAAGAGCCGACCAGATTATCGGTGGGACAATCGATGCAAACAAAATCAAT
+GTGATTAATCTCAAAGCTAGCAGTATTGTTGGTTTAGACGCTAATTTTATCAAGGCAAGA
+ATTAGCTATGCTATCACTGATTTGCTTGAGGGTAAAGTTATTAAGGCTCGTAATGGTGCG
+ATGACAATAGACTTGCAAAGCGGTCAAATCAACCATTACACAAATGAGTCAGCCATGAGA
+CGTATCGATAGCAGTACAGCTAGTCAGTTTATAAAGATGACAAAGTCAGGCTTTATATCT
+GAGATAGGTAACATGCAAGCTGCAATGACGGTTATAGGCTCTAATAGCGATGGGTCAGAA
+AACCATGAAAATAAAACCTTCGGAGGCATAAGAATTTGGAACGGGAAGTCATCTTATCAA
+TCGACAAGTTTTGTTGAATTAGTTGGTAACCGTGTAGCAATCTATGGAAATAAAAATCGT
+AGTCCATGGCTCTTTGACTCAACAACGTCAGGATATGCTTACCTTATCCCTCAAAATGAC
+AGAGGTATAAAGCATGTCATAGGGAGAGCTGATCGTAAGATAGACCAAATCCACGTTGGA
+GATATCTATGTGCAAGGCGAACGTGTAGCCATGATGTTAAAAGATTTAGCACTTAAAATT
+GGCTATATAGGTACAGGTGGTTGGGCTAACCGCATAGGATAAATTAGGAGAAACAATGCA
+AGAAAAATTATTAGGTAAAATTATTAACGATTTAGCACTTAAAGTTGCTAATTTAACGCT
+AGAAAATGCTCAATTAAAAGCACAGCATGAAATCGAATTGGAAGAACTAAACGCACAATT
+GGATGAAGCAACAGCACCGAAGGAAGAAGGTAAATAAACATGAGAAATTGGAAAGTAACA
+GGAAAATATCCACAACTTGATGGCACAGGAGCAGTCGCAAGCACACATATTATTATCGCT
+GCTGAGGATGGAGCTGTTATCCCGCAACTTATTAAGCAAGACTTAACCTCAACTAATGAC
+ACAGAGATTATCAAAGCCGCTTTGGAAGAATTTAAAAAATCTGAATACGTTGAAATTGCA
+ATGGGCGAAGCCGTGCAAAAAGTAGACGACCTTGAAAAAATCTCACAGGAAACCGCTAAG
+ACCGCTAAAACAGCCCAAACAGCCGCAGGATTAGCTAAGGTGTCCGCAGAGCGTACACAG
+CGAATGATTAACTTGCAAACCATCCACGTATTGACAAGTGGTGGGAACGTTGAACCCGAT
+ATCTACAAAGGTATGTTAGAGCTTATTGAGCCTGCTAAACAAGGCGAGTATCAGGCTTAT
+GACGTGTTTACTGTTGTAGATGAGTCGCACGAAGATCAAGCGGTAGAAGGGAACCTTGTC
+TTTGTACATGTCAACGAGCCGTTTACTTATGAGGCGCAAACTCTTAAAGATTTGGAATCA
+GAGGATAAAGTCACAGTTATTAAATATGCGGATTTGGTTAAACAAGATTAGAGGTGGTTA
+GATGATAGATTTTGTACAAATTGGTGCTTTTTGTGGCGCTGCTTTGTCTATCTTGGGTGT
+TTGGGGATTTATCGTCAATCCCTTTAAAAAAGCCATGGAAGCTAATGAGTTTGCCATGGC
+TCAACTCAAGGACTCAATTAAGGAGTTAGCTTATGAGCTTAAAAATCTTGATCGTGAACG
+TGAGATTACCAAAAAAATTATCGACAGACACGAGGAGCGTTTAGGTCGCGTAGAAGACGA
+AGTTATTATCAACAAGGAGCGTATTATTACGCTATTTAAAAAAGGAGAAGAAAAATGAAT
+AACTGGTTTAAAAAAGTAGCAATTAAAACAATTAAAACAATGGCACAAATGGCCGTTGGT
+CTAATCGGGTCAAGCGTGTTAATCACGGATATTAATTGGCCAACAATGTTGTCAGCAGTG
+CTGTTGTCAGGACTAACATGTATCCTGATGAATGTGTCACAAATCAAGGAAGAGGAATAG
+GTCATGCGAGCAATCACACGATTAGCATTAGTTATAGCAATCGCAATACTGTATGTGCCA
+TTATCTGTGGTTGCTTTGATTTTTTATCCATTTTTAGATAAGGAGGGATAAATGGCTACA
+TATCAGGAATATAAAAGTCGTTCAAATGGCAATGCTTACGATATTGATGGATCGCTTGGT
+GCGCAATGTTGGGATGGCTACGCAGACTACTGTAAGTATCTAGGACTGCCATACGCAAAC
+TGTACAAATACAGGATATGCAAAGGATATATGGGAACAACGTCACAAAAATGGTATTTTA
+AACTACTTTGACGAAGTAGAGACTATGCAAGCTGGAGATGTCGCAATTTTTATGGTAGTT
+GCAGGTGTTACACCGTATAGCCATGTGGCTATTTTTGATAGTGATGCAGGTAGTGGATAC
+GGATGGTTTTTAGGTCAAAACCAGGGTGGAGCAAACGGAGCATATAATTTAGTAAAAATA
+CCATATTCAACGACTTATCCTACTGCATTTAGACCAAAAGTTTTTAAAAATGCAGTTACT
+GTTATAGGTAATATAGGACTAAATAAAGGCGATTATTTTATTGATGTATCAGCTTATCAA
+CAAGCAGACTTAACCGCTACTTGTCAGCAAGCTGGCACTACTAAAACGATTATCAAAGTA
+TCCGAGTCACTCGCTTGGCTGTCTGATAGGCATCAGCAACAAGCTAATACTAGTGACCCT
+ATTGGTTATTATCACTTTGGACGATTTGGAGGAGATAGCAACTTAGCGCAACGAGAAGCA
+GATTTATTTCTGTCCAATTTACCAACCAAAAAAGTCTCTTACTTAGTCATTGATTATGAA
+GACTCTGCAAGTGCCGACAAAGAAGCTAACACTAATGCAGTTATTGCGTTTATGGATAAA
+ATTGCAAACGCTGGATATAAGCCTGTTTATTACAGCTATAAACCATTTACGCTTAATAAT
+ATTGATTATCAGCAAATTATCGCTAAGTACCCAAACAGCATTTGGATAGCTGGTTATCCA
+GACTACGAAGTACGAACAGAGCCACTTTGGGAGTTCTTCCCTTCAATGGATGGTGTGCGC
+TGGTGGCAGTTCACAAGTGTAGGAGTAGCAGGTGGTTTAGATAAAAATATTGTATTATTA
+GCAGATGATAGTAGCAAAGTGGATATACCTAAGATTGACAAACCACAAAGCCAGCTTACT
+TTTAATCAAAAGCTAGATACTAACACTAAATTAGACAACTCGAATGTACCTTACTACGAA
+GCAACCCTTAGAACAGACTATTATGTAGAGTCTAAGCCAAACGCAAGTAGCGCTGATAAA
+GAATTTATCAAGGCAGGAACTCGTGTAAGAGTCTATGAAAAAGTGAATGGATGGTCACGT
+ATTAACGCTTCTCAGTCTGACCAGTGGGTCGAAGATAAGTATTTATCTAATGCAACACAA
+GTATAAAATAGGAGGTAAAGCTCCTTTAGATAAGACAAATGCCCTCGCTTTTGCGGGGGC
+TGTTTTTGTTATAAAGATTTTAATTGTTATTTAAGCATTTTCGTTGATTTTTTTCTTTTT
+TGTGCTAAAATATTTTGTGATTTCTTATTATTAAAGAAGAATAGGGTACACTTATAAGTG
+AGAAAAATTGTAAATGTTAATTTTAAAAAGTTTTTAACTTCATCTTTTCTATTGTGGGTA
+TTTATATCAGCTATAATTCCAACGTGTTACGCGTATGAGATGAGTAGTGTGGGAGTTATT
+AATTTAAGGAATTTATACTCTACATATGATCCAACAGAAGTAAAAGGAAAAATAAATGAA
+GGTCCGCCATTTTCAGGTAGTTTGTTCTACAAAAATATTCCTTATGGCAATAGTTCGATT
+GAATTAAAAGTAGAACTTAATAGCGTAGAAAAAGCTAATTTTTTTTCTGGTAAAAGGGTG
+GATATATTTACTTTGGAGTATTCTCCTCCCTGTAACTCTAATATAAAAAAGAATTCATAT
+GGAGGTATTACTTTAAGCGACGGTAATAGAATTGATAAAAAAAATATACCTGTTAATATT
+TTCATAGACGGCGTTCAACAAAAATATAGCTATACAGATATAAGTACAGTGAGTACTGAT
+AAGAAAGAGGTTACGATTCAGGAACTTGATGTGAAATCAAGATATTATCTTCAAAAACAT
+TTTAATATATACGGATTCGGTGATGTTAAAGATTTTGGCCGCTCCTCTAGATTTCAATCT
+GGCTTTGAGGAAGGAAATATTATTTTTCATTTGAATAGTGGAGAGAGAATTTCTTATAAT
+CTTTTTGATACAGGACATGGTGACAGAGAGAGTATGCTAAAAAAATACAGTGATAATAAG
+ACCGCTTATTCTGATCAACTTCATATTGATATATACTTAGTTAAATTTAATAAATAAAAC
+TCTCACTTCTTAAGGAGAAAAAATGAGATATAATTGTCGCTACTCACATATTGATAAGAA
+AATCTACAGCATGATTATATGTTTGTCATTTCTTTTATATTCCAATGTTGTTCAAGCAAA
+TTCTTATAATACAACCAATAGACATAATCTAGAATCGCTTTATAAGCATGATTCTAACTT
+GATTGAAGCCGATAGTATAAAAAATTCTCCAGATATTGTAACAAGCCATATGTTGAAATA
+TAGTGTCAAGGATAAAAATTTGTCAGTTTTTTTTGAGAAAGATTGGATATCACAGGAATT
+CAAAGATAAAGAAGTAGATATTTATGCTCTATCTGCACAAGAGGTTTGTGAATGTCCAGG
+GAAAAGGTATGAAGCGTTTGGTGGAATTACATTAACTAATTCAGAAAAAAAAGAAATTAA
+AGTTCCTGTAAACGTGTGGGATAAAAGTAAACAACAGCCGCCTATGTTTATTACAGTCAA
+TAAACCGAAAGTAACCGCTCAGGAAGTGGATATAAAAGTTAGAAAGTTATTGATTAAGAA
+ATACGATATCTATAATAACCGGGAACAAAAATACTCTAAAGGAACTGTTACCTTAGATTT
+AAATTCAGGTAAAGATATTGTTTTTGATTTGTATTATTTTGGCAATGGAGACTTTAATAG
+CATGCTAAAAATATATTCCAATAACGAGAGAATAGACTCAACTCAATTTCATGTAGATGT
+GTCAATCAGCTAA
+>NC_002737.2|provirus_1186916_1222544
+TTATTTAAAAGAAAGTAAACGCAAGCCATTTAAAATCACTAAAATCGTTGAGCCTTCGTG
+TCCAACAACACCAAGCGGCAAGTTAACTACCTGAAAAACATTGGCTAAAATCAATAAGGT
+AATCACAGATAAGGCAAAAACAATATTTTGTTTGATAATGGTCTTCATTGTGCGGGAAAG
+TTGAATCGAAAATGGAATACGAGTCAAGTCATCCATAATCACACTGTCTGCACTTTCCAT
+TGCAATATCTGTTCCTGATCCAATAGCATAAGAAACATCTGCTTGAGCAAGGGCAGGAGC
+ATCATTAATACCATCTCCTACCATAGCCACAAAACCATATTTAGTCTTTAATTCTGCTAA
+CTTAGCCACCTTATCTTGAGGCATACAGTTGGCTACCACTTCATCAATACCAAGTTTTTG
+TGCCACATAATTGGCGGTTCGTTCTTGGTCACCTGTTAACATGACTGTTTTGATTCCCAT
+GGCATGAAGAGACTTAATAGCACGTTTTGATTCTATTTTGATATCATCCAAGAGGGCATA
+GTAAGCTATCAATTGATGGTCACGTGAAACAAAGATTAGGGTTTTCCCTTGATTTTCTTC
+CACTTGAATAGTTTCTTCAAAAGCTGATAGGTCTTGAACCTTTTCCAAAATGTAGGTTTT
+CTTGCCAATTCGCCATTCTTGCCCTTGATAGAAGCCCTGAAAACCTTTCCCAGAAATTTC
+TTCTAAGTGGTCAAAGGTCAGTGGCTCCAATTTTTCAGTGTATTCAAGAAGGGCTTTAGA
+AATAGGATGGGTACTAGCAGTCTCTGCTCCTTTTACCAGTCTATTCACGAGCAACTCATC
+TTCCAAATAATGAGCATTCACAACAGAAGGTTTTCCTTGGGTGAGCGTTCCCGTTTTATC
+CATGACAACAGCCTTAATATCTCCCATGTTATCGACAATATCCCCTCCTTTGATAATCAA
+TCCCTTTCTGGCTGCACGAGAAATAGCAGCCAAGCTAGCAGGTGTGGAACTGGCAATTAG
+GGCACATGGTGAAGCTACTGTTAAGAGAATCATCCCTCGGTAAAAAGCAGCCAACCAAGT
+CCAAGAAAGCACAAAGTGGCTAAAGAGGATAAAGGCAGGAATAAGGACGAGCACAAATTT
+GACATAACCATCTTCTAAGCTTTCGATAAAGGTGGCGGTTTTGCTTTTCTTTTCTTGGGC
+AGATTCCACCAGATTAATAATCTTGGCAAAGAGAGTATCGTCATTTTCAATAGTAACCAA
+CATATCTATGGTTTGTCCTTGGTTAATGGTTCCCCCAATCAGATCCTGGCCTTCTGCCTT
+ATCAACAGTGATAGGCTCACCAGTGACCATAGATTCATCAAATTGACCAAAAGGACTAAG
+CAACTGCCCGTCAATTGGAACAGCTTCGCCTTTACGAACTTGTAAACGGTCACCAACACT
+CAAGGATCTGGTCTCAACTTCTAAAATATGGCCATCTTCTTGGTATTGACGAGCTGTATC
+TGGCGTCAAGGACATCAAGGCTGAAATAGCATCCTTACTTTTTTCCATGGCCATTTCTTC
+AAGCGTATTGGACAACGAAAAGATAAAAATAAGCAGAGCACCCTCCAGCCAATAGCCGAT
+AATTCCAGCACCGATAGCTGCCAAAATCATCAAAATATCCACTGACAAGTGTTTGTTCTT
+CACCAAATCCAATATACCCGTTTTTGCAGACGCATATCCTCCAATCAAGAAGGCTGTAAT
+GAAAATAGCGGAAGCCACTTGTGGAAATGAGTGTAAAAAGGCTAGGCCAATTATTATTAA
+TACCAAACACGCTAAAGTCTCCATCAAATGAAGATGGTCTGCCATCCATTGTCTGATTGT
+CATTTTTAGTTCCCTCGCAATTAAAAGTTATTCAATCTTTAAGATATATTAATTATAATA
+ATTCTAAATAAATAAGTCAAGTAATTTAGAAACATTCTAAATAAACTTTTTTAAACTTAC
+CTTTTGCTTTCAAAAATCCTAACTTCAACTATTTGCAAATATGAAAAAAACTCCCCCTAC
+CTGCGGAAATGATATACTAATAGAAGGATGACTGACCATTATAGAGTGCATGCTTTAGAA
+CTTGGCTTAACTGAAGAGAAAACTACTAACTTTATGCCCCAAATATAAAAAAAGAACCTT
+GTCGCTATCAATAAACATCGATAGCAACAAGATTTTTCTAGACGAATTATTTAACAGCGT
+CTTTTAAAGATTACTTAATATTGTGCACATATAATATAATAAACTTTGATTTTATAAAGC
+TACAAAATAACGAAACTTTATATAATTGCTTCGAATCAACTATGTAAGTTTTAAACTTAT
+GCCCCCTATTTACCCCTTTAATAAAACTACTTCTCAGGGGGCAAAGAAAATACTTATCTC
+GAAAGCTCCACCAGCACCTCTTCCACTTTTTCCTTAGTCACAACTTCTCCATTCTTTACT
+TTCTCATGTGGCAACACATAATCAAAAATCTGTCCGTCTTTACGCACGATCGCTACTGTA
+TCGCCTGCGATATATCCATTGTCAATCGCTTGCTTAAACTCGTCGTATGTTAGCATTTTT
+ACCCTCCTACTTATTTATTCGTATTTTACAGGAAATAATATAATTAAATTTAAAGGTCGT
+TTAAATTTAATTAACATCTTTTTTGTTACAAACTAAAATATTGATTGTTAGCGAATATTA
+AATAAAAAGAAATTTTAGCGTAATATTATTGATAAATTAATTTTATTAATTTTAAGTTTT
+TTTAATTTAAAGTGATATAATTAACCTGTAAATAATAAAAGGAGGACATGGATATGTCTA
+AATCAAATCGTCGTACTTGGCAAGGTTTAGTTGTTATTTTAATAGCTATTCTCACCACTT
+TTACCACAAGTACTGTTACGGCAGCCAGAAAAATTAGAAATTTCCCTGATACCACGGAAA
+TTTTGTTAGGAACGAAGGCGACTGAGACACCAGGAATCTTACCATTCACTGGTAGCTACC
+AATTAGTTTTGGGCGATCTTGACAATCTGCAAAGGCCAACCTTCGCACACATCCAGCTAA
+AAGATCAAGATGAGCCTAATATTAAACGAAAAGGACTTAAATTCAATCCTCCTGGCTGGC
+ATAATTACAAATTGACTGACGCTAATGGAAAAACAACTTGGTTAATGGACCGTGGCCATT
+TAGTTGGTTACCAATTTAGCGGCTTAAATGACGAGCCTAAAAACCTAGTTACAATGACAA
+AATATCTTAATACTGGCTTTAGTGACAAAAATCCTTTAGGAATGCTCTATTATGAAAATA
+GATTAGATAGCTGGTTAGCTCTACACCCTAACTTCTGGCTAGACTATAAAGTTACTCCTG
+TTTATCATAAAAATGAGTTAGTTCCTCGCCAAGTAGTTCTACAGTATGTTGGAATTGATG
+AAAATGGAGATCTACTTCAAATTAAGTTAGGTAGTGAAAAAGAAAGTGTAGACAACTTTG
+GAGTAACATCAGTTACATTAGATAACGTATCTCCTTTAGCTGAATTGGATTACCAAACAG
+GAATGATGCTAGATTCAACTCAAAACGAAGAAGATAGTAATTTAGAAACCGAAGAGTTTG
+AAGAAGCGGCTTAACATAAACTTATACTTAATAAAAATATCTAGATTGTGAACATTATCC
+CAAATGTTAGATTATTTATTTAATATTTGGGGTAATTTGTATAAAGTTAAATTTTGAAGA
+AAAATTAGTATAGGCTACTATCTGTGCTATTTTTTAAAAAAACAACGTCTATTTAGAAAG
+TCCCTTAAATAGGACTTTGAGAAATTAGTCTGTTTTAACGGCCTTTGTTGAGGATGATTG
+AATCGAGTAATATGTATAGTAGATTGAAAAAAAAGGGTGATTTTATGAAAAGGTCCAAAA
+AAGCATCGTTACTTAGTGTTATTGTTGGAATGGCTTTAGCTGTGATACCAATTTATATTG
+TTAATTATGACAATGAACTTATCGTTCTTTTAATGAGTATTTTTTTTAATGGGATAATTG
+TTTCCGCTTTTGAACTTATTAAAACATATGATGGTTTGCAGGAAGAATATAAAAAGCTAA
+CTGTAGATAGATGGAAGAATACTATTTTACTGGCTTTCAATTCATTATATTTTGCTTCTA
+TTTTGACAAATAGTCTATCAAATAATTTATCGACCATTTTATCAACTAATCGTTCTGACA
+AAGTAAGTGCAATATTTCTTACAGGTTGTTCTATTTTAGCACTACTTCCATTCCTCCTTC
+ATAGGTTAATAAAACGAGAAATAGAAATTGAAAATGAAAGAAAAAAATTAAAAAAATAAT
+TACTTAAACACAAAAAACCGCCCTCGATTAAGAGAGCGGTTTTGTCTTATCTAAAGGAGC
+TTTATCTCCTAATTTAATTTGCCCCAAAGGCTGATAATGTTACCGTCTTTGTCAGTTATC
+CCAATAGCCGTGTAGTTTCGCATACCCGAGCCGCCAACGTAGCTAATCCAGTAGTAACCA
+TTGGCGTAACCCTCACTATCAAAGCTGATAGTATCACCTTGTTTATAGCTACCTACTACC
+TCGCTAGTTAAACTTGGCCAACGTCTGATATTGATTTCTGCGACATCAAGCGTAAAAGTA
+CCTGTTTTTGCTGTCTCTACGATAGTGTCAGACGTTTGTGGCTCGGTGCTGACTGGTTGC
+GTGACAATATCTCCTTGGTAAGGAGGGTAAAACCATCCTGTCACGCCGGTAAAATCACGA
+GTATTAAAACGAGCTGGTGCACCGACATACAAAGCATCAGGATTGCCATCAATGTTTTGC
+TCGATAGTTCGCATGGTATAACCGTCGCTATCCTCAATGACAACTCCTGTGTGACCAAAT
+TGATGATATGGCACTGATTGGACAAAAAATGCTCCAGTCTGTGGATTTGCATCTGTCGGC
+ATGCGGTGGACTTCCCAACCTACGGCAGCAGCGCTATCTAGTAAGTCAATCGCATTTCCC
+CAAAGATCAACACCAAACCAGTGCTTTGCTGCATAACAAGGCACATCTGTGCATTGCCAG
+CCCGCAAAACCATCTTTATCCACGCCAACCCCAGCATTTACCAAGTTAATAAAAAATTCA
+ATGACTTCTCGACATTGAGAACTAATCATTTGCTTCTCCTTTCTGACAATAGCCTCTTCA
+TCCCATTCCTGAAGGTCATTTTCCTCGATTAGTTGGATAAGCAACTCTGCATAACCGCTA
+GCTGTGGCATAACCTGCATCTTTTATAGCGTGACAAGCTTTTTTGTAATCAGTCTCACCA
+ATCACAGCCTGATACCGTGGATTATCGTTTAAAAATTTACCGTGATCAATAATGCTGTCA
+GTCCAACTATCATACGCCCTAAATCGGTCCACAATATCCGTGACAACACCTGCTTGATAT
+TCCTCTTGGGTTTTGGTATCAAATGATTTACCAGTCCAAGAGCTATCTGCCTTAATACCA
+AACAGAGCGTTGTGTGGGGCATGTTTGCCCCACCCGCTTTCTAAGATTGTCTGCGCTGCG
+GTCAAGGATGGCAAGATTTTGTACGTTGTCCAGCCATCTAAACAGCCTTGTTTAATTTTA
+TCTAAAAAGGTCATCTGTCCTCCTTATCTAAAAATGGATAAAAGATCAGAGCAACAACAG
+ATATCGGCACATACAGTATTGCGATTGCTATAACTAATGCTAATCGTGTGATTGCTCGCA
+TGGCTCCTCCTATTGTTTTGGTTCGTGGTAAGTCAATGCTTGCTCACTGTCTGACAGGCC
+TTTTGTGGTTGGATCTGTGACAACACCGAGCAATACCAAAAGCGTTACAGCTGTGTTGGC
+AATATCCGCGATGTTTGATGGTAGTTTAATACCTAATTGTTGCGCTAACAAAAAGATAGC
+TCCCAAAATAGCCATCAAGGTTACTTTGTTTTGTAGTCGTAATTTTAAATTGATCATTTG
+ATTTCTCCTCTCATCATATCTTTTAAATCTTTAACATCATCTGTTAAATTTTTAATTTGC
+TCTGTCATTGTAATCAACGTTTTATTTTGCTCAGCGTGCTCTTCAAGCCGCCGAGCATTT
+TGGCGTGTAACAATTTTTAAATGCTCTACCTCAGATTGCAACAAAGTAATATCTGTCGCA
+TGCTTGATGGATTTTGCATTAAAAATATTGTAAGTCGTGACGATAGCTAAAATAAAGCCA
+CCGACGCCAAATATCAACTCTGTTGCCATAAACCACCTCTAATCTTGTTTAACCAAATCA
+GCGTACTTGATAACTGTTACTTTGGCTTCTGACTCTAGCTCCTCTAAGGTTTGTTTGTCA
+TACTCAAATGCTTCATTAACGTGTACAAAGACTAGGTTCCCTTCGCCTGCTTCACCGTCT
+TCCTCTTTAGTACTGTCGACCACCGTAAAGACATCATAGGCTTGATACTCACCTTTTTTG
+GCTGGCTCGATTAGCTCAAGCATGCCTTTATAAATGTCAGGATCAATCTTGCCGCCGCTC
+GTTAACATGTGGATGGTTTGCAAGTTAATCATTCGCTGTGTACGCTCTGCGGACACCTTA
+GCTAGTCCAGCAGCTGTTTGAGCAGTTTTGGCAGTCTTAGCGGTTTCCTGTGAGATTTTT
+TCAAGGTCGTCTACCTTTTGCACGGCTTCGCCCATTGCAATTTCAACGTATTCAGATTTT
+TTAAATTCTTCCAAAGTAGCTTTGATAATCTCTGTGTCATTATTTGAGGTTAAGTCCTGC
+TTGATTGGTTGAGAGATGACTGAGCCATCCTCAGCAGTGATAATAATATGTGTGCTTGCG
+ACTGCTCCTGTGCTGTCAAATTGTGGGTATTTTCCTGTCACTTTCCAATTTCTCATGGTT
+ATTCTCCTTTTTTACTTTCTTCAAATTGTTCCAAAATGTTGTCGATAAGAATGATTTCAG
+ATGATGTAAATTCATCTTCACACTCTTCTAAAAAGTTTAAAAAGTCAATAAATCGCTTGG
+AGTACTCACCCCCTTTAATCACAATTTCTTCATCAGCTAGCTCGTTGAGTAGGCCGTTGA
+ACTCGTCGAGTTTAGCGGGGTCTGCTAGCTTGATGTTTTTGTGCTCATCAATGACAAACT
+TGCCATCTTTGTCTTTTTGAGCATACAGATCAATAAGGTCACCCTCATCCTTGGCGTACT
+CTTTGAATTTATCTACTACTTTTGCGAGTAGCTTAGCACGTCCGCGGTTTGCTCGCATGT
+TCGTGACTTTGATTTTGTCTAGTACACGATATAGTGTGTTTAAATCTTTGTTTTTAATAG
+TTAATTGCATATTATCTCCTGTTAAATTTTAGTGATGTAGTTATTCAATTCCCTACTCAC
+AGCACTTGTAAAATTGCTATGAGCAGTATTCCAGCCGACGTTAGCCAAGTGCCCCCAACA
+GCGGCCTAAGGCTACTACAGCCGCATACAAGTCGTTCATGTCGAGCACTTTTTCCATTTT
+GTCTGGTCTAAATTTAAATCCTCGATTGATGTTAAAGTCATCTGCAATCAAGACATTATC
+ACCGTATAGCTCGGTTTGGTCGACTGCAGCAGTATGGTTATATCCCGTAGCGTACCTAAA
+TGACCTTAGCCCTGCAAAACGACCGGAAGAAGCGCTGTCGATGCCATCTCCTGATGAGGT
+AATGCCGATAGAGGCATATAACGCTGAGCCTCTATAGCCTTTTGGTGTGGCATTACTAAA
+ATGTACAAAAGCAGTATGTGTGCCATCTTTACGTACTAAGGCATTGTTTTTGCTATTAAA
+ATTAATTGTGGCATCTCGATTAAAGGTCATATTGGCATTATTTAGGTCCCACTGACTTGC
+CCCATTTGTAGCGGCTAATACACCTCCAGTAATTTTGCTAGCTGATAGTGTTACAGATTG
+GACTGATGTTGCAAAGATGTCTTTGGCAAACAACGTCCTAAAATATCCCTCGTTAGCAGT
+GAGTTTATTAAAAAAGGCATAGTCCATCTTAATTTTCTCACCAGTAATGGCCTCGGTTGC
+AATCCTATTAGCATTAAGATAACCAGTATTAATCTTACCGGCATCCATGTTAGCAATATG
+AGCATCTTTGATGACAGCGTTGCTGATGTAGCTGTTACCATCAAGAGTGATATTTTTTCC
+AGTGATTTTAACCCCAGACCTATCAAGATTGATTGCCGAGATAATCTCACTGCCAGACAT
+TTTGCTTGCTGGGAGTTTATCCCTGATTGCGAAGGCTATCTTGTCGTAACTCTGAGCAAT
+AGTTGTCTCAACATCACCTTTTGATACCTTTGTGCTGATCAGGTCACTTAACTGATTAAT
+CCGACTTGTAGCATTTGATTGATTATCACGTACAGTTGTTTGTAGTCCCTGTACAGTCTG
+AGACAAACTGCTGTAATTTTGGTTTGCATTTGTGATTTGTGACTGCAATCCTTGTGCTGT
+CTGAGACAATCGAGAAACATCATTAGCTGCATTACTAACTCGTAAATCAATGCCACTTAC
+CTTTTGAGATAGCGTTGAGTAGTTACCAACACCATCATCAAGACGACTGCTAAGACTATC
+AATTGTTTGGCTCAAACGACTGTATTTGCCATCAAGTCCACTAATACGACTATCAAACAT
+TGATGCTAGCTGAGTACGTGCGGATTCAACTGACTCACTTTTGACAGTTTGTTTGATACC
+ATTCAGAGTTTGCTCAAATTTGGAATATCGTTCATCATCAATAGACTTGACTTGTAACAA
+TATCTGCTCAGCTGATTGCGCAATGGCACTTGACATCTCTTTGTTGGCGTACTCGACTAG
+CATTGCCTTATTATTGAACTTGATTTTGCCCCACAAATCTGACTTAGGGTCTTTTAGCTG
+TAAATCAAGCTCTTTGACCTGCTGAGCTAGTCCAAAAGCTTGTTGAGTGGTAACTTTAGG
+CTTTACAAAGTCGTGCATTGTATTGTCATCCTCGACCTGTAGCTTTTTGATTATGGTATT
+GCCAAGGCAACTACTGTTAAGTCTCACAGTCTCACTTGACTTATCTGCCTTAAAGGTCAC
+ATAAAAACGACCATCTGCAAAAGATAAGTCGTGCTCGTTTATTGTATATGTTGGGTCTCT
+GCTCATTTATCCTCCTTAATCTATTTTTTTAGTATGAGTTTTTTTAACTCAGCAATTTTT
+TCATCTACGTAATCTTTAGTCGCAGCATGTTTTCCAGATGTTGGATCTTTAACTGTTAGA
+TTACCATCCACAATTGAACTTGCACATGACCAAAAGTCACCATCTGGACCTACATAAAAT
+TTGTCTTTATTTTTATTTCTGATTCTGAGCATTTTACCAGCTGTGCCTGATGTTGAGTTA
+ATGTAGATTCCTTGAGCAGCAGTACCTTTTCCGCCTTTCTGTTTTTTAACGATATCAATA
+GATAACGCTGCAGCGTTTTCATCGTATTCTTTGTCAACGCTTGGGTTTTCGTGTGTGATT
+TTGAGCGTTCCCAATGCTTTTTCGACGCCTCTAATTTGCATCGCACTACCGCCTTCGTTA
+GCACTGGTTATATTAAGTGCCGATGAAAAATTGGGGGTGGTTGGCTGACGCATCACAATA
+TTAACGGCATTTGTTGTTCCCTTATAATCGACAAATTGAACTGACTGATCAAACGTATCT
+TTGTTAGAGCGTAAAATCATCAATGGTCCATCAGTAGTATCTTTATTTGTATACATCACC
+ATAGCAGCACCTTCCGATTTAGACATATCAATGTTAATCGCTCCTCCTACGGAAGATGAG
+GGTTTAATACCACTATTAGGTTTAAACTGTAGTTGTCCTGTCATGACGCCGCCTTTGAGA
+TTTAATTTTTCGTCTAGCTTTGCATTTGACTCTGCTTTTAAGTAAACAGCGTTTTTATCT
+GCTTTGCTTGATTCTAATTTGGTGATTTTACTATTAGTTTCTTCTTTTTGTGCAAACGCA
+CCTAGATCTGGTTTATTTTGGAGTTGATCATAATCTGTCGTTCCAGGCTTGCCAGCAGGG
+CCCCGAGAACCAGTTCCTCCAGTTTTACCTTGGAGACCAGTGTCTCCTTTAGGACCTTTG
+GGACCAGTAAGGTACTTAAGCTTACTAAAAGTGTTTTGACCATCGCCAAACTTAGCAAAA
+CCAGTGTCAGTCTCAAAGCCAATCTCACCCTCCAGTAAGACGACATCACTACTTGCCCAC
+TCGGCGGCTTTCATCCGCTTAAATTGGACTCGTAGCGGTATATTTTCAGCCATTAATTAC
+CTCCGTCTAATATAATTTGTGGGCTGTCTGACCACTGCCCTGTGATTGTGGCATTATTAC
+CGTCAACAACATCTTTATAATCCATCTCCAGAGCCAATTCCTGCACCTCCGACGCGTTTA
+AATCTATCTGCTTAGATTTATACCAGTCGCTGGTTACAAGCACTGTGTAGCTAAACGGAT
+AGACATTGATAGTCTCAGTATCCTTAGTCAAGCCAAAACTCTCGACAACTAATTTGGGAT
+TTTTAGGTGTTAACACTAAGCGAGCACCTTTCATGTTAGCCTGTGTCACTGTGATTCCTA
+CTTTACGCAGTAGCTCACAGGTTGCCTCAAAGCTGATAGTGTATGTCTTGCCTTCTTCAA
+AACCTTCACCATTATGGGCAATGTCAATATAACCTTGTTCAAAAGTGATAACTTTGTCAG
+TATCACCATCCAGTCTGTTGCGATTGTAAAACGTGCCGCCAGTTGATCCAACAATGTTAG
+CTGTAACTGTGGCAGTTTCAGACGTGTCTTCCAGTTTAGCTTTAATGTCAGCTAAGCTAT
+CCTTGCTAAAACCGGCTTTGGCCAAAGCATCATCAATCTGCTTTTCATCAACTTCAAGGT
+CTTTAAGAGACGTTCTAAATTCTTCAAGTTTTTTATCAAAATCTTGCTCTTTAGTGTCAG
+CATCAGATAAAAATTTTTTGAGTCGCTCATCGACTGCCTTGGCTAGCTCCTCAGCTTCCA
+GCACTTTAGCGTTAACCTCAGCAACTTTGACCTCTGCATTAGCTTCAGCTTTTTTGATGC
+CATCTTCAATCTCTTCACGGAGTTTAGCTTCTTTTGTGTCAAAAATACGATTAGCATTAT
+CAATCTGCTTTTGTAATTTTGCTTCAAATGCTGCGTCATGTTGAGCAGTTGATTCAGCTA
+CCTTATTGTCAATTTGATTGCTAATTTGTTTTGCTAAGTTGGTCTTAATCTCTCCAAAGA
+TGATGGATTTTAACCGATTAGCCATAGGGGCGAACCGATAGCCAGTGATTTGCATTCGTA
+AGTCTCTGTCATAGAGCTCGTGGAAGACAATTGCTGTGTCAAATAGCCTAACAGCGCCCT
+CGTAGTTATTAGTAACATCAATTTTTAAACTATTACCTGGTATGTCGCAAAGAGTTTTTT
+CAAAGTATTTCTTACCATATGCAAGCAAGTCCTCTTCTGTTTTGACATCTTGATCCTGCA
+CCTTGATAGTCTTTTCAACAATTATCGGATGAGTGTCTTTGAGCTTGCTCTCAACAGATA
+CCCTAATTGTTTTCTTTTTCGGTGATTCACTATGACCAATGTTTCCATCTGAAGCTTCTC
+TGGTTTCTACTTCATGTTCTTCTTCTACTTCAGCAACTAAATGAAGGATAGAGACAAGCC
+CTTTGATAGTATCTGTTTCCTCATAAGATTTGAGGTTTTTCTTGTACATGAACAAGGTTT
+CGGTATCTTTGCCAGCTTTTTTGAGCAAGTTAATTTGGTATTTATTTCGTACAAGTTCGC
+CACCCCACTGCCCCATGATTGAGTGCTTGCCATTAGCTAAAGCGTCCATAACAGATACGT
+CTGATTGATTAAATGTGTGACGACCGTCAATATCACTAAAAAAGCTAAAAGGATGCTCAC
+GCTTGATACTACCTGCTAACTCTGACATTACTGTCATGCCTTGCACCCTATCAACACTGA
+TAGTGTCAATTGCATAGCCATTTAAGTCATCAGCGACCTGATTAGCGTAAACGTTAATAT
+AGCCATGCCGCTTAGTAATTTCAAAAATCCTAAAAAGCTGAGAACCATGCAGATCATCAG
+CTTCTAAGATTATTCCTTTTTTTATTAAAGGGCGATACTCGTGTTTAGCAGGATACTTAA
+AATTTAGTTTGTAATCACTATTGGCCTCCTGTGTAATCTCATCTTCAAAGGCTGCTACAA
+GAGGGGTATTATCATCTTTAATCGATATCAAACCTTATACCTCCACCTTGGACTAATTAT
+TGTTCTAGTAATGCCTCCACTGACGGCAATACCTTGTGTGCCAGGTTGTATTTCAAAAAA
+ACTTCCTCTTATTCGGATTGAGTTTTTCACATTACCTTCAGCATCATAGACGCATTGTTG
+GCCATGTTTGCACTCAATCGTTGCTTTACCTGACAAATTTAATTCCATGACCTGTTTGCC
+AATGGTTAGCGTTCCTTTACCAGTACCCTCAACAACTATCTTAGGTTCGCTGAAAACATT
+TCCTGCATTGTTAATGTTTCCGTTGCCTGCAATTACTACATCTGAGACACCTTTTGCGTA
+TCTAAATGGATAAAGAGCAAGTTTGAGAGTCACACGCCATGATGACATGGTTACCGCATT
+GATTTTGACAGATAAGCAATCATAGTAATAAATAGAGTTAGGTATGTGCCAAAATTCGAT
+TTTTTTACTAAGGCCGTCTAAATGATTAATTAGATTAACTGCATCATCAAAAGTACTCAA
+ATGCCACATTATGGTTGGTTTAGATTCATTATATGACTCCAATTCCCTACTAGTTCCATT
+CATGCCATAAGCTTCATTTTCGACAAAACTAGGGGATAGAATATCCCCCACATCGTAACC
+GGTCAAAACACAATTAGGGATTGAAGATGTGTCAAAATCATCAATAATAACTTTAGGTAT
+CATACAATCCCCTCTCTAGCCATAATTTTGGCAAATTCTTCGTATAAAATAGCGCTGACT
+TTTTCTTTGTCTAGATAGACATCCGTATTTTTATCAAGGATATCTTGCAACAGAGCAAGC
+ACCTTAACAAAGAATAATGACAAGTCACTTGTAGCAGAACCGACTGTAGTTTTAGTACTA
+ATATTGCTTGATAGTAAGTCATCAGCTGTGACGCTTGGTTTAGCATCGATACCGAGAGAT
+AGACTTTTACCTGTCATGGTGCTTGCAAGGTCGTCAGCCATGCCAGAGACATTTGATTTA
+ACCTCTTTAAAGCCGTCAATCAAGCTTGTATTAAGTCCACCCATAATTGCTTTACCAGCA
+GGTTTTAGTAGAACTCTATCATAAGAGATAGGTCCTTTATGTTCTGCAATCCAGTTGGCG
+ATACCGCTCACAAAACTTTTGACGGCTCCCCAAGCTGATTTCAAACCGTTTAAGAAACCA
+TTCATAATTGCGGCACCAGCTCCAGAAATATCAATGTTTGCCAAACCTCTAATTGTGCTT
+GAGATTGAATCGATAACTCCATTTACTGCTGAACCAACACTAGACACTAAGCTACTAAAA
+CTACTGAAGGCTGATTTTATGCCATTTATAACAGAGCTTATGATACCCTTAGCCACATTT
+ATTGCGTCTCCCATTGCCATCCAAGCAAGTGAGAAAATGTTTTTTAGGACGCCAACTGCA
+GAACCGGCACCACTGAACGCTAATTTTATGTAGTCAATAACCGTAGATATGATTGTTCCA
+GCAGTTGAAATTGCAGTCTGAATGTTAGTCCAAGCGCTCTTAATAAAAGCGCTCAAGCCT
+TGGCCGGCTGTGCCTAAATTACCAAACATACCGATAGCAACTCCAATCCATTCTGCAATG
+ACACTGAGAACAGGTTGTACAAAATTAAGACCTTGAACCAGCAAGTCAATAATTGGTGTG
+ACTAGTTGTATAGCCACTTTAACTGCATCAAAGGCAAAGCTAACTCCCATAAGCGCACCT
+TTTACAACACCACCTAAGAAAGACCCTAAAATTTGAAATACTGGCATCAAGGCATCACTT
+AGTATCGAAATTAAAGGTTGTGCTGCATTCCACATGCCAACAAACGAGTCAACAACTCCT
+GAGATAGCTGGTCCAACAATCGCAGCGAAGTTAGAAAAACCTGCCTGTAGGGCTGGTAAA
+ATTGCTGAAATTAAAGCCTCAAAACCACTGAAATCTAATCTGGCTAATCCGCTAATAATA
+GTGTCTATTACTGGTGCAACTGCACTACCAATGCTAGTAAAAAATGATGGCAACTGACTA
+AAAGCCGTTTTTAAACCGTTAAAAACAGGTTGTAAATTTTGGCCAATCTGTGCAAATTTA
+GCAGTAATAGGACTTAAATCAATACTAATTCCAAGGCTACTCATTAGACCTTGGAATTGA
+CTTGTGATAATAGGAGCTGCGGCTCCAATAAAAGTACCAATTGCCGATGGTAATCCTTTA
+AAGATATTTGCCACCATCGGAATAAAGTTACCAAATAAGAAATTAGAAGTTGTCTCAGCC
+AGTCCTCGTAAAGCCGGTCTGATATCATCTCCTAGTGATAAACCTGCCATTACATTTGTA
+AAAGAGGACTTCATAGCAGCTAGTGAGCCTGAAAATGTAGTTTTTGCTTCTTCAGCAGCA
+ACTCCAGCGATACCCATGTTATCCTGTACCAAGTGTATAGCCTCAACCACATCAGCATAA
+TTACTCAAATCAAACTTCTTGCCCATAGCGGCAGGTAACTTTTCAGCGTCTGATAAAAGA
+CGCTTCATCTCTTCTTTTGTGCCGCCGTACCCAAGTCTTAGGTTATCAAGCATTGTATAG
+TTTTGCTTAGCAAATCCCTGGTAAGCCATTTGGATTGATGTGATATCAGTACCCATCTTA
+GCCGAGTTGTCGGCCATATCCATGATTGCCATGTTAGCAGCCTTGGCAGCCGCGACAGCA
+TCACCTCCAAGTGATTGCTTTAGAGATGCACCCATTGAAACTGCTTGCTCTGCATAAGTA
+TTTGCTGATATTCCAGCTTTGTATGCCTCTTTAGCAAACCCTTTGACAGCAGTCTCAGCG
+CCCTTATACAATGTGTCAATACCACCAAAAGATTGCTGCAAATCAGCACCAGCGGACAAG
+GCAGACGAAATCATCTTACCGATTCCAGCAGCTGCAATGGCACCACCAATCATTTTAACG
+AGATTACCACCAATGAGCGAACCAGCGCTCAATCCAGCCGACCTTGCTTCGGGATCAAGT
+TGCTTCGAGATTGCTCCACTTATTCCACGAGCGGATGGCATAATTTGCACATACGCTTGA
+CCAAGTTCTGTTGCCATTAGCCATCACCTCCTAGTAATTGTTTACGTGCATTTTCAAAAT
+CCTCGCCAGACACAAAAGAAATGACATCATTAGCTTTTTGTGATTTAGATCCAGATATAG
+CTTCCACCACGGATTTAGGTTTGTTTTGACCAGATTGACCATCCTTAGTTTTAGACCAAA
+ACAGCAAATTAGTATTATCATAAATACCAGCTAACAAAACAGTATCCAAAGCCTCAGTCT
+CTCCAGATAATGCCATTTTTATCCTAGAGTTAGATCTCAAACCGACAGCAAAAACAGCCA
+CCTGATAAGCAGGTAGCTGTCTGTAATCATATATGCCGTATGTTTCAGCTAAATCACAAG
+TCAATGCATCATCATCTTTTGCTATCATCTGAGCGAGGATTGCTAGTTTTTTAAATCTTT
+TTGACTTTCAAAAATTTCTTTGATTTCTACTCCGATAGCTTCAACGTCTACGATACCTTC
+TGCATCTCGTACATGTTCTTTTAGAGACTTAGCAGCATCACCAAGTAACAAATTAACGAT
+TTTAACTACCGCTGTTGGATCAGTTTCCTCTTCTGCAATAGCTTCAACAAGTTCAAAGTT
+TTTTAATCGTTTTTTAGGAATTTCGTATTCAAATCCTGATGTTGTTTTTCCTTTTAAGAT
+TTCCATTTACTCCCCTTTACATTTCAAAGCTGTTTTCTTTTTTATTAGCTTCTCCAGGTT
+TTACAATATACTCACGGTGTGTATCACCATCCTTGTCCGGGAAACATTTTAGTGTTGTTT
+CATAACCAACGACTTCGCCGTCAACATACTTAATTTCACCTACCTCATCGACTTTTGCAT
+TTGGTAAGACAATTCGTTTAAGAATGCCGCCATTCATGATCATGTCAACAACAATTACGT
+GAGCTTCTAACTCTTTTGAATTTGATTTAATCTGGATTCCCCCACTTAAATCTCCAGTAA
+CATTGACAGCGCCATAAACTTCTTTTAAGACTTCTACATTTAGTGACTCAATCAGCTTAT
+AAGTAAATTTATCCTCTTTTTCTGTCTGTACAGCCCCGACAATATCTCCACCCCACGCTT
+TAATATTTTCGGATGAACGTGTATCTTCATTGACCACACCATCCTCGGATACATAACCCA
+AATTCTTAAATTTAGTATTTAATTCTGATTTTGCATCCTTGGGCAATTCAGTACCAAGCG
+GTGCCGAATAAATCGCCCCACCGGTCTTGGGCTTTGCAGATGTTACATTTTTAGTATCAT
+TCTTATTCATCAATATCTCCTTTAATAATGATTAATATCAAATACAGCTTGATAACGATA
+GCGCTTAGTTGCTGTATCTGTAAAATTGTAGTCAGCGTTAAGATGTACACCAGAAACTTG
+TGGCAAGACATCAAGCTGCTCAATTACTTGCTTTACTTTGTCATTAAGTAAAGCCGCCTC
+ATACAACGATTCGGCATAACTTTGAAAAGCAAACGTGGAACTTAGCAAATGATTTTGCTT
+AGCCCCACTAGTCTTTTCTAAGATGATGAATCGTGCAGGTTCATCTTTTTGATGTTCAAA
+AAAAGACGGCACATCTAAGTGCTCGTCTAAATATTTTTTGATAATTACTTCAATCAATCA
+TCGCACCGCCTTCAACAGTGTGTTATTTTTTGAGTTATCTTTCTTGGCCTTTATGGTTTT
+AGTACTGACCATAGCATTAGCCCTATTTTTCCCAACATGGATATCTTGGACATAACCATC
+ACCACAACGTTCTCTGATGGCTGTGGCCTTAGTGGTTAATACCTGCTGCATTTCTGATGA
+TTTCATCAATTCGGCAACACCAGCTCTATTAAGCTTGAATTTAAACTTACTCATATCTTT
+CCACCATAACTTTCTTATTCCAGTCTAGTGGTATAAGCTCTTCAATACCTTCTAGTGGAA
+TTCCTACTGTGCGCCATTTTTTGCCGAAAAATCTAACTTCCTTATTTTCCCAATCGTGTT
+CGTCTCCTTTTGGTATAGCCAAGACATATTCAACCTTTTTTCCGGTCAAAGATAACTGAT
+TAGTGATATCTTCGGTAGTTGCTGGTGCAACAAGCACATTCTCAATTTTGATATCAAAAT
+CAACTGTTACAGGATTTCCAAAAGGGTCTTTTCCGCTAATCGACTTATCGGCTAAAGCAA
+CTGTTATCCCTTTCAATTTCGCCATAAAGTTCAATTCCTCCATATCGTTGTTTTTTTAGT
+CCAAGACGCTTCAACTCACTGTCCTTAATAAAAAGACCGCCGCCTGGAACTAAATAAGTG
+CCTGACCATGTGTATCCTAAAGCTGATTGGCTCTCTTGGGCCATTGGTTCGCCTCGAGTA
+GATGTCATCAGCGTTCTCGCTACAATGTCAACCGTAACCGATTTAATAACATTAACAAAA
+TAAGGCTTATCAACCATCGTTTTATCTAAGTCTTTGCCAACTTTGTCAGCTTCCATTCTT
+AATGTATCTGATACGACTTTCAAGAGTGCATTTGCACGTTTCAATTCGTCAACAGATAAG
+GGACGCCATAACAAAATGACGTCATCTGTTGTTGCGAAATTGCCCACTTTTACCTCCTAA
+CCAGGCAAGAGTGCCTCTAATTCAGGTTTCTTAGCTTTAGAGCTATATTTTATCCCAGCA
+GCATCTAACTGACGTTTAATTTCTGCTACTGTTTTTGCTTTTTCGCCTGTCTGCTGTTCA
+ACCAAAGTCCAATCTCCACCACAAACAGGGACGGAGCTATAAAAACTAGCTCCAGTCTTA
+CTGTTAACGTATAACATTATACTTCTCCTTTAGTGACACGAGCAAAGCTCTTAGCGTCCA
+AAATACCCCAGCCGATATACGCCTCAGCACGTAAGTAAATTTGGTTATACCCTTTAAGGT
+CTTTCCCCGAATTATCAGGATCACCGTATTTAATGATTTCCATTGGAATTTGTTTTGCAT
+AACCCCACTTAAACATGCTTTCAAAATCGCCAATAATTACTAAATCTTTGGATTCTGCTT
+CATCAGCTCCAGCACCAACAGTAGTATTGACGGACGATTTCAAGCCATTGATGCTATCTG
+GATTCGCTCCCCAAGCAAGTTCAGGGTACATTTTAGGCCCCATCTCCCCATTGGTAACTT
+TCGCCAGTGCTGTTGAAAACTCTGTATCCATCGCAAGCCCTGTCACTACACCTTCAGACC
+CCTGAATTAGATTAACAGCTGCTTCGATATTTGCATCAGCGTCTTCGCTCTCTGTAAATT
+TAACCACTTGCGTCACTTTACTATCAAAGTGATTCGTGCCGATAACGTCAGACGCTTTTT
+TTGTACGTGGATTGATACCATGCATCGCCATTAGGTCAATACCACGAGCGAGTTTTTTCG
+CAAACCCTTCGTTAAAAGCTTTCAAAATATCAATCTTTTCCTCTTCTGTTGCATATAAAA
+ATTCATCAGAAAGACGAGCACCATACTCAACCTTGATTGGTACGATAGTAACAGGCTCTA
+GCGATAAGCCACCGTGTGTTTTTTTACCGTTTTCAGCAACCACATCAATATCAGAATCTA
+ATGTAAACGTAAATTCTTTAGATCCGTTAAACGGAATAGGTTTTTGGCTAGATAGTTTAG
+CTAGTGAGCTATGCCCCTTAACTTTATTGATAAGATCTGATACTAAATGTTTGTCAAATA
+AGCTCGCTTTTGATGTTTCTGTTCCCATATTTTTTCTCCTTTAATTAATCTTCTAATCTT
+CTGTACTTAATCCTTGCACTAACGCTCTGTAATTTGCGTCTGCATTACTATCGATATTTG
+GTTCGTTTGATTTTGCTGGCGGTTGTGGTTGGGATGGCTTAATAAAGGATGCTAAGCGTT
+CTGCATCTACTTTGAGTCCATCTTCATCATCTCCTTGCAAACGATCAGCTAAATCAATCG
+GTAAGCCATACTGTAACGCTACCTTTGTCCGTAAATTTGCCGTCTCATAATCGGCAATTT
+GATTCTTCAGGGTGCTAATCTCTTCCGTATAGCTATCAGTGTTTGATTTAGCATCATTCA
+AAGCAGTTTGTAAGCTGCTGTTTTCGGTTTCTAGTTCTTCAACACGAGTTTTCAGTTGGT
+CGTAATCTTGATATTTCTCACGTTCTCGAGCAATGCGAGCTTTCACAATCGTGTCCAACT
+CTTCTTGTGTTTCAATAACTTTAAATTCTGACATATTAACGTCCTTTCTCCTGCTTTCCC
+GGCAGTTCGGTAGATTTTTTAGCAGTAAAAAAACACCCTTTCGGATGTCGTTTTTTAACA
+GCTGGTTCTTTGCTTTCTTTTTGGCTTCGTTGTGTAACAAATCCAGTGCGCAAGCAATGC
+ACTGTCCATTAAGCTAATGTCTCTATCATCATAAAGCGATTTATACCCAAAACCACCATT
+AGAGCCAATTTGCCTCTTTTCACAGTTTGTGACTACTGCTGTCAAAGATGGCTGATCACT
+ATGACAAATGGTTTCCTGCATGATCCCCTGCTCCCACATCATGTTAGCTGTGATAATTTC
+AGCAACTTTAGGCAATTCTGGTTTCTTTAGACCTTGATCTTTCATCTCCTGAGCAAGTAA
+TTCTTGACCACTTGCACCATCAATGACAACCTTAGCGATATCAGCCGATTTCAAAAAATT
+AATAATCCATTGAGTTCCATTTCTGACCGATAAACAGTCAATAGTCTCAACAAATACCTT
+ATTTTCTGATGTTCTTGCTGCAATTGATAGTGATACGTTGTTGCCATCTTGACCAAACTT
+GATACCGACAAAAAGCTTGCTTTTGAGTTCTGGCACTTGCTCAACTTTGAGTTTTGCCCA
+TTCTTTTTCGGATATAACTGATTTTTGGTTAAAGGATGGCCAATAACCTAAGCGTTGGAT
+GTTGTGATCAATCTCATCTTCACCTAATTCAGCTTCGATTTTCCTCTCGTTGAGGTGGAA
+TCCCATAGATGGGTTGGAAATATACCAGGAAGATACATCGTTAATCTTAACCATCTCAGG
+AACTGACCATTCAGCCCAACCAGAATAACGCTTATTGCCTTTTAAGCAATCTTTCCGATA
+TGCTTCAAATACTGTACCAGTAGATACCATCGTTGGCGGCGTTCCACACATAATAGTCAT
+TGGATTATCACTATCAGTAACTGTGTACTTCAATGCTGATTCTTGCTCAGATGTGTATTC
+TTGTGCCTCGTCAATGATAAGTAAGTCAAATCCCTCACCAAGTCCACCGTTTGATGTCCT
+AGTTCGGAACTGGATAACAGCGCCGCTGGCTTTGAACTCTATACGCTCTTGACCCTTGGC
+TTTATTTGATATAAAGTCTTCTCCATCAACATAACCTGACATCTCAAGGTATTTTTTTAC
+CTTTTCGAATGATGCATGAGATGTGCTAATTCGATGAGCTGTATGCAAGATTTTTAAACC
+TTTATGCAAAGCCCACAGCTCAACAATATAGACTACTTCCGTCTTACCGTTACGCCGTGG
+GATAGCATACCCATACTTTTGATGAACCCACAGACCATTTTCATCTATGGCCATAATTGG
+GATAAGCATATTTACTTGCCATGGATAGCAGCTTAGCCCTGTTTTTTTGTAGTAATTAAT
+AGCTTCATGCGCTAGAGATTTAGCAAAATGTAAATTTACCGATTGAGTAGGTCGCTGATT
+GCCAAGCTTTGTTTTCGTCTTAGTAACCATACTTATTCCTTTCAATCGTACTGCCTAGTT
+TTTAGCCATGCGACAGGGCACAATAAAAAGCCGTATTGCTACGACTTTGATTTCTAAAGG
+GGTCGAATTCGTTTAAAATTTATTTTCCCCATTTTCGCTTGTAATTTTTCTTAATATAGT
+TAACGTCAATTGCAATATCTGCAATAGCTGATTGGTTATCTAAAGTAGCAGCTTTAACAG
+ACGCAAACTCTTCGTTTGTTGCCAGAGCGTTTCGTTGAACGATTGATTTTAGCTCCATGA
+TTTCTTTGTTTTGATTTTTAATTGCTTCTGCTTGCATAGCATTTTCCGCAACCAGCATCA
+CAATAGCCCGTTCGAGTTTACGTTTCTTTTTGATTCGCTTATTCATCGCCTTCTCCTTTA
+TTTAACTTTGTTGCACACGACATTTTAGGGACAAAATTTTCCGCAGCTTCTAAGGCTTTT
+TCGTAAGCTTCTTTTGTTTCATTGACTTTATTCATGATTTGTTGAAATTCGTCTTTGTTT
+TCCCAAGTCATTTCGACATTTAATGATATTTTATTCATATTTTTCTCCTTTTTGGGCATA
+AGAAAAGCACCAGATTGCTCTAGGTGCTTAATATATTGCGTTTTCTGGATCTGGACCAAT
+CGCCACCCCGCTATTAATAGCTTTGTTTAATTCCAGTGTTGCATCTGGTAGAACCTTTTT
+CCACTCATCAAAGTAAACGTCTGGCTCCCAAAAAAATACTCTATCAAGCGAGTCTTCTCC
+AAACTTTTCAAGATATTGTTTTTCAGCGTCGTCATATTTTTGACGCAGTTGCCGATGTAA
+TTTTGGTTCCATATTTATCACACTTTCACAAATAATCCAATAATAAAATTCAAAAATTCA
+GGGTCGTCATTGATTGTCTTGTAGTCATATTTCCATGTTTTTTTGTCAAAGGACTTAGCA
+AATCGTTCTTCAGGAACAAAAATACCTTGTAATCCCATAGTGAAAACTTCAGCTGCATCG
+CTGTAGTATTTACCAATATATGGTGATATAAAGTCATCTTTCTTAGTAACTTCCCCAATA
+CCATAATTTGAACTTGGAAAAATATCTTTCAAGCGAACCTCAGCTTCATTAGCAGTTCTT
+TTATCTACCCAGGCTTTCTCTAATCTTACTAAATCAGGATTAACCAGTTCAATCATATGT
+CCTATCTCATGGTAAGGTGTTGTTTTTCTTGTTCCATTTGTAGCAATAACTAAATCTTCA
+TCATATCCATCGAAGTAACCGCGCTTCCTTTTTATAGCTTTTAGTTTTTTACCAATACCG
+TCCGGAACAGCTGCCCACTCAGTTGGATAATTTTGAAAAGCCTCTTGTAGCTGGTCTTTA
+ACAAGTTTAGATGAACCTTTTGCCCAAGTATTTTTAGGTATTTCTCCACCGATTTCACGA
+AAATTTGAGAAAATTTCTTTTAATTTCTCTTTATCTCCTATATGTTCTGAAACTCTAAAG
+TGATAATTGATACGTTTCCCTATATCAATTATATCACTCGGACCAACCTTTGTCATATCT
+AACTTAGCGATATCATTTTTGATAGATTCTACTAGAGCACTTTCCTTAAATTTTTCAACC
+CTTTCTATAGATTCTTGAGTTTTTTCTTTCTTTCGCCAGATTTTACTCCAAGCACTCTGA
+ACTTTTCCATTCTTCGGGTCATAGTCAAGCGTACATCGACACCGCTGATGTCTTCTCCAT
+ACGTCCTTAGGGACTTTTGGATAACTATAAGTGCCAACAACCTCACGACACCATTCACAA
+CAGTTGCCACTTTCTGTTCTGACAACCTGTGGCGTCATACCTGTTTTATATTGTAAATCC
+GCATTTGCCTTGATGGTATCATCCACAATGGACTGCGAAAAATTAACAATCGGTTCACCA
+AACAGCCATTTTACATCATCAAATGTATTCTCGCTATCCAAACGATTTACCATCCCGTTA
+ATCTTGTCTCGATTTAGCGGTGGACGTTGCACCTTTAGACCAATCTGAGCATTCTCATTT
+AAAATCCGCTGAACATCACCAGCATAACCTGAAATCAATTTGTAATTCCGTCCCATAGTC
+TCATCTAAGAGACGCTTAGCGATATTGTAATACATTTTACCGTCTGGTAATTTATCCGAG
+CTAACAGAACCTGTCAGAGCCAAAGATAAAAGTCTTCCGACTTCAATAGCAAACTCATTG
+ACTGTTTTATAGGTCACTTTTTTAGCTTGCAATTCTGCAAAAGCCTTGGTTACAACATCA
+CTTTCGCCAAAATACTTTTCAAAATCTTGTCGAACAGATTTTAGTAGCTTAGGTAAGACA
+TCATCAACCATCAGTTGTTACCTCCGTGATAGCAGGTATAGGTTTATCAGCCCCTTTTAC
+TCCCGTTAAATCACGGATAACATCTGCATCCATGAAACCAGGGATAGCTTGATTAAGTTT
+GATAGCTCCATCCCCTACTAAAGTTAGCATATTTGCATCAGCTTCAAAGAGAGGCTCCCA
+TTTAATTACTGTATCCATGAATTGATTACGAAGATAAGGAAATTCATCTCTTAAACAAAC
+AGCAATATACGCCACATTTAGAAATCCAGAAGAAAAAGAACGTTGAGCTTTGCGTCCTGC
+TGCTCTCAAATTCTCATGTGCCGCTTTTATTGACTCAACAGACGATGGGTTGTCAGATGG
+AAAACCAAGGTCATCAAGAGTGAGACCGGAACCACCAGCAAATAGCGAAGCATACATTTT
+CAAGTGTTCCATGAAAGGGGCCATGCTTGCTGTTGTGAATTGCCCAACTGTTGGCTTGTC
+GCCATCCTCGTCTTTTGAGATTTCGAGTAACGTTGACACCGTAGCACGCCACTTTTCCAT
+CGGTTCAGCGTCTGGATCCATTCCCAAAACATATTTTTGTGGGAATGAGTAAAACTCAGC
+CGTAACCTCTGCTCTCTCAAGCGTTCTCTTCGCTGCCTTTTGATGATACATTCCAGCCTT
+GGTAATGCGACTGCGACCAAATGGTCTAACTGCGTCTGGTCTGTGAATGATAGGTACAAG
+CAAGGGGTGACCTGTTGGATTTTTAATATTATATGGTTTCCCTTTTTTTGGATAATACCA
+GATGTCTTTGTCTGTGAAATAGGCCTCTAACGTAGGATTACCGTTTGAGTCAGACTCTAA
+AATTGCATAACCCTCTGTTAATAAAAATGTAGTTGGGTCAAGTATCCCCGTCGCTTTACT
+AGCTTCGATAACTTGCATTTTAGGTAAGCCGTCTTCCGCTCCTGGCATGATGTACACAAA
+GCAACAAGATGCAATTAATGCTGACTGTATGGCTGTATCAAAAAAGATATCAGGGTTATT
+CGCTTTAAAAATTTCCCAAGCATTAAAATCATCGTTGGTAAACTCCCTGAAAATAATACG
+GTCCGCAAGGCTATCAACCCCTTTAGCGGTCCATTCTAACACAGACCTGTACATTTCACG
+CACATTATTTGGCATGACAATACTTCGTGTGTCGTCTCTGTCATCCATGGCATAATAACG
+ATATCTTTTATCAACTCCAGTTTTAAAAAGAGCTAACTTCCTACGAAGATAGCCCATACC
+CATATAATTCATTTCTGCTCCTTTATTTTTTGCATGACTAAATCTACAAAGTTTTCTTCA
+TGTACATCTATTCCTTCAATAAGTGTTATTCCAGTAAAACCAAATTCAGATTCATTTGCC
+AAAATTTCCTTTTTTAGTTTTTTATAGTGCTGCGCTAAATTACGTATTTTTTTAGGCTTT
+TCTGTCACATCTGTGTTAGGATTTAGGACTTTCTTTTTTTCTTTCCTCTGTTCAGCCCGT
+TTTTGTTTCATCAATTTACGTTGTTTCTCACGATTGCCTTTCTTACGGCATTCTTCAGAG
+CAATATAAAGTTCTATTGGTTTTTGCTTGGAAGTTTTTTTTGCAAATTAAGCATTTCTTT
+TTCAATGAAATTCAACCTCCAAAATTTTCTAAATCCTAACGTGAGAAAAAATGTACAGTG
+ACGGCGTGAAGCTCGGCCGACCGACCGGGTAGGGAGATACCCCCCATTTCGCTTCTAAGA
+GCTTTTAGTATAAATCAATATATTTGCCTAAAATCACTTTTTAAATGCAAAAGATGACCA
+GTCTCGACTTTGAGGAAGGTTTCTGTTGCCAATTGTCTTTGGCTCGTTGCTTGCTTGGTT
+AGCAAACAACTTATCAGACTTCTGCCTGTTGCACTGCCAGTGAGTTAACTGTAAGTTCTC
+AAGCGCTGATGGATGACCACCTTTTGCGATAGGAACTATATGATCTATTGCTGCGCTTAA
+TGGATGTGGATACTTAAGAGACTTGTCCACTGGCTTGCCACAGATACCACAGACAGTGGC
+TGCCTTTAGTAACTTCTTTTTATTTCTGTCAAATGCTACCCGGTGGGTACCTTTTTTATC
+TGCCCTTAACTGAGACATGGATGGGCCTTTCTAAATTTAAAAGAGGGGGGTATTTTCTTA
+CCTGTCCCTCATTTCTTGATAATACTATATTATCACTTTAAAACTGTCATGCACTGTTAT
+TCACTGTCAATCGCTGTCATTTACTGTCAAATTATTTAATTCCTTAGTTGCAACTCTTAA
+CAGTCTGAAATAGGTGCTTTCGCTGCAATTTAGCTCATCAATCACTTGCCATCTAGTCAT
+CTTATCAATATAGACCATGCTCAAAATCGTTTGACTGTCTGTATTTTCAAGGCTATCAAT
+CAGGTTTTGAAGCTCTCTTTGTTTTCTTATAGCTTCAGCAGTCTTCTTTTCAATATCTTT
+GGCAGTTGCAATCAACTCTACGTAAACATCATCTTGCTTACGTTTTATACCACCATTCAC
+CTTATCAGACGACCATTTAGGGCTAGAAAGCAACGAAGCCTCAATCTTATCTCGACGTCT
+GATTAAACTAGCGATATATAAATCTAAATTGCGTAAGTCTTTTAAAATTGCCTTAGCTTT
+GCTCACTAACTAGCTCCTTTTTGATATAATAGATTTGTCAAATTATTAACTAAGGAGTCA
+GCTGTGAGCTGGCTTTTTTGTGGAGAAAAGCCCTCTCTTCCTTTTTTTTATTTTGACACA
+GGCGCAGGATGTCAGTATTAGCGCCTTAAATAATAGCCAGTGACCGATAACCAGCGTTAG
+ATTTTGTTTTGGTGTAAGGAGGTTCTCGTTTCTATTTTTTAATTTCGGTCAATACCAACC
+GCACGAGTCGAACGTGCGTGATACCGTTATTGGTTATATCCATTCAATTAGTGGATTTTC
+AATGTGTTCTATCCCATCACCAATCCACTCTTTGACATTAAATTCTCGCTCAATATCTTG
+AGTCCTTGGCATAACGTTAATATCACTAAAACTCAGCATGTCGTCTTTTGTATTTTGCAA
+AAAATAAATGTTTTTAACTTGTCTTGTTAAAGAGTCGCCATGCACCACCACACCATTTAT
+CCCTCTTATAGACATATTAAAGAGTAGAAACGGTACTGCTTTGTCCGATAACTCTTCTAC
+GTGATACCAGTATTTACTCGGACGATAAGTAAATGGACTGTCATTTAATCGTTGTTCTTG
+CCATGCTTGGATAAGTATCCCACCCGTCCCGACTGCTACCTCGTAGTATTGATTACCACT
+TATTATTTTAGATAATAGTGTACTAACCGATTTAGGAGTAAAGTCTTGCTTTTTATTTTT
+GCGGTCAGCTTGTTCTTCCTCAAAATATTGCATAAACCAGTCGTAAGATACATCTGTTTC
+ATATTTCAAAAACTGTCTAAATATATCCTCACGACTATCTTTATCAAAGAGTATGTCCGT
+AAGTCGTTTGGGTGCTTTATAAACTTCGTCGATGCCTAGTATGCGATGTATCTCATCGAT
+CTTAATCATGTTACCCTCCGTTATTCGTTAAATCAGCAATCCGCTTTGTCTGTCTCTGAT
+TTTGCTCACTCGCACGTTTAAGCTGCTTTTGTGTCCTGCTTAGCTGTGTACGTAGTCCGT
+ATATTTGCGGTTCATAATAGCTTTTAAGCGATACGCAAAGCCCTGATACGACAATCAGCA
+TAACTGTTAGTGCAGCGATAATGATGCTTTTCTTTTTGATTGCTTTGTCTTTTTTTACTA
+ACTCATAAAGCAAGCAATCAATCATCTGTTCTTCAGTCATCCGTTTACCCCTTCATGTAG
+TACTCGTTTACGCGCTTGCCGCTAGCTAACTCTAGCTGTCTAATAAACCGCATCGCTTCG
+TTTTTAGTAGTAGTCATGTGTCTCCAATTCATCAAGATAGCCTTGATTGACATAGTATGA
+GCCAATCAAAATAGCGTCTGCTTCGTCGTCTTTGACCGATTTATTAAATTCTTGCTCCAC
+TTTTATTTTTGACTGTAATTTCATGGACTTCTTGCTTCGGTCTTTGTAGCTAAACTTCCA
+ATACTTACGCCACGTTGATACATTGATAAACACGACGTTATCAGCTATTAATCTTCCTAA
+GATAATTCCTGTAACAATACCGATTTTAAGCATGGATTGCTGGTTAGGTCCCATAACCGA
+GTTTTTTTCGACTGCGATTGTACTAAAATAGCAATCGTATTTTTTTAATGCTCGTGACTG
+GATTAGCCTTAATTGACTAGCCATATAGCGGCCGCGCTCAAAGTAGGATTTACTCTTATG
+TTTTAAGACACCACTCTGGATAAGATCTGAGCCTTTAAATAAGGCCCACCCTGTTCCAGA
+TGTTGAGATGTCTAACGATAAAACTAGATTGCTCATTCAAGCACCCCGCGAATGCCAAGG
+GTTTCAAAGATATTTCTCTTGTTATCTTCGATAAACGAGAATACTTTTATGATTTCGTCT
+GCGTCTTTCTTATACTCTTTAGCAAAATATGATGATGTTAGATTGATTTTAGTTTTGGGT
+TTAGCTTCAAGAATGAGGTCGTAGGCTGTTTCGAATAACTCTCCATCTTCATCAAGTGAC
+GGTTCGTCGTCAATCTTTTTAAAATCACTAATAAAATCCCATTGCATAGTCAAACTGCCA
+GAGATGGCAAAGATTCGGTTTACTCTATCTAAAATTAGTGCTGTTCCTGTTCCTGTAATT
+TTGATTTGTTCCATATTTTTCACCTTTTTAAAATCCACACTCGCCCTAAAATTGTGTGTG
+AGCATTGGCAAGGACGAGTGTAGCAATTCTTCATATCATCAATCCTGTTGACTTGACGAT
+ATTCCAACTTTCCTTTCTCGCTCGGAAAATTTAAACTTGCAAAGGCCAAGCTTCACTTTG
+CAATAGGTTATTAAAAAATCTCTACCCTTACAGACAATTTATTTTGTCTGCAATATTCGC
+ATTTTCCACAAGGCTTAGGCTTTTCTATGCCTTTTTTAACGTCATCTAATCGCTTAATGC
+TTTGTGCTAGGCTATCTAACTCTATCTGCATAGCATCTACATTTTGGATCCTGATGGCTC
+TTGTATCTGGTGGTGTCTCTTTAGTAACTGCGTAAATAATCGGTTCAAACGGCTTATTGT
+ATTTAGCTTCTAGCATGGTTTTGTAAGCAGCCATCTGCAAAATATATCCATAAGCTTCAA
+ACCATCTGACACGCTCTTCTCTATTCCAGATTGTGTCGTCAATCGGCCCTTTTGTTGTTT
+TGATGTCTACAAAATAGCCACGTTCAACATTCAAGCAGTCGATTTTACCCTTGAATTCAA
+CCTCGCCAAGAAATCCTGTGATTGCTGCTTCTTTTTCTCCTTGGTATATGGCCATGAAGT
+TACTGTCATTTTTAAGTGCTTCAATCATCTGTTCTGCGACTAAATAGTCTTTTTTGAGCT
+GACCTTTAGTTGTTCCTCTGGTCGAAATCATTTCAGAGCCGTTTTGGGCTTTGAATTCTT
+CATGAGCTTCTTTACTCTCAAAGTAAGAGTGGACATAGTTCCCGACGAGCAGCGCAGTGT
+TATCTCTGGTATCTGTCCAATTCCCTTGTAATTCAGCAAGCCCCCTCGCTTCGCACTCTC
+TAAAACGCTTGTACTGACTAATAGACCAGTATCTGATAGCTGATTCACGACTATAATAAT
+CCTTTCCGAGTAAATCTAAACTAGTCATCTAGCAACCTCTTAATTACTTCATCAATAGGT
+GTATCGCAAAAGACAAACTCTTCTCTTTCCCTATCTCCAACGAATTGAACAACCACTACT
+TTTTCATCTAAATTGTCAAAATTTAAAGCAGATCTTTCCCAAACGCCAACAACATATTCT
+GGATTAATATAATATCCTTCGATTTTTACAAGTTTAATCATATTAAGTCTCCGAGGTTAT
+CAAATAAGTTGCCTTCGCTAGCTTTAATTTCCCCTGTTTCTTGGTCAAAATCAGGAATCT
+CATCTGCTGGATAAGAGGTGTCTTCTAAAACCGTCTTATTTTCGTCTGTGAGCGTTTTTT
+CTGGTTCTGAATGTAAATCTTTAATTACATCTTTTAAATTGCTAGGAGCGTCCTTTTTTT
+CGTTCTGCGTGCCGATTAAGTCATCAAGGCTGTTTGTTTCTTGTGGTGTGACATCTTTTG
+GAATGACAATCGTTGAATCTGCGTTATCCGCTTCTAGAGCATCCTGCATTTCAACAGAAA
+GAGGGGCATACTTGCTCAGTAATTCCTTGAGTAATGTCTTGATAGCCATTGGATCAAATT
+CTGTCGCCCAAGGCGTTCCTGGTTTAAAATCTCCTGTTTTCTTATCAAAAGTTTTAGAAT
+ACTTTTTGGCATGTTCGTACACTTTTTCTTTCGGCCAGAAAATCATCTTGTAAAAGCCGC
+TGATTAGTTCTAAACTTGCAAAGTAGCCTTTTACAACACCAGAGTCAACGTAGTCGCCCG
+TTAGCTTCAACTGCCCTCTAATCTTGTCATAACCAAGGAATTCCTCTTCGTATATGATTC
+CGTGTTCAATATTTCGGACTTGTCCACTTCTTTGAGCTAGCTGTATAAGTCCTCTATATC
+CGATTTGAAATTGCGCTTCGTTTACTGTGATCCAACGATTTCCATCCTTGTAATTTCGGT
+TGTACGGCACCACGTAAGCAAAACCAAGACTAGGCTCGATTGGTAAATTAAGCACTGCTG
+CTTTCATAGCCGCTCCCATAATTGACTCAGATGTTGCTTTGGCTAGAAGGTTATTATTGC
+TGATGATTGATAATAAGCTAGTTGTAAATTGTTCGGCTCGTGCGCCGACAACCTGCTCAA
+TCCTGTTTTTTACTGCTGGCGATTTAAAAAAGCTGTTGTGGTTGTTTTGTGCTAATTGAT
+TTGTCATTAGATACTACCTCTTAAAATTTCGTCAAACATTCCGTTTACCATACTTTTAAC
+TTTTTGCTCTTTTGTTAACTCTGGAACATCCTCGCCATCAATAAATTTTAGGTCATATGA
+TGCTTCGATAACTACAACATCACACCCAAGCGTTTCTGCCAAATTATCAATTTTTTCTTT
+TTGTATGTTGTAAGCTTCTTCTGGTAAAAATGATGCCAGTTGAATGCTATCTGTAAGTTC
+CACATTATAAGCAAGTACATCTTTTTTGTTTTTGAAACTCTTTAAAAAACTTCCGTCTTC
+AGTGTTTCTTAGCACTACAATTTTTTCTTTGATGTTCATTTCATTTCCTCTTTTTGTGTT
+TTAGTTGCTCTCCCAGTCTTCACTAAATTTAAAATCATTGGATTTGCTCACATAATCCCT
+CGACTGCAGCATGTATATCTGTCTGACCTGCGCCAAGATATGTTATTCCCGCTGCTAAAA
+AGACTTCTCGTGAAGTTAGAACTCCACCGAGATCATCAATTGCCTGATCAAGGTATATGC
+TAAACGTTTCAAGTTCTTGTTTAGCTCTGATTTTTGCTTTTTCTACTTGTTCTGGTGTCA
+TATTTCCTCCTAAATCGCATATTTCTTACGCAATTGCCGCAATAGTGTCACGTACCGTGC
+TTTATCAACTAGTCCAAAATCAAGCAATCTCTCACGCTCTTGATGACTTGCTCGGTACCA
+GATAAGTGTTTCTCTATGTTGTTTTGTCATAACGCATTCTCCTGTTTATATCGCTCTATT
+CTCAACCGGTCTGCTTCTGCTGTTGTCATACCAGTTCCAAAAGCGTATAGGTTTATCCAA
+TTAAAAATTGGCTTAACTCCATTTTTTTCGATTCCTTCGGCGCAGTAACTAGCAAACTTA
+GCAAAAGTCTCTTTACTCGCCGTTTTACCAAAATCTTTTTTGATTTGTTTGTTAAAAAAA
+TTAAAAATCTCCTGATCCATCTTCTATACCGTCCATGCTTCCTAGAGCAAATTCTTCTAA
+ATCTGGTTCTTTGTAGTCTGGATTCGACCAGCTTGGGACGTTTGAGGTAGTTACACTTCG
+TTGTTTTTTACTATCGTCAAACCGTTGCAACCTGTCTCTGACCTTTTCTACTGTCGTATC
+TCCAGATTTATACCAATCAACTAAGATTTTATTGATATACTTCCAACTGATTTTGTTGTT
+TTCTACCGCTTCTCTTAAGGCAAGGTTGACAACTTCAATTGGCATGTTATCTTCGTGAAT
+CCACTTTTGAATATCTTCGATTTCAAATGGCGATATCATCCGTCCAAAAGTTAATTGGAA
+ATTTTCAAAAAGCTTTTTTTCGTCCATAGCTCCTCCTGATGTTGATGATGATGCTTATTA
+TCTGTTAGTATTTATTGTTATTTAGTATTTATTTATAAGTTAGTATTTATTAGTTGGCTA
+ATTTGTTGATTAGCAAATTGCACATTAGCAAATTAGGTATTAGCAATTTTTTCTAGTTCT
+AAGTCCTGTTCTGCCTTCAAAGTATTGAACGCCTCGTCGCTTATTTTTCTGTCAGAACAG
+AATCTATAGGCTTCGGTACCATATCGCCCGCCAAATGATTTTCTATAAGTTCTGATATAC
+TTGGCATTCTCTAACGCTTTCAACTGGCTTCTGATTGCAGATTCGCTATCCTTACAACGT
+CTAGCGAGTTCTTCAGGATAGACTCTCCATTCGTCTGCATTACTCAAAATGGTTAGCAGC
+AGTCCTTTTTCCTTATTGAAAAGTTCTTTGTCCTGAATAAATTCATTGCTAACAGCTGTG
+TAACTACCTGTTAATGTCTTGAAAAATGTACTGCATTAGCTGACAACCCCTCCTCTTGCA
+CGCTTCTTGCTCCATCCTTTGCTGTTTTTTAAAGCTACTTCCCTAAAAATTTTCCGCTTA
+TTCTCTGGCGAATTGTGTTTTTTAATGACTTCGTGTTGCACCCTAGCAATGACCGCTAAG
+ATAACGGTTGTTGCTAACAAAAATAATTCTAATTTGTTCATGTTATACTCCTACTCTTTT
+TTCAAATTTAATATTTTCAAGCATTTCTGGCAGTGTCTCTTTTTTTGTTTTGTAACGATT
+GCGAGATTTCCACTGTACAAACAGTTTGAATCCTTTGTAATCAATGAATACGATTCTATG
+CGTTGGATTTAATACAAACTGTTTAAAGTCTGGATGATCACGCATTTCTGTCGCCCACTG
+CTTTGCAGTAGCAACTGTCAACCCCTCCCATTGTTGAATCAAGTGTTTATAATCACCATG
+AGAAGCTGTTTCATTAACATCAACTGCTCTATAAGTAATTTCTGCTTTTGGCATATTAAT
+ATCCTCTCTCTTGTGTTATAATTAAGTAAATATTTTTTGTTTGGAGTCCGATTCCCGTCG
+GACTTTTTATTATCTAATTAAGTTGGTTCTATTAGTAAAACTCAGGCTTAATGTTTACAT
+TGAATCGAAGTCTATCCTTTGGATGGGCTTCTTTTAGTTTCTTTACTTCCGTGATTGCTT
+CTTCAGATGTTGTGCAATATAGGGTAAATGTTATTTCGTTCATGTGTGTCCTTTCTACTA
+TATGATTTTAAATCATATAGTGTTTAAAATTTTTGTGTTGCTTGCTTGTTTATCCCAAGA
+ATGTCATCGGTAGATACATCGAAAAACAAAGCTAGACTAATAAGATACTCACCTGAAATC
+TTTGTCTGGTCTTTTTCCCAGTTGCTGATAGATGTTTGAGTAACACCTAATTCTTTTGCC
+AATTCACGCTGTGACATCTTATTATGTTTAGCTCTTAATTCTGCAATAGTTACCATAGCT
+GAGTCGCTCCTTTCTTGATGATGATTACATTCTATATGATTTTAAATCTTGCGTCAAGTG
+TTTTATATGATTTATTTTCTGTTTTTTTGAAAAAATCGTAAATCATATAGTTTATTTAAA
+ACTTTTTTCTTATATGGTTGATTTATAATCATGGTTTTGATATAATTTACTTATCAAAAT
+TAAAAAGGAGGTATCCTATGGAGCAATTAGGGGACCGAATAAGAAAGTTGAGAGAAGGGC
+GCAACATGACTCAGACTGAACTTTCAGAAATATTGGGCATGAAAACCTATACTACTGTTT
+CAAAGTGGGAGAAGAATGAAAATTTTCCAAAAGGTAAAGACCTAAAAAAACTAGCAGAGA
+TTTTCAACGTTACCTCTGACTATCTTTTAGGACTCACAGATAGTAAACTTGGGAAAATCA
+CAATACAGAACGAACAACCTGAAATCGTTTCTATATACAACCAACTAGAACAACCTAGAC
+AAGAAAAAGTCCTCAACTTCGCTAACGAACAATTAGAAGAACAAAATAAAACCGTTTCTA
+TATTCGATAAAAAATCTGAGGAGACAGAAGATTATATCACTGACTACGTTGAGGGATTGG
+TTGCCGCTGGTCTTGGGGCATACCAAGAAGACAATTTACACATGAAAGTTAAACTACGTT
+CTGATGATGTCCCCGATGAGTATGATACTATTGCAAAAGTAGCTGGCGATTCAATGGAAC
+CACTTATTCAAGACAACGATTTGCTATTCATCAAGGTATCTAGCCAAGTCGATATGAATG
+ATATAGGGATATTCCAAGTCAATGGTAAAAACTTTGTAAAAAAACTCAAGCGTGATTATG
+ATGGCGCTTGGTACTTGCAAAGTTTAAATAAAAGCTATGAGGAAATCTATCTATCAAAGG
+ATGACGACATCCGCACAATCGGTGAAGTTGTGGATATTTATAGGGAATATTAAAGGAGAC
+TGTTATGGCAAAAGTCATATTCCAAGATAACTTTCTCTTAATGGGAACAAATTATCATGA
+AAAAGAAGCTAATAAAGTTATGGCTGAAATTGGTAAGAAATCACCATACTGGGATAAGGA
+TAAAGATTTTATTTCTGACTACATAAAATCAAACTTCAAGGATATCTACAAGTATTACAG
+GGTCTCAACAAAAGATGTAGAGATTGTCAGAGAACCTCTTAATCGTCACGATCCAAATGC
+CATAAAAGTCATGGTAAACAAAACTTTTGTTGGCTACTTTCCAGCAGACTTAGCTAAACG
+ATTAACCCCTTATGTAAAAAAATCTAGTCATTACCAAATGGAAGCAACCCTTACTGGTCG
+TGGTGGACAATACAAAACACTCAAAAACGATTTAAAGACCGTGGTTACTAAAAAGAAAGA
+TATAACTTATAAGTTACGATTGACTATTTTAAAAGTAGATAGAGTATCAAAAAGTAAAAA
+TGCTGGATTATTAGAGTCGATAGCATCTTGGTTTCTCAACTAACAAAAAAGCCCCACGCT
+CAAATTTGGCGAGGAGAGCGTGAGGCGAATCTAGTATAGTAAAAACCTGCTTCGCAGTAG
+GTCTCTTTACTATACCTATTTTAACAGAAAATGAGGTAAAAAACAAATGTGGATAGAAGA
+AACTGATAACGGTAAATTCAAATTTCGTGAAAATTATAAAGATCCTTACACTGGAACATG
+GAAACCTGTATCCGTTACTATGGAGAAGGATAATTCAAGAGCTTATAAAGCAGCTCGAAA
+AATCCTTGAACAAAAAATAACAGAAAAAATAGCGCAATTAAAGGCCTCTGAGTTACTTTT
+CACGGAACTTTTAGATGAATGGTGGGCGTTTTATAAGAAAGAACTTAAAAGGTCGTCTGT
+AGCTTCTCTGAGAGGTAATATCGAAGAGATAAGGGAAACTTTTGGAATAGGTGTTAAAGT
+AGTGAATATTGATCCTAAATACGTTCAGAATTATCTCGATAACCTAGATTGCTCTAGGAA
+TAAAAAAGAGCGTAATAAGTCTATGCTAAACTTAGCATTTGATTATGCTGTTGGTTTGGA
+TATTATCCAAGATAATCCTGCAAGACGTGCTAAACTCCCAAGGGTAAAGAAAACTCTTGA
+AGACTGGAAAAAGGCTGAAGAAAAATATCTTGAAGAAGATGAAATTAAACCATTATTGAA
+AGAATTGTACAGAAGACCTAGCACTTACCGACTTGGTTTGTTGGCTGAGTTTATCAGTTT
+GAACGGTTGTCGTATCGGTGAAGCTGTCAGCATTGAGCCGTGCAACTACGAATCTAAGTC
+AAGAATATTGCAGTTGCACGGAACATTTGATCATACAGAAGGATATCGTAACGGGGAAAA
+GACAGCACCAAAGACATTAGCTTCTTATCGTGAAACCATCATGACAAGTAGAGAACTTGA
+AATTCTACAAGAGTTAGAATTTATGAACGAACTAGAAAAAAATACAAATCATAGATATAG
+AGATATGGGATACCTTTTTACAACAAAAAACGGTGTTCCAATTCAGACTAACTCATTCAA
+CTTAGCTTTAAAAAAAGCTAATGAAAGATTGGAAGACCCAATTACAAAAAAACTTACTAG
+CCACATCTTCCGTCACACTCTTATTAGCCGTCTAGCAGAGAATAACGTGCCGCTAAAATC
+AATCATGGAACGTGTAGGACATGCAGACGCTAAAACTACTGCCCAAATTTATACTCATGT
+CACAAAGAAAATGAAATCAAGTGTAGCTGATATTATGGAAAACTATTAA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_008261.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1574 @@
+>NC_008261.1|provirus_1070550_1127691
+ATGAAAAAAAGGGTGTTTTGGGTAAGTATAGTATTTTTAATAATTATAACGGTTTTAGGT
+ATTACAATTAAATTTGATGGTAAGAAAGTTAATTGTAACAGAAAAACAGTTAAAGTAGGA
+TTTTATGAATATTATCCTTATTATTATCTTAATAAAAATTCTATGCCAGATGGCTATTAT
+AATGAAATACTAGAATTAATATGTAATAAGTTAGATTTAAATTATAAGTATGTAGATTGT
+AATGTAACAGATGCTTTAGAAAAGCTTAAATCTGGACAGATAGATTTAGTCTTTGGAATA
+AGTAAGACTCCTGATAGAGAAAAGGAATATGAATTTACTGACCACTATCTAAATAATGAT
+AACTTTGCCATATATACTAATAAGAATATAAAAAATGGTGATTTAAAAGCTTTAAATGGA
+TTAAAAATGGGATTTTTAAAAGGAGAAGAAAATAATGAGTGGATTTTAAGGCTTTTAAAG
+GATAAAGGCATAAATGTGAAACCTATAGATGTTTCTAATTATCCTGAAGATGAGGAATAT
+TTGTATAATAATAAAGTGGACTTTGTAGTAGAAAATACAAGAAGCAATATAAATTATGAA
+AATAAAAATATTAAAAAGATTTTTGAATTTTCTTCTGGACCAGTTTATATAGTTAGTAGA
+AAAGGTAATGAAAAATTAATTGAAGGAATAGATTCTGTCCTTGGAGAGCTTGAGGAAGAT
+GAGGAACAAAAAGATATTAATTTATATTCTAAGTATTTTGATGAGCATTTAGATAAATTA
+AAAAATGAGAAATTACTAGTTGTAATATTTTTAATTATAATATCATTATTTATTTATAAA
+AAAAGAAAAAATAAAATATTCGCTATAAGAACTAAAAGAAAAATTAGAGACTATATTAAA
+AATGATAAATATATATTATATTATCAACCTATAGTAGATCCAAAGAAAAATAGAGTAAAG
+GGATTTGAATCTCTTTTGAGATTAAATAAGGATGGAAAAATTTTAACTCCCTATAGCTTT
+ATAAAGGAAATTGAAGACAATAATATGTCTTTAGAGGTTTCTTTATGGCTTTTAAAGAAG
+GTTATTTTAGATTACAGAATAATAAAAGATTATGATATGGTTAAAGGAAGAGATTTTTAT
+ATATCCTTAAATGTTTCATTTAAAGAAATAGAAAATCCTAAGTTTTTAAGATCCTTAATG
+AAAATTGCAAAAGATTATAAGATTGATGATTGTAATATTTGTTTAGAGATAGTAGAAAAG
+TTTGGTATGGAGGATATAGGAAGAATACAAAGTGCAATAAGAATAATAAAGGAATATGGA
+TTTTTAATAGCTATAGACGATTTTGGAGTGGAATATTCTAATTTAGATTTATTAAATAAA
+ATTGATTCTGATATAGTGAAGCTAGACAAGTACTTTGCTGATAATTTAGACAAGTCTATT
+ATAAATGAAAAAACAGTGGAATTTATATCAGAAATATGTATCATAGCTAATAGAACTATA
+GTATTTGAAGGGATAGAGGAACAGTATCAGGTTGACATTGTTAAGGCATTTCCATATGAA
+AAAATATATATTCAGGGATATTTCTATTCAAAGCCAGTAGATATTGAGAATTTAAAGGAT
+TTTAAATTTAAGGATAGTTAATTTTCAAAGGATAGAAATAGTAAGAATTAATGAGAAGGA
+TTTATAATATAATAAGGTGGTTATAATTAGGAGGTACAAAAAATGAAAGTATTATTAGTT
+AATGGAAGTCCCAATAAAGAGGGATGTACTTATACAGCATTAAAGGAAGTAAGTAAAACT
+CTAGAGGAAAATGGAATAGATACTGAAATATTTCAAGTAGGGAATAAGCCTATAGGTGGA
+TGCATAGGATGTGGTTCTTGTAAAAAAACAGGGGAATGTTTTATGAAGGATGGTGTAAAT
+GAATTTGTAGAAAAAGCTAAGGATGTAGATGGATTTGTATTTGGTTCACCAGTTTATTAT
+GCAGCAGCTTCAGGTTCAATAACTTCATTTTTAGATAGAGCATTTTATTCTGGGGGTAAA
+CATATGGCATTTAAGCCAGGGGCAGTTATATGTAGCGCAAGACGTGCTGGGACAACCTCT
+ACTTTAGATCAATTAAGTAAGTATCTTACAATATGCAATATGCCAGTTGTAAGTTCACAA
+TACTGGAATATGGTTCATGGAAATACTCCAGAGGAGGTTAAAAAGGACCTAGAAGGTATG
+CAAACAATGAGAGTGCTAGGAAGAAATATGGCATGGCTTATTAAGTGTATAGAATTAGGT
+AAGAATAATAATATTCTTAAACCAGAATTAGAAGAAAGAGAAAGAACTAATTTTATTAGA
+TAATGGGACTATAAAGAGTTATATCATCAAAAGATATAACTCTTTATTTTTTATATAATT
+ATACTTTGGTTGTTTTTTAAAATTTTCATATAAAAATATTTATATATTTTAAAACAAAAC
+AATAAGGGAAATAAATTAATATTATTTTTATTATTTTGTTTTTTTAGTAATAAAAATACA
+TAGTCTTTAATAATGTTTATATAGATTTAAACTTTAAAATTAAAAAATATATTTTATAGG
+AGAGTGATTATGAATAGTGTACGTAAAATAAAGTGTTTATTTCTAATATTCTTAGATATT
+TTATTTATAAATTTAGGGTATTTCATAAGTTTATGTTTTGAATATGGAAAAGAAATGAAA
+ATAGAGTATTTTTTTAATATTAGAAATTTAATTATATTAGCAATTTTTACGAATATATTG
+ATATTTTGCTTTTTTAATCTTTATAAAAATATTTGGCACATGGCAGGGATTAGCGAGTGT
+ATAAGGTGTTTAATAGCGTCTTCAATAAGTTCTATATTATTAATATTATATAAATTTATT
+TTTAATATGGATGTAACAATAGTATTTTTAATTAATAGTAGCATTTTAATTTGTATGTTT
+TCATTACTTACACGTATGTCTATAAGAATTTTTAGGAAAATATATTTTCCTTATAAACTT
+GAATCCAACTTAAGAAAAAATGTTCTTATAGTTGGAGCTGGTCACTGTGGACGTATTGTT
+ATAGATGAGATGAATAAAAATAATAAATTTAATCCTATTGGTATAGTTGATGATGATTTA
+AATAAAAAAGGAACTTTTTTAAATGGTGTGAAGGTACTTGGAAATAGAGATGATATAGAA
+AAAATATGTAAAAGAATAAAAGTAGATATTATTTTAATTGCGATTTCAAATTTATCATCA
+AATGACAAGGATGAAATTATAAAAAGATGTGAAAATACAAAGATAAAAGTAAAAATAATT
+CCAAGTATATATGATTTAATTGATGGAAATGTTAAATTAACTAATATTAGAGACATTGAT
+TTAAGAGATTTATTAGGAAGAGATGAAACTAGATTAGACAAAGAGGAGGTAAATAATTAT
+ATAAAAGAAAAAATTGTTATTGTAACTGGAGGAGGAGGTTCTATTGGTTCAGAACTTTGT
+AGGCAGATAGCAGTGTTTAATCCTAAAAAGCTTATTATATTAGATATTTATGAAAATTAT
+GCTTATGAATTAGAAAATGAATTAAAAAGAAATTTTAAAAATTTAGATTTAGAAGTTATT
+ATAGCTTCTATAAGAGACAAATCTAGATTAAAGAAAATATTTGATAAGTATAAACCAGAT
+TTAATATTTCATGCGGCAGCCCATAAGCATGTACCTTTGATGGAAAATAATCCAGAAGAA
+GCTATAAAAAATAATGTTTTAGGAACTTTAAATGTAGCAGAATGTGCTGATGAATTTAAT
+TTAGAGAAGTTTGTATTTATATCTACTGATAAGGCAGTTAATCCAACTAATATAATGGGG
+GCAACTAAAAGAATTGGTGAGATGATAATACAAGCTATGAATGAAGTTAGTAAAACAGAT
+TTTGTTGCAGTAAGATTTGGAAATGTATTAGGAAGTAATGGTTCAGTTATTCCACTATTT
+ATAGAACAAATAAAAAATGGAGGACCTGTTACTTTAACTCATAAGGATATAACAAGATAT
+TTTATGTTAATTCCAGAAGCAGCACAACTTGTACTTCAGGCAGGAGCTTATGCAAAAGGT
+GGAGAAATTTTTGTTCTTGATATGGGAAAACCAGTAAAAATTTATGATTTAACAGAAAAA
+TTAATAAGATTATCAGGGTTTGAACCGAATAAAGATATACAAATAAAGATTGTGGGACTT
+AGACCAGGAGAAAAGCTTTATGAGGAACTTATTTTAAGTGAAGAAGAGCTTAAAAAGACT
+AAGAATGAAAAAATATTTATATTAAGTCCATTTAAGTTTGATATTAAAGAGATTAAAAAG
+AAAATAGTAGAACTTTTAAATGTAGCTTTAAATGAAGATAAAAAAGCCATTAAAGAGAAG
+CTTAAAGAAATTGTGAAAAATTATAGAGATTTAGAGCAAATAGATTTTATATAAAAGTGT
+ATTAATATATAAACTTTATAAATTAGCTTTTGTCATAATTGTTAATTTTTTATCAATTTA
+AGATGTAATAAAAATAGTTTTAAAATAAAAAAGGAGATAAATCTTAATGAATATACCATT
+TTCACCCCCAGATATTAGAGAAAAAGAAATTAATAATGTAATTGAAGTATTAAAATCAGG
+TTGGATAACTACAGGAAATAAAACCAAAGAATTTGAAAGAAAAATAGCAAAATATTGTGA
+AACTAAAAAAGCTATATGCTTAAATTCAGCAACAGCTGGATTAGAACTTATTTTAAGAGT
+TTTGGATATAGGAGAGGATGATGAGGTAATAACAACAGCATATACTTACACTGCGTCAGC
+AAGTGTAATAAATCATGTTGGAGCTAAAATTGTTTTAGCAGATACTTCAAAAGATACCTA
+TGAAATAGATTATGAAAGATTAGAAAAATTAATAAATGAGAGAACAAAGGCAATAATTTT
+AGTGGATTTGGCAGGAATACCTTGTGATTATGATAAAGTGTTTGAAATTGTAAATTATAA
+AAAGAAAAATTTTAAAGCCAAAGGTATTATTCAAGAATTTTTAGGAAGAATTGCAATTAT
+ATCAGATGCTGCACATTCTTTCGGAGCAATCTATAAAGGAAAAATAAGTGGAAGTATAGC
+AGATTTCACTAGTTTTTCATTTCATGCAGTAAAGAATTTAACAACTGCTGAGGGAGGGGC
+AGTAACTTGGAATATTAAAGATAATGAATTAAATGATATTTTATATAAAAAATTCAGTTT
+ATTTTCTTTGCATGGTCAGACAAAAGATGCTTTATCTAAAACTCAAGTAGGAAATTGGGA
+GTATGACATAGTCTCTTTAGGATATAAATTTAATATGACAGATATAATGGCAGCAATAGG
+GTTAGCACAATTTGAAAGATATGATGAGATACTTAAATATAGGAGAAAAAATATTGAATT
+ATACGATAAATTATTAAATGTTGAAAATATAAAAGTTTTAGATCATTTTAATAATACATT
+AAAATCTAGTGGCCATTTATATTTCATAAATATAAATGGAAAAGATGAAAATTTTAGAAA
+TAATATAATAAAGAAACTTGCAGAAAGAGGGATTTCAACTAATGTACATTATAAGCCTTT
+ACCTATGTTTACAGCATATAAAAAATTAGGATTTAAAATTGAAGATTATAAAAATGCATA
+TAATTTATATAAAAACGAAATAACTCTTCCTCTTAATACTATATTAACAGAAAGTCAAAT
+TGAATATATATGTAATGAGTTAAAAGGAGCTTTAATTTAAATGATATGTTAAATATTGCA
+AAAAGGACGTTTGATTTATTTTTCTCTTTGATAGGAATAATTATTACAATACCTATTTTT
+ATTTTAGTAAGTATTATGATAAAACTTACTTCCAAAGGACCTATTATATTTAAACAAGAG
+AGAGTTGGTAAAAACAAAAAAATATTTTATATATATAAACTTAGAACTATGACAGATTGT
+GATGTTAAAGCTAGTGATAGACAAGTAACTGTTATAAATGATCAAAGGATAACAAGAATA
+GGAAGAATACTTAGAAAATATAAAATAGATGAATTACCTCAATTATATAATGTATTAAAA
+GGGGATATGAGTTTTGTAGGGCCTAGGCCTGAAGTTAAAAAGTATGTAAAGTTTTACGAG
+GAAGAATATGATGAAATATTAAAAATTAAACCAGGTATAACAGATTTAGCTTCAATAGAA
+TATATAGATGAAAATACAATCATATCTAAATATAGTGATCCTGAAAAAGTATATATTGAA
+GAAGTATTGCCTAAAAAACTAATGTTAAATAAAAGGTATATAGAAGAAATGTCTATAAAA
+AATGATATTCTTTTAATTTTAAAAACTATTAAAAAAATAATTAATTGATTATAAATTAAG
+GGGTAAACTTATGTTAGTTTCATTTATTATAATAGCTCATAATGAGGAAAAAAATTTAAA
+AAATTTATTAGAAGATTTAAATGGACAAACTTATCCTAAGAAATTAATTGAAGTGATATT
+AATTGATAGTATATCTAGTGATAATACTAAGAATGTAATGAATGAATTCAGAAATTCAAA
+TAAGGAATTTAATAAAATAATAATAAAAAGCAATGTTAAAAAAATACTACCTTGTGGATG
+GAATATTGCAATATCAGAATCTAAAGGGGATATCCTTTTAAGGGTAGATGCTCATTCTAG
+AATTCCTAAAAATTTTATTGAAGAAAATGTTAATTGTATAAAAAGTGGTGAAAAAATTTG
+TGGTGGATATAGAGAAAATATTATATTAAATAAAAATAATTGGAAAGAGACGTTGTTATT
+AGCTGAAAAATCTATTTTTGGTAGTAGTATTGCACCATATAGAAGAAATATAGGTAAAAG
+GTATGTATCTTCTATATTTCATGGTGCTTATTCTAGAGAAGTTTTTGAGAATACAGGACT
+TTTCAATGAAAATTTAGCTAGAACTGAAGATAATGAAATGAATTATAGAATAAGAAAAAA
+TGGATATAAAATATGTTTTAATCCTAATATAAAATCATATCAATACACTAGAAATAATCT
+TTTAAAAATGTTAGAACAAAAATTTTTAAATGGTTATTGGATAGGACTAACTTTAGGGGT
+ATGTCCTAAATGCATTTCCATATATCATTTAATTCCATTTTTATTTGTGTTAGCCTTAGC
+ATTTACAACCATTAATATATTTTTAAATTCATACGGGCTATTTATAATTTTAGGAATGTT
+ATATAGTTTTTTAATAATAATAAATACTTTATTTATTATTAAAAATAATGAATTTAATAT
+ATTTTATATTTTTTTACCTATTATATTTCTACTATTACATCTAAGTTATGGAATAGGTAC
+ATTTATAGGAATTATAAAATTACCATTTTTTAAGATTAAAGTTTATAAGGGGAGAAAAAT
+AAATGAACAAAATTAGAGTTTTGCATATGGTTTCAACTTTAAGTAATGGAAGTGGAGTAA
+TGGGCTTTATAATGAATGCTTATAGAAATATTGATAGAAATAAAATTCAGTTTGATTTCA
+TTTATTTTGATAATGAAGAGAGAAGTATAACCTATATAGATGAAATATTAAAGCTTGGTG
+GAAAAGTAAATTATATAACAAAACCAAATAATTTAAGGAATATAAATGAATTTAAAAATG
+AATTAAGTGAAATTTTAAAGAAAGAAAATTATAAAATAATTCATTTACATGAAGTATATT
+TAAATAAATTTGTAAATGATGAAGCGAAAAAAGTAGTAGGTGCTAAGGTAATAGCCCATA
+GCCATGCAACAAAATATTCAGATAACAAAATAAAGGCTATTAGAAATAAAATATTATGTT
+TTAATTTAAAGAAGAATGTAGATATATTTTTTGCTTGTTCTAAGGCGGCAGGAAAGTTCT
+TATATGGGAAAAAAGCTTTTTATGATAATAGAGTATTTGTAATTAATAATGCAATTGAAA
+TTGATAAGTTTAAATATAATGAGAATATAAGAAATAAAGTAAGAAAAGAACTTAATTTAG
+AAGAAAAATTTGTTATTGGTAATATAGGAAGATTTGCTAAACAAAAGAATCATAAGTTTT
+TAATTGATATTTTTTATGAGGTTAAAAAGAAAAAAGAAAATGCTTTTTTATTATTAATAG
+GAGAAGGAGACTTAAGAGAAAGTATAGAAAGAAAATTAGAAAAATTAAATCTAAGAAATT
+CTGTTTTATTTTTAAGCTCTAGAAAAGATGTTAATGAAATTTTACAAGGTATGGATGTTT
+TTGTATTACCATCATTATATGAGGGACTTCCGGTATCCGTAATTGAGGCGCAAACTTCAG
+GGTTACCTTGTATTATTTCTAATAAGGTAACTGATGAGGTCAATATAATTGATTGTAAGT
+TTTTAAGTATTACTAATGCGAAAGTATGGTGTAAATATATTTTAAAGTCAGAGGATCACC
+TTAGAGTAGATACTAATGAAAGTATTACAAAAGCAGGATATGATATCAAATATGAAGCTT
+TGAGAATTCAAAACATTTATGAAAAACTTTATGCAGGAAGGGATATTTAAAGTATGTATC
+TTTATTATTTTTTCATAATATATATCTTTTTATGTGCATTAATTATATATAACAAAAAAA
+ACAAATTAAAATTAAGTGAAAAAAATAATATATATTTATTCTTAAATTTTAGCATGTTTA
+TTTTTATTAGTGCTTTTAGGGGAAGAAATATAGGAAATGATACTTGTAAATATTTAGATT
+TATTTAATAAGGTCAGATTTAAAAGTATAACTGAGCTAAAAGATAGGTATGAAATAGGAT
+ATTTATATTTAAATAAGATGCTTTCATTAATATCTGATAACCAGCAAATAATATTAATAG
+TAACCAGCTGTATTATATTAATTTGTTATGCATATTTTATAAAAAAATATTCTGCAAATG
+TTTGGTTGAGTGTATTTCTATTTTTTATATTAGGTTACTTTACATCAAGTATGAATACAA
+TAAGACATCAAATTGCCTTAGGATTAGTATTAATTTCTTATAAATATATAAAAGAAAATA
+AAATTTTTAAATTTTTAATTTTAATTTTAGTTGCATCAACATTTCATAGTACCTCAATTA
+TATTTTTAATTTCATATCCAATATCTAAATTGAAAATTAATTTTAGAAATATTATGATGT
+TTTTTTGGTTTGCTATATTAGGATATGCTCTATTTGATAAGATATTTAGATTTATATTAT
+TAGGAACAAAGTATGAATATTATTTAAAAACTGATTATCTAAATGGTGATGTAAGATTAG
+CGACTGTAGTTAATATATTAATAATAAGTACAGTTTTATTATTTGGAATTATTTCATCAA
+ATAATATAAAAAAGAGTAGAGATTATAATATTATGTGTTTATTTTTGTTTACAAGTCTAT
+CAATAAGTATAATATCACTAAAGTTTAATTTATTGGATAGAGTTGCTGATTATTTTCAAG
+TCTTTATTATAGTATATCTCCCTAATGTTATTAGTAAAATAAGTAATCAAAAGAAAAGGA
+TTATTGCAATATATTTAGTTATTGTTATGTTTTTTTTATATGGAATATCAATACAGTATT
+TAAAACCAGAGTGGAATAAAGTATTTCCATATAGCTTTTTTTGGAATTAGAATTATATAA
+ATATACAAATTTAAAGAGGTATTTAAATGAATATAAAAGAAAATATATTAAGGATATTTT
+CAGCTAACTTTTTAGAAGTTATTTCACGTATAATCATATCTTTTATTATTCCAATTATAT
+TATCTATAACTGAATATTCTAATTTAAAAACATATATGTTATACATTTCATATATAACTG
+TTTTTACATTAGGATTTGAAGAAGGAATGTATATAAAATATGGAGGAAAAGAGTTTAATG
+AAATAAATTTAGAAACATTTAAGTATGAACATAGGTTATATATATTATTACAAATAGTAT
+TTTCAACTATAGTTTTCCTTTTGGGAGTATTTAGTGAAAATTTAATCTTAATTCTTATGG
+CAATAACAATAGTTCCTTATAATATAGTAGTTTTTTTTAAGGCTAATTATAAGGCTTTAG
+GAGAATTTAAAATATACACTAAAATAGTATATTTACAGACAATTTTAGATTTAATATTAA
+ATATATTATTAGTTTTTTTTATAAAAAGTAGTAGTTATATAATGTTTTGTTTAGCTATTA
+TAGTTATTAATTTAGCTGGAGCTTTTTATGTTGAAGGAAATTTTTATAAAAAATTAAAGG
+GTATAAAATGTGTTTATAATAAAAAAATAAAAAATAACTTTAAAGTTGGATTTGTTATAC
+TAATTGCTAATTTATCTATAATGATATTTTACGGTTTAGATCGTTGGTTTATAAAAATAT
+TCTTTACTGAGTATGATTTTGCGTATTATTCATTTGCTATATCTATGCTAAATTTAATAA
+ATATTTTAATAAATTCTATATCAGTAATATTTTATAATTATATAGCTAAAGATGAAAATA
+AAACTATAATAAATAATTTAAAAAGGTATTTATTAATTTTAGGAGCTTTTGCAAGTTTAT
+CTTATTTTGGATTTGCAGCAGTTATTAATATATTTATAAAAAAATATATACCTTCTTTGA
+ATATAATAGCAATATCTTTTTCTGCATATCCTTACATCATAGTAATAAATATAGTAATTG
+TTAACTTATATAAGGCAAGAAAAGAAGAAAGAAAATATTTGAAAGTAGTATTAAAAATGC
+TTGGAATAGCATTTCTATATAATTTAATTACAACAATTCTATTTAAAAATTCAATATTAA
+TAGCGGCATCTACAACAGCTTCATTTATTACGTGGTATTTTTATTCTTTAAAGGATTTTA
+GTTATTTATTTAAAGATAAGAAAGAATTAAAATTTTTAACTATTAATTTAATAGGATTCT
+TGATATCATCCCATTTATTTAATTGGTTTTTAGGAGGAATAATCTACTTAGCAATTATAT
+TATTAACAGTGAAAATATTCTTTAAAAATGAATTCTTAAAAGGAATGGATTATATAAGGA
+ATAATAGATATTTAAATTAAATAAAATTATATCGGGGGAATAAATGAGAAATTTAGGGGA
+ACTTCAAAAAATAAATTTAGAAATGCTTTTAGAAACAAAAAGAATTTGTGAAAAAAATAA
+TATAAAATATTTTTTGATTGGAGGATCTTTAATAGGGGCAGTAAGACATAAAGGGTTCAT
+ACCTTGGGATGATGATTTAGATATAGGAATGCTTAGAGAAGATTATGAAAAATTTTTAAG
+TGTTTGTAAAAATGAATTAAGCAATGATTATTTTTTACAGAATAAAGATACAGATAGCAA
+TTTTGGTTTCTGTTTCACTAAAATGCTTAAGAATAATACTTTGTTAATTGAAAAAGCAAC
+AGTAACCTCAATGTGTAAAAAGGGAATATTTATAGATATAGTACCTTTTGATAATGTACC
+TAATAATTTTTTGCTTAAAATATTACAAGCTTTGAGAATAGACGTACTAAAAAGATTAAT
+TTTATTAAAAACTAATTATGATATATCCATGGGGAGAAGAGGAATAAAAAGAATTATATT
+TGTATTTTTTAAGTGGTTGTGTAAATTTTGGAGTAAAGAGTTTCTTTTCAAAAAAATATT
+TACCTATATAAAAAAATATAATACAAAAGAATCAAAAGAAGTTGTTTATATAAGTGGTGC
+ATATGACTATTTAAAAGTTTGCGTCAATAAAAAATGGGTTGAAGAAACTATATATTTAGA
+TTTTGAAAATGAAAAAATAAGTTGTCCAAAAGGATACCATAATTATCTTAAAAAGGTATA
+TGGAGATTATATGAAGTTTCCATCTAAAAATAAAAGAGGAAATAAGCATAATATTATAAA
+ATTGGAAATAAATTAATTAGGAGAATTTGATTTGAGAGAGGATAATATAGGTATAGAAAG
+ATATATTAATATCTTTAGGAGTAAAGCTAAAGTTATATTTTTAATAATGATGATTTTTGT
+ATTAACATCTACATTAATAAATTTTTGTTTAATAAAACCAAAGTATGAGATAAAGTCTAA
+AATATTTATAGGAAAAGAAGATAAACAAAATAATGGAAATTATGATAATAATGATGTTGA
+AATGTATAGAAGACTTGTAGGAACATATTCAGAAATTATGAAATCGGAAGATTTAATTAT
+TAATGTTATAGAATCAAAAAACTTAAATTTAAATTCAGAAGAGGTTTATAAAAAATTAAA
+GGTAATACCAAGAGATGAGACTCAAATTATTGAAATTTCGTATAGAGATATTGATAAGGA
+ACGGGGGTTAACTTTAATAAATGGTATTATAAATGATTTTACTGAAAAATCAAAAGAATT
+AATTCCAAACGGAAATGTCCAAGTTATAGAAAAAGCAAAACTTCCAACAAAACCAGTTAG
+TCCCAATAAATTTTTAAATATATTTATAGCTTTTATTTTAGGAATAGTCTTTAGTATAGG
+GTTAATTTTAGTTTTAGATTTTTTTGATAATACAATTAAAACTAGAGAAGATATTGAAGA
+TGATATAGGGCTTATACTTATAGGAGATATACCGGAAATAAGAGGAAATGATATTAAAAA
+TTTAAAGGAGGAGCTAAAAGAATAATGTTAATAAATAAAGAAACAAGTTGTTCTACAGCA
+GAAAGCTATAGAAAATTAAGAACTAATATAAAATATTTATTTAAGGATAAAAGTTTAAAA
+AAAGTATTGGTAACAAGTACAGAAAAAGGAGAAGGAAAATCAACTGTATCCTCAAATTTA
+GCTTGTATTTTTGCAAAAGATAGTAAAAAGACTTTAATAATTGATTGTGATTTAAGATCT
+CCTAGTATACATGAAAATTTTGAAGTTTCTAATGAAATAGGGTTTTCAGATGTGATTATA
+GATATTACAAAATTAGAAAAGTCAATAATAAATTATTGTGAATATTTAGATATACTTCCA
+TCAGGAAAAATTCCTAAAAGTCCTTCAGAACTTTTAGGTTCAACCAATATGGATATTTTA
+CTAGAAAAACTTTCGGAGAGTTATGATTTAATAATAATAGATAGTACTCCTTTACTTTCA
+GTAACAGATGCTCAAATTATATCAACTAAAGTAGACGGAACTTTACTTGTAATTAAAGCT
+AATAAAGTATCTAAAAAAAATGTTTTAGTATCAAAATCTATATTAGAGAAATTAAATTCA
+AAAATTTTAGGAGCAGTTTTAAATTGTTCTTATAAAAAATAAAATAGATAGATAATTATA
+TAATATTTATGATAAAATACAATTAAGGAAATGATTACATTAATATATATAATATGGGAT
+TAAAGTGTTTTATTGTTTATTATAATATATTAAGTAGTTTTATTTTAATTTAAGGTTTAT
+TTTAGAAGATTAAGGAGTTTACTATGGAATCAAAGGAAATGAGATTAGCTAAAAAAGCAA
+AAAAACTTATAGATGAGTTTGAAAGGGTTCAATCGGTTCTTCTAAGTGGAGAATTATCTG
+ATCAAGAAGTGGAAATAAGAGATGATGGAGCTACTATTGTTCTTAAAAATATAATGCCAG
+GATATAGTGGAGAAGCTATGTTTAAGTTAACTCACATATCTGATGTGGTTAAAGCTTACA
+TTGATCATATGGATGAAGAAAATGATGAAATGATTAAGAGTTACGAAGTTGAAAATACTA
+ATTGGCATGAAAGTGATTTAGGAGATATTTACAGAGAATCTGCTATGGAACATTTAGAAA
+AAGTTGAAGTAGTAGGAGATAAAGTTAGACATACGTATAAGGAACTTAAAAAGATAGAAG
+AGAAAGCTAGAGAAATAGAAGGACTATAGGATTTAGTTTTTATTTGTAAAGTAAGGTTAT
+ATATTAAATAAACCTTACTTTATTTTATTTATAAATAAAATAACAATATTAATTAAATAC
+ACATTTAGGAGATATATTTTTTTGGATTCTATATAGTAAATAAAAGAATAATGAGAGTTA
+AGTACTTTAAAATAAGGAGAAGATAATTTTGAGGGGAATAGTTTTAGATAAAGGGCAAGA
+ATATTACACAAATTTAAGAAAGGTTTTTAAAGCTTTTAATAACATTCATCTTGAGTATAA
+CTGGCTTATTACAGATTGTTGTGCTTATCCAGAGAATGAAGATATAGAGGAGCTATTATC
+AAGAGAATATTGTTTTATATCTGGAGAAGAACTAAATAGCATAATTAAAAAAGAAGATTT
+TCAATTGATTTGGGGTGTTTTAAGTGGTTTCAATAAGAAAATCACTTTAGAAGAGATTAT
+GAAATATAATTTACCATACGCAGAAGATAATAAAAATATTTGGGAGAATCCAGTTTGCAT
+TCAACATCCTCTTTCAGAGATAGAGATAATTTCATGTGATAGCGATAAAACAGTTTTAAT
+AAGCAAAGATGAAAATTTATTAGGTAGTTTTAAAAGCAATTTTCCCTTAAGTGAAGATTT
+AGAATTTTACAATAGAAAATTAAAAAATAGATTATAAAACTTTAATAAAAAAAGAAATTA
+TTAAAAAATTTATGTTTTTTAGAAAGTAGGAAAATACAATGTTTCATTATGTTTTTAATA
+GTTTAACTAAAATTTTCTTTGAGTTTTTTGAAAAAAGTTAAGAGGTTCAAAGAACTTAGA
+TTATAAGAGACATTAAGAGTATTTCCATAAAAAACAAATAATTAATTGATTATAAACATA
+TAGGTATATGAGTATTTATTATAATACTTTGAACTGATGTATAATGTCAGTATAAATAAA
+AGGGATGTAAAAAAGGATGTGAAAAATATGTTATCTAGTAAGAAAATAGTAGATGATTAT
+ATTAAAAAAATAGACTGGAGAGTCAATGAAAATTCCAATTCACCATATAGTTTTGGGAGT
+CTCAATAAACATATAATAGCTGAGGTTTCTAAAGATTACTGGCTTAATGAAGTTTATAAG
+GATAAAAGAATAATAGATGCTTATAAAAATGGAGATATGCATATTCATGATCTAGGAGGA
+TTAACACTTTATTGTTGTGGATATTCCTTAAGAAACATAATTTTAATGGGAGTACAGGGA
+ATTCCTAATATTCCAACTAGTAGTCCTGCAAAACATTTTGATGCTATATTAAATCAAATA
+GCTAATTTGGTTACAATATATCAAAATGAGATTATGGGAGCCGTTGCTTTTAATTCATTT
+GATACATTATTAGCACCTTATATAAAGAAGGATAATTTAACATATGAAGAGGTTAAACAA
+AATCTACAAAACTTTATATTTAGTATAAATAGTAATAGTAGGGCAGGAGCTGAACCAGCT
+TTCACTAATATTACCTTTGATCTTTTTCCACCAAAAGACTTAGAAAATGACCCTGCTTTA
+ATTGGAGATAAAATTCAAGAGTTCACATATAAGGAATGTCAAAAAGAAATGGATATGTTA
+AATAAGGCATTTTATGAACTTATGAATGAGGGAGATTATAATGGAAGACCATTTTCTTAT
+CCAATACCAACTTATAATATAAACAGTAATTTTGATTTTGATAATCCTAATAATGATATG
+TTATTTGAGATGACAGGGAAGTTTGGGTATCCTTACTTTGCAAACTTTGTTAATTCAGAT
+ATGGATCAAAGTGATGTAAGATCAATGTGTTGTAGACTAAATCTTGATTTAAGAGAGCTT
+AGAAAGAGAAATGGTGGTCTTTTTGGAAGTGGAGATAGTACAGGAAGTATAGGTGTTGTT
+ACAATAAACTTACCAAGATTGGCATATAAACACAAAAATAATGAAAAAGAGTTTTTTAAT
+GCTTTAAAAGAAATATTGATTATAGCAAAAGATAGCTTAGAAAAGAAGAGAAAATGGTTA
+AATGACAATATTATAAATAAAGATATGTTGCCGGCATTTTCAACTTATGTAGGAACCTTG
+AAAAATCATTTCAGCACTATAGGAATAGTTGGATTAAATGAGATGTGTGAAAACTTTAAT
+GGAAATAATATATTAACTGAAGAAGGAATGGAGTTTTCAATAAAGGTTTGTAATTTCATA
+AGAGAAGAATTAATAAACTTTCAAGAAGAAACAGGAAATCTTTATAATTTTGAGGCTACT
+CCAGCTGAATCAACTTGTTATAGATTAGCTAAAAAGGATGTAGAGGACTTTGAGGATATT
+ATAGTTAGAGGGGGAAGAGAATATCCATACTATACAAACTCATGTCATATGCCGCCTAAT
+GAAGTTAAAAACTTAAAGCAATTATTTGATCACCAAGATAAGCTTCAAGTGTTATTCACA
+GGAGGAACTGTGGTGCATATTTATTGTGATGGAGCTATAAGTGGAGAAAAGTCAAAACAC
+ATAGTAAATACAGTTTGTAAGAAATATAGAACACCTTATGTAAGTATTTCTCCTTTAAAT
+AGATACTGTAAAGAGCATGGATATGTAAAGGAAAGGGTAGAAGAGTGTCCTATATGTGGC
+AAAAAGCTAGATTTATATCAAAGAATAACAGGCTACTTAAGAAAAGTTGAATTCTTTAAT
+GATGGTAAAAAATCAGAATTTAAGGATAGAAATCAGTTAAGCCTATGATTATAAAAACAA
+AGGGCATTGTTCATGAGAGAGTAGAGGATGCGCCTTTTATGGGAGCATTAATAAGTGCAG
+TAGATTGTAACTTAAACTGCAAAGGATGCTTTAATCAACATTTAAAGGATTTACCAAACA
+TAGAGATGGATTCAGAAGATATATTAGATAAAGTGACAAATGATCCTTTTAATGAAGGAA
+TTATACTTGCAGGACTTGAATGGTCACTTCAACCTAAGGAGTTAAGGGAAATGGTTAATT
+CGGCAAGGAAGAGAAACCTTAAGGTTATAGTTTATTCTGGACTAAGTGAAGAAGATTTTA
+AGAAAAAGTTCCCTGATATATATGGTTTAAAAGGAGACATGTACTTTAAGTTTGGAAAGT
+ATGATGAAAAATTAAAGGTGAATAATAATATTCAATATGATGTTAAGTTAGCCACATCAA
+ATCAAAAGATATTAAAGAAATAAAGATAAAGAACTGTACCAAGTATTATATAAGTTTTTA
+TACTTTGGTATAGTTCTTTTATTTTGTAAAAATTATTTAGAATAATATTGTTAACTAAAT
+AAAAAAGTTTCATAAATTATATATAAGATTTAAATGATATATATCCCAATAAATATTCAT
+ATAATTTTACTATAGATTATTAATAAAAGGTGAATTTATGAAAGATAGAAAAGCTTCAAA
+GTACCATAGTAGAAGTTCAAGAGTATTTGCACCAGTTCATATTAATTCAAAGGGAGTTAT
+AGACTATAAACTCCCTTTATGTGATTTAATGGATAGTATTCTTAGCAAAAAGAGTTTTAA
+TACAAGTGTAATAACAGAAACATTAGATGGAAATCAATATTATTATGATTATGATTTTGA
+TGGAAAGAATATTATAGTATCTAAAAGTCAGATAATTAATGATTCTCCTGGATTAAAGTT
+AATTGAGAGATATAAAGGGAATTACTTAGAAAAAGAATTATATAATGACTTAGTTGTTTT
+AGTATTATATAAGGATGATAAAAAGGTTACAGACACTATCTCTTACAAAAAAGATTTAGG
+TTTAAATGTTGATATGGTTATAGAGGTAGGGAGTTATTTTTATAGACTACCATTATGTGA
+GTTTATAGACAATATTATAAGGAAAACTCCAGATATTTTAAATTTTATATATTTTGGATT
+TGAAGGTGATATGTATTATATTACTCTTGAGTTTGATGGAAAAGATATAAATTACATAAA
+ATATAGTGTTAATAATTCTAAGCTAGATGAAATTGAAAAAGCTATAGGTAATAGATTGGT
+TAAAGAATTTAGTGGTCATAATAATATTATTCTTAGTTTATATGATGATAATACTCGTGT
+AAAAGATATTGTTGCTTATAGTAGTAAGTTTTTATATTGAATATTATAAGTAAGCAAAGA
+ATTTATGGTGATATTTTAAAAGGATGGGTTATTGAAGAGTATAAAAATAAATGATTATAA
+TTTAAGATTTGAGCATCTTATTTAAAATAATATTTAGAAGAAACTCAGTTATTACTGAGT
+TTTTTATGTATTTTATAAAGAAATCTACTAAAAGATTTTTAGAATATTATAGAAATATAA
+ACTTCTTAATTGTTTTTATTTTTAGTTTTTCCTCTAATGAAATTTTTTAAGCTAGATATA
+ACTAATACTAAAACTACAAAATACATTAATATGTAGTTTAAGGATAATAGATTACCATTT
+CTATCAAAACCGAATCGGTATAATAAAAATGATATTGTTACTAATATGATAAAAATTAAA
+TTAACTTTATTTTGGTATTTTATATTAATCTTTTCGTCTTTCATATAAAAGCTCCTTTTT
+TTAAGATTATTAAATATATTCTTGCATTAATTTTTAAAATTTTCAATTACATGTGTAAAA
+CTGGCAATATTTTATGAATAATTGGGCAAATATAGAGTTTTATAGTGATTAAAAGTATGA
+CATTGCTTACAGCATACCTTTCAAATATGTAAGAATGATATTTCGCTATAAATGGCTAGA
+AATAAAGGATTTATATTGAATCGTCAAAAGTTTCGTCAAAAATAAATTTAAAAAATATTT
+TCTATGATAGAATGTGCTTTATTAAACATATCATTATTGACATGAGAGTATACTTTCATA
+GTTTGTTCTACTGAATGACCTAATATTTTTGCAGCAGTTTTAAAATCAACTCCATTAGCA
+ATTAATTTAGTAGCGTATGTGTGTCTTAATTCATGAAGAGAAATGTTGAAACCATATTCT
+TTTAAAAGTATGTTTACTCTTGAAAGAATAGTGTTTTTACTTTTAAAATTGAAAACTCTA
+TTATCTATATTTATTATAGTTTTATATTTTAATAGTTCTTCAGAAACTGAATTAGAAATG
+GGAATAATTCTAATTGAATTTTTACTTTTAACACTACCTAATCCCCATGAATTATCTTTT
+AGTATTTTCCATTGTTTATTAACACTTATTAGACAATTATTAAAATCTATATCATTCCAT
+GTTAAACCTAGAATTTCACCGATTCTCATACCTGTATTAACAGCTAAATATACTACTAGA
+TAATATTTATTATTTTTAAATTTTAATAATAAATCGTTAATTTCATCATCATTCAGTGCC
+TTTTTCTTAGTTGGTATTGGTTTACCTATTTTTATATATTTACTTGGAACTTCATCTAGT
+ATATTGTATTTAAATTTTGCACATAAAAATATGCTATTTAATATTTTTAAATAATATCTT
+ATTGTATTATTATTAAGATGTTCCTTAGTCATATTATCTATTAATTTTTGTATATCTAAG
+TTAGTTATTTTGCAAAGTTCTTTGTCATTTAAATCTTGAAACCTATGAAGCACTGTTACT
+AAGCCGTCTATTGTCTTAGGTTCTTTGTATAGCTTTTCATGCTCTAGATACATATCTGAA
+AAAGCTTTAAAAGTTATTTTCCCAAAACTATTATTGCTTGTTTTTATATTTTTCTTTAAA
+TCTTGTAGCATCTTTTCAGCAATAGGTTTAGCTTCTTTTTTTGTCTTAAATCCTTGTTTA
+GATTTTTGCCTCCATTTTCCATTGTAATCCTTATAGCTTATTATAAATTGCCATCCTTTA
+TCTTTTTGCCTATAAGTTACGTTATACTCCATATCTAACACCTCTTTTAAAATTAAAATA
+AAATTTTTTGATACGAATATATGTTCTATAAAATCTATAAAATAAACAGTTGAAAATCAA
+CTGGTTAAAACATTTTACATATTCCTAATGATGGAATAAAGTATATTATGTAATTATCAA
+TTTTATACATAACGCCATATTTAGCTCTGTAATAATCAATTGCTTGATCAAAGTATTCTT
+TAGTTACACCTAAAAAATCAGCTATTTCAAAAGCATTTCTACAATTATTTTCAAAAGCGT
+TAATTAATCCAACTAAGCCAACAGCTTTATCAAACCCCCAGCGCCTGGCAACTAATTCTT
+GTTTTTTATTACATATTTCAGTTTGATCAGTAATATCACCTAAATTTTTAATATAGTGTC
+CAAGTTCTTCAGCTAAAATACATGTTTTTTCTTTGGTATTTATATTACTATTAATAACTA
+TTATATTATCAACGCATTTTCCGCAAGGTTTATCTGTGCCAAGATCAATTTCAATGACCT
+TAGCACCATGACATTCGGCTTCATACATTAATCTTTCGTATTTAGTCATATAAACCCACC
+TAACTTATTTGAGATTTTTTAAAGCTTTATTTATTTTTTCATTCATTAAAGCTTTTTCTT
+CATCAGTTAAATTGTCATCATGACAAGCTACTAAATAAGGAGTTTTTTGATTTTCTATTA
+GAGTAGCAGCAAATTCAGTATCTAAAGAATACTTAGGCATTTCTAATAAATCCTTAGTAT
+ACGAAAAAACTTTATCTTTTCCTAAGTCATTAAGTTTTCTTAAGTCTTCTATATGTATTT
+CTTCATCTTTAGATAAGTTGTTTGAATTTTCGCCAACTTCATCTAAACCTAAAAGCCATA
+TAGGACTTACGTCTAAAGCAGCAGCTATAACTCCTAATTTATCTACAGGCATATTTTTTA
+TTGATCCTGTCTCATATCTTTGTAGAGTAGATTTACTCATATTAGTTTTAGAAGCTAAAT
+CTTGATATGAAAGCTTTAGTTCTAATCTTCTACTTTGTATTCTATTCATTATCATTTGCA
+TGTTTGAGTCATCAAGTAAATTTTTCATTTAATCACCTCATAGTTTAATTATAAAATATT
+TTTTCATAAATGCAACGATTTTTTGAAAAAACTTAAAGAAAAGTTGCATAAATGGGTTGA
+CTACATTTTTCAGAAGTGTTATGATTTAATCATCCTAAATATGCAACGGAGGTGAGAAAA
+TGGTTTATAGCAAATTAAAAGGGATTATGAAAGAAAATGCTTATTCTCAGGGTAAGTTAG
+CAAAAGAATTAAATATAACCACTCAGAGTTTAAATGCTAAGTTAAATGGGAGAAGTCAAT
+TTACCATTAAAGAGGCTATAAATATTATATCTATTTTTAATATAAAAAATCCAAATGATA
+TATTTGAAATTTTTTTTGCAAATAATATCCCAAATATGCAACGAGATATAAGTTAAGGAG
+GAAATAAATGAATAACTTAATGATTTTCAAAAATGAAGATTTATCAATCGATGTAAGAAC
+AATTAAAAATGAAGATGGAAGTATTTCAATTAATGCTGAAGATACTGCTAGAGGGCTTGG
+ATTTATTCAAAATCAAAATAAGAATGGAAAACTTTATATAAGTATAAGATGGGAAACAAT
+CAATAATTATTGTAAGGAATTTAATTTCCCCAACAAGTTGGGGAAAGATGATTTCATTCC
+TGAGAGCTTATTTTATTTATTAGCAATGAAAGCTAATAATGAGGTGGCAAGAAAGTTTCA
+GACTTGGCTAGCTGTGGATGTAATACCTCAGATAAGGAAAAATGGACAATATCAAATGAA
+ACCAACATCTAATTTAGAACTTTTAGAGTTACAAGTTAAAGCGTTAAGAGAAGTTGAAGA
+GAGGGTAATTGAAGTAGATAAGAAGTTTGATGATTTACCGCTATTTGAAATAGACAGTAA
+AGATTTAAAGAAGAAAGTTAATAGAGTTGTAGTTTCATTACTAGGTGGTAAGAAGTCTAA
+TGCATATAAGCCTTTAAGTAAAAAAGTGTTTTCAGATTTATATGGACAGATTCATAGAGA
+ATTTGGAGTTGATACTTGTGCAGCTATTAAGAGAAAAGATTTAGATTTAGCTAAAGAGAT
+AGTTGATAGTTATACATTACCAAGAGTATTAAAAGAAGAAATTGAACTTGCTAATAGCCA
+ATTAGCATTTGCTCAATGATAAAGAAATGAAAGGAAAGATTAAGATGGAAAATAAAATAA
+CTGCCCAAGTCAATAAAGAGCAGTTAAAAGTTAAATCTATAATACAAACTGTATTAAATT
+GTTTATTAATTATTACTGTTTTAGTAAATATAGTTTCTCTTTTTAAAAGAGAGAATATAA
+ATAAGCAATTACAAATGCAGATTGAAGAAAATAAATTGGCTATACAAAAGGTTGATTTAA
+TAGTTGACCAGCTTGAAAAAGAAATTACTAATCTTCAGAAGAAAGGTTCTTTAGATTAGA
+GTTTAATTTTTCTAATTCTTTAGTTAACTTAATATTGGTTTCAGTATTTTGTTGAATAGT
+TTTAGTCATATGTTCATTAGATATATTACTTTGTGTATCAGAATAAAGTCCATATACAAA
+AAATAATAGGGTAACAACAATATTAATAATATTTAAAATATCTGATTTACTAAGTTTACT
+ATTTTCAAAAGTTTCCTTTGTCGAGTCTATAGAACTAACATAAGAATCGATATCACTATT
+GACTATATTATTTTCATTACAAAATTCTTTAAGTGAATCAGTGAATGAATATATGCTTTC
+AGCTAATTCATTTGAAAACAAATTATAGTTTATATTTGAAGTTAATTTAGTTAATTGATT
+TAAGTTAATAAATGAGTCATTATATATTGCTTTTACCATAGAACTAATATTTTCAATATT
+TAAAGTATTAAAATCTTTAACCATTTGTTGGAGTTGTAAATTAATATTTGGCAATGGAAA
+AGTAATTTTACTAAGTTGAGAAATTTGTTTCATGCAACTTTCGATTGAGTAAACACTAGA
+AGCAAGAGTGAAATTTGGCTTGTAAATTGGAGTAGGAATTTTTATAGAGTTTCTAATTAA
+TTTACTATAAATTTCATTATTAGATTTCATATTAACCATAATTATACCACCTTTCATAAT
+TTATTTCGACTTGGCGGAGCCGATACTTAAATTATAAAGGTTGGAAATATATAGGACAAG
+TATCAGTAAACAGCGAATCCCTCTGATACTAAGGGAATGAATAAGACAAGCTTTAATTAA
+AACCTAAGGATAAGTAAATCGAAGGAGGGCAAGAAATGGCACAACTATTAACACAAAAAG
+ACTTAGCAGAACGTTGGCAAATGAGTGTTAAGTCTATTGAGGAGTATAGAAAAGCAGGAA
+TTATCCCTACTGTAGAAGGGATTCCTGCAATAAGATTTAATTTACAAACTATTTTGGAGC
+TAGAAGGAACTAAATTAGAAAGATTTAGTCCATTAGAACGTAGACGTATGGAAATGGAGT
+TAGATGAAGTAAAAGAAGAGAACCAAAAGTTAAAAGATATCTTAAGTAATGTACTAAGTA
+ATTTAGCACCAATAATAAGTCTTGTAAAGGAGGTTTGATATGTTTACGCCAGGAGGAAAA
+ATAGTCTTTGGAATAATAACAACAGCAACAACTTTATTTTTAAGTGTTTATTTTTTAGAT
+AAATCTATAAATGAGAAAGATCCTAAAAAAAGTTTTAAGTATTTAATGTTATTTGTTGGA
+TGTACTTTAAGTTTTATCTTTTCAATAAATGTAAGTTAGGGGTGATGTTATGAACTTTAA
+AGATATACAGAGTTTAAAGGCTAGACATAGTAAAGAAGAGTTTGAAAGTATCTTGTTAGC
+TGTAGAGCAGGATTTAAAATTTAATAATATTAGATTTAAGAAACCTATTCCAAAGAAAAA
+GTTTTTAGAGGTTCTTAACATAACAGAAAGTTTGTTTAGGAGGATTATATGAAGAAAGTA
+AATATAGGATGTTTAGTAACTGTAATAGGTTTAGTTATTATATGGTGTTTCTTTTACTAT
+TTATCTTATAAGGTTTGGTGTTGGTTATGGACTTAGTAAAAGTATCAAAGAACATAGCTG
+ATAGAGTACAAGAAAGGTTTAGCGATTTAAAAGTAGACAAGCCTTTAAGTAATTTAATAG
+AGGAAGAAATAAAAAGAGAGTGCATTGGCACCGACCAAAGTAACCAATGTACTCATAAAA
+AATAAATTTCAAAGAAAGTTTAACATAATAAATTTAAGGAGGCAAGTTATGATTAATATA
+CCAGATTGTTGTTATGAATACGGAAATGATGAAAAAGAGCCAAAAGTAGCTTTTGAGTGT
+AGTTGGTGTGGTGAGTGTATATATGTTGGAGATGATTATTACGATATAGGGGATATAAAA
+ATGTGCTGTGAATGTAATGATGAATGTAAGTCAGTAGCAGAGGAGGGATTCTAATGGAAG
+AGAGATTAGAGTGGCTTAGAGAAAGACAGAAAGGAATAGGAGGCTCCGATATAGGAGCTA
+TCCTAGGATTAAATAAATATAAAACAGCTTTTGAAGTTTATTTAGAAAAAACAGAACCTA
+TTTTAGAAGTAGGAGAGCAATCAGAATCAGCCTATTGGGGAGATCAATTTGAAGAAGTAG
+TTGCTAAAGAATTTGAAAAGAGAACTGGTAAGAAAGTAAGAAGAGATAGAAGGCACTTTC
+AAAATAAAGATTATCCATTTATGGTTGCTAACATAGATAGAAGAATTGTAGGAGAAAATT
+CAATTTTAGAATGTAAAACAGCTAATCAGTATTTAGCTAAGGAATGGGAAGAGGAAGAGG
+TACCTGCTAGTTATTTAGTACAAGTTCAACACTACTTAGCAGTTACAGGAGCAACTAAAG
+GATATATAGCAGTTTTGATTGGTGGACAAAAGTTTATTTGGAAAGAAGTTGAGCGTGATG
+ATGAACTTATAGAATACATTATTGAAGCTGAAAAAGATTTTTGGAAAATGGTCAAAGACA
+AAACACCACCTGCATTAGATGGTTCAAGTGCTGCTGAAAAATGGGTTAATGAGAGATATA
+AAAAAGTTAATGAAGGTGAAGTTATAAAACTAGATTCATCATGGAAGGAGTTACTTAATA
+AAAGAAAAGAACTCAAAGAATATAAAGATAATGTAGAGCAAGAAATTAAAGAGATAGAGA
+ACCAATTAAAGCAAAACATAGGATATGCAGAGTATGCTAATGTTCCTGGATATAGCATTA
+GTTTAAAACAATCAGTAAGAAAAAATTTAGATAGTTCAAAAATTAAAGAATTACTTAAAG
+ATGATTATGAAAAATATTTAAAAGAAAGTATAAGCAGAAGATTAATAATTAAGGAGGAAA
+AATAATATGGCAACAGCATCAAGTTTAAAAAATCAATTAGCAAAGAAGGGAACTGGTAAT
+AGTTTATCAGTTGGAAATACAGTTAAAGGATTAATGGATAGTCCAACTATAAAGAAAAGG
+TTTGAAGAGGTATTAAATGAAAAGGCACCTCAATATATGAGTTCAATAGTTAACTTAGTT
+AATTCAGATACTAACTTACAAAAATGTGAAGGAATGAGTGTAATAGCAAGTTGTATGGTA
+GCAGCAACAATGGATTTACCAGTGGATAAGAATTTAGGGTATGCATGGGTAGTCCCATAT
+GGTAATAGAGCTCAATTTCAAATGGGTTATAAAGGGTATATTCAATTAGCATTAAGAACA
+GGTCAATATAAGTCTATAAATGTAGTTGAAATAAGAGAAGGCGAATTAGTTTCATGGAAT
+CCATTAACAGAAGAAATTGAGGTTGACTTTAGCAAACGTGAGAGCGATGCAGTAATTGGA
+TATGCAGGATATTTTAAATTAATAAATGGATTTGAAAAGACAGTATTCTGGACCAAAGAA
+GAAGTTAATAATCATGCTAATAAATTTTCAAAGACAGTTAATTCAAAAAATTCTGTTTGG
+AAAAGCAACTTTGATGCGATGGCCAAGAAAACAGTTCTAAGAAACCTACTATCTAAATGG
+GGAATTTTAAGTATAGAAATGCAAAAAGCATATACAGCAGATGAAAACTTAATTAATAAA
+GGTCTAATGGATGATATAGAAAATGTACAAGCTAACATTGAAGGTATTCAAGAAAACAAT
+GAGAATGAAGGTGTTATTGAAGCTGATTATACAGTTGATAGTAACAATGAAGTGCTTGAA
+GGGCAACAAGATATATTTGAAGGAGCATCATTATAAGATAGGAGGGGTTAGTTATGGCAG
+AAGGATGGATAAAGCTTTATAGAAATATTCAAGAACATTGGATATGGCAAGATCCACAAA
+AGTTAAAATGGTGGCTAGACATTCTTCTTCTAGCTAACCATAAGGAAAATAAATTTTTGC
+TAGGGAATGAATTAATGGAAGTTGAGAGAGGGGAACATCACACATCAGAGTTAAAATTAG
+CCGAAAGATGGGGTGTATCAAAAACAACAGTAAGAAAGTTCTTAAAGTTACTTGAAAGTG
+AACAAATGATTGAACTTAAAAAATCGAAAAAGGGTACCACCTTGAAAGTTAGTAATTACA
+ACGATTATCAAGATTTTTCAGAGGGTGAAAAAACCATAAAAAAACCACAAAAAAACCATA
+GCGTATACCACAAAGAAACCATAGAAGAACCATATGCTATACCACAAAAAAACCATGAGG
+TATACACAAACAATAATGAAAAGAATGAGAAGAATGAAAAAAATGAGAAAGAAGGAGAAG
+AAGTAGTAAAATCAACCTCACCTCGTTCCTATCCTTCTCCTAGTCATAAATTATTAGCTA
+ATTACTTAACAGATGTATGTTATAGAACTTTCTTTAACAATGCAGATATTGTTGAAGAAA
+ATGAAGTTATAAAAATTAAACCAGAGAATGATTTTTCTAGAGGAGCTATTGAGAAGTATG
+TTCCAACACTAGAAATTCAAACTCATAAAAAAATAGAGGTGATTTAAGTGAAAGTTAATT
+TACTAGAAGTTTATTCAGTACATGAGCTAGCATTAAAGACCTACAGAGATTTAGCTAAAA
+GAAAAATAGAAAGAAATAGAGAAGTAGATGCTTATTTAAAAGTTAGAGAAATAAGTGGAA
+GAAAGAAATGGAATGTTAGATTTGGAGGATATAGGTGGTAGTAGTTACAGGAAAGATAAG
+AGGAAAGGCTAGGCCGAGAGTTTGTAGAGGCCATGCCTTTACTCCTAAAGATACAATTGA
+GTATGAAAAGTTAGTAAGAGAGTGTTATAAGAAACAAGATGGAAGATACCTAGAAGGAGC
+TATAAAGGCTTTGATAATTGCTTACTATAAAATACCTAAGTCTTATACTAAAAAACGTGT
+ACAAGTCATAAGGGATGGATTAGAAAAGCCAACAAAGAAACCAGATGCGGACAATATAGG
+AAAGGTTATATTAGATAGTTTAAATGGAGTAGCTTATAAGGATGATAGCCAGATTATAGA
+TCTTAGAATTAAAAAAGAATATACGGAAGAACTTGAGAGAGTTGAATTTGAATTTAGATA
+AATAGAAAATGTTCTTTTTAAATTTAATAATGCGGTATTGAGGGCATATACATGCCAAGC
+AACAATTAGTATAATTTTATTATTATGTAAGTTTATTATTCAATAAACTATATGATAATT
+TCAAATTTATTAGGAAGGAGTTAATCTATAATGAAAATAGACTGGAATTTTTTACTTTCA
+GTAATAACTATTATTGTTGCTAGTTATGCACTAATACAAACCCACCATCAAATGAAATTG
+AGCAACAAACAACATTTATTTGATAAGCGTATGGAAAACTATCTAATTGCTATGGGATTG
+ATACAGTTATATAGAAATAACTGTAAGGATTTCGATAAGGATTTCGATGAAGAAAAAGAT
+GAACCAATTTTTGCTTTAAAGTCATACTTTATATGGTTGACAAATAACACTTATTTGGAA
+GAAATCACTACTGCAATAGATAATCCACTAAAAAACCCAGGTCATAAAGAGTTTTTAATT
+AAATTGGAGAAATTAAAGGAAGTTGGAACTAAGATCAAATTTTTATTTCCTGATAATGCA
+TCTGATGCATTAGGAGACTTTGTTTTTAGTTATCAGGAATTGCTATTTTCAATGTATCAG
+TATCAAATACTTTTAAATAATATGTATGAAATTAATAAAGATCATAAATTAAGTCTTGAG
+GAAATACAACAAAAATTTGGGGAACCAAAGCATAGGCTTAAGCTGCAAAGGTCTTTTCAA
+AATTTAAAACAAGCAGACGATTTATTAAAAAAGAAAAATGTTGAAGAAAAAATTAAAAAT
+CAAATAAAATTATTATAGATAACAGTTTGTTAATTAATTACTTAAATAAAAAAATAAATC
+AAATATATTATTAAAATACCGTATTATTCAAAATGAATATGCGGTATTTTTATTTAAATT
+CAGAGATTAAGAGAAGTGATATATATGACAAAGAATCAAATAGGTTTCTTTGATAAACCT
+AAAATAAAGTTGTTGGAGGATTGGACAAGGCTCCATCCTCTATTAACTAAAAATAGCGTT
+CATGAGGTTTTTATTGAAAGGGAGAACTATTGCATCATCTTGATAGATAAAACTTTCTAT
+GGCGTTTATAAGAAGGATATAGAGCGGTGTTAGATTTTAGCCATGTATTAAAATTTATTT
+TATATAATAAAAAAACGGATACTTAAAGTATCCGTAAACTATCACACGAGGGGATTCGAA
+CCCCCACGGCCATATGACCGACAAGTTGGCAACTTGTTGCGTCTGCCTATTCCGCCACAT
+GTAGAAAATGAATTATTTCTAATTCATTTATATTTTAGATCAAATGAACAAAAATGTCAA
+CAAAAATACAAATATAATAAAATTTAGGAGGTATATATGAATAAAGAGCTATTCAGAAAA
+ACAGAAAATTTACTTAAGAATTACAATAGATTAGAAACTGAAATTAAATTAATAAAAGCA
+GAAATTGAAGATATTAAAGAATCTTATACTGGTTGTGTGGCCATTGGATATAGTGAGAAA
+AGTGGATCAACAAATAAATTTAGCAGTATGGTTGAGGATGAAATTATAAGAAAAGAGAAA
+GATCTATTCTATCTTAAGAGAGATTTAGAGTATAAGGTTAAGTTGAAAAGAAGAATAGAC
+TTAGCTATACAAACACTTAGAACTAAAGAAGAGAAAGATTTAGTTAAATTAAAGTATATT
+AATCAGCCCAATGTTAGTTGGGGGAATGTGGCTTACATTTTAAGATATAATAAGGATTAC
+TGCAGGAAAGAACTAAGGAATAAGATAATAAGGCAGATTGCAGATTTTATATTCTATAAT
+CCAGGAGTTCAAGAAAGGTTTATTATATAAATATACCCCATATCTATACCCGTTTAATAC
+CCACCATATACCTACTTTTATATGTTATTATGTAATTGTGGATAGGGTAAAGCGTTCATT
+GATGATCCTCCTGGATGTAAATTAAAACTTAACTAACGGAAAGAGCAAGGTGTAAAAGCC
+TTGCACGTGGAAGGAAGAGTATTAATAAAGGTGCAACTCCTTTACCTTCCTAAATAATAC
+TTCCTTTTAAGTTTATTTTTTCATACAAAGTCTAAGCTGGATTAAGTTCCTGCTAATATG
+GGGAGATAGTTTAATTGGTAAAACATTGGTCTCCAAAACCAAAGTATGAGGTTCAAATCC
+TTGTCACCCCGCCATTAAAAATTAAATAACCTCTGGATTACGGAAAAGAATTTAGTTTAG
+ACTAGGTTCTTTTTTATTTTGATTTTTGTAAAACTTTACCTTATAATAATTATGTGAAAT
+TTTATTATATATTAAGTGTTGGGAGGGGAACTATGAGAAAAGCTTTTTGGGGGTATATTC
+CATATGATGATAAGACTTTTGAAAAATTGTGGGAAACTGCAGATTTTGTTTTAGATGCTA
+ATATACTATTAAATCTATATAGATATTCGAATAATACAAAAGAAAAAGTGTTAAATAGTT
+TAGACAAAATATCTGAGAGGATATGGATACCAAATCAAACTGGTATAGAATATTTTAATA
+ATAGAGTCTCAATAATTTTAGAGCAAAGTAAGATTTATGATGAGGTTTTAGAAGAATTAA
+GTTTTTCTAAAAGTATAGATTATATAAAAGCTTTAAGACATTCAACTTTAGAAGATAAAA
+AGCCGGAAATTATAGAACTTTTACAAAAGTGTGAAAATAAAATAAAAGAAATTATAAATG
+AGGATAAGAAGAAATCTGAAAATATAATTGAAGATGATTACATTTTAAAAAAAATAGTTA
+ATATATTTGATGGTAAAGTGGGTTCGTCTTTAACTGATAAAGATTTAGAAAGCTATAAAA
+AAGATATTGATATAAGATATTCTAAAAAGATACCACCTGGATACAAGGATAATAAGAAAA
+ATGATGATAAAAAATATGGTGATGCTATAAATTGGTTAGAAATAATAAAATACAGTAAAA
+ATAATAAAAAAAATATTATTTATATAACAGATGATAGAAAAGAAGATTGGATTGAGATAA
+TAGAGGGTAAAAAAATTGGTCCAAGAAAAGAATTATTAAATGAGTTTTATCGTTCAACTG
+ATGGAAATATTATATACATATATAATACCTATAGTTTTTTAGAAGCATTCAATAAATATA
+TTAATACGGAGAATAACATAGGAAAAGATGTAATGGATGAAATAAAAGACTTAGATACTA
+TTTTAAATGATTTTGATAGTAAAAAAATTAGTATAATGAGCAAAAAAATATTTGATAAAT
+TTGTAGGATTGGGTGTAGAACCTAATTGTTTGATAATGATTAATCAAGAAAAATTCAATA
+AATATATGGAAATCATTAAAGATTGTCAAGAAGGTGGAGCAGATTTTCATTTATTTATAG
+ATGATTTAAAATTTTTGGAGTTCGTAGATAATTTATTAGTGTTGGAACCAACGATTTCAT
+TATCTAAAAATAAATATTATTATGAGTTGTATAAGAATTTTATAATAAAAAATAAAGTAA
+CTGTATAAATTTAAGTAGATAGAGTTTTTTTAATAAAAGCTCTATTTTTATTCTACTAAA
+GAAAGGTGGTGTTGTTATGAAGCTTACACCAAAACAGAAGGCGTTTGCTGAATATTATAT
+TGAAACAGGCAACGCCACAGAATCAGCTATTAAGGCAGGATATAGTAAAAAGACAGCTAG
+GGTAATAGGACAAGAGAACTTGCTAAAACCTGCCTTGAAATCTTATATAGATGAAAAGAT
+GAAAGAATTAGAAAGCAAAAGGATAGCTAAAGCAGAGGAAGTGCTAGAGTATCTAACTAG
+AGTTCTAAGAGGAGAAGAAACAGAACAAGTAGTAGTTACTGAAAATATAGGTGATTTTAT
+GAGTGAGGCTAAAGTTGTTGATAAGGAAATTTCGGCTAAAGATAAAATCAAAGCAGCAGA
+ATTATTAGGTAAAAGATATAGATTGTTTGTTGATAAAGTTGAAAAGGATAGTAACGTAAA
+TGTTAATTCTACAACTAAACTAGATTCTATACTTAACCAGTTAAAGGATGATGACGATGA
+GTGATGAATACAAGTTATCAGATAAGTATTTAGCTTTTTTAAAACATAGAGCACCAGTAG
+AAGCATTGGAGGGAACAACAGCAGCAGGAAAAACTACAGTAGGAATATTAAAGTTTATGC
+TGATGGTTGCAGAATCTCCTAAGAAAATGCATGTTATTGCTGCTAAAACAACTGGCGTTG
+CTGAGAAAAACTTAATACAAAAAGAATATGGAATTACTGATGTATTTGGTGATTTAGTCA
+AGTATAACGGTAATGGTGATAAAGATAATAAAATACCTCATATAAGATATATAACTCCTA
+ATGGTGAGAAAATAATATATATACTAGGTTATGATAACGTAGATAAATGGAAGATGGCCT
+TAGGTTCTCAATTCGGTTGTGTACTTATAGATGAGGTTAACACAGCTAGTATTGAATTTG
+TAAGAGAAATATGTACTAGAAATGATTATCTTATGATGACACTTAATCCAGATGATCCTA
+ACTTACCTATATATTCAGAATTTATTAATTGTTGTAGACCATTAGAAAAATATAAGAAAG
+ATGTTCCAAAAGAGATAATGGAGCAGTTAAATTCGGAACCAAAGCCTAACTGGACTTATT
+GGTTCTTTTCTTTTTATGATAATGCATCATTAAGTGAGGAAGCTATTGAAAAGAAAAAGA
+CGAGTGCTCCTAAAGGTACTAAGCTATATAAGAATAAGATACTAGGGTTAAGAGGAAGAG
+CAACAGGATTAATATTCTCTAATTTTGAAAGAAAGAATAATGTATTATCTAAAGAACAGG
+TTATTAAACAAATAAAAGATAAGAAATTAAAGTTTGTTCAATTTACAGCAGGATTAGATA
+CCTCATATTCTCAAAATAGTCCTGATACCTTTGCATTTACTTTCTTAGGTATTACAGATA
+AGAAAGAATTAGTAATGCTAGATGAAGAGGTGTATAACAATAAAGACCTAGAAACTCCAT
+TAGCTCCTAGTGATATAGCTCCTAAATACTTTAAGTTCTTAGAGAAGAATAGAAATGAAT
+GGGGATTTGCTAGAGATGTATTTGTAGATTCAGCAGACCAAGCAACTATAACGGAGCTTA
+AGAAGTTTAAGAGAACTAATCCATGTATGTATAACTTTATTAACTCTTATAAGAAAGTAA
+CTATATTGGATAGAATACATTTAGCTTTAGGTTGGATTAATACCAATGGTAAAGTATTTT
+ATTATGTTTTAGATACTTGTAAAGAGCATATAAGAGAACTTGAATGTTATTCATGGAAAG
+AGGATAAGTATGAGCCAGAGGATGCAAATGATCATACAATTAACTCTAGTCAGTATGCAT
+GGATACCTTTTAGAAAGATAGTAGGAGATTATATAACATAAGCACTTTCCTTAATTGTAT
+ATTTATTGTAAAATTACAATGAACGGAGGTGATAATTTGAATAAAATAATAAAATGTTTG
+AAAAAAATAATAAATTTTTTAAAATTAATACTCATTATTATTGCTATAGTATTTTCGTCT
+ATAGTATTAATAGCAAGTATTGTTTATTTATGTTTTGCTATAATATATTTACTACCTATA
+GGAATTGAATTTATAAATGGCAATTATGTTGCTACATCTACTATGATGCCAAATTACTCA
+ACAGTTTTCCAATCAATCTTTACATTGGTTAGTATATTTACTTCTTTATCAGTTAGTTTA
+TTATTATATAAGTTAAATAAACAACAAAATGCAGTTAAGTATAATAAAGAATTAGTAGCT
+CCTGCTAATTTAGTTTATTTTAAGATAAAATATTATCTTATACATCATTTAATTGAAGAG
+TTACGAAGAAATAGGAATAGGATAAGTAATGATCAATATCGAACTCAAAATGGATTAGAA
+GAAAGTGATTCAATAATTTATGAAAATATTGCTCAAGTTAATGTTGATACTTTAGAAAAT
+AATATTTATAAAATTTTATGTGAGTTAAATGATGATAGAAGTATAAATAAACTATTAGGT
+CTATATGAGGATATGAGAAGAAGTAATTCAATAATATATATTTTAAAAGATGAATTAACA
+AACTCATGTAATCTTGTTGAAACTAGGGGATATGAATGGGTTAAGGTACTAGTAGGTCTA
+CATAATAATAACTTTGAGTGTTTAAATGAAGATTATAAAAAAATCATGTATAGATTATTA
+GAATTAAGCAAAAGGAAAAAATAAACCGATAAAAATTTATCGGTTTATTTTTTGTAAGGA
+GGAGTAGAAGTGGGGTGGTTTAAGAGTATGTTAACTAAAGCAGCAATTAAATATTTAAAT
+GTTCAACCAGCATTAATTAATCCTATTACTATACAAGAAGCTTATACCTATGAAACTAAT
+GTGATTAGAAATAAGCTTTGGTATAGGGGAGAACCATACGAATTGGACCAATTCTTTAAG
+AATATATCAAGTGATCCAGTAAATAAAGCTAGGTTTTGGAGTGCTGTTCCAAGTGAAGAT
+TTAAGTATAAGAAAAATACATAGTGGATTACCTGCAATGATAGCTGATAAGTTAAGTGAT
+ATAGTTGTAGCTGACTTAGATAGTATAGAAGTTACAGGAGAGAATTATAACACATTATGG
+GAAGAAATAAGAAAAGATAATAAGTTTGATGATATGCTAGGTGATATAATTGCTACTACA
+TTAGTTAGTGGTGATGGAGCTTTTAAACTATCTATAGATACAGAGATAAGCAAATATCCA
+ATAATAGAGTTTTTCGATGGTGATAAGGTTGAATATATAACTCAAAGAGGAAGATTAAAA
+GAAATAAAGTTCTATACTTTTTATACTAAAAATAATAGACAATATAAATTAAGTGAAACT
+TATGGAAAAGGATATATAAACTATAATTTATATGATAGTAATGGAAATGAAGTTTCTTTA
+AATACACTTGATGAAACTAGAGAACTTGCAGATGTAACATATAAAGATGATTTTATAATG
+GGAGTACCATTAATGTTCTTTAAATCTCCTAAGTTTGAAGGAAGAGGGAAGAGTATATTT
+GATAATAAATCAGATGCCTTTGATGCATTAGATGAAGTTATATCTCAATGGATAGATGCC
+ATAAGGGATGGGAGAGTCCAAAAGTATATACCAGAGGATTTAGTTCCAAAAGATATTAAT
+GGTAATTTAATGAAACCTAATCCTTTTGATAATAGATTCTTAAAAGTAGGTTCTAGCCTT
+GCAGAAGATGCAAAGAATGAGATAGATATGAAGCAAGCTAATATAAATTATGAGGCTTAT
+GTTGAAAGTTATTCTAATGCTATTGATATGTGTCTACAAGGTATAATAAGTCCTAGCACT
+TTAGGAATAGACCTTAAAAAAACAGATAATGCAGAAGCTCAAAGAGAGAAAGAAAAAACT
+ACTTTATATACTAGAGGAAAAATGGTTGATATATTAACAGAGGTTATACCAGAGTTAGTT
+AATATAATCTTAAAGACCAATGATGTATTAAATAAAAAGAATACTGGAGAATATGAAGTA
+AGTATTGTATTTGGAGAATATGCAAGTCCTAGCTTTGATACAGTAGTAGAAACTGTAGGG
+AAAGCTAAAACCTATGGAGTAATGTCTATAGAGCAATGTATTGAGGAAATGTATGGAGAT
+ACATGGACAGATGAAGAAAAGGAAGAAGAGATAAAAAGAATAAAGGAACAGAATGGCTAT
+CTTGTAGCTGAAGAACCTAAGACAGTAGATGATTCTGATATTTCATATACTGATGATAAT
+GAGGTTGAAACAGATGGACAAGAGGGATAAGGATATACAATTATTAGCTGATATACTTAG
+AGGAATTACTGAAAATAAAATAAAAGAAAATGCTAAAAAGGAAAGAGATAAGTCTTATGA
+TATTAGAAATATATTCGAGCAAATGGAGCTTGATTTAATTTCTAGTATGCATAGGGCTTT
+TTATTTTCACCAAGCCGAGCAGAGTAAAGAAGGATTTCAATGGGAACAATGGCAAAGGAC
+TAAGCTTAGAGAAATTGAAAAGTATAGAAAGAGAAATAAGAAACTAGTTGAGGAATATAA
+CAAGCCTATCCAAGAAGCTATAAACAGAGAGATTCAAGGGGATTTTACTAAAGGTCAAGA
+AAATGCAGAAAAGTTAATAGATGAAGTAAAGATAAAGTTTCCAGAGAATATAAAAGAACC
+TCAAACAGTTAGAGAGTATATTGCTAAAGAACTAGGGAAAAAGACTAATCCACAAGTTGA
+AGAAAACTTCTTTGGTATTAACGAAAAGAAACTTAATGCATTACAAGAAACTGTTACAAA
+TGATTTAAAAAAGGCTCAAATGTCAGTTTTAAGAAAGATGGATGATGTATATAGGCAAAT
+AATATTTAAAACTCATGTATATTTGCAAAGTGGTACTAAGACTATTAATCAAGCTATAGA
+TATGGCTACTAAGGATTTTCTTGAGAAAGGTATAAATAGTATAACTTATAAGAATGGTAA
+ACAAGTTAATATTACTAGTTATGCAGAGATGTGTTTAAGAACAGCAAGTCAAAGAGCTAC
+ATTTTTAGGTGAAGGAAAGAAAAGAGATGAATATGGAATACATTTAGTAGTTGTTACGGC
+TCATGCTAACACTTGTAAAATGTGTGAACCATGGCAAGGAAAAGTATTGATTGATGATAT
+ATTTTCTCATGGTACTAAAGAGGATGGAGATTATCCATTATTAAGTGAGGCTGTAGGAAA
+AGGATTCTTACATCCTAACTGTAGGCATACATTAGCAACTTATTTCCCTGGTGTAACAAG
+ACTTCCAGTAGTTCCTAATGGTGAAGATGCTATTAAACTTTATGAGGTTGAACAGAAACA
+GAGATATTATGAAAGACAATTAAGAAAGTGGAAGAGATTCAAGGCTGGTACTTGTGATGA
+AGAGAATAAAGAAATAGCAAGTAAAAAGGTTAAAGAATTAGAAAAAGCTTTAAAGGATCA
+TTTAGAAAGTAATAAAGAGCTTAGAAGAAATAATTATAGAGAAAAAGCTAGAGAAGGCTT
+AAATATTAAGGATGCTAATATAGAGGCAGAAGTATTGAAGCAAAAGTTTCAAAATGCTAA
+AATTAAAGAAATAAGAGATTTCATTAAGAATAATCAACCTTTAAAAATAGAGGTTGGGAA
+ACAAGGTAAACATATTTTAGGACATAACAACTACATTGAAGGTAGAAGTTATTTAACCAT
+ATCTTTAGAAGAGGCACAAGAACTTATTAATAAGTATGCTGGTACTGGTGCTTTAGATAT
+GGATTCTAAAGGTAACTGGAGAAAAAAAGAAATAATAAAAACAGATAAGAAAATAGGTGT
+TAATGTAAGTATGTTAGATGGTTCAGAAAACAAAACAAATAACTTTAAAATACATTATTC
+TAAAAAAGGAACTCATATAGTTCCTAATTAAAGAGGTGATTCCATGTTTAACTTAGTAGA
+GACATTAAGAGATATAATGAAAACTCATAAGCTAGATAATAATCTTAAGTTAAAAATAAA
+AACTGTTGATGGGAATATCATTATTGGACCATATGAAGGATTTACACAAGCTTTAGATAA
+TGAACCAGAGATAGCAAGTATAGAAATAAAAAAAGATGAATATAACATAGAGCTATATGA
+AAATGAAATAGCTTCAATAGAAGTGTAGTAAGTTAATTTTGTTTTGGGGGATAAAATGGA
+AAGAAAAGTATTTATAGAAGGTAAAAATAAAAGTGAACAAGCTTATATAGGTTGGGAGTC
+AGAAGAATTATACCTAATTGGAGTAAAGGATGGATATAAAAGTTCAGCTGATGATCTTCT
+TGACAAAGCAATATTAGAAGGCCATAAAAATAGAATTGATATATTAGATAAATATATATT
+TCCAATAATGTTCTTATATAGACATAGTATAGAAATAAGCTTAAAACTTATATATAGAAG
+AGTTAATGGAAAGATACCAACTGGACATAATCTTATGACATTATGGGATAGAGTTGACAA
+GGATGTTTTAAACCTTTTAAATAATGATATTAAATTAAAAAAGCTTGAAGAAAAATATAA
+TACTAAAATTTATAGATTAAATATTGATAAAAAGTTATTAAATGAGATTAAAAACTTGAT
+AAAAGAATTACAAGGTATTGATTCTAATGGAGATGTTTGGAGATATCTTATCAATAAAAA
+TGGAGATTTATATTTTAATAAGTGGAAATTTATAGATTATCCGAATTTAAAAAATACTAT
+TAATTATATCTATGAGTTTTTAGATGGTTTATATTGTGAAGTTGATGAAATTCTAGTAGT
+AAGAAAGTCTTAGGAAACTAAGGCTTTTTTATTTTGTCCAAAACTTGCTTAAGACCTTAA
+ACTGTGCATGGAATTAACAGCCGACAGGCTATAAATGGAGGTATTTATGTCTATATCAAA
+TTTAAATTTAAGAAAAAGATTAGGTATGAAACTAGCACAAGATGATGGAGCAGGTAATGG
+GGGAGTAGGTTTAGAAACTAATCCAACTGATGGTGCAGGTGGAGAAGGTGAAGGAACAGA
+AACTAATCCAACAGAAGAAAAGACTTTTACTCAAGAAGAAGTAAATAGGATGATTAAGGA
+TAGGGTGGCAAGAGAAAAGAAAGGCCAACTATCTAAAGAAGAACTTAAAGCTTATCAAGA
+TTGGAAAGAAAGCCAAAAAACAGAAGCAGAAAAGCAAAGTGAAGCTTTAACTAATGCAGA
+AAAAGCTAAACAAGATGCAGAGGAGAGAGCTAATACATTAGAGGCAAAAGTAACTTGTTT
+ATCTAAAGGTGTTTTAGCTGATAGTGTTGACGATGTTGTTATATTAGCTAAAGCTATGGT
+AAGTGATGATGTTACTATGGATCAAGCAGTAGATAAAGTTTTAGAAAAATATCCAAGCTT
+TAAAGGAGTGCAGCAACAAGATGAAAACAAAGGCTTTAAAATAGGTGCTGATGGTGGAAA
+ACAAAAAGGAAATGTTGATGATGCATTAGCAAGAGCCTTTGGAAATAAATAATAAAAAGA
+TTAGGAGTGATATAAAATGGCAGTATACAGTTATGCTGAACAATTTGAAAGACAATTACA
+ACAAAAATATGCAAGAGAATTAACTTCATATGCATTAGAGCAATCTAATCCACAAGTTAA
+ATTCATTAATGCACAAACTATTAAATTACCTAATATAACAGTAAGTGGATATAAGGATCA
+TAATAGAAGTGCTATGGGATTTAATACAGGTTCAATGTCAAATGATTGGGAACCAAAGAA
+GCTATCTCATGATAGAGATATTGAGTTTGCAATAGATCCCATGGATGTTGATGAAACAAA
+CTTAACATTAGAGATGGCTAATATTCAAAATGTTTTTGAAACAGAACAGGCGATACCAGA
+AAAGGATAGTTATAGATATTCTAAGCTTTATGCAGAAGCTAAAACATATAAAGCAAATGG
+TGCTGTTATAGATAATACAGTTTTAACAACAGCAAATATATTAGATTGGTTTGATACTCA
+AATGGAGAAAATGGATGACTTAGGAGTACCAAGTGAAGGTAGAATACTTTATGTTACACC
+AGCTATTAATAAACTTCTTAAAAATGCGGAAGGATTAACAAGAACTATTAATTCTGATAA
+GAATACTGGAAAAGTTGATAGAAGAGTTTATTCATTAGATGATGTGACTATTACTAAAGT
+TCCAAGTGCGAGAATGAAAACAAAATATGATTTTACAAATGGATGTGTTCCAGCAGGTGA
+TGCAAAGCAAATAAATATTATACTTATTCATCCATCATGCCAAGTAACAAGAAGTAAGTA
+TTCTTATATTAAAGTGTTCACTCCTGGAACAGATAGTAGAACAGCAGATAAGTATGTATT
+CCAAAATAGAAGTTATGGAGATACATTCTTAATTAAAAATAAAGCTTGTGGTATTGCTAT
+TAATGCAGAATCAGAAGGTTAGAAAGGAGAATACATATGAAGGCTATTAAAGAAAATAAA
+GTTTATACAATAACTGAATCTGAACAGAACTTTTATAAACAACAAGGATATGACATAGTT
+AATGATGAAGGGGAAGTTATAGAACGTGGAGCAGGGAAATCTATTTCTTATGAGGAATAT
+ATAAAGTTAAAAGATGAATTAGATCCATTAAAAGATGAAAACTATACTTTAAAGCAAGAA
+AATGAGAAATTAAAAGAAGAAAATAAAAAGCTTAAAGCTGAAAATAAAGAGTTAAAGAAG
+TCTTAGTTAAGGCTTCTTTTTCTTTATAAGGATGTGAGTATATGTCTTATGTAGATATTT
+CATATTATAAAGATAATTTCAAAGGTGATATCCTTAATGATGATACTTTAGAAAATAGAT
+TAGAAAGAGCATCAGATCAAATTGATAAATTGACATATAACAGAATAATAGGAGTAGAAT
+TTAAAAATTTATCTCCATTTCAACAAGATAAAATTAAAAAAGCAGTTTGTTTACAGGCTG
+AATTTATAGAGCAATATGGTGAGTTTATTAATATGCCTTTAAGTGGATTTTCAGCTGGTA
+GTACTTCGGTATCTTTTAATGGAAGTATTGTAAATGGCATAACAACCACACAGGAAGTTA
+TTAATTATATATATCAAACTGGTTTAAATAGTAGGAGGATCTAAACTATGGGAATTAAAT
+TACCATTTCCTAAATGGCTTTTAAAAACACCAGTAGAGGTTTACCATACTTATATGAATG
+AGGATGGTGAACCAGTAGAAGAGTTAATTTATAAAGGATTAAGTATATATAATGAAAAGG
+GAAAGAATACTCTCGATGCAGAGCGTAGACTTGTAACTTTAAGTGGGACCGTAACAATTG
+AAGGTGATATTTATCCTAATAAATTAATTGAAGGATATATAAAGGTTGGAGATGTTAAAA
+AAGATATTTATAAGTCATCAAGGCCACGTAATCCAGATGGAAGTGTATTTTCTACTGAAT
+TGGAGCTTATCTAATGAAGGCTAAAGTAACAATAAAATTAGATAGAACTAAGATAAACAC
+TTTAATAAATGCTAGAAATAAAGCTTTAGAGGAAACTACAGAGGCCATGTTAAGTGATAT
+TAAGACAAGTGCTATAGTTCCTAAGGATACTGGAGAACTTGAAAGAAGTGGTTTTGTTGA
+TTTATCTAAGTTAGATGATGGAATAGCATCTATAATTTTTGATACACCATATGCTAGAAG
+ATTATATTGGCATCCAGAATATAATTTTAGACAAGATAAAAATATAAATGCACAAGGTAA
+ATGGATGCAATCTTATATTGATGGAGATAATAAAGAATTTGTAACAGAGACTTATTTTAA
+ATTCTTAAAAATATTTAGCAAAGGATTGATTAAATAATGTTGCTAAGTGAAGTAAGAGAA
+TATTTAAAAACTAAAATAGAATGCCCTCAATGGTATATAGGAAAGATAGATGCAACTAAA
+GAGCAATGTATAGGTATCTATAGCATAAGAGGACCAAGAAATCATATAGCCTTAGGTGGT
+TTAGAAAATACAAGCTATTCCACTAAGGCTATTTCTATATTAGTTCATTGGGGAAAGAAT
+GCTAATATAGCAGAGCAAAAAGCTCAAGAAGTATTTAATGTTTTATTTGGACAAGATGCT
+GTTATAGGTGGGAAAAGAGTTATAGATTTTAAAATGATAACTACTGAACCTATAGGAGTT
+GGAACAGATAAAAATAACATATATGAATATGTAATAGAAGTAAATATAATACATGAAAGG
+TAGTGAATAATTATGGCATTTACAGGAGTTTTTCCAGTATATAATCTTAAATTTAAGATA
+GGAACAAAAGGGAAAGCAAGTCAATCTCAAGATATGCAGACTATAGCTGATATGGAGAAC
+TTTGGTATAAAGATTGATGGTAAGGTAGAAGATTGGACACCAATGGATACAGCAGGTTGG
+GCAAGAAGTTTAATGACAGGAAAAAGTTTCTCAATATCTTTAAAAGGCAAAAGAAATGTA
+GGTGATCCAGGAAATGATTATGTTGCAGCAACTGCATGGAAGGATGGATTAGATTGTAGT
+ACAAAAGGAGAAATGGAGTTCCCAGATGGGTCTAAACTTACATTTAATTGTGTAATTGAT
+ATTAAAAATGTAGGTGGAGATGATAGTACAAAGGTTGCTCCATTAGAATTTGACTTAAAA
+GGTGACGGAAAACCAGAATATACAGAAGCACCATCAAGCTTAGGACATTAGGAGGTATAA
+ACAATGGCAAAAGTATATGACATAATGAATAAGTTAGTTAATGTAAAACCAACAGTAAAG
+ATAGATGAAGATCACGAATATAAAATTAATAATACGAAGAATAATGCTATATATATTCAA
+TCATTAGTTAAAGAAAATAAGAAAAAAGATGATAAAAAACAGGATGAGATGGAGCTTATT
+AATAAAATAATAAAAGCTTCCCTAGGTAAAGAAGCTTTTGAATATATAGATAGTAAAGGT
+GATGAATGGAGCATGTCAGCATATAATGCAATAATAAATGTAATAATGGCTGCTATATCT
+AATGTTGAATTAGAAGAAATTGAAGAAATGAGTGAGAAAGAGGCAAAGCGATTTCAAGAA
+AGTAAAGAATAATCAATGGTATGATTTATTTGAAGATTGGGAGCTTATAGAAGCTTCTTT
+TACAGCTCAATACGGAATTAGATTAAGAAATGAAACTAATATGACTTGGGATGAATTCTG
+TACATTGCTTAGTGGAATAATGCCTAAAACACCACTAGGTCAAATTGTTTCAATAAGAAG
+TGAAGAAGATGAAAATATGCTTAAGAACTTTACAGAAGAACAACATAGGATTCGTAATGA
+ATGGAGAAGTAGACAAGTAGAGCAAATGACAGATGAAGAAAAAGAGGAACAAATAAAAGA
+AATACAAGAAATTCTTAAAAAGGCGTTTAGTTAAAACTAAATGTCTTTTTTATTTTAAGA
+AAGGTGGTGAGGTAATGGCAGATGCAGATTCGGTAGGGAAAATTGGTCTTGATTTAGAGA
+TACAAGATGGTGATATAGGAAAACAAATAGAAAAGATGGCTAGTGCTATAGGTAGTCAAA
+TAAGTAAGTCGCTAGAAGGAATAACAGAAAAATTTGATTTTAATTCAATAACAAAAGGAA
+TTTCTGAATCTTTAAATAAAGGAATGAATAATATTGATGAAACTATAAAATCTAGTGTTG
+AGAAAAGTAAAGCTAATATTCTTAAGACAATAGAAGAAATAAAATCAAAAGCTTTAGATG
+CTATAAGAAGTATAATAGCTAAATCTAAAGAAATAAAAATTCCTATTCAGTTTTCTCCAG
+TTAGTAATATTGCAATGCCTAGTAGCAAGGTAGCAACGCAACCAATAAGTAGAAGAGGAC
+CACCAAAAAGTAATGTTGGAGATTTAGAATCTATAAAATCTAAGATTGAAAATCTTTCTA
+ATAGTTTAGAGATAACTAATAGATCAATAGAGCAGCAACAAGAAAAATTATCAGGATTGA
+AGGCTGCTTATAATTCTACATTTAATCAAGCTAGAAAAAACAAATTACAGGAGCAAATAT
+TAAAAACAGAAGCTGTTATAAATAAACTTATAGCTAAATCTGATGCAACAGGGTTTAAAT
+TAGCTGATTTAGATAGGCAGTTTGAGAAATTAGGTAATTCAGCTAAGAATTCTACTTTAG
+GATTAAATGAAGCAAGTAATAGTATGAAGAGGCTTGAAAATACTACAAGTAGAACAAATA
+GAAATTTAAGAAATGCTAATAACTCTACTAGACGATATAGAGAAAATATGAATGGTGCTA
+GAAGTGCAACAGGGATGTTTATTGATAGTATGTTTAGGTGGGGAATAGTATTCCCTTTAG
+TAATGAAGGGGATAAACACTGTTGCTAGTTATATAGGAAGTGCTTTAATGACTAATGCTC
+AGTTTGCAAACAGTTTAGCACAAATTAGAACTAATCTTATGGTTGCATTTATGCCAATCT
+ATCAAGCAGTTCTACCAGCACTTAATGCTCTTATGAGTGCATTAGCAACAGTAACCGCAT
+ATATTGCAGCTTTTATAAGTGCTATATTTGGTAAAACATATCAAGCTAGTTTTGGTGCTG
+CTAAAAGTATGAATGCTTCTATAGCTTCAATGAAGAATATGGAAAAGCAAGGTAAAAAAA
+CATCTGGAGCAGTAGATAAAATAGGAGATTCGGCAGAAAAGACAAAAAAGAAAATACAAA
+GGTCCTTAGCTGGATTTGATGAAATAAATAAATTAAGTATTCCAGATGATTCTGATAAAG
+CTCCAAAGGCTCCAAAAGGAGGAGGCGGTGGTGGAGGAATAGATCCGATACCAATGGTTG
+CTCCAGATATAGATTTAAGTCCAACAAGTGTAGCAATGCAAAAAATAAATGCTATGGTAG
+AAAAGCTAAAAGATATTATATCTAAAATATTTCAACCTTTTAAAAATGCATGGGCAAGAG
+AAGGAGCTGCAACAATTGCAAGTATTAAATATGCATTACATGGAGTTTGGGAGCTTATAA
+AAGCTATAGGTATTAGTTTTTTAGAAGTATGGACTAATGGAACGGGAGAAAAAATACTTG
+TAGTTATTCTACAAATTTTACAAAACATATTTAATATAGTTGGAGATATAGCAATTACAT
+TTGCAGATGCTTGGAATGCTGGAGGAATAGGAACAGCTATAGTTCAATCTTTAGCAAATG
+CTCTTTTAAATGCACTTACATTAATTAAGCATATGGGAGATTCTTTAAGGCAAGTTTGGG
+GAGAAATTGGTCCTGGATTAGCAACTACATTCATGCAAATATTAAATGCAACATCAGGAG
+TATTAGAAAATTTAACTCAAAAATTAATTTATGTTTGGGATAATGGAGGTAGTCATTTAT
+TCCAGGGATTTATAAGGCTAGGTGCAAAAATATTTGAATTAGCTGGGTATATTTATACTA
+ATTTTGTTGCTCCTATGGTTAATTGGTTTGTAAACATGATAGCTCCAGTTCTAGCTAAAT
+TAGCAGATATATTAGGAATTGTTTTAGATGCGTTTAGCAACTTAATAAATTGGTTAATGG
+GTAGTGGAAAGCCAGTATTAGATACAATTATTATTGTTTTAGGAAGTCTTGGTGCTTCTA
+TACTAATAGTTAAAGGAGCATTAACTTTATGGACAATAGCTCAAACAATTTGGACAACTG
+TAGCAAAAACAAGTACTATAGCAACAACATTACTAGGTGGAGCAATAGCATTTTTAACAA
+GTCCAATAGGAATTGCAATAGTTGCTATAACAGCAATAATAGCTAGTGGAGTAGCTTTAT
+ATAAAAATTGGGACTTTGTAAAAGCTAAAGCTATAGAAATATGGGGAAAAATAAAAGACA
+TATTTAATAGCTTTAAAGAATGGTTAAGGAATGTTTTCCAAACAGATTGGTCAAATTGTT
+TTGGAGTATTAGGGAATCTATTAAATCTTTTCTTAAAAAATGTAGATAATGTTTTTCAAT
+CTATCAAAAAAATATTTGGTGGAATAATAGACTTTGTAACCGGAGTATTTACTGGAAACT
+GGAGCAGAGCTTGGCATGGCGTTGTAGATATTTTCAAAGGTATAATGAGTGGATTAGGTT
+CTGTAATTAAAGCGCCTCTAAACTCCGTTATTGGGCTAATTAATATGGCTATAGATGGTT
+TAAACAAAATTAGTTTTACTACTCCAGATTGGATTCCTGGTATTGGTGGTAAGCACTTTG
+GAGTTAACATAGCTAAAATGCCTTATTTGGCTAAAGGCGGTATAGTAGATAAACCAACAC
+AAGCCGTAATAGGAGAGGCTGGAACAGAGGCAGTAGTACCACTAGAAAATAATACTGGTG
+GATTAAATTTACTTGCTATTAAACTTTCAGAAAGAATTAATAATATGTTATTACTTTCTA
+ATAATGCATTAAAACAACCTGATTTAACAATGTTAGGTCAAAATATTAATAGTAATGAAA
+AGAAGAGTATTAATGATCCAGAGTTCATAGAAAAAATAAAAGAAGTTATAATAGAAGCTA
+TTTTAGAAGCGATGAAGAATAAAAAAGATAATAGCTATAATAATTCAGGGCCTCAAGAGA
+GTGGTGATTTAATATTAAGAATAAGAGATACTGATTTAGGTAGAATTGCAATAGAAGCTA
+TAAATAAAGTGAATAGACAAGCTGGAGAGCAATTATTAAATCTTTAGGAGGTGGCAACTA
+TAGGAATTAGTATAAATGGAGTAGCAGTTGCTTCTCCAAAGAGTTTTAAGGTTAACATAA
+TGGATTTAGATGGAGAAAATACAGGAAGAAATTTATTAGGTGTAATGCTTAGAGATAGGA
+TAAGAGTTACTAGAAAACTTGAGTGTGAATGGGGTCCTTTAACATCTAATGAGATTAAAA
+CAATATTACAATCAGTAAGTGGAACAGAGTTTCCAGTTACTTATCCTGATCCAATGGAAG
+GAGTTACAACTAAAAATTTTTATGTAGGAGATAGAAGTACACCAGCTGTTGATTTTAATA
+AGAATGTATGGCAAGGTCTGTCTATGAATTTAATAGAAATATAAATAAAAGAAAGAAGGA
+ATTGAAATGTCAGAAGAAAATATAAAAGTAACAAGCACAATAACAGAATCTACTAACTTA
+AATGGAACAGTAAATATAGAAAAGGATGGAATGAAGCAAACAGTATTAACAATGAGTTGT
+AGTTTAACTCAAAATACTATCGCAAATATTCAAACATATCCTACTAATATGGAGTTGTTC
+TTAGCAAATTCTCAATTAGTTCAAGCTGAGGTTCAAAAATTTAGAACAAAGGCTACGGAA
+GTTGGCAAAAGCTTAAATTGTTTTATACTTTAGTTTATAAGAGCTTACAAAATGTAGGTT
+CTTTTTTAATGAAATTTTTAAAAGAAAGAGGTGTTCAAAATGGTTAAAATGACAAATAAA
+GAAATATTAGAAAAAGTTAATGTATTAGGAGAAATAAGTTTAAGAAAGTTACCAGTTAAA
+GTTTCTTATGCTATAGGCAAGAATATATCTAAAGTTGAAAGAGAATTAAAACACTATAAT
+AAAGAAAGGCAAAAATTAATAGAAGAATATTGTTTAAAAGAAGATGATGGAACTCTAAAA
+ATAACAGATGGAAATTATGATATTGATCCAGAAAGATTAGAGTATTTTAATAAAGAAATT
+AATGAATTACAAGAAATTGAAGTTGAAATGAATATACATAAATTTAATATTGAATTATTA
+AATGGTTATGAAATGAGTCCAGGAGATTTAATGTGTATTGACTTTATGATAGAGGAATAA
+TATAAATATTAATCTTTAGGAAAGGGGGTTAGTATTTGTTTAAAGTATCAGAAGCATTTA
+ATAAAGAAATAAATAAGTTACAAGGAAGAAAATTTAATGCTAAGGTTATTATAAGAGATA
+AAGAATATAGTGGAAATCAAATATATGAAATGAATTTAGAGGAATCAGTTAATCCTAGTG
+ATAGTTTTTCTATAGGATCAATTTGTTCTAACAGTTTCGATATAAAACTAATTAATACAG
+GAGATATATTTGATAATGCTATTGTAAAACCATATGTAGGATTGTATATAGGAGATGATA
+TAGAATATATACCTTTAGGTGTATTTACTGTAATTAAGACTAGTGTAAAAGGAAAATTTA
+TAAATCTTGAGTGTGTAGATAATATGCTAGGGTTAGAAAAAGTATATTTTTCAGATTTAT
+CTTATCCAGCAGATATAAACGATATTGCTAAAGAAATATGTAAAAAGGCAGGCGTTAATT
+TAGCCAGTAAATTACCTAATTATAGAGTTAATAAAATAGAGGGATATTCATTAAGGGAAG
+CTATAGGATTTATAGCTTCCCTTTGTGGTTCATTTGCTAGATTTAATAGGATAGGTGACT
+TAGAAGTTAGAGATTATGAGGTAGTAAAGCAGGAAATGACACCTCATAATTTATTTAAAT
+TAGATATTGAAGCTAATGAGTGCATTATAAAAAAAGTAATAGCCAAAAAAGGTGAAGAAG
+AATTAAGTACTGGTACAGATGATGGAAATAAAATTGTATTCAATAATCCAATAATAACTA
+AAGAAATTTTAAGTGATATATATACTAAATATAATGGATTTAAATATATATCATATACAG
+CTAAGTGGAAAGGTAACCCAGCTATAATGGCTGGAGATATATTAAATTTAACTGATTTAA
+ATGGGAATAAATATAATGCTTTAATAATGGAGCAAAAGTTTACCTATAAGAATGGTATTT
+CATCAGAAGTAAAGGCTAAAGGAAAAACTAGACAAGATTCTAGCTTTGATAGTAAAGGAT
+CAGTTGCTCAATCAATGGAGAGATATTCTATTGAACAAGCAAATATAAAAAAGGCTTTAA
+TAGATAAGGCTAGTATAAATGATTTAACAGCTGTTGATGCTAAAATACAGAGGTTATATA
+CAGAGGATTTAACAGCTATAAGAGCAGATATAGTTACTTTAAATTCTCAAAAAGCTAATA
+TTATCGAATTAAATTCTGTAAGAGCAGATTTACAACAGGCTATAATTGGTAAAGCTAATA
+TAACAGATTTAAACGCAGCAGTTGGAAAATTAAATGTATTAGAATCTAAAACAGCTAGTA
+TAGAAAATGCACTTAATAAAAATCTTACAGCAGAAAATATAGCGACAGGAGCAATAACAG
+CTAGTTCTGGAATAATAGCAGAAGGAGCTATAGGAGATGCAGAAATAAGTTCTTTATCTG
+TAAATAAGTTAAAAGCTGGAGATATAACAACTAGCAAACATAGAATTGTTAGTGCAGATG
+GAACCATAGAAATTGTAGGAAATCAAATTCTTATTAATAGAAATAATGTTAATAGAGTTA
+TATTAGGAGAGTATAGGAAAACAGATGGTACTACAGATTATGGACTACTTATCAGAGGTA
+AAGATGGTAAAACCATAATGCTTGATTCAGACGGAGTTCATAATGCAGGGATAACTAATG
+GAGCTATAGATAATAATAAAGTAGCTGACAACGCTAATATAAGTGGTAATAAGCTAGATA
+TAAATAGTGTTATTAGAGAAGTAAACAATAATGGTACTGAAACTATTAAGGGTACTAAGG
+TTACTGTAGGTGATAGAACTTTAGATGTAGAATTATCTACACAAAATAATACTATTACAG
+AGCATAGCAAAGAACTATCTAGTCAAAAAGCTTCCTTAACCGCTTTAGATAATGCATTAA
+AGTTTAAAGTAGATTCACAAACTTTTAATCAGAGTACAACTACTATAAATAATAATATTA
+ATAGAGCCAAGGAAGAAGCTATAAACAGTTCTAATTCTCACGCTGATAGTAAAGTTAATG
+AAGCTCTTAATAATGCTAAAGCTTTTGTTAATTCAGAAATTACTAATGTTAATACTCATT
+TGAATAAAAACACTAGCGAGATAAATATTTTAAAAGGTCAGATAGAAAGTAAAGTTTCTC
+AATCAGATATAGATAAATCTATTCAAAATATTGAGTTTGGTGGAAGAAATCTATTTTTAA
+AAAGTAAAGGTCCATTTAAAAGCTCTAATGAATATGTAGGGATTTCAATAACTTCTGTTG
+TAGAAAAATATTTAAATAAAAAAATTACAATATCAGCAGATGTAAAAGCTAATAAAGTTG
+GGAAAATTAGATTTTATTCTCTTGGTGGATATTCTGTAGGATTTTGGGTTGAGAGAGATG
+TAACTACAGAATGGACAAGAATAAAAGCTACTGGAAAGTTTACACTTAATGATGAAAAAC
+AAAAGTGGTGTGATTTAAGTTTTTATGGTACTTATGGAAGTGGACTATTTACTGAAGTTA
+GAAATGTAAAAATAGAATTAGGAGAATTGGCTAGTGATTATACAGAGGCTCCAGAAGATA
+CTGACAAGCTAATTATAGACAATATAAAAACAGTAACAGATAAAATATCTACAGTAGAAA
+GTAAACTTACACAAGAAAATAATAGTATAAAAGCTAGTGTTCAAGATTTAAATTCTACAA
+CTCAAAGTATTACAACTAATGTAAGTAATATAAATAGAGATTTAATAAGTAAAATAAATT
+CTAATTTAGCTGTAGCTAAAAATTTTGCTACAGATATAGCTATAGCAAAAGCTAATCTTG
+CAAGAGAACAAGCTATAGCTTCAGCTGATGGCAAGATTACAGAAGAAGAAAGAAAGAGAA
+TACAACAAGCACAGGAAAATCTTGATACGGCTATAGCAAGAGCAGATAAAGCTAAACAAG
+ATGCAATTAATGCAGCAAGTACAGATGCAACTAACAAAGCAAATAATGCTTTAAATAGTG
+CTAAGGCGTTTGTTAATGCAGAAATAACAACAGTTAATAATAAAGTGCATAACGTAGAAA
+GTAATATTGATATATTAAAAAATAAAATTGCTCTTAAAGTTGAACAATCAGACATAGATA
+AAACAAAAACAGAGTTAATTAATAAGATAAATGTTGTAGATAATTTAGCTAATAACGCTA
+AAGATTTAGCTAGTGCCATGAGCTTAGGTAAAATGTTATTTAGTGATCCTACATTTAAAA
+ATAGTTCTAACAATATTAAAACTTACAATAACAATGGAAATGGAACAGTAACAACTTCAA
+GAATTTCTAAAATAAATGGATGTCCAACTGATTCACAATATTGTATAGAAGTAAAAACTG
+TTGGAAGTGCAAGTCCTAACCATGGTGGATTTTATTTTGGAAATATGACTAGAGCAAATG
+CAATATTTGTAACGAAAATTATTGCTAAAATTCCAGTTGGATTAAGAATAGGGTGGTATT
+CAAATTCAACAGGGAATAATGGGAGTTCTAAATGGTTAACATCAGTAAATGGAACAGGTA
+AGTGGGAAGAGTATATACATTTATTAAAATGTGGTGATACAGGAAGTTTTTCTAGTACCA
+GTTTCTTTGCATTAGATGGAGGGGGAACTCCAACATCTAGCAATCCAATAATTTGGCATA
+TAGCTTATGCAACTGTTTTTGATATAACTGAAAATGATGAATCAGTTAATGTATTAAAAA
+CTGAAATGTCAACAGCTAAGAATAAGGTGGCAATAATAGAAACTAATTTAGACAGTATAA
+CTCAAAGAATAAGTTCTACTGAAAGTAAAACACATTCTATAGAAACTACATTAGGTGGAA
+AAGCATCTAAACAAGAAGTTGCAGAAGTTAATAATAGAATTGCTACTATTAAAGCTAACT
+TAGATTCTATTACACAAAGAGTTTCTAATACAGAAAGTAAAACAAATAGCTTAGAAACAA
+ATATAAATGGTAAAGCTAGTAAGCAAGAATTAACAGTAGTTAATAACAAAGTTACAGAAG
+TTACAGCTAGTTTGAATGGAATCACTCAAAGAGTAGGAAACACGGAAAGTAGAATAAATG
+CTTTAGATGGAAAAGTAGCTGGAGCTGTAACATTACAACAATTTACAGAATTCAAACAAA
+GCAATGATAAATTTAAATTTACTGTAGAACAAAGAAGTAGTGTATCAAATATACTTCCAA
+ACAGTTCTTTTCATGGTGGAGATCGTGGGTGGCTTCATGGTGGAAATGAATTTTGGTCTG
+GTCCTTATAGTGGGTATGGATTTAAGGGAAGAATTACTGGTGCAATAAAAAATAGAGCAG
+CATATAACAATCCAGAAAGATACTTACAAACTCATAAAGCTTATAAAGTTAAAAAGAACA
+CTACTTATACAATAAACTTCCATTATATTTGTGAAAAGAATGTTCAATCAATGGATGCTT
+TTGTTGTTTTAAGTGATACTGAACATGGTGATTATGCACAACCAATTTATGTATTAACAG
+CTCAAGGTGGTTCTCAAAGTAATGCAACTGAAGAAAAACCATTTACATATAAATTTAATA
+CAGGTAACCATGAGTGGGTATGGATTAGATTTGACCATAATGGAATGAAAAGTGGCGTTA
+ATTGGGATGAATTTTGTTGGGTTTATGTTAGTGAAATTGGAATCTATGAAGGTGATGTCG
+GAGCTGTTAAGTGGACACCAAAAGGTGGAGAAGTTTATTCAGCTAACTATCAAATGGATG
+GTCTAGGATTCAAAGGGACTTTTGAAGATGGTACTTATGCATCTTTAGGTAAAGATGGAC
+TTGAATGGTTTAACGCTGGTACTGGACATGCATATCATGCATTAACATACGTAACCTCAT
+TCGACATTCCAATTGGTAATCCAGGTAAAGCATATATAAAACTACCAGCTGAATTTACTA
+AAAGAAGAAACTCTCTTAAATGGACAGTCGCATTAAGAGGATATTATTACTCAACAAGTG
+GCGATTTCTTCCCATTCCATATACATTGTACTGGTGGGAGGGATTATATAGAAAATGGAC
+TTGTTGTATGTGAAGTTCAAGGTTACTGTAAAATACAAAATGCCCAAAATGCTGGTGATG
+TACAGTTTAGACCACTTACAGCTATGTTAATAGCTATAGCTTAAATAGAAAGGAGGGTTA
+TTATGGATAATTCTATAAAAAACTTTGAAAATAAAGTTACTTTATTTTATTCTCAATCAA
+CTGGAGATATAAAACTTCATGCTGGTGGAATACAAGATATGAGTTATTTTGGTCCTGAAA
+GAGATGACTATAATTATAAATTTATAGTTGTAGATAAAGATTATTATTTACTTAATAATT
+TAGAAAATTTTAAGGTTGAAAATGGAAAGTTAAAATTAAAAAGTAATAGTATATTAGCTA
+AATACATGTAGGAAGGAATAGACTATGGAAAATATATTTGATTATTTAAAGATGGGGATT
+GTAGCAATAGGAACTTTATTTACATGGCTATTAGGAGCATGGGATACCCCTTTAGTTATA
+CTTATAGTTTTAATGTCTTTAGATTATATTACTGGTATTACTAAAGGTTATGTTAATAAA
+GATTTAAGCAGCAATATAGGACTTAAAGGAATAGCAAGAAAGGGAATTATTTTCACTATT
+CTTATAGTAGCTGTAATGTTAGACAGACTTTTAAATACAGGAAATTGGATATTTAGAACT
+TTGGTATGCTATTTTTACATAGCTAATGAAGGTATAAGTATTATAGAAAATGCAAGTAAA
+CTAGGTGTACCAGTACCATCTAAATTAAAAAATGCGTTAATACAACTTAAAGAAGATAAA
+GAGGATCATAAGAAATTATGATTCTTTTTTTATAAATAAAATTAAGAAAGAAGGAATTAA
+AATGTTAAAAACAATTTTAAAATTAGTAATTAAAGTATTAGAAAGTAAATTACAAAAAAG
+TGGGTTAGAAGAAAAGATAATAAAAAATAAACAGTATATAGATATAGCAAAGCAAGTGTG
+GAATGTAGTTGAAGAAAACTTCCGTATCACAGAATCAGTAGAAAAGAAATTAAGTTCTAA
+AGCTTATGAATTTGACAAAATGATGATGGATAAGTTTCCAGAGTTATCACCAACAGATGT
+AAAAGAATTAAGACAAAGTATTGCTGGAGAAGTTAATAAAGGGAAAGAAGCTGTTTTAGA
+AAATTCAGAGATATTAAAGAAGTTACAAGAAGAAAACCAAGAGCTTAAGTCTAAGAACAC
+TGATTTAGAAAGTAAACTAGCTGCAATATCAAACTATGTGCCAGTGGAAAACAAATAGTT
+TATTAATGTAATACATAGGACTAGAGATAGTCTTTTTTTATTGGATTTAATTATATAAAT
+TTAAAAGAAAGAAGGAATTAATAATGCAAAGTAGAAACAATAATAATTTAAAAGGAATTG
+ATGTATCAAACTGGAAAGGAAATATAAATTTTCAAAGTGTAAAAAATGATGGTGTAGAAG
+TAGTTTATATTAAAGCTACAGAAGGTAATTACTTTAAGGATAAATATGCTAAACAAAATT
+ATGAGAGAGCGAAAGAACAAGGATTAAGAGTAGGATTTTATCATTTCTTTAGAGCTAATA
+AAGGAGCCAAGGATCAAGCAAATTTTTTCGTAAATTATTTGAATGAAATAGGAGCAGTTA
+ATTATGATTGTAAATTAGCTTTAGATATAGAAACTACTGAAGGGGTAGGAGCAAGAGATT
+TAACTTCTATGTGTATAGAATTCTTAGAAGAGGTAAAAAGAATTACTGGAAAAGAAGTTG
+TTGTATATACATATACAAGCTTTGCAAATAATAATTTAGATAGTAGATTATCCAGTTATC
+CAGTTTGGATAGCTCATTATGGTGTAAACACTCCTGGAGCTAACAATATATGGAGTGAAT
+GGGTTGGGTTCCAATATTCAGAGAATGGAAGTGTAGCTGGTGTAAGTGGTGGATGTGATA
+TGAATGAGTTCACTAATGGAATATTCATTGATTCAAATAATTTTACTTTAGACAATGCTA
+CTACTAAAAATGTAAGTATTAAATTAAATATAAGAGCTAAAGGAACTACTAATTCTAAAG
+TAATTGGTTCAATACCAGCCAATGAGAAGTTTAAAATAAAATGGGTTGATGAAGATTATC
+TTGGTTGGTATTACGTTGAGTATAATGGAATAGTTGGCTATGTAAATGCAGATTATGTAG
+AAAAGCTACAAATGGCTACTACTCATAATGTAAGTACTTTTTTAAATGTAAGAGAAGAAG
+GATCATTAAATTCTAGAATAGTAGATAAGATAAATACAGGTGATATTTTTAGAATAGATT
+GGGTGGATTCCGATTTTATAGGTTGGTATAGAGTAACAACTAAAAATGGAAAAGTTGGAT
+TTGTTAATGCTGAATTTGTTAAGAAATTATAATTTTAAGGTTAGTTAGAGTAATATCTGA
+CTAACCTTTTATTTTTTTGTTCATAATCATAATGAGGTGATTATGAACAAAAAAGATAAT
+ATTAGAATTGATTTAATAATTTTATTAGCTATTATTTCTATAATATTACTTTTAGTATAA
+TTTATATAAACTTTTAAAATTAACAATAGTTAAGGCTAGGTAGATTAATTCCTATTTAGT
+CTTTTTTATATTCTTAAAATAAAAAAGCTACACTTAAATGTGTAGCTAAAAAAGGAGTGT
+GATATATTATCTCTGTATCATTTAAAATAAAAATCTATCTTAATTATAGACATTATTTTC
+AATTATATACATATTAACAAAAAACTTTTTTTATTTACAATAATGTTATATAATGTTAAT
+AAAAACACAATTAAAAAGGAGTATTTAAAGTGAACAAAAAAGAAAATGTTAATTTAATTT
+ATTTAATAAAATCTTTTTCAAAAAAAGTGTACAATATATTTAATATCAGTAAAGGATTTA
+AGAAAGTTAAAAAAATTGTAGAATTTAATAATTTAAATCAAATTGAACAATTAAATATAA
+TTAAAGAAAATGATAAGTTATTATCTAAAAAAGATAAAGAAGTTAAAAATAAAGTTGTAG
+CTAATAATATAGATACATTTTTTAAGTTAACAAAAGATAAATATTATGGGTGTAATATAC
+CTATAGAGAAAGCTAGAATAAATCAATATTTTTTAGGTGATAGAAAAAAGAAATCCAATT
+CCGAATTTTTAAATAATATATTTTGCTCAGCTATATTAGGAAGTTTTTTAGCTGCATTTT
+TAAGTATTGAAATCAATGAAAGCTTAATAAAAATATCCGGTTTTTTGCTTTTAATTATAG
+TTATTTTATCAATTATAATAGTTATGCTTTCAATAATTTTTATAGATTTTTTCTTAGAAA
+TATCAGAAAAAGACACTGTTAATAAAGATCTATATTATAATATTGTACTTGAAATATTGT
+CAGAACTTGAGTTTGAGGAAACAAAGAAAAAAATAAATGATTCAAAGGAAATAAATATGG
+ATTTTAATCTAAATTTTTTAAAACTAAAATAGATAATTTTTAAATAGTATGTTAGTAAAC
+ATACTATTTTTATATTTGTATGCAAAAATATGTTTTGTATAAAGGAAAAAGTTGAGTGAT
+TTTATAATTTAAGGTAAAATTAAAAGCAAGTATAATAGGAATATACTTGCTTTTAATAGA
+GTATTTATAAAAATTAGTTATTTTATTATATCATAATACTCTATTAAAGAAAATAATAAA
+TGAGATGGAGGACTTATGAAACTAAAGTTAATAGAAAATAAAATACTTAGAGACTCACCT
+AATAGTTTAAAACAAAAGGTAATAAATGAGGTTGTTAAAAAAGGAATAGCAACATATAAA
+TATAAAACAGAGCCTGATTTAATACAATTATATAAAAAAACTATAGAAGAAAAAATTAGT
+GAATGTCTTGAAAAAGATCAGTCAACAATAAAAATAATAGATTTAATAGAAATGAAAAAA
+GGATATAAGCATTCAATACTTTATGATTATAAAAATTTAGATACAAATTTAGCAAAAAAG
+AAATGTATAGATATTGAGACAGAATATTATAAAAATGTAGGAATTACTTTAAGTGAATTA
+GAAACTCTTTGTTATGAAACAGAGAATGAATTTTTTATTAAGTTTCATAATGAAATTGAT
+ATATTAGAGAAAGTTGATTTACCAAAGTGGTTTAAAGTTAGATATCCAATTTTATTTGTT
+TTTCATAAAAAGTTTAATATTTTAGAAGTTAAATTTGACAAAATAAGTACAGACAAGGAA
+AGAAAATATTATAAAATTGCTATTAGTAAATGTTTTAAGTGGTTAGAAGAAAATTTAAAG
+TGTAAATGCAGTTATCTTAACCTAGATAAATATATTAGAAATTTACTAGAAGATCCTAAT
+GGAATAGTTAAAGAAATAGTTTGGACCGGTGAGCTTGCTAAATCTCAAGGGATAACATTA
+AAAGCTGGAGAAGATATGTCAATGCCATTTTTTCAACAATTAGAGAAAGAAATAATAAGT
+TGGAAGGAAAAATACGCACATAAAGAAGATGCACTGGATTGCTTAAAAGATATTGAGGAT
+TATTTAAATAAAACAAAAAAATTTGCTAATGATAAGTTAAGAACTTTAAGGTTTGTAAAA
+TATAAAGAAAATAATATTTTAAAGACTTTAGAAAAATATATAGAATTAAAAATAACATAT
+AATTACTCAGGAACTTCAGCCGATTTAATAGATGTTATTGAAAGTGAAGTAAATGATTTG
+GAGAGGATGAATTATGTCATTGAGCTTATTGGAACTAGAAAGATTAATAAACCAATGGAA
+GAAAGTATCGCAAAATCAAGTTAAAGATTTGTATGAATTACTAGAATATTTTAGTGGTGG
+AGTGTTGCCTATTAATACAGTAAAAAGAATTTTGGAATTAGACAACGATGAAGTAGAAGA
+ATTAATGATTTTTTTAGAAACTAAAGGAATTTTAAAAAGTGCATTTAAAGTCCTTTGTCC
+TGACAAATTTGAAAGTATTAGAGAAGAAATTTATGATGATATACGAAAGGTTCCTAAAAA
+GTATTGCGATAAATGTGAAAAAGGATGTATGTATTTAGAAAATATTGTAGTTGTTTTTAA
+GGTGGTATAAAATTTAATGAGTAATTATGAAATGTGTATGACTGATGAAGAATTTATTAG
+ATATAATAGTTATTTAAGAAAAATGTCTAAAATTAATCCAAAATTTATTTTAGATAAAAC
+ATTTTCTGTTTCAGATGAAGATATAGAAAAAGGAAAAAGTTTAATAAATGAGATTGAAAA
+TTTAGCTAAAGATATTAAAAAGGCTAAAACTCCAAAAGAGAGAAATGCAATTAATAGAGA
+AAAGGGTAAGAAATTAGAAGAGTTGGCTGGAGTTATGTTTAATTCAGCTGGACTATATTC
+TGAAAGAAATAATTTAAGGGATCATACTAATGAAATAGATCTATTATTAATTGCCGATGA
+CTATAATAAACTTCATAAAACTATTTTACCAGAGTATTTACAGAACGATATATTAATTGA
+ATGTAAAAATTATAATAAAACTATAAAAGTTGATTGGGTGGGTAAATTCTTTTCCTTATT
+AACTACTCATGATGGTGAATTAGGAATAATTTTTTCATTCGATAGTTTTTCAGGACCAGG
+GGAATGGCAATCTGCTAAAGGATTAGCAAAAAAAATATTTTTGTCAGAGAAAAGAGCTAT
+TTTAAATATAGAGTTAAAAGATATTAAGGAAATGTTAGATAATAAAGGAAATATAGTTTC
+TTTAATAAAGGAAAAATATGATGCTTTGAAACATCATGTTGATTTTAAAGCTTTAATAAA
+AAGACATCCAGCTGAAAAATAA
+>NC_008261.1|provirus_1784095_1821197
+CTATTTTATTAGATTTTCAAATTTACCAGATACTACTTCTACTAAGTCATTGGGATTTAA
+TTTTATTTGATGTCCTATCTTTCCTGCACTTACTATCATGAAATCTAAGCCTTTAGCACT
+CTCATGTATAAATGTTCTGTAATCACGTTTTAAACCGATAGGGGAACATCCACCACGAAT
+ATAACCAGTGTATTTTAATATATCCTTAACTGCTATCATTTCAACTTTCTTTTCTCCAGC
+TATCTTAGCAGCATTCTTTAAATTTAATTCTTCTGCAACTGGTATAACAAAAACATATAA
+CTCTTTGCTTGTTCCTTGAGCTACTAATGTTTTAAATACATTTTTCTCATCTACTCCAAT
+TTTATGAGCTACTGAAATCCCATCTATCTTTCCATCTTCACTTTCATAACTTAACATTTC
+ATATGAAACCTTTTTAGAATCTAATATTCTCATAGCATTTGTCTTAAGCTTCTTATCTTT
+TGCCATAATTTTCACCTCTTAAAATTAAATCATTTATAATTATACAATAAACACTTAAAA
+TATATAACTCTAATGCAAAAAGGACTAGTTAAACCTAGTCTTTTTATACTAATTTAAATG
+TTAAATCATAATCACTTATATTACCATCATAATATTCAATCCCATATTCACTTTATAATA
+TTAAAAATATAATTATAAATAATATAATTATAATAAAAGCTATACATCCACAACTTAGAC
+AAGTTACAACATCATCATCTGTATTAGAACTATCATTTTTTAATCCATCCATAGCATCAA
+AGCTTGTCTTATTATATACTTTATTGTAAGCTGCCTTTTTAGGATCATTAACCCATCCCA
+TGCCCTTTTTACCATATGTAGGATTTATAGATTTTTTTACTTGTCTTTTTACTTTTCCAG
+TTGTTCTTGATTTTACACTTTTTTTTAAGCTTGGTTTTCTAGGACCTATCTTCATAACTA
+CCTCCTAATTTATCATTTTCCGTTTAACATTATATAATATTTTTATTAATATAAAAAGTT
+TATATCCTTATCGGTATAAAGTTTTATAGCATGACAATAATTAAAATATAGATTAACTTT
+ATTTGTATAAATAGCTTCAAAAATGAAAAAAGTGATAGATAATATTAATTATCTATCACT
+TCTTAATTAGATCTTCTTAACAAATTCAGAATTAACAAATCCAACTTTTCCATTTTTAGT
+TGTTACTCTATACCAACCTATAAAATCGGAATCCACCCAATCTATTCTAAAAATATCACC
+TGCATTTATCTTATCTACTATTCTAGAATTTAATGATCCTTCTTCTCTTACATTTAAAAA
+AGTACTTACATTATGAGTAGTAGCCATTTGTAGCTTTTCTACATAATCTGCATTTACATA
+ACCAACTATTCCATTATACTCAACGTAATACCAACCAAGATAATCTTCATCAACCCATTT
+TATTTTAAAGGTTTCATTTGCTGGTATTGAACCAATTACTTTAGAATTAGTAGTTCCTTT
+AGCTCTTATATTTAATTTAGTGCTTACATTTTTAGTAGTAGCATTATCTAAATTAAAGTT
+ACTTGAATCAATAAATATTTCTTCTGTAAACTCATTCATATCACATCCACCGCTTACACC
+ATCTACACTTCCATTCTCTGAATATTGAAATCCAACCCATTCACTCCAAATATTATTAGC
+TCCAGGAGTGTTCACCCCATAATGTGCTATCCAAACTGGATAATTAGATAATCTACTATC
+TAAATTATTATTTGAAAAACTTGTATAAGTATATACAACAACTTCTTTTCCTGTAAGTCT
+TTTTACCTCTTCTAAAAATTCTATACACATAGATGTTAAATCTCTTGCTCCTACTCCTTC
+AGTAGTTTCTATATCTAAAGCTAATTTACAATCATAATTAACAGCTCCTATTTCATTTAA
+ATAATCTATAAAGAAATTAGCTTGATCCTTAGCCCCTTTATTAGCTCTAAAGAAATGGTA
+AAACCCTACACTTAATCCTTGTTCTTTTGCTCCCTCATAATTTTGTTTAGCGTATTTATC
+CTTAAAGTAATTACCTTCTGTAGCTTTAATATAAACTACTTCTACGCCATCATTTTTTAC
+ACTCTCAAAATTTATATTTCCTTTCCAGTTTGATACATCAATTCCTTTTAAATTATTATT
+GTTTCTACTTTGCATTATTAATTCCTTCTTTCTTTAAAATATTTTTTATAGAAAAAAGAG
+AACCTAAATTATAGGCTCTCATTTAAGCTTTTTACTGCTGCTAATTTATTTTCTGTTTCT
+GCATTTAATAATTTTAACTTCTCATTTTCTTCTACTAATTGTGTAGCTTGTTGTTTTAAA
+CTATCTTCATATAGCATAGCTTTTCCTTTGTTATATTCTCCTGCTATAGCTTGTCTAATT
+TGTATTAATTCATCTTTGGTTAAGTATGGACAGTTTTCTAAAAGCATTTTATCAAATAAA
+TCAGCTTTTGATTTAGCAAGATTTTCTATATTCTCTGTAATTCTATATTTTTCTTCTATA
+GCAAAGAATATTTTTTTACCAGTTTCATATGCTTCATTAAATTTAGAAGCTTTAAGCTTT
+TGGTCTGTAGCTTCTATCTTGACTTTAATTAGTTGTATTAATTGGTCACCTAGAGTTTTT
+ATTATTGTAGCTAAAAAAAGTGTAATAGCAGCAGCTAAAGCACTTAAAATTGGGTCTAAT
+ATCTTTTCCATTTTACATTCCTTCTTTCTTTTTATTTAAATAAATGATTTTGTATTGCAT
+AAAAAAAGAAGCCTACTATAGAGCCTCCAAACATTGTTATAAATATCTTTAATATCATTA
+TTAAAGTATCTATACTTTTTATTAAGTTAGTTATTTGAACTTCTTTTTTAGCATCACTTT
+GCTCTAACTTATCCAATCTATCAGCATGATTATTTAATCTTTTATCATGTGTTTTTAATT
+TATCTTCTACTAATTCTTCATGCATATCGCTACCCTTTCTTTTTTATGTAATTTAAGAGA
+ATAAAAAAAGACTATCTCTAGCCTTAATTATTCCCCTTCTATTTTATTAAGCTTGAATTG
+TTTCATGATCTGTTGGTAATGAAGTTACTAACAGATTAGATAACTCAATATATTGTTCAG
+GTGTTATTTCATGAGTCATCATGAAGCAGCCTAAAAATTGCTTCATTTCCTCTCTTTCCT
+TCTCTGTTTTACATCTATTTTCTATTTGTCTTTTACATAATTCATACATCATAATTAATC
+ATCCTTTCATTTATTTTAAATTATTATTTAATTTAATCATAGCAAGATTTCCGTTAGCTT
+TTAATATACCTGGTACTAATAAATTATTAATAACATCCCAGATATTATTAACTTCTTTAG
+CTAAGTTTTGCAAAGAGCTTCCTAGGTTTGAAGGTACTTTAAAGTCTAAAGTTCCTGGTA
+AACTATTTTCTATAGAAAAATAAGTTTTTTCTTGATAGGTATCTAAATCTATATCTATTA
+CCCCATCTACAACTTCTGTTACTGGTGTAGCTAATTGATAAACCACGGTTGTTGGATTCT
+CTTTTAGCCATGCTTTGAAGCCTTCTACATCTTGTGTTGTTAGCTTGGATTTATTTATTC
+TGATATAAAGATTACCACCAGAAATTTGCATATTTTCCTTATCTTTATCCCATGTTGATT
+CTGAAAGTATTGGGAAGTTTGAAATTATTCCTTTTCCGCCTTTAGAATTTAAACTATTTG
+GTAATTGTGCTGAAAAACGGATAGTGTTAATATCTGTGCCACTAGCTACACTAGACTTCA
+TAAAATTTAATGTAGCTAACTTAACCTCAAAATCATTTCTATAAACTTTAACTTGTCCAT
+TATCCTCATAAAGATAATCATCTTCACGAAGTGGTTCTTTAATTAAAATATCTTTTTTAT
+AACATTTATAAAGTTCGTATGGTTGATTTTCAGTTCCATCTATAACATAACAAAATAAAT
+CTTTTGCCACAAAATTAACTTGTGTATTATGTGGATTTTCTATTCTTATACTACTATTAG
+TATCAATATAGGCAATTCTTTGTCCAACTTGAAAATCATTAAGATTATTATTCCAATTGT
+TAGTATCTATCATATTTCTAAATTCGCCACTTTCTAACCAACAATTATTTATTATTAATC
+TACAACCTTTTAATTTAGCCTTAATCAATACTTTTGTTTTTTTATCAATGCTTATTTTAG
+CTGATGTTGTTCCATTATATTGATTAGCAATTCCACTTATAACGCCATTTTCATTTTTAA
+AATTAGTTACTGCACCTTGTTGAATTTTTTGTATATCAAAAAGATTTTTACCAGTACTTA
+AAACACTAATTTTATACTTATCTTCAACCTTTTCTGCTTCTCCAAAGCTTTTTAAGCCTT
+CAAAATATTTTTTAGGCATATAAGTTTCTTCTCTGTCAAGTACTATGCAAGTATTTCTTA
+GCAATTCCTTATCAGTTTCACTATTAGTCCACCCTCTATCATACATACCTAGAAAACCAG
+TTAATCTTTTACCAGTTAAGTCTAATTTAGTTATAGAATTTTCTTTTAAAATAGGGTTGC
+TATCCCATCCTCCACCTATTTTATACACATTCAATAAAAGTATTTTGTTAGTATTATTCA
+CTACATAAACAATTCTGTCTTTCGGTTCATTCTTCACAAGCGTATCAACAAGTATATAGT
+TTCCTCCAGCATCATCTCTTGTATTATTTGGTTTATATAGGTTATTCAAAGTTCTACCCT
+TAATTTTCATACTTTCTGTTCTACCTTCTAGTGTGTCATTTGCACTTATAGAACTCCCTT
+CATAACTTAAAGCTTGATTACTTTTAAGTCCATTCTGTAGTTCCGTTACATCCATACGAA
+TTTGAGGAATGTTTTGACTTCCATCCAACCCTTCTATGAATTCTTTAGTCTTTTCCAAAG
+AAGCTTGAAGTTCTGTATTTTTAGAAGTAGCTTCTTGGTTAGTTGCTGCAAGATTTGTGT
+TAGCAACTTTAGCTGATTCAACATTTTTAATTAATTCTGAATTTAAAGGTAGTCCTTTAT
+TTATATTATTTGATAGTTCTTCAGCTTTAGAATTTAATCCAGTTAGTGTTTCTATTTTCT
+CTGTAGATTCTATATTTTTAGTATCTAAATCTTTTATAGTTTCTTTAACTTCTTTAGCTA
+GATCTATGTTAGATTCTAAATTTTTATTTAAAGAAGTAGCAGTAGAAGTATTTTCTAAGA
+GCTTAGAATTAATATTATTAGCTTCTGTTATATTAGATTCTAAATTACTATTTGCATTAG
+TAGCACTAGAAGTATTTTCTTTTAACTTTTCATTTAATTTACTAGCTTTGTCTAGTATAT
+TTTCTAAATAAGTAAAGTCTTTACTATCTGCTATTTCTCCAGCTATTTTAGTAAATATAT
+TAGCTTCTACAGTTAATCCAAATGTTGCTGTATGCTCTAAAAATCCATCTGCTCCATAAA
+TAGCTAATTGACAACTATAGACACCATCTTGTTTAGATATTCTATTAGTTATTGGGAAAG
+TTATTTCTCCTTGCTCTGCATTTGTAATATTTAAATTTTCTATTATGTCTCCTTTGGTTG
+TTCCAGCCATTACATAGCCAAGTTTAACAGTCTTACCTGTTAAATTTAATCTTCTCTTAT
+TCTGTAATACACATATTTTATAGATTTCAGCATTATTATTGCCTTTTATTGTTTTAATGC
+CTTCGTTATTATAAGAATCAACATTAACTTTTAGTTCAATTTCTCTCATAATTCACGCTC
+CTTTCTATTTAGCTTTTGTATCTCTTCCAGCACTTGGATTAGTACATACTCCACTTCCAT
+TAAAGTCGTACCATTTACCTTCGATAAATAAGGTTTCCTCGGAAGCCATTACCCCATTAA
+ATTTTAGCCAATAGTAGTTAGAATCTTTATAAAGCCATTCATTCTTCTTTAATGCTCCAC
+CTTTACCAGCATAATAATAGTTAGCTTGGTATTCATAAAACTCTTCTTCTGCCATTAATG
+TATTAGACTTAATTAAATAAGTATTATTGTTATAATAAATAAGTTTAGGCTCTATAACCA
+TTTTGCAATTTTCATCTATCCAATAATAACAAGGTTTTTCATTAAAAGTACCTTGAATAA
+AGCAATTTCTATCTAAAGCACCTGAAGAACTTGCATGATAATCAATCCCATCATGTTTTA
+TCCACTCATTTTTAGCAATAAATCCATCATCTTTTACGAAATAGAAATCACTCTTATAAG
+GGTAAATTCCTTTAGTTGCAATTCCACCAGCTTCATTAGTCATTTTATATTTGCCGCTAT
+AGTAATCCAGGAATTGAAGTGGTAATTTATACTCATGACAACATGGATAAATAGCACCTC
+GACTTATCTTAAATACTGTCATATCATTATTATCGTTGGAGTAAACTTTACCGCCATATT
+TTAGACATTTTAAAGCAAAGTTTTTTATTATATCTTTCTTATAAACATCCAATCTATCTA
+TTAAACAATACCTAGCTTGTAATTCTTCAAATCGCCTGTCTGAGTTACCACCGTCTGCTC
+CGTGATGACTTAATTTGTATAAATCAATTTTCCCTATTCTGTTTTGTAAATGTGTTTCAG
+TAGCTACTGTACTATCACCAGGAAACAATGATTTAGTTCCATGAGATACTAGAAGATAAT
+TAACACTCATATTATTTTCATTGCTATAATCATAGAATTTAGATGCGAAAGCTTCTATAT
+AATCATTTTTCCCAATTCTGAACTGTTGGTCATTAGCAACTATTTTTTGTACATTGAATT
+TATCTGCTGCTGCTAACATTCTATCATGGTACCCTTTAGTGTCCCATTCAGTTTCTTGTG
+ATGGTAACCTAGAATAATCTATTCCATCTTTATATACAATGTATTGTGGTCTATATTTTT
+CTATAATGGCTGGTGCATTCCCTATATGATCAGAATGATCATGAGTAGCAAAAAAATATT
+TTAATTTATTTACTCCAATTTTATCTAGTTGTTGAATCATTATTTGAAAATTTTCTTCCA
+TGAAACAATCTATCATCGAAAATGTTCCATCGTCGCTCTTTATTACTATACAATCTCCAT
+AAGAGCCTTCTTTGTTTTTAAGGTTATAAATAATAGTTTCTGTATTATCCTGCATTCTTT
+CTGCTGTATAATCCAATTTTTTAGTCATTTCAGTTATGTTAGAAGCATTTTCTTTACTTC
+TTACATCTACCTCATTAAAATTATCTACTTTTGCAAGAGCCTTATCTAACGCAGAAAATT
+TATTAGAACTTTGTATAGCTTCAGTATCTACTAAACTTTCGGAAATAATTAATCTAACTA
+AGCAAAGCGGTGTAAGATGGCTACCAGTAGAATCACTAATTGTTAATTGATAATCTGCTG
+TTCCTGGAATTAAAAAATCATCTGTTAATTCTAATCTTGCAATTCCTTTTTTACCATCAA
+CTATAGTTAACTCATCAAAAATAGAAAAATGTTTGGGGTTTATACCAGAAATTCTAACTG
+TACTATATGTTAAATCTATAATATTAATTTCACCTAGAAACTTAAAATCTATAAACCTTG
+ATTTAATATCATGCTCAACCGCTTTAATTTCTATTGGATCATCTCGATTAATATAAATTT
+TTCTAGGTGGTTCTAAATATTGCATAAATTATTTCTCCTTTCTTGTAATAAAAAAGATAG
+TAGAAAACTACTCTCTTACACTAAATCTCCAACTTTTAAAGAAGGAGCTATATTTTGAGC
+TGTACCATTAACTCTAAGTTCCCAATGACAATGTGGGCCTGATGAATTTCCAGTATTACC
+ACTTCTAGATATAACTTGTCCTGCTTTTACTGTATCACCTTCATTTACTAGCAACTCGCT
+ATTATGAGCGTAAATAGTAACTAATCCACCGCCATGATCTATAAATAAATATTTACCATA
+GCTTGTAGTTAATTCTCTTCTTTTTATAACTTTACCTGACTTTGAAGCTCTAACTGGCGT
+ACCTATAGGAACACCAAAATCTATTCCTGAATGTTGAGCCCCTGAAGGATAATAAGGGAA
+TGTTGCTGTTACATGTCCATTACTTACTGGAATAATCCAACCATTACCATACTCATTATT
+TATTGTTTTAAAGTTACTACTTTCTATAGGTGGGAAGTATCCATCACCTTTTACTGTGCC
+TATTTGATTTCCACTTGCGTTTAAAATTCCAATAGGAGACATAATGTAGTTAGCATTTTT
+AAACATTTCAGCTTCTTCCTTTCTTCTACGCTTTAATCCTTTTTCAAAAATTGTTCCAGG
+CATAGTTGCATATGTTAGCCAATCATTATAAATTTCATCAATACTAGCACCCCTTATCCA
+AGCTCTGTACATACGAGAATTATAATATCCTGAGTTATAGCATAAATCTACAAATGCATC
+AAAAACATTTATATTAACTTTACTAAGGTCTAAACCATCTTTAAGCATTTGATTTTTAAC
+TAAAGAGCCATATCTGTCTGGTATTAATTCAAATAAAACTTTAGATGCAGTTTCTTCAGA
+ACAAGGTGGATTACCTAATTTAGCAAAGTATGTTGGCTCATTAGCTTTAGTAACTCCATA
+ACCATATGTTATTTGGCCATCTCCAATATTACCTGGATATTGTTGTAGGCCTTCTATTCC
+TTTGACATACCTGAAATATTTTCTTGAAGGTATTCCTTTACTAACATTCCCTAGGGTATC
+TACACCACCTCCTATAGGAGAGTTTGGGTCAAATACAGTAGTACCACTTGTATTTTTAAT
+AACACCATCTAATACTAGGTCATTACATCTCAATTCTCCAGTTCTAGCATCATAATATAA
+AGATTTATCTTTTCCTATCCTTGTTCCTGAACCTGCAACTACAATTTCATTATCAGGTGT
+AGTTATATTAATAAAATGATCTCCAACATGAATGCTATTTGTACCATTATCAGAACGAAT
+ATCTATGTTATAAACTTTGTTCCCTTTAAAATCTACTTCTTCATATATTCTTACTGGCTT
+TCCACCTGAATCATCTAAAATGTTATATTTGTCAAGCGCAATATAAGAAGGAACTTTTGT
+CTTACCTTCAACAGCATACCCAAGAGACATTGCACTATCAATATCATTTGCTAACCCAAT
+CAAAGGCTTATTTTCATCATCTCCTTGAACCAATGACATTAACGCACCTATATAATCGCC
+GTTCTTTTTCCAATTGTAAAGCTTAATCATATTATTTTCTATCTTTATTGCATCTTTTCC
+ATTGTTTCTAAATAAAGCTCCACCAGGTTTCTTTAAATCTATCTCAAAGCTTTTATCCAT
+ATTCCGTATTAAAACTGTTGTTAAAATACCTATTAATTCGTCAGCTATTATTCCTTTTGG
+AGTTATAGCTGTTTTAAAGTCCCACCCTGAATTATCGCTTAATCTTTTATCAGATAAAAG
+AATCCCTTTTGTCCCACCTTGAACACATCCAAAATCAGGATCATTTGGATCCAAAACTTC
+TTGAATCCAAGCAACTATATCTAATTTTTTTGCTCTATCTCTTTGTGCTAATAATGGAGC
+TTTCATAGCATTTATTGCTCCAATTATATTTTCGCCACCTAAATTCCCATCACCATCAAA
+GCTTCCTGCAATAGTATCAAATGTTACACTCTTATCTGCTTGTGCTGATGCATATGTGTC
+TAAATAATTTCCTATTTCACAATTCAACATTTCTTCATTTAAACAATCATATTCAAGTGA
+TATACATCTAGCTTTAATATTAATATCTAATGGTTTATGTTCTATATATACTGTATCTCC
+TAATAAAATCTCTTCTAGTGACTTATACTCTTTATATTCTTCAGTACTTGATAAAGGAAT
+AAATTGAACACTATAATTTACTAACGGCTTATCTATTCCTTTACTTATAAGCTCCTTACC
+TTTATTTTTTAACGCTTCATTAACCTGCTCTTGTGTATCAAACCCCTCTGCATTTTCACC
+TTTATTGTTTGGTGTCCCTTTTAACTTAATATCTTCAAATCTTTGCTCTGATTCAAACAC
+ATGACTATAATTATTAATTAATGGAGAATCTACCCATGGAGTTGTTCCACTTATACAGAT
+ACCATCATAACCAGTTGGTATTACTCTAGTTATTAAACTATCCATATCTATTGTTTCAAC
+TAAACCTGTTAAATTCTTTTTATATGCAATTCTAACATTATTATCTTCTCCTACTCTTTT
+ATTTAAGTAAATATCAAAATTATTTAAAAATAATTCTCCTCCCCATCTACTTAAAAAAGA
+ATTTTCTTTATCATCTCCACCTATTGCTTGTACTATCTTCTTTCTAAAATAATAAGATGT
+TGCTATCTTTTCTATATCTGAATGTCCTTTAAACTCTGTCCCTTTTAAAATTTTATCTAA
+TGCTTGTTGTCCATTACAATTTACACATCTAACATCAAATATATTTTCCTCTCTAGTTAA
+ATCCTTAATATATATGTCAACTAAGTCATAGAATATATGCCTTGCTTTTACACTCATATA
+ATCTAAGTTTTTTTCTATATCGTAGATTCTATAAAGCTGTTCTGGTATTTTTTTATATGG
+TGTACTAACTTTTATAACATCATCTCTAGAAATATATTTCCATCTTTCCTCTTCATCATA
+TTCATGCTCCATTGCTACTTCATTTAATCCAGTTACTAATTCCATTTTCAAAGTACATTT
+AGAAGGTTCTAATATCATATCTCCATTATTAACAAAATTCTTATTATTAAATTTATATAA
+TTGTACTTTCCCCATAAGCTTAATAATAAATATAATTAGGAATTATATTTATACTCTCTA
+TATTTCCTTCCCATCTAATTGTATTTTCCTCTAATTTTAAAATAGGAAAATCTCCCTTCA
+TGTACTTATTAGTTGGATTATCTAAAGTATCTTTATAACATAATTCAAGTTTAGAATTTA
+TAGTTGTTTTTCCCATGGTTAAATTTAATTCTATTAAACTTTCATTTATCCATAACTTTA
+TATCTCCTTCTCCTTGTATAGTTATTATTGGTTTACTTTCAAAATCTCCACTATTATAAA
+GCATGTCCCCATTATTTATTTCTAATTCTTCAGCTCCATAAAAACTATATGCAAAAGGTT
+CTAGTGTAAAAGTAACTTTGAATTTACCTATTGTTTTTAATTTTCTTTCTATATCATCAT
+ATTCAACTTTCTTAACTATATAAAAATAAGAAGGATCATCTCCTTCCCATAATTTTTTGT
+CTTTAATATTATCTAGCCATCTTCTTATTCTTCTTACTTTTTCATGAATATTTTTCCTAT
+CAATAAAGTTATACTCTACAACCAAAATTCTATTTTCATAACCTATAATTTTATAGTCAG
+TCCCATCCTTACCATCAATTTGTTGTTCTCTATATCTCTTTTTTAGTGAAGGGAAGAATG
+GTCTTTTTATTGCCTTAATTCCTATTTCTAAATCTGTGCAATTATTGAACCAAATAAAAT
+ATTTATGCACATATTCGACCTCCCTTCTTTCCTTTAGTAACTCTATAACTATTTTCATCA
+CTTTTCATTTGTTTAGCTACTTTCTTATATACTTTAGTACTGATTACTTCACCATCTAAA
+TTAGTTACATTTTCAATTACAACTACTATATTATTATTGTTTGTATTATTAAGTTTTGTA
+TTTATTTTTTCTAAGTCAACATTTGATATAGAAGGTACTATATTAGTATTTATAGTTCTA
+TCCAAACTTTGCTTTATATCTAAATTTATATCTTCCATTTCATTGACAAAACCTACTCCA
+ACACCTTGAGCCATAAATTTACCAACCTGATCTCTTAACACCCTAGATGGAGAATGTATA
+TCTAAAGAACTTTTAAATCCTTCTACAATTCCATCACAAAATTGTTTTATCTTACTTTTT
+ATCCATCCAATAGCACCTGTTATACCATCCCAAATCCCATGAACTATATTTTTACCTATC
+TCTTTCATTTGTCCTGGTATAGCTTTTACTGTATCTACTATAGAATCAACTAACTTTTTA
+CCACTCTCTTTACCAGCAGTCTTTAAATCTTCTCCCCATGCACTTACCTTATTCCAAGAT
+TCTTTTAACCAATTTTTAAATCTTGTTGGTAGTTCTTTAACATGATCTACTATAGAATCA
+ACAAATTCCTTTCCCACTTTCTTAGCTTCTTGGTACATATTATTTCCCCATGTAGTAACT
+CCATCATAAGCTTCAGTAATCTTATTCCAAATTTTATGTGGTAGTTCCTTAACATAATCT
+ATCACTCCATATATAAAATCCTTACCTGTCTTTTTTGCTGAAATATATAAATTATTTCCC
+CATGTCTTTACTTTCATATATGAATCAAGTAATTGTTTCCCTATTGCTTCAGGAAGCTGT
+GCAAACCATTGCTTTATAGAATTTATTGCATCTGGAATAGTTTTAGTGATAAATATTTTT
+ATGTTTAAAAATCCCTTATAAATTTCTCCTGCAATTTTTCCTATCAATATCCCCATAAGT
+TTAGGTAAATTACTAAATATAAATTTTACTTCTTCTATATAATTTTTTATTCTAGTTTTT
+ATTATAGTACCAAACTCTTTTATTTTATTTATGAAGTCTGTTTTAAATTGTGTAAGTTTA
+GATATTAACCACTTAAAGAAATCAGGAATACTTTTAGTAAAAAACTCTTTAATATTTGAA
+AATAATTTGTCCACTCCATTCCTAAATCCTTCACAATGCTTGTAAGCTAATGCAAAAGCT
+CCAGCAAAAGGATTAACTATAAGCAACAAAATTTCCTTCCAATCATTTTTAAAGAAATTT
+ATTAACTGCTTTAATTTATTAGGTACTGTTTCTGTAAAAAACTTTATAAGTCCACTAAAT
+ATTTTATTAACTCCATTTCTAAACCACTCGCAATGATTATATAAATAAGTTAAAGCTCCT
+ACTACTAATCCAACGACTAATATAATTTTTCCTACTGGAGATATTTCAGTAACAAAATTT
+AAAGCTTTCTGTGCTGCTGTTTGTAACTTTGTAGCAATTTTTAATTTTTCCATAACATCT
+CTAAATGCTTTATAATCTTTAATGGCATTTCTTATTGTTCCTGTAACTTTAGTTGTTACT
+GCTAAAGCTCCATAAGAACCAACTACAAAAGCTCCTATTCCCACTACTGCCTTTTTTTGC
+CCTTCACTTAATCCACCAAAAGCTTTAGCTATACCACCTATTCCCTTAGCAGCTAAAGAA
+ATAAATGGTGCTAATACTTCACCAAATCCAACTAGACTATTTTTAGCTAAGTTTAAAGAT
+GTTCTTAAATCATTTCCAGTAGTATTATTTATTTTTGCAAGAGCTGAATCAGTTGTTCCT
+ATAGCCTCATTCATTTTCTTAGACTTATCTGCCAACGTATCAAACTGTGAACTTGTTAAT
+GCTGTAATTGCTGTTAGTCCTTCAGTACTACTAAAAAGTTTTCCCATTTTATCTGATTGT
+CCACCAGTTTCTTTTTGTAATATTTTTAAAGTACCAATTAAGCCCTCACTTTTTAACATT
+GCTTGACCATTTTGGAAGCCATATTTCTCCATTAATTTTTGCATATCTGCTGTTGGTTTA
+ATTAAGTTACTAAATACTGCTTTTAACTGGGTACATACTTCTGAAGTGTTTCCTGTAACC
+CCTGTTAATGTAGCCATATTAGTAAATAAATCTGTCATTGATAAATTTAAATTGCTTGCT
+AGTGGGAATAATGGTTGCATGCTTGAAGCCATTTCTGGAAAAGTTGTTACTCCCAACTTA
+GCTGTTTGGAAGGCTAAATCACTTATCTTCTTTGCTGTTTCATCATTAACTTGATTATAT
+CCTTTCATTCCTGCACTAATTAAAGCAACTGCATCTTTAACCTCTGCTCCACCAGCCTTA
+GCACTTTTAGCCATAGTATCAAATATCTTCTCTGTTTCTGCTCCTCCATCTCCAATTGAT
+GAAATAGCCTGATACATACCATCTGTTACAATCTTCAAATCAATTCCTGTTTGGTTTGAT
+ACTTCCATTATTTTATTTTTATATCCTTCTAAATGACTTTGGTCATCTAAAAGAGTATTT
+ATATTTGCTATACCATCCTGAAACTTCATTTCTGTCACTGCAGCAGCAACACCAAATCCA
+GTAACAGCTATTGCTGCTGGTTTTAAAGCACTAGCTGCCTTCCCTGTAGCATTGCTTACC
+TTGTCCATTTTTTGAGAGAATTTATCTAAATTGATATCTTTTAATTTCTTATCAACCTCT
+TCTAAAGCTTTTTTATTTTCTAATAGCTCTGTCTTAGATTTATTCATTTTCATATTTGCA
+GTATCTATTTTTCTATTAGATGAATCTATTGCTCTTTCATTCCTAGCATATTCTTCTTTT
+AAATCAGCTAAAGATTTTCCTAACTTTTTTGTTTCCTCGCTATTCTTTCCAGTAGCTTCA
+GAACTTTCTTTATATTTTTTAGTTACTTCTTCTATTTTTTTAGATAATTCTTCTCTTTTT
+TCTTTTTGCTTCTGAACATCATTAGTCAACTTATTAATTGCTTCTTTTTGTAAATTAATC
+ATTCTATTTTGAAGTTTCATTTTTTCAGTAAGCTCAGCCTGTTTTACTTTTAATTGTTCA
+TTAGCATTACCAAATAATTTAGCCTGAGTACTTGCTAAATTAAATGTACTGCCAAGAGAT
+TTAAGCTCTCTTACCATATCCTTCATTTGCTTTTGAAAGTCAGATGTATTTGCTCCTATT
+TTTACATTAGCACCCATTAATCAACCTCCTTTCTTCAACAAAATAAAAAGGACTATACAT
+CTGTATAATCCTTGTCTTTATTCTCTTCTAAATATTCAAATTCTGAATTTATATAATCTA
+ATAAATCAACTATAGAAATATCTAAACATTCTTTTAAACTCATGTTACATTGTTTTCTAG
+CAAATCTAAAAATACTATATAATGTGTCAAGAAGATTTTCATATATTGTTATTTCTCTTT
+CTTCTTCATATCCTTCTTCTTTGTCATATTCTTCAAAGATACTTTTTTCAATTTTAATTT
+CCTGTACTGATCCTAAAGATTTAAATCTTTCTACAACTTCATTCTTGATATAAATTTCTA
+TAAAATTAAAAATGTAATACAAATCTTTTATATCTAATCTTTCCAAATTATTTTTTTTAA
+TATTTCCATCAAATATTAAATCTATAATTCTATATATTAAATCTAATCCATTAATCGTAT
+TTTTATATTCAAGATATTTTTTATACTTATATCCAGTTATATCAGTTGCATAAATTCTTT
+TTCTATTGCAAGAAATATTTAAATCACTTATTTCTTGCCCTTCGTAAAAGCCTTTTGTGC
+CTTATCTATATTCTTATCTAGTTTTCCTACTATCTCTATATCACACTTCATAAATTCAAA
+TATGATTTCAGCAACATCTAAATTGTCATCTATATCTTCTTTGGTAAATTGATTATCATA
+TATAGTTACTATTGTATCTTCCATTAATTCTAAATCATCATCGGTATAATCAATTTTCTT
+TTCCTCTTTTTCATTTATCTTAGCTTTAGCTTCAGTATATGTTCTATACTTTTTTCTTAC
+TATTTTTCCACTATCATATGTAGTACCATTTATCTCTATCTTCATAGTTACTCACTCACT
+TTCTTTTCTGTTCCTAAACTTTTAGGTTCTTGAACTTGTCCAAACCATCCATCTAAAACC
+TCTTTTGCACTTCCTGCATCAGCAAGATCCATTTCATCTGCATCCACACCAATATTACGA
+TCTTTTTTTCGTGGTATTATAGTTCCTTTTATTTTTGCATTTTGTCTTTTTCCTTTTTTA
+GCTATTGTTTCTGCCTCTTCATCCTCTTCTTCGCCAAAATTAACTCTATACCACCAATAA
+AATTTATATAATCCATTAGTTAATTTTGTTCTATATCCTATAGCTACATCTTTAGCTTTA
+TCGTCAGCATTTATAGCAGTCATTCCACCTAAATTTTTATGACCTCTTATCATTTCTCTT
+ATTTTTCTTGATAGATAATCCCCTTCGATTTCTATAGTTCCCTCTTCAAAATCATTGTCA
+CTTTCATCTTGAACATCATCAAAATATACTGGTTCATTCGTATATTTTAATTTTGTTTTT
+ACACTAGCTGCCTTCATTAATCTAACTGGTTTACCAGTAGTATAATTTTCAGCACTATCT
+TCTGTTATTGGTGCTACATATAAATCTTTTAATCCTTTTGGTTGTGCCATATCAACGCCA
+CCTTTCTTAATCTAATTCTTCGCTATAATTAAATCTCATAGCTTTATGATAAATTTTCAC
+ATCTACTTCAAATTGATCATTACTATCCTCTAATAAAAATCCATTATCTTTTAATAATTT
+CTTGACCTTATTTTTTAACTTCAATCCTTCTTCACTATTAGTTGTCCATATATCAACTTG
+TATATTATGAGTAATTGAAACTTCTTCATCATCTAAAAAATCCTCTGGAGCTTCTAAATA
+TTCAAAGAATGTAATATGTGTTTTTTTTAGCTCTTCATCATACCAACCTTCAAATACTGG
+AATATCTAAACTACTTAAACTATCAGCTACCAAAGCAATAATATCAAACTCCAATATATC
+ACCTACTTTTCTAATTTCTTCACAAGAGCTTCATAATGATACATAGCAATAGTATCATAT
+TTAGTTTTCAGCAATTTATTAACAGTACCAAAACTATGATGTGGAGGTCTTTTAGTTGTT
+CCCCACTCTTCCATCTTCATATAATAATAAGGACTATTATCCGTTTTATCCCATCCTATA
+ATTACATATAAGTTTCCATTCTTCTTTCTAAATTTAGGTTTAGGAATATTATCACTTGCA
+TGCCCTGGTGGTCTGCTTCCTTTCCTCCCACTCTTAGAATTATCTTTACTTTTATGAATT
+TTAGGCTTTACAGTATCATAAGCTAATTCACTACAATCTTTAAGTATATCTTTATTTACT
+CTTTCTAACCCTTCATTTGTAGAAATGCTCTCTGCTGTTTTTATAAGTTCATCTAATCCA
+ACAAACTCCATATTAATCATTAAAGCACCTCTTTACATTTTAGTTTTATAAAATCCTTTT
+TATATCCTAAGAAATCAGGATAATATATTTCATATTGTCTACCTTGCCATTCAACTATAA
+AATTTTCTTTATTCCTAAGCTCTTCTAACTTTTTGCAATATCTAACTTTAAATATTACTG
+TATTCTCTAATTTCATAGCCATAGCTTCATATAATTCTTTACCATATAAATCTAATACTT
+TTGCTCTACAATCATAAAAGGGAGTTGGCTCCCTTGGTGGTTGCCTTCTCCCTTTAATAA
+TTACTTCTTCTATTTTCTTTATATATATTCTTTCTCTTAGCCTAGACATTATTATCACCA
+CAATATTTCAATTGAGTTATTATTGAATTTAATGCAAATTGAGCTTTATCATTTTTATTG
+CCAATACTAATACTTTCTTCATCATCATACCAGTTCTTTACAAGTAATTTTACTGCTAAT
+GAATAAAGTTTCTTTCTATAATCTTTTTTCACGCCAGCATTTGTTAAATATTCTTCTGCT
+GCTTCTAAAAGACCTAATAAAAGATCATCATCTTCATCACAATCAATACATAGATATTTT
+TTTAATTCTTCCAAGCTCATTTTTAATCACTCTACGCTTTAGCTTCATTTACTTTTACTA
+TTAATCCAAATTTTCTTATTACTGCTGCATCTTCTGATTTTTTTAATGGTGATTCAACAT
+CAAATCTTTCTATAATTCTAGCTATAGTTTGATTCTTAGTATATCCAGCTTCTTTTGATT
+GATCTATTAAATATTGTTTTCTATCCATAAATTTAATTAATGTCTTTAAATCTGCAATTA
+TAAACTTGATTTCCTCTCCTGTATTAAATGTAGTTGAGTCTAATTCAACCACATCTCTTC
+CCTTAAATATTAAACTTCCTCCATCTGATAATTCTTTTAAAAGTGGTCTACCTTGCTTAT
+CCATTAATGCATCTAAATAACCTCTACCTAAAGAATTAGTAACAATAACAGCTCTACTTC
+TTGCATTAGGAACTAATGAATTTATTTTCTCAACCATTTCTATATAATCTTTCACTTCTT
+CAGTAGCTAGTAATTTATTAGCTTGATCTACTACTTCGCTATTTTCAGTATTAACTGCAT
+ATTCTACGAATTCTTCATTTACAAATTCTAAAAAGTTTATTTCACTATCTTCAAGTAATG
+AGTTATCTATCGGTGCAAGTAATCCATAATCATTTATATCATATGACATAGGTTTAGTTT
+TCATCATAGCCTTAACTAATTCTGTATCTTCTTCTAAATTTGCAAGTTTAGTAACACTTC
+CCCCAGCTCTTACAGGTAACTTTCCTGAATTTCTTGCAACTGGTATTACATGACAGTATG
+ATTTTAAAGCTGGATATCCCTCTTTTAATTTTTCAAATTCATTAACAAATTCTTGAGGTA
+TTACAGCTCCATTATTTGTTGCTGACATAACATCTCTTTCTTCTTCACTTAAAGATATTC
+CTCTTACAACTTTACTCATTGCGCTTAATTGTAAACTTCTTTTTTCTTCTTTTGAACCTT
+CTCCACCTAAAACTCTTCCACCTGAAAAGTTACTGTTGCTTCTTTCCTCTTCAATGGCTT
+CCATAACTGATTCTATTTCTTCCTCAATTATTTCCATTCTAGCCTCTATCTTTTCTCTTT
+CAATAGCTTTACTTCTTATTTCCTCTTCCTTCTCTTCTTTAGCTAATGATCTAATCTCTT
+CTACTATTACTTTTCTTCTTTCCTCTAAGTCTTTCTTCTTTGCTCTTAATTCTTTTAATC
+TTTCAAATAATTTCATTTATAAAATCCTCCTAAATTTAAATAATAAAAAAAGAGCTTTAA
+CAATATATAAGCTCTAATAAATTACTTCTTTTTTCTTCTTTTTTCTTTGCATTTATTTTT
+ATTTTTTCTAAGCTTCTACAATCTACTTCAGTATCTTCATAAGCAGGAAATGGTGTTGGT
+GATATTTCATATAACTCAACTTCTAATAAAGTCCTTTTCATTATTTCTTCACCATCTTTT
+TCAACTTTACTCCATTTATCGTCAAGTACCTTGAATCCAAATGAAGTACCATCAACATCC
+CCACGCTTTACACTTTCATATAAATCATTAGCAACTGTTGTATTAGGTAAATCAATATCA
+AACCTTAATCCTACTGAATCACTTTCTAACCTTAAAGTACCACTTTTTGTTGAACCTAAT
+ACATTATCAGTATTATGATTATATAAAGCTTTTATAGTATTGTTTCTTAAACTATTATCA
+AAAGCTCCCTCAGCAACAACTTCTACAAACTTATCTCCCCACCAATCTCTTAATACTTGT
+GATTCAACATTATACTTTGATGCATAACCTGATATTGTTTTAACTCCTGTTTCATCATTT
+GACCTTGCTTCAAAATTTGAAATTATATTTCTTACTTCTCTTTTAACTTCCTTATGCTCC
+ACTATTATCACCACCTTTCAAATATTGTTTTCCAGCCATAGCTATAGGCATCATATTACC
+ATTTATAAGTAATTCATTTCCTCCATCTTTTGGTGGTAAATTTTCTTTTTTTCTCACCTC
+ATTGGAAGCTATAAATCCACTTTGAATACCAATTCTATAAGCTTCATATCTTGTTTTTAT
+ATCACTTCTTAAAATACTATCTACATTAAACTCAATTTTCACATTATTTAAAGTTTCATA
+TTGACTTAATAATTTATCTTGCATCTCTTGTTCATAATTAGTAAGAGATGGTTGAAGTGT
+TGTTATATAAAAATCTTTCTGTTGTTCTGTAAGATTATTAAATGTTGCTCTCTCTAAATC
+ATTAAGATGATATGACTTCATTCCAAATGCTGCTGCTAATTCTCTTTTAGTTAATTTTGC
+ATTTTCTAAAAATTGTGCATCTGCCATGCTTAATGACAAAGGTTGAAATTGATACCCTAA
+AGGAAGTAATGAAACCGAATGAGCATTTGCTAGACCATTACTCATAGATTCAAATTCTTT
+TATAAAAGTTTTCTTTGCCTTTTCGTCTAGCTCTCCTACATATTGAATTATTCCTTTTGT
+AGTTAATCCACTTTTAAAGAATTTATTTATAAACTCCTGAGTAGCTCTTCCATTCTCAAT
+AGTACATTTCAAATAATCAAGTGGAGCTATTCCTATTAATCCATCTAAAGTAATATCTCC
+AATAAAATGTAGTATTTCATCAGGAAGTAACTTATGTTTAATCCCTTTATTGTCAGTTAC
+TATATACCAAACTTTAGTTAAACTACTTAAAAAGTTATTATCATCCATAACTTTAGTTAC
+ATTATCTGAATCAATAGGATATAAACCAATTATCTTTCCTCTTCTATCTCTTTCTATATA
+TGTATACGCATTACCTTTTAAAGTTCTTTGTGCTTCTAAGCACTTCCAAAAATTAATTGA
+GTTCATTAATGGATTAGGCTTATATCTTAAAAGATAATAAAGTTCATGTTCTTTATACTC
+TTCTCTATCCTTGTAAATCTTTAAAGATAATTTACCTATGCTTTCAGCTCTTACCTTAGT
+ACATATATAAACTGTATTTTCTTTTAATACTCTCTTACCTGATATTAAAAATTTTAATTT
+AATACCAAACTTCTCCCAAAAGTTAGAATCAGATATATTAATACCAATCTCTTCATCATA
+ATTACTTCTTTTATTAAATAACTTTTTAAAAAACTTCATCTATTTTCTCCCCCATAATCT
+CTTTAAGAAATCTTCTTCTGCAAATTCACTCACATTTAAGTTTTCTCTTTTCCAATATGT
+TATAGCTCTAACATGAGCGAATATACAACTTGCTAATGGGTCAATTCTTTTAAATCTGCT
+TTTTTTACTTATTTTTATTTCTCCAAAAGAGTTGGAATCAATCTCTGCATTTTGAACACA
+CCAAGTCATAAGTTTATTATCATCATGTTCAAGTTGCTTAACTTTCATTAAATCTCTAAA
+ATTTACAGTAGCTTCATTTAGTTTTGCACAACTTTGTCCACATTCTACACAGGTATAATC
+CTTTCTTTCTAGTTCTCCAACTAACATTGCAGCTCCATGAGGGTCATAACTAACTTCTAT
+AACATTTAGTTCATATTCTTTTACAATACTTTCTATAGTATTTAGAACTGCCCAAAAATC
+TACTATTAAACCATCATTAGCTTCTGTCTTTATTAACCAACCTTTTTTACTCCATAATTC
+ATATGGTACATTGTCAGTTATCATTTTTTCTTTAACTACTTCTGATGGTATAAATGATTG
+TCCAAATAAAGCATATCGTCTAATATTCCCATCTAAATAAGGAAACTCAAAAGCAATTGA
+AGTTAAATCCCCTGACTTTGATAAATCTATTCCAATATAACAATCATGTCCTCTGAAATC
+CTCTAAGGTTAATTCCTTTTTACAAGCTTTCCAGTATTCAACATCAACATACCTTTTTTC
+TCCTGCTGCAACATATATATTACAATTCTTAGTAAAGAACTCTATTCTCTTCTTTTCATT
+ACTTGTATTCTTAGCTAATTTAGCATTTTCCCTCATGCTTTGTATTCCTTCAGGATAAGT
+ACATAAAATTGGATTAGCCTTTAACCAAACTTCTTCATCAAAAGGATCATCTTCTTTTTC
+TAGCTCACAAATCATTACAAAGTATTTATCATTCTCAAAAGTTCCATCTAATATTGAACA
+ACAATCTAAATATTCATAATAACAAGCCGTTTCTTCGTAGTCCATTCCAGCCGTAGTTAT
+TATTACTAATAATGGCTCTGTTCTTGCCATCATACCTGATTTCATAACATCATACATATC
+TGAATTAGGATGTGCATGATACTCATCTATAATAGCCATTTGTGGATTCTTACCATCACC
+AGTTTTACCAGCTTTTTTACTTAAATGCTTCATAAAACTATTACTATTTCTATGTCGTAT
+TTCTTTTTGAGTAAACTTAAATTTCTTCTTTAATGGTTTAGAAGTCATTAGCTCCCATTC
+ATCAAAAACAATTTTAGCCTGATCTCTTTCAACTCCTAAAGTATAAACTTCTGCTGCATT
+ATACCCTTTTGCTCCTATTTCATAACCAGCCATTCCAGCTTCCATTTGAGATTTTGCATT
+TTTTCTCCCTACTTGAATAAAAGCAAATCTAAACCTTCTATAATTTGTATCCTTATGCTT
+CCAAGCTTCTATATTACAAATTACAAACTTTGACCATGAATTTAATATTATTGGTTGTCC
+CTCTAATACTCCTTTTGAATGTTTACAGTAACTATACCACTTAACAATTTTTTGAGCTTC
+CTCTTCATCCCAATAATACTCGAAATCTTCATGCTCCATTCTTTCTAAATCATTTAGAAA
+TCTCTGACAAGCTTGTTTATGTCTTTTACAAGCAACAATTTCACAATTTAGTATTTTATT
+AGAATAATCAATAAGCTCTTCAAGAACTGTATTATACATTTCCAAAATCCTTATTAAATG
+CTTTTTCATCATCATCAATATCAGATGCTTCTTGAATAATTTTTAATCTTGCTGCTGGAC
+TTAATCCAAACTCTGCACCTAACTTTTTAATAACATCAGCATATTGAATTTGAATAGAAA
+TCAAAGGATTCTTTTGAGTTGTTAAAGATCCTTGTTTATTAATATGTGTTACTGTAAGCT
+CATCACAATTTAACTTCATGGTACATTCTATATATTTTTCTATAGAGTTAGCCAAAACAG
+CTAAATTATAATTATCAATATTAGCAAGTATATCTACAGCTTCTAACTCTTTAACAATTT
+TCTTAAAAATACTTTTACCATCTTTGGATAACCATGTTGGTGGTCTTATTTTATCTCTAG
+GTAATTTTTTTAATTTTTCTTCTTGTTCTTGTCTTTTTTCAATTTCTTCATTAGTCAAAT
+GGCTCTTATTACCATTTGCAATAATTTGAGAAACTGAAATCATCTTTCTTCCCAAACCTA
+ACATTACCCCCCTTTAGTTCAAAAAACGAAAAAATTTTTTCTGACATAGATACTGCGACC
+TTTTGACACTCCTTAAAAACTTTTTATACACCCCCTACCCTTTAGGAATTAGCTTAAATA
+ACTCTTCCTGAGTATTTCTTTTAGTAACCATACCTTTTCTATATTTAGCATGTATCTCTT
+GGTGACATGAATTACATAAAGAAAGCAGGTTGCTTGTCCTTAATCCAAGCTCCCTGCTTT
+CCTTTAACTCTATTATGTGATGTACAACATCAGCAACTCTTATTCTATTCTTACTTAAAC
+AAACCTTACATAAACCTAAATCCCTAGCAATAACGTTAGTCCTAACTATATGCCATTCTT
+TAGAATTATAAAAAGCTTGTTCATCTTTATCTTTTCTTCTTACCTTATAATTCTTATGTC
+TATCCTTATTATCAAATGAATGCTTACTACAATAAGTTTCATTTAATTTTATAAGGTTAT
+TACATCCACTATAGTTACAAACTTTTTTAATTTTTAATCGCTCCTAATAAATATTTTAAT
+GCACCTTCAATTTCTTCGTTAACTTTTATCAAAGAAGTATTTTCTTTGTATTTTTCCACA
+AAGTCATCTATACAATCTGACTCTTCCTGACTTTGTGGAATTAATTCTTCTCTTAGCTCT
+GTTGGTCTCATATGATTACTAGCTTCAATATTATTCTTTAACTTAGTATCTTCTACAGGC
+ACAAACTTTAACTTAGGTGTAGTACAATCAACCGTTTTTTTATACTCATCATTCAATATA
+TTTTCCAATAAAAATTCTATTATCACTTCGTGATTACTTTTTTTATCAATCAGTCTTTTA
+TTTTCAATATATAAATCATATATTTTCTTTATAATTATTATACTTTCATTGGTATCATAA
+ATCATTAGTTCATATATTAAATCTTTTACATTTGATTTTATTTCTGGAATTATAAATCTA
+AAATCTTCACTTACTCGCTTAACCCCCCATGTATTACCTGCTTCAAAAATATAATAAAAA
+AAATCTTCCTTAACTGAATTAATATACTCTAATAACTCAGTATAAACTATAATATTAATT
+CTTCTTAGTTTTTCTTTTTGCTCAACATTTTTCTGATTTTTAGAATATTCAATTGAAATT
+AAGACAGCAATTATTGTTGCATATGCTCCTATTAAAGTAGTTACTACTGTAGCACAAAAT
+ATAATCCATTCAGCAACTTTAAAATGATTACCCCATACTTTCCAAATACTAAATAATGAA
+GCATATACCAATATTGATATTACCCCTAAACTTATTGATATATTTTTTATTATGGTTTTT
+TTATCCATTTAATCACCTCAATAACATATTATATATTATTGCAATATCAAGTTCAACAAC
+TTGCAAATAATACCCCATAATACATATTGTGTGGTTTAAATGAATTATCTTCAAAGCTTC
+ATAAAATCTAAGTTTAAAGGTAGTCTTAAAATTTAATGCCACCTCATTCTTTTATGTCCT
+ATTTAATAGATTTTAAAACCTTTAATCATTCTATTTATATGGCTCTGTTCAACCCCTATA
+TAATGTAAAGTTATTGAAGGGTCAGAATGATTGAATATCTTTTGGAGTGTAACAACGTCC
+TTATATTGCATATAAAAATGATATCCAAAAGTCTTTCTTAAAGTGTGAGTTCCTAAGTTA
+TAAAGTCCTAAAGTTTCTCCTGCATCTCTTAATATAGTGTAAGCTTGTTTTCTTCCAATA
+GGTCTGTTATAACCTTTCTTTGATTTTATAAGAAATTGGTCTAAATCTTTTTCATCACAA
+TATTTCTTTATTTCTCTTTTTAATATTGGTGTCATTGGAAATATCTTTTGCTTTCCAGTT
+TTCTTTTCTCTAATGGAAATATAATCTTTTCCTTTAACATCTCTAATTCTAAGACTTAAA
+ATATCACTTATCCTTAATCCTGAATTAATACCTAGTATGAACATAATATAATTTCTTTCA
+CTATACTTTCTTAAGTAATTAGCAATCTCATGTACCTTATTTGAATCTCTTATTGGTTCA
+ACATAGTTCATATACTACCTCACTTAACTAAAATTATTTCTTATTCTATGAAATACAAAT
+AAAAGAAAGAGTTTTTATTATAATTAAAACTCTTTCTTTTATTTATTATGGTACATAAAC
+TCTTACTATTTTATTAGAATCTGATGAATTTATCTCTAGAATTTTTTTTGTTTTTAGATA
+TTTCATCTTTGTATAATGACAATTATATGTTCCAAAGAGTTGAATATCTCTAAAATCATC
+AAAACCATCATCTTCCCACATGATACTTATCTTTTGCGAACTACTATCAAATGCTATAAC
+TATTGAAACATTTGCATTAAATGCAAGTTTCCTTCCTTTTTTTAATAAAACTTCTACCTT
+AGTATTAAATGGTCCATTTTGATGATTATTGGCAAAATAATATTTTTGTAATGCCTCAAC
+ACTCTGTAATTCTTGGTCTCTATCCAATTTTTTTCCCATTATTATCCCCTCCACAGATAA
+TTATAAGTTAAAGTTTTATAATTTTCAAAAAAATTTATTATTTTTGTCTTAATGCTCCAT
+TTACTCTTTTATAGCTACTATGTTTCATACATTCATCAATTCCTTGACAAGGATCATAAA
+TAACTACTTCTTCTTGACACTTTCCTTTTTGATATTTACTACATAATGGTGAGAAAAATG
+AACATGCACATTTAAGTCTGTTCCCTTCCCACAACATATACATAGGTAACTTTCTCTTTT
+CCATTTATCTCACCTCTTTTTTTACAAAGTAAAAAGAGCCAACTATAAAGTTAGCTCTTC
+TAAAGTTTAAGTGGTTATTCATTTGATACTATTATATTAACGCATATAAAGTTAGCTATT
+CAACCACATAATAGTTAGAGTTTAGTCAGAAATTAGTTAGACTTTTTAAATTCATCATAT
+CTAACTCTATTTTCTTAATTATTTTTGATTTTTTGCATATAAGATATTTAGGATTCATCC
+CTAATCTTTCAGCAATACTCTCCATATTCATTCCCCTAAAGTAATATGATGTGATTATCT
+CATACTCAACTTCATCTAAACATGATATTAGGTTTTCTATTTTCTTTATCCTCAACTCCT
+TATTTCTTTTCAAATATTTAAGAAACTGTATTCTCTTTTCCTTTGATAAAACTTCATTTA
+CTACTGGATCTGTTATTTTATAAGTTGTTCCAGTTCTTTCTGAATATTGTAATGCTCCAC
+ATCCTTGATATTCATTTTCTACAGTTGCAATTTCTAATTCCAAAGCTCTTATTTCTCTTA
+CTGTTTCTTTATAACTCTTTAATAATCCTTCTACATCATCCTTAAACTTAATCATATTAC
+CTATCATTTGAATACCTCACTTTAACTTTTTTTATTTAAACTAACTAAGTTGTACAATAT
+ATAGCTTTTGTAAAGGAACTTTCACATCCTTTCATAATAACTTATATCCTAGTTAGTAAA
+AATCTTTTTATTTACTTAGTCATTTAATATTTATTCTCTAAACACCTTCTAATTAACGAT
+ATACTTCTTATTCCTAGCATACCTTTTAATATTTTCAAAATTAAATTTTTCACTCCTGCA
+CCTACTATATTTTTATGAATAACTATCTTATTTTTGAATATAATATTAAATATAATATTA
+AATATAAAATTAACCATTGAGGTGATTAAATGCAAGGTGATTTAACATTACTGATAATCT
+TAGTATTAGCTTTATGCATATTAAAATGTCTTTAATTTTTAATTAAAGCTATAGAATAGA
+TATATATGTATCTATTCTGTTAGATCATATGTTAAAATAAATCAAATAAACACTTCATTA
+ATCACCTTTAAGATAGAGAGTTGTAAAACACAACTCTCTTTTTGATTACTCTTAGTCACT
+ACCTAGAATGGAATATCCCCATCATCAACTGGTATCATATCATCATTGAATTTATCATTA
+TTTACTTTACTATCACTTGAATCAATAAAATCAAATCCATCAACCGCTATATAAGTTATA
+TATCTTCTTGTCCCATCTTGTGCATCATAACTTCCAGTTCTAATGCTCCCTGATATACTA
+AATCTTTTACCTTTAGTTAAATACTTAGCTATGACTTCTGCTCTTTTTGAATAAGCTATG
+CAATTTATAAAATCAGCTTCTTGTGTTCCATCTTCTTTTTTAAAATCTCTATTAACTGCT
+AGTGTAAATCTTGTTACTGCTGTTCCTTTATTAGCAGTAAATCTTAATTCAGGATCTTTA
+GATAATCTCCCAACTAAAACAACTTTATTCATTTAAATCATCCTCTCTAGTCATAATACT
+TTCTATTATTTCTTCCTCTTGCTATGGCAATAGTAGTAAACTTGTATTTATCATATTCTA
+GTTCTTTTGCCTTACGCTTCTTTTTTAAGTCATTAACATATCTAGCAACAAATTCTTCTT
+TACTTAGTTTCATATTAATCACTCCTAAAATTCTGATAATCTTTGAGTTGGCAAATTATA
+ATTTAATTCAACTACTCCAGTTCTACCATTTCTACACTTAGCAAAGTTTATTTCTAAAAC
+ATCATCTACAATATCTTCCTTATCCTCTCTTGCTCTATAATAACCATCCCTATAAAGAAG
+TCCTATTACATCAGCATCTTCTTCAATGCTTCCAGTATCTCTTAAGTCTGATAGTATTGG
+TCTATGGTCTGCCCTTTGCTCTGATGCTCTTGAAAGTTGACATAATGCTACCATTGCTAC
+ATTTAACTCTTTAGCCATAGCCTTTAATGAATTTGATATATAGCTTGATTGTTCATATTT
+ACTTCCCTTTGTTGTCGGTCTTATTTTTCCTATATGATCTACTATGATTACATCTAACCC
+ATACTTTATTTGAATTTCTTTAGCTATTAATCTTATTTGATTTACTGTTATTGATGCAGG
+TTCATAAACAAATATGTTATTCTTCCTGCTTAACCTATCAAAAACATTTAATAAGCTATT
+CATCTCAGAATCATTGAATCTTCCTCTAGCAATCTTTCCATTTTCTATACATGTATTTGA
+AGCCAATAACCTTTGTCCCATTCCTTCGGTACTCATATCTAACTGAATATAAAGAACCTT
+GCCTTTTATATTTTCCATTATTGATAGTGATAAAGCTGTCTTTCCCATTGAAGGCCTTGC
+TCCAAATACAATAAAGTCTTTTTTCTCTAATCCATTTGTCGCATTATCTATTTTTTGAAT
+TCCTGTACTTATTCCAGTTAATCCACTTTTATTATTAAAAGCTTTTTCTATCTTATTTAA
+AGTTTTCTCCATTACCTCACTCATTGTATAAAATTTATCTTCTCTATCTGATGAATTAAG
+CTCAAGCAAAGTATTTTGTAATAAATCCACTTTTGATTCAATACTTCCACCATCAGTTAT
+TATACTTTTACAAGCAACAATTAACTTTCTTTCCTTACTCTTTTCTTTAACTAAGTTTAA
+ATGACTATCAAATGTACCTCTTGATGTGTGATATGATATTTCAGTTAAATCAGATAAGGT
+TATAGCTTGTGCCTTTATTTCTTTGGATAACTTCTCAGCGACTATTGTTAAATCAAAACT
+TATGTTATCCTTAAACAACTCTCTCATAGCTCTATATGTAATTTTATTTTTAGAGCTATA
+AAAATCATTATCTTCCAAAGAACCCATAGCTTTTATCATAAAATCATTATCTTGTATAAT
+AGTTCCTAAAATAGCTTTTTCACTATCAATAGCATAATTACTCTCCATACTCTCACCTTT
+AATAATCAAAATTACCTTTCTTTATATTAAGATTATCTTTACTTATTTCTTTTGTTCCTG
+CTCCAAGCTCTTGATTTAAATATCCTTCAAACTTATTACCAAATAAAGTTTCAGGCCTTA
+AATATTTCTCATACTCTGTACCTTTCCATTCAGAAACTTTATTATCTATAACCTTAAAAA
+ATTCTTCTTCATTGAATCCTTCATCTAATCTAGCTTTAATTAAAGATTGTGTCTTTCTAG
+TAGTAGCTTTATATGATTTTCCAGTCTTTGAATTGAGATACTCTATAACTCGACTATATA
+TAATATTATTTATATCTCTTATAGAAGAATCTTTGTTGGGATATATTGTCCTAACCCTTG
+GGACACTTTGTCCTAACCCTTGGGACATTTTGTCCCAAGGTATATATTCTGTTAAGTTAT
+CTAATTTTGAAGTAACATTTATATAAGAAAATTTTCCTCTTATCCCATCTTTACAAAATA
+AAACTTTTCTTTCTATTATCTTTAAATCATCAAACTTTTTTAATCTTCTCTTAAGACTTC
+TTTGAGTTCCTATTATCGGTATTTGTTCTAATAAATATCCCTGATCTATCCATATAAAAC
+GCTCTCCATCAATAATTTGAAACTGCATATTTTTACTTGAATACATATCTTTAATTACTG
+ATAATATAAGAGCATCATCATTATCTAATCCTGATTCTATTAATTTTTTCTGACTAAATC
+CATGAATTGTGTATTTCAATTTTATACACCTCTTTTCTTGCCTAAATTAATCTTGGATGC
+TAAAATTAAATTGTAAGTATTTTTGAGTGCATTGATTGCTTTGGTCGGTATCAATACACT
+TGTTTAGAGCTTCTTTACATGACATACCATTTAAAGAAAGCTCTATTATTTTTTCAATAA
+TTTTATTCATCTCAACTTTATCCATATTTAAACCCTTCTTACTAGCATTTCTGCTTCACT
+CAAAATCTCTAAGAATTTAATTTGTGATGTTTTCTTTCCAAAGCCAAGTCTATTAAATCT
+GATATCCTCTTCTGCAATACATAAAATAGTTTTAAAATCACAACTTGAATATTTGTTTTT
+TAATCTTTGAATTGCTTTTAATACCATAATTACCTCCTATAGCTTGTACAAATTATTTGC
+ATTGTATTATTTCTTTAGCCTTTTCACTTTCAATCTCTATAGCCTTTTTAGCTAAGAAAC
+TATTGAATTTTTCTATAGCCTCCATAGATGGTTGTTTTAATATTCTCACTTTAGTTGTTC
+CTATATATCCATCTGTTATAAATACATTTCCATCTTTTATAATTTTCTTTGGAAATAAAC
+TTCTATCCCAATCTTTAGGATCATCTTTTTTTCTTCTTGCCATACTACCTAATCCTCCCC
+TAAATATTTTTCTGCTATAAGTCTCATTTCTGCTGCTCTCTTTTCTAATTTTGAAAAGAA
+TTTTACTATAATTTCCAATTCTTTTCTTTCTGATACATCAATTACTCCATCTTCAACTAT
+TTTTAATAATGTCTTCTGAATATTAACACTATCATCTAATGTATTAGCTACTGAAATTGC
+AAACTTATACAAATTATCAATATTCTCTGATTCAATTATTGGAGTAATTCTCTTGCCAAT
+AGGACATTCATTACAACAATAATGATTTAAAAGTTCAGGAGCATTATATGCTTCTGCCAT
+AATAACAACCTTATCTACTGGAACTACTTTACAAAGGTCTAATTCATAATCAGTTAATGA
+ATCCTTTGAAATTCCTAAAAACTCTGAAGCTCCCTCCCTACTTGAAAATTTAGAATTAAA
+TTCAGCAGCCTTTTTTCTTGCAATACAATACACATTATTAGCTGCTTTAGTTGGTTGTTT
+TGCCATGTATTTTCTTCTCCTTTCATGTGATAATCAAACTACACAATAAGTGTAGTTAGT
+TTGCAAAAAAAATTTCATCTAAAGTACATCTAAATTTACTTTTAAATTTTTTCAAGAAAT
+TATAACTAGGATTTCTTATTCCCAATTCAATTTTAGTGTAGTACGATTCGGAAATTCCTA
+GTAATTTTGCTATTTCACTTCTGCTTAAATTCTTACTTAGCCTAAATCTTTGTAAACTAT
+TCATGTAAACCTCCTACACTTATCGTGTGATTTAAATATACTACACATTTTGTGTATAGT
+CAAGTTTTTTAACACTTTTTGTGTTTTAATCTTTTTATAGATGTTTTTAACTTCACATTT
+TGTGTAAAATATATATAAGGATGGTGAATATAATTGTTTGGAAATAGATTAAAGACTTTA
+AGAAAAGAGAAGGATTTAACCCAAGCTCAACTAGCTAATATATTAAAAACATCAGCTAGT
+GCTATTGGAATGTATGAGCAAAATAGAAGAACTCCTGATACAGAAACTCTACAAACTTTA
+TCAAACTATTTTAATGTATCTGTAGATTACTTAATTGGAAAGACAGAAATACGAGAATCT
+GCTGAACAATTATTAGAAGATAAATCAGTTACCATTGCTCTACACAATAAAAATGGTATT
+GATGATGAGCTTCCTGATGAAGCTAAAAAGGAAATTGAAAATTTTATTGAATATGTAAAA
+CATAAATATAAAAAATAGTTTTTATAAACTATAAAAATAACTGATATTTATTTGGAGGAG
+ACATTTTAATGAGTACTTTTTTTACAGATATTTCAATTGACAAACTTATCGTAAACCCTG
+AAAATTATAGATTTGATTCTGTTGACAATGAAACTTCAGCAATAAAAATAATGTTACAAA
+ATCATAATAAAGCAATCAAAGAATTATTAAAGGATATTTTAGAAAATGGACTTAATCCAC
+TAGAAAGATTATTAGTATTTAAAAAGAATGAATTTTATATTGTATTAGAAGGAAATCGAA
+GGGTAACTGCTCTTAAAATAATACATAATGTGAATCTTCTAAAAGATATTGAACAAAAAT
+ATTTTAATGAATATTCTAAAATACTTAATAACGCTAATTCTAAAATCAATATTGATAAGA
+TTTCTTGCGCTATAACAGATAATATTTCCGATTCCAATAAATGGATTGCACTTAAACATA
+CTGGATCTAATGGTGGAAAAGGTACTATTCCATGGGATACAACTCAAAAAAGACGATTTT
+TAAATAAAACAAATCCCAATAATTCATCTAATATAATAACTTCATTGTTCTCTTACATAA
+AATCAAGTAACATTTATGATGATACAATAACCCAAAATCTAACTAATATACCTATAACTA
+CACTTGAAAGAATATTAAGTGATCCATATGTAAGAGAAAATATTGGTATAGATATTAAAA
+AAAATACTATATATAAATTATATCCAGATAGCGAAATAAAGAAACCATTGTCAAAGATTC
+TACACGATTTGATAAATAAAACAATTGTAGTAACAGATGTTTATACTAAAAATGATAGAT
+TGGATTATATAGAAACTTTTAATAGCAACTCACTACCTAATTATGCAAATAAATTAAATA
+AACCAGTTGAAATATTATCTAATTTAAATCTTATCAATTTACCTTTACAAACAACTATTG
+ATAATAACTCTAATAATGATAATAGTGCTAATACCGATAATATTAACTCTAACAATATCA
+ATAATAGTGCTACTACTAATAATACTAGTAATAATACTAGTAATAATACTAGTAATACTA
+ATAATATCGCTAATATTGATAATAATAACTCTAGCAATATCAATAATAGCACTAATAATA
+ATAATAATAATAATAACAATACCGGTAATAGTAGCTCTATCAAATCTACTTCTCCAAAAA
+GAGATAATAAAGATATTAATAAAAGAAAAGCTCTAATTCCAAGTACATTTCATGTTAAAA
+TAACTGTACCAAGAATACAACAAATTTATAAAGAATTAAAAAAATTAGATGTATCTGATT
+TTCCTAATTCAACCTCAGTTCTTTTTAGAGTATTTTTAGAATTAGTTGTAGATGAATATA
+TAGAAAAGCTTAATTTAACTGGACTTTCAAATAACGATAAACTCAATAAGAAAGTACAAG
+CTTGCATTGATGATTTAAAAAGTAAAAATTTAATTGATAAAAACAAAGTAAAACCTATTA
+ATGTAGCAATATCTAATCATGATAGTCTATTTTCAATAAATACATTTAATAGTTATGTTC
+ATAATAAACATATGCTACCTGATGCAACTAATTTAAAAAACACTTGGAATCAATTTGAAT
+ATTTTATTTTAGTTTTATTAAATTCAATCACAAAATAATTTATGGCCAAAGTTTTATTTT
+TATGATAGACTTATATTGTAATTAAATGACTAAGGAGTTTACTTTATGAGCCTAAAAAAT
+TATTCACCTCTAAGATACCCAGGTGGAAAAAATAAGTTATCAAAATATGTAGGTAATTTA
+ATAAAATTAAATGATTTAAATGGTCATACATATGTTGAACCATTTGCTGGTGGAGCTGCT
+GTTGGTTTATATTTATTAATTAATGGTCATGTTGATAATATAATAATAAATGATTATGAT
+AGATCAATTTATGCATTTTGGCGTTGTGTATTGTCATACCCAAATAAATTTTGTGAATTG
+ATAAAAAATACTCCAATAACAATGGATGAATGGTACAAACAAAAAGAAATTCAAAACAAT
+AAAAAAAATGCTAGAATTTTAGAATTAGGTTTTTCAACCTTTTTTCTTAATAGAACTAAT
+CGTTCAGGTATTATAAAAGCAGGTGTTATAGGTGGCTATAATCAAAATGGAAACTACAAA
+ATGGATTGTAGATTTAATAAAGAAGATTTAATAGAACGTATAAAATTAATTTCTCGTTAT
+AAAAGACATATTAAACTTTATAATTATGATGCTATTGAATTAATTGATAAAATTATTAAA
+CCAAACTCTGATAAAACTTTTACATTTTTTGATCCACCTTATTATAATCAAGGTTCAAAT
+CTATATGTAAATTTTTACAAACATCAAGATCATGTGAATTTAGCAAATAAAATTAAAGAA
+TTAGATCATACTCACAAATGGATTGTTACATATGACAACACTCCTGAGATTTTTAATATC
+TATAATGATTTTTCTTTTATTCAATATCCATTAAAATATACTGTTGAAAGAAAATATTAT
+GGTGTTGAAGTTTTATTTTATTCAAAATCAACTATTATAAATGCATTTGATAAGAACTAG
+ACAACTTTAATCTAGTTCTTATTTTCACAGTTTATAAGAACATATGTTCGACCTTTAAGT
+AAATAGATGCTATAATTATCCTGTAAATAAATAAAATGGATGGTGGAACTAATGAAAAGT
+TTAAGTGATATTTATAGTGTAATTGAAGATGAAAACATAGAATTAGAAGAAGTTTATTTT
+AAGTCATCTAATATCGAAGGTATATATTTTAAAGTATCAGGAATGAATCCTATAATTGGA
+ATACATAAAAATTTACTTACTGATACTAGAAAATATATATCTGTGTTAGCTGAGGAACTT
+GGCCATCACTTTACCTCCTCAGGCAATTTAACATCTGAATGTATAACTTACTCTGATAAA
+ATTAATAGAAGTAAGCAAGAAAAGAAGGCTAGAATGTGGGCTGCTAACTATTTAGTTTCT
+GATGAAGAAATAATTGAAGCTTTATTACACATATCTGGTACTTTAAGTGGATTGGCTCTC
+CATTTTAATGTTACTGAAGAAATTATAAAATATAAGTTATTATCACTCTACCTAAAAGAA
+GATAAGTTTAGGATATCTAAATTAATGATTATGGAAGATGAAATAATTTATAATTCTTGT
+TCTGTTTAATGGAGGTCTATTATGAAAAAAGTTGCTATTTATTCAAGAAAATCTGTTTTA
+GTTGAAGGATCAGTATCAATAGAAACTCAGATTAATATGTGTAAAGATTATATAAATAAT
+AAATTTCCTAATGCTAAATTTAAAGTTTTTGAAGATGAAGGTTTTTCAGGTGGAAATACT
+AATAGACCTGCCTTTCAAAAAATGCTTAGAATGGCTCAACTAAATGAAATTGATATAGTT
+GTTTGTTACAAAGTAGATAGAATTGCTAGAAACACTTTAGACTTCTTAAAAATATTAGAA
+CTATTTAAAGAAAATAATGTTGAACTTATTTCTATAAGTGAAGGTTTTGACCCCAATACT
+CAAATGGGAAAAGTTATGTTGACACTATTAGCTAGTTTTGCTGAAATGGAGAGAACTAAT
+ATTCAACAAAGAGTAAAAGATAATTTATTATCTATAGCTAAAAAAGGCAAATGGACTGGT
+GGCTCCCCTCCTACTGGATTTAAAAATGGTTTAAATGGTGGACTTGAATGGAATAAACAA
+GATATGATTTTAGATGTTTTTAATATGAAATATGAGAAAGAAAAAAACTCTAATATTATT
+AAATATATAAAAGAAAAATATAATCATAATTTTCTTGGGGGAACTTTAGCTACCACATTA
+AGAAAACCTATATATGTTAAAAGCTCTCCCTCTGTATCTTTATACTTAAAGACTAAAGGA
+TATATAGTTCAAGGTGATGAAGATAATATACATTCCTATCTAACATATACAGATAAAGAA
+ACTAAATATGCTATTGTTAGTGATATAGTTGGATTAATAGAGCCTTCTATTTGGATTTCT
+ATAAATAAAGATATGGATAAAAATATATCAAGAGAAGGTAATAGATTTAGTGAGAAATTT
+TGGCTTACTAAAACAGTTAGATGTAAGTATTGTGGTCAAACATTTTGTGGACAAACCAAA
+ACAACTAAAACCAAACATTATAATAAACATGGTGAAGAAAAAATATATATTTCTACTTAT
+AGTTATTATTCTTGTAGGGATGCTGTTCGTGGTAAATTAAAAACTTGTACGAATACTAAA
+AGAGTTAAACAAGAAATATTAGAATTTAAGGTATCTGAACTTATACATTTGCTTAAAGAT
+AAAAAAACATTTAATTCTTCATATTTTTCTAATAAAATAGATAATTCTTCTAAAATAGAT
+ACTATAAAAAAACAAATAAAAAGTATTGATAAAACTATAAATAATCTTACTGACAAAATA
+GCTCTACTAAGTAATGAAGCTTCCCTTATTTTTATATCTAAATTAGAAGAATTAGTAAAA
+GAAAAATCTATATTAAAAGATAATTTGCTACAACTAGAATTACAAGAGCTTAATTCAAAT
+ACTAAAAAAGATAGCTCATTAGTCTATAATAATATACTTGCATTTAATGATGATCTTAGT
+GTAGATGACAAAAGAAAAATAGCTATGAGTTTATTTAAAGAAATTATATATGATCCTGAA
+ACTGATTCTTTAGATGTTACTTTCATGTAACATCTATTTTTGTCTAAATAAACATTGGAG
+AACATCCACCACGAATATATCCAGTATATTTCATTATATCCTTAACTGCTATCATTTCAA
+CTTTCTTTTCTCCAGCTATCTTAGCAGCATTTTTTAAATCTAATTCTTCTGCAACTGGTA
+TAACAAAAACATATAACTCTTTGCTTGTTCCTTGAGCTACTAAGGTTTTAAATACATTTT
+TCTCATCTACTCCAATTTTATGAGCTACAGATATTCCATCTATCTTTCCATCTTCGCTTT
+CATAACTTAACATTTCATATGAAACCTTTTTAGAATCTAATATTCTCATAGCATTTGTCT
+TAAGCTTCTTATCTTTTGCCATAATTTTCACCTCTTAAACTTAAATCATTTATAATTATA
+CAATAAAATTCTTTAAAAACTAAGCTTAACTTAATATTATCTCAGATGAAGTTAATATAA
+ATTAAGATATTTTGTGTCCATATTTTCAGTATATAATATCAAATCTTATTGAACCAAAAT
+TCTAGATTAATGGTAAAATACACTAATTATAAACTCTTAAATCTAGTAAGATTATAAAGA
+TTCTATATAAATAATTTAGAAGATAAAACACAAACTCATCTAGCCAAAGCTAAATTACTT
+AAGCTAAATAATTATCTAGATTTATTCTACTTATTTACTTCAAGGTGGTCATTTATGTCA
+TTCCTTTTCTACACATATATAATAAAAATGCTTTCATAATAAATTTATTATAAAAGCATT
+TCTTTTTATTTGTTTAAATCTTCAAATATAGCTTTATCATTATTTGAAAATTTGTTTAAA
+TCATTCGATTGTATAAGATTCCCATTGGCATAGTTTAATTTAGTATAACCTTTTTCTCCT
+ATAGTATAAACATATGGTTCTATTTCTTTATAATTTGATATAATATCAATAGCGTCCTGA
+TTTTTAGTATCATACAAATCTAATTTTTTATTGAAATTTTCATCAGAAAATTTATAGATG
+GCAAACTGTCCATCTACACCAAAGGATTCCATAGTATCTCTATCTCCTGTAGAAGAGTAT
+CTAGATGCTTCGTTATTATTTCCACAACCTAGAAATAAAAGAGCAAAGCTTAAAGCTATA
+AATATTAAAGAGACTTTTTTCAT
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_009012.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3000 @@
+>NC_009012.1|provirus_1938476_1983993
+TTACGAGCAGGAATTATCGTAACATTCCTGGTTGTCATCTAAAATCACCTCGCTCTTGAT
+AAGACTATAAGCATACTCTGCCTGCTGAAATGGATCATCGTATAGATTATCTGGCATTGA
+AGCATGAAACCTAAAATTCAGGCATTTCTTTTCATTTCCTTTATGTTCATAAATCCTGCC
+AAGCGCCTCAGCTCGTCTGCGTCTTTCAAGTTGTGCTTTTTCGAATGTGTCCCTGCTGAT
+AATTGGCGGATAGAATTTATCCTCAACATACCGTTTATCTGAAAGCATTCTTGCAATAGA
+TGTGTGGTAACGCTTAATGCCCGCTTTTTGAGCCGCCTCGGCTAAAGAAAGCCCGGAAAG
+ATAAGCCTCAAATAGTTTCTTAATTTTAACTGCTTCCTCTTCATTAACGACAGCCCTGCC
+GTTTTGAATGGTATATCCAAAAGGTATATGGCTCATCATTTCATCAACCTTTCCCTCAAG
+TTCAACCCGCATTTCATTTTGAAACCTATTTCCTCCTGTGAAAACACAATGATTTCTTCA
+ATAAAGTTCTCAAATATATCGCTATCAAATGCATCAATCTGCTTTTCAGCCTTCGTTGCA
+AATTTAAAAAGCTTTTCTACCTCAACAAGAGTAGTCATGCCTCCATCGATTACGCGTTTT
+AATGCTTCTCTTTGTTCTTTTAATAAAGCCGCTTCTTTGAGCAGCTCATTTTTCTGTGTA
+TTAAAAAGAGCGGGTTCCAGGTATCCTTTGGCCATAAGTCCCATAATCACCTGAACTTGC
+TCTGTATTTTCTTTGATTTTAGTTTCCAGTTCCTGAATCTTAGTTATGTTATCTGAGTAA
+TTTGTTTTCTTTAAGCTTTGCAGCAATGGCCTTAGAATGAACTTATGTCCGAAAATAAGC
+TTATTGATCATTACAACGAAGGCCTGATGGATCGCATCCTCTCTGACAAACTTCATGGAA
+CAGCTTGATGCGTCCTTTATATGCTTTGTGCAGCACCAGGCAATGTATTTATGATTACCA
+CTGCCATGAATTCGACGCTTAAAACTGCTGCCACATTCTGCGCATTTGATTTTCCCCGAG
+AAAGGGTAGCGGTTTTGATATTTACTGCTTCCCTTGATTACGCCTTTTTCTTTACCTCTT
+TGCTTCAATATTTCTTTGACGGCTTCAAATTCCTCATGGGATATAATGGCTTCATGATGA
+TCTTTTATCATGTATTGATCTTTTTCCCCATGATTATAATGCCGTTTAAAATTCTCATCT
+GTATAGGTCTTTTGCAGAAGGACATCCCCAGTATATTTTTCATTGCTTAAAATGCCGCGG
+ATAGTTGTCGCTGTCCAGTGTGAACCTCTCTTTGTTGGGATTTTATCCGAATTTAGCCCA
+TCTGCAATTTTCTGTGTGCCTTTACCGTCCAAAGCCTCGGAAAAAATCCGCTTTACGATT
+TCAGCCTGTTCTTTATTGATAAATAGCTTTCCATCCACATAATCGTAACCATAGGGAGGA
+TACGAAATTTTGTATGTTCCGTTTTGGAACCTACGTCTGATAGACCACTTACTATTTTCT
+GCAATGGATAATGACTCGTTTTCTGCAAGACTGCTCAAAATTGTCAGCACCAATTCGCCT
+TCCATGCGCTGTGTGTTTATATTCTCTTTCTCGAAATAGATGAAAACACCGAGATCGGTA
+AGTTTTCTCACCATCTCAATACAGTCGGTTGTGTTTCTGGCAAATCTGCTGACCGACTTG
+GTTATAATAAAGTCAATTTTCTTGTTTTCACAATCTGCAAGCAGCCTTAAAAGTCCAGTC
+CGATTCTCCTTTTTTGTGCCTGATATGCCTTCATCATAGTAAATCCCTGCAAATTCCCAA
+TCAGGATTTGCTTTTATATAGGATTCATAATGGTCTTTTTGTGCTTCCAGGGTTGCCATT
+TGTTCATCACTGTCTGTTGAAACCCTGCAATAAGCCGCTACCCTCACCTTTGGCTTGAAA
+GCTTGGAGAGCATTGTTCCCATCAATCCTCGTTACCTTTCTCACTGTTTTCACCTCCTTT
+GGGTATGTGACATGTTACCTCTTTGTGCCGCTAATAGCAAGCCAATTAGGCCATAAGCTG
+TGCATACATCGGCGAGAAAGTTTTGCGGTTCAACTTGTCGATTTTGTTGAATTCTTCTTC
+TGAAATCAGTCCCGCCTTAAGCATCCTCTGCAGAATTTTGTACGCCCGCCAGTAATCAAC
+CTCTCTTTGAATTTCCTCCTGTGTTATCTTTGTATAGTTCGTTTCCTGCGGGTTATATGG
+TATATGATTAGCCGTCTCTATCATTCAAGAAAGCACCTCCTATAAAAACTTAGGACAGCC
+GCGATTGGCTGTCCTTTATCGTTATTCCGGCAATTTCAGAACTTGTCCGGGGTAAATAGT
+ATCTGAAGTCAGGCCATTGAGTTTCTTAATCTCCGGATATCTTGTTCCTCTACCAAGTTC
+TTTTTCCGCTATTCTCCATAAGGTATCGCCTTTTTGCACTGTATAGGTTCTATTGCCCTT
+GTTATCAGGAATGCTGTTTACAATTACAAGGTTTTCTTTTGCTACCCAAGTGTTTATGCC
+TGCGATTTCTTGACCGCCGGATTTCTTAACCTTTTTGCCAAGCAATACACATTCTTTGCC
+GCCTTTTATGACCGGCTTGCCTTTGTATAAAGTCTGTGTGACCCTGTGGTAATAGTCATT
+TTTGACCCACGTTGGAACTTCCACACTGCCGGGGTAGTAATTCTTTACACTGACCTTAAA
+CTCCACCATATCTCCAATTCCAATATCAGTATTGTTATCTGTACTGTTCTCCAGCGCTTT
+TTTCACTGCTTTTCGGAAAGTGTCCATATTCTCCCCATGCTTGGGGAACCAGTGCATCAC
+ATCAGCATGGTTGCTGGCAATACCGAGCTTGTATCCTTCGGAGTGGCAGATGATGTCATT
+CTCGTCAAGTCCGTACTCCCTGCAGAGCATAACGCAGAGTTCAACCGCATTCTGCCACGC
+TTTAAAGAAATAATCTTCCTGCTTTGCTGCATCATAACCCACCATCACCGACCCGGATTT
+ATACGAAAACCCAGCAGGCTCACAGATTTCAAAGCCAATATGGGTATTGTTTGCTGCTCC
+TCCCGCATGCCACCCGCGATGATCCCAAGGCAGGTATTGCCAAACCTCTTTATCGTCTAC
+AAAAGCGTGAACACATACCTGCCTATTTATTTCGCCGGCCTTGTAAGATTTGTTCCAACG
+GGAAAACCACTCAGCCGCCATTACACCCGGCACAGCCGTCGAATGTACCATGATTCCTTT
+AGGCGTGATTTTCCGACCTGCTGTATAGCAATCGTTTCGCGTCATGTATTTTGTAAAAAG
+CTTCATTTCTTTTCATCCTCCTCATTTGAGTGGCCATGCAGTTGTTCCAATGCGTTCTTC
+AGCTTTTCAGGAATGGGCAGTCCTATATGTGCTGCATTCTCAAGAATTGAAATTCCCTCG
+TTACTCAGGTAAAAGAAAATCACCGCTGTCCGGATTGCCCCTCCGTTGCCGAGAACCTGG
+CTGTCGATTATGTGTCCCACACCCACAAGTACAAATATAAGCACTTTCTTAAAGATGCCC
+TTGGCTCCGACTTCACTCGAAAGCTTTCTGTCTACAACGGCACACATCACTCCGGTCACA
+TAGTCAATGGCTACAAAAGCGATGAGTGCATATAAAAATCCATCCAGCCCTCCAAGAAAC
+CAGCCAAGAAATCCGCCAATAGCAGTAAAAACCGCCTGCGCCCAGTTCCATACTGTTTTC
+ATTGTCTTAAACCTCCGTTCAACTTGAGTTTTGCATATAAAAAAGCGCCCTGCCTTAAAG
+CAAAGCGCTGAAAATTAAAACTTCTAATCTATATTTGCTTCGGAAGCGCCTCCCACAACC
+GCATATCCTCCTGCCCAAGAGACCAGATGGCTATACCTCGCAGTTTCCATCGATAAGCCG
+CTTCGTTTGCCCAGTAAACAAGGCTGTCCACATCCTGATAATACAGAATAGAAAAACCAT
+CTGCATCTCCGAGGAAGAGACGGGATATCCAGATATTGATGTCTTTCAGTATAATCTTTA
+CTTCATAGTCATTACCGCAAGAAAGAGCCAAAAGTTGTGAGTGGAAGAAGTCATAGTCCA
+TCGAAATGTCCTCACTGCGAGTTATCGATTCCTCCACATCGTTATTTACTGAAAACACCT
+GAAATTCATCATCCCACGTGACACCAGTGCGAGCAAGCCTGCCAAAGCTGGTTATATTTC
+CATCCGGAAGTTCCACATCAAAACGCTCGTATGGTTCATATACCCATGCATCGCCCAGTC
+GCAGCAGCTCGCATACCGTCCGGTTGTCCGAGCAGTAACCTACATAACCACTACCACCGG
+TTACATTCACTGTGAAGCGCAGGGTTGAAGCTGCACCTGAATATACTCTTACCTTATTGC
+CGCGTTTTCGCATCTCTATAGTATACATATTCGGATTAGCACGAAGATCGGCATCTACAG
+TTTTTGAGAAACTGGTGGAATAGCTACCAAGCAAGGAATTACCTTGATAAAGCTCGACTC
+TTTGCGTGTCATAATTTAAGCAGCAGAAAATATCCCCAAGGAACACCCCAGCCCGTCCAC
+TGCTATTTTGAGGGAAAGCCAGCCTTGCCCGGATATGAATATCGGAAAACCCGTCGTATT
+TCCATGCAAGTTTGCCATATCCCTCGAGCTGGGAATATGGACGGTTTTCTGTGCTGTCTG
+GGTCTTGCCAAACATCCCATTCGCCATCCAGCACAGTCCAGTAGTTTTCAGGCAGGATGT
+TCCTGTCTCGAAAATCCTCATACCAAATAAGCGCCGAGTCGGGTTTTCTTCGCAACATTT
+CAAAGGTCAGTTTAAAACCTCGATCCGGCTCAACCATCACACCATTTACATCCTTGAACC
+GACGAGGAGAGAGCATAAAGCTGGCTTCACCGGCAAAGGGATACTCCGAAAATCCACTGC
+AAACCCTAAAACCGTAAAACTGGACTCCCGGCACACCACCGCTTATGCTGATAGCATGCG
+TTCCCTCTTGGAGAAATACACCTTTTGCAAGTGTCAACCAGCAAACTCTTCTCCAGTATG
+GCCACCATAAACGGTTCTCGCTGAAAGTCTTTGATATACCATCAAGGGAAACAATAATCG
+CATTTTTGTCCCAGTAAGGAAAGCAAAGCTGTACTGCAATATCGTAATATCCCGCTTCTC
+TTATCTCAAAACGGTACTCTGCTGACGCCTGGGCATCTCCCAGTGAGGTCATCTCATCAG
+TAATAATGACATTTCCTTCGTATTCATCCGGAACTCCGTTCCTGTCAATATAAATGGTTC
+CGAACTCCGCTTTCTGCTCCTTGCCATAGCTTGTCAAATATCTTCGCCTGTTGTAAACCC
+CTTTTAGCAGCGGATATTCCCAGGATACAGCATCCCATCCTTCCATATAGTCATATACAT
+GAGGAAGAGCCCAAGGTACTTTGTTATAGTCATCCCAGTAAGCCACAATTGGAATAAACG
+GCTGGGGCGGTGCATCACCTGTGAAATTGTAAACCCCAGTCATCCAGTATTTAGCCGCAT
+AGTAGGTATTAGACACTCCTCGATAGGTTATTCCGAGGTTTTCAGGCGTATCATGGATCC
+TCCAGTTCCAGCCATAAGCAGGCAAACCCATGAATATCTTGTCCGGCGACATAACGGAAA
+CAGCATAATCATATATGCCCTCAAGCCAGTCACGGGGAGATACCGGACCGGGAGCAGAAC
+CCGCCCATGCCATGCCGTAGCTCATGATGGCGGCGGTATCGCAATAGTCGTTAAGATCGG
+CATAAACACACCAGTTTTCACCGCCCACCGAGCCTTGAACACCGATCATACCCGGCAGGC
+AGATGTTGACAAGCTTTGTTGCATCATAAGACTTAACTGTATTGTATATATCCCTAAATA
+GTGCATTCGCCGCATCCTTGTTTTCATAACCGCCGCCGCGCTCCAGGTCAATATCTACCC
+CAGCGCACCATGGATACTTGTTCATTATTCGGATGATTTCAGTGAGAAACTTATCCTTTG
+CACCGTTTTCGTTGTTGCGAAGTGCAGTAAAAATATTGGCTATTCCATGATTCATAATAG
+TGAGCAGCCACTTAATGTGCGGCCATTTCTGAATATACGGAAGCATGCTGCTGATGCTGG
+TACCGGTTTCAGTGATTGTGCCTGTTTCGTCAACCTCAAAAGTAAAAATGCCTACCGTAT
+CAAAGCGGTCGCCGTAGTCTCTAAGTGCTTCATACATTCGGGCATTTCCCATAAAACTCC
+ACACCATGCACCGCTTACCTTTTAAATAATCCCTCACAACCGGTCACCGCCTTCTTGCAT
+CTCCTGAAATTCAAAGAGCACCCGCGCCGATTTTCTCTCTTCCAGCTTCACCATATGTTT
+GCTATCCCATGCCGCAGAGTATTGATAAAATCCATCCTTACGAGTAGGGCTTCCGTTTTT
+AAGGCATTGACGGGTGGAAGCCTTGAGCGCCAGCTCATCGCCTGCATTAACCGGGTCAAG
+AAACTTTACCTTATGCGCACCTACACCTTGGGATAGTTCAATACTCCCTGCGGCCATATA
+CTGTATAGGATAGATATAACAGTCAAGACCAGCAGAAGTTTTGCCAAGGTTGAATAAGAC
+TACAGTCTCCGCTGTTCGCACCACACCGTTATAATGCCGGGGCGGAACTGGCTGCCCGTT
+TTCCTGCATTTTCTTTAGCATTTTGCTCGTGTGGACGGTATAACCTGTTAATTGATCTCC
+TTCCTGAAACTGCAAGTCGGTGAAATAGATTGTTCCGGTGCAGTCGGAAATCTTGAGTGT
+CACAGTAACGCCCACCACATGTTTATTGCTTTTTGGTTGTATGGTTTCCGCAAACCTTGA
+AAACTGCATCCATTTCACCTACCCGTCCAATGTCCACTGTATTTCGCATACATGCCCGAT
+CCATCCGGTAGTAACCGCGCCACCTTGAAGCAATAAGTCTGTAAAGTACACTGTGCCGGT
+GCAGTCAGTGACACACAGCCTGATGGTGATAGATTTGACTCTGCTGATACTTTTGGGATA
+AATACTGTATGCAATCTGATTGAAATATGCCATATCATCACCCTCAAATCAGGTCTATAA
+ATCTTGTTTCTGTTGTACCGTCCTCGTATTCAATGACTATCTCAACACCAACTTGGCCGT
+TTTCACCCTTTTCGAGGCTTTCGGAAGCAATTTGTGCTGAAAAAGTGTAGCTTTTACGCG
+TTGCTGGATATACCGTCTGTGAAAGGCTCTTTTTCATACCAGGTACACCGACAGCCTTGA
+AGGAAGCAGTTCCCGAAACACCATTTTCAGTATCCACTTCAAAACCGGAATTGACCCAGT
+AGGCAAAACCATCATCCGCTCTGGAATTGCGCAGATGGTTGAATGGTACCATATCTTTAA
+TTTCCTGACGGTTTATCAACTCTGCTGAGGACAGCGCATCCGCTGCCTTGTCCCACTGTG
+CTGAAGAATCGCCAAGTTCCCGCAGTTTAGTTGAAAGCTCAATCACTGTTTTCCATGGTT
+CCTGCAAGTTATACTGCCTTCTCACAACACGAGTCTTTACCAAAAGGCCTAGTTCTTTAT
+CGTCCACTGTAACAATATCACCCAGTTTCCATGCTTCGTGCTCATAACCGGTTAGCGCAG
+ATAAATCCATTGCCGACAGCACATAAGAGACGCGAGGCTTCGAATATTCTGCAAGCCGCA
+TTTTTGCATATTCCAGCATCTGATACGGATTTGTAAACGACGAACAATCAAGCGTCGACA
+CCCTCACTTCACTGGAAAAAGTGTAATCTTCCACGTATTCCTTACCTCCATTAATTGAAG
+CGAAGGTCAATCCGTCCTTTCCATAAGCATAGAGCTTTGTCACTAATTCACGTGTATCGA
+CTACCCGCTGAATACTTTTCAAATTCTTTCTATATGAAAAAAGCGCTCCGCTATCAGTAC
+CACTAAAAGTCAAAAGGTGTACCTGGCGGTTGGCGCTGTCAAACACCAGATCGCCGCCAT
+AAATATTCTGTACGGTGCGAAGGATGGATAAGGCATTTTTTTCTGTACACTGCCATGTCC
+GTTTCGTAGTGACAGTAACATTTCCTACTGTCCAGCCTGTACCCAAAAGTGCATATTGCA
+TCGGAACATCTGCAGTATCTGCATTGAATTCTCTAGGTTCTTTTTCCGCACTGAAAGACA
+GATCGTAAAATACCGCTTCAGCATATACTTGCGTGATAACACGCCCATCTTCGCCTTTAT
+TGTCCGTTAAGGTTCGGATCCGGTAAATGTCATTTACGATTTGCACTTGTTTTTCATTTT
+CCAGTGTGCTTCTTTTTGGATCATGGAACGGAAGCTTGAATTCCAGCGTATCCGCGCCGT
+TCACCTCACCAGTGACAATGATATCAAAGGCATTTTCAAGAACAGCTTCCCATGCTCCGT
+TTTTGTCCAAAATCACAGGACGGGCAAAGCCTAATTTCTCATAGGGCGCTTTCGGTATAT
+CATGAAGCTGTATTTCCAGAAGTTTTGGCGTCTTCAACGGATCGCTGCTGGTAAGGGTAA
+CACGGAACCTTATATATTGCCGATTTGGCGATTGAAGTTCACCGCTGGTTCCCACAGCCT
+GCCATGCAGACCATTCTTCAAGATCATCGCTTGTGCTGGTCTCTACTAGAGACACTGAAG
+TAACACCTGCAGTATATTCGCTTGTCACAGCTACACGACCGCTGCCCGATAATGCACATG
+GAACCGCCCTTGTATAAAGTACGCCACTTGCAGGATACTCGCCATCTGTTGCTTTAAGGG
+TGACTGCGCCAGGCTCTGCCAAAGCATCTACATCCGAAGCCGCATCCCCACCGTTTGCTT
+GTAAAGACGACTTAAAATATAACAGCAAATCATCAGCTGTAAGCTGTGAGTCCGTTTCCA
+GAAACCAGTCGTCGAAGCCTCCGGCATAGTAGTAGGTATTTGCATGCATCCCCATAATAA
+TGTCTGCTATACATTCCCGATTCAGCTCTCCCGAAAAGGAACGCACAGGTGACACCCAGG
+TTGCCCCGTCGCTGCGATCGCATATGATGTTCTGCACCTTTTTGTTGTTTACTTCAATGA
+TGGAGGCGATAAAGTACCAGCCGCCGTTTTTTAAGGTAATGGTAGCTGTTTCACTCTGGT
+CGTAGATTAGTGTGCCGGAGGAGTTATACAACATCAGCCTAAGTCTTCCTTGATAAAGTG
+AAACATAAAGAATTGGCTGACCAGGTCCTTGGCGGGTATTGAATATGGATATATATGTCT
+GGCCGACCGAATAGGTGGTAGGATTAATCCAACCGCCTACAACAATCTTTTCGCCCAGAT
+TGCTAAAGAAACTCCCATCATTTTCTGCTATAAGATGGGTCTTTTCAGAAGTCGGATTAA
+CAATATTTTGCCTAAAGTATCTTCCGAATCTTCCAGCAATAAGGTTTGCCGATGTCCCTG
+ACCAGCCGGAGATGGTAAAATGTCTGCCATGTCCCGATGAATCCATAAGCAGAAGATTTT
+CGTCTGGTGTTTTTTCATTAAATCGCCATAAAGCAGACGTCCTTGATGTTACAGGAAACT
+CACCGGTAAAATCCTCTTGGCTCGTTAGAATTGATTTTATCGCCATGTTATCACCTCCAT
+CTGCTTTTTGCCTGTATTTTTAACTCAGTAAAGGTCGCGTTTTCTGCGGCAATCTCAATA
+TGATTAACACCTTTCCTGAGAATTGGAAAATTCAGATCCTGCAGGCTGGGAAGACCATTT
+CTCAAGGTTCGGCCTGTTTCATCAATAACCTTAGCTGTTACCATGCCGGAGTCGACAATC
+AGAGTTTCACCTTCAGATAATGAGCCAACAATTCTCAATTCCTCGCCGTTTGTAATAAGC
+GAAATATAGCTTGATGAGGACGTTGATATCAAACCCTTCAAGAGATAAACCGGATTGGAA
+TCCGCATTTCCTTTAACCCTCTCCAATTCATGCAGACCTGTTTCAGAAAGAACAAATATC
+TCATCTTCCAACGCGTAAACATACGGGTCGGGACAAACAAACCGAAGTTCAAAGCTGCCC
+GCTGTCCGCAATATCCGCTCACAGTCAACCGCTTCTGATAAGCGAGCCATGAAATATCGG
+TCGGGCAAATCATCTATAACAAGTTGCTTAAGCCCGTTTTCCGGATTTAACCATTCTGCA
+ACATTATCAAGAACCGATACAAGCTCAGCAAAACTGCGCTGGGGAAGCACACTACAGCTA
+ATTATTATGTTTCGTTCTGATATATCGCAGCCAAAATCTGCAATACCTGCTTTGCCCGGC
+ACAGTTTCAAAGGAATTGCGCAGGGCAGGGGAGACCTGCCATTTAGTAAGTCTTGCTCGT
+ATTTTCATACTTTGCGACGATATTCCATTGTAGATAAATCCCATATGCTTCCCTCCATTA
+CGCTGTTATAAAACGTCCCTGCGCCCTTGAACCTGTCTGCATCAGGTTATATAACTCCTG
+TGAAATCCTACGTATGTCTTCTTCACCACGAACAATCATCTGCTGCACCACAACAAGCGG
+CCCAGAAGCTAAACCGCTAAATTCACCTCTTCCACTTACATTAATATCAGGAGATATATT
+AAAATCTGTCGGCACTGCATTTTGCATATCGTCTGCCACTCTGGCCATAGCCTTGTCAAA
+TCCCTCACCAATACCCAGTGCCATATTGCCGCCAATGCCTTCAAAAACAGTGGACGGAGA
+TCTGATTCCAAGAAAATTCTTTACTCCATCAACAATACCGGAAAAGAAACCGGAAACCTT
+ATCCTTAATCCAGCTACCAAGGCTTTTAATACCTTCCCAGATGCCTTTTACAATGTTCTT
+ACCAATCTCAACTACTGAAACAACCGCCTTGCCCAAACCTTCAATAATTGCCGCAACAAT
+CTGAGGTAAAGACTTTACTAGTTCTGGAATGGCTTTCACAAGCCCGGCAGCAAGATGTAC
+GATAAGCGTAATTCCCAATTCTATGATCTTCGGCATATTGTTCGTCACAAAGTCAATGAT
+TGTTGTAATTATCCTCGGCAGTGCTTCAATTAGTTCTGGCAATGCATTTAAAAGTCCCTG
+CGCCAACCCCTGTATGATCTGAAACGCTGCGTCAAGAATTTTATCCATATTGTCAAGAAG
+TACCTCGGCAATGAGGATAATGGCTTCGACAACAGCGGGTATCAGCTCCGGAAGCGCCTC
+CCCGATACCGGACGCCAGTGTGGCAATCATTTGCACCGCGGCTTCCACCAAAGCGGGAAG
+GTTGTCAATAATTCCCTGCACCAGCGCCATAACAAGCTGCAAAGCACCGTCGGTTATCTG
+CGGCAGTGCATCGATTAAAGCCTGCAGCAGCGTCATGACAATCCGCACCGCCGCGTCGAT
+AATAACCGGCAGATTGTCCACAATAGCCCCGCCGATGGAGGTGACGATATCCAATCCTAC
+CTGGATAAGCTTCGGCAGGTTTTCCATCAGCATGTTTACAAGGCTTCCCACCGTATTGCC
+GATGACCCCGCTGATCTTCGTCCAGTCTCCGTTTGCTTCAGATAATCCACGAGTAAATTC
+CCCGAGAAGCACAACCCCGTCGTCGGCCAATATCTGAAGCTGGGGAAGCAGCACGGTGCC
+CAGCATGTTTTTGGCCGCCGCGCCGCCCGCCTTGAGCCGCTGGATGCTGTCGTCAAATTT
+CCCGAGAGCGTTCAATGAATCCTCGCTCATCACTGCGCCCATGCGCTTTGCTTCCTCGGT
+CAGCTCCGCTATCCCTGCCGAACCCTGCGCAATCAGGGGATTGAGTTCCTGTGCGGACTT
+TCCGAAAATCTGCATGGCCAGCGCGTCACGCTCAGTTTCGTTGGACACCTTGCCAAGTGC
+GTCTATGGTTTCCCAGTATACGGCTTCGCTGTCGCGCAGGTTGCCGTTGGCGTCCGTGAC
+CGAAACGCCGAGCTTCCGGTAAGCGTCCGCGATCTCACCGGTGCCTTTCCGTGCTGAAGA
+CATGGATCTGACGTTCCTTGCCATGCTGCCGGTTAAAGTATCTAAGGAGACATCCACAAG
+CTCCGCGGCGTATTTATACGCCTGCAGGCTGTCGGTGGACATGCCGGTTACGGTCGAGGC
+GGTAAGGATTTCATCGGCATAGGCCGCCGAATTTACCGACATATCCACAAGAGCTTTTCC
+CGCACCGACCGCTGCTGTACCAATAGCGGCCAGGGCTGCTCCCATGGCCACACCGATACC
+TTTCAATACACCTCCCAGTTTTTCAAAGCGCCCGCCTGCGTCATCCGCCTGATCCGCGGC
+CTTTTTAATTTCTCTGCCAAATTCGCCCGCCTGTTTTTCCGCTTCGTCAAACTCTTTTCC
+CGCATTGTCCAGCGCTTTGTTGTTCGCTTCCAGCTCGCGCTCCATTTTGTTCAGCTCTGC
+TTTGGCGTTGTTAAGCTGTATCTGCCAGGACTGCGTCCGCTTGTCGGTCTCCCCGAAAGA
+GGAGGCGGCGTTGGCAAGCGCTTTCTCCAAAGTAGCAATTTTTTCTTTCTGCAATTCGAT
+TTCTTTATTCAGCACCTTGTTTCTTGCAGTAACAGCTTCAACTGATTTATCTTGCTTATC
+AAACTGAGATGCAACCAGGTTCATCTCGCTGCCCAGTACCTTAAAACTTTGGTTGATCTC
+ACGAATGGCGTTCTTAAATTCCTTTTCGCCTTCAATCCCAATCTTCAAGCCAAAATTGTC
+TGCCACATAACCGCCTCCTTTCGAGTAAAAATTAAAAAATTATAAAAGGCTATTGTATTT
+CAATGCGGTTTGGCATATACTAATAGTAGGGAAAGTAGGGAATTTCCTGCTTTTCAAATC
+CTAAAAAGGAGGACTTAGCATGAACGTTCCCATAGTTGATAATGCAAAGGTAATGGCAAA
+AGGCCAGATCACGCTGCCAAAAGATATCCGCTCCAAACTTCGCCTTTCCACCGGAGACCG
+CGTCACCCTCATTTGCGAGGAAGACCGGGTTATCCTTATGAACTCCGCTGTCTACGCCAT
+GAAAATGCTACAGAAAGAAATGGAGGGCGAAGCGGAAAAAGCCGGGATCCGCAATGATGA
+CGATGTTATGGATCTGGTGAAGGACGTCCGCGCGGAGATTGAAGGTCTATGAGAGTGTTA
+ATTGACACCAACATCCTGATCTCCGCTTCCTTGAGCTGCGAAGGAACGCCTTATCAGGCG
+TACATTAAAGCTGTAACACACCCCAACCATGGTATGGTTTGCGATCAAAACATCGATGAG
+CTTCGCCGGGTATACAACCGGAAATTCCCCCATAAGATCCAGGCGCTTGAACGCTTTTTG
+GCGATTGCGCTTACTGTTCTTGAAGTTGTTCCAACTCCCGCAGTTGACGTGTCGGATGAG
+GCGCTTGTCCGGGACGCATCCGACAGGCCAATACTCAGGGCGGCCATTGCGGCAAAAGCT
+GACGTGCTTGTAACCGGAGACAGGGATTTCCTTGAATCCGGCATAACAAACCCAAAGATC
+GTAACAGCGGCAGAGTTTCTGCAAATGGAATAAAAGCAGCTTTTTAAAGCAGGGATTACA
+GCCACCCTGCTTTTTTGCTGCTTATATTCCATAAGGTATCACATCATCAATGGTCAGCAT
+ACGCTTTGGTTTCGCCAGCCCTAAAAACTGCTTATGGCACTCCCATAAATCCAGCAGGTA
+CCCAACAGGCATTAGCCATACTTCATCCTCTGAACGATTAAGCTGGACGGTGCCGTAATA
+TAAAAGCCGAGTGAACAATTCCTCATCGCTCACTCGGCCGGTGTGTTTTTTAAATCATCC
+TCACTTTCAACATTTCTTTTGGTGCCTTTGAACATCGCTTTCATGATAGCGTCTTTATAT
+GCTGCCAGTTCCAAAGGAGATGTGAGAAGTTCCACTGTCTCTTCGGTAAGGAGTTCACGC
+TTATCCTGATGTTTGAGATTGTGTATCAGAATGCTCTGGTTAGCCAGCAGTGTAATCAGC
+CATACCACTTCGTCAAGAGCCATTTCGAAGTTCTCGGTTTTCATCAGTTTCGTGCCGAGG
+TTTTCAAGACCGCCGTACCTTTTTGCAATCTCCTTTGTCGCTTTAGTGGTTAGAATAAGC
+TGGTATTCTTCGCCGCCGATGCTGATGTTTGCGCTTCTGTCCGTATCCTGCATTATTAGC
+TTCCTCCTCCCACAGCAAATACCGGCTCATAAACTTCCGTATACCAGCCAGCGATAGTTT
+CAGGCAATACACCGGGATCGTCTTCGCTGACCTCCGCCTTCCAAGGGTGCTTTCCCTGGC
+CATCTGGTTTGTTACGTCTCATGACTGTCCCTTCAATGGTGGGGGTCGAAAAGGTAATGC
+TGTCACCTTTCGTTTGCAGATTTGTCGCCGGGATTCCGAATTTCACCCTGTAAAGCCAAA
+AATACCTGTACTTGCCGTTAGCTTTCTTGGCTCTAAAGCCAATTGCAACAGGCGCGCCTC
+CATCCTCGCTGGTGGAAATCAGCACCTTGTTGTCATCAAGGGTGGCTCCCGTCAAAACCT
+CAGCAGCGTCTACTCCGATATCTGCAACACCAAGAGTCAGTGTGCCGCTTTGAAATTCCT
+TGACCACTTCTGCCGCCCCGTCATCGGCATAAAGCGTCGCCTCTGCCAGCTCCACAGAAA
+GCTCTGCCGTAATAGCCTTAGCCAGCGGAACAGGCGTGGCGTATGTCTCTTCTCCGTTTT
+CATTCTCAGTTATTTTGGCATAATATAACCTGTCCAGTCCGATTGTGGCCATGTTTTTCA
+TTCCTCCTTTACTTCATATTCTTTTGCCACATCAATGGCATAGTGGTGATAGCCGGTATC
+GTCCTCATGGCCTATATACCGCCTGTCGGTAATGGTAAAGCCTGCTTGAAGCAATGTGTT
+CACTATTTCGTTTTTACGGGCAGTGTAGTTTCCCTTTATAAATAAAGACAACCTTACCTC
+CTGGGTTTCTACCTGAGGCTGGTTGTCTGCAAAAACTTCAAATGTATCTGTCATCGGAGT
+AATGACAAGGTACTCATCTGGCGGTACACCGCTAAATACCCCGGTTTCAATGGGGATACC
+CAAACCATCCAATAACGAGTTTAATTCTGACAATATGCTCATATACGACCCAGCTCCTGT
+TCCAGTCTTGACTTCATTACTTCGATGCAGGACTTCCTTGTAGCTGATTTTGCCGGTTTC
+AAAAAGGGCCTTGGAGGCTGCCCGGACTTGCCATACTCAATAATATTAGCAATCTTCGCA
+TTGCTTTCCCCATCCTTCCTTGGTTCAGTAAAGCCGATTTTTATGTTGTGGTTTCCATCC
+CTGTCCTGCTTGGCAGGAGAAAGTCCCAAAGCATTTACCAATTCACCGGTTGCTCTGGAC
+GGATATTTAGTGCCGCTCCCGATAACTGACTGAAGATTGGACTTTACTTTTGAAAGAACC
+ACTTCCCCGCCTGCTTCCAGCACCTTAGGTATGATTTCGTCTGTTCTTTCTCCAAGTCTG
+GATAACTTGAGCAAGAACTGTTCCGGCATTTTAACTTCCACCTTAGCCACGTTGCAGCCC
+CTCCTTTTATGCTTTGCTTGATTTCACCTTTTCCGCAAGCACCTCAATATACATTCCACG
+TCCTTTTACATCCTCAACACTTATAATGTTGTACCTGCCATCGCTGCAAACGAGTACAAG
+ATCTGTGGTAATTTCAAGGTTAGGTATCTTACGGAAGCGGAACAGGGCAGACGCCTGCGA
+AAACGCCGCCCTGTTTGCCCATTTTTCACTGCCATGCCTATCTTCCTTGTATGCTCTTAC
+CGAAGCAAGAATGACATCACCTTTTTCAGTAAAACCCTCACTATCCTTAACCGGCTTGAC
+TGAGATAATGTCCACGAAAGTTTTCATTTTCCCAAGGCCCATATTTACACCTTCCAATCC
+CGGTCAAGCCGCAGCAATAGATTAACTGTATTCCATACCTGCTGTCCTGCCTGCACACTA
+TCCCCAAAAAAGCCAGCAGTCGAGCCATCCCTGCTTTCATAAAAATGGCTCGACAGCATA
+ATGACAGCCTGCTCAGTAGTAGGCGGCATGGGGTTTTCAGCATAATATCCTTCCGGCTTT
+TTCTGGTAACTTTCCGCATAGGCCACTGCGGCTTTGATATACTCTTGTAAAAGTGCGTCA
+TCTTCGCTGTGCTGCAATATGAGGTTTGCTTTAACCTTCTCCAAAAGTTCCATGCCGCAG
+CACCTCCGTTTTCATTAAGTTGATTTCTGCTGCAGTATCTTGACTGCTTCAGACAGTACC
+AGCTTGCCATCTACACGCTGGGTTGCCATGAATCCAACTTGTCCGGTCGCAGCATACAAC
+TCATTAAGCCGCTTAAAAACCCTGCCTTGACGGTCTGCCACCCAGTAATAAGAAAAATCG
+CCGAATACAATCGTTTTTGCTCCGGCGGCAATGGCTGGCATAAATGCAGAAGTTTTAACT
+GGACGATTGAGGATAGTATCCGGTGTTCCAGCAGTTACAGAAGGCTGCCAGAGATACTGA
+CCGTTGTTGTCTTTGAGCTTCCTTATAGCTTTAATTGTCGAATCATTCATAATGAATACA
+GCGTTCCTGCGGTACGGAGACTTTAGGCTGTAGAACAAGTCCATGATCTCGTCAAGGGTA
+ATGGCTGTTGCACTCGCCGCGGTTACTCCTATCTCGCCACCGCCGTTATCCGCCAAGATA
+CCGGTTGGCTTGCCAGATCCGTCGCCGATAAAAAATGCTTCCTCCTCTTTTGCTCCGATT
+CGGCGGGCGAATTCTTTGGCTATATACTGTTCAAGGTTAAATACACTGTCGTTTAACAAT
+TCCTCTGACACCTTGATCATAGTAGCCAGCTTATATGCGCCGATGGATACCTGTGCAAAG
+GAGTCATCGCTTTCGGGAATCTGGCCTTCCTCATCCACCCAGGATGCAGTACCCTTGCTT
+GCCACCACAGGAATTTTCTTGTCACCGCTGGACGTGGTAATAACATTGGCAATCTGCCTA
+AAGATATTCTCCTCCTCCAGTGCTTCCACAAGAGTACGCTCAAAGTCGTCGGGAACAAGA
+TATCCACCTTCGGTGTCCTCTCCAATCTGCAGCGCGTTGTGTACGTCATATTTGCGCCTG
+CCGCGCATCATGTTCCAGAAAGACTGCCTGTACTCATCGCTGGCACGTCCGGTTTTTTCA
+TTGTTGCCAGATATGGAAGTGGGTTTGTCTGTAATAGGAATATTCAACGGTTTTGACAGT
+TCCAAATCTATGGCAGCCTGACGCTCAAGACGCTCTATTTCTTTGCCCAGCGCAATAACG
+TCGGCTTCCATTTTTTCATAAGTTGCGGTATCCTCCGGTGAAAGCAGTCCGTCGTTCCCG
+CGTTTGCTGTCGAGGAAAGCTTTAGCAGCTTCCCCTACTTTCGCGCGTTTTTCACGCAGT
+TCCAGTATTTTGCTCATAATCAAATCCTCCTTAAGGTTTTATTTGGGGTCCCCGCTAAAT
+CGTAGATTTAGTGGGGTAAAAGTAGAAAAAGCCGCTTTTCAAGCGACTCAATTGGTGTTC
+CTTTTGGTTTTTCTTTTGGTTTAAGCTTTTGCAGGATGGAATTTGTTACTGCCTGCCTGC
+TGAAGATCATTCCTCCTGATACTTCAAACTCGGATGGGAATGATTCATCCTCCATAAACA
+AGATTCCATCAGCAAAGCCAAGTTCCACCGCTTTTCTTGCGTTAAACCAGCTTTCTGCAT
+CCATTAGGTGCGATATTTTTGCCCTGGAAAGTCCGGTTTTCAGCTCATAAGCGTTGATGA
+TGGATTCCTTTATTTCTTCCAGCATTGCGATAGCTTTCTCCATTTCTTCTGTATCACCGA
+TGGCTATTGTCATAGGGTTGTGAATCATCATCATGCTGACTGGTGACATAAAGACGTCAC
+CTCCGGCCATAGCTATGACCGAAGCGGCGCTGGCTGCAATACCGTCAATCTTTACCGTCA
+CTTTGCCTTTGTAATCCATAAGCATGTTGTAAATTTGATTAGCTGCAAATATATCTCCGC
+CAGGGCTGTTGATCCAGATCGTTATATCACCCTCTCCGGACAACAGCTCTGATTTGAACT
+GTTTGGGAGTTACTTCGTCTCCCAGCCAGCTTTCTTCAGCTATTGGGCCGTCAATATATA
+ATGTCCGGCTGCCATCATCGTTTTGTATCCAGTTCCAGAAGCGGCGAACCGGTTTTTGTT
+TTTGTGATTTGTTCAACTTTTGATCCCTCCGTTTCAGCATTGTTTTTGCCTGCAAATGTA
+CCTGCATCGGCAAGCCTGGTCATGTTACCGTTAACAAGATACAGATCTCCGCCCAACTCC
+GCCGGAATCCGGTTCATGTCCTCAAGCTCGCGGATATCGTTAGCAGACATCCAGCCGTTC
+TGGCGAGCTACAGCATAACCATTCATGCGGCTTGCATAATCACCGCGCAGAAGGCCATCT
+ACATTGAATTTGACAAAGTATGCCCGCTTCTCTGATGGTAAAAGCAGCGCTTTTTGGAGA
+GCCTGTTCCCAACGCACCACCCACGGGTCAAGCGTGTATTTAACAAATTCCAGAGATTGC
+TGTTCGATGTTTGAAAAGCTTGACTTTTCAAGATCTCCAACCATATGGGGAGGTACTCGG
+AATATCCGGGCAATTTCGTTTATCTGGAACTTTCTTGTCTCCAAAAACTGTGCCTGTTCG
+GGTGGAATGCCGATTGGCTGAAACTTCATTCCCTCTTCCAGGACTGCAATACGGTGAGCA
+TTGGCACTTCCTTGATAAACAGCGTTCCAGCTTTCACGCACCTTTGCCGGATCCTTTAAT
+ACGCCGGGATGTTCCAGAACGCCACCCGGATTTGCTCCGTTGGCAAAAAAGGATGCACCA
+TACTCCTCACAGGCAATAGCCATGCCTATGGCATTCTTGGCCATAGCAATAGGGGAGTAT
+CCGATCAGTCCGTCAAAACCGAGTCCCGGGATGTGAAGAACCTCATCACTTCGTAGGTAT
+ATAAGGCCTGCTTTTGGATTAACCCTGCTCTCATCGCTGTCGCGCCGATAAGTGTAATAC
+AGCTCTCCGTTTGGAGCCCTGTCTACCGTCATTTTGTTTGGCAAAAGGGGATAAAGCGCC
+AGCACTCGCCCGGAACCGTCCCTGACAATCTGGGCATAAGCATTTCCCCATAAAAGAAGA
+TGACTCATCAGTGTTTCTCGGAACACAAATGAAGTCATCTCAGGGTTTGGTTCGTCATGG
+AGCAAATAATAGAGCGGGTGGGTCAACGCTTTTTCTTTGCCACCGTCTTCCTTGTATCGG
+TATACATGAAGCGGAAGCCCGGCGATGGCTTCTGCAAGTATCCTTACACAGGCATACACT
+GCAGTTGTCTGCATAGCAGTCCGCTCATTGACAGCTTTTCCGCTGGATGTGCCGCCGAAG
+AAAAAGCTATATGCATTACCGAACAGGCTGTTTTTCGGCTTGTCCCTTGCTTTGAACAAG
+CGGGAAAATATTCTCATAAGCATCACTCCTAAAAATGGGCATGAAAAAAGCACCACATTT
+GTGGAGCTTCTTTACATTTTTATATTTTATTGATTAACTTCTTATTAACTTATCCTTATT
+TTGTAGTAAAATATCTGTTGTTTCTTTCCGTTCAAACAATTTACGATCCGTCAAATCTAA
+TTCTTTTTGTGTTTCAATGAATTCAATTATTCTTAAAAAATAATCGAGACATTTCCCTGA
+ATCATTCAAGATACGCAAAATTTGATTGCAAGCATTGATCATTTTTTTGGCACTATGATG
+TTTTGGTAAGTTGTTTGTTGCCATATACTTTAAAAGCATTATGGCATGATACTTTCCTTT
+ACGGTATTTTTTATCAATACATTTTGTTTTTATCAGGTTTTCGAAACGAAACATGGCCAA
+AGAACTTGTGTAATACAATATAGGCTGGTCGTCAGGTAGAAAAATACGGTTTCCAATATC
+TTTCAATAAGCTACTATAATGACCAGCAGCGTCGTGTGGTTTATCATTGAACATTGATGA
+TGCATTTTTTAACTGGGCACGAATAGTAACTATTCGATCTTTGGGAATCGATTCATTCCT
+ATATTGTCCTGAACGACGTTCATAATACAAGCGTTCATCCTCAGCAGTGTATGTGCGATA
+GTATTCCTCCAGTGTTTTTTGGAAAGTTGATAACGCTTCTAATTGTTCTTTGGTTATACC
+AGTTTGATTATTTGTAGCTTTTGTAATACGGTTTTTTAAGTCCTCATCCTTGGTTACAAT
+AATCTTAATCGGTATAAGTAAATCATGTATTCCAAGATTATCACGGTTAAGATACAAAAC
+ATGGCTGGTTTGGCATCCATTAACTATCTGATAGTTTGAAATTGTCATCTTATCGCTCAC
+AAGCACAGCAGAATGAGCGACAATTGTTATTCCATTATTTAGCATGCAAAAAGCGCTATT
+TCTGCCTTCAACAATAGTTTCTTCAATGTCCGCATTAACATAATTATTCACTCCAAGGAA
+GTCCCGAATATTATCTTCAAATACTTTTTTTAGTGAACCATTTTCATCGCATATAATTTT
+ATAAAATTCGCAGAATGGCAGTACCCCACTATATCCATAATCTCCATTATCATCAGAAAA
+CATCATCACATTTTTTGTAAAAACAAAAGTCGCTTCTATTTGCTCTTGTGATTTTCTATA
+CATACGCTGTATTTCTTGGGCACCGCAAGGTATAAATTCCACAGATGAAAAAAGTGCCAT
+GTTATTAAGCGTATCTATATGACTATTAATTACAGCTTTCAAATTGGAATCATCATCGTT
+CCACTTCCCCGGAGCAATATAATAAAGTCGTATTATCGGGTTTTTGACTTTCATATAGCG
+AGAATTACTATAAATAAAATCCTTCATTTCTATGAAGTCTGCCATTTCCTCTGTACTGAA
+TGTATTCTTAGCTTCATCAGAAAAAAAGACTTTAACAAAAGACAAAAAGTTACTTATCTC
+TGAATTATCAAAACTGTCAGATGTTTTTGCTTGTACAAATATAAATTTTACATCAAGTTT
+TTTATTTTGCTTAATTAACGTTTCTATCTCATCAATACTGCACACAATAGCTCCGTTTAC
+TTCTATCGCTATTCCATCAATACCTTGAGTAGCATTGCCAGTATGCATGTCTTGAATATC
+TATTTCAACCATGCCAGTTTCTGCAGATAAAGCACAGAAATTGGCAAAATGCTCGAATTG
+AACACTTGTTTCGTACATAGTAAAATTATGGCTAATAGAAAATTCATCTAAAAAAGCCTG
+AGTTATACGATCCAAAGTTACTCCTCCGATAATAATCTTATTTGGAGGAATTATAACACG
+TTTTGTCAAAAAATTCAATTACTTCACTCCTCGAGTGTTTTTTAATTAAGGACTTATATA
+AGATATTATGCTCACTTATGATATATTTTGTTTATAAAAATAAAATTCCCCTTTCATCAT
+AAATTGATCCGTTGCGTTCATCCCCGTCATGCCTTAACGCGCGGTCAAGCGCCATAATTA
+ACGCTACCGCGCCATCTATTCTCTCGGTGGATTTTTCTTTATCAGGCTTTATGTTTCCAG
+CTGGATCAGTTTTGACATAGATATTGTCCATCATCCAGCGCAGTACTGGATGGCCACCAT
+GGGCGATGCGTTCTTCCAATGTCAGCTTCATCAACTCTTTTGTAGGCGGCGACATATCTT
+TGAAACCCTGGCCGAACGGAACAACCGTAAAGCCCAAGGCCTCGAGGTTTTGCGTCATCT
+GAATTGCTCCCCAGCGGTCAAAGGCTATTTCCTTAATGTTATATTTCATCCCGAGCTCCT
+CAATAAAAGTCTCGATAAAACCGTAATGCACGACGTTACCCTCAGTGGTATATAAAAAGC
+CCTGCCGCTCCCAGACATCATAAGGTACGTGATCTCTCCGCACACGCTGATCGATATTCT
+CCTCCGGTATCCAGAAAAAAGTCAGTATCTGATATTTGTCCGATTCATCAAGCGGCGGAA
+ACACCAGTACAAATGCAGTAATATCGGTAGTAGATGACAGGTCAAGTCCTCCGTAACAGG
+TTCTGCCGCGCAATTTTTCCGCATCAACAGGAAACGCACACTTATCCCATTTATCCATTG
+GCATCCAGCGCACCGATTGTTTCACCCACTGATTTAAGCGGAGCTGACGGAATAAATTTT
+CCTCTGCGGGGTTTTGCTTGGCATTTTCACAAGCCACCCTCAGTTTTTCGATGTCGACTG
+TAATGCCTAGTGACGGATTAACCTTTCTCCATACCTTTTCACTTGTCCAGTCGTCGGTAT
+CGGATGCGCTGTAGATAACAGGGTAGAAAGTCGGATCTATCTTACGTCCCTGCAGAATAT
+CCTCTGCCTTTTGATGCACTTCCCAGCAGATGGAATTGCGGTCTGTGCCAGCAGTTGTGA
+TCAGGAAAAACAGCGGTTGTTTTCTTGCATCGCCAGATCCGTGAAGCATTACATCATAAA
+GATCCCTGTTTGGCTGAGCATGAAGTTCGTCAAATACCACACCATGGACGTTTAGGCCAT
+GTTTCGTATATGCCTCCGCTGAAAGCACCTGATAAAAACTGCCTAACGGTTTATAAACCA
+GCCGCTTCTGTGACAGCATTGGTTTAATTCGAGATTTTAATGCCGGACACTGTTCCACCA
+TATCTACTGCAACGTCGAAAACAATGGATGCCTGCTGACGATCAGACGCACATCCATAAA
+CCTCGCCACCATGCTCGAAATCACCACAGGTAAGATATAAAGCAATTGCCGCTGCAAGTT
+CGCTCTTACCCTGCTTTTTGGGATTTCTATATAGGCAGTGTTAAACTGCCGGTATCCGTT
+AGGTTTCAAGATTCCGAATATGTCCCGGACAATCTGTTCCTGCCAGTCAATTAATTCAAA
+AGGCATTCCATACCATTCACCCTTGGTATGCTTCAGGCAGTTTATAAAAGTAACAGCGGC
+ATCCGCCGCTTCCTTGTCATATCGAGAACCTTCCGCCATAAACTTGGTTGGTTTATATCG
+TTTTAACTTCCGCAGCTTTGCCGCCTCCTTTCCTAAAATTGAGCAAGAAAAAAGGAACCT
+CAGGGATGAAGTTCCTCTCGTTAGTGGATTTCTATGAAGCCTGTTACGTTATTACTGTTA
+TCGTTTGCCTGTCAGGATAAACTCGGCATATTCTTTTTTGTGTTCATTTAGAAAGACCAC
+CAATTCATAATAACCCTTTTTGTATGCCTCCTCCTGCACTCTTGGCAAATCAAACATATT
+GCAGACACCGCTGTCCCGTATGACAATTATCTGCCGGTAAATCTTATCAGTTATCAGATT
+TTCTATACCCATGTCCTACACCTCAGACTTCTCTGCCGCTGAAATTGAATCTCTTACCGC
+TTTATTGAGAACTGAAATATCAAAGCCCGCGTCTATATATCCGTGCCGAATCACCTCGTA
+ATAGTAACGACCCGGTGCTCCCAGTGGTCTGCCTTCATTCATGATATACACCATTGCGGG
+TACCCACTGCCCTTTGAAACGTACCTTAACTGTTTCTTTCCGGTATAGATGCGGATAACC
+TTCATATCTGTCCAGCGCTTTCTCATCATTAGGCATGATTCTCCAAAGCAGTACTGGTAC
+TCTTTCACCTTTTTGTTTTTCTATTGTCGCTACTGCGCCGCCATTCCCTCCTCTGAATAA
+CAGCCGGTATCCTGTGAGTTTTGCACTCCCCAGCACTTTTGCCGTCGGGCAGCGGTATGC
+CATCTGCCTTAAGTTCAGATTGCTTCCGTATGCTAAATATATGGTTCCTTTTTCTTTGCT
+CATCGTATCATCCTCCTTGTATTTACCAAGGCAGGGGCGGAGATCCGCCCCTGCGCTTGT
+CTATCTATGCCGCCCGAAACCGCCATGCCGCGTTGCCGCCCAAGTGTTTGCAAAGGTGCT
+CCCGACAATTTTTGAACTCATCACCAATAAGTCCTATGCGGTTGAGATATGTCCGCATGG
+CAAACTTCTCGTTCTCGACCTGCGGCTTTTTGCTGGAAGCGCATTTTTGCGTCAGCGCCT
+GATGGTTGAGCGCCAAGGCAAGGACGATGTAGCTCCTTATTATCCCGGCGTGGAGTTCGC
+TGTTGAAGCCGCGAAGCTCGATCGTACCGTTGCCGTTGAAAAAGCTGTGCAGATTGAGAA
+AATAGTACCGACTTCCATGATATCGCTGGCTGCGGCTTTCGCTGTAACCCTCATACCAGA
+TGCTCTCAATCGCCGCCATGGTTTTGGGCTTACGCCGATTCATCTTCTCAACCAGTGCCG
+CATCCATCTTTTTACAAAACCGCATCCTGTCCGGCTCAATCTGCAATGCTTTATAGAAAA
+GGTCATTCTTGCTGGCGATAATATTGATAAAATTGCGGATGCTTCGAGGCGTGTGGTCTG
+CCCCGTCTATATGGATATGGATCCCACAGCTTGTGTTTGCAAAACCTCCCGCCTTGCGAA
+GCCTCCTTACCAATTCCTGCAGGGTTTCAATGTCCTCGCGGTATGTCAGTATCGGACTTA
+CCAACTCGACGCTATATTCCCGGCCAGCCGCCGCAATCCGGCCGTTTTCCTTTTTCTGAG
+TCCGAATGCTCCCGTCGCTCATGAATTTCCATATCCGTCCATCCGGTGCAATAACCTTTT
+GGGTATCGTAATAATCTCCGCTGGATTCAATCCTCCCTCCAAGAAAAGCTGCTGCAGTTT
+TTGCCGCCTGTTTTCTTGTAATCCCCGTCAATTCTACCTCGATTCCAAATCTCGTTGTAA
+GCATTGCGCTTTCTCCTCGCTTTCTCTGTGTTTTTTGCCCTTTGGCAGTGTACATTAGGC
+CATTGAAAACACAGGATAGCAAGGCAATTCTGCATGAGTTTCCGCTGGATTTTGGACAAT
+TTTACATATCTTGATTTGTGTACATTTACAGCTTTCTGATCACATCTATACCATAGGCTG
+CACCCAGAGAAGAACCGCAGTCCCAGTTGATATGAACGGTTCCGATATCATCCACGAAAG
+ATACTGTTCCTTGGTCTCCCGGTTTCAGCTTAGAATACGGATCATCCATGCAGATAAGTT
+CAACGCGTGTTCCCGGTGGATACTGCTCTTTAAGGCGAAGGACTGTTTCTTTTGAAGGAA
+AGCCTCTTGCACTCATAGTCCGTCCTCCTCTCCAGGATAAATCATTCATTTTCGTCCACC
+GCCTTTGCTCTGCCTTTCCGATACGCCCCGTTACCGGACAGCCTTGAAAGTAACACCTTG
+CGTTCAGTTTTGAAGTTATCACCTATAAACCCCAACCTAAGCAGGAAACAGCGAAAAGCA
+TATTTTTCATTATCTGTTGGTTTTTCTTTTCGTAGTACTCGCTTCTGTAATTTTGCCTGT
+TCTGCCATCTGCTTTGCCAGCGTTATATAGGTCTGCACTTCATCAGCATTTAAAGTCGCG
+TTCCAGAAAGGAAAGGAAATCTCATCATTTTCAGCTAAGACTACAAGTTCCCCCTCAATC
+AACATTGCCTTCTTTATCAATGTCTCTTTGCTGGCCAGCATATTATTTAGGTTTTCAAGG
+CTAATCTCGCTAAAGCCCTCCAACGAAAGAGTAATTGTCATGGTTTCCTCTGCTGAAAAA
+CCCTCCACATTCAACGCGTCAATAACTGAACGGATGGTTTTTATTTCATTGAGACTGATT
+TTCGGTGAGTGAACCACACTGTCCCTGTCAATCGTCCAACTGCCAGCAGATTTTTCGTCT
+TTAATCTCATACAAAAACTCCGGTGCTCCGGCATAGCGCACCTGGCCTTCAAGGGCTTCA
+GCTATGACCGAGGCAATGGCTTTTCTCTCCTGACCGACAATCTTCTGTGAAAAGCGAAAG
+CTGTTATTGCTCATGCCATACACCTCCCCTCAAATAAGCTAAAACATTTTTGATTCCCAT
+AAAAAATCCCACCTTTCCTTTTTGGTGGGGTACATTAACGCTCTGTTTTGAGGGGAAAGC
+AAGGACATTTTTAATCAATCTGTGTTTCCGCGTAAGGTATTTTTTCACTACCTGTTACCA
+AGAATACTGAATCTGCGCCAAATTGTGAAACATAGCGCTTTACAATCACATCGCAGTATT
+TCGGGTCAAGCTCCATCATAAAACAAACCCGCCCGGTCTGCTGTGCCGCAATCATTGTCG
+TACCAGAACCACCGAACAGGTCAAGAGTTAAATCTCCAATATGGGAACTATTGAGCATTG
+CCTTTGCTACAAGCGATACCGGCTTCATGGTAGGGTGCTCCTCCGATACTTTAGGACGGG
+GTATCTCCCAAACATCTGACTGTTTACGGTCTTTAAGCGGGCAAAGGCGTGTTCCTTCAA
+GCCAACCGTACCAGATCGGCTCGTACTGGGTATGATAGTCCTTTCTTGACAGTACCAAGC
+TGTCTTTTTTCCATATAATTGTGCTCGACCAGTGATACCCTGCCTCCCGCATGACGTTCA
+TCAAACTGCCCCATTCCTGAGCACTCATTACTATATAGGTCATGCATCCGGCTTCAGAAA
+CCTCTTTCATGCATTTAAAAGCGCGCAATAAAAAAGCGCCGAATTCTTCGGTGCTCATAT
+TGTCATTTAGAATTTGTCTTGGCTTCCAGCTTGGATGCCTGGTATCTGAACCGTAATCAA
+CATTCCAGGGTGGGTCGGTGAAAACAAATCTCGCCTTTTGTCCGTTCATCAGCTTTTGCA
+CATCTGAAAGCATGGTGCTATCACCGCACATCAGACGGTGGCTGCCAAGCACCCATATGT
+CGCCCTTTTTAGTGACCGGAGTTTCAATCTCTGCAATTGCCTTTTCTGTATCGAAATTAT
+CCTCTTTGACATTAGCGGTTGTTTTATCACGGAACAACTCATCAATTTCCGCAGCATCAA
+ACCCGGTAAGAGAAACGTCAAAACCATCTTCATTTAAATCCATAAGCAGATCGGTCAAAA
+GCGGAATATCAAACTCGCCACTGATTTTATTCAGTGCAACATTGAGCGCCTTTTCCCGCT
+GTTCATCCAAATCAACTACAACACAGTCGATCTCCTTATACCCCAAAGCTGTAAGTACTT
+TATAACGCTGATGTCCGCCGACAATGTTCCCGGTGCGTTTATTCCATATAACCGGCTCTA
+CATATCCAAACTCTTCAATAGACCGACGTAATTTTTCATATTCAGGGTCACCAGGCTTTA
+AATCTTTCCGCGGATTATATTTAGATGGTTTTAGTTTTTCTGTTGGTATTTTCAGTATAT
+CCATAAATCTTAACCCTCCAGTTTGATGGCTTTTTCGCCGGTGAATTCCTCCCAGCGCTT
+AACAGCTAAATCACAGTAAACAGGGGATAACTCCATTGCGTAGCATTTACGCTCGGTCTG
+TTCAGCCGCAATTATAGTAGTTCCGCTACCAGAGAACGGCTCAAGCACAATACCGCCTTT
+GTCGCTGTGCATTTTGATGCACCGCCATGGAAGCTCCACAGGGAACATTGCAGGATGCTC
+CTTGTTTGCCCGTACAGTGGTCATCTCCCATATCCCAGCATAACCCCATTTCTTGCGTTC
+TTCCTTTGTAAGCCGTTTCACAAATTTATAACTGTGTCCCGCAAAGGCTGAAAGCCATAC
+ATATTCCTGATCGTTATATTCCTCAACTTCTCCTTTATTGCTGAAGGCCGAAATATACTC
+ATACTGCTGAACCGGCTTGTTTGAAACAAGATGATAGGGTCCTACACCAAAGTTCTGCCC
+CTGCTTCTTCCAAATACGGATCCAGATAGGTCGATAGCCATTGTCCAAAAACATATTCAC
+GCTGTACACGCTGGTTGGTTCAATAAACTGGGAGCCGGTTGCATATAAATCACCTAAGTT
+CCAGCAGACAATATCTGCATACCTGCATAAGTTTCTAATCACTGGGCGTACTGTCTCGAA
+CCATGGCTCAATCCCGGCTTTTTCATATTCTTTGCCTACCCCATAAGGCGGGGAAGTCAC
+TGCCATCTGTGCGTGACACCCTTCCATCAACTTCTCAAAATCCTCATTCTTCGTAGAGTC
+GCCGCACATCAAGCGATGATTCCCGAGAAGCCAGATATCGCCCCGCTTCGTTACCGGCTC
+GCGCTGCACGATTTCCTCATGCGCTTTATCTATGTCAAAGCTGTCTTGTACCGCCTCTTT
+GGAGTACCATCGGTTAAGTAGTTCGTCTATTTCAGAGGCGTCAAACCCTGTAAGCGAAAC
+ATCAAATGCACCTGCGTCCAACTCAGCCATCAGTTCGGCCAGTTTATTCTCGTCCCACTC
+TCCTTGAATCTTATTGAGAGCAAGATTAAGCGCTTTTTCTCTCTGCGGGTCAAGATCCAC
+TACAACGCAGTCTATCTCAGTCTGTCCCAAGTCCAGCAAAACCTTTAAGCGTTGATGCCC
+GCCTACCACATTACCTGTTTTTTGGTTCCAGATAACAGGCTCCACATAGCCAAATTCCTC
+TATTGACCGTTTTAGCTTTTCATATTCCTTATCGCCAGGTTTTAAATCCTTGCGCGGGTT
+GTATGCTGCTGGATTAAGTTTTTCAACAGATATTTTTTGTATGTTCATGCTGCATTCTCC
+TGTTCAATATTTTCTTAAGACCCTTTTTTGCGCCCTCACAATCTCCGTTTATTACTTGTC
+CCCGCAGAGTCTTAAACTGCTGCTTCGTTAAATGGTCTTTATATTTTCTTAGTTCCCTAA
+GAAAGATTGAATTTGTTTTATGCATCAGCCACCCCTCCTGGCTGTCAGTAGTTTTTCCAT
+CACATCGTCGTGGGGAGTGGCCCCCTTGTATTCGGTAGCACAGTTTTCCCGCACGACTTG
+ATAAATTTGATACCACAGGTTATTGGCCTGTTTCATAAAGCTTTGACTCATAGCCACATA
+AGGTGACGGGATGGCATTGCCAGTTGTCGGATGTTTAGCAAGAAAGCCAAATTCAGTGAT
+ACATTCCTCGCACTTGATCCACCGCGCCACACTCTGGGCATATTGCTCTATAAGCTGCGC
+AGGGATAAGGTGAACACACCTGCGTTCCTTAAGCCACTGCCATGTTTTTTCGTATATTTC
+CACCGCCAGTGTTGTTTTTCCGTTCTTCTGCTTTGCAGCAAGATAATCCCTCGGTGGCGG
+CATGCTCTCTCCTTCTAGTTCCGCAGCATCCGTAAACTCCATTACCATGAGCTTTCGTCT
+GCCGGGGTTTCCTTCCAAAATCTTATCCGCCAGAGGCTTTTTCTTCTGTCCTGCACCGAT
+ACGTGCCCCGCCGCGGTTGGTACCGTCCTTTGCCATACACATCACCTCGATTCATGTAAA
+AATAAACAGGGGATATACCCCGTTTGAAACTGCGATTTTTCGCGCGTGACCCCCCGCCCG
+TTGCACAAAACTGCTTCACCAGAGATTTTGACCCCCCTACCGTCTTGCCCATCGCTCTCC
+TTCGCGGGCAGTGATCGATGAGTGACATTGTTTGCATAGACTCATAAGGTTACTGTCTGC
+ATTGGTTCCGCCTTTGGATAAAGGGATAATATGATGTACCTCTTCGGCTGGTGTAAGCCT
+TCCGTACTTTTGGCACTCCTCGCAAAGCGGATGCTCTGAGATATATCTGTCCCTGATGCG
+TTTCCATCTCCGGTCATAGCGTTTTCTTGTTTGGGGATCTCGTTCGTATTTGTTGTAATA
+AGCATCCATTTGCCTTTGATGCATGTCGCAGTACCTTCCGTCCGTCAGTTCAGGACAGCC
+AGGAAAGGAGCAAGGCCTTTTTGGTTTTCTTGGCATCTGGCCACCTCCTTTACGCGTATA
+AAAAAGCCCTCACAGGTTCATCCCATGAAGGCTTATCTATAATTTTTCACAATACCATTA
+TATTTGGATTTATAATGAATTTCATCTCATAAAAATCTCATCTGGAATATTGAACAACAC
+ATTTGCTATTTGACCATGGCATCTTACCGTTATAATACTTATCGGAGATATACCGCTGCA
+TATCGGGTGGTAAAGCTGCAAGCAAAAGATAAGCCTTTTTCCTGTCTTCCTCTAACTCCT
+GGGTGCTTTTATAGAAGGAACATTTATCTTGCAAGCACTTGTGTACAGTCAGGATATTGC
+AGCCATTCCTTCCGTTACTGCCAAAACAATTATCGTACATCTTTCCTCACTCCTGTTTTA
+TGGCATAAAAAAAGCCCCGAAGGGCTTATGCGTTTTAATGTTATTTTTTCACGATATCAT
+TATATATGGGATACCTGTGTTTTACATCTCATAAAAATCTCACATAAAAGGAATGTAAAA
+ATATCAGTTTATTTGTTCAAAGATAGCTTTCGAGTATACTTCTATATCTCCAGGAGTGAG
+CATGTTGAATTTTTCTTTCACAGCGACAAAATATTCCCCGATCAATTCTTTGGGTATTAC
+ACGATTAGAATGCGCATCCACCGGCAAACCGTCTCTGGTATACCGCCATGGTTTCTCCAG
+ATGCGTAAACTTTTCTAGTATTTTTCCACTATAGCAGCAGAAGTTCTTAATAACGCTATC
+CAATATTGCTTTTTCAGCAGTTGTAAAAACTGATTCATCGAAAGCTTCAACGCTCTCAAT
+TGGGTCAAACCGATAAGATGAATACCTGTTATATACATCTCTGTAAACCGGTCCATGAAC
+CCATGCCTCACAGTCTTCTTCAAAAAGAAACCGTCCTTCAAAAGCGTAATAAAAGCCCTG
+GACATAATATAGTGCCTTTTGTAAAGCTAAAGGAGTTATGTCCTCGCACTTATAAAGCAG
+ATATTGGATAATTGAGTCCAGCTTCGAACCCGTTTTGTTTTCTTCCCCAAGCAGTTCCTG
+TACCTTCCGCTTACTTTTTTCATATGCCTGCAGAGATTTTAAATTGTCCTTATTTTTCTC
+CAGTAATTCTTTATAATACGCTGGATCATCATAAATCTTTTGAAGAATATCTGAATACTG
+TTTTGTAGGCATATCACCTTCACAATATCTCGAAAAAGTCATTTCCCCCCAACCTAAAAG
+CAATGATAGCGGACGTTTGCCAATATTGTATTTCTGAGGTATTTCTAATATCTTCTCCAG
+CGAAATAATGCCGTTTTTTTGACGGTACGTGTCATACAAAGCCTTTAGATTTTCGTCCTC
+TATATCCGCTACATAGACTTCGCTCCCACATTCCGTACAAATAGCCTTCTTTCCAGTATA
+CTCATATTCTTCGCCTTTAAGTTTACCCTTAATTGTTGCTGTTTCTACCATGTATTCGAC
+ATCTCTTCTGCATTCCTCGCAAAATGTCTTATTCCTATTCATAAGGCGGCCTCCTTTCAA
+ACTCTCTAATTTTCTGATTGATCATCGGAAAAGATAATCAATCGGCTTGTTTCGCTTATG
+AAACGATATAACAACCACTCGTTTTCCACTTTCACTATCAATTAGATTAAATTTCGTATA
+TATATCAACTAACTCCTCAATGCCATCAAAGTTAAATAACGTAACCTGGGGACAAAATAC
+ATATAAAACCTCATGTTCAAATCCTACTTTCGTATTTTGCAATGAATGGCAAAAATCTTC
+TGTTTTTATTTTCAGTAAAATCTCCTTTTGCCTTCTGCTGTTTAGATTATATTCATTTAT
+AAAATCTATGTTTTCTTGTCTATTCTCATTTTTTGATATAATGAATCTGCCCTCTCTAAT
+ACAGTCATGTATCATTGCCAAAATCTCATCAATCTGTTCCCAGGTATAATTCTGATTATA
+GTGCTGATTCATTGCATCACCTCTTTTGTGATACAATGATACTATATTATATGCCTTTTG
+TCAAGATTTATGCATCAATTAGTGCATTTTTATTTTGTTGATTTTTACATTAAAATATGT
+ATACTAAAGATAACAGCTCCTACAAGCTTATATTAAGCGCAATACAGTAGGCCATTAAAA
+ATACCCACTTAGGTAGTTCGTTCTATCTAAGTGGGTTTCCTATTTAACATGCTGCTAATG
+TTATCTTAAACTACTTCCCGTATAAAAGCAGTGCCAGATGATTAAGTGCCTTGTCCTTCC
+TACGGTACACCTGTGCTCTTTCAAGAAACAGCTTCTCTCCGATGTTTGCTACAGCTTCTG
+TCTTGCTCACATCATTAACAAAAAATTCTGTCAGTATAAACTGTTCTTCCTCCGACAGGG
+CTTCCCAAGCAGGCTTGAACCACTCCATATATTCTAATGCCCGTCTGTAACGTTCTTTCA
+ACACATCAATCTCGTCAAGGCAAGCAGCAAGGCGTTCTTCGCCGCTTTTGGGATTGTGTT
+TGCCCGGAACTCCGGTAATCTTTGCACTATGAGGGCTTGTCATACGGGTTTCAATTTCAT
+ATATATCCTCATCACTGTGTTCGATAATGTACTGCATGCTGCTGTAATCTTTCAAAGCTT
+CAACAGCAGCCGCTTTTTTATCTAAATACTGCCATGCAATCAGCATATCGCACCTCCAAA
+AAATCAAGATAAAAAACCTTGATCTTTGAAGCAGTGTGCTTTTTTTCGTTGCTTTGCAGT
+GCTTGTTTCCTTGTTCGTTATATCTTCGTTCTTTGCAGAAGGTCATGCTTTTCCAGAATA
+ACCTTCACCTCATCTACCGAATGGACAACCGCTGCCACGCCTCCGGCATTGAGGATTTTT
+TTGATGGTTGCTTCCTGCAGTTTTGTTGTCTTTCCCGATGGGGTTTTTACTTCAAAAGCT
+ATAAACCGCCCATTTACACAGGCAATAATGTCTGGTAGCCCGGCTGTGCCGTACATACCG
+CCATGTTCCTTCCAACAGAAACACCCCGGTACTGTCTTTAAGTACCGCAGGATTTTAGTC
+ACAATACTCTTTTCAGACATAACCGCTTATCCTCCAAAAATGTTACCTTTTCCCCTCTTG
+TTACCCCGGTATTTCTAAAAAGGTAACTTCTCAAACCCGCTTTACAAGCGCATTTGCGGA
+TTTTGTTACCTTGTTACCTTTTTTTGGGGTAGGTATAGACACAAATATTTATATTTTTTT
+ATTTTTTATTTTTCAAAAAATAATTTCATCTCTCGCGCGTATATATAAAGTTTAGGTAAC
+AAAGGTAACATCGGTAACAAGTGGCTATTCACCAGCGTTTCGGGCGTTACCTTTTTGTTA
+CCTTGTTACCTTTTTCAATACTAAAGAGGCTCAATATCTGTAATTTCAAAGCCGCTCACA
+TCGCATCGCTCTTTCAGTATCGAGAAATCAAGAGCCCACGCTTTTTTTGTTTCATTCCCG
+AAACGCATCGTTTTATTGCTCTCTATAAAAAAGTCACTTTGCCTCAATTGCTTCAGAAAC
+TGGTTATATGGAAGACATTCACCTGTGATTGCATAATCGCGTCTGTACTTGGTATAGCGG
+TCATATACATCACAGAAACGAATCCCGATAACCTTGCCATCTTTATCAAAAGTGTAGTCT
+TGATTCGGAGCCAGTTTCATCCGGGCCATGATTTCCAGGGTCTGTTCTACAATGGTCTTG
+TTATTGCTGCCGCCATCCAGCAAGTACTCCTGCACACCGTTTTGAAGATATCGAATACAT
+GCCCCTTTGTTAATGGGAAATACTTCAGCCCACGTTACATTAAGGAATTCACACAGTTTG
+TTTACTAGGCTCAATCCGGCATAGCAACAGGCGAGATTATTGACGATACGAGATGGAAAC
+TCATCAGATATCTCTGACTTTGCTTCCTCATACCACTTCTCTGCCTCAGCAACCGATACT
+CTGAGTGCTATATCCAGCAGGCTCCGACCGAAGCTGCCAAGCAGATCCGCTTTTGCACAC
+AGCTTATAAAATGCTTGTCTATGGCTGGCTGGTTTTAAGTCCTTCTTGCTGAATAGCAAT
+TCTATGCTCCGTTCTCTGATGGCCGCTTCATCCGGCGATTCCTCACCAGCTACAATAATA
+GGTGCCAACAGTTCATAAGTAACAGCACTTTGATCCGCCCTACCGCGGACACCTTCATGG
+CCGTCATATGCATCTCGAAGATGGTTGTATAAGGCATTTAGCCTTAACTTATCTATCTTT
+GAAGGCTTGAACTCATCCATCAACTGCGGTATAAGATTCGATGATGCAGATTCCTTCATC
+AGTGTAAATGCAGTAACCTGCGTAGACGCGCGGATTTTGCTGCACGAAAATACCGGCAGA
+ATAACCCGCTCCAATGTATTACTTTTTCCGCTGCCTTGTTCTCCGACAAGCAATAAATGA
+GGAAACTTGATGCCTGATTTTTTAAGATGCGGTTTAATGAAGCATCCGGCCACCCAGGCC
+ATTACTGATACCGTTTTTATGGGCTCGTTATAGCTGAGGAGCCATTCACCAAGCATAATA
+AGCTGTTTCTTTGTCAATGGCTCAAAGGTTAGGATATCGGTTGTTATGCTTTTATACTTA
+TCAAGCTGCACGATATCTTCAACAATGTTGCCTCCTGCTTCAATGGCACCATCCGTTGAA
+ACATATACCATCCGCCCGCCATGCTCATAAATCCCAAGAGCCTTGACCCCTGTTTTCCTT
+ACCCACTCCATTTCAGATATATAACCTTTCAGCAGTTCCAAATCTCCTTCTGAGCCAAAA
+TAGCCTAAGGATATTGTCCGGCGGTTCAAGATATTTTTAAATTTTTGGATGTTATTGAAG
+TCGGTAGTCATAAATGTCTGGCGGTATATTTCATCACGGATTGTAATAAGGTCAGCAGTC
+ATCTGCGTTTCATCTTCCGATACAATCATCTCCACCGGTTGAATGATAAAATTTGTTATA
+GGATACACACTTTCGCCTCTGGTGCGGTAATACCTGCCCTCATGTTCAAAGATAACTGAC
+TCGCTTTCGCGGCTGTATACATTCTCTGTGACTTCAATGGCCTTATCCAGTGTCTCCTGC
+CCATATGTTGCTCCACTTGCATGATGTACCGTATCCCACTTTTCCCGGAATAACCCGGAA
+TTTCTAAACAGCCTGTCCATCTGCTCTTTGTTTTTGCCTGACCAGAAAGCCAGCATACAG
+CAAAGAGCAAGGTCGGCTTCGGACTGGCTCGGATACCCTGCTTCCTGCCATTTTCCTTCC
+CATAGCAGTTCAAATTCCTTATGGTTTTCGGCTGTCTGGGCTTTCTCCAGAATTTCTTCA
+TCTGTAAGCGGCTCTAGCTTAAAATTCTTACGGTTTTTCTTGCTTTTCCCGCTCCGCTTC
+TTGCTTTTGATATAGTTCTCATGTATCCAGGCCAGTGCTCCGTTATCTTCGGCAATGCTA
+TCAGGAGTCCCGGGCAACGGGTCGCCGGTCATTGTGAAGTACCTGCTGTGGGCATACATT
+TCAACGCCGGTTTTAGTGTTTTTATTGCCCTTGGCAGGCATCTCCCCTTTATAGAAAATA
+TGAAGCCCAGTTCCTGAAGGGCTGATTTCCGTATAGGACGGAAACCGCTCAAGGATATCC
+TTGGCGGTATCGCTTAATTCCCCAGTGTTTTTGTCGCGGCAGTGATCTATGTCTATCCCT
+ACTAAACCTCCGCTTTTTGCGAATACAAAATCTAATCCGGTATAGAGGTATTGTTCTTTT
+GCCGCAATCGCATCGTCAAGGGTCGACCAGTCGTTTGGGTTAGTGCTTGAGGCTTTTCTG
+CCGGTTAAGGGATTGTAAGGGATTTTACTGTCTCTTCCGTCCTTTGTGTTTGGTTCCAGA
+CGCCAGCAGATCCATTGCTTCCGGTTTGCCAATTCTTTAGGGAATGAGATGCTCACTTAC
+ACTGCACCTCCTCGCATCGTTCATTAAAATACCGGATCGGAATGCTGCGCTGCTTTGCCT
+TTTCAATCTCAATGGACATCCCTTTAGTAATTTTTCTGCCAAATACCCACACTTCTGAGC
+ACTTTGACATCAATACCATGCCAAAGTACAAGCCCAGATTTCGCATTTGTTCATCATCGT
+CGTCCATAAACTGCGGAAACAAGAGGTGCGGAGCAATAGGTATGCAATTCCTGCTCACTG
+CAAAGCGGCAGTACCCCTGAGCCTTACGGATATTACGTTCTATATCACCAGCATATGGGC
+TGCAGATAAATACCATCGGTCTGTAGGGCGCTTTCCTGGCCTCTCGCTCAATCCTAAGCA
+GTGCTTCATAAGGTGTGGGGTCGTAATATCCTTCTGCGTTAAACTTGCTGATACTCATGG
+TATTACCCCCTGCCTATGCGCTTTTTTGTTCACGTTCGATTACAGGCAATATACCTTTCT
+TGTTTTTAAGAAGGTCATAGATAAATAGCCTTCCTTTTTGTGTCCAATATGTGTGCATTA
+CGCTTCTTTCTGCATCAATAGCATGAGTCTTGGACTGCGTGTATCCTTGATCGGCGTACT
+CCTGATATAAAAGCCAGCAGTTTCCCATTTTGTACTGTACTCCAAGCTCATGAAGCAGCT
+TATTGAAAGCGCGGCCAGACATTCCGTAATCCTTGGCAATCTTGCTGATCGGCACAAGGC
+TTTTATTTTGCAATATGAGATCATAATAGCTCGCTTTGGGCTTCAACTCACTGATAATCT
+GTTTATTCTTTGCATTTTCTATTTCTAAAGCTTTCCGCCTGTCGCGTTCTGCCTTTAGTT
+CAGAGAAAATCCTGATGCCATACTCCGGATTAGAAATCATCTCTTCGATAACTTTATCTG
+TAGCATAAACTCCATATTTTCTGATCGTGGGCAGCACTTCATCAAAGACCCATTTCTCAA
+AGCGTTCAGCTGCAGGAAGTTGGGATTTAACTATCAACCGGAACAAATCACCTTCGGGAA
+TATAATTTATGTTGATGGTTTTTTCAGGATTTTGCGGATGAGGTACCTCACGTTTTGTTA
+GGTACTTACAATGATCTATTACTGCCTTGTGTGGGTTACTGTATCCCAGCATCCTTGCAC
+AATCCGTTGCAGGAAAGTATTCCTTTCCATCAATAACGAGTACTTTAAGTTCTCCAAATT
+CTGTATTCTTAAAAACCTGTAAATTAGTCATAATATCAATCCTCCATTTCTTTCATTTCT
+CCAAAATTTCTTCCTACCGAAGCCTCTGCCACAATAGGTACATCAAATGCAGGGAAGGGT
+TGTGTTTCCATACACTCTTTTATAAAAACAACTGCTTCGTCCACCTTGTCTTCCGGTAAT
+TCAAAAACCAGCTCGTCATGTATCTGCAGCATAGGTTTCAGCCAAAGCCTTTCGGGAAGT
+CCACTGATGATGCGCCCACAGGCAAGCTTTAGAATATCTGCCGCTGTACCTTGAATAGGT
+GTATTTAATGCGCACCGCTCGGCAAACGACTTCTTGCCCCAATCTGATGACCGAATTCCC
+AGCAAGTATCTTCGCCTGCCCAGCCATGTTTCTGAATAGCAGCTTACAGCAGCCCGCTTT
+TTTACCTCATCCTGCCATTTGGCAAGACCGGGGTATCCGGATTTCAAGTTTTGAATGATG
+GTCTCACATTCAGCCAAAGTTGGGTTTATGCCAGCTTTAAATTTTAGTGTCCTCTGTAAG
+CCAGTGGGAAACAGGCCATAGAACACACCGAAATTGCAGTTCTTTGCGATGGTTCTTCGC
+TCTTTATAATGCGGAGCATTTTTGTCTGCTGCCTCCTCAAAAGGAATGCGGTAAATAACA
+GAAGTGGTCTGCGCATGGATGTCACCGCCTGTACGATAGGTTTCCAGCATACGTTTGTCC
+CTGCAATAAAACGCTCCGACGCGCAGTTCTATCTGTGAAAAGTCAAGGGATAAAAGAACC
+TTTCCGGCTGGCGCAATGATAAATTTTCGTACACCTATTGGGTCATTGTCTTTCTGCGGA
+CAATTCTGCATATTCGGGTTTCTTGAAGCAAACCGCCCTGTCTCTGTCCCCAGCGGCATA
+AGATCTGGATGAATCCTGCCGGTATCCTCATCAATAAATCGAAGATAACCGTCTATATAG
+GTGGATTTGAGTTTTCCCCATTTGCGGTACTCCTGTACCAGCTCAAATAAGCGAACTAGC
+TCGGGCCTGTTAGTTGCACACCATTCTTTTAACAGAATCATGGTTTCATCATCGGCAGCT
+TCCTGATGTTTTGCGGTTGTTTTCATAACCGGAAGGCCAAGATCCACAAAAAGATACTTC
+TTAAATGCTGAAGTTGAAGCATTTGCCCCAATCTCTACATTGCCGATAATTCCGGCAATC
+TCTTTTCTGATACTGACAATCTTTTCTGCAGCTTCCGCTTGTTTCTTCAGCATGGCTGAC
+TTATCCACCAATATGCCGTTATACTTCATTATCCCGACATATACTGATGTAGGCGATTCT
+ACCTCTTCCACAATCGTTCTGTGTTTGGGTAAAAATCTATCAAACCACTGATTGAAAACA
+TGATACAAGCGAAGAGTGTAGTCGCTGTCAGCACAAGCGTAGCGGACAGTCTTCTCATCC
+TGAGGGTTCAATTCATCGAAAAACCGACCTTCAGTAACCGTTGAGAATTCTGTCATTTCT
+GCTTTGCAGAGTGCAGGCGCAAGCGTTTTAAGTCCGCTGTCAGCAAGACTTCTGAACTCC
+CACTTGCTTTTTAATGTAAGCTGTGATGCTGCAATCGTGTCATAGCAAGGCTTTTGAAGG
+ACGATACCTCTTGCGTAAAGGAACATAGACTCAAAAGCCAGATTATGAGCAACTTTTATT
+ACATCTTTTGATTCGAATAGTAATTTCAGATAATCCCATATTGCCGCCTGGTTCTCTGCA
+TTTCGCCCGCTACGATGTTTAAGTGGAACATATATAGCAGTCCCTTCTGATACTGAAAAA
+CTGATCCCTGTAATATCTGCTTTATGAGCATCCAGAGCTGCACTTTTATCGTTCCTCCAT
+TTATCGCGGGGTGACGTTTCAAAGTCGAAAGCAAATAGGACAGTGTTTTTCAGATACTCT
+TTTATTTCAGACAGCATATAAACACATTTGTATCCCATGCGGTTCTCCTTTCCGCCCTAT
+CGGAGATGGAAGTTACTCTCCGATAGGGCCTTTGATCACTTAAGCGGCTCAGTAATTTCA
+CCTGATTCAGGGTCTACATTTATTACCTCTTCACCGGCAGGTTCAGTGTCATGGCCGACT
+CGGGTACTGAATGCTTTGACCTGCTCGGAAAGCTTGGATATCAACGCATATTCGTCAGCG
+GTCAGATCCCGATCTACAGCAAACTGGGCCTGTGAATAGGTGATACCGCTTGAATTGGTC
+GCCTTTTTCAATGAAAAGCGGGTAACTACGCTGTTCGACTTTTTACCTTTAGAAAGCAGC
+CTTTTGATGTAGCGGGAAAACTCTTTCAACGATCCTGTTGGCAATGAGAGTATCAACGGG
+AAAATCTCCCCTTCACGCAGTACATATATCCTGCGGCGGTTTTTGCAGGCTTTGCTGCCG
+TTTTCCCCCGAACCGAACTGATTATATGGGCATTTGGCACAGCTTCCTCCGGGGTCTCCT
+TCGCCGGTTATACCATCAAAGCTTCCGCAATCCGGTGGGTTACTGCCTCCGGTATACTTG
+TCCTTGTAGTATGCATAAAGTGGATGATGATAAAGGATTACCGCTGAGAATTCCTTGACA
+GTATCAGGTTCTCCGGGATTCTCACCAGGCACTTCAAATACTGTGCTGCCTGCGGACGGG
+ATTTTTATGCGTTCAAAAGTCATGTCAAGACCGTCAAGTTCTGATGCCATTGCCTCGTCA
+AGATTGAAATCAGCGAGCTGAAGAAAACCTGTATTTTCGTTAATAGTTACGAGTTCATTG
+TTTTTCATGCTTTTATACCTCCGTAATTATGAATTTGGAATGTAATCTATATCATTGTTC
+TTTGAAGCATTGTTCTTCGAACAGTTATTCCTTGAACATTGATATTGGAGCATTGCTTTC
+TGAAGCTATTTACCTTGCTGCTTTCCGCACAGTTACTGTTGTCTTTTCGAAGACATTCAC
+AAGGCCTTTCAGCCAGTCCGGAAGCTCGTCCCCATTCTCCGCAATCTGTTCTTTAACAAA
+TGCTGACAGGGAATTTGCATTTACTGTTTCATAGATGAGTTCTCCAAAGCCTTTACTGCG
+TAGTGCGTCAAACAGTTCCTCCTTCATGCCTGCGGCAGCACTGGCTCTTGTTGTCGTTGA
+AAGGCAGAACATTGTTCCTGCTCTTGTGAAGTTTTGCGTCTCACTGCTGATCATCAGCTC
+AGACAGACGGTATTCGACATCGTCAATCTCCGCATTTATGCTTTTCATTTCCTCTTCCGC
+GGCCTTTTTTGCATCGCGAAGCTCCTTAAGACGGTCAGCAAGTTCAAACATCGCATTATC
+GCTCATAGCTTTCACCTCCCTCTGGGGCAAAAGGATTTGCTCCTTTGCGGTAGTCGTCTA
+TCAGCATTTTTGCAAGATCTGCCTTATTGCGTAGGGCAGTCAGGATTTTTGAATCCACAG
+TACCCTTGGCAATAAGGTAGATATATGTGCAGCCATTCTTCTGTCCAACTCTATGGATGC
+GGGCCTTTGTCTGCTCGAAATTCGACATGGAATAATCAAGGGAGTAAAATACCATTGTGC
+TTGCAGCAGTCAGCGTAATACCGAGTCCAGCGGTTGCAATCTGGCCTACAAACACCATGC
+AGTCGGGATCATATTGAAACCGGTTTACTTGTTCTTGGCGATCCTTAGTCGCACCATAAA
+TACACGCATAGCCGATGTTCTTTTTCTCCAGCAACCTGCATATAGCATGAATTTCAGGGA
+TAAACCTTGCTATGACAACCAGCTTATGTCCTTCTTGAATACTGCTTTCAAGGATATCTT
+CAAGAGCTTTCAACTTGGCATCACTGACTTGCTCGATTTTCCCACCGTCATCGCTTCCGA
+TGAAGCCGCCGGTTAATTGCGAAAGACGAAGCAAGCGTGTCAGTATGTTTGTAGCTGTTA
+CTTCTCCTGCTGACAGCTCAGTATAGCTTTGTTTGACAAGCTCTTTATATTTCTTTAAAG
+TGACAGGCTCAAGCTCAATATGGCGAATAATATCGGTGGTTTCCGGCAAATCCAGACACT
+CCGCTTTGGTCGCCCGGAATGCAATGCTGTGAATCCTTTTCATCAAATCCTGTTCCATTG
+ATTTTTTCAGCACTGGCGTATGGTTGCCATAGCCAACCATATTGAAATACCGGTTTCTGA
+AGGCATAGAAGCTGTTACCAAAGATGCGTGGATCGAGAAACTTATATTGGCTGAATACAT
+CTATGGCTTTGTTGGTTATAACCGTTCCTGTCAGTAAGAGCCGATACCGGGCAAGCAAGC
+CTAACCGGTGCATTGCCTTTGAAACAGAAGTATTATGAGTTTTAATTTTGTGTCCTTCAT
+CAGCAATGATAAGGTCAGGATGCCAATTAGCCAGTTCCTTTTCCATTCTCCATGCAGATT
+CATAGTTGACTACCACCACATGGACACCTTCGCCAGTTAAAAATCTTAGCTGTTGGATTT
+TCTTTTGAATCGTGCCATTAAGGACTATAAGCTGATATGGGAAATCTGCGAACCGTTTAA
+ACTCGTCTTCCCACACTCCCAGAATGGAAAGTGGCGCAACAATCAGCACACGTTTTATTC
+TTCCTGCAGCAAGCAATGCTCCTATAATGGCGATTGAGACAAGAGTTTTCCCGGTACTTT
+TCAGCCCATTTCCATCAGGAGCGCTGCACCCCATCCGGAAATGGCAGAAACACCACCACC
+CTTCAAAAGCCCAAATAGACTGCAGATGAAATTGAAAGCACGAATCTGATGGTTGTATGG
+TCTGCCCTTTATGGGCATTGGAATTATTGACAGCGTTTTTGCATTGTTCATAGAGTCTTG
+CATCTTATATCCTCCATCCTTCAATTTTGAGGGTTGGCCAACTCTCTGACTCAATGCTAC
+CTAAAATGCAAAAGCATGTCTGGACATCTAAAGTCCATGTTTTGGGCAAAAAAATAGCCA
+TTATGCAGTAAGGTTTTTGCACCTTTTTTGCATAATGCCTTAAAATCTCATTATAATAGC
+CGGTTTAAAATATAAAAAGTTGGACTTCAGAAGTCCAACAATTTTTTTAACTTATCATTT
+CTTTATATGCCTTTGCACAAAGAGGGGAAAGTCCCAAGGCTTCCAAAACTTCATTGCATT
+CATATATTGAATGCCCTCTATACGAATGGATTAGCTTTTTATACGCCAATTGCTGTGGAG
+TGTTATTGAGAGTATATCCGGCAAGCCTTAATATTTCTTCACTGTATGTAGGGCTTAGCT
+CCAATCCGATGCAGATTGCAACAACGGTTTCTAAAGTTGGATTGTTAAGTTCATTGTTTT
+TTATTCTGTCATATGTTTTTCCTGAAAGCAAAGTCTTTTCTATAAAAACAACCTTATTGT
+AGCCTTTCCTTTTGATATGTCCGTATACCGCTTGGGAAAATGTCTGGGTTGTACGGCTCA
+AATGCTGACCTTCTTCGACGAATTCTTCGTGAAACTTCTTTAGCTCTTCTGAACGATTAA
+ATACTTCCATATTATGCTTGTCCGGATTAAATGTCGGCACTCTGTTATAATCCGGTGTAG
+CTTTACGGAACATTATAGAATCGAGGTATACTACAATGTCCATTTTTGAGGCTTTATTTA
+ATTTTAAATCAAACAGAAGGCAGCATTCATCTACATGCAGTTTTGCATAGTCTGTAAGAT
+CAATGCTTCCATTTTCTAACTTTTTAATGTATTTGGAGTCGTTAATAACGTAATGACCAT
+CAACATAAATAAAATTACCGCTGTCTATAATCTTTGCGAATTCCGGATTTGCATAGTATT
+CAAAAAAAGAATCACTTAGGCTAATACTGTATGTTTGATTCTTATGTAATGAGTCTGCCT
+TAAATGAATAATTGCTGATAAAATGGTCATCTACGTAGGTATATACACCTTCAACTTCCT
+TATATCCAAGGTCAAGCATCCTTATTTTGGCCGCTATCCTTGACACCTGGAAGAAGTCAG
+CTAATTCATACACGACATTTTCCATTATATTTAGCCTGTCGTAAGTACCAAAAAGGAGCT
+CATTCTTTTTAATTAGCTCCTCAATCTTTTTAATGGTCATTGATCTAGGCATAAGGATTC
+GTGGTGCAATTCCGTTAGCATGCCATTCCATCCAGTCTTCTGGCGTCCATTGCTGTTTGT
+ATTTAGTTGTTTCGTTTACCCTGCAGCTTATGAGCAAAGCATCGCTGTTATACGTCTTAA
+CTAACTCATGGTATTTTCTATGCTTATACCAGTGGACACACTCATGAATAATGGTATTGT
+TCATGCACCCTATGTTTCGCATGAAATACACATTAGGATCCACGAGAATTGTTCCTCTTG
+AAACTTCCAAAGGCTTATATGTTCTTTCATTTCTGTCGTAATACTCTATTGTGCAATCGC
+CAAAGACTATTTGACCAAATATAGTGAAATGCTTTGTAAGCTGGATTTCCTTAACCTTAA
+GCCCCATTCTTTTCACTACTTCATCTACTGGAATGGGCATAGGAGTACTTAATGCTTCTG
+GGCAAAACTCATTTAGAAATTCAGTAGCAACATTGTCAAACTGTTCCTTTTCTATAATTG
+GTACTAAATACTCAGACAGTCTGCCTAATTTGCTTTCTCTGTACTTGTTGTATATTGAAA
+CAGAGTTGATTTGAAAATTCTGAATTCCGTCATCAAGGTCAGCTCTGCAGGAGATACGGA
+ACCATTGTTCTATACCATCAGTCTCGCGATTCCTTCGTACTGTTTCTGCAATTTCAATTT
+CGGCAGAAACAATTACGTCAAATAAAATACTGTTACCTGGCGAGTCGGTTATATCTATCG
+TTATGATGTCAAAATCAGATAATGCTGCTTCATCCGGTGATTGCACATGGTATGAGTTGG
+ATTCAAGCTTATCCGGGTTGTCCTCTATATATTCAGACAATTCGTCAAAGAGATCATTGT
+AATACATATTTGCAATAACATCTCTGAACGAGCTGACGCTTGCCATACCGTACCTCCCTG
+ATTACCATCATTTCAGACCAAATATTTCCTTATGTAAATTATAGCATGAATTTCGCAAAA
+CACAATAATTAATTTGCGGGCTCAAATTTTTATTGTGTTTCAGCTTACTTTATGATATTC
+TTTATAGCGAGCGAGGTGACAATTATGGCCGTAAGCTATAAAAAACTATGGAAACTCTTA
+ATTGATAAAGATATGAAAAAGAAAGATTTAAGAGAAGCGGCTGGTATTAGTACATCTTCT
+ATGGCAAAACTGGGTAAAAACGAAAATGTTACGACCGATGTGCTTGTGAAGATTTGTAAG
+GCATTAAACTGCGATATTTCAGATATTATGGAGATTGAGCCAGATGAATAGGTATCAACA
+GCTTTTACTTAATAGTTAAGCAACAATGACGCTAATTGAATTATTATGAAAAAACTTAAA
+TTAATAAAATTTTAAAAGTGAGGTTATAAAGATGTATAATCAATTTTTTAATACTGTTCT
+TGAAGTACTAAAATAAAGATGATAAAATGTATTCTGATTACTAAGAAGGTAAGTAATTAT
+ATATAGATTTCTTTGCTTACTAAATTGGAAAGAGATTACAGCCCAGAGGTTGTATATAAT
+GCTCCCCATTGTCAAGACAGTTTTTTAGCTTTTCTAAGTTAGTTCTCCTTTCTTAATTTT
+GTATAATCTTTACAACTGTGCACTCTGTTGGAGGATGTCAAGGGCGAGCGTAAGCGAGTT
+CATCTTGACCCTTGACATCCTTTGGACATATATCCTTTTGCTTTCCGGTCTGTTATGACA
+GACCGGCTGCCTTCCGGTGAGGACGGGGTTTGGGGCGGAGCCCCATAATTCTATACAACT
+GCCAGTAGCTGGTCATATCCTCCAAAGTAATACTCTGCCGGTGTTTTGTAATCCAATGAC
+TGGTGCGGTCTCCTATGGTTATAGTGCTCCACATATTCCTTTGTGATTTGTCTAAGTTGT
+TGTACCGTTTCGCACTCTTCAAGATAAAGTTTCTCCCACTTGTAGGAACGGAAAAATCGT
+TCTATCCTTTGGTTGTCTAATGCTCTTCCTTTTCCATCCATAGATATTTTGATACCGTTA
+TTTTTTAATAGATTTATGTAATCATCACTGGTAAACTGTGAGCCTTGATCACTGTTCATG
+ATTTCAGGCTTGCCATATCGCTTTATGGCCTTTTGGATTGCTTCTATGACGAATGTCTTA
+TCAAGAGTGTTTGATAGTTCAAACCCAACAATATACCGAGAATACCAGTCTATTATTGCA
+ACCATATACATGAAACCGCGTTTCATTCGGCAATAGGTCACATCTATGGACCATACCTGA
+TTAGGATGATCAATTTTCAAGTTTCTCAACAGATATGGATACAAATTCTTACCATGTATT
+CGTTTGCTGAGGTTGGGGCCAGGACAGAATCCATGTATGCCCATTTCCCTCATATAACGC
+CGGGTCCGTTTTCGATTGATATGAATGTGATAATCCTTGTTCAATATACTTGTCATCCTG
+CGATAGCCATATTCCGGATAAGACGCGTAAATTTCATCAATGATACGCTTAATCAGGTAT
+TCCTCCTCATTTACCGGAGCAGGCTTGTAGTAAACGCTCGTACGGTTTAAGCTCAATAAT
+TCTGCTTGCCTTGTTATGCTGAGTTTCTTCTCATTTCTATCAATCATTTTCATGCGGTCT
+TCTCGGGATTTAGAGGAGGCCAGATTTTTTTTTAAGCCAGGCAACCTCATATGATAGTTG
+ACCAATTTGCTTAAGCAGTTCGTCCTTCTCCTTTTCAT
+>NC_009012.1|provirus_2022140_2067593
+TTAAATTGCAACTTCAATCTCCGTGCTATCAAGCAAACTCACTATTATCTTTTTTCCATC
+AAATACTGTCATTTTCTCTATTATTCTAAAATACATATCAACATCAAACTCCTCTACTAT
+CTTTGCATCCTTTAAAATTTCAATAAACTGCCTTGCCTTATATCTTTTAAGCAAGTTATC
+ACTTTTAAGTCCTTCCTTCCACTTCTCCATAAAGTATTCCTTATTCTCCACCATAGCATT
+AAATGTATTTACAAAGGCATGATATAAAACCTTGTCATCTATATGCTTATTCTCACAGCT
+CTTTTTTCCCTTTACTTCATATTTTTTATTACATCTCCAAACCACTCTTCTTAGCCTTTC
+ATCAGTAGAATTCCATACCTTTCTTCCAAAGGCACTGCCGCAGTGTCCGCAGATAACTCT
+TCCTGCAAAGGGATTATCTACTGTGGCATAATCAAGCTTACTGATGTTATATTTTTCAGC
+AAAAGCTCTTCTTCTCTCCATCTCTAGCTGTACCGCTTCCCAAATTTCTTTATCTATAAT
+TGCAGGATGGCTTTCTTCTACATAATACATTGGAACTTCGCCATTGTTTACTGCTCTTTT
+TTTGGTTAGAAAATCAACAGTATATGTCTTTTGGAGAAGTGCATCTCCTTTATATTTTTC
+ATTACTTAAAATCTTTCTTATACTGCTTTCATACCACTTAGGTTTTCCATTCCAGTTAGG
+AACACCTTCTTCTTCAAGTTCCCTTGCAATTCTGTTTGCACCTTTACCGTCAAGGTAATC
+CTTATATATTCTTCTTACAATTTTAGCCTGCTTTTCATTTATCACAAGATTTCCTTCTTC
+ATCTTTATCATAGCCTAAAAACTTTGTATGATTTATATGAAGCTTTCCCTGTTCAAACCT
+TCTCCTTATGCCCCATGTAGAATTTTCACTTATACTTCTTGATTCATCTTGGGCAAGGGA
+GCTGAGGATTGTAAGCAGTACTTCTCCCTTTGAATCTAAAGTATTAATATTTTCCTTTTC
+AAATATTACTCCAATACCTAATTCTTTAAGCTGTCTTACGTAGTTTAATGTATCAAGTGT
+ATTTCTTGCAAACCTTGATATAGACTTGGTTATTATCATATCTATTTTCCCTGCTTTGCA
+GTCTTCTATCATTTTATTGAACTGTTCTCTCTTTTTAGTGTTTGTCCCTGAAATCCCCTC
+ATCTGCGTAAATTCCTCCGAATTCATAATCTGGATGATTTGTTATATAAGATGTATAATA
+AGCTACCTGTGCTTCATAGCTTGATAACTGTTCTAATTGGTCTGTTGATACTCTGCAATA
+AGCTCCCATTCTCTTTTTCTGCGTCTGTATTTGCTCTGCCAGATTGTTTCTGTTTGCTCT
+TGCAGGTATAAGTGTAATATTTCTTGCCATCCTTAACTTCCTCCCTTACAATTATTGGTT
+CTTCTATATTAAGCCTGCTTATAACCTCATCATCAATTGATGTTCCACTGCAGGCGTCTT
+TTCCGTTTTTAATATAATTACTGCACTGCCATACAATCTTTCTGCAATTTAATTTGCTGT
+TCCAAGTTCTTCTCCTTAGAGTAGAGCCGCATTTACTGCAGAAAAGCATTCCTGTTAATG
+GATATCTGTTTGTATATTTTTTTGTATCTCCTGCTTTATTTCCTTTTGCCTTTGCTCTTC
+TTGCAATTTCTATCTGAACCTGCTCCCACATTTCTCTTGAAACTATGGGAGAGTGATTAT
+CTTCAATATAATAGCTGTCAATTACGCCTTCATTTCTAACACTTACTTTTCTCAGATGGT
+CTGGTGTGTAATACTTTTGAAGTATGGCATCTCCCTTGTATTTTTCATTCTTGAGGATAT
+TTAAAATTGTACTTTCCTGCCATCTGCCGCCTGCAACAGTAGGCACTTTATCTTCATTTA
+ATTCTTTGGCTATGGTAAATGTTCCTTTGCCTTTTAAATAATCTTCAAATATTCTTTTAA
+CTATTTCTGCTTCTTTTGGGTTTATAACTAAATCGCCGTATTCATCCTTGTCATAACCTA
+AAAATCTTGTGGTATTTATAATCAGCTCTCCTCGTTCAAACTTCTTTTTTACCCTCCACT
+TTAAGTTATCACTGATATTTTTACTTTCTTCCTGGGCAAAAGAAGAGAGGACGGTTAGCA
+TAAGCTCTCCATCCCCTGATAAAGTTCTGATATTCTCTTTTTCAAATATTATTTCTACAC
+CAATGTCCTTTAGTTCTCTTACTACTTGAAGCATTATTGCTGTATTCCTTGCAAATCTTG
+AGATAGATTTGGTGATGATTAAGTCTATTTTCCCTTCTTTTGCAAGATTAAGCATTCTTT
+GAAACTCTGGTCTATTATCTGTAGTGCCGGTAATTCCTCTATCAGCAAATACACCTGCAT
+ATTCGTAATCAGGATTATTTGAAATCAGATTTTCATAATACTGGATTTGATTTTCTAAAG
+ATTCACCTTGAGCATCACTGCCGGTTGAAACTCTTGCATAAGCACAAACTCTTTTCTTTT
+TATTTTCCTTCTTTTTTACAGGTTCAATAATCCTAACACGCATTCTATATCCTTCCTTCT
+ATCAATTTGGTACTACTATACATCACTCTAAAGGTGATAGAAGTCAAGCTAAACAAAAGA
+AAAGCCGCTACTTTAATTAACGGCTACTTATTAAATATCATAATTACAGCATCAAACCCT
+GCTGCCCTAAGCCTTTGCACCTGCTTTTCAGCATTTTCTCTTGACTTATATGAACCTGCC
+ATAACCCTGTAAAGAGTCTGCTCGTTTTCTACTTGAGCTTTTGCTGAAGGTTCAATATAA
+CCAATACCTAATTGTGCAAGAACTGCTTTAGTTATAGCCTTAACTATTTCATTTCTCTTT
+GAATCAAATAAAATATTATCTCCTGTGTTATCAATAAAACCTATCTCTATTAACACTGCT
+GGAGCCTTGGTTTCTCTTAATACATGATAGTTAGCTTCCTTAACTCCTCTATCTGTAAAT
+CCTAATGCTGCAAGTGATGTTTGTATCCTTTGTGCTAATGCTTTTGATTTTGCTCCTCCA
+TTTAAATATGTGTATGTTTCAACACCTTTTGCCTTTTCTGGATCATAAGCATTCCTATGA
+AAAGAAATGAAGTAATCATAGTTATTCCTATTTTCAAAAGCACTTCTCTCATTAAGGCTT
+ACTGTGGCATCTGAAGTTCTTGTTTCATCAACTGTAACTCCATGCCTTCTTACCTCTGCT
+GCTACAGCTCTGCCTATGCTTAGAACATCATTGCTTTCCTTTCTTCCCTTATATACTGCC
+CCTGAATCTTGGCCACCGTTAATGGCCAGGATCAATCATTATAATCCTTGGCATTTAAAC
+CACCCCCTCAATAAAACGACCCAAGGAATCTCTTCTCCTTGGGTGTAAAATATTGTTATG
+GCATCTAGCACATACAACTTGTAGATTATTTAAATTGTTATTATTTCTATTCTTATCTTT
+ATGATGAATGTGCAGACGTGTACCTTCTTCTTCTTTCCCACAAACTTCACATCTTTTAGG
+CTTATTTGCAAGTGCTATCCTACGCCAGACATCACCTGAGATGAAACTGCGTCCATCTAT
+ATAACTAGGTGCTAAAGAACCTTTCTTTCCATACATAGGATTATTTTTTCCTGATACATC
+TGCATGATTAACACTTATTTTTAATCTAACTTCTGATTGCCAAGCTGGATTATCTATTTT
+ATTTCTATATGACATCCTACACGACTTTGAACAAAATTTACCTCCATTATTTCGTATTTG
+GGACTTATATACATAGAACTCATCATCACACCATTGACAATATCTTTTTATCTTAGTCAA
+CCTTATCATCCTCCTTATTTAGCTGTTTTAAAACATCCTTTAGTTTCTCTGGTATTGGTA
+AGCCTATCTTAGCAGAGTTCTCTATAATGCTTATTCCTTCATTGGAAATGTAGAAAAAAA
+TAACAGCAGTACGAATCGCACTACCGTTTTTAATCAAATGAACATCTACTATATTTCCTA
+TGCCCACCATTACAAAAATTAAAACTTTCTTAAATATCCCTCTGAATCCTACCTCACTTG
+ACAGCTTTCTTTCCAGCACTGCTACCATGAGACCTGTTACATAATCAATTACAACAAAGG
+TAATCAGTGCATACATAAAGCCATCAACCCCTCCTAAAAGCCAGCCAATATAGCCGCCAA
+TGGCAGCAAATACTGCTTGAATAAAATTAATTGAATTTTTCACTGTAAATCCCTCCACTC
+TAATAAAAATCTTCTCCATAGTTAATTAAATCTACTTCAAACATATACTGAACTTTCATT
+GTATTTGCTTCAGTTTTTTCAACAGGCTGTGCAAGCTTGGTATGTGCTCCAATAGGTCTG
+CTTGTTAAAAGGGCTTGGATACATAATTGAACATAGTTGTTATAAGCATAAGTGTATCTG
+CTTATCCATCTGTCAGTACCAAGGATATTATGATAATAATAATTACCATAACCATTTGGA
+AAACTAAAATACATTTTATAGGCTTCCAGTAAATTCCCTTGAGGAGTTATAACTTGATAA
+AAGCTTGTACCCCCTTGAGTGCTTGTGTAATATAAATAAATTCTATTGGCACTTCTATAA
+AAATTATAAACATAGCATCTTCTCTCAATATTTCCACTATCCATACCCTTATTTCCAAAC
+CAAGTGCTATTACCAATCTTAGGTTTAATATTCATATCCTGAACCTTGTTTCCTGCGGCA
+TCTACTCTAATCCATCTGTTTGTATAAACAGTTTCATTAAATTGGCTGTCTGTTCTTGAG
+GTGTATCCAATAATATCAATGCAACCATCAAGATAAATTCCATCACTAGAAACTGTTCTA
+TATGTGAAAGGTACGTTATATGCTGTATCCTTAAAACTTTGGCTCATATTTATATCAACA
+TAGCTTAATTGAACTCCTACCTTTGTCCACTTATATATTCTCATATATCTTTCACTATTT
+ATGCTGTAAAGGTAATACCCAATAAAAATAAGCTCTCCATCTGGTTGAATATACGGGCAT
+ACATGACTAAGTCCATCGTATTTTCTTACTGCATGACTACTGTCAATATTTAAGGCATTT
+CCATCTGAATTTAAAAGTTTAACCACCTTATCCCAAAACACAACATCATTTGTATTTATA
+TCAAATGGAATCATAAGCCATTGTCCTTTTAAGCTGTCTGGAAATTGAATATAGCTTGAC
+TGTGTTATGTTTGTATCCCTTGAATCTGCTAATATCCATCCCTTTGTTGGACTTGTAAAT
+TTTATAGTTCTTGCATAAGAAAATAAAGTATTCACTGCCCAATACCTTTTAGGATTTGTA
+GTATTATATACAGCATAATCTGAATCTGCTGTTTCCCTTCCATAGATTGCGGTTCCCGCA
+TAAAAATAATCCTTATTATCAGGGTCACCCTCTGCCCAGTAAATACTTTCAATTTTACCG
+TTTGCCGCATGGGTTGGAAAGTCAAATACAAAATTCATCTTTATTTTAGAATCTGTAACT
+TCAAATTTTGATTCTGCTCTATTTATAGTTCCACGCCTTGTATCATTTCCAGAGTAAGTA
+TTATTTCTATGGGCAAACCCTATAATATTTCCCATAACCCTTTGCTCATTAACATTTTCC
+GGCTTATCATTATCAGTTAAGTATAAGTATTCAAACCAGCTGTAATTATCACATCTTCTT
+GTATTTCCTGCACCCATAATACCTTGAACAAAATGTCCTAAAAATGTATCTTTAAAATAT
+AAATCCGGTATTAAGTTTTCTGTGTATGCCTCTCTTATTTTCTCCTTAGTTTCTGCATTA
+AAAAGTTCTAATAAAACCTTTCCTTTAATGCCCCTCTGTCTTTTACTCTTTTTACTTTCA
+GAAATCTCACCTGTAAGCAAATCTTTATTGTAAGCAATACTTTCGTAAGGCTGTCCCTCA
+ATAAACATATCATCACCCCTCAGTTGTAAAGAATTTTCATCTTCCTTAATTTACACACAT
+CATTTAATGTAGGTTTTTCTAAAATATAAGCAAACCTCAGTTTCCTATTTTGAGCAATCA
+TTGTATTTAAAGCTGCATAATCTAAACTTGTAAGTATTGTAGGATTTATCCCATTTACAA
+GAAATGCAGCAGAATCTATAATATCAATACTTTCAAAGCTTGATGTATTGATATTATAGG
+TAAGCCAGCTTAATCCCGAATCAACACTTAAAGCTATTCTAATTCTGCCATTGGTTGTAA
+CATCATTTAAATTTGAATCTTTCTTAGTGTACTGAACAATTGCTTCAAGTTTATTTATGC
+TTTTCCCATCATGTATGTTAAAATCATAGTTTTGAATAATTACCTTTGGCTTACTTGTTA
+CTGTCTTTTCAATAAAGAATCTATTGCTATTTTTATTTGCCTTAACATCTGGATTATCAG
+TATAGATATAAAGAGCAGGTGAAGTGCCTGAAAGTCCTGCCATGGAAGCAGGAAGAGTAT
+CAACGCCGTAGGTTTTAAACATTTCTTCTGTAAGAGGTAAATCTCCAATTTTAACCCATG
+TACTACCTTGATAGTTTTTCACTCCTTCATTATCCACCATAAGAAATTTTGTTATACATG
+GAATATATGAACCTTCCTGCACTATGTAATTTTTACCCAGTGGGTCTGATGGAGTGAAAA
+TATATGATTTTCCCGCTGTTAATGCCAATGATTGAGTGCCTACATTTGGATTTACAAAAC
+TATTTGTGCCGTTATTAGGTATCTTCTCAACAACAAGCCTTATTACTCCAGTTTCAAAAA
+TAGAAAGTTCCCAAATAAGGTCATTGCTGCCCCAGTTGCTATAGGAACTGTTTCCTTCAA
+ACCTTATTCTGAAAAGCTTTGTGCTGTATTCTACTTCACTGGCATAATAAAGGTTATTAT
+AGCTGGCATCTCTTCTGTTAATACAAAGATGTTCTGATGCTCCCCCAAAGCCTACCCAGG
+TATTACCGCTTGTGTAAAGCTGTCTTATGGCTAAACCATTGTAATTAAAGTTAAAACCAA
+TGTCAGGAAGAGTTACTGTACTATCATCATTTCTTGTACCATAAAGTGTCATTCCTGCAT
+TTCCTTTTGGAAGGGACATTTGATTTATAACTGGCATTATCCTCTCCCCCTAACCTTGCT
+TAAGATATGCATTTATTGCAATCAAATCCTTATAAAGTGTTGTATCCCGCACATTTGCAG
+CATAAATTACGCCATTTCCTAAGTCCTCAATATATCCGCCTTCTCTTTTTAAAATGGGCT
+CCTTTATTGTTACCCTATTATAAAAGTCATAGGTTCCATCTTTGTTTTTATCGTAGTCAG
+AACTAAACTCAACCCAATCGGCGTCAAAAGCATAGCTGCTTGATTTACTGTTATTAAACT
+CTTCTATAATTCCCATTACATTTAAGGTTAACTTTGGGTTTCCATGAGATATAGCAGCAA
+TATTAAATCTTGTATTGAAATTCTCAAGACTATAGCTATCTACTCCACTCACATTGTTGT
+CTAAATAATACTTAAAACTGTGTCCTGTATTAAAACTGTATGTTCCAATCTTGATATTGA
+ACAAATTATAAAGGAAAGTATAAACAATCTCTGCCCTTGGTATACTTGCACTTAGTCCAC
+CCTCTAAGTCTCTTCCCTCAATACTTACCTGCAGATTATTCTTTTCAATTGTAAATGTTC
+CATTTGAAACCTTCATCTCTACCATAAAAGTATGGTCTCCTGCCGTTACCTGTGGCATTG
+GAAGGGGCAATCCTATAACATTATCTCCTGATGCTAACTTTTGAATTGGCTTAAAATCGT
+AGTATTTTCCATCTAAGGAAAACAGAATTGTTAATGTGCAGTCTGCACTAGCTTTCCCTG
+TCATGGTGATATTACAATTTAAGTTTGTATCTGCTTTTGTTGTTATTCCTATAATCATTG
+CTGGATAGCTGCTAGTGCTGATTGTTATAGTATCGCTGTTTTTCTTGATTATTACACTGC
+TTAAAGTACCGCTTATTGCACTGTTTATTTCCTCTAAAAGCTTACTGGTATCCAGCTTTT
+CAATAATTGTGTTTAAAGGATCACCAAGCTCTATCTTTGTATTTATAGGATTTATAAGGT
+CTGTCTTTTTCTTTATAACTCTTAAATCAGTAGTTACAGCTATCTTTTCATTTCTTACCT
+TTACAAAATCACCAACACTTACTTTAGTAAGATGACTATAATTTTTATACTCTTCTGTCT
+TACTTAGCTCCATAAAATCTATTGTTATAAATACCTTTGGACTTGCAGCCTTTTCAGCAT
+ATTCTTCTGCCCTTGCTCTAAGGCTTTCTACATCCTTGCATTCCTTAAACTCAACCCTTT
+TGGTTATGGGATAGGGAAGTAATTTTGCTCTTTCTCCCTCTACTTCTATATATCTTTCTG
+GCAACAATAAATTATTTGCTCCTACTGCATATATCCTTGTAGCAAGTTCACTGGTATCCT
+CAATAACCTTCATTCCATTTATGTTTTTACCGTATTTTATTAAAATTCCATTGTTTTCAC
+CAATGGACTCTTTTATCTCTATATTAAAGTTATCTCTAAAAAGTTCTCCACCATAAATTT
+CAATAAGTCTAAAAATAGCATCTACTGCATTAACCTCTTTAACAGCAAAAGGTGCTAAAT
+TCTCTTCTAATGCCTTGAATAAAAACAACCCTTGAAGTTCGGGCGGTATGCTTGCTTCAA
+GAGCTTCTTTCATATTTGCATTAAGCACCTTTGCTGATTCTATAAAATAAAAGGCAAGAT
+CATAGAATATATGTCTTGCCCATACCTTAACTTTACTTATTTTATCCTGTGTTCTCTCTA
+CTTTATATATTCTAAAAAGCTGTCCATCAGCTTTAATAATATTGAGTTCCTCTAAATACT
+GTGCTTTTTTAGATTGAGCAGGGTATTCAATTTCTAAACTATAATCTCCATTTAACTCTT
+CATTTATCTCAGCCATAAGGCATTCATCTAAAACAGCAAGCCCATTATTGTCAAAGTTTC
+CTCTAGTTGTCTTCTTATCATATACATAGATCATTATAACCACCGCCAATTTGGAACAAT
+TTCTATTTTTGAAACACTACCTGTCCAATCAAATTTATTAGAACCTGTTTTTAATGTTAT
+GAAATCACCATTTACTTTACTGTTTAAGTTATCTCCTGCATCATTATAGGCATCTTGAAT
+GACTGAATCTAATATGATTTTTCCTGTTATATCATTCAAGTTTACAGTAGTTTCATTAAC
+CTTAAGGCTTACCTTCCCAGAACCATAAACTGATATTATAGGTTCACTTTTAAGTGTTCC
+TGGATTTATTATTGAAGCTCCATTTTCAGTAATAGTAAATATGTTATTCTGCACAGCGTA
+TTTAAAGGGTCTGCAATTAAATATAATTGGAAAAACAGATGTGTATTTGAATACTTGTTT
+AAAATCTATAGCATTAACTACTTGTGCTTTATATTTTTTATCATCTTGAAAACTAAATAT
+TAAATCACTTTCTCCTGCTGAAAAAAGCCATGCCTTTATATTATCTAGCTTTTCAGCTAT
+GTTATTACCTTTAATACTGCATTCAACTGCAATTGTTATATCTTCATAAGTTCCTTCATC
+ATATCTTAAGCTTGAGTCTCGCCCTGGAATATCAATATATGATACTCTTCTTTTAGGAGA
+TGGCAGAGATGGTCTTTTAGAAATAATAATGCCATAATCACTATAACTATTTTTTCCACC
+AAAATTGAAACTAAGCATTAAGCACCACCCCTTCCCATTGAAACTCTCTGCCTGTAAAAT
+TCAAGCTCATAGGCAAGCTGCTCTATATCCTTATCTGAATTATTAATGAAATTTTCTATA
+TGAAGTGTTAATCCGCTTCCACTTCCTCCTTTTGCTTTTTCAATTGCCCTTGCCATAAGC
+TCATCTAACCTATCTATAGGAAGTACAGCTTCAGTTCCTGCTTCACCGACACCGATTATA
+CTAGGTCTATTAAATATACCACCCTTCGCATACCAATCTACACCTAGGTAAGGTACACTT
+GGAGGTTTCAAACTAAACTCTCCCTCAATACTAAAATGAGGAAGTTTTATTTTAGGTATT
+TTTATTTCTGGTAAATGTAGATTGCTGAAAAATCCTTTAATTGCATTTATAGCATTACCT
+ACAGCATTCTTTGCTGCATTTATTGGATTTTCAATAGCTGATTTTATCTCATTCCAAACT
+GCTGAAGTTATTCCTTTAATGCCATTCCATATTCCTAAGATTATGCCTTTGATAAATTCA
+AATTCTGTTTTTATAGTTCCTTTAACTAAATCAATGGCTGATTTTATCACATTCTTTATT
+CCATTCCATAAGTCAGAGGTAAGATTTTTTATTCCTTCCCATACACCCTTCCAATCACCT
+TTTATTGCACTGGTAACTATTTTTATAACATCTTGAATGGCTTTAAGTGTGGTATTTACA
+ATAGTTGCTACTAAATTAAAAGCAGTTGTTATTATCTTTACAAAATCATCACCATACTTT
+TTCCATATTTGATTTGCTAAGGTAATAAAGGCTTGAAACATAGCCTTTAAGCTTTCAATG
+ACACCACTTATTAAAGCTTTAACTCCATTCCATACTGTATTTACTGAATTCCTAAAGTCC
+TCATTATTTTTGTATAAGGCTACAAAAATAGCAATAAGACCTGTAATAGCCGCTACTGCA
+ATGCCAACTGGACCAGTTATTGCTGCAAAAGCAGCTCCTAAGGCTCCAGATGCACCACCT
+GCTGCTGCCATTGCTCCACTCACTGTTCCAATTACAGTAGAAAGAGTTCCTGCAATACTT
+ATTACCTTACCTATAATCATGATTACTGGACCTATTGCTGCAACTACTAATCCGATTTTA
+ATAATTGTTTCTTGCTGTTCCTTTGATAGCCCTTGGAACTTATCTAAAAGAGGTTTTATA
+GTGTTCATTAGTTTTTCAAGTATAGGAATTAAAAGTTGTCCAAACTGAATGCCAAGCTGC
+TGTGTTTGCTCTTTCATAACTCTAAGCTTATTGGTTGGTGAATCCATAGTTCTTGCAAGG
+TCACCTTGAGCATTTTTTGTAGCTTCCATTATAGCACCATACCTTGCTTGAACCTTTTGT
+GCTTCAGTAAGCTGTTCACCCTGCTTTGCAATTCCATGAGAATAAGCATAGGTTTTAATT
+GTATTATCATTAACTAATATACCTAAAGCTTTAAGTGGTTCTGCCTCTCCACTAATACCA
+GATTTTAATTTCTCAAATGCCTCTTCTGGTTTTAAGTTATAGAAAGAAGCCATATCATAG
+GAAAGCTGAGTTAATCCTTCTGACATCTTTAATGACTCTTGTGAAGTTAACCCCATAGAG
+GTAAGCATGGCATTATAAGTTGCTACATTTTTTCTTACATTGAAAGCATTGAGTCCTAGA
+GCTTTTGAGGTTTCTTCTGACCACTTTCTTGCATCGCCTGCCATTGAACCCATAGCTACT
+TCAAAGAGATTTTCAGATTCCACTGCATCCATAGCCATTTTTGTTGCAGCAGTTCCTATT
+CCAACTAAAGGAAGTGTTACAGCAGTAGAAAGCTTACTTCCTATAGAAGACATCTTATCT
+CCTACAGATTTCATCTTTTCTCCTGCACTATTCATGCTTTCAGACAGCTTATACCAAGCC
+GAGCTTTTTTCCTTAAGTTCTCTTGTTGCCTCTTTCAGCTCATTCTCCATTTTATTTAGT
+TCTGCTGTAGCATAATTAAGCTTAATTTTAAGATTTTCAGTAGCCTTTGCATCTTCACCC
+TTTGTTTCTACACTCTTTTGATATGCTTTTTCTAATGCCGCAACTTTATCCTTCTGAAGT
+TCTATCTGTTTATTTAAGGTATCTGATTTAAGTCTTAGTCCTTCTTCAGATTTGCCAAAA
+TCACCAAGCTTAGAAGAAGCTGCTGCAAATTCACTTTGAACAACCTTTAGACTTCTTTGA
+ATTTTTGCTACACCTTCTTGAAAACCTCTATCATCAAGTCCTACCCTTGCAACTACGGTA
+TTTGCATCTCTTGCCATCATCTCACCTCCCTGCTAGAAAATAATGTTATCTATATAATCA
+AGCTCCTCTTCTTCCTCAATTCCATTTACTCTCTTGTATACATTAAAAAGCGCTTGTAAC
+TTCTTAGGTGTACTGTGCCAAAATTGCTCCTCTGTCATTTTTAAAAGGTTTGTTCCTAAA
+TAGAAAAGCCACTCCCAATCCCAACCTTCGGAATCAGTGTGGCTTTCTATTCCCCCATGT
+TTTCAGTTACTTCTGGCATTGCTATTACCAATGCTTCATTAATTGCAGTGCCTAATTTCT
+CCATATCACTTAAAGTTAACATTTTTCCTACTTCTTTTAAGGTTACACTTTCATCTGCAG
+CCTTAATTGCTGAATAAATAAGTGCTCTTATTGCCTTTAGTTTTCTATTCTGTAAATCTT
+CAAAAGCTTCATTGATATCTCCATAGATCTCTTCTAATTCACAGAATGTATTCATATCAA
+ATTTAAGTTCATACTCTTTGTTTCCTATAGTAATTTTAATACCTTTATTTTTCAGTTCTG
+ATGCTTTCATATAATCAGCTCCTTTCTGGATTTTGGGTATAAAAAAACAGGGATGCTTAT
+TTCCCTGCTAATTAAAAATACTTTAATGTTGATACATTAGTATAAATATTGTTCTTAACT
+ATGTATCAAAATAATTACTTAAGCTTTTGTATCTCTATAACTAAAATAAGGACCGCACCA
+CCCAGTTTCGTGTGTTTTTACATAAGTCCAGTTAAATTCTTTGTCTACAACATAAACATC
+AAATTCATTCAACAAATCATTTGCATTCAAGTTAGCTGCCTCTTCAACAATAAAAACATC
+ATCTGTATGTTGGTAAAAAATATAACAGGAATTTTTCCGTTCATTATTAAAAGCCGTTTC
+TGCTTCTTGCTCTTTCAAACAAACTCTTTTTTCGAAGCTGAATACATGCCATAAATATCC
+ACAAAAACCATCGTCATCGTACATAAAAATTTCTTTCTTTTCATTATGACTCAAATGATT
+TGCAAAAACATTCTCCCATTGCTTTCGTAAAAAAGTCCCCCATTTAGGAACTTCAATCAC
+CTTAATACTTTTATTTTTAAGTATCTCATTTATACTCATATTAAGTTCCATCTCTTCACC
+AACCTTTAGATTAACTCAATAATAAAATTGTAAATTTATCAGCCTTTTTTATTGTATTTA
+GGACGATATGCTAAGATAAAAGAGGATTCAAGTGCTTGTCTAGCAATAATATCAATTTTT
+TCATCTAACTTTATAATATGAATTAAATTACCTTCTTTAAACCAAGGTTTGTCCGACTCT
+TTTGGAGTATGCTTATAACATCTATCGTTTAATGAAGTACCTGTTTCTCCAATATATAAA
+CATTCAGAATTATTATAAAATAAGTATATGATATTTGAAACCGAAATTTCTTCTTTAAAT
+TTTTGTTATAAATTGCAATATTAAATGCCGTGCAAAATTTGGTAAATCCATTGCTTACTG
+GAATAAATTCTATACATCATACCGCCATTTCTATGGCTGACCTATAACCAAACATTCTTC
+TTGGATATTCATTAATCCATCTCTCTATACTTTTTATTTTTGCTTTACTTACTTTTGATA
+TATCTGTTCCTTTTGGTATAAATCTTCTTATCAGTTTATTAATATTTTCGTTCGTTCCTC
+TTTCCCAAGAACTATAAGGATGAGCATAATACACTTTCGTCCTGTCCTTGCCTGGCTCTG
+TTTTTGATTTCTCTATCCCTCTATAGTCCAAAAACTCTGTCCCGTTATCTACTGTTATCG
+TTTTAAACTTCTCCCTAAATTTCCTTCTATACTTCCTTTCTAATTCATCTATTGCTTTGA
+TTACTGATTCCTGCGTTTTGTCTGGTAGTTTAAGAATTATTTCTTCTCTTGTCTTTCGTT
+CACTTAATACCAGTAATACTGCTGCGCTATTTTTTCTGCCTACTACACAGTCCATCTCCC
+AGTGTCCATATTCCTTCCTATCGTTAACTTCTTTCGGCCTTTCCTCTATGCTGCTTCCCT
+TAAGATTTTTCAGTGCTATCTTCTTTACCCTTTGATATATGCGTTTTTTACCATCCTTTT
+TCACTGGCAAATATTTATTCGTTAGTCTTAAAAATACATCCCCTCTATCAATGTAGTTAT
+ATAGTGTTTTCGTGCAGATACTCGTTTTAAACTTCAGTCCCTTTGCTTTTATTTGTCCAA
+TAACAGCATCAGGAGAATATTTTTCATTTATTATCTTTGATTCTATATACCTCACTAATT
+CATGGTCATTTCCTATCTTTAACCGTGGACCTTTATTCTTCCCGTTCTCTACATATCTCC
+TTTGGGCTACATCTGCACAATACTCTTTTCTGTATGTTAAATCACTATTTTGTAAATATA
+TTGTCCCACGGGTTATTTCTCTTTCTATTGTCCTTCTGTGCCTGCCCAACCTCTTTGCTA
+TTTCCGTTACTGTATACTTTTCTTTTAGGTACAACTCTATGGCGTATCTTTCTCTTTCAT
+TTAGGTGTTTGTTTTTTCTTGTTTCTGTGTTATTATTCATATATAACTCATGGTACTCCT
+TTGCTAATGTTTTTCTTTGGTTATTAAACATTTTACAATGGATTACCATGAGTTTTCTAT
+ATATTACGGCATTTTATTTTACAACTTCCCTCTTTAAATTTTTGTATATCTTGTTTATTA
+GAAACTAGATTACAATAATTATATTTTACAGTTTTTAATTCCATTTTATCCCCCTTTGAA
+TTATTATTTTATCTTTTAGTTAAGTAAATATCATTACTTCAAAACATTCTACAACGGTAT
+ACTAACTACATATTTTATTATAACAAACATTTCCTTACAGTTAAATTAGCTTCATGTAAT
+ATTTTATGCTGTTACTACAGGCTCTTCAGGAACAGCAGTAAACCACGAACTAATAATTGT
+TGCATCTACCCCTTCAGCATCCTCATCTGCAATAAATCTATAATTACCATCAAAGTCCCT
+TGAATAAAACTTGCCTTTAAGCTTAGCACTTTGTGCCTTTGGCTTTTCTGCTTCAGTATC
+ATATTCATCTGTTGCAAGTTCAAACTTTCCTTTTAAAAGCCATACATACCTGTACTTCCC
+GTTATTTTTCTTAGATTTAAAACCAAGTGCTATAGTTGGAGGCATATCATCCTTGTTTTC
+TACTAATATACCCTTTACAACCTTTGATCCCTGCAGTTTTGCCCTGCTTGTAATTGATAG
+CTGATTTACTTCAATTTCTACATCCACACCTTCAAAAGCAGTTATTATATCTTCTACAGT
+ATCATCTGAATAAATATTTTCTGAATTTGATTTTGGAGAAAGTTTAGCACTTATTGCTCT
+TTCTAACTTTTCCGGAGTGCTGTAAGTAACACCAGTACTGTCATCCTTTGTTAAAACAGC
+TATATGAATATCTCTAAGCCCTATCTGTCTTGCCATACTTATTCACCTTCCTCTAAATAA
+TAAAATTTAAAGCCTTTATGATAGATTTTTGTATCTTCTTCATAAAGGTCTATTTCATTT
+AATCTTTTGAACCCTGCTTTAAGCAAAAGTTCTTTTATATTTTTAACTATATCTGTATAA
+TCAGCCTTTGACCACACATCTACTTGGATATAATGTGCTGTCAAAGCTTCTTCATCATCC
+TCATACTCTTCACCTGCAGTTAAATACTCATGAAAAGTAATATAGGTTTCTGTTTTTCCA
+CTATACTTTTGAAAAGCTACTGGAATCTTAAGAGGTTTCAATGTATCCATAATCAACTTA
+TTTATCATTCCTCAAGTCCCCTTTGCAGTTCTTCCTTTATAATATTATTTATCTCTCTTT
+TATTCTCAAGGACAGAGTTCTCTGCCCAATGCTGTGCAGGAATTTTACTTGTACCAAATT
+CAGTAAATTTTGAATAAAAGAACTCTGAATTATCTCCTTTATTAGGACCTATCTCAATAA
+AATCTACGCCGTTTTCTTTTTCAATATCCGAAACCTTTATATTATCTGCCATATGTCTTT
+TTGTCTTGTTTGACCTTGGAGCATTTTTTTCCATGCTAGTTTTCACTAAATTCCCTGCTT
+TATCAAGTGCTCTTTTCTTTATTACATCTCCTCTTGCACCCAGCTTGTTTACCCTGTCTA
+TAAGCTCCTGCATTCCTTCAAGTTCTATTCTAGCCACTGATATCAACCTCCATAGCCTTG
+ATTTCTATGAATTTATTGGCATATTTTATGTTATCAATTGAAGTTATATTGTACTGCTTT
+CCTTTAAATAAAATCCTCATTGTTGTTTCAATATTTGGTACATACCGTATAGTAAATTTA
+ACAGTATTTTCGGCATGAACAGCTGCTGCTTCAAAGTATTCTCTGCCATGAAGATTTGTA
+ACAGCCGCCCATAACTCTTTAAAATCTGTCCAAGTTTCAGTTTCAAAGCCATTATCATCT
+GTTTGAACTGTATTTTTCTGCAATTTTATTCTATGTCTTAAATCTTCAGCCTTCATATTG
+GAATCACCCTGTTCATAGAAAGAAGAGCATTTCTTGCTTCCTCTAACTTTGTTTTTTCCT
+CTGGTCTGTAATCATCATATAAAAGCTTCATTTGAAGTATCATTGCCCACTTTATTGCTT
+CAGGCACTTTATCTCCACTATCTCCATAGCCTGCAATTAATCTTACTCTTACTGCATTTA
+CTGACTGAAGTTCTACTGTAGGCCAATGCTTTCCTCTATTTAAAACAACTCTATTTACAA
+AGCCATCTAAATCAAAAATATAATTACTTTCATCAAATAAATACTCCTGTCTATTCTCAT
+CATAATATTTTATACTTTCCACCTTTTGTATCGGTGAGCAGCTATCAAAAACTATAGCAT
+TACCATTAGGGAAAGTATCCAAAACAAACTCTAATGTCTGAGTTATATATTTTCTATTTT
+GAAAGTTTTCACACCATTCCCTTGCCTGCTTTATAAGACTTTGTATTAGCAAATCATCAT
+CATTACCATCTACTCTTAAATGCTGTTTTGCTTCTTCTAAAGTTATGGGTTCAACTATTG
+GTGGATTTATTATTTTGATTGCCATCTTATCACCCCAAAAGAAAAGGAGCACTAAGGCTC
+CTTGATTTAACTGCTGTATCTGCTGTCTATAATAACATCTGCACTTGCAAAATTAGCTGC
+TTGAGAACTTGCCCCGATTTTAATTCCGATACAAGTAAATCCTTCATTTATATCAAGCTT
+TGCAGGATCTATTTGAAAAACAATCTGCTTATTTCCTGCTGTTTCTTCTACTGTATATCC
+TGCTCCATCTGTTTTTAATAAAGTATCTGCAGTCGTATTCTCATTTGCCCATACTGGTAC
+ACTGCTGATTAATGCCTTTGAATCTGTTCCTTGTGTATCTTTTGCCTGATATATGGATAT
+TTGTGTTTCATGAGCTGCTGCTTGAGTAAGATTTACAATTACTACAGCATTTACTGCATT
+TTTTAAATTTACATATCTGCTTTCTATACCTTCATTTGTTGTCTTTGGTGAAATGATCTG
+TATTACTTTATATTTTTCAATAAACATAATTTTTACCTCCTACCTATCTGCTAAAGTTAC
+AAAAGGACTTAGTGGATTTGCACCCTTGTAAGGCATAATTGGCTTATTCTTATAAGGCAT
+TCCATTGAACTTATAGATGAATCTGAATACCTGCTCATCATATAAAAATCTTACATGGAT
+AGATACATCAGAAGTTAAACCTTTTTTATCTATTCCAATATACTGGGTTGGGTCAGCTAA
+AATAATATCTCCCTTTTTACCAAGAGGTGAACACTGCTCTATTGGAATTATTGGTCTATT
+AAGTAAGGTACTGTACTGTGATGCTGCAGCTCCACCGGAAGGCATAAACACAGGTGCTCC
+ACCAGCTCCAATATTAAGAGCCATAGTGTAAAGCTGTGGTTCTATCTCTTGATTTATATA
+CCATACTGCATTTGCTCTAAGTCTTGCAGGCATTGAACTCCACATTTTAAGTATATTTTC
+ATACTTAATTGTTCCTGCTCCTTGATCTTTTTCCTTGGGTACTGTAACTAATGCATCAGA
+GTTTAATATTCCAAGGGGCATTCCAACACCAGTACCATTAATGATTGCATCATCTATTTT
+AAAACTCATTTCATCTGCATAAGCTTGCCTTACTATAGCTTCAAGTGCTGTAGTATCTTG
+TAAAAGGTCATCGGTTACATAGCAAAGTGCTAAAAGCTTTTGAAGTGACATTTCAATTTC
+CCTAAACTTTGGCTTGCTTTGAGCTGCTGTTTCTGCTTCAGCTACCCAGTAAGCCTGTAC
+ACCTCCCCATCTTGAGCCATTGGCTCTGCTGTTTTCATCAATTCCAAGCGCCCTAAGTCT
+ATTGGTATTAGCCCCTATTGGTATCATTCTTATTCTGTTTGCCACCTGACTTTGTGCCAT
+CATGGATTCAAATAAGTCATTTATAAACTCATTTTCTAGTAAAAATCCTCCTTCTGAAGC
+TATGCTTTCATTAAGTCCTGTTGCTGAGTTCTGATAAGTTAATCTGTTGTCCATTCTTCC
+TCCGGGAGATGAAGCCTTTGCAACGGCACTTAAAAATTCTCCCATGCACTTCCACTTCTT
+TTCATTGTGATTCTTTGGCTGAGCATATATTGGTTCATTCACTGGCGTCTTAGCCTGTTT
+TTCTCTTTCTGCATTTAATGCATCAATTTCTTTTTGTGCCTCAATTTTAGCTTTTAAAGC
+CTTAATTTCAGAAAGCTTTGCATTAATTTCATCAGCTGTAGCCTCCTCTTTATTTATAAG
+GTTTTTAGATTCTGTTTCTAAATTTGATAACTGAGCTAATAATTCTTTCATTTTTTCTGA
+CATATACATTACCTTCCTTTCAAAATAATAAAAGCCCTAAAGTTCACACTCTAAGGCAAG
+TTTTGCTTTTAATAATTTTATTTTTTCTTCATCTTTATAGGTTTCTTTAAACCTTTGATT
+ATACTGTTTTATAAAATCTCTAGTCCTGTTATTAACACTATTTTGAATAGCAAACCTGCT
+GAACATAAAAGAATTTTCCAATGGCTCTTCTTTATTCTTTTCATAAAGCATTCCATCTGC
+AAATCCTTCAGCTACAGCTTTTTTTGCACTCATCCAAGTTTCCTCATCCATCATCTGAGA
+TATTTTTGCTCTTGATTTGCCTGTTTTAAGCTGATAGGCATTAATTATAGTTTCCTTTAC
+TTCATCTAGCACATCAGCTCCATGCCTTAAATCCTTAGCTTCACCTTGAAAAGTTCCCCA
+GGGGTTGTGTAGCATTATTATTGATGTTGGAGACATAAGTATTTCATCTCCTGCCATAGC
+TATAACTGAAGCTGCTGAAATTGCCACACCATCAATTTTTACTTTAACCTTTCCCTTGTG
+TTCCTTTAAACCTGTGTAAATTCTTGAAGCTGCATAGACATCCCCTCCATAGGAATTGAT
+CCAAACATTTATGTCTTTGCCTTTATATTTATTTAGTTCTGACATAAAACCCTTTGGAGT
+TACATTGTCATTTCCAAATAGCATCGACCAAAAATCATCGTCCATGACAATGTCACCATC
+AATTCTAAGCTCTATCTCCTCCTCATTTTCTTCGCTGTTTTTAAAATTCCAAAACGGCAT
+TTTATCACTTCCTTTCATTAATCATATTAAATATTTCTTCCCTTAGTGCTTTAAGCTGCT
+CTTCCTGTTTTCCTGCTTCGCTCATATTGAGAGGTTCGAGATATCTGTCACCGTTATCAA
+TAGGATTCATATTTTCAAGCCTTCTAATATCATTAACAGAAAGCCATCCCCACTGTCTTC
+CTTGTGCATAGGCTTCATATCTTGATTTAATATCTCCACGGAGTAGTCCACTGATATTAA
+ATTCAAAATATCTGTTTTTTCTTCTTGATTCTTTTGATAAAAGCTGAAGATTTAAATTTT
+CTTCCCATTTTTTAAACCACGGCAGCATAGTGTAAACAATAAACTCTAAGCTCTGATGTT
+CAATATTGTTATTTGTGGATCTTGTTAAATCCTGCACCAGATGAAGTGGTACTCTGAAAA
+TTCTGCACACATCTTCAATTCTGAATCTCTTGGATTCTAAAAACTGTGCATCTGTAAGCT
+TCATGGTTATTTCCTTAAACTGACCGCCGCCTTCAAGAATCATTGGAACTCCTGCATTAG
+AAAGTCCTGTGTAGTTCTTCTTAATATCCTTTTTAAGCCTTTGAAATGCTTCATCTGAAA
+GCTCGTTAGGATACTGAAAAATACCGCTGGTTGAAGCCCTGTTATGATAAAAATTTCTTT
+CAAAGGTGTCCTGAGATAATCCAATATCAATAGTAAGTGCCGCATAACTAAGAGGTGTTA
+TTCCTATATACCCGTCTAAAGTGAGTCCCGGAATATGAAATATTTCATCTCTTGTTTTAG
+GTTCTTGCTTTCCATCAATATAATAAAGAAGCCTTCCTGTAGATTTATCTATATCAATTC
+TTACTCTGTCCCATGCTATTGGTCTAAGTTCTAAAAGCTCTCCATGCATATTAAAAACCT
+TTTGTGCTATAAAGTTTCCCCCAAGGTTTATATTTGTCATACCAAACTCTTTAAACTGCA
+CTGGTGTCATTTCTGCATTTGGTGCATAATGAAGTACACCATATTCAGCAGTATCTGTAA
+CCTGCCTTCTGTTTCCTTTATCATCTTTTTCATAAAGCATTATAGGACAGCTTGCCAAGG
+TTTCAGAAAGGACTCTATTGCAGGCAAAAACTGCAGAAAAACTCATAGCCGCTGCTGTAT
+CTATTTTAAAATTATCTTTTACAACTTCTTCACCATTTAAAAAATCCTCCGAATATTTCT
+GAAGGACTTCAAACAAGGCATTCTGGGGCGTTAAAAATAACTTCACTCTATCTTTTAGTT
+TCAAAGCACCACCTCCTAATCAAGAAAACTTCTCATTCCTCTTTTTTCATAGACACTTTC
+TTTATTTTCATGTCTTATGGATCTATCAAGTGCCATAATAAGTGCTACAGCACCATCTAT
+CTTTTCAGTAGACTTTTCTTTATCAGGCTTTATATTGCCTGCAGGATCAGTTTTTACATA
+AATATTATCCATCATCCACCTTAAAACAGGATGTCCTCCATGGGCTATTTTCTTTTCAAG
+AGTAATTTTCATAAGCTCCTTTGTAGGAGGAGACATATCCTTATACCCCTGCCCAAAAGG
+TACAACTGTAAAACCCATTCCCTCCAGGTTCTGTACCATCTGCACAGCACCCCATCTGTC
+AAAGGCAATTTCTTTTATGTTGTATTTTTTCCCAAGCTCTTCAATAAAGGTTTCTATATA
+GCCATAATGAACTACATTTCCTTCAGTAGTTTTTAAGTATCCCTGCTTTTTCCAAATATC
+ATAAGGTACATGATCTCGTCTTACTCTTAAATTTAAATTATCCTCTGGTATCCAAAAGTG
+AGGAAGAACAATATATTTTTCATCTGATGTTCTTGGAGGAAATACTAAAACAAAGGCTGT
+GATATCTGTGGTACTTGAAAGGTCAAGTCCCCCATAACACTCTCTTCCTTTTAAACTATC
+TATATCAACTTTAAAAGCACACTCATCCCACTTGTCCATCTGCATCCATCTTGTGGACTG
+CTTCACCCATTGATTTAATCTAAGCTGACGGAATATATTTTCTTCAGCAGGATTTTCTTT
+TGCACTGTTAAAGGCATTTCTCACTTTTTCTATATCTATGGTATGCCCAAGAGAAGGGTT
+TGCTTTATACCAGTTTTTCTCTAATGTCCAATCGTCATTGTCATCTATTCCATAAATAAC
+AGGATAAAATGTTGGATCGATTTTTCTTCCTTCTAATATATCTACTGCCTTTTGATGTAC
+TTCATAGCATATAGAATTTCTATCTGTTCCGGCTGTGGTTATAAGAAAAAACAGCGGCTG
+CAATCTTGCATCACCACTTCCTTTAGTCATAACATCATATAAATCCCTGTTAGGCTGAGC
+ATGAAGTTCATCCATTACAACTCCATGAACATTAAGTCCATGTTTTGAATAAGCTTCAGC
+AGATAATACCTGATAAAAGCTGTTTGTAGGCTTATATATCAATCTTTTTACAGAAAGAAC
+AGGTTTAATTCTTTTCTTAAGAGCAGGACACTGTTCTACCATTTCAACAGCTACATCAAA
+AACGATAGAAGCCTGTTGTCTGTCTGCAGCACAGCCGTAAACTTCAGCTCCCCATTCTCC
+ATCTCCGCAGGTCATATAAAGAGCAACTGCAGCAGCAAGCTCGCTATTATGTGTAGGAAT
+CATGGATTTACCTGCTAAATATAATCTTGATGGGCTGTCAACCTGAATACATCTCATTTT
+TGTCTTTCCTGTTTTTTCAATAGACTTTATATAATGAAAATGTGATCTTGTTTTAATATT
+TCTTTCTCTGCCTCTTTTAAGCTTTCTATCTAATCCTGATACTTCTAAGTCATTAAAAGC
+AGTAAACTTTATTAAATAACATATTTCACCTGTTTCAATTCCATATCTAGCTGATGGAGC
+TGTTTTTAACGTATTCTTTATTCCCAATGACCATAATAAATCCTGAACATCCTTGGCAAG
+TTCAAAAAGAATTGTCACATATATTGCCTGGCTTTTAGCAGTGCTTACACATCCATCAGA
+ATCTATTAACCCTTGTAATAATCTTTTTCTTTGCTGAGCTGATGCTCTTAAATATTCAAT
+AGGTATCCTTTTTTCCCTAAAGTTTTTAACTAATATACTTTTAAGTTCTTTATATACTAA
+AATATCGCTGTTACCCTCCTGCTTATATCTATTATGAAGTTTATATGGTATATTTTTAAT
+AACTTCGTCAACATCATCTCTCATTACAGTTATTTCAGGCTTTACAGCATTACCATTTCC
+TATCCAGTACCCAAATAGATACGGATCTATAGGAAGTTTATTTTCAGGCAAAATAAAAGC
+ATCCGCTATTGGGATGCGAAATAATGCTCTATTTTCTTTACTTTTAGTTTTAAACTGCTT
+TTGATACATTTCTCCTGTTGTTAATAGTTTTTCTCTTCTGCCATTATTAGTAACTTGAAC
+CTTCCATAGATGCCTTTCTCCAGCTACTATACTTGTTCCATCTCTAAAATTTATTTTATA
+TGCCTGCTCCGTATCATCAATTTCACTTATTGCAACAACATTACAAGGTCTTCCCTTTTC
+ATCAATTACCTTATCTCCTGCTTTTATTTCCCCCATTGTAGTCCATCCATCAGGTGTTGG
+AATCGGAGTATCAAGGGCTAACTGTTTTCCATTTTTCTTAGGAATTTCAACATAAGCAGT
+ATTATACTGCCTGTATCCATTTTCTTTTACTGTTCCGAATATATCCCTTATAATTTTATC
+CTGCCAAGGCAGAAGATCAAAAGGAACACCACGCCACTGACCCTTTGTATGCTTTAAGCA
+GTTAATAAAGTTTACGGCATGCTGTGCTTTTGCTTCATCATACACTCTTACTGCCTCCTT
+TATAAAGTATAAGTTCCATTGGATCTTCTTCATCATTTATATTGTCAGTGACTATTCTGC
+TTCTTGCTGATGGAGTAAGTCCAAACTGTTCGCAGAATCTGTTCATGATTTTAAGGTAGG
+TTTGAGCGATAGATACCTGTGGCACCTGCTGCCAGTATCCCGATGGTGTTTTTACAATAG
+TTCCATGTTTAGTTATAAATTCTTCTGCTTCCTTCCACCTTGCATAGGCTTGACAATATC
+CTGCAAAGGCTGCCATATCTATTTCTGTAAGTATTCCCATTGCCTCAAGCTGCTTTGACA
+TTCTCCTCCACTCTTTTTTAGCTTCAGCATCAAGCCAGCCTGGACATTTAGGTGCTTTTT
+TCTCAGGTTTTGGTTCATCTTCATTAAGTGGTCTTTTCCCTGGATTTCCTTCAAGTATTT
+TTAATGCTGTTGGTTTTGGTTTTCTTCCCCTTTGAGCCATAGGTATCACCTCCTCTTTTG
+GCTAACTAAAAAGAGCCTACAATCGTAGACCCTTAAACTTATTTTCTTTTTCCTTTTATA
+CCCTTGTAGTTGTAATTCCCTTTCTTAACTTCTTCATATTCAGCTTCTACAGCTTCTTTA
+TAATCACTACGTTTCCTTTCCTTTTCCTTGCAGCTTAAGCAAATGCAATCCTCATTATAC
+ATTGACATTATTCTACCCTCTTTTAAGCTTTCTCCACAGCGATCACAGGTTTTCTGAGTA
+AAAAATTTATCCATTTATTTCAGCACTTCCTTCCTGTTGTAATTTTCTAAAAGCACAACT
+GCCTTCAAGATTTGAAAGAAGTGTTTTCCTTATATCTTTATACCTACTTCCATTCATGCC
+AAGGCGAATGAGCCAAGTTCTGAATGCATATTTAGGGTTATCCTCCTGAGCCTGCTTAAA
+AGAGGTGTGTTTTAATTTTTGTGCGTTCACATTTATTAAAGATGCAAGTTCTATAAATGC
+GGATATTTTTTCATGGCTTAAGGTTTCACCTAATAGCTTAAAGGTAAAAGTTCCTTTCTC
+AAAATCAAAGGATATGCCTTTGCAACCATCAGTTCCAACTTCAGTAATAGCATTTTGAAA
+TTCTTCTAAAGTTTCTGTTCTCTTTAAATTCAAATTCTTTATAAAGGTTTCCTCAATAAA
+AGGTTCTTTTAATTCGAAGGTTTTAACAATTAGCTGCTGTTTACTGTAAAGCATATTTAA
+AATATTTATTAGCGTTTTTCCCGTATGCTCTCCTAATGGAATTTCTAAATTAAAACTATC
+AATAGTTGTATCCTCTATTTTTTCTTCAGAATCCTCTCCCTTTAAAATTTCGTTAAGTGT
+AACAACCCTACCTTGCGAAGTTATAATGGTTCCCTGCCTATCTATTGTGTAGATTTCCTT
+TTCCGTTTTAATTTCATAGGCAAAGCTTGGTGCTCCAAGATACTTTGCTTGAGAACCTAA
+GGCTTCACTTAAAATTTTAACTATTTCTTTTCTATCCATCTTCATTCCTCCCTGTGTTTT
+GGTAGTTACATATATCACTCTAAACACAGTTAATAGCAAGTACTTTGTATAAATATTTTA
+AGAAGAAAACAGGCCCTTCAGTCTGCTTCTGTCTAATTTTCAATCGCTGTGTACCTTGGG
+TAGGTGTAGCCTTCTGAATCTACTAAAATGCTTTTCTTTGTTTTTGTGTTCCTAACCCTT
+ATGCATCTTAGCTCTCCTTTTTCGTTGCAACCACCATCTTCTTTGGTTATCCAAGGCTGG
+TCTTTGCAGAAGTCTTTTGCAAATTCTTTAAATTCCTCATCTCTTAGTTCAATTTCTTTT
+GTAACTTCGTAGGCTGTTCCTTTTACTCCATCCTTCTTAGCTTCTTTTGTAAGTTCTTTA
+AGTTCCTTTAAATTTAAAACCTTTCTTCCAAATAATGCTATCATTCTAAAACCTCCAAGT
+GTGTTTTTGTTATACTATATATCACTCTAAAACACACATATATCAAGCTAATTCTTAAAG
+TTTATATCTATTATTTTTGCTTATAGCTTCAGCACTTACTTTCAATGCTTCTTCAATAAA
+ACCTATATCAAAACCTGAAGATGTATATCCTTCTTTAACTATTCTTAGATACCTTTCACT
+TGGAAGGTTTAAGTTAATCCTATCTTTTATTTTATTGGTCATGATGTACACCATAGCAGT
+TACTATTTCTCCACTTTCAAGCTCCACCTCTAAATCTTTTTTATAATAAAAGTTTGGGAA
+ACCTTCGTAAATGTCTAAAGCTTTCTCATCTTTAGGTTTAACCTCCCAAACAAGTACTGG
+TACCTTTCCACCCTTAAAAGGTTCAATAGTAGCATAAGCATTATTAGGTACTCCTTTAAA
+AAGCAACCTAAAATCCTTTAACTCCCCCTTGCCATAAACCCTAGCCGTAGGACATCTTTT
+TTCCATCTGCTGAAGATTTAAGTTTGAACCATAAGCAATATACAATCTTTTCATCTATCA
+ATCCACCCTTTCTGAAAGCTTCTAATTGGGCCACAGTTCCCCTGTATTGCCTTAAGTTTA
+ATTCCTAGCCCATTAGTTCCTTCTACTACCCTAAGGGCGGTAATTCCGCCCTGTGGCTTT
+ATGAAGCCAGCCGCCTATCTATGCGGCTCTCTGAAATCTCCAAGCTGCTGAGCCTTGAAG
+GTGCTTTATAAGGTGTTCTCTGCAGTTTTTGAATTCTTCACCTATAAAGCCTATTCTGTT
+AAGCCAGGTCCTCATTGCAAACTTTGGATTTTCAACCTGTGGCTTTTTACTGCTTGCACT
+CTTTTGAGTAAGGGCTTGATGGTTAAGTGCCAAGGCTAAAACTATATTTGACCTAATAAC
+TCCTGCGTGCATGGTTCCATTAAAACCTCTAAGTTCAACTGTTCCTGTTCCGTTGAAAAA
+GCTGTGTAGGTTTAAGAAGTGGTATCTGCTTTCATGGTAATGCCTTTCTCTATTTGAACC
+GTATCCCTCGTACCAAATATCCTCAATCTGCTTCATGGTAGTAGGCTTTTTCTTGTTTAT
+CCTTTCCACCAAATCTGCATCCATCTTTTTGCAGTATCTCATTCTTTCTCTCTCAATCTG
+AAGGCTTTCATAAAGCAGGTCATTTCTTGAGTAGATTATGTTTATAAAGTTTCTAATACT
+TCTTGGTGTATGGTCAGCTCCATCAAGGTGTATGTGAATCCCTGTGCAGTTTTGCTTTTC
+TGAAAAGGCTCCTGCTTTTCTAAGCTTTCTTACTATCTCCTGCAAAGTTTCTATGTCTTC
+TTTGTAGGTAAGTATTGGACTTACTAGTTCTACACTATACTCTTTTGTAGCTGCTACCTT
+CTCGTCATTTACTTTCTTTTGGGTGTAAATACTTCCGTCATACATAAGCTTCCATACTCT
+TCCGTCTGCTGCTGTTACCTTATAGGTATCATAATAATCATTTTCTCTTTTTATACTTCC
+TCTTAAAACTTCTGCAACAACCTTTGCGGCCTTGTTTCTTGTAACTCCTGTCATTTCAAT
+TTCAATTCCAAATCTTGCTTTTAAAAAATCTGTGTTTTGCATTTTTGTTTCCCCTTTCTT
+AGTGTGTTTTTGGTCATGTACATATATCACTCTAAAGGGGAGTAATAGCAAGTATATTAT
+CAAAGATTATTAACACTATTTTTATTTAATAGATTGTGCTACTGCAAAAGCTACATTTAC
+AGTTACTGCATTACCTGCCTGCTTATATAGCTGAGCATCTGAATTTACAGCCCTTGCTTT
+TTCAAATAATTCATCTGGGAAGCCTTGAAGTCTGAAGCATTCCTTTGGTGTAAGCCTTCT
+AATACGGTAATTTTTGTCCAATGTAGCCATTTGGCATCCTGTATCTAAAGTATTTGATAT
+ACCTTTTCCAACCCTGCCTCTTCTTGTTTTTGAATTAGGTACTGAAATATTTATGCTGTC
+TCCAATCTCAGCTTCAGCATAGCCTTTTTTTGTGGCTTCTTTAACTGCAACTCCATGTCT
+GTCCTGACTTGTTAAAGTAAACATTGGTTCATCTGCATTTTTAAATCTCCTTCCATTCTG
+ACGTTTATTTTCTCTTTCAGGAGTTATAACAGCCCTTGCTTCAAGAACAGCATTTTGTGT
+TTGATTTCTGTTTAGTCCTCGCCAATCACTGGCACTGATTGTATGTGCTATTTTTATTTC
+ATCAAGAATACCATCATTTCTATTAAACTCAATTGGAACACTCTCTAAAACTCCGCTATT
+CATTGCAGTTCTATTAACCACTCCTGCTGTATAACGTGATGTAATACATCTTGATGTATC
+TGTGAGCTTTGGCTTTGTGTAAGACTGGTCTATAAAAATTTTGCTTCCTTCGCCCTTATT
+AGTTGTAACTGCTGGAGCAATTCCTTCTGATGAATAAACATTTCCATTCATACCTTTGCC
+GCTTGGATTTATATTTCCTACGCAGTAAAGACCAGTCTTTGCTCCTCCACCTCCACCACA
+ACCTGTAAGTGTGCAAGCTACTCCTTCTGCATCATAAACTCGCTCACCTTGACAGCCGCC
+TATAATCTGCTTAAGAGCTGCTGTGTTTTCTCCTCTGACAGGTAGTATTTCTCGTCTGCC
+TCTGCTTCTAAGATTTGCAGTAATGAACACACGCTCTCTGTTTTGGGGTACTCCGAAATC
+TTTAGAGTTAAGCACCTGCCAGAAAGCATCATACCCTGCTTCATCCAGCTCAGAGAGAAC
+GGCTGCAAAGTCCCATCCGTTATTAATTGACAGCAGGTTTTTAACGTTCTCAATAAGAAG
+GTATGAGGGTTTATCTTTTTCTTCTTTGCCTTTGATAAGGTCAATAATTCTAAAATATAA
+GCCGCTTCTTTTTCCTCTGATTCCTCGCTGTTTTCCTGCAACTGAGATGTCTTGACATGG
+GAATCCAAAACACCAGATGTCTGCATATGGGATATCTTCGCTTTTAAGTTTTGTAACGTC
+ATCTGCATACCACTCTCCTTCCGTATCAAACATTGCTCTATAGCTTTTAACTGCAAATTT
+ATCTTTTTCACAAAATCCTATACATTTATGTCCTGCAAGTTCTAACCCCAATCGAAAGCC
+GCCTATTCCTGCAAAGAAATCAAGGAAGGTCATATTAATCACAACCTTCCTTTTTTATAT
+CAGCATATTTAATTTTAACTCCATCTCTAACTAAAAATACTTCTTCATCTGTACCAACCT
+GCTCTATATATCTTTTTACAATAACATCCGCATACTTTTCATCAAGCTCTATGGTATAGC
+AGATTCTATTAGTCTGCTCACAGGCAATCAAAGTAGAACCACTGCCGCCAAAAGGGTCAA
+GAACAATACAATTGCTCATGCTGCTGTTTTGAATTGGATAAGCACAAAGAGCTACTGGCT
+TCATTGTTGGATGGAGAGCATTCTTAGATGGTCTGTCAAAGCTCCATATAGTACTTTGTT
+TTCTATCAGAGTACCAATTATGCCTGCCTTCCTTCTTCCAACCAAAGAGTACAGGTTCAT
+GTTTCCACTGATAAGGACTTCTGCCCAGTACCAAGCTTTGCTTTGCCCAGATACAAACTC
+CGGATAAATAAAATCCAACAGCTTTAAAAGCCTTTCTAAAGTTTAATCCTTCTGTATCTG
+CATGGAATACATAAATTGAAGCATCTTTCTCCATAGCATCATACATATTAGTGAACGCCT
+TATAAAGGAAATTATAAAACTCCTCATCTTTAAGGTTATCATTTTGAATCTTTCCGGCTT
+TTGCTTCATATGCAACATTGTAGGGAGGGTCTGTAACCACTAAATTAGCTTTTTTACCAT
+CCATTAAAGCCTCATATGTTTCAGCTTTAGTACTATCCCCGCAAATAAGCCTGTGCCTTC
+CAAGCAGCCACAAATCTCCCTGCTTTGAAATTACAGGTTCTTTTAAAGCATCTTCAACAT
+CAAAATCATCTTCTTTTATTTCCTTGTCATGAACATTGCTAAACAGTTCTTCTATCTCCG
+GCGGTTCAAAACCTGTAAAGGAAACATCATAATCTATACTCTGCAAATCCTTAATAAGCT
+CAGCAAGAAGTGCTTCATTCCACTCTCCGCTTATTTTATTAAGTGCCACATTCAAAGCCT
+TTTCTTTTGTTTTATCTATATCAATAACAACACAATCAACTTCTGTATAGCCTAAGCTTT
+TTAAAACCTTCCATCTTTGATGACCGCCAATAATTGTAAGGTCTGAATTTACAATAATGG
+GATCTACATATCCAAATTCAGTTAAACTGTTTTTTATCTTTTCATATTCCTTATCACCCG
+GCTTTAAATCTTTTCTCGGATTATATTTAGCAGGTATAAGGCTGTCTATTTTTAACTTCC
+TAAACTGCATCTTCTTAAACCTCCCCAAACCTTGATTTTATATAGCAGCTGTGACTGCAG
+TATTTTCTGTTTTTATTTCCATAAGAGCTGAACTCTTTCTGGCAATAGACACAGGTATAT
+TTATAAACAGCTGTATCCTTTTTGTTTCTTTTATCTTGATTGTTTTTCCACCAGATTCTC
+CTGCATTCTTCAGAGCAGAATTTCCTTGTTCTCCCTTTTCCCTTTTGTTTTAATTTCTTA
+CCACAGTGAAGGCATACAAGATTCTGCTTTTTCATCTCTTCAATGTTTAAACTTACTACA
+GAAACATCACCGCAAAGACCATTCCTTTTACAGTAGCTTTTTACTGAATCTCTTGATAAA
+CCAAGAACTACAGCTATCGCTTTATATCCCAGTCCTTTAAGTCTTAACTCATGAATCTGC
+TGTTTTTCAACTTCAGTCAATTCCTTTATGCCTCCTTTCCTTTTGCGATGAGATTAATGT
+AAAATCTTAAAAAAATGCCTTAAAAACACTTAAAAATCACTGTTTAAACTTGATTTTTGA
+ATAGTTTTTATATAAACATCAAAAGCCTATAAATCCTTGTATTTTTAAGGTTCACAGGCT
+TTTATCTTCTGATTTTTTATAGATACTTATCTGCAAAATATAAAATAGCTTGATTGCTGA
+TTTTCCAATGGTTACAGTTGATTTTTTATGAAATATATGCTACCCCCCTTATCAAATTCT
+GCGAAATTTCGTGCGAAGGGAGCCGCCCGACGTAGGGGGTTCAAGTGGTGAGGATAATGA
+TGCCCCCTACCCTTTGTTGAAGAATTATCAACAGATTGTCCACAGGTTATTAACATATCA
+TTGTTGATAACTTTAATAAGAATAGACTCGTCCTTTCCTTCCCCATCTGCCGTCTTCCTT
+AGCAGTCTTTCTATCATGACAGCTTTTGCATAAACTCTGCCAATTGCTCTCATCCCAGAA
+CAACCTTTCATCACCTTGATGTGGTTTAATATGATCCACTACAGTTGCAGCAGTAACAAT
+ACCTTTTCTTTTACACTCTTCACACAGTGGGTGTTTATGCAGAAACTGTTTCCTAAGTCT
+TCTCCACCTGCTACTGTTATAAAGGTATCCATAGGGTCTGCAGTTTTTATTGTAGGTTTT
+ATTTATTTCCTTTTGATGTTTCTCACAGTATCTGTCGCAGGTAAGTTCAGGACAGCCAGG
+ATAACTGCAGGGTCGTTTAGGTTTTACTGGCATATATATCAGTCCTCCCAAGTTATGTTT
+TTACATATGAAAACCACCACAGTTTTTCTGTGATGGCTTCATCTGTTTTTTCACTTCGTC
+TATTATAATACTACTGCGGATACAAGGGTGTCTTTCAATGTCTTTTAGTGTCCTCTTTAA
+TAGATATCTAAATTCTTTTTTCCTAATTATAATTTAATCAGATTTTAATACTCTCTTTCT
+ATCACATTTACTCTCATCTTTTGTTTTTATTCTAAAAATTTCCGTTTTTAAAATAGTTTT
+TTTAATTTTTTTACAATCAGAACAGATATAATTATAATTTGGTACATAGTTACATGACAT
+TACTTCTGTACCACAAAATATACATCTAGGGTAGTATCTAGCTTGTTTACCTTTTTGTTC
+AATCCTAATCCCGTCTAACAAAGCTTCTTTATAACTCATCTTTCTAATCCTCCAATTATA
+ATATAAACACATTTTGATACTCTCTTTCTATCACATTTACTCTCATCTTATGAAATATTT
+ATTTCTTTTAAAGCTTTATCATGAATACGAAATATATGCTGTAAACTGTATCCCATATCA
+ACAGCAATCTGTTCCCATGTCTTAAAACAGAGATATCTAAGTTCCAATAGAGTCTGATAT
+TCTGTATTATCTATTTTTCTAATAACTGAAACAAACTCCCTTTTTAAATCCACAAGAATA
+TCAATATCTCTATTTATTTCATTTTCTAAATCAACTATCTTAGCTATTATATCCTCCATA
+GAATGCACATTACGAGTTCCACTAGGTGGTGTATCGCTTAAAGTAGATGTTGCCTTTGTA
+GCTAATGCCCTTAAGGAAATAATCTGCTCTAACTTACTATTAATTCTTTGGTCTATATGA
+TAAGCCTGTGATAAATATTCTTTGGCTGTCATGCTAAATCTCCTCCTTTAGCCAAGGCAT
+TTTATTGTCATAATAGGACTCTGCAATATGCATTTGTGTACCTTTATCTAAGGATTTAAT
+CCTTTTAAAAGTTAGCTTCTTTTCCTGCTGAAGCTGCTGCTTAGTTTTATAAAAACTACA
+ACTTAGGTCATCACATTTTCTAACATTTAGCACACTGCACTTACCTTTTCTTAAGGCAAA
+ACAACTATTTATTGTTTTTTTCTTTTTTAATTCCTTTATTCCATTCCCAACAGCCTTTGC
+AGCTGTAGGATCTGAGTATGCTTGTCTATCGCTCATTTACAATTCCCCCTTACTTAGGGA
+GTACATGATACCTAGTTATATATATATATTTCTTTTTTATATAGTAATATTTTTATATAT
+ACTATATCTTATTATATAAAGGGTATATACATCTTGGACATCTTGTACCCCATTGATTTT
+ACTACGTTACAATCTTGTACTTATGTTGAACTCATATAGAACCCATCTTGTACTTACATT
+TTCACAAATATCCTATATTTCTTCCCATCAATTTTTTTATCTATAGTTTTATAACCGAAC
+CTCTTGGTAATCTGTCTTGAAAATTCTATATGACTAAGTGGCTGCAGATTATTATTTAAA
+CAAAACTCCAAATAATTCTTATAGACATTTTTCGTTGGCTCATTTTCTACTTTTGTTTCA
+TATTCTTCATAGAATTCAATAATTGGATTGTTGGTCTTCTCATATTCTTTAAGCTCATGC
+TCCACTTGTATGGATTTTGTGAACTTTTTATTTTGTAGGATTCTTTTAAGCCCCTTTAAA
+CCCAGTAAAATCAAATATTCCATGGACTCTTTTGTCCTTAATTCATATTTAATATCTGGT
+CTGAAATCAGGATCATCTGCTGTAAACTTTGCCTTAAACGGAATTATAAGAAGTCTTCTT
+TGGACAGCTCCTGTTTTATCCTTAACCCTTGGAACATTATTGGCTGAAAATAAAAGCTTG
+GAGTAATTATTAAAATCAAAAGGGTCTTTGCCTTTCCTCTCTGCATTAACTCTATCCCCT
+GTAACAAGCTTCTTAAACATTGAAGGCTCTGCAATAAATTCATCTCCAATATCGTCACCA
+ATATTTGCAAGCTTTCCAAATAATTCTGCTGTTTTAAATCGCTCTCCCAACTCCTTTAAA
+TCAAGAGCTGCAATATTAGAAATACCTATAAGTGTAGTTACCATATCCAAAAATGTTGAT
+TTCCCATTTTGTTTTTCACCAGTTAAAATGAAAGCTTTTCCAATTTCATTTCTTCTATAA
+AATGTGTATCCTATAAGTTCTTCAAGCACACTTCTAATTTCAGCATCATTGCAGCTGATT
+TTATCTAAGGTTTTATCTGCTAATTCAAAATAAGCATTTGGGTTATAATCCCACGGAATT
+CTGTTAGTGATGATAAAATCTGGAGAATGTTCTGTAAAAGAATCATCTATTATGTTATAA
+ATTCCATTGTTAAATGCTATGCGATTATAATCTTCAAAGCTTGGAATAACGTTATTAGTA
+ATAAGTTCTAGGTAATTTATAGTTTCATTCCTCTTTGCTTTATTAAGCTCTGGTAAATGT
+TTAATCATAACTGATTCAATTTCCAAAGTACTATTTTTATAAATTCCGTCCTTATAAACA
+TGGAGCTGGTTATTAATTTTAATAATGTGCTCTTCATCCCTTATAAATCTTGCAAACTGG
+TCATGTAAGAATTTTGACTTTTGATAAAACAAAGGTTTTAAAAATGCTTCATCTCGAAGT
+ATTGTATCTATTTCTCTTTGTTCTAATGGTTCTTTTAAAATATATTTGTTTATGATATTT
+ATAATGTTTTTAATACTATCCTTACTAAAACCTTCTGATTGAAGGGTTAATATATAATTG
+AATAATGCTTGATTTCTTCCATCTCCTTCTTTCATATTTAGAAAATCCGGTGCTGTTTTT
+AATGGTCTTAGCCATTCTGGAAGATAGTCAACTTCTTCTGTTTTGTTTAACCATCTTCTT
+GTTACCCCATTCACTCTCAATGGCACAATACAATTCTTTGAGCCAAGTCCTATGTCAATT
+GTTACTCCTAAAGGAGTCTTTGTCTTGATTTTTCTTGTTTTTAAATCTGTGTTTTTAAAA
+TAAAAATGCATCCCTCTATCTGTCTTTAATATGCAACATTTAATATCTAAATCTGTTATT
+ATGTTTTTTACAACATTTGCTTCTTCTATTGAATCAAAATCTATTTGAATAATATCATCT
+TGTAAAACTGCACCGTAATCTTTGCCTGTTTTTCTTATATAGTCATAACAATAAAATTTA
+TTTCTGTCCTTATATCCCTCTAAAGGTTTTTTTCCTTTTAAAGGAATGTATCCTTTGAAA
+ATATCCATGGTGTTTTCACCCGCCTTTTGGTAAGAATTATATAGTAAAAAGGATGTTTTT
+TTGCCCATTTTCATATACTTTTTGGGTTGTTTAATCATAAAATTTATATGTTTATTCCCA
+AAAGTCGCTTTAAAAATCTTAATATTACCCTTAAATTGCTTTGAAATTTAACCTTTTTGA
+TTAATATTTCCCAAATTCCTATAATTTTTTATCTGATTTCACCAACAAAATCTTCAATTC
+TTTTCTTTGCTAAATTTATATACCACTCTTTATCAAGGCGTCTTGGTACTCTTTTGCCTA
+TAACACTGTCATTTACTATAAAACATCTTTCCGGAGTATTTGCTATTTTTTCAACTCTGC
+CATTAGGCTTTACTTTAAATACACCTTTATCCTCCTCATTCTTTGATGCAAAAACTCTTA
+AAGTTTTTTCTGCTAATGGTTTGTCCCCATAAAGAGCATGAGAATATTTATAAGTAAGCT
+TTACAACCTTTTGAAACATTAAAAGCTCCTTACATTCCGTTATAGTTTTTTCAACTGGAA
+AACCTTCTATAAAATATTTCTTTAAAGCTAAGTTTATTATAGGCAGATCATTATCAATAC
+TATTTAGTTCCTTAACATAGGCCCCTTTAGATTTAAAACTGCCGTCTTCTTTAATAATGA
+TGTAGTTATTTACATCCTTTTGATATATTTTTTTAAAGATTTCAAAATCAAGCTTCATAT
+AAGTCCTATCTTCCCACTCTCTGCAGATTTCTTTAATTTTATCTAAATCTGATTTCCTAT
+TTATTTTTCCTATTAAACCATCAGTATTGGACTGAATTAAAGTCCAATGCGGTTCCAGCC
+TTTCTATTAAATCTAAAAGTAAAAGCTGTCCTGCTACACATACATTATTAGCCTGTCTTG
+GGTCATAGAGGTTATTGTATTTGTATTTCATAGCACCATAGGTACTATTTAGAACAATTT
+TATAAGGTTGCTGCATTGGGTTCTTTTCAGCTTTTAATCTTATACGTTCTTTATAAATCT
+CTTTATATAAATTAGAATCTTCCACATTCCTTGATAAATAGCCATACTCTATCATCAGTG
+TTGGATAAAATGAAATTACATCTACATTTAAAAGAATTCCTTCACCTATATATTTTTCTT
+TTGCACCATGAAGTCCACCCCATGCAAATACATGCGGGACACCACTTATATTTATTTCTA
+ATGATTTATCATAACTGTGATTACTTGAATTTTTGTACCAATCAAGAACCTCATTATATT
+TATTTATTTTTAAATTACTTGGTATGTCCAAATCAAACTCATCAGAGCGATTTATTTTAT
+TTGCTTTTAAAATAACTGCTGCAAGCTGAGCCTTTGTTTTACTTATATATTTAAGCGGCA
+GTTTAAAAGCTTTAAGTAAAGCTATATGACTATCAAATTCCTCTTTACGATGTAAAAATA
+TTTCTATAGTCTGCTCAACATCATGGGTACAGTATTTTACTACTTCCTCTAATTCTTCTT
+CTGTTAACTTTCTATCTATTGAAAAGCTTACAGTGCTTTCTCTTATGTCATTTCCCATAA
+ATCCTTCTAGTTCTTTTAAACCGTGAGTTGTTGTCATAATATCAAATTCATAAAGTTGAA
+TTTTTTGAAATAGCGAGCTGTACTGCCAGCCTTGATTTTTTTCTGCTATAATGAAACTGG
+AGATACTATATGGGTCAAAACCACAAAGGATACCTTTTAAAATATACTGATCATAATGAT
+GGCTGTTATAGCCAATCCAGATATGTTCTTTATGTTCTTCATAAAATGATGCTAATTTCT
+TAGCATCATTTATAAAGACATATTTTTGATGATTAATAGGGTCTATTACGACGAAGAGCC
+AATCTTGCAGGAAAACCTCTGCGTCAAAGAATAAAATCATACCTATTCAACCTCAAAAAC
+CTCAGTAATTTTAAAGGTCTTAAATCCTTTGTTGGTTTCCCCATACTCTACTGCATATTC
+TAAATTGCCGTCAATTGCTTCATGAATATCAAGTATTAAATCGTAGTATTGTGAAAAACT
+TTCAAACTCTACTTCTATTCCAGCTTCAAGAGATCTTAAAAATTCATTAGCGTTATGAAG
+CCCAAAAGCTGTGTTTATAACTTGGTTCATAAACAATATGGAATTTTGATATTCACCAGA
+TAAGATTTTCATCCAGCAGGATAACATAGGTTTACCTGTCTTTGATTCTACAAGTTCCAT
+TTTTTCAATTTTTACCTCATATGTTCCAAGGGGTACATCTTTGTATTGACCTTCTCCTGT
+TCCTACATTTTTTAAGTCTTCCTTTAAACCCTTAATATCAAATTCCTTATCAAACTTTGC
+AAATAAATTTTTTGTTGCCATAATTATCTCCTCCTATTTTTATTTTCTAGAGCGTCTGCT
+CTTTTTTACTGATTCTTCTTTAACTTCAGATGTTTCTAATACAGTTGTATTATCTACTGC
+TGCTGTATTATCAGAAGTATCTGTTTCTGATTTAGAATAAGTTTTTACACCTTCCTGAGC
+ATCTTCTAAAGCTTTCATAAACTCACCCTTATCAAGCTCTACTTTTGGAACTTTAAAATT
+GAATCTGCCACCGCCGAAGATATTTTCTTTCTTTTCAAGCTGCAAGTATCTTTCTTCTCC
+ATCCATAAAGGCTCTTACAGTTAAATCTACTGTTCCTGCTAAAACATTAGCTATTTTTTC
+ATTAATATTAGGTTTTATGGTTGTAAGCTTAGCTCCATTTTTTAGTGTTATTTCTGTAGT
+TACTTCCTTAGAAATATAAATTATTTGATATCCTAAATTCTTAAGTCTTTTTATGGCTGA
+TAAATATTCAGTTCTAACCATATCCCATCCTTTACCAAAACCTGCATCCTGCTCATGGTC
+TATTCCTAACTTGTTATACATATAAAGCCTGCAGTGTTCATATAAGTCCTCAACTAAATC
+AATGCACACTCTTTTGAAAGTGTTATCTTTCTTTTCAAGCTCTGTAATAACATCTAAAAA
+TACTTCCCAAGCCATTTTGACTTTTTTAAGTCTTCCTTCAAAAGTTACTTCATCAGCTAT
+TTTTATAACTGGACTTGTTGTGTTATCTGTGTTTCCATCAGTATTTAAGAATAATAAATC
+ATCGAACTGATCAACAAAAGTTGATTTTCCAACGTAACTGTCGGCATATATCCACATGTC
+CGGATACCTGTCTATTTGAAGTTCTCTCCTAACATTTTCTGGTAATAACATATCTGTTTG
+TCCTCCTTCACAATAATTTTGATATTCACACCAATCACAAAGTCTTGATGGTGTTTTTTC
+ATATTCTTTTTCATTAATAATTTCCCGGCATCTTAGCTTAAATTCTTGAACCTTAGTCTC
+ATCATATGGAATTTGAATCACCTTAACTTCCATAGCTTCTAAAGTTTTATGAAGCCTTTT
+TCTAAACTGATATAAATCCTCAGTTTTCCTTTGCCTTATAGCTGTTTTAGGAATAAAAAT
+AAATCCTATTTCTGATACCTTAAATCCAAGTTTTTCTAAGTAATACCTATATAAGTGCAG
+CTGTTTTGACTCCAGATAATGCTCTATATTATTGCTGTATTTAAAATCATAAATGCTAAG
+ACTTCCATCCTGTGTTTGGATAATAAAGTCTACAAATCCTATAAATTCTGGAAAATCAAT
+TTTAAACTCATATTTTTCTGTCGGCTCTTTATTATGAAGCATTGTATTTATTACAATCTG
+AGCCTTTTTCACTAATGATGTAAGCTTAATAACTTCATTTACATGAGCATCAGTAATAAC
+TGGATACTGATTATAATAATATTGCTCCATTGCCTCTATACCTTTCTCAATCCCAAGATG
+TAATGCTGAACCTGCAATTAAAGCATTATCTGCTGCCGGTGAAGGTATTGTCCTTACTTT
+GTCTTTATATCGCAGTTTGAATTGGTACTTGCACTTTTCAAAGCACTCAACTCTGCTGTG
+GGAAAATTGCACGCTAGCACCTCCTCTATGAGTTTTTTAAATTCTTCAAATCCTGAAGGA
+TATAAAATTATTCCAATGCCTCCTGCTTCATTTATATTTTTTATATTCATTTTTTGAAGT
+TCTGTTGGTTTTCCTTTTTCTGCTTTCAGCTCAATGGCTACAAAAACTCCATTTATACAA
+CAGATTAAATCTGGAATACCGCTTCTTTGAAATCCACCACCAAAAACTTTAAAATACCAT
+GTTTTTGAGAGTGTTTTTAAGTATTTTATAACTTTAGTTTGAAACTGTTTTTCTGTCATA
+ACATCTCCTTTTCAAACAGCTCCACAGTAAAATCCCGCCTTTGTTTTAATACTTCAAGTA
+TCTTTTCTTCTATGCTGTTTTCTGTAATAAGATAGTAGTAAAAGCAAGTCCTATTTTGCC
+CTATCCTGTGTATTCTCTTTTTTGACTGCATCCAAAATTCACTAGATAGTGGAAGGCTGA
+AATAAATAATTCTATTTGCCTTTTGCAAATTAACTCCAGATGCCCCTGCTTGGTACTGAA
+CCAATGTAATACTGTTTGACTTATTTTCATAATTTTCAAGGTCTGTTCCGTCTCCATTAA
+TATAGGAAATGGGTCTATCTATCTTAAAACAGATGTTTTTTATAATCTCAAACTCTCTTT
+TAAAATTGTAGAAGATAACAAATCTATCATTACTGGATTCAAAGATATCTTTTAGCACCT
+GATGTTTATTTGAGTTGTAAATAGATGTTAACTGCCTTAGATACAATAACTTTGTAAGTG
+CTGTATCTCCTGCTAAAGTTTCACCATCAATTGTAATAACTCTGTCTTTTTTAAACTTTT
+TATATTCCTTTGAGTTCTCGATTGTTACAACCTGTTCAATCTGCTCCGGCAGGTCAAATA
+CTTCTTCTGTTTTCATAAATACTGCACCATAGGATTTTAGTTTTTCCTTTAACCTATCAA
+CATTTTTATAGCCTTTTACAACTGGAATTTTAAATCCTCCAACATCAATCTTTTCTGTTA
+TTGTGTAGTGATTATAAAAGGAGCTTTTACTAATATTCCATCCAAGAAGTCTAAGCTGTG
+ACCACAGCTCCTCATATTTTCCACCTGTAGGAGTACCAGAGAGAAGAATTATATTTGCAG
+GATTAAGGCTTAAAATAAATTTTGCCCTGTTGGATGTTTCATTTTTAATATACTGCGATT
+CATCAAGTATTAATGTAAAATCCTTTAGCTTTTGTAATTGCTTCCTTCGCCATACCAAAT
+CATAATTAATAATAATTACACTATTTTGCGGTATGCTCTCTATAGATTGATTCTTGAAAA
+TTATAATTTGTAAGTTATAGTAATCTTTAAAATGTTCTTCCCAATCTTTAATTTTGGACT
+TTTGGCAGATTAGAAGATTATAAGGTGCATTTAATTGTTTCATTTTTTCTGAACCTAAAA
+ATGTCTTACCTAATCCCAATAGGTCACATGTCAAGATAATAGGCTACCTTTGACTTATCC
+ATTGTCTCCTCCAACACATGCTGCTGATGTTTAAATAGCTTTATCTCTGACATAAAAACC
+ACCTCCCTTCCAGTAACAGCTGCTAAATTTCAAATTTGTATCCATACTGATTCATGATTT
+GATCAATAAACTCTAATGATTCAGGAAGCCACACATTTGTCTTTATTTTCATTCCATTTT
+TCAAGGTATCAGTAATAACCTGACAGTATTTTGTATGACTGTATTCAGCTGTCATAACGT
+AGTATGGATTACGACCATAGAAGTTGTTATCAACTTTTTTAATTACACCTGCATCCTGCA
+TTATTCTGTTAAACTCCTGTGCCGTTATTCCATAATACATACCAATATCTGAAGCTCTAA
+GCATTTCATTTAAACGCTGAAGATTTCTAAATAATTCTAGTTTCTTATCCTGTTCTTCAA
+TCTTTTCTGTAAGCTTTTGTATCTTTTTTCTTTCTTCTTTTAGTGCCTGAAGTGTTTTTA
+TCATTGTATCTGGGTTATTTAGCATTTCTTCTATTACCTTATCCGTTGCATAAATTCCGT
+GTTTTCTTATAGAAGGTAAAACTTCATCAAAAACCCATCGTTCAAAACGTTCTGCTTTAG
+GTAATTTTGATTTAACAATTAATCTATAAAGATCTCCTTCTGGTATAAACTTTATTTCCT
+GTTCACCACCACTTGTAAGGACTCGGTGTTTCACCGACCCCTTTGTATGCCTATTAATTG
+CATCATAAGGATCTGAATATCCAAGTATCCTTGCACAATCAGTTGCTGGAAAATATTCTT
+TTCCGTCAATTACTAAAATGTTCAATTCACCAAATTCTGTGTTTTTAAAAACTTGTAATT
+CATTCATACCTTTTTCCCTCCCTTATATTTTTTTAGCATCTTCAAAAATATCAGCATAAT
+CTTCAAGTTTAACTTCAATTAGCTTTTCTGCACCATATTTTCTTAATAGTGCTTTAATTT
+CTGTTATCTTACCTTTTTTCATTTTCTCTGTTAGTACCATGCTTATATCTTGAATGCTTA
+TTTGATCATTCATTGTATGGTTCTTTGCTTTTGCTCGATATTCTGCTGCAAGTCTTTCTA
+GTTCTTCTGCAAGAACTAAATTTATATCAGTCATAAATTCCACCTCCTTCACCCTTATGC
+TTTTAGAGCAAAGTCTTTGATAATGCTATTCATTACTGCAAGGTCGTCACCTGACAGCAG
+GATACTTAATCTTTTTAATAATTCCAATTGTTCAGGTTTTAAATATTTTTGATTTAACTT
+ATAACCATCTGTAATCTTGATACCTCCACCATGTCGTCCTCGAATAGTTTCTATGGGGTA
+AGAAAGCGATAGGATATCAATATCATTTTTAATGGTTCTAATACTAACCCCAAACTCATT
+TGCTAAGTTAGCCATTGTGTCTTGCCTTCTATGACATAATCTTTCTATGATTTCTATGCG
+TCTTTCATTTGGTCCCATCGCTTTCTCACCCCCTTTCCTTTGCTCTGTGATTTAAGAATA
+AAAGTTAAATATGCAGACTTTTTGCTTATTTAAAAAAATTTTAGTTCCTGCAGCAATAAA
+AAATAGCCGGAGAAATGCTATGTGCTAAGGAACAATCCTTAAATGCACATTTACATTTCA
+ATCCGGCTATCTAAGCAGCTCACAAGGGATTGAATTTTATTTGATTTTTATATTATTTAA
+GATGCTTCTTCTCTTTTCTTTTTATAAATAGACTTACAGACTTCTTTAATTCGTACCATT
+GTCGTCTTATCTACATATGGACTTATAACAGAACTAATATCAATTAAAACAGGTTCCTTA
+TGCTCTCTGCATTTTATTGATATTAAGAAAGAATCTTCTTCAATAAGAATTTTAAATAAT
+AGCTTTTTATGTTTTCCTTTGTCTCTCACTTCTTCTAATACCATAGGCACCTCCATCTTT
+TTCTCTAATCGTGTCATGTCAGCTTTTAAGCGAACATATAGCTTAAAAAAATTTTGTCTT
+AGTTTTATAACTTGTATGCATTTAGTCATTAACATAATGCAAGAGTAAAATTGATACATT
+TGTTTTATGCACGCTTACATGTGAACATATTGTTTCAAAATAACAACACGAGCTATAGCT
+CCTGCTGTCATCTTTATATTGAAATTCCCAAAGTATTTAATCTTATTCCAGCAGCCTGTT
+TTGATACTTGAAACACAGATGCTAATTCATCAATTATTAATTCTCTAATAATTTCCGGAC
+TTAATCCTCTCCACAAAAAATCGTTTATTCTTTTTCCTGCTTTATATCTTCCTCTTAACT
+CTTCTGCCTTTATTCTAAACATTTCTGCTGGCATTAGGATTGCTGCTGCTATGTTATCAG
+CCTGCCACTCTATCCACTCATCTGCTGTTTTAGGCTTGTATGCTTTTTGTTTAGGACATC
+TACAGGCTTTTGCCATAGCTTTATCTTTATATGACAGGGTCATAAATCTTAATTGATGCT
+TGTCCCAATGAACCATTTCATGGGTAACAGTAAACCTTTCTCTGCCTCTATTTGCTATTT
+CAGAAAGATCGCTTTCAACTAGAAGAGTTCCTTTTTTATATTGTCTTACAATATTTTGCT
+GAGTATCCTTATCATAAAGTTCCACACATCCATCAGAAAATATCATCATCCCTAAAGTAT
+CACAGTTTCTATCGATATTTACATAGTCTATTTCAAGTCCCATTTTAAGCTCTGCAATAT
+CTTCTACTGGTATTGCCATTGGTTCTTTCAAACCTTGTGGATAGTATTTTTGCAAAAATT
+TAGCTGCTTCTTTATCTATATCCCCTTTTCTGATGATGGGAACTAAATCATTATTCAAAT
+TCATTATTACCCCATCCCCTTTATTTATTGTAAGCTTCTATGTCATTTATAACAAAATCA
+CTTAATGAAGCATTATCTAATACTGCACTGCAGCTTAATTTAAACCATTGGCGTATTGAC
+TCTGAAATATTTTCTTTAGCAAAATAATCCCCTATTTCTATATCGCAATTAACAAGTATA
+TCAAAACTTACTTCTTCATCATCTTGCTTGATGTTATTGACCCTTAGTATTTCTATATTA
+TCCAATGTAGCTTCTAAAACTTCTATTACATCTCTAGCTCTTAATGTTAAGTCATACTCA
+GAATAGTTATTCATTATTTCATCTTCTAAAGTATCAAAAATTTGTTGGTAAAATTGTTCT
+TCTATCATACCTTTAAAATAATCATTCATGAGTATCCCCCTCCCTACTCTTTCTCATCTA
+AGGCTTTAATAAATTCAATCCAAGCCTTTTCTGTAATATCACTTTTCCCCTCACTTTCGA
+TTTTACGTGCTTTTCTAAGGGCAGTTCTAGCCAAACCACTTTCTTTTATATAATCAGGTA
+AGTCCATAGGGATTTCATCCCTATCTTCAGATGCTATATCAATCATATAATCTGTTTCTT
+CTGGTGTTAGTCCTAATATTTTTGCTATTTCCTCAATCTTATTGATATTAGGTGGATTTC
+TTCTCCCTTTTTCAATATCACTCCAATAAGCTGGAGAGATATCTAACAGCTCTGCCATCT
+TTCTTAAACTTATTTCCTTTTGTTTTCTTTTTTCTGCAATAAAATCCCCAAACTTACTAC
+TCATAATATACACCTCCTTTCACTGTCAGCATTATTTATTTAAAATTGAGTTTTGAACAC
+TTAAATAATAGAAAACTGCTTATATTCCTGTTTTTCCTTAATGAAATTCAAATTTTTAAG
+TCTTATCCTTGCAGCTGTTAAAGATACGTCAAATATATCTGCAATTTCACGACTTAAGAC
+ATCTGCCCATAAATCTTTTTCAAAATCAGTTCCCATTTCATAACACATTCCCACCATACC
+TGCTGACTTAAATTTAGCTGTTACATATCTGGTAAAGATTTTCTTAGGCATTAATAATGC
+TGAAGCCATATAATCCGCCTGCCATTCAATCCAATCATCATCAGTTACAAGCTGCCTTTT
+CCCTGCACTTTCAATATCGATTGTACGGCATTTTATCACTGGCTCATTTGGGATAGCACT
+ATCAAATAATGTCATCTGCATTTTATTAATTGTGTAAATATGTCTGTGTAAAAGCCAATG
+TGCTATCTCGTGTGCATGAGTAAAGCGGCCTCTTCTTAATTGATCTTCATTCAGAAGACT
+ATTGTCTATTAATATAGTCCCTTCATTTACTGGTATTCTTTTCGCTTTATTATTATCTGC
+ATCATATACAGGAATATAACAATCATTAAATACTGTCATTCCTAATATGGATTGATTATG
+TGTCAAATCTTGATAATCCATTTCCAATCCAGCATAACATTCTGAAAAATGCTCTACATC
+TAAACTGCAAGGCTCTTGAAGGACCTTTGAGTTATAATCCTGTAAAACTCTTTCTGCTAA
+ATCATCTATCTCTACTCTTTTAAGAATAGGTGTACCATTATTTTTAGTTTTAAAATCTAA
+TTGAATCAATCTACCATCCCTCTCATAAATGCATGTATGCTTCATTGCTAACACTATTAT
+AATATGGCATATTATTCCTTGTCAAGAAATAAACATACAAAAACCGAAAAATAAGACAAT
+TTTATTGAGATATCTTACTTTTCGTACATAACTTTTTCAATTCTTCTCTAATATTTTTGC
+TAGTGCCATAACAATACCTTTCAATTGCTTCTTTAATATTAAGAAATATTCCTTGAACCT
+TGCCAAACTGTGATACATTTTCAAAGATAGCTTTACATTTTATTAAACAAAGGTAGACTC
+CAACAAAATTCTAACTTTTAGTATTCAGTACCTCTATTATTTTATTTACGCAGCCATCCA
+AATCTTTGATAATCTGCTTAGACCAGAACCTCAGTACAATCCATCCTTCTTCTTCAAGCT
+TCCTTGTTACTTCTAAATCTCTTTCCATATTTCTTTTTATCTTTTTATTCCAGTATTCTT
+TATTTGTACCTGCAACATCTGTATTCTCCTTATAATTGTATCCATGCCAAAACTCTCCAT
+CACAAAATACAGCAACTTTTTTAACCACAAATACAACATCAGGCTTTCCAATTAATTTCC
+TATAATTTTTTCTATAACGATAACCTCTGCTCCACAGTGCTTTTCTTAGAATACATTCAC
+TCTTACTGTCTTTATTTTTTATTGCTCTCATATTTTTTCTTCTTTGTTCTGGAGTTAAAT
+TATCCACTATTTTCACCTCAAATTTATTAGATAAAAACTGACTTGTTTAATTAATGCTAA
+TTTTAATTTACCATTTTTTGTACACTATGCTTACATTTAAATCTATTCTGCTTGTACTAA
+TACCATTTTTTTAATATAATGTATTATATGAGTAATAAAGGGGTTGATGCTAGTGGCCAT
+TGCTGGAAACAGTTATACAATACAATTAAAGCCTTCTCATCTTGGTTGGGGAGATTATCG
+GTATACAAATACGAGAGATATTATCTACGGAGAAGGATATATTCCTTTACCCAAACCATA
+TGCTAAAGCATTTAATATATTTAACTCGAATTATTCTGCTACAGGCCTGGGATATAATTT
+ATTTCGTGCTTCATCTGTTGATGGTTTTTTAAATAACGTAACGCTTCTGGCCCAAGGTTC
+TTCAACTGCTGGAGATATATATGCTAAACAATTTTCTGTACATGGTAATCTTAAGATGAT
+TGGGGCATGGTATGCGAGTCAAAATGCAACAACTAACAATTTAGTAAGAGTTACTTGGAC
+ATCCCCAACAGATATTCTTCTTGAAATAATTTAA
+>NC_009012.1|provirus_2931283_2970170
+CTATTTTGCAAACAACTCCTCTATTTTGGACACAGCTTCTTTTTGAATATTAGGTAACAC
+ATGGCTGTAAGTATCAAGGGTAACGGAAATTTGGCTGTGGCCAAGACGTTCGCTTACTAT
+CTTTGGATTTATGCCTTGCTGTAAAAGCATAGTGGCGTGGGTGTGCCTCAGGTCGTGGAA
+ACGTATTTTGGGGTAACCTAGCAGCTTGATCAGTTTTGTAAATTTCTGACCTAGGTAATG
+GGGGTCATACGGTCTTCCGTCGTCCCAAGCGCATACAAAGTCTTGGTCATTATAGGCAGA
+ACCCATTAATAGCTTAGTTTTATTCTGCTTTCTTTTGTGTTCTTTTAAAGCTTGGACGGT
+GTAATCCATTAAAGCTATAGTACGCATTGATTTAGCTGTTTTTGGTTCTTTAAGCGTAAG
+TACGCCGTTTATGCGCTGTAGGGCATATTTGACCATTAAAAAGCCCCGTGGAAGGTCAAT
+GTTCTCCCATTTTAAGCCGCATATCTCACCTGCCCTCATGCCGGTTTGCAGTGCTAACAA
+TACTGGTATATAAATCGGTGTCTCGGCAATGTCATCTAAAAATTTTTTGGCTGTTTCGAC
+GTCCCATACTCGCATTTCTACTTTATCAGGACGGGGTGGCGTAACGGCATCGGTGGGGTT
+TGATATTATAATCTGCCAGTTTACCGCATGTTTCAACGCCAGGTGCAGCATGCGGTGTAT
+TTTTAAGACGGTGCTTTTACTTAAGTTTTTCTCCAGCAGGGATGAGTAAAAGCTTTGAAT
+ATGGGCTGGCTTTAGCTTCGGCATCATGATGCCGCCTATATGAGTTTTTATATGGGCGGC
+AAATTCGGTATAACGCCTATAAGTGCTCGGTGCTACATTGTTTTTGGGGTAAGTATCCAG
+CCAGTAATTGAGGTATTCGGCTACAGTCATGTTTGCTGGTTCAAAATATTCACCCTTCTC
+TATTTTTGCGATTATGTCGGCCAGGGCCTTTTCGGCTTCCTTTTTTGTTTTGTAGCCGCT
+AAACCACTTTTGTTTGCGTTTGCCGTTTTCGTCACGGCCGATGTCAACTACTATGCTGTA
+GGTGGAACCTCTTTTGCGTATATGGCCGCGCATAGGCTATCCCTCCTTTTAAGGCATATA
+ACTTTAAAAGACCACCGCCTTGCCAAATTTTTACAACGAATGTTTTCTTATTGCTTCGAC
+AATAGCGTCTGTATTCCAGCCTACTATTTCAATAGCTACGTCAGATACTGCTTTTGGTAT
+TCTTTCTTGTCCCCATGGTTTTATTCCTATTATAGGTTTACCATAATCCACAGATATATC
+TATTTCTTTTTGAATCCAGAAACTGTAAGCTGCATACATTCCTGACAAAATAAGCACACA
+ATTTACAGGACGAATTTGTCCTTTTAGCTCTTCAATTAATGTTTTCTGATCGACTGGGTC
+GTCTGGATCAATTACTGGGTCATGCTGTGGGACAGAGTAATTTCTCCATTTAAAATTTGG
+AGCTTTATTTAGTAGGTCTACTAAACGGTAATAATCATCATTGTATTTCCATGCATGGCT
+AATGAACAAATCATATATTTTTAGGTTGGGCATTGTTTACACACTCCCCTTCATTTGTGA
+TATAATCATATTAGAATCATAAATTTTAGAATAAGGCAGGGCGGTGGTCCCATGCAGAAT
+ATAAGAAAGAGAAAGTTTCGGAAAAAGCCCATTATCATTGAAGCCTACCAGACTGACAAG
+GAAATCATTATAAACACGATGGAAGGTCCTCTTAAGGCTTCGCCGGGCGATTGGATAATT
+ACCGGGGTAAACGGCGAACAATACCCATGCAAGCCGGATATTTTTAAAAAAACTTATGAA
+CCAATTGAGGATGAGTGATTTGTGTTTCTCACGTTATGGAGAGGGTTTGTTTGCCTTTGA
+CTCCAGTCAATGTGTTCGGTTGACATTATGCGTTCGCATTGTTCAACGAGCAACTTAAAC
+GGATCATCTGTTTTGGAATATATGCCAGCTTTAGTAAAGTATAAAAATTTTTCTTGCTTT
+AGTGCTTCGCATGTATTCCTATATTTAATCCAGTTTTCTTGGAATTTGCAGATGCCGTGT
+ACAGCTGCAATGATTGATATAACTGCGCTTAATATTGCTATAAGCAGTTTTAGATAAAGA
+GGTCCTTCCATGAGTGAAATCATAACAGTAATAGATGCAGACAGGACTATTTCTGCTATT
+CTTAGTCCTTTGTATATGTATTGATTTTTAGTGCTTTTTTCATCATACCACATTATCTGG
+TCATCTAGCCTTTGAGAAAGGTATTCTTCTTCTTTCATAAAGATATCCCACCTCTTTTCT
+TGTCGATTTATTTCATATGCAAGATTTTATACTCCACCAATTCCTCATTAACCCCTAGTG
+TGCTGGCGATATAACTTATCGGTTGGTAGCGCATTTCCTTAATGTCGTAATCATCGATAA
+GTAGCTCTGCTGCAAACTTGTTGGCCTCACATTCATACGGCCCAATAGGGAACAAGGTAT
+ATTCTCTGATAAAATATATTGGCTCTGATGAGTGCAGGATGGCATGTCCAAGTTCATGGG
+CCAATACGATACGCTGGCTGTATTCATCCAATGTACTGTTAACGACTATAAATTTATTTC
+GCAGCGTTTTTATGTAGTATCCTTTTGTATGATGTGAGTATTCCTTATGTACGACGTGTA
+TGTTGAGGTATTTTGCAAGCCTTAAGGGGTCTCTAGTTTCATATTTCTGGACGAGGTGCT
+TTACACGGGCGTGAATATTCTTTTTCACTCCGGAAGCACCTCCTTATTGGTCGGTTTTTG
+CCTTTTTTCTGCCGTATTTCTTCTTGTTCATCTCCTTTGCCTTCCAGAAGAGCTCGGATA
+TATCTCGAAAGAGCTTTTCTTTGTCTTCTTCTGCGACCTCATCGTTCATGAAGAAGATGC
+CGGCCTGCTTGATGAAGTCTTCATACTGCATTAGGTCACGTTTGGTCACTTTATGTTTTT
+GGGTGTATTCTTCAGGGATGTAGGGGTTGCGGATGTCAGTGCGACCTAGAAGATAATCGA
+CTGATACCGAATAAAATTCAGCTAATTTCTGTATTGTGACAAAGTCAGGTTGGCTTTTGC
+CTGTTTCATATTTTGTATATGTGGTTCTATCTACGCCAATAGCATCGGCTACATCTTTTT
+GGCTTAAGTTTTTCTCTGTTCTTAACTGCCTGAGAATTTCATTAAAGGGCATGTTATTCA
+CCTCCATATTTTATTATATGTGAATCTACTTCACATAACAATTATAGTGCAAAAATTTCA
+CTTTGGCTATTGACAAAGTGAAGCAACTTCACTATAATTAATTTCGGGGGGTGAAGTTAA
+TGCACAACAAAAACGTGGCAAGTGAAGTAAGAGAACTTATAAAAGAAAAACGTGCTGCCT
+TGAACCTTACACAAAAACAGCTAGCGGATTTGGTAGGAGTTGACAGAACAACAATTTCAA
+AAATTGAAAATGGAATAAGACCATCTGTAAATAGTGCCAAAAAAATAGCTCAAATTTTAG
+GCTTAGACTGGACAATTTTTTTTGATAGCGATGAAGAGCATCAAACCGAGACTGCGTAAA
+GGAAGGGGGTGAGGGGGATGGCAGACTTGCCACAGGTATTTAATTACAAAGGCAAACAAG
+TAAGGACATTTATCATCGATGGTGAACCGTGGTGGGTTGCTAAGGATGTGTGCGATATTT
+TAGAGCTTGGCGACACTCACAAAGCTATGGAAAGGTTAGATGAAGATGAGCGGAATACAA
+TTCCGGTCACCGACTCACTTGGAAGATTACAAGAAACTTATGTAGTTAATGAGGCTGGTT
+TATATAATCTCATTTTAGGTAGCAGAAAGCAAGAAGCTAAAGAATTTAAACGATGGATTA
+CCCATGAAGTCATACCTCAAATACGCAAGACAGGGATATATGCATTAGAACCAAAACAAC
+TTTTAGCAGTAGCAATAATTGAAGCACAGAAAATCATAGAAGAGCAAGACAGGAAGATAA
+AAGAATTACAACCCAAAGCGGAATTCTTTGATGCGGTAGCAGGAAGCAAAGATGCAATTG
+ACATGAACAGAGCCGCAAAACTGATATACGAAGAAACTAGACTAGGCAGAAACAAGCTGT
+TTAAGTTACTGCGGGACAAAGGCATTTTAATGAAAGACAACATACCGTATCAAGAATACA
+TAGACAAAGGGTACTTTAGAACTATTGAGCAGAAATATACGAAGCCAGATGGAACAACAC
+ACATCTACATTAAGACTCTGGTTTATCAGAAGGGGCTGGATTTCATAAGAAAGATTGTTA
+AAGAGGATAACGTAATACATCTTAAAAGAGCAAAGGGGGTTTGACAATGCGATACGAGGA
+CTTGCCTGATGTTTTAACTATACCGGAGATGGCAAAGTTTCTCCAGATAGGCATCACCAA
+AGCATACGAGATGAGCCACTGGAGGGGCTTCCCGGCCATACGAATAGGGCGGGCAATACG
+GGTACCCAAGAAAGCATTGCTGGAGTGGCTTGAACAACAGAGCAAACAGGAAGAGCCCAG
+ACTAACTGCAATTAGGGTGAGGTGATAAAAGAAAAGCCGTTTTCAAACGGCACAAACAAA
+AACCACTACACCCTCATTATACCACAAGGTGTAATGAGGGGGCAATAAGGGGGAGCGAGA
+ATGTTGTATAAAGTGACCTCACCCATGTTAGAACAGGAGATAGTTGTGGAAGCACAAAAC
+TCAACGCAGGCTAAGAGAAAGGCTTGTAGGTTGTGGGGCGTTAGCCCCAGCGACGAATGG
+CATGGCATATCCACGATGCAGGCCAGAAAGTTAACAGAGAAAGAAAGACAAGAAGAGTTG
+AGAAAGTGGGGGATTGAGGATGCGAGTATTTAAGTGTGGCTGCTGTGGCTATAAAGCACC
+GGAATATATGTTTGCATACGGACGAGGGCGGGAGTACGGTGAGCATCCGGAACACCGCTA
+CTGCCCTCAGTGTCATCAATCAATTGATTGGTACGGATACGGGATATTTTGGGTAAGTGA
+ACAGGCATCTTAAGGGGATGAAATACAAATGAGAAAATGGATCGGGAAATATGGAATGTA
+TATCGTAGCAATTGCTGCTGGTGCGGTACTGACACCGGCAGCAATCCGAACAGCAACACT
+ACAAAGAGGGTATAAGGCGATAGGTGGGGAGTATTTGATTATACCTCTTGCAATATTGAT
+AGTGTTCTTTGTGCAGGAAGTAAAACAAACAATAATGGAATTGAGGGGAGGAATAAAGCG
+TGAATAACGCATTGCAAATGCTTGAGATAGAAGAAGTTTACAACATGCCTGAGGAAAAGA
+GGGAGCGGTTTAAAGTAACAGATAAGGATAGTGCAAATTGGTGCCTGAGAAAGATCAAGG
+CTCTAAAACAGGAGATAGAGGAGAACAAAAGGATAGCTGATGCGGAAATACAACGGATAC
+AGAGCTGGTTAAAAGAAGTAACTGAACCACTGGAGAGGTCAATACAGTTCTTTGAAAGTT
+TACTGATTGAGTACCATATGAACATATATGCTGAGGACCCAAGCAAAAAGACTATCAAAC
+TACCATATGGCACATTGAAGGCTAGGGCTCAGCAACCGGAATTTTGCAGAGACGACGAAA
+AGCTGGTTAACTGGCTTAAACAAAATGGTATGACAGAATTTGTAAAGGTCATAGAAAAAC
+CTGAATGGAACGAGCTCAAGAAAAAAGTAAAAGTGATAGGTAATAGCGTAGTGTACGAAG
+AAACTGGCGAGGTCATAGATGGTATAACTGTTCAGGAAAGACCGCCTAAATTCACAGTGG
+AGGTGGAATAGATGACAAAAAAGTTAATGGAACTAGAACAGAGAGAAAACATAAATGCGA
+GCATAAGTATATTGGGCAGCGTGGATATTGCGCAGGTCCAACAGATCCTAACGAGTATAG
+AAAAATTTCAAATGGTTGTTCAAAAAACGCTAAATGAAGGCCATGACTATGATATTATCC
+CAGGCACATCGAAGCCATCACTTTTGAAGCCAGGGGCAGAGAAAATTTTGGTGTTGCTCG
+GGCTCACGTCGGAATACGAGATTATTGAAAAAATAGAGAATTATGAGAAGGGCATATTTG
+CATATACGGTTCGATGCATTCTGTCTAAAAACGGGAAAAAGGTTACAGAAGGACTGGGCT
+CATGTAATTCCAAGGAGGATAAATACCGGTGGCGGTGGGTATCGGAAAAGGATCTCCCAC
+CGAATGTTGATAAAGATATGCTGAAGAGCAAAACCAATGAGTACGGCCAAAAGCTATACA
+GGATTGAGAATGACGAGATATTTACTCAAGCGAATACAATCCTTAAGATAGCCAAGAAGA
+GAGCACAGATAGATGCGGTACTTACAGTCGCTGCATTGAGCGAGATATTTACACAGGATG
+TGGAAGATATGCAGGAGTTTCTGCAGAACGAACAGCTTGAAACCATGAAAGCAGAGGAGG
+CTGTAAATGTTAAGGTCACGTTCGGCAAACACAAGGGTAAGACGCTTGGCGAAATATACA
+GCCAGGCACCGGACTATGTGCAGTGGCTTGCGCAGAATGCAAGGAATGATGTCTTAAGAA
+AAGCGGCTAATATGGTTATGAACGGCAAAGGTAATGAGAGTCAACAGGAAGCTCAACGTT
+CGGAGGATCTATCGAACAATCAAGGAGAAGACAATATACCTGGGTTTGAGCTGACGGAGG
+AAGAACTCCCGTTCTAAAAACGGGCGAAGCTAGTTCTGTAAATTTGATCGCAGGGGTCGC
+TAAGATAGCGGCCCCGCCTAAATGTGAAATAAAAGGAGGCTACACCATGAACCGATTCAA
+ATGCCCCGCATGTGGCGGGAATCAATATACAGCATGTTCTACGTCTGAGAAGTGTATCTA
+TTGCGGATACAAAGGGCAACTAATGAAGATGGAGACGCTAGAGCCGGAAAGTGAAGGAAA
+AATGATAGATTGCAAATATTACGTGCCAGCATGGGTAGGGAACAAAACTACAAACCCACA
+GTCGGACTGGTGCTTGAAATATGGTGTAACCTTGGGCGGGAAATGCCTGAAGGGTTGCAG
+TGAAAAGAAGGATGTGAGGAATAGTGAAGTATAAGGTGATGTTCACACATAGCGACAAAG
+GACAAAAAAGAGGCCATAAACTGCGTGAAGGCAAAGAAATATACCAGCATCCGGAGGGGT
+ACTTCGTAGTGCTGGAGTTTGAAGGCGAAAGCGGGAAGTTCAGGGAGGCTTTTTGGCCGG
+AGGATATTGTGAAAGATAAGTTGTTTTTGTGAAGGTGGAGGGGTCAGAATGCCAAACAGA
+ATCATTAAAGAATCAATATGTACAAGCGACACCATAGACCAATTATCTTGGTTTGAGGAA
+GTGTTTTTCTATCGCCTCCTGGTTAATTGCGATGATTATGGGAGGATGGATGCAAGGCCG
+GCGATTCTGAAGGCGAAGCTGTTTCCTCTTAAAAGTGTTACCGAAAAGCAGATTTCTGAT
+GCTTTAAATAAGTTATCGACGGTAGGTATTGTAGCCCTATATGAGTATGATGGGAGACCG
+TACCTGCAATTGGTAACTTGGGAAAAGCATCAGCAAATACGTTCCCGGAAGGCAAAGTAT
+CCATTGCCTCCAGAGGATATTCCTTGTAAGCGCGAACACATCATGCCCGAAGAAAAAGAC
+ATCGAGGACCTCTTGTATGATGTCATGAGCTCAACGAAACGATTTGAGGAACATACCTTG
+CTCTCGGTTGAAAGACAGGTAAGGGTCGGTGAAAGCTATCTTGATATCGTTGCTAAAACC
+GAGAGCTCCGAAACACTTGTATTTGAATTGAAACGCGGCCGGTTGAGTAATAAGGCTATT
+GACCAGATATCCAAGTATTTGACCCTCATAAATGGAAATGGCATCTTAATAGGCTGCGGC
+TTAAGCGCCAATTTCGACATTGAGCGGTGCAGGAGCAACGATATAGCTGTTGTCATTTAT
+GATGATGACCTGAATATGTCGCTTGTATTAGGTAACTCCACTGTAAACAGTATTGATTTA
+ACGTTAAATCACGTTAAATCACGTTATGCAAAGTTAGCGCCTAATCCAATCCAATCCAAT
+CCAATCCGAATCCAATCCGAATCCAATCCTAATCCGAATCCAATTAGTAATAATGGCGCG
+AACAAGTCGCGCGGATTCACTCCTCCTACTCTTGAGGAAGTGGCCGCATATTGCCAGGAG
+CGTAACAACGGTGTTGATCCACAGAAATGGTATGACTTTTACGCCGCCAAGGGTTGGATG
+ATTGGGAAAAACAAGATGAAGGATTGGAAAGCAGCGGTGCGCACTTGGGAGAAGCGGCAA
+CAAAAAGGGGGTTATACATACAACTATGAGGATGGAGGCGATAGTCTGTGAACTTTGACG
+GTATTATCGAAGATCTGGCGAAGAAGTGTGAACCGAGCGAAGAACACTTTGATTATTACA
+AAGACGGCCTGCTTATTTGTGGCAAATGCAATACTCCCAAAGAGTGCGTGGTTGAAGTAT
+TGGGGACACTCAGAAAATTTGGATGCATGTGTAAATGCCAGAGTGAAGAGTACCGTGCCA
+TGCAGGAGCAGATCAGGCAAAGGGAAGAGTTTGAGCGGATCGGTCGCCTCCGGACGCAGG
+GCATCCAGGACCGATGCTATTGTAACTGGACTTTTGAAAATGACGATGGACGGAACCCTC
+AGCAAATGGACAAGGCTATGCGGTACTGCCTGAGATGGGAGGAAATGTACCGTGACAATA
+TTGGACTCCTCCTTTGGGGCGATGTCGGAACCGGCAAGACGTTTTTTGCGGCCTGCATAG
+CAAATTACCTAATAGACCGGGGCGTGCCGGTGCTTATGACTAACTTTATTAGATTGTCGA
+ATGCACTAATGGCCCTTGACGAGGACAGAAACGAGTACATTAAATCCTTAGACAGCTACA
+AGCTGCTCATAATCGATGATCTGGGCGCCGAACGGCAGAGTGACTATATGCTTGAGCAGG
+TCTATAACATCATAGATAGCCGTTATAAGAACGGCCAACCTCTTATTGTCACAACTAACC
+TGCCGTTGTCGGAAATCAAGAATCCTTCTGATATCAAGTACAGCAGGATTTATAGCAGAA
+TCATTGAAATGTGCGTGCCCATCAAGTTTGAGGGACCAGACAGGAGGAAAGAAATATTTA
+ACTTAAAGTTGGAAAAAGCAAAAAAATTGTTCGAGGGTGATTAAAATGCCAGTAAACAGC
+AGAGAAAAAGGCAAGCGCGGCGAACGGGAATGGGCAAGCATATGTCGGGAAGAAGGCTAT
+AACGTTAGGCGCGGACAGCAATACAACGGCATTGAAGGAGCTGACTGTGTCGGCTTGCCG
+GGAATACATCAGGAAGTCAAACGTGAACAGAGATTGAATATCGAAAAGGCATTGCAGCAA
+GCAACCAGAGACGCAAAGGACAGCGAGATACCGATAGTTGCCCACAGGAAAAATGGAGAG
+AAATGGAAAGTGACCATGTGGGCAAGTGATTGGTTCAAGCTATATCGCGAGTGGGAGGCA
+AGCGAATGGTTAAAGAAAAAAGAAATCAAAGAATTTGAAGGACAGGAGTTGTGGGGTTAG
+GGAGGCAGATCACATGAGCCGAGGAAGACCAAATAGGGGGTGTGAATGTGGGAATCCTAG
+AAAGACGCATATACAAAAAGATTGAGTACTATTTATACCACTACCACCAAATTCGTAAAG
+AGATAGAACAAGAAAAGGAAATTATTATCCAGTCAGGTGGCCGTGACCTCACCGAATGGA
+GAGGCGGTATCAGCTACCATTCGGATCCGACTGCGAATAAGGCTATTAAACTCACTAGTC
+CAGAGTTGCTAGAAAAAGAGAAATGGCTGAAGGTGATAGAAGGTACTATTCAGCATTTCC
+AAGGTACAGAAAAGGGCCGCTTACTACAGAAAAAGTATTTTGACCAGCTGGGAGAGCGAC
+ATATATGCAAGGAATTACACATCGAAAGGACAACTTACTATCGATGGCGAGAAGAAATTG
+TGCTGTATACCGCCTTACTAGCGGCGCAATATGGTCTTATAAAGTTTTAAAAAATTCAGA
+ATTTTTGGCCAATGAATGTGTTACAATGATAGCGGGAATATTATGATATTTGGGTGTCAT
+AGCAGAACAGATGCAATACAGCATAACTCGGCTGATGAAATATTTGAGGGTTAGATTGAT
+GAGCTGTTGAGGAGTTGCATGGTTCATATATTAGTAGCCAGGGTAGATGGGGGGTCAGAG
+AAGTATATTAGTCGTTTGCTTATAAAATGGGATAACAAAGGCAGAATTGAAAGTAGAAAA
+AATATAGAAGAAGGAGTGGTTACGTGTATTCTCACCGGTTCTAAGGGGTTCATATGCAGG
+CTTGATGTGGGAAAAGTATGTTGTTACGTGAACTTAGATGGCGTAGCCTTGTATCTGATA
+AATTTTGTCATAGATGTATAATTAAGTCAAGCTTAAAGTTGTAAGCAAAATATGCTATAA
+TAGATTGAGGGAAGAACGAGGTGAGATTATGAAAAGAAATCCACTTGTTGCTCCTGTGTT
+GAAGTGGGCAGGAGGGAAGCGGCAATTACTAAAAGACATAAAGAAGCATATACCAGAGAA
+ATTTTCAACTTATTATGAGCCCTTTTTAGGTGGTGGGGCTGTTTTATTCGAACTACAACC
+TAGTAAGGCTGTAGTGAATGATATAAATGAGGAATTGATGAATGTTTATTTAGTAATTCG
+GGATCATGTTGAAGAACTCATTGAAGAATTAAAAAAGCACGAAAGAAAAAATAGTGAAGA
+ATATTATTATGAAATAAGAGAACTAGATAGAGACAAGAGAAAGTATGAGCAATTAAGTAA
+CATAGAAAAAGCTGCGAGAATAATTTATTTAAACAAAACATGTTATAACGGTTTGTTTCG
+TGTAAATTCACAAGGTCAGTTTAATGTTCCTTATGGGAGATATAAAAATCCAGATATTGT
+GAATGAAGTTACATTAAGAGCAGTAAGTAATTATTTTAATAAAGCTAAAATAACTTTTAA
+ATGCGGAGATTTTGAAGAAGCAGTTAAGGGGGCAAGAGAGGGTAGTTTTGTGTATTTTGA
+TCCGCCTTATGATCCCGTTAGTGATACAAGCAGTTTTACAGGTTATGATATAAATGGGTT
+TGACAAGGAGGAACAGATAAGGCTTAAGGAATTATGTGATAAATTAAATAAAAAAGGTGT
+AAAGTTTCTACTTTCAAACTCAGCAACAGATTTTATTTTGGACCTGTATAAAGATTATAA
+TATAACAATAGTCCAAGCTAATAGGGCAATTAATTCAAAAGCGGACAAAAGAGGAAAAGT
+TGATGAAGTGCTGGTGAAGAATTATGAGTGAGACAAAGAATGATATTGCATGGGAACGAA
+TTTTTAAGAAATATAGAATATTAGAGAAAATAAAGAAAAATGGGGCTTTTGAAATAACGT
+CAGGGCAAATAAATGAGTTTAGAGAAGCAAGGTTAATGACAAAATTTGATCACCGAAAAA
+ATTTACCGAAGATTTTTGAAGAAAATAATTTTTCTATTCTTCCTATTACTAGAGGTAGTT
+ATTTAATTGCGCAGTTTAAGGCTTATCATAGGCTTGAGGAAAAAGAAACAGAAATAATCA
+AGATTCCATTTCCTACTTATATTGAAAGTATTGATTATGAAAACATAACAAGCGAGGCTG
+CGGCTTTAAACTGTGCGTATGTTTCAGGTATATTGGCTGATTTTATTGAGGATGAAGAAA
+TGGTTCCAACAGTTACAGGTCGAATGAGTTCTGATGCGTTTTGTTTTTATATTAATACTT
+ATTCGGGGTCTAAGTTTAAAGTTAATGTTACTAATGCTCAAATTGAGATAGATGGTGGAT
+ATGAAGGGCTGGGAACCTTTTCTTTAATTGAAGCGAAAAACTCGTTATCAGATGATTTTA
+TAATACGACAAATATATTACCCTTATAGGTTATGGCATGATAAAATTAACAAAAAAGTTA
+AGCCAATATTTATGACTTACTCTAACGGTATTTTTACTTTTTATGAGTATGAGTTTCAAG
+ACCCTGAAGATTATAATTCTCTTACTTTAGTAAAACAAAAAAAATATAGCATAGAGGAAA
+CAGAGATTGGGCTTGATGACATAATAGAGATCTACAAAAGGACAAAAATTATAAATGAAC
+CAGAAGTTCCATTTCCACAAGCAGATTCATTTGAAAGGATAATTAATCTTTGCGAGCTTT
+TAAATGAATCAGAGTTGACTAGAGATGAAATAACAACAAACTATGATTTTGACTCTAGGC
+AAACGAATTATTATACAGATGCAGCTAGATACTTGGGATTAGTACATAAGCGTAAAGAAG
+GTAGAGAGGTAATATTTTCGTTGACAGAAGAGGGGGAAAAATTATTTAAACTGAAATATA
+AGCCAAGACAATTAAAATTTGTTGAATTAATTTTGTCCCACAAAGTTTTTAGAGAAGTTT
+TTGAATTGTGTCTGAAAAATGGAAAAATGCCAGATAAACATGAAGTAGTGAAGATTATGA
+GATACAGCAATTTGTATAAAATAGAATCCGAGAAAACATTTTATAGGCGTGCTCAAACTA
+TAATGAGTTGGATTAAATGGATATTAGAATTAACTAGATTGTAGTACATAGCCAAAGATT
+GTACAAAAGTTCGGTACTTTTTAAACGGATTTATATGGTAGTATAGTAGTATAGAATTGT
+ATACTTTCCTCTTCAGCCCGGTTGCTCAGCCGGGCTTTGTTGAAAAATATGGTGGTTTTA
+GTAGGATTTTCTTCCTTTCTTATAGAAAATTAATACGAGATAGGAGGAAAGTAATAATGG
+GGGATAAGAAAGACGCTATAAAAAGTTTTCTTACAGAAAATGTCTTAGGCGTCATAATTG
+AATATGGTAAAGAAGCGGCTAAAGCTCGGATAAAAGATGTTGTTACTAATGACGCTGCGA
+AGTTAGCTGCAGCGGTTGGTATTGATATGGCAGGCTCAATAATACCGGGAATAGGGAGTG
+CTATTTCTGCATATAGAACTCAAAGACAACTTAATAATTTAAATACTTTAGTATCAGAAC
+TTAACAAGAAGGTTGAAGAGATTAAATTAAATTTTGAGAGACAGACAGAAGAAAATAAAA
+AAACCTTGGACGCAATTTTTGAAATGGTTATTTATAAAGCGGTTAATACTAATCAAAGCG
+AAAAAATAAAGTATATGGTTAATGGATACGCAAATCTGACAGCTATTCAAAATGTATCTT
+ATGATATAAGCTATCTTTTTTATGATGTTTTAGATAGAATGACTATATTAGATATAGCTG
+TTTTGAAAGCTTCATATCCTTTTTGGGGTACTGAAGAAAATAGGAAAAGCTTTGTAGATG
+TCTTGAATGAATTTGGCATAGATTATTATCAGTATGAAGCGGTAAGGGATAATCTTTATC
+GAATGGGGTTGCTAGAGAATCAATATGATGATGCTTTAGAAAAAGATCTAGATTTACTAG
+TTAAAAATGTTAATAATCTAAATGAAGTAGTTATTTCAATACAAGAAAGTCTTGCAAATC
+CCAGGAAGAAAATGAAGAAGCTTAAAAATACAAAAGTTGAATTAAAAGCTAAAGATCGTT
+TAAAGATATCTAAATTTGGCAGGGAATTTGTTGAATTTTTTATTAAAAATTATAACGATT
+AAAAATTATAACGATAATGTTGGAACATAAAGCTACTTGTTGAAGATAGCTTTTTAATTG
+GAGGGAACGATATGGATATTGGAATGTTTATAAAGAAATGTTTTGAAATAGGGATTTCAT
+TATTGAATAAAGAAAAGCTAACAGAGGAGGAGAAAGAACTTTTAAACGCTCTAGATAGTT
+TAGAAAAATGGATCCAAGATAGAATCCTTTTTGAGAATTAAGACTTTGGATAAATTAAGC
+GGGGTGAGGTGATGTGAAGCTAACAGAGAAGCAAAAGGCATTTTGCGATTATTACATTGA
+GACATTAAATGCTACTGAAAGCTACAAAAAAGCAGGATATAAAGTCAAAACAGATGGTGC
+AGCTAGAGTTAATGCTTCAAGATTGCTAACAAATGCTAACGTTAGGAAATACATCGAAGA
+GAGAATGAAGCAAAAAGAATCCGAGCGCATTGCCTCACAAGATGAGGTTCTGGAGTTCCT
+CACGCGAGTTATGCGTGGGCAAGAAGTTGAGGAAGTGGTCGGGTTTACTGAGTATGGGGC
+AGTAAAAGAGAAGAAAACACCGAGTGCCAGGGACAGAGTAAAAGCAGCCGAACTTTTAGG
+CAAAAGGTATGCGTTATTCACTGAAAAAGTCAACGTCGAAGGGAACATGGGCGTTGCTAT
+TATAGATGATATAAAAGAAGATGATAGTGATGACGCAAGTTAGACTTAGCGAATTAGTCG
+CACCGAGTTTCTACGAGATCCACAATGACATAAAGCATAATAGATATACTCATTACTGGC
+TTAAAGGTGGCCGTGGCTCAACCAAATCCTCTTTCGTGAGCATTGAAATCATCCTCGGCG
+TAATGAAGGACCCTAACGCTAATGCAGTGGCCCTGAGAAAAGTTAAGGAGACTATCAAAG
+ATAGCGTATTCGAGCAGTTAGTGTGGGCAATTGAGAAGCTGAAAGTTACTGAATACTGGG
+AGATAAAGCACAACCCTATGGAATTGACATATCTACCTACGGGACAAAAAATATTGTTCC
+GTGGCGCTGATAAGCCAAGGAAGATTAAATCCATCAAAGTAAGCCGGGGATATGTAAAGT
+TTATCTGGTATGAAGAAGTTGACGAATTCCTCGGAATGGAAGAAATCCGAATCATTAATC
+AGTCCTTGATGCGTGGCGGAGAGCAGTTTGTCGTCTTTTATACTTACAATCCTCCAAACA
+GGGTTAACGCTTGGGTGAATGAAGAAATACTGATTGATAGACCGGACAGAAAGGTCCATC
+ATAGCACGTATTTGACTGTTCCTCGAGATTGGCTTGGGGAACAGTTTTTTATTGAGGCAG
+AACATCTTAAAAAAGTTAACGAGAAAGCGTATAGGCACGAGTATTTAGGTGAAGTCACCG
+GCACAGGCGGCGAGGTATTTACAAACGTGAAAGCAAGGAAGATAAATGACGAGGAAATAA
+AAGCATTTGACAGGATAAAAAGAGGACTGGACTTTGGCTATGCTGTTGACCCGGCAGCTT
+ACATTGTGTGCCACTTTGATAAAACAAGGCGGCGGCTTTATATATTTCACGAGATATTCC
+AGGTCGGCTTGAGCAATAGGAAATTGGCAGAGTTAATTAAGAAAGAAAACAAAAGCAATA
+AGTTAGTGGTTGCGGACAGCGCGGAGCCAAAGTCAATAGCCGAATTGCGTGGTTATGGAA
+TCAACATAAGGGGAGCGAAAAAAGGACCGGACAGCGTTGAATATGGAATAAAGTTTTTGC
+AAGACCTTGAAGAGATAATAATTGACCCTGAGCGATGTCCAAATACATTGCGAGAGTTCG
+TAAATTATGAACTTGAGAAAGACAAAGACGGCAATTTTAAAGCTGAATTCCCGGATAAAA
+ACAACCACACGATCGATGCTGTTAGGTATGCGCTTGAGGATGATATGAGGACGGGCGGCC
+TATCAATTTTAAAGTGAAGAAGGTGAGAAAGGTTGCTGCTTAATCTTTTTAATTTCAGGA
+ACTTTAAAGACTTATTCCGCAATGATATAAACATGATGACTGTAGAAGAAATTTTATATA
+ACGAAATCAAAGAGTTCCAGGCATCCGATAGAAGGGCCTGGATGGTTATTGGCGATAGAT
+ATTACCGGTGCGAAAATGACATCCTTAACAGGCGTATAGTACGCCATACAGAGAGCGGAG
+ACATTGAAGATAGGTCAAAAGCAAACAATAGGTTGGCCCATGGTTTTGTTAAAAACCTTG
+TGGATGAAAAAATAGGATATCTGCTTACAAAGGATTATTCGCTGAAGTGCGACAATAAAG
+AATATATTGAGAAAGTTAAAAACGTCTTGGGTAAATATTTTCAATACACCCTTACCAGGC
+TCGGATATGAAGCGTCGAATAAAGGCATAGCATGGTTACAAGTTTACATAAATGAGCAGG
+GCAAATTTGGAATGATGATAATTCCTGCTGAACAGTGCGTTCCACTCTGGAAAGATAACA
+CTCACACTGAACTTTATGGCATGATTAGATATTATGTGCAGACAGTTTATGAAGGCAAGG
+AAAAGAAGCAGATCACTCGCGTGGAATATTACACGGATAAAGAGGTTTATTTTTATGTTC
+TCGATAATGACCATCTTATCCCGGATATAGAGCAATATGAAGGAGGGCCCATACTACACT
+ATAAAAAAGGGGAAGAAGGCCGAAGTTGGGGGAAAGTGCCTTTTATTGCCTGGAAGAATA
+ACCATCTTGAATATCCGGATGTTAAATTCATTAAATCGCTTGTGGACGCTTACGATAAGT
+CACGGAGTGAAATAGATAATTTCATTGAAGAAACAAAAAATCTTATCTATGTTTTAAAAG
+GCTATGGCGGAGAAAATTTATCTGATTTCATGAAAGACCTTAATTACTACCGGGCTATAA
+AAATAGATGATCCAGAGCATGGTGGAGTTGATACACTAACACCGAAAATAGATATTCAGG
+CAGCAAAGGAACATTTCGAACAATTAAAGCGGGATATAAATGAGTTTGGCCAAGGTGTGC
+CCAAGGACCTTGACAAATATGGCAATTCTCCCAGTGGGACAGCATTGAAGTTTTTATATA
+GTGGGCTGGATTTAAAATGCAACCACTTGGAAGTAGAATTTAGACAGTCATTTAATCAGC
+TTTTGTATTTTGTAAACAGATATCTCGCAGAAAACGGTCAGGGAAATTATGAGAATGAAA
+ATGTAGAGCTAATTTTCAATAGAGATATACAGATTAATGAAACTGAAACTATCAATAATT
+GTGTTAACAGTAAAGGCATTATTAGCGATGAGACTATCCTTGCAAATCATCCATGGGTGT
+CTGATGTAGAAGAAGAATTAAAGCAGATTGAGAAAGAAAGAAAATCAGAGGAACCGCCAA
+TGTTTGGTGAGGGGGATGAAGAGTGAAAGTAAGAGAACTGGTTGAAATATTAAAGGAACT
+AGACCAGGAGCAAGAGATAAGGTATAGTTCATATGAATTTCTCGGGGATTTTAAGATTGA
+AGGAGTTGAAGAAGCAGAACATGAAGGAATTAAGTACTATAACATAAAGTAGGTGGTAGT
+TAGTGAATAAAAAGGACATAACCTACTGGGAAAAACGACAGGAACGGAAATATCTGGCCG
+GAGAGAAGAAGCTTGATGAATATTATAAAGGTTTGCAGAAAGCGTTTAGACAAGCAAAAC
+GAGAAATCCAGAGTGTTATAAATGATTTCTACATGCGATATGCAAAAGAAAACAAAGTAT
+CCTATGCTGAAGCCCAAAAACTACTTGATAAGGCAGAAATAGGCGAGCTGCAGGACTTTA
+TAGACCTTGTTAATAAGAATATGGGCAAGTATAATCGAAAGCTTAACAATATGTCTATAA
+AAGCCAGAATTACCCGCTATCAAGCGCTAGAAAAGCAGATAGATGCTATACTACAGCAAT
+TATATGCTATTGAGTATGAGTATAAAGGTAAAGAGCTACTGAAGGAAGTATATGAGGATT
+CTTATTATCGTACCTGGTTTAACATAGACCAGTACCACGGCTTTCATCAGGAGTTCGCAC
+AGATTAATCCTAGAACTATAGAAGAGTTGATAAAATATCCTTGGAATGGAGCAAGTTTTT
+CTGATAGGATATGGAAGCAAAAAGACCATATGCTGCAGGTATTAAAAGAAGACATTACTA
+CTATGTTAATACAAGGGAAAAATCCTCAAACATTAGCAAGAGATTTCGCAAGAAGGTTTA
+AAACAAAAGAATATGAAGCATATAGGCTGCTACATACAGAGAGCAGTTTTATTATCGAAC
+AGGGAACTTTAGCAGCATATAAAGAAGATGGGGTGGAGAAGTATCAGATTCTGGCTACTC
+TGGACATGAGGACATCGGATATATGCAGAAGTGAGGATGGGAAAATATATGATGTGGATG
+AGGCGACAGTGGGAGTAAATTATCCTCCATATCATCCATTTTGTAGGACCACAACAGTGC
+CATATTATGAGGATGCTGAGGTAGGTACAAGGGTTGCGCGTGATCCGGTAACAGGTAGAA
+GTTATGAAGTTCCAGCGAATATGACATATGAGCAATGGAAAAATAGATATATAGATCAAC
+CTGACAATATTATTCGCCAAGAGATACTGAGTAATCCTGAAAGACTTGATAATTATAGTA
+TCCAACATTATAATAAGCATAAAGAAGGAACCAAACAATATGAGCAGTATAAGCAATCAA
+GACTTAAAAAAGGTCAAACTGAACAAAGCAGTTTACTAATTTCTTACGATGAAGCTAAAG
+AAATAATAAAAAAATATGCTGGTACTGGAGTATTTAGTAGAGACAGGAAAGGGAAATGGA
+GAAATGAGGAATTTGTGGATGTAGATTCTATAATTGGTGTTGTGCATAATATTGATGGGA
+CAGTAACGCCTACTAATAGAATTCAAATAAAATATGGGAAGAACAGCGTGCACATTGTAC
+CTGTATTACCAAGAAAGGAGAGAAATAAATGAATCTTTGTGAATATCAAGGTAAAAATGT
+AAGAGTTATTACGACAGACGGGCAGAAGATTGAGGGGTATGTAATAGCTTTTACAGATGA
+AGAGGAATGGGACGAGACCGATCCCGAGGGCAATAGTATTTCAATTGAAAATGATGAAGG
+CATTATTGGGATTTATGAAAAAGAAATAAAATCAATTGAAGTAATGAAAGGCTAAACACC
+ATCTATCATGAATAACGATAGATGGTGTTTTTATATCTATGGAAGCACTTGGTGAAGGCC
+AAGTGCTTTTATTATGCCGTCTTTTCGGTACTGCAGACGTAAAAGAACAGGACACTCGTG
+GAAGCGACCACGAAAAAAAGCGTAGTGAAGATGAAAGGAGAATGGAAATGACAAAAGAAC
+AGTTAATGGAAATGGGGTTAACTGAAGAACAAGCTGAGAAGGTTCTAGTTATATATAAAG
+AAGATTTAAAAAGCTTTATCCCTAAAGCTAGATTTGATGAAGTAAATGAAGCCAAAAAGA
+ATTTAGAGGAACAACTTAAAGACAGAGATAAGCAGTTAAAGGATCTTGGTGAAAAAGTAA
+AAGATAATGAAGAATTAACTAAGCAAATAAAAGACCTTCAAGAAGCCAACAAAAAAGCTA
+AAGAAGAGTATGAAACAAAGATTAAGAATCTTACATTAGACAACGCTATAAAACTTGCTT
+TAAAAGAACATAAGGCAAAATATGAGGACCTTCTTGTAAATAAGTTTGACAGAGAAAAAC
+TCGTTATCAAAGATGATGGCACTATAGAAGGATTAAATGAACAAATAGCAGCTTTAAAAG
+AAAATTACAAAGACTTATTTGAGCAGCCTTTAAGTGGACATACCCCTAATAATACCGGAG
+ATAATCCTGAGGGAGGAGAGCTTCAACAAATAGCCAATACTATCAGACAAAATTTAGGAT
+TTTAAGAAAGGAGAGCGTAAAATATGGCTAATGTATTAGAATATGCAAAAATATTTATGC
+AAGAACTTGATAAGCAGGTAGTGGCACAAGCTACATCTGGATGGATGGAAGCTAATGCAG
+GCTTAGTTAAGTACAATGGTGGTAATGAGGTAAAAATACCAGTTATAGACATGGATGCAT
+TAGGAGATTATGACAGGGCTAATGGATTTGTTGACGGGTCAGTAAATTTAACATATGAAA
+CAAAAATTATGACTCAAGATAGAGGCAGAACTTTCATGCTTGACCGCATGGATGTAGATG
+AAACTAACTTTGTAGCAACTGCTGCTAATGTCATGGGAGAATTCCAGAGAACAAAGGTTA
+TTCCTGAAATCGATGCGTACAGGTATTCCAGCATTGCAAGCCAGGCTATTGAAAAAGGTG
+TAGCAGTTGGTGGCTATACTCCTTCAGAAACCGACATACTTAAGAAGCTGAAAGAAGATG
+TCTATGCAATATATGATGTGGCCGGAGAAATTCCTCTGGTCATTATCATGAACATGCAGG
+TCGCTGCAATACTGGAGAATTCCACAGAATTAAGTAAAACGTTATCGGTTATTGATTTCA
+CTCAGGGGGATATTAAAACCTCGGTGAGGGCTATTGATAACAACCCAATAATCAAAGTGC
+CTTCCGCACGAATGAAGACAAAATATGTATTCTATGATGGCAAAACCGCAGGCCAGGAAG
+CAGGTGGATTTACACCAGCTGAAGATGCTAAAAACATCAACTGGATTATTTGTCCAAGGA
+CTGCGCCTATAGCTGTATCTAAAACAGATAACATAAGGATATTTACTCCTGAACAAAACC
+AAAAGGCTGACGCATGGAAGATCGATTACAGAAAATATCACGACCTCTGGATAAAGGACA
+ATCAGTTTAAAGCAATTCGTGTAAACATCAAAGAGGCCATAGCATAGGAGTGATGCCGGA
+TGTATAAACTTGAAAAGCTCAATGTAGTCAAAATCGTACCGACGGAACATGAACGGGAAA
+AACTCTTGGCTAAAGGCTTTAAGGATGCGGAGAAAGAGGAAAAGAAAGAGGAAAAGAAAA
+AGGATGAGAAGAAGGCTGCTAAATAGCGGCCTTCTCCCTCTTTTCTACCCTAAAAGGGGT
+GAGTATATGTCCATTGAAGAAATGCTTACAAAAGTAAAGAGTAACCTCAAAATTGAGGAT
+GATAGCAAGGACCTAATCATAACTGACATTATTCAGGAGTGTCTGAACTACTGCAACCTC
+AAAGAGCCGCCGGCAGAACTGGAACCATTTATCCGCCGCAAGGTCAAAACCATCATTGAC
+TATGAGGCCGAGACCGGAGGTAGTTCAGTATTTGACGTGACCTCAATAAAAGAGGGTGAT
+ACCTCTATAACTTACAACACTGACGAGGTTTCCAGAGAAACTATCTACGGCCTGTCTGAA
+AAAGACAAGCAGGCCTTGATGCGATTCCGGAGGTTACGAAGATGAGCGTATTGCAAAGAC
+TTTGGAAAGACCGAATGGATATATATCGTTGGGTTGAGGTTGTAGAGGGCGGCTTCACAA
+AACAGAAAAAGGAGAAGATTTACGAAAACGTCAAATGCCATTACAGTAAAGGCCAACTGG
+TTAACACGGGAGAAGACAGTGTGCCCACATTGATAACTTCTCACACTTTGTTTTGTGGTC
+CAGATGTGGACCTTCAAGAAGGTGATGAGGTGGTTGTTACCCAGCGGAATGGCAAGCAGG
+TAACCCTGACAGTAGGTGAGGGTTTTCCGTACAGCACTCACCAGGAGTTTTCCGTGAAAC
+GGGTGGATACGGCATGAGCAACTATCGCACAAATAAGGCCGCAATAGATAAATTCCGGAG
+AGAATTGAAAGCCATGCTGGGTGACATTTCTGAAATTGACAAGAGGGTTTTGGATAAAGC
+TGTGAGTATAGGCCTTGCTGATGCCAAAAGAAATACGCCGGTGGATACCGGTTTCATGCG
+GCGAAGTTGGCATGTAATGCCTACGAAGAAAACTTCGCAAGGTGTTGAAAAGGAGTTGAT
+TAATTCTGCAGATTATAGTTCCTTTGTGAACTACGGTCATAGGGTGGTCAACAAGAAAGG
+TGAAACAGTTGGCTGGGTAAAAGGCCAGTTTATATTGGAGAAAGCAGTAAACACAGTAGA
+AAAGGCTTTAGCAAAAGAATTTGAAAAAGAAGTGGAGAGGGTGAACAGGAAACATGATAA
+GTGAAATTAAGCAGGCTATTGCTCAGAAAATCCATGAACAGTATCCTTCATCTACTATCT
+ACGATGAAGACATTCCTCAAAACTTCAAAACACCCTCTTTTTTGGTAACCGTCATTGAAC
+AAAGCTATGGCAAGAGGCTCGCCAACAAATACAACAGCACCGTTTCCTTTGATGTGGCCT
+ATTTCAGCGATAAGGGGAAAAACGAGGTCAAATCCGACTGCCAGGCGGTACAAGTGAACC
+TGCTACGGGCTTTCGACCTGGTGGGAACCTTCCGGGTTCAGAACCTGCAGGCAACTATCG
+TGGATAACGTGCTGCATATTACCTTTGATGTGAGGTATTCGGAGATAAAGACAGGCGAAG
+AGATTCCAAAAATGCAAGCTCAAGCAACAAATACAGATATAAAGACCAGCTAATTAAAGT
+CAAGAGTTTTTAAGAAAAAATTTTAAGAATTTTCTAAAACTCCTGACAGCGAAAAAAGGC
+ACAACGACAAGACCACCTAAGATTAGTAGACATAAAATAGCTGGCCTGAAATAGTAAATT
+GATTTTTGAAAACTAAACATCGAGTACAAGTACTACTAAGCTGCTGTGTGCTTCGCTGCA
+AGCATTTGCGCGTGCTCTTGGGGAGAACGTAATTCGTAAGGCTTTCTATCCCTAAGAACA
+GCAAAAATATAATTAACAAGCTTACGCATAACAGCCCCCAAAGCTACTTTCTTGGGCTTG
+CTCTGGCATTTGTTTTTGTAATATTCCATCAGTACAGGGTTGCAAGCTGTTTTGTCCCGC
+TTGGTGCGGATATTAGCAAGAGCAATTGTGAAAAGTACTCTGCGAAGCAGTCTTGACCCC
+CTTTTTGACATCTTGTTTTGTGTGCCGGTAAACTCTCCGGACTGCATTACAGAGGGGTCA
+ATACCGAAATAAGCAACTAGCTTGCCTGGCTTTGAAAAGGCTGAAAAGTCGCCAATTTCA
+GCCAGAATGGTAACAGCAGAGATAAGTCCTATACCTGGAATGCTTTGTAGAAGCTCGAGA
+GTCAGTGCCAGCATGGGCATGTCCTTTGCCATATCTTCAATAATCAATGAACGAATGGCT
+TTGAAGACTTTCTCAAGGTTTTCTTCCAAGGTTTTAATCATAGAGATATACACACCAAGC
+ATGGCAACATTTGAAGAGTTACTAATGCTTAAAGGTGCAAATTCTTTGGCCTTGGAATTC
+AAAAGCTCATACTTTGCAGTTGCCCATTTAAGGCTTCTGCGGGAATTCTTCTGTATCAGT
+GCAATCAACTTGTTTCTGTTCGCTTTAAGAATATGCGCAGGTGCAGGATATTTCTCCAAT
+ACTGCAAGAGCAGCCTTTGAAAAGATATTAGGGAATACATCCTTGAAGTTTAGCATGAGT
+TGGTCAACAATACCCATAAGCCTGTTTTTGTAAGCAGTAAGTTCGTCAGAGAGCTTGTAG
+TACTGGCGGCAAAGGCTTCGCAGACATTCAATATCCTCGTCGGGGATATTGGTAGTTTTA
+AGCTCCTGAAATCTGTATAGCAGAGCAATTTTCCGGGCATCCACTTTATCATTTTTCACT
+TTCCTTATTCCAATATTTTTGATAGAATCAGTTTGGATGGGGTTTATGACAGAAACCTCA
+AATCCAGCTTTATAAAGTGAATGGAAAAGGATTTTGTGATAGTGCCCAGTGGATTCCATG
+ACGACGAAAGGCCTAGAATCAAAGTCCTTTTCCGTTTTTTTCAGTAATTCAACGGCTCTT
+TCAACGTCAGTACTGGAATCATGGCGGATCTTCATGCGGGCAATTACTTCATTGGATGGA
+GAAAGAATTGCCATCTCACTGAAGAACTTGCCGACATCGATTCCGGCGATGGGTCTAAAA
+TTCATAAAAATGCCTCCTTTATAAGATTAATGGACTTAAAAGACTCCATTCCTTCTCATG
+TAAGTAAACAACCTTGCGTGTGACACGAGGAGCCAGCTGAAATGCTGGCCTCAACCAGCC
+AAATCATTTAGACTTACCGGAATGGATAAATACTCTTTCTTACGGGTAGTCGGCCCAATA
+AGGTCCGTCCCAGGAGTGATTACAAACACTCTCCAAGTCCGGAAAATATTATACATGATT
+GACAAGGTTCAGGCCAGACGAAAGCTAGCAAGCGGTCATAGATGGGGAACCGCAGGCGGC
+AGGATTTGAAAGCCACCGCCATCCCCTAGGGGATGGCACATAGAAGTGCTTGATGTTTAG
+AAAAGCAACAAATATGACATTATGTTAACAGGGTCGAACAGTGGCAAAAGTCACTGATGA
+AATAACAATATTAATTGTACAAGGAGTGATAAAGATATGGGTGGAACTTGGACGAACCAG
+AATAAGATCCTTCCTGGGGCATACCTTAACTTTCGGACAAATGCTCCACTTTCCATAACA
+TTAGGGGAAAGAGGTACAGTAGTAATACTACAGGAAGTAAGCAAGGGTGCTAGTGGGGAA
+ATGTATAAAATAACAGCACTTGACCAGAGTAAATGGCCGACAGGTGTAACAGCTGAAGAT
+AAATTACTTGCAAATGAGGCGCTTAAAGGTGCCAATACTGTAATCGTATATAATTTGGGT
+GCTGAACACACCTCTGAGGTGGTTGAACAGGCTTTGGCTAAATTGATGACAGAAGATTTC
+AACGTATTGGTGTATCCATATGATGGTGCAGCATATGACACAATTAAAACTACTATCAAA
+GCTTGGGTTGATATGATGCGTACCGAAGAGGGCAAGAAAATTCAGGCAGTTATGGCTAAC
+TTTGCAGCTGACGATGAAGCGATTATCAATGTTACCCAAGGTGTTAGACTTGTTGACGGA
+ACAGAACTTACAGCAGCACAAACTACAGCATGGGTTGGAGGTGTTACTGCTGGTGCGGCT
+ATTAATCAGTCTAATACTGGACGTAAATATATAGGTGCTATCGATGTGGTACCTAGAATG
+ACTAAAACTGAAATGGAGGCTGCTGTTCAAAATGGAGAATTCATATTCAAAGTAGATACT
+GCTCAGAATGTAACAGTGATATACGACATTAACAGCCTAACCACTGTTACCGCAGAAAAA
+GGTAAGCAGTTTACAAAGAACAGAGTGATTAGAACATTAGATGGTATTAATAACGATATT
+GTAGAAATATTTGAATCGAATTATGTTGGCAAGGTCAATAACAACGCAGATGGTAGATCG
+CTTCTAAGAGCAACATTAATTGAGTATTTCAACGAATTGCAAAGACTAAACGCAATTCAG
+AATTTTACTGCTGAAGATGTAACCGTATCTCCTGGTAATGATTCTGATGCGGTAGTAATT
+GACTGTTATATCCAGCCAGTTGATTCCGTAGAAAAAATCTACATTACGGTAAATTTGTCA
+TAGTTGAAGGAGGGTAATAAGGTATGGCAGATAATTATGTAAGATTATCAGATACGATAT
+CCTCTAAAGAAGGAAAAGCTTATATCACAATTAATGGACAGAACAGGGAATTGTTTGAAA
+TATCGAGCCTGACTGCTCAACTTGAGCTTCAAGTACAGTCCCGCCAGATGCTCGGTCATC
+GTATGGTCCAGCATAAAGTAGTTGGGGCCGAGGGTACCGGATCAATGACAATGTATTTCA
+TGAACTCTGATATGTTGAGATTGGCGATACAATACATCAAAGAGGGTAAATATGGAGGAC
+TGAAGCTCCAGATTAAAAACGAAGATGCACAAAGCACAATTGGAAAACAAGAAATTGTGC
+TGCTTGGTGTATTGCTTAACACTATACCTGTTGCTGCATTAGATGATCAATCAGATGATC
+CGATTACTGTTGACACGGATTTTACATTTGATGACATTGAGGGTTTGAGTTTCTTTGACT
+TGCCGGCAAATTATAGATAAAAGGGAGTGGTAAATAATGAGTTTAGGTTCTTTAGAGGCT
+TTTCTTAATCCTGTGAAAGTTGAAAATAAAAAGGTTATAGTGTCAAACAGATTCAAAGAT
+AAAGACGGGAACCTTGTACCGTTTGAAATCCGCCCTATCACACAGGAAGAAAATAAAATG
+CTAATCAAGAAATACACAAAAAGGGACAAGAAAGGTCAGGAATACTTTGATAGAGCAGAG
+TATATATCAGAGCTTACGGCATCCGCCGTAGTATTCCCAGACCTTACAAATGCAGAACTG
+CAAAAAGCATACGGTGTACTAGGTGCATCTGCATTACTTCAAAAAATGTTATATGTTGGC
+GAGTATGCAGAATTAGCCCAGGCAGTTCAGGAATTGAGCGGACTTGACACAGATATAAAT
+GAGGATATTGAAGAAGTAAAAAACGCATAATGCAAGGCGATCCTGAGTTCGTCTTAGCTC
+ACTTCGCCTTGCAAAAATTACACATATTACCTTCAACATTAGCCAATATGAGCGAAAGAG
+AAAAAGCTTTTATATATGCTAGTATACAGCTTCGTATTGAGCAAGAGAAAAAAGAGTCAG
+CTAAAATAAAGGCTGCAAAGGGAGGAGGTAGAAGGCGTTAATATGGCAACTTTAAAAGCA
+GTTATGGCTTTATTGACTGGAGGTTATACATCAGGAATCAATAAAGTCATTAAAAATACA
+GATAAAGCAACAGATAAAATTTTAAAAGCTAGCGGTGCCACAGATGAATTTAATAAAAAA
+TTAGAAGTCACTGGCGCAAGTGCTAATACTGCAAGTGGTGGATTGGGGAAATTACTTAAA
+ACTTTTATAAGTTTAGCAGCGATAAAAAAAGGAATAGATATTACAGACGAATATAGTAAT
+ATAGCTGCTAGACTCGCACTTATTAATGACGGCTTGCAAACACAAGAAGAATTGCAAAAT
+AAAATCTTTGCAGCTGCTAATCGGTCTCGCGGTGTATACTCAGATATGGCCAGTGCAGTG
+GCCAAAATGGGGCTGCTAGCCAAGGACGCTTTTACCTCCAATGATGAACTAATTGCCTTT
+ACAGAGCTTGTACAAAAATCATTTAAAATTAGCGGAGCTGACCCATCTGAACAGGCAGGA
+GCAATGAGACAATTAGCTCAAGCGATGGCTTCTGGTAGGCTTCAAGGTGATGAATTAGTA
+TCAATAATGGAAAATGCTCCAATGATATATGAGGCAATAGCAAAATATATGGGAAAGACA
+AAAGGAGAACTTAAAAAATTATCTTCTGAAGGAGCTATAACGGCCGACATAATCAAAAAT
+GCCGTATTTGCCGCAGCGAAAAACATCAACACCAAGTTTGCAGAGATGCCAATGACTTTC
+GGAGACATATGGAACAGGATTAAGAATGGTGCACTTAAGGCCTTTGATAAAGTTATTGTA
+AAGGTAAATCAGCTTATTAATGCTGACAAGTTCCAGCGATTTGTAGACAGAATGATTACT
+GGTTTTAGTCTTGCAGCATCTGCGGCAAGCTGGTTAATCGATGCTATAATTAGAGGTTGG
+GATACGATAGGGCCAATACTTGCAGTTATTGCTGGCATATGGCTTGTTTCTATAATTGGA
+AAACTGTGGGCAATGATACCACCACTGATTGCGCAAGCAGCAGCATGGTTAAGTGTATAT
+TGGCCTATACTACTGGTAATTGCTATTATAGGAATAGCAATATCTGCAGCAAGACAGCTG
+GGAGCAACATGGGATGAGATTATAGGATTTATTGGAGGGCTAATCGGTGTTTTTGCCACA
+ACTTTCTATAACTATTTCGTCATGATCTGGAATCACATAGCCGCTTTCGTGAATTTCTTC
+GGCAACGTATTCAAAAACCCAGTAGCTGCTGTACAAGCGCTGTTTTTTGATCTAGCATCT
+AACTTGCTTGGGTATATCGAAAAAGTGGCCCGGGGAATTGAAGATTTGCTGAACAAGATC
+CCGGGCGTGAACGTAAATATCGCCGGAGCCATCACAAAACTGAGAGACAAACTAAAAGCG
+GCATCAACGCAGATAAAAACCGAAGCCGACCTGAAAACCTATGTTCAATCCAAAGAATTC
+ATGGATTTCTCTGAAGGTTGGACGAAAGGCAGCACCATGGGGAAAAATCTTGTAGACAAG
+GTAAGCAACGCATTGTCAGGGCTGACTGATATAGGCAAAAGTTTTGACATGGGGCAATTC
+GGTACAAGTCAAAACCCGCTATATGTCACATCTAACGATAAGCTTAAGGTGGACATGTCG
+GATGAAGACTTGAAGTATTTGCGAGATATCGCAGAAAGAGAATACATTGCCAAATTCAGC
+ACCGCAACGCTTGCACCTAACATCAGTATATCCTTTGGAGATGTACACGAAACAGCGGAT
+GCCAATAAGATAGCGGGAAGAATTAGAAAAATACTCCAGGAAGAAATCGCTATGGCGGCA
+GAGGGGGCATATGCATGAGTTATGCAGTGTTTTTCGATAAAGATGGTGTGACATACCGTC
+TGCCTGTTAATCCGGAACAAATCGAAGTTATATCAAATCAAGCAATTGAAAAATATGAAA
+TATTAAAACTTGGACAAATTGCTGTGCCAACACATATGGAATTAACCGAATATAGTTTTG
+AGTGCGAACTCCCATTCAAACCTTTACATTATATAGAAACAGCTGGCGATTTCAAGAATG
+CGGATTTCTACCTTAACCTTTTTAAAGCATGGAGAGAAAAGAAAGAGCCGGTACGCTTCA
+TTGCTTCAAACGGTATCGGCGATGATATCAACTCGTTAGTACTTATTGAAGAATTAACTA
+TCACTGAAAAAGCAGGAGAAGAAGGAGATAAATATGTATCTTTTCGTTTAGTAGAATATC
+GGCCATACGGAAAGAAAACTGTTGTGATCCCGACACCAACCCAAACAATAGTCAAAAAAG
+ATGAACCGGTTCCAGCGGTGTCGCTAAAAGCGAATGATTACCATGTAGTACAACCTGGAG
+ATACCCTTTGGGGCATCGCAAAAAAGTACTATGGAAACGGTAATCAATATCAGAAAATTT
+ACGAGGCAAATAAAAATCAAATCAAAAATCCTAATCTCATATATCCCGGGCAGAAGTTGG
+TGATACCGAGATGAATATGGAATTTGCGGTTGAAACAGATGGGAAGATATATGAAATCAG
+CGAGCTTGTTACTTCCGTATCTTATACAGATAAACTTAACGATGGATGTAGCAAGCTCGA
+ATTCTCATATATTGATGACGATTTAAAAATACATAACGGCAGCGTAGTGCGGTTTAGATA
+TGATAATGAAAACGTGTTTTATGGGTATGTTTTTAAGCATGGTCAGAATAAAGCCAAAGA
+GATCAGCGTAACCGCATATGACCAACTCCGCTATTGCAAGGCCAAGGATACGATTGTGGT
+CAAAAATGACACTGTAGATAGCCTCGTAAAGAAAATGTGTAACTATTTTAACCTGAAAGC
+TGGTATACTCACCAATACTGGCTACAAACTGCCTGTAAGCGTTCAGGACGACAAGACCTG
+GCTGGATATAATTTATACCGCCATAAGCGACACACTGATGAATACAGGCAGATGGTACTG
+CCTGCGCGATGAGTTCGGCAACATAGCAGTCAGAGATCTCCAGGAGCTGCAGCTCGATCT
+TATTCTTGGCGATGAGAGCCTGGCTTATGATTATGAATACGAGAAATCCATTGATGATGA
+GTTCTACAATCAAATTAAAATTGTAAGCGACAATGAAAAAACAGGCAAAAGAGATGTATA
+TATAACCAAGGATAGCAGCTCAATACAAAAATATGGGCTGCTACAATATTTTGAGGTACT
+TGATAAAAACTACAATCCTTCACAGGCCAAGGCAAAAGCTGATGCACTCCTGCGGCTATA
+TAATAGGGAAGTTGAAACTTTGGAGTTAGAGTGCCTTGGTGACGTGAGAGTAAGAGCGGG
+GAGCAGTTTTTACGGGCGGATTGAAGATATACAGTTGAATAAACGGCTAATCGTAAAGTC
+AGTTGCTCATGAGTTTATCCCTGTGCACACAATGAAGTTGGAAGTGATGATATGATTAAC
+GAAATTAAAGCTATAATCCAAAACTACCTCAATAATGCTAAACTATGCCGGCTTGTGGTG
+GGCACAGTGACCAATGACGGCATCAAGGTAAGTGATAAACTCACTATTCCATATGAGCTC
+ATAGTGGGTAATCTCAAAAAGAATTTGATTGCTGGCCAGAAAGTGCGGCTGCTCCAAAAT
+CACGGTGGCCAGCAGTTCTATATCCTGGAGGTGATCTCCGAATGATACCCAACGCTTCTA
+TAAATATTGAATTAGGCTCTGCAGAAAGTATAGAAACAAGCCGGACATATAAACTATCCG
+GAGATAAAATCCAGGGCTATGTAGATGGGTTGGAGGCTCTCAAACAAGCTATATATAAGG
+TGCTCAACACAGAGCGATATGAGTACCCGATATATAGCTTTAATTATGGGATTGAACTTG
+AAAGTTTAATAGGCAAAGATCCCATATATGTTCAAATTGAGTTGAAACGCAGAATTCGAG
+AGTGCCTTCTAAGAGATGATAGGATTACCGATGTCGATAATTTCAAGTTTGAAGTAAACG
+GTGATGAAATAAAATGCACGTTTGATGTTCATAGCATATTCGGCAATTTCACAGCCTCCC
+GGGAGGTGATTTTTTAATGTTTGAAGATAAGACTTATGAAAATATATTGAACGATATGCT
+AAGCAGGGTATCAAATGATGTAGACAAAAGAGAAGGTTCTATTATTTATGATGCTCTAGC
+TCCAATTGCTTATAAATTAGCCGAAACATACTTCCAATTAAATAATTATGTTGATTTATT
+TTTTGCAGACACTGCAGTAGGAGAGTTTCTGGAGCGAAGGACTGCTGAATCAGGAGTGGA
+ACGGCGACCTGCTACAAAGGCAATAAGGAAAATTGTTACAACAAGGCCTGTAGATGTTGG
+CACAAGATGGGGATTAGAAGATACAACATATGTTATTATAGAAAAGATATCTGATACAGA
+GTATAGGGCCGAATGTGAGCAGTATGGCACTATAGGAAATTTATATTCGGGCGCTCTTGA
+TAACATAGATAATATATCTGATGTATCTGCTGAACTAACAGATGTTCTCATTCTCGGCGA
+AGACGAGGAAACAGATGAAGAACTGTATCAACGTTACTTAGAGGAAATCAATGCCATACG
+ATACGGTGGTAATGTGGACCAATATCGTGAGTGGATCAGTGCTATCCCTGGTGTTGGACG
+CTTTAAAATCCAACCGTTATGGAACGGCCGCGGTACTGTTCGAGCGATTATAACAGATGC
+AAATAATCAAGTGCCTAGCCAGGAGCTTATTGACCTTGTACAAAATACATTAGATCCATA
+TCAGGATGGTATGGGGACCGGCCTTGTACCGATTGGACATGTGTTTACGGCCATGGGGGC
+TATCCCGAAGGTCGTGAACGTCACCATGACTGTAGTGTTCGAGGAAGGTTATGGCCCGGC
+TGATATACAGCAAGATGCCGAACGGATTATCACCGAATACTTCTCCGAAATCAACTTCGA
+GGACCAGAAATTTGTGCCGACCACGGTCCGGCACGCCGTCCTCCTGAGCCGTCTGATCAA
+TATTCCGATGGTTCGGGATATCCTGGTGCTAACGCTGAACGGTATAGATGGTAATATCAC
+GCTTGCGCCTGATGAAGTTGCCAGCCTCGGGACGGTGACGATAAATGCTGATTAAGTGGC
+TTGAGGAAGAAGCTGATTACCTTGCATATTTGCCTCCTGTTCTACAAAACATTAGAGAAT
+TTCAGGAGTTAGCGAAAGCAGTTAATCCTGAAATTATCGCACTAAAAAAAGCTATAAACA
+AGGTCCTAAACGAACAGTTTATCCAGAGTGCAGAGGATACGCTACAATGGAGGGAAAAGG
+AATTCAATATCACGGCCAGCAGCGATGAAACGATAGAATTCCGACGTGAACGATTGATTG
+AACGTAAAAGTCGAAAGCCACCTATTACGTTGCGTTCGCTGCGCAATCGACTGAACGCCT
+ATATCGGCACAACACAGGCAGAAATTGAACTAGTACCAGGGGAATATGCTTTCTCTATCT
+CTATACCAGCAGTAGATGGGTACAAATTCCGTGATATACAGAGGCTTGTTGAAGAATTGA
+AGCCCGCCAACATGGAATATCTGCAATTCCCGTTTTCAGTTGAGAGGATTCGGATCAAAG
+AAGAAAGTAGAGAAATTAAGATATTTTACGCAAGAGCTGGTCTGGCTATAGCAGGGAGAA
+CAAGAATTGGGACTACATTATCCGAGCGTGTAGTCTATAGAAGGTAGGTGATTTGATTGG
+CAGTATCTACATTTTACAAAAGTCAGTTGGTAGAAACAACCGATGCACTACTGACTAAAG
+CGCTGGTGAACGAAACTATCGAAGTGACGCAATTAAACATCACGAAGTATGCAGACAGCA
+TTACGGTTGAGATGGCTCTTCCACCCGATCTAATCGTTACGAGAATTGATTTTTTGGACA
+GCGAAGACAATATCATTACTTCAATAACAGGCATTGAGATAGATACGGCAGTAACTACGA
+TATTCAGCCACAACATCCAGTTTGTACAAGGAGGTGCATAAAGGTGCCTTTTCAGAAAAA
+AGTCTGGCAGTTTAACGACATAATCACAGAAGGCGAATTGAATCGCATGGAACAAGGTAT
+TGAAGATTCTATAACTGCCGCGAATCAAGCTGAAGTAAATGCAAAGGCTTATACTGACCA
+AGAAGTAGGTGAAGTTGCCCAAGAACTTGCTGCACATAAGGCGGAAAGTACGCAGAACGC
+TCATTTGGCGAAAAACATCGGGATTGAAGACGCTGCGGGTAACTTCACAGCGACCGACGT
+GGAAGGGGCACTGGCCGAGCTTTTTACGTCTGTCAGTAATGGTAAGACTCTTATCGCTGG
+GGCCATTACTGACAAAGGAGTGCCGACCAATCCCAGCGATACATTCCAGCAAATGGCAAC
+AAATATTCAAGCAATTCCTGTTGGAGATTATGCTGTAGGGGGTACAATCCGTGATTCTGT
+CTTGCGTTTTTTGCCGGGCGGTATGGGTGTAGAAATCTGGTCGAAGACGGACGTGGCGAG
+AGGGCAGGGCATCGCCGTAGACAGTGCAGGAAACGTATATGTCGCTCACTCTGTGGGCAG
+CGGCGGAAAAGCCGTACGAAAGTTGGATTCAGCAGGAAACGAAATCTGGTCGAAGACGGA
+CGTGGCGTATGGGCAGGGCATCGCCGTAGACAGTGTAGGAAACGTATATGTCACTCATTT
+TGTGAGCAGCAGCGAAAAAGCCGTACGGAAGCTGGACCCGAACGGAAACGAGATCTGGTC
+GAAGACGGACGTGGCGTATGGGTGGGGCATTGCCGTAGACAGTGCAGGAAACGTATATGT
+CGCTCACTCTGTGGGCAGCGGCGGAAAAGCCGTACGAAAGTTGGATTCAGCAGGAAACGA
+AATCTGGTCGAAGACGGACGTGGCGAATGGGCGGTACATCGCCGTAGACAGTGCAGGAAA
+CGTATATGTCGCTCACAATGTGAGCAGCGGAAAAACCGTACGAAAGTTGGATTCAGCAGG
+AAACGAAATCTGGTCGAAGACGGACGTGGCGTATGGGTGGGGCATTGCCGTAGACAGTGC
+AGGAAACGTATATGTCGCTCACAATGTGAGCAGCGGAAAAACCGTACGAAAGTTGGATTC
+AGCAGGAAACGAAATCTGGTCGAAGACGGACGTGGCGTATGGGCAGGGCATCGCCGTAGA
+CAGTGTAGGAAACGTATATGTCACTCATTTTGTGAGCAGCAGCGAAAAAGCCGTACGGAA
+GCTGGACCCGAACGGAAACGAGATCTGGTCGAAGACGGACGTGGCGAGAGGGCAGGGCAT
+CGCCGTAGACAGTGTAGGAAACGTATATGTCACTCACGATGTGAGCAGCGGCGAAAAAGC
+CGTACGAAAGCTGGATGGGAACAGATATTTTCAAATAGTGGGGTGATATCATGATATTTG
+TAGGAAATTTTATACAAGATGAAAAAGGAAAAGGGTTAAGGATTGGCTTTGTGCATTATA
+GGCCCTTTGACGAAACGGTAGGGATGAATCTACCCGAAGAAACAATACGCCAAATGGGAG
+CTTTAGTCGATGAAATCCCCGAACCAGAGCAAAGAGAAGGCAAAATCCCAGTGATGTATT
+ACAATCCTGAAACGAACACTGTTTATTATGAATATGAGGACAAGCCATTGTCGCTCGAGG
+AGGAAATTAAATATCTCAAGGAATTGAATGCAGAGTTGATATATCAATTAATGATGAAAG
+GAGCGTTGTAAATGGATTGGTTCAAGACAATCAAATGGTTTTACGACAGCCAATTGTGGA
+CAAAAGAACAAGTTGCAGATGCAGTGCAGTACGGGAAAATTACAGCGGAACAGTATCAGA
+AAATCACGAGTGAGGAATATAACGAAATAGAAAGCACCAATTAAGGTGTATTTTTTATTG
+CCTTTTTTTGAGGACTTACCTTTTAAGGTAGGTCCTCTATTAATTGTTTTTTAGAAAGGC
+GGTTGGTTTATTATGAGTGAAGAGTTCAACAACAAAGAAATCATAAAAATGATGATGGAC
+TTTAAATCAGACATTAAAGGTCTGCAAGCTGAAATTCAGGAAACAAAAAACTTGCTGAGG
+AATTACAATGGTTTGCGTGAAAAAATGATGTCCTTTGAAATTGAGCTGGCAACTTTCAAA
+AAGGAAATTTTGACTCTCAATGAATGCAAAAAAGAGCAAAAATCCGACTGGAGATGGGTT
+GCTGGTTGGATTGTTGCTGTCGGAAGCCTGACCGTATCAATTATTGCTAATTTCTTCAAA
+TAAAGGGGGATGAGCACATTGGTACCGTACATAGTCGACCACATACCCAAAACAACACCT
+TACAACCGTCGCCCCGGATATTCCATGACGCCGGAATATATCACAATACATTCTACCGGC
+AATCCGACCAGCACGGCAAGGAACGAACGAGCGTGGTTAACTAACCCGAATAACAATGTC
+ACGGCCAGCTGGCATATTGTAGTGGACGAAAAAGAGGCAATTGAAGCCATACCTCTAAAC
+GAGGTCGCATGGCATGCCGGGGACGGGGGGAACGGGACGGGAAACAGAAAAAGCATTGGT
+ATTGAAATATGCGAAAGCGGAGACAGGCAAAAGACTTTGCAGAATGCTGCGGAACTGGTT
+GCAAAGCTGCTGAAAGAGCGCGGCTGGGGAGTGGACAAGCTCCGTAGGCACTATGACTGG
+AGTGGTAAAATATGCCCTCGGATTTTCCATGATAACGGCAAGTGGACAGGGTGGAAACAG
+TTTAAGGAAGCTGTTCAAAAGGAACTTTTCGGAGGTGATAACATGACACAGGATAAAAAT
+CAGCCTTCCGACTGGGCAAAGGAAGCGTGGGAATGGGCAAAGCAGCAAGGTCTATTGGAT
+GGTACAAGACCAAAAGACAATCTTACCAGGCAAGAATTAGCGGTTGTATTAAAAAGGTTG
+GCTGAGAAAAAATGAAATTTTCAAAGGTAATCGTATCATTATGCTAATACAAAAGTAATT
+ATTGCCGAAAGAGCGGCACAGGAAGCGGAGAACAAACTAAAACGGTATGAAGAATTTTTC
+AGAACATTCAGAGGGTTCTTGGGAGGTGTGTGAAATGAACGATTTTTTCACTCCTGAATT
+CCTGGCCACATTCGCTGGGCTAACAACCGCAGTTGCTCTTATCGTGCAGTTTACGAAGTC
+TATAGTAAAACGTCAATTTGGCGATGCAAGCGTGAGAATATATGCATTTGTGATAGCACT
+AATATTGACGTTCATATTCGCACCGGCAGGATGGGGAGTACAGGGAATAGTGCTCACAAT
+TATAAACGCAATATTGGTTACATTAGCCGCAGTAGGAGGGTATGAGATTATAGCGGATCC
+CAAAGCGACAAAGCAGTTCCCCGAGGGGCAGTGATGCCCCTCTTTTTTTGTCTCTGGAAT
+GTTTGATACTGTGTTTTATGCACAATCTGCTTACATAAAGCATATATTGTATGCATGTAC
+CTTACCTACCACTATATGTAGTGTGTTGATTTTGGAAATATAAAATGGGATAATAAAAAG
+GGGAAGAATGGAAAAGGGGGATAAAAGTTGGAGAGAACAAAAGAATTAATTTGTTATTTT
+CTGGCTAATTCGCTACATCCTTTAAACAAAACAGAAATAGTGAAAATGTTATATTTATTC
+GAATATTATCATGTTCAAACTTTTGGAGAGCAGTATGCTGAGTTAACATTTATTAGGTAT
+AATTATGGGCCTTACGCGCAGGCTATTGAGATAGCTCTTGATGATTTAATGAACGATGGT
+TTAATCAAGAGAGAGATTGTTGAATATACAGACAGATGTATATATTTGCATACACTTTGT
+GATACTGGGAAAACCTACACGGATTTATTGAATGAGGAAAAGAAATTAATAGCTGATAGA
+GTTATTGGAGAATTGTCTAATAAAAACTACGATGATATGATCAAACACGTATATTCTACA
+CCCCCGATGAGAAGAATTTTAATTAAGGAAGAAAGGTGCGGTTTTACGTTGGTCGGGGAG
+GTGTTAAACATGAAAGAAAGTAAACCGCTTAGAAAGTTCAGTAAGGCAAAAATAGAAGAA
+GCAAGGAAAAGACTTGATAAATCATCTCGAGGTTCAGATGAAGAATATTATGCACACCTG
+TTAGCAGTAAATGAAGAACTTAAGATATTAAGAAGGAGGGCCAATAGTTGTATTCTGAAG
+TAAAACCTCTTTCTAGAGAAGAGCTAATAGACGAAAGGTGTTTTGAAATTGGAGAGATAT
+ACTATATAAACGATTCGTTGATAAACATTCCTAACGTAGATAGACTAAAAGATGGTTCAC
+GAAAGATACATGAGGGGAGAATGGTTGTAATTGTTCATCATAACGAACAAAACTACAATA
+AATTTTGTCCAGTAGTTGCAGTTACACCTTTATCAAGTCGTGTAGATTTGAAAAGGCCAT
+TTGATTTAATATTAAAGAAAGATGATGTAGATGGTAATTTAAGATATGACAGCATAATAC
+AACTCCAATTAATTCAACCCGTGTTGAAAGTAGATTTAGAAAGGTGTATAGGCAGATTGA
+AAGAATATAAAATTGAAGAATTGATTGCAATGCAACTCGAAATGATTGGAATAGAGTAAT
+AAACGAAAAAAAGAGCGGCAACCCCACCCGAGCGGTTAGCCGCTCTTTTTTGCAAACATT
+TTGCTAACGTAGCAAACCAAAAATGATGTGAAAAGGTAAAAAAGAATAACAATATTAACA
+CTGAAAAACGTTGATTTTTCGGCATTTTTACGAAATGGGTATAAATGACTGATAGAGGGT
+AAAAATACTTTTATGGGTTTCCTAAACCGCAGGTCAGGGGTTCGAATCCCTTTGGGCACA
+CCAGAAAAGCCGTTAACCATTCAGGTTGATGGCTTTTCTAATTTTTAACTCTAATTTTTA
+ACGGCCTTTGCTAATAATGCTTCCGGACGGAATGTAGGAACAACGACTTATCAGATAATA
+AGGGAGAACAATGTTATCTGAATTGTGGATCGGTATTGAATGTTTTCGGAAAACAATGGG
+TTTGACAATGAGCATTTTATTGGTTATAATTTTATTCGCAATGTTTGGTAGTTGTTTTGC
+TTTATACCTGTTTTATTAATCGGAGGATTGGACGCAAGTTGGAATTTGAAGCAGGGTCAC
+ATCATTGGTTTATGAGAGAGGCCCTGAAAGAGGCCTACAAGGCATATGGCAAGAACGAGA
+CGCCCATAGGGGCGGTGATGGTTAAGGATGGTTCAATAATTGCCAGGGGACATAATCAAA
+AGGAACTTACGAATGACCCCACCAATCATGCTGAGATGGCTGTAATCAGGGAAGCATGTG
+CAAAACTCGGCACGTGGAGACTTAACGACTGTGATTTGTATGTTACATTGGAGCCTTGCA
+CAATGTGTGCCGGTGCAATTATTCAGGCCCGGGTTGGAAGGCTTTTTATAGGCTCTCTTG
+ATCCTAAAGCAGGAGCGGCCGGTTCGGTAATAGATGTGCTGAAGGTTGATGCTTTTAACC
+ATAGGGTTGAAGTGACATATGGAATATTGCAGGAAGAATGTTCTGAGATTTTGAAAAATT
+TTTTCAAGGAACTTAGAAAAAGAAAGTCAAATCGGAAGATATGATTTTTAAGTTGATTTG
+ATGAAGTTTTTTGGGGATTATTGAAATTTGAAGGAATAGGATTTTAATATTAAAATATAA
+GTATAAAATATTATATTTATTAAAATACGGAGACGTATCGAAGTGGTCATAACGAGCCTG
+ACTCGAAATCAGGTTGTCGCGCAAGCGGCACGTGAGTTCGAATCTCACCGTCTCCGCCAC
+GAACCTGTTTGCGGGAAATATCCGCAGACAGGTTCTTTATTTTATGTTAAAGATTGAAGA
+AACAGTCTGGCAGTATGTAAAAGTTCCGGAAGGACAGGAAATTGGACAGGTGGAAATCTT
+GTTTGAACGGATTGACAAAAAAGTTGTACAGGAAGAAGAGTCACACCTCCTTAATATGAA
+ACATAGAATGATACAAAACAAGAAATAATGCCATAAAAGCCGGAAAGGAATGGGGAAGAG
+TGTATAATACGAACAACAAATGGCCATATCCTTGTTTTTCAAACGCGCCATTATATACTT
+CACATAGTATGCCACACGGTATGTACGGTGATAAAGTGTACCAGTGCCCGTATTTTCTGA
+ATATTCCAATGTATAACTTCAGCCTTTGCAGCCCGTTTTTGCCTCAGTATGGTCCTTGTA
+CGGAGAAGGCGAAGCCTTGCGATGTGATTAAATTGAAGGACTATGGTCCAGAGCCTTTTG
+TAGTAAATATTGAAGAAGCTGCAAAGCAAAACGACAATTTTCGCACGGCTTTGTGGACAG
+GAGAGCATTTGCAGCTTACATTAATGAGTATAAATGTCGGGGAAGACATAGGCCTCGAAA
+TGCATCCTGACGTCGATCAATTCATACGTATAGAAGAAGGCCGCGGACTTGTTAAAATGG
+GCGACAGCAAAGATAATCTGGATTTTCAAAGAAATGTGCATGAAGACTGTATAATTATCA
+TTCCTGCGGGGAAATGGCATAATCTGATAAACACAGGTAACAAACCGATAAAATTGTATT
+CCATTTATGCGCCGCCGAACCATCCTCACGGTACGGTTCATGTTACTAAAAAGGATGCCG
+GTGAGTAA
+>NC_009012.1|provirus_3339258_3389049
+GTGAGCGACCATATCGCCAAGCGTGATGGAACAAAAATTTTAATTGAAATCAACACCGCA
+GATGCCACAGAAGAGGACATAAAGAATCTCTACGACCTTCTTTCCAAGCTGTTTGACGAA
+ACAAAAGAGAATTACTCACCAATGGTTCATTACATGGTTGGAGAGATATTAGAGCCTGTG
+ATGATGAAGATGGCAAGCCTCATGAAACCAAAGAAGCCGGGTGTGAAGGCAGGTGAGTAA
+GAAAAAGTATATTGTACGCTGCCCTCATTGCAATCATGGAATGTTTGATGCCGATTATGC
+TGATGTTGAAATCAAATGCCCGGTATGCAGAAAGGTTTTTGAAGTAAAGCTGGAGAAAAA
+GGCGGGGTAAAAAGTGAATAAATCTGGCCCAGAGCCACAAAGGGAGCGAATGACTCACCT
+ATAGAGCCTGGCAGATAGTCTTAAAAACTATTTGTCAGGCTCTATTTATGTTCTCGGAGG
+AGGTGAGAATTTGAAAGTGACAATGATGGACGCAGCATTAAAATACGCAGAAGCAAATAT
+CCCAGTCATACCATTGCATTGGATTTGTGAGGATGGCTCCTGCTCCTGCAAGGAAGGGAG
+TAATTGTGACAGCAAAGGAAAGCATCCGTTATATACCGGCTGGTACAAGAATTCCACTGC
+TTATGTTGAGCAAATAAGGAAATGGTGGACGAAAACCCCCAATGCCAATATAGGCATTCC
+TACAGGCGAGAAGTCTGACTGGCTGGTACTTGATGTGGATGATGGCGGTGATGAAACCAT
+ATCTGCACTTGAAGCAACACATGGAAAACTCCCGGATACGGTTACTGCTGTTACAGGAAG
+TGGAGGTTGGCACTATGTCTTTAAATACCCTAAAGGCCGGAGTATCCCAAATAAGACCAA
+GTTTGCATCGGGTCTTGATACGCGTTCAACAGGTGGACTGATTGTCGTGGCTCCAAGCAT
+TCATGTAAGCGGTAATCAGTACCAATGGTTAGAAGGACATTCTCCCTTTGACAGAACCCT
+GGCAGAAGCTCCGGAGTGGCTATTAAAGCTTATGGAAAGGGAGGAAGTATTGCTTACACC
+CTTTGAAGGTAGCAGTATTATAGTCGAGATTAAGGAAGGAAACCGCAACAGTACCCTGAC
+AAGCCTTGCAGGAACCATGAGAGCAAGAGGAATGACGGAGGAAGGCATCTATACGGCATT
+ACTTGCAGAAAACAACGCAAGGTGCAATCCTACGCTTGATGAAGCGGAAGTTAAGAAAAT
+ATATAGTTTAGATTTTCAAAGAGTTAGTAACTTGTAAAGAATTATAATATATACGCACAA
+AGCCGCTTGATTTTTGCAGAGGATCTTTGTACAGTCATAAAGTATTTACATATTGCCTGA
+ACAATTCAGCTTTCAGGAGATAAGGAATATACATGTTGGATTTTTCTGGCTGTGGGTTAT
+TGCAGCGGTGTCTGCAGTATTAATTGCGGCAATAGTTGCTGCTGTGATTCATAATATAAG
+AAAAAGGAGAAAAGAAGAGGAGGAAAACGAGCTGGCGGCGGCTTGATTTGTAAAATAGGT
+ACGTTCTACTTGCTTTTTCAGAATAGAAATAATATAATAATGCCAGGAAAAGGCAGAAAA
+GTTTCCTGGCATTATTATAATGCAACCACGGATTGCAAGCATTGGGATGATAATTTTGAG
+GTGATAAAATGGCAACTATAACGTTATATGCCGGAAAAATCAACCAAATGCCCGGATTGA
+TAAATGAAGTCAAGAAATCTGTGGTGGATTACAAGTCAGAATTATCCGCATTGAGAAAGA
+AAACTTTGAACATCAACAGAAGTGTATGCAATTTGGATGAAGTAATAAGTTCCATACAGG
+CATCTTCCCAGACTCAGGATAGAAAAATTGATTCACTTGAGAAATTCTGCAGTGAAAGTG
+AGAAGTTTATATCGGAAGTAATACGTATCGATGAAGAAGTTGCTGAGCTTATCAATAAAC
+GGAAAGAAAATTTTTACAAAGAATATTATTATTTAAAACCGGAAAGCGAGAAAAGCGGCT
+GGGAAAAAATCAAGGACGGCTTAAAGTCGGTTGCGGAGTGGTGTAAAGAGAATTGGAAAT
+CCATTGCCAAGATAGTGGCTGCCGCAGTAGTTATTACCGGGTTAGGGATAGCGGCGGCAT
+TGACAGGAGGGGTATTGGGAGTCATACTGGCAGGAGCATTCTGGGGAGCATTGGCCGGAG
+GATTGATAGGAGGAGCGGTTGGAGGAATAGCCGCGGCGATAAATGGAGGATCGTTTCTGG
+AAGGATTTGCGGACGGGGCATTAAGCGGAGCGATTTCCGGAGCGGTAACGGGAGCCGCAT
+GTGCCGGGCTGGGTGCTTTGGGAGCAGCGGCAGGAAAAGGAATCCAATGTATGAGCACAG
+TGGGAAAAGCGATAAATGTTACATCAAAGGTTACGGCAGCACTCTCGTTTGGTATGGATG
+GATTTGACATGCTGGCAATGGGAGTATCATTGTTTGATCCATCCAACGCATTGGTTGAAT
+TTAACCGGAAGCTGCATTCCAATGCACTTTATAACGGATTCCAGATTGCTGTAAACGCGC
+TGGCTGTTTTCAGTGCCGGGGCGGCATCGACAATGAAGTGCTTTGTTGCAGGTACAATGA
+TATTGACAGCGGCAGGTTTGGTTGCGATAGAGAATATCAAGGCAGGAGACAAGGTAATTG
+CGACGAATCCGGAGACTTTTGAAGTAGCGGAAAAGACGGTGCTTGAGACATATGTGAGAG
+AGACAACGGAGCTTTTGCATTTGACAATCAATGGAGAGGTAATCAAGACAACCTTTGAGC
+ATCCGTTTTATGTAAAAGATGTGGGTTTTGTTGAAGCGGGAAAACTGCAAGTAGGAGATA
+AGTTGGTTGATTCAAAAGGCAATGTTTTGGTGGTGGAAGAGAAAAAGCTTGAGATAACAG
+ATGAACCTGTTAAGGTTTATAACTTCAAAGTGGATGATTTTCATACTTATCATGTTGGGA
+AAAAAGGGATATTGGTACATAATGCAGACTATAACCCCAAAATGGGATTTGATGATTTGG
+ACCTTGAGAAAGCTACGAACAAACAAAAAGGCAATTATGGAGAGTATCTGGCAGATGATA
+ATCTTATTAATAATCCAAAATTGAAAGAAGCAGGGTATGATTTGGAGCGGATAGGAGGTA
+AGGTTCCGACCTCACCGGATGATAAAATTACAAAAGGGATAGATGGGATATATATAAATA
+AGAATCCTGACTCAAATGTTAAATATGTAATTGATGAGGCGAAATTTGGAAAAGCGGGAC
+TTAGTACAAAGACAAGAGATGGAAAACAAATGTCGGATTCTTGGCTGATAGGTGATAAAA
+CAGGTAATGATAGAATTTTAGAAGCAGTGAATAATGATAAACAATTAGCAGCTGGTATAC
+TCGATGCATTACAAAACAACCAAGTAGAAAGAGTGTTGTCAAAAGTGGATGCAAACGGAA
+ATGTAACGACATATAGACTGGATAGTGATGGTAATATAATTGGAGTTTGGCCATAAATAA
+TTGAAAGGAGGTAATGATATGAGAGATCCATTATGTGATAAAAAAGATTTGATAGAAACG
+ATAGAATTTAACCAAAAGGCTATTTTAAAAATGAAAGAAAAAATTATTAATCTGAAGGCC
+GACATAGAGAATGGTATACAAAGATATCCAAGAGATAATCAAAGTATAATTTATGGTACA
+TTTAAATTAATGTTTATGTATGGAATGAGTACACTGAGAGCAAAATATTCTTTGGGAAAT
+GAGCCGGATGCAATGATAAATGATTATTTAGATAATATAACGTATTTAGAGAATATGGGA
+GAAGAAGAAATAGGATATATTTTTCTTTTATGGATGGTGGGACTGGGTATCCTTTTGGAA
+GTGGATAAAGAAGAATTGAAGAAGTTGGCGAAAGTTATAGAGAGACGAAAAACAGAAGAT
+GCACTTATAGATTTTCTTTTGAAATCCTGTGATATAGGTTGGAACCACAGTACAACGAAA
+TATGAAAAAAAGAACCCGTATGAAAAGACAGCAGAGATTATAAAAATAGCATTGCACGAC
+AAAGACAAGGAAGCGGCATCTAAAAGGCTTGAAAAATATATGGAAAAAGAATGGTTCAAG
+GGGCACTATGACTTTGAATGGAGGAATGCGCACAAGAGGCCGGGGTATTATGGTTTTTGG
+AGTTTTGATACAGCGGCACTGGCCAAGATACTGGGACTGGATGACAGTGCACTGAAAAAC
+AACAACCATTATCCTTATGATTTGGCACACTATAAGAAGGGAATGACCTTTGATTTGAGT
+TGGTATAGTGTACCAAAGGAAGAGGAAGATAAGGAAGAAGAAACGGTGGTATATGGTATA
+CCGGGTAATCCTGAGTTGGAGAGGATAATACCTGGGAAGTTTCACAGTTTTGTAAATGAG
+ATAATAAATGATTATAAAACACTGCCGGACGAAGAATTTTGGAAGAAATACAATTTGAAA
+GAAATCTGGTTTGATGTGGAGGAGTATAAGGAGGATAATAAAGATAAGAATTTGCTAGGA
+ACGATTATAGTATTCATGCTTGTGGACAAAGATTATATTTTGCAGTTGGATTATAAAGAA
+GAGTTAATAGACTATATAGAGAATATACATAATTACTGGGCCAAGAAAGAAGTTAAGCTT
+ATAAGCTTTGAATTAGACAATGACCAGCAGTACTATGCATATGTGCCGAAGGATGCGGAG
+GTTGGTTCGTTGTATGAGGTAAAACTGACAGAAGTGGAGAAAATAGAGGAGGTTTAGTGT
+TTATTGTGTAATAGTGTGAAGAAGATGAGTTGTTTATGAAGAATCTGCTGTATAATTGGA
+TATATATAGTTTGATTTTGGGAATCTCCTTCCTGGCGAAACAAAAACTATAGGACAGTAT
+TTGGGAAGGAGTATTTTTTGTGTTATTTTTTTTGGGGAAGATAATATTGTATTGAGAATA
+ATAAGAAGTTTTATTAGGATTGTTTATGGTTGTCAATGTTAATATAATCAATGTTAATAT
+AATCAATGTTAAAAGGTATAGGAACAGAACCATAGCAGGGGAGAGTCAAAATGTACATTT
+GGCAGTGAAAGATAAGCTGAAAAAAAGAGGGGCGTTCATTTGAATTAATTCCTGAAGATC
+TTGATGTTTATAAAGAAGCATTGGATTTATGGTTGAGTCCAAATTTGGAAGAGGTTAAAA
+GCGTGATTGATAAAATGATATTGTATCATTCCGTATTAGTTTCGGACATTGATAACGAAC
+CGGAATTTGGTGATTACACGTATGGATTTTATCCATATGAGATATTGTTTTTAATGCATA
+TAAGGAGGAAATTAGGTTTGCCGGTACCGGATAAATTTGAAGACTTGCTGATGAACACAC
+CGGAAGCGAAGGTGGTGATTAATGAGCCGGAGCCATATCCGGAGTGGGATCCTTTGTTGA
+GAGCCATAGATGAGTTTTACCGAAAGAATTATCCAAATTACATTCCCAACAAGCATGGAA
+AACTGTTTGAATAGGAGGAAACTGTTATGGCAATGGAAGATATAGTTGGGATTATATTTG
+AAGACATTGAGGAAGTGAAACCAATTTTAAGTGATTCGGAAGGAAATGATTTGGAAGGAA
+ATGATTTGAGTGAGGCGATATTGGAATACGGGATATCGGAAGGGAAGTTTCTGTGTGTTG
+ATTATGGTGGAGAAGAGGGGAGCGAGATAATAAATTATATAATGGATTATGAATTCAGTC
+ATGGAATAGAGCTTGCAACACAGGAGGAGTTGGAAGAGCTGGACGAGATGGAGTATGATG
+ATTTGACAGATAAGATAAAAGAAGTGAACAAGATATTGGAGAAAGCAGGGTATGGACTGT
+TTTGCTTTCCAACAGGAAGTGATTTTTATGCGTTGTTTATAGCGAAGTTGGAGGATAAAG
+AGAAGTTATTGGAGGAAAAGATAGTTGATGATGAGGAGTTGCCATTGGAAGAGAGGTATA
+TTCAGTATTATGTGTAAGGGGATAATCTGCAGTATTTAGAGTTTTGGATAAGAATATGGC
+TTTTATAAAAATATTGGCAGTGTAAATATTTTTGTGTAAACTAATTTTCCTTCTATGTTA
+GTGTTTAAATATATTTTAAGACTCGAAAGTCTGCTTTGTCAAATTTTATAGATTCAAAAG
+AATTTCTGATAAGAAATTCTTACAAAAGAAAAATTTGACAAAGATGATGCGTATAAAATA
+TTACAGGGGGGGTTCAGGAAACCAGAGTTTCCCTGAACCCCTTGATTATACTATATACGC
+CCTTCGAACATAATCTGTAGCTGTCCCAGTATCAAACCCCAGTTTTTGTAACGCATCGTC
+CATTTTGAAGTAATCTTTACTGTAGCTAAATATATGCTCTTTAAAAGTGACTGGTCGCCA
+GGAAATACTGTCCTTGATTTGTTTATCCTTCTATAACTGCTATTCAGGCTCTCAATAGTA
+TTGGTCGTATACATGATTTTACGTAGTTCCTCCGAATACTTAAAAAATGGACAAATAACA
+TCCCAATTGCTCTTCCAGCTCTTCATAGCTGCCGGGTATTTCTTCTCCCATTTCTCTGAA
+ACCTCAAGCATCTGGTCGTACCCTGCCTTCTCATTCGGAGCCGTATATATCCGTTTCAAG
+TCCCTGGCAAATTCCTTTCGGCCTTTATCTGACACATACTTTAGCGTGTTTCTTATCTGG
+TGTGTTAATGTCAATCAAAATTTAGGCCACTTACCGGGGTAAAATTAGGCCACCATTTCA
+TAAAAAATCAGTCATTATTTGCCTGCTTGGAAAGAGCCTGCTTAAACCTGTAGCTTTCAC
+CATTGATGTTCAGAATGTGCGCATTATGGGTCAAGCGGTCAAGCAGGGCGGCTGTCATTT
+GCTCATCGCCTAACACCTCCGTCCATCTTGGAAATTCTAAGTTTGTAGTTATGATCAGGC
+TGCCCCTCTCATATCGGGAAGAGCAGAACTGGAACAACAATTCTGCTCCGATTTTACTGA
+AAGGCACATAGCCTAATTCATCAAGGATCACTAAATGCGGCGCCAGCCATTGCTTTTCAA
+GCTTATTAAGACGATATTCCTGCTGTGCTGCAAGCAATTCATTTATCAAACCAGCTGCCG
+TATAGAATTTGACCTTCATACCCTGCCGACAAGCCTCGTAACCGAGCGCAGTTGCAATAT
+GGGTTTTCCCTACTCCGGAGTTGCCTATCAAAATGACATTTTCTCTTCTTCGGATATATT
+CTCCCTGCATGAGTTTCAATACCCGCGGTTTGTTCAAAGAAGGTATGGCAAGGAAGTCAA
+AGCTTTCAATCGTTTTGATAACAGGAAAGCCTGCTTGCCGGATCCCTCTCTGGATCCGGT
+TATTCTCCCGCTGATGTACTTCCTGTTCCAGCACACACAGCAGGTATTCTTCATAATCCA
+GATTATTGTCTGCGGCTTCTCTTGCCAGGGATTCATAGGTTTTTGCCACCTGTGGCATCT
+TTAGCTTCTTCATGTAAGTTTCGATAAGCATTTTATTGACCGGCATTATTGTCCACCTCC
+TGACATGAGAGCGCTGTATTTGCTGAGATCAGGAGGTATTACAACAACCTCGGGGATGCC
+CTGAAGCTTGTCTTTGCTGACAGGAGCCGTCTTAGGACTGCCTGAGACCAGTAGCTGTCC
+TAATATGTTAAATACACCGTCATAACTGTATACATTGTATGCCATAGCTATTTCAATAGC
+TTCTGTCACCAGTGCCGTAGGGTAATCCCTGTGCAGCATGAGTATTTTTACGAATTCCCT
+GTTGCCTCTCGGACTTCTGGCATTTAAGCTTCGACGATACTGCTCATAAACGGGTGCCAG
+CATCTGAGGTTTATATACTTTTGTGTTGCCCAGGGCGCGTGATTTTTGCAGCAGCAATTC
+CAGATAGTGATCAAGCTTTATCTGCTCCTGGTAGCGTCCGTATATCCTTGGATGGCTTGC
+TATCATTGTTCCTTTGTTTAGTATTTTTACTTCATCCGCAGTAGCTTTAACAGTGACTTT
+CTCTCCCACATATATCGTGGGAACAGAGTATCGGTTAGTTTCAAACTGTACCATAGAATA
+GCGGTTGACCTTTGCCTCTTTATACCTCGCACCATCAAACCTTACCGCCGGTAATGGCCT
+CAAAGCTGCCCTTTCCGCTTCCCATTTCGGATTGCTTTCCAAAAGCTTTATGCATTCGTT
+GTGCAGATATTCATTCAACTCCTCAAATGAATCAACCTCGGGGTAGGGAACGAAGAACCT
+TCGCACAGCCTCTTTGCCCGCATTCTCTACACCACCTTTATCGCTCCCTTTTGCCGGCCG
+GCAGAATGAAGATTCATAAAGGTAATGGGTTCGTAAAGCGATAAACTGCTCCTGCTCTTC
+TCTGTTGCTGCCTTCGAGTATCTTCTTCACTGCCGTTTTCAGATTGTCGTATGCTATCTT
+GTATGGTACACCGTTCATGAACTCAAAGCATTTGATATGGCCATCAAAGAACGCCTCCTG
+TTTCTCAAAAGGGTATGCTCTTACGTAGAATCCGCCTGATCCTCTCAACTTCATTACAAA
+CAAATGTGCCTTGGTTTCTTTGCCTTTTAGATAAAAATATGCTTCTGTCCAATCTACTTC
+TGCATATGCTCCCAACTCGAACTCCAGTGGCAGGAAAGCTTCCCTTTGTTTTCGGTATTC
+CTTTCTCAGGTAATCCATTACAGTGTTGTAGCCGCCTGAAAAGCCTTCTTTTTTAAGTGT
+CTCAAATATTTTTGTCCCTGTATGGCGTTGTTTGCGGTGTCTGGTTTTATCATCTTCTAT
+TATCTGTTTGATCATTGGTATGTACGGCCCTAATACCGGATGCGTTCTTTCCTTTGTCAA
+CTTGTACTTAGGTGGTTTTGGTTCCTCCAGCGAAATATATTTTGAGATTGTATCCCTATG
+TATCCCAGTCCTCCTGTTAATTTCCCTGATACTTAAGCCTTCCATGAAGTACATTTTTCT
+GATATCCTCTAATTGAGCCATCTTAATCATATCCTTTCCTCCTGTACGATAGTGTCTGTT
+CAACAAAATCATACAGGAAATTTGATTAAGGTGGCCTATTTTTTTGCCGGTATATGGTAC
+ATTTTTAGAGTAGCATTAACACTGGTGTACTATACACCTCTGATATTCAGTATTCGGAAA
+AGCCGCATTGATTGCATCCTTTATCCCTGAAAGTGCATCAGCACAGAGAATCAGGATGTC
+TTTAACTCCTCTGTTTTTAAGGTCTTTTAAGACACTCAGCCAGAATTTTGAGCTCTCATT
+TTCTCCTACATAAATACCGATAACATCTTTCTGCCCTTCTATATCAATTGCCAGCACAAT
+ATATACGGCCTTCTTCGAAACAATGCCGTCATTTTTTACTGAAAAATGAATTGCGTCAAT
+AAATACTATCGGATAAACCTCTCCCAGAGGCCTTTTCTGCCACTCTTCTATCTGAGGTAG
+TATTTTATCAGTGATCTTACTTACCATCTCGGCAGATACTTCAAATCCGTAGATTTCCTG
+TATCTGCTCATTGATTTCTCTGGTAGACATCCCCCGCGCATACATTGCTATTATTTTATT
+TTCAATTTCTGAAATGTCCCTTTTATACTTGGGAACAATTTTCGGCTCGAATTCTGCATT
+CCGGTCCCGCGGGATATCTATTTCTACTTGCCCTACACTTGACTTTAATGTTTTTGATGT
+GTACCCGTTACGGTAATTTGATTTCGCTTCTTCAGTTGATTCGTACTTTTCATATCCGAG
+ATGTTCATCCAGCTCTGCTTCCAACATATTTTGTATCGTATCTCCGAGCAGATCCTTCAA
+TGCTTCCTGCAAATTCTTTGCTCAAGTGATGTTGTACTCAGAAATGAGATTTCTGATAAG
+CTCTTTCTTTTCTGGTGTTATTATTCTTTTTCTTGCCATAAAAAACTCCTCCTATACTTT
+AGTATTCTATCATAGAAGGAGTCAATTAGTTTACATAAATATTTTACAGTCTCTTAGCTT
+GTAAAGAATTATAATATAATATATATGTACAAAGTCGCTTAATTTTTGCAAAAGATCTTT
+GTATAATCATAAAGTATTTAGATATTGCCTGCACAATTTCAGCTATAGATTCAAACAAGT
+TGTTATGCGTTACATTCATTCGGATGTCTTTCAAAAGGTGATCGATTGAATTCAACTCGG
+AGCTATAAGGAGGCAAATACTTAAGGGTAATGTTCTTTATTGAATCCAATGGGAGTATAA
+ATAATTTCATGTATTAAAAATTTTTCAGTTCTTCCTGGCAAGAAATTTTAAGTTTTCAAA
+GTTTACAGAATGTAAATCCTAAATCACTTCAATATTATATATTATTGCCGGTTTTGCTAA
+GTTTTACACATAAATTTGATTTAATTCGTCTATAATTATTTATAATGGAGTGTTTTGCCC
+TTTTTCGCTCAATTATCAACGAATTGGTTGACGAAAACCGGTGCAAGGTATATGATAACG
+GCAGGGAAATAGATTTCAAATATTACAGTGATAACAATACATTAACTTTTACCCTCGGAA
+AGGGTTGGCACAACGTTGGAATTGTCCTTGTGGATATGGCGGGAAATGTAAACAATATTC
+AGGAGATAAGGAATATACATGTTGGATTTTTCTGGCTGTGGGTTATTGCAGCGGTGTCTG
+CAGTATTAATTGCGGCAATAGTTGCTGCTGTGATTCATAATATAAGAAAAAGGAGAAAAG
+AAGAGGAGGAAAACGAGCTGGCGGCGGCTTGATTTGTAAAATAGGTACGTTCTACTTGCT
+TTTTCAGAATAGAAATAATATAATAATGCCAGGAAAAGGCAGAAAAGTTTCCTGGCATTA
+TTATAATGCAACCACGGATTGCAAGCATTGGGATGATAATTTTGAGGTGATAAAATGGCA
+ACTATAACGTTATATGCCGGAAAAATCAACCAAATACCCGGATTGATAAATGAAGTCAAG
+AAATCTGTGGTGGATTACAAGTCAGAATTATCCGCATTGAGAAAGAAAACTTTGAACATC
+AACAGAAGTGTATGCAATTTGGATGAAGTAATAAGTTCCATACAGGCATCTTCCCAGACT
+CAGGATAGAAAAATTGATTCACTTGAGAAATTCTGCAGTGAAAGTGAGAAGTTTATATCG
+GAAGTAGTACGTATCGATGAAGAAGTTGCTGAGCTTATCAATAAACGGAAAGAAAATTTT
+TACAAAGAATATTATTATTTAAAACCGGAAAGCGAGAAAAGCGGCTGGGAAAAAATCAAG
+GACGGCTTAAAGTCGGTTGCGGAGTGGTGTAAAGAGAATTGGAAATCCATTGCCAAGATA
+GTGGCTGCCGCAGTAGTTATTACCGGGTTAGGGATAGCGGCGGCATTGACAGGAGGGGTA
+TTGGGAGTCATACTGGCAGGAGCATTCTGGGGAGCATTGGCCGGAGGATTGATAGGAGGA
+GCGGTTGGAGGAATAGCCGCGGCGATAAATGGAGGATCGTTTCTGGAAGGATTTGCGGAC
+GGCGCTTTAAGCGGAGCAATTTCCGGAGCGGTGACAGGAGCGGCATGTGCCGGGCTTGGT
+GCTTTAGGAGCTCTAGCAGGGAAAAGCATCCAATGTATGAGCACAGTGGGAAAAGCGATA
+AATGTTACGTCAAAGGTTACGGCAGCACTTTCTTTTGGTATGGATGGATTTGACATGCTG
+GCAATGGGAATATCATTGTTTGATCCATCCAATGCATTGGTTGAATTTAACCGGAAGCTG
+CATTCCAGTGCACTTTACAACGGATTCCAGATTGCTGTAAACGCGCTGGCTGTTTTCAGT
+GCCGGGGCGGCATCGACAATGAAGTGCTTTGTTGCAGGTACAATGATATTGACTGTGGCA
+GGCTTGGTTGCGATAGAGAATATCAAGGCAGGGGACAAGGTAATTGCGACGAATCCGGAG
+ACTTTTGAAGTAGCGGAAAAGACGGTGCTTGAGACATATGTGAGAGAAACAACGGAGCTT
+TTGCATTTGACAATCAATGGAGAGGTAATCAAGACAACCTTTGAGCATCCGTTTTATGTA
+AAAGATGTGGGTTTTGTTGAAGCGGGAAAACTGCAAGTAGGAGATAAGTTGGTTGATTCA
+AGAGGCAATCTTTTGGTGGTGGAAGAGAAAAAGCTTGAAATAACAGATAAGCCTGTAAAG
+GTTTACAATTTTAAGGTCGATAATTTTCATACGTATCATGTTGGCGAAAATAGGGTATTG
+GTTCATAATGCGAATAAGTATGTTAAGGGAACGCGTAGTACTCAGTTGACGTTTGATGAA
+GCACTGAAAAAGTTAGACAAGTCAGGCTTACGACCGGGTCAAACAGAAATTTCAAAGAGT
+AGGGTTATGGAAATCGTAGAGAATTATGATCCTATGAAAGCACAAAGCAGTGTGTATACT
+GATTCAACGGGTAGATATTTAGTTGAAGGCCATCATACAACTGTCGCAAATACAATGCTA
+GGAAAAGGATCTGGGGTGAATATGAATATACCTACACAGCAGATACCATCTGCTACAAAT
+GTCTATTGGACAAAAAAGTGGTATGAATTTTGGAAAACACAAATAAAAGTAACAAAATAA
+GAAGGTGATACTTTGGAGAAGTACTCTTTATTCGGAGAATTATTGTATTTAGGGTTTGTG
+TGTGAAAAAGGGAGGTGTAAAAGTTCAGGATTTTGGAAGTTGGGGTATAAGAGAATCCTT
+CATAAACATATTGTCTTACTAAGTAAGTTGATTCAATGTATATTGGTTAGTGAGGTATCC
+GATAACGATGCTTTAATATTGAAAGAGTTTATTGAGTCAATTCAGACAGAAAAAGACATT
+ATTAAATATTACCCAATAAATGAAGATACAATGAAGAAATTACAGGATAGTAATTATTCA
+ATTATTACATCAATTGATTCTGATAGGTGTAATAATAACATTAATCTACTCATGAATGAT
+ATAACAACCGAGATACTAGAATTATTAGATCATAAATTTTTTTTAAACAAGAAAAGGATA
+GCTATGTTAATAAGGGCAATACATAATTTGCCACGCGTATACTTAGGAAAGGGGTTGCAC
+ACTTTGTGCAATATAGAGCAGCCTGCTATTGATTATAAAGCTGCACTTGAATATTCCTTT
+AATAACATGGATGAAGATACTAGACAGAGGTATAGAAAATACTATCAGTAGACGGTAGAA
+GATGTTAAAATGGATTATACTCATATTACCTTTACCGTTTTAGATTGAAAAGTTTAACTA
+ATACCCGGCAAGCCAATATAACGGCAAGTCGGGTTTTCTTTTTATCCATACTTGACAATA
+TGTAATACATTGTGATACAATTAAACCAACAAGAAATACAGGAGGTGCAATAATGTCTAC
+AGAAAAGGATAGTATGCTACGGGTAAGGCTTACACAAAGGCAGTCGGATGAGTTGGATGC
+TATTATTGGTGAGCTTCAAGCACAAATGCCGGAAGCAAGTGTTACCACATCAAGCATAGC
+AAGATACGCTCTGGAGAAATATGTGAGCGACCATATTGCCAAGCGTGATGGAACAAAAAT
+TTTAATTGAAATCAACACCGCAGATGCCACAGAAGAGGACATAAAGAATCTCTACGACCT
+TATTTCTAAGCTGTTTGACGAAACAAAGGAGAATTATTCACCAATGGTTCATTACATGGT
+TGGAGAGATATTAGAGCCTGTGATGATGAAGATGGTAAGACTTATGAAGCTAAATAAGCC
+GGGGGTGAAGGCGGATGAGTAAGAAAAAGTACATTGTCCGCTGTCCTCACTGCAATCATA
+GAATGTTTGATGCCGATTATGCTGATGTTGAAATCAAATGTCCGGTGTGCAGAAAGGTTT
+TTGAAGTAAAGCTGGAGAAAAAGGCGGGGTAAAAAGTGAATAAATCTGGCACAGAGCCAC
+AAAGGGAGCGAATGACTCACCTATAGAGTCTGGCAGATAGTCTTAAAAAACTATTTGTCA
+GGCTCTATTTATATTCGGCGAGACAGGAGGTGGGAAGTTTGAAATTGACAATGATGGACG
+CAGCATTAAAATATGCAGAAGCCAATATCCCAGTCATACCATTGCCCTGGATTTGTGAGG
+ATGGCTTCTCTCCTGCAAGGCAGGGAAAAATTGCGACAGCAGGGAAAAGCGTCCGTTATA
+TACAGGCTGGTACAATGATTCCACTACTGATATTGAGCAAATAAAGAAATGGTGGAGAAA
+AACAACCAATGCCAATATAGGCATTCCTACAGGCGAAAAGTCCGGTTGGCTGGTGCTTGA
+TGTGGACGATGGTGGTGATGAAACTCTATCGGCTCTTGAATCAACACATGGAAAGCTTCC
+GGATACGGTTACTGCTGTTACCGGCAGAGGAGGTCGGCACTATGTCTTTAAATACCCTAG
+AGGCCGAAGTATTCCAAATAAGACCAAGTTTGCACCGGGTCTTGATAACCATTCAACAGG
+TGGACTGATTGTCGTAGCTCCAAGCATTCATGTAAGCGATAATCAGTACCAATGGTTGAA
+AGGACATTCTTCCTTTGACAAAACCCCGGCAGAAGCTCCGGAGTGGCTGTTAAAGCTTAT
+GGGAAGGGAGGAAACATTGCTTACACCCTTTGAAGGTAGCAGTATTGTAGCAGGGATTAA
+GGAAGGCAGCCGAAACAGCACCCTGACAAGCCTTGCAGGAACCATGAGGGTAAGAGGAAT
+GACAGAAGAGAGCATCTATGCAGCATTGCTTGCTGAAAACAACGCAAGGTGCAATCCTCC
+GCTTGATGAAGCGGAAGTTAAGAAAATATATAGTTTAGGTTTTCAAAGAGTTAGTAGCTT
+GTAAAGAATTAATATATACGATATACGCACAAAGCCGCTTGATTTTTGCAAAGGAGCTTT
+GTACAGTCATAAAGTATTTACATATTGCCTGAACAATTCAGCTTTCAGGAGATAAGGAAT
+ATACATGTTGGATTTTTCTGGCTGTGGGTTATTGCAGCGGTGTCTGCAGTATTAATCACG
+TCAATAGTTGTTGCTATGATTATAATATAAGAAAAAGGAGAAAAGAAGAGAAGGAAAACG
+AGCTGGCGGCGGCTTGATTTGTAAAATAGGTACGTTCTACTTGCTTTTTCAGAATAGAAA
+TAATATAATAATGCCAGGAAAAGGCAGAAAAGTTTCCTGGCATTATTATAAGGCAACCAC
+GGATTGCAAGCATTGGGATGATAATTTTGAGGTGATAAAATGGCAACTCTAACGTTATAT
+GCCGGAAAAATCAACCAAATGCCCGGATTGATAAATGAAGTCAAGAAATCTGTGGTGGAT
+TACAAGTCAGAATTATCCGCATTGAGAAAGAAAACTTTGAACATCAACAGAAGTGTATGC
+AATTTGGATGAAGTAATAAGTTCCATACAGGCATCTTCCCAGACTCAGGATAGAAAAATT
+GATTCACTTGAGAAATTCTGCAGTGAAAGTGAGAAGTTTATATCGGAAGTAATACGTATC
+GATGAAGAAGTGGCTGAGCTTATCAATAAACGGAAAGAAAATTTTTACAAAGAATATTAT
+TATTTAAAACCGGAAAGCGAGAAAAGCGGCTGGGAAAAAATCAAGGACGGCTTAAAGTCG
+GTTGCGGAGTGGTGTAAAGAGAATTGGAAATCCATTGCCAAGATAGTGGCTGCCGCAGTA
+GTTATTACCGGGTTAGGGATAGCGGCGGCATTGACAGGAGGGGTATTGGGAGTCATACTG
+GCAGGAGCATTCTGGGGAGCATTGGCCGGAGGATTGATAGGAGGAGCGGTTGGAGGAATA
+GCCGCGGCGATAAATGGAGGTTCGTTTCTGGAAGGATTTGCGGACGGAGCATTGAGCGGA
+GCGATTTCCGGAGCGGTAACAGGAGCGGCATGTGCCGGGCTTGGTGCTTTAGGAGCTCTA
+GCAGGGAAAAGCATCCAATGTATGAGCACAGTGGGAAAAGCGATAAATGTTACATCAAAG
+GTTACGGCAGCACTTTCTTTTGGTATGGATGGATTTGACATGCTGGCAATGGGAATATCA
+TTGTTTGATCCATCCAATGCATTGGTTGAATTTAACCGGAAGCTGCATTCCAATGCACTT
+TACAATGGATTCCAGATTGCAGTAAACGCGCTGGCTGTGTTTACTGCCGGAGCGGCATCC
+ACAATGAAGTGCTTCGTTGCAGGCACGCTGATATTGACTTCGGCAGGCTTGGTTGCGATA
+GAAAATATCAAGGCAGGAGACAAGGTAATTGCGACGAATCCTGAAACTTTTGAAGTAGCG
+GAAAAGACGGTGCTTGAGACATATGTGAGAGAGACAACGGAGCTTTTGCATTTGAGAATC
+GGAGGCGAAGTAATCAAAACAACCGTCGACCATCCATTTTATGTTAAAGATGTAGGTTTT
+GTTGAAGCGGTGAATCTGCAAGTCGGAGACAAATTGGTTGATTCAAGAGGCAACGTTTTG
+GTAGTGGAAGAGAAAAAGCTCGAAATAACTGGTGAACCTGTGAAAGTTTACAACTTTAAA
+GTTGATGACTTTCATACTTATCATGTTGGGAATAAAGGGATATTGGTACATAATGCGAAT
+TATAATCCTAAAACTACCTTTGAAAATCTGGATCTGGAAACCGCCAGTAACAAGCAAAAG
+GGTAATTATGGAGAATATCGTGCGAACGATAATTTAATTAACAATCAAAGTCTGAAAGAA
+GAAAGATATAATTTAAAACGAAAGGGGAGAAGTGCACCGACATCTCCGGATGATAAAATT
+GTAAAGGGGATAGATGGAATATATGTAAACGAGGATCCAAACTCAAATATTAAATATGTA
+ATTAATGAGTCAAAGTTTAATAGTGCACAATTGGGGAAAACGAAAAAAGGCATAAAACAA
+ATGTCGGATGAGTGGCTCCTTGAGAAACAAGGTAAAAGAATTTTAAAAGCAGTTAATGGC
+GATAGAAAGCTGCAAAAAGACATATTGCAAGCGTTAGATGATGGTCAAATAGAAAAAGTT
+TTATCACGAGTTGGCAAAGATGGAAAAGTGATAACATATAGACTGGGCAGCAATGGTGAA
+ATAATCGGACTTTGGCCATAAATAATGAATGAAAAGGAGATGAGGATATGAGAGATCCGT
+TATGCAGTGAAAGTTATTTGTTAGAAACAATAGAATTTGACAAGGAAGAAATTTGTGAAA
+GAAAAAAAAAGATTATTGTGCTGAAAGATGATATGGAAAAGGGCATACAAAGATATCCAA
+AAGACAATCAAAGCATAATTTATGCTACATATAGAGGAATGTTTATGTATAATACAGAAA
+TACTTATAGCTAAATACTCTTTAGGTAGTCATCCGGATGAAATGATTGAAGATTATTTAA
+ACGGTATAGAGTATTTGGAAAATGTCGGTGAAGAAAAAGTATGGTATATTGATCTTTTGT
+GGATGCTATCGTTAGGTATACTTTTAGAGGTAGACAAACAAGATTTAAAAAGGCTTGCTT
+GTGTGATAGAGAAGCAAAAAAAAGAAGACGCACTGATGGATTTTCTTTTAAAGGCTTGTG
+ATATAGGATGGAATCATAATACAAGTGAATATGAGAGAAAAAATCCATATGCAAAGACGG
+CTGAAATTATACAAATGGCATTGCATGATAAAGACAGGGAAAAAGCTTCGAAAAGGCTAC
+AACAATATATAGAGAAAGAGTGGGTTAAGGGACATAATGATCTGGACTTCAAAAATGCGC
+ATAAAGAACCCGGCTACGTTGGCTTGTGGAGTTTTGAGGCTGCAGCATTGGCAAAGATAC
+TGGGATTGGACGACAGCGCACTGAAAGATAACAACCATTACCCTTATGATTTGGCGCATT
+ATAAAAATGGAATGAGTTTTGATTTAAGCTGGTATGGTGTGCCAGTTGAAGAGGAAGCCA
+AGGAAGAAGAGGCAATAGTGTATGGAATACCGAACAAACCTGAGTTGGAGCAAATAATAC
+CTGCAAAATTCCACAGTTTTGTGAATGAAGTGATAGGAGACTACAATACATTGACTGATG
+AAGAGTTTTGGAAGAAGTATAATTTGAGAGAAATCTGGTTTGATGTTAAGGAGTACGAGG
+AAGATAATAAAGCCAAAAATATGTTGGGAACGATTATAGTATTTTTGCTTGTAGAGAAGG
+AGTATATTTTGCAGTTGGATTATAAGGAAGATTTGGTAGATTACATAGAAGATATAGATA
+ATTATTGGGGTAAAGAGGAAGTAAAGTTGATAAGCTTTGAAGTGGACAATGACCAGCAGT
+ATTATGCATACGTACCGAAAACCGCAGCAATAGATTCGTTGTATGAGGTGAAATTGACAG
+AAGTGGAGAAGATAGAGGAAGTTTAGTCTTATAGTGAAGGATTGAGATTATTAAAATGAG
+GATGGATTTTGATATTATTTCAGTGAACGATGTAAAAAACGTTAATTGAATTTTATATAA
+TGCGGGCGGTAATGGTAATTCTGCCCGTTTTAATTTAAACTGATTTATTGAAGATTTCTG
+AATTACGGAAATAACTGTGCTTGTGTCCTATAAAAAGACGGGTAATTTAATTTGTGATGT
+TTTGTATAAAAGATATAGGTTTCGTTAAAGAGATGAAGCTGCAACCAGGAAACAGGTTGG
+TTGATTCGGTAAAGATATTTTTGGTAATTAAGAAAAAAGCCTGAGATAACGGATGAACCT
+GTGAAGGTTTACAACTTTCTAAAACCACCTTTGAAAATTTGGATTTGGAAACTGCCAGTA
+ACAAGCAAAAGGGTAATTACAGAAAATATCGTGCGAATGATAATTTTATTAATAAATAAT
+CAAAATGTGAAAGACAAAGGATATGATTTAAAAGGGGGGAATGAGTGCTATGGCATCTCC
+GAATGATGAAATTGTAAAAGGAATAGATGGAATATATTCAAACAAGAATCCAAACTCAAA
+TATTAAATATGTAATTAACGAATCAAGATTTAATGCTTCCCAATTATGTAAAACGAAGAA
+AGGCATAAAACAAATGTCGGATGAGTGGCTTCGTGAGAAACAAGGTAGAAGAATTTTGAA
+AGCAGTTAATGGTGATAGAAAACTCCAAAAGGACATAATACAAGCGTTAAAGAAAGGTAA
+GGTAGAGAAAGTTTTATCACGAGTTGGCAAGGATGGAAAAGTAACGACGTATAGGCTGAA
+CAGCAATGGTGAAATAATTGGATTTTGGCCATAAATAACAAATGAAAAGGAGATGATGGT
+ATGAGGGATCCGTTATGCAGTGAAAGTTATTTATTAGAAACAATAGAATTTGACAAGGAA
+GCAATTGATGAAAATAAAAAAGACATTGTTGAATTAAAAGATGATATGGAAAAGGGCATA
+CAAAGATATCCAAGAGATAATCAAAGCATAATTTATGCTACGTTTTTGCATATGTTTATG
+TATAACACGGAAACGCTTATAGCCAAATACTCTTTAGGTAGTCATCCGGATGAAATGATT
+GAAGATTATTTAAACGGTATAGAGTATTTGGAAAATGTCGGTGAAGAAAAAGTATGGTAT
+ATTGACCTTTTGTGGATGCTATCGTTAGGTATACTTTTAGAAGTAGATAAACAAGATTTA
+AAAAGGCTTGCTTGTGTGATAGAGAAGCAAAAAAAAAGAAGACGCACTGATGGATTTTCT
+TTTAAAGGCTTGTGATATAGGATGGAATCATAATACAAGTGAATATGAGAGAAAAAATCC
+ATATGCAAAGACGGCTGAAATTATACAAATGGCATTGCATGATAAAAACAGGGAAAAAGC
+TTCGAAAAGGCTACAACAATATATAGAGAAAGAGTGGATTAAGGGACATAATGATCTGGA
+CTTCAAAAATGCGCATAAAGAACCCGGCTACGTTGGCTTGTGGAGTTTTGAGGCTGCAGC
+ATTGGCAAAGATACTGGGATTGGACGACAGCGCACTGAAAGATAACAACCATTACTGCTG
+TTACCGGCAGAGGAGGTCGGCACTATGTCTTTAAATACCCTAGAGGCCGGAGTATTCCAA
+ATAAGACCAAGTTTGCACCGGGTTTTGATAACCATTCAACAGGTGGACTGATTGTCGTAG
+CTCCAAGCATTCATGTAAGCGATAATCAGTACCAATGGTTGAAAGGACATTCTTCCTTTG
+ACAAAACCCTGGCAGAAGCTCCGGAGTGGCTGTTAAAGCTCATGGAAAGGGAGGAAGTAT
+TGCTTACACCCTTTGAAGGTAGAAGTATTGTAGCAGGGATTAAGGAAGGCAGCCGAAACA
+GCACCCTGACAAGCCTTGCAGGAACCATGAGAGCAAGAGGAATGACGGAGGAAGGCATCT
+ATACGGCATTACTTGCAGAAAACAACGCAAGGTGCAATCCTCCGCTTGATGAAGCGGAAA
+TTAAGAAAATATATAGTTTAGGTTTTCAAAGAGTTAGTAGCTTGTAAAGAATTAATATAT
+ACGATATACGCACAAAGCCGCTTGATTTTTGCAAAGGAGCTTTGTACAGTCATAAAGTAT
+TTACGTATTGCCTGAACAATTCAGCTTTCAGGAGATAAGGAATATACATGTTGGATTTTT
+CTGGCTGTAGGTTATTGCAGCGGTGTCTGCAGTATTAATCACGTCAATAGTTGTTGCTAT
+GATTATAATATAAGAAAAAGGAGAAAAGAAGAGAAGGAAAACGAGCTGGCGGCCGCTTGA
+TTTGTAAAATAGGTACGTTCTACTTGCTTTTTCAGAATAGAAATAATATAATAATGCCAG
+GAAAAGGCAGAAAAGTTTCCTGGCATTATTATAAGGCAACCACGGATTGCAAGCATTGGG
+ATGATAATTTTGAGGTGATAAAATGGCAACTATAACGTTATATGCCGGAAAAATCAACCA
+AATGCCCGGATTGATAAATGAAGTCAAGAAATCTGTGGTGGATTACAAGTCAGAATTATC
+CGCATTGAGAAAGAAAACTTTGAACATCAACAGAAGTGTATGCAATTTGGATGAAGTAAT
+AAGTTCCATACAGGCATCTTCCCAGACTTAGGATAGAAAAATTGATTCACTTGAGAAATT
+CTGCAGTGAAAGTGAGAAGTTTATATCGGAAGTAATACGTATCGATGAAGAAGTTGCTGA
+GCTTATCAATAAACGGAAAGAAAATTTTTACAAAGAATATTATTATTTAAAACCGGAAAG
+CGAGAAAAGCGGCTGGGAAAAAATCAAGGACGGCTTAAAGGCGGTTGCGGAGTGGTGTAA
+AGAGAATTGGAAATCCATTGCCAAGATAGTGGCTGCCGCAGTAGTTATTACCGGGTTGGG
+GATAGCGGCGGCATTGACAGGCGGTATATTGGGAGTCATACTGGCAGGAGCATTCTGGGG
+AGCATTGGCCGGAGGATTGATAGGGGGAGCGGTTGGAGGAATAGCCGCTGCGATAAATGG
+AGGATCGTTTCTGGAAGGATTTGCGGACGGCGCTTTAAGCGGAGCAATTTCCGGAGCGGT
+GACAGGAGCGGCATGTGCCGGGCTTGGTGCTTTAGGAGCTCTAGCAGGGAAAAGCATCCA
+ATGTATGAGCACAGTGGGAAAAGCGATAAATGTTACGTCAAAGGTTACGGCAGCACTTTC
+TTTTGGTATGGATGGATTTGACATGCTGGCAATGGGAATATCATTGTTTGATCCATCCAA
+TGCATTGGTTGAATTCAACCGGAAGCTGCATTCCAATGCACTTTATAACGGATTCCAGAT
+TGCTGTAAACGCGCTGGCTGTTTTCAGTGCCGGGGCGGCATCGACAATGAAGTGCTTTGT
+TGCAGGTACAATGATATTGACTGTGGCAGGCTTGGTTGCGATAGAGAATATCAAGGCAGG
+GGACAAGGTAATTGCGACGAATCCGGAGACTTTTGAAGTAGCCGAGAAGACGGTGCTTGA
+GACATATGTGAGAGAAACAACGGAGCTTTTGCATTTGACAATCAATGGAGAGGTAATCAA
+GACAACCTTTGAGCATCCGTTTTATGTTAAAGATGTGGGTTTTGTTGAAGCGGGAAAACT
+GCAAGTAGGAGATAAGTTGGTTGATTCAAGAGGCAATCTTTTGGTGGTGGAAGAGAAAAA
+GCTTGAAATAACAGATAAGCCTGTAAAGGTTTACAATTTTAAGGTCGATAATTTTCATAC
+GTATCATGTTGGCGAAAATAGGGTATTGGTTCATAATGCGAATAAGTATGTTAAGGGAAC
+GAGTAGTACTCTAAAAAGTTTGGGAAACAAGACTGAACAATATGTTACAAAACGAGGCTG
+GACATGGGATTCTATGGACGATGTTGTTAAAAAAACATATACTACTCGTGAAGCTATTAA
+CAAAGCAACTGGTAATCCAGCAACTGCTTACTACAATAAAGCTGGCGATTATGTAGTTGT
+GGATAATGTTACCGGTGAATTAGTACAAGTTAGTAAATTTGGTGATACTGGATGGATTCC
+TGACGCGACAATTAAAAATCCATACAAACCATGAGAGGGTGTTATTGATGACTGATATTA
+TTAAGGAGAATTATTCAAAAAAGGCCGTTATCTATGATAATATATGGATGTATTTTATTA
+AAACGGCAAAAGAAGTAATATGTGATTGCCAAAAAAATCAGATTAGAATAATGGCGCTGG
+AGGCGTTTAAATTAACAGGAGAAGGGATACAACCATCTCAAGAACATAGCATATATTTTA
+ATGTCAACGAAGATTGCTGGAGCAGAGCTATTGAATTTTTATCAAAAATTAAGGATAATG
+ACTATTTATATGAAATTTGGTATGAAGGATATTAAATCAGGAGTTAATAATTGCATAGTC
+GCATATTTTTAAATGATGCGCCCTTCCCTCCGAATTGCGATAAAGTACAGTCTTAATACA
+ATACCCGGCAAGCCAATACAACGGCAAGTCGGGTTTTCTTTTTATCCATACTTGACAATA
+TGTAATACATTGTGATACAATTAAACCAACAAGAAATACAGGAGGTGCAATGATGTCTAC
+AGAAAAGGATAGTATGTTACGGGTAAGGCTTACACAAAGGCAGTCGGATGAATTGGATGC
+GATTATTGGTGAGCTTCAAGCACAAATGCCGGAGGCAAGTGTTACCACATCAAGCATAGC
+AAGATACGCTCTGGAGAAGTATGTGAGCGACCATATCGCCAAGCGTGACGGTACCAAGAT
+TTTCATTGAAATCAACACTGCTGATGCCACAGAAGAGGACATAAAGAATCTCTACGACCT
+TCTTTCCAAGTTGTTTGACGAAACAAAGGAGAATTACTCACCAATGGTTCATTACATGGT
+TGGAGAGATTTTAGAGCCTGTGATGATGAAGATGGCAAGCCTCATGAAGCCTAAGAAACC
+GGAGGTGAGGGATGGTGAGTAAGAAACAGTACACAGTCCGCTGCCCCCATTGCAATCACA
+GAGTATTTGATGCCGATTATGCTGATGTTGAAATCAAATGCCCAGTATGCAGAATGGTTT
+TTGAAGTAAAGCTGGAGAAAAAGGCGGGGTGAAAAGTGAATAAATCTGGCACAGAGCCAC
+AAAGGGAGCACAAGACTCACCTATAGAGCCTGGCAGATAGTCTAAAAAACTATTTGTCAG
+GCTCTTTAAATTTTCTAGCACGACAGGAGGTGAGAAGTTTGGAAATGACAATGATGGACG
+CGGCATTAAAATACGCAGAAGCCAATATCCCAGTTATACCTCTGCACTGGATTTGTGAGG
+ATGGCTCCTGCTCCTGCAAGGCAGGGAGCGATTGCGACAGCAAGGGAAAGCATCCGTTAT
+ATACCGGCTGGTACAAGAACTCCACTACTGATGTTGAGCAAATAAAGAAATGGTGGACGA
+AAACCCCCAATGCCAATATCGGAATTCCTACAGGTGAGAAATCCGACTGGCTGGTGCTTG
+ATGTGGACGATGGTGGTGATGAAACCCTATCTGCACTTGAGGCAACACATGGAAAACTTC
+CGGATACGGTTACTGCTGTTACAGGAAGTGGAGGTCGGCACTATGTATTTATATACCCTA
+AAGGCCGGAGTATTCCTAATAAGACCAAGTTTGCACCGGGTCTTGATATGCGTTCAACAG
+GTGGATTGATTGCCGTAGCTCCAAGCATTCATATAAGCGGTAATCGGTATGAATGGTTAG
+AAGGACATTCTCCCTTTGAGAGAATCCCGGCAGAAGCTCCAGCATGGTTGTTGAAGCTCA
+TGGAAAGGGTGGAAGTATTGCTTACACCCTTTGAAGGTAGCAGTATTATTGCCGAGATTA
+AGGAAGGAAACCGCAACAGTACCCTGACAAGCCTTGCCGGAACCATGAGGGCAAGAGGAA
+TGACAGAAGAGAGCATCTATGCGGCATTGCTTGCAGAAAACAACGCAAGGTGCAATCCTC
+CGCTTGATGAAGCGGAAGTTAGAAAGATAGCGCACAGTGTCAGCCGATACCAGCCAAATC
+CTCCGATGAAGAAGCATTACCACAGGACAGACAGCGGGAATGCAGAAAGGCTGCGTGACA
+GGTTTGGTGAAATCATTAGGTATTGTCCGGCTTTCAAATACTGGTTGGTATATGACGGCT
+GTTGCTGGAGGAAAGAAACCGGAGAACTTATGCAGTTTGCTATAAAAACAGCAAGAGACA
+TGCTCGCAGAAGCAAGCCGGATAGAGGATGAGGCTGCAAGAAAAGAACTGGTGCGCCATG
+CCATGCAGTCTGAAAACGCAGGCAGGCTTAAAGCCATGATCGATGTGGCTTCAAACCTTG
+AAGGAATGGTAATTATGCCGGATGAGATTGATTCTGATATATGGAAGCTGAACTGTAGAA
+ATGGTGTGGTAGACCTAAAGACAGGCGAACTCCTTCCTCATAAGCGGGAGTACTATATGA
+GCAAAATCTGCCCTGTTGAATATAAACCAAGCAGCAAGGCTCCCAAATGGATGGAATTTC
+TGAATACCATTACGGGAGGAAGCAAGGAGCTTGTAAGATACCTTCAAAAAGCTGTAGGCT
+CGTCATTAAGCGGGGATATTTCAGAGCAGGCCCTATTCGTCCTTTATGGAACAGGAGCAA
+ACGGAAAGAGCACATTTCTAAACACCATCTCTGACCTGTTGGGAGACTATGCAAGAAATA
+CTCCGTCCGAAACTTTTATGGCTAAAAGAATAGAAGCGATAGGAAATGATATCGCAAGGC
+TTCAGGGAGCAAGGCTCGTTACTGCCATAGAAATAAATGAGGGACAAAGGCTCTCTGAGG
+CATTGATTAAGAGCTTTACAGGCGGAGACAGAATTACAGCAAGGTTTCTTTATGGAGAAT
+ACTTTGATTTCCAGCCACAGTTCACCCCGTTTCTCGTAGTAAACCACAGACCAGTCATAA
+GAGATACCAGCCACAGCATTTGGAGGCGCATTAAGCTGATTCCTTTCACCGTTACCATAC
+CCGAGGATAAAAAGGATAAGCAGCTACCGGCAAAGCTGAGAGAAGAGCTGCCTGGCATAT
+TGTCATGGGCAGTAGAGGGTTGCCTTCTTTGGCAGAAGGAAGGACTAAATATGCCTGATG
+AAGTCAAAAAAGCCACAGAAGGTTACCGGGAGGAAATGGATACCTTCTCAAGTTTTATAG
+AGGAATGCTGCATTGTGGAGGAGGGCAGGAAAGTCTCCAATAGAAGCATCAGGTACGCTT
+ACGAAACATGGTGCCGGGAAAATGGAGACTACCCTCTTGGACAAAAGCTATTCAATGCAA
+AAATGACGGAGCGCGGCTTTGCTGTCAAACGCAGCGGAGCCAATGGCAGCAGGGACTGGC
+ATGGTATTGGTCTTGCGGATGAGGGGATACTTTTGTGATTACTGACGACTGACGGCTTCT
+GACGTCAATTCCGTAAATTTTTATATATATTTTTTCTTATGTGAAATTTATGAAAAAAGA
+GTCAGTAAGAGTCAGTACGTCAGTAAAATCTCAGTACCTTGATGCAGAGGGGAGGGGAGG
+TCAAATCTCTACAGTAAAGCATAAGGGCAACGGGCTGGCAGCACCGCGTAAAAAAATGCA
+GATTCAAACGGGGTATTAACCCCAGACCATATTAACAAAAAAACAATTATGAAAATGGAG
+GATTTAAGCATGAGATTTATAGCAGATTTAGTACATGAGAAAAAGCAATTGGTGGAGAAA
+GCAGAAGCTATTTTAAACGAAGCGGAAAAAGCAGGTGGAAGTTTGACTAAGGAACAGGAG
+CAACAGTTTAACCGCTACAAAGACAGAATAACACGCATCAATGATAGCATTGATGAAGAA
+TTATCAAAAATCAGAACCTCTGAGCCAATATTGAATATGCCGCACAATCCCATGGCTCGT
+GAAGATGTGTCAAAAATTCCGGTAACAAAGGCTATATCAAAATCATTCAGAGGGATGTTC
+TATGGAAACGAAACTGTGAGCTTAAGCAACAATGGTTTTCATTCCATGGATGAATTCCTG
+AGAACACTTCACTCAGGCAGAGCCGACAACAGGCTAATAAATGCCAGTATGGTGGAAGGA
+ATACCCGAATTCGGCGGATATTCCGTACCGGAGGAATACGGAGCCTTCCTGATGGATAAA
+TCCCTGGAGAATGAGATCATTCGTCCCAGAGCAACAGTATGGGCAATGGGAAGTGAAACA
+AAGAAAGTATCAGCCTTTGATGGAGCAGACAGAACCAATCACCTATTCGGCGGTATCTCA
+GGAGAATGGCTGGAGGAAGGACAGACAGGCACACGAAAAACAGCCAAGTTAAGGCTGATT
+CAACTGAAAGCCAAGAAGCTGGCCTGCTTCTCACAGGCATCCAATGAACTTATTGCAGAT
+GGTATGTCCTTTGAGGAAATGTTAGCTGGAGCGCTTATTAAAGGCTTGGGCTGGTACATG
+GACTATGCCTTTATCAATGGAACCGGTGAAGGCCAGCCTCTTGGTATTATAAATGACCCG
+GCACTGATTACTGTAAATAAAGAGGCTTCTCAAGAACCAGCCACAATTACCTATCAAAAC
+GTGGTCAATATGTTCTCAAGGCTTGCTCCGTCATGTTTTACCAATGCGGTATGGCTTGCC
+AATCCATCGGTAATACCACAATTGCTCACCATGACCATTACCATTGGTACCGGTGGCGCT
+CAGATACCGGTATTCAGGGAAGAGAGCGGGAAATTCACACTTCTGGGTAAGGAGGTCTTA
+TTCACTGAGAAATGCCCCACATTGGGTGCTAAGGGAGATTTAATCCTTGCAGATCTTTCC
+CAGTATGCCATAGGCATGAGGAAAGAGATCGCTCTTGACCGCTCCAATGTCCCAGGCTGG
+ATGGAGGATATGACCGACTACAGGGTGATAGTGCGTGTAGATGGTCAGGGAACCTGGGAT
+AAACCTATAACACCGAAAAACGGAGCAACGCTCTCATGGGCAGTGGCTTTGGAAGCGAGA
+TGATTTGCTCAGATTTGAGCCAAGTCTGAGCCTAAGCAATACTTAGGGTAAAACCGCTCA
+AAAATGAGAAAATAGGAAGCTCTGCTCCTGCTTAACAGACTATTTAACAGTGGGTAGTTC
+TCCTACCCACTGGAATGCTTCGAACCCTCAAAAGCTTATAAATATTGCATTTAGAAGCAG
+AATTGACTTGCTATATCAGCGTTTCAGAGTGATGAATGTTAGTGCGGAATAAAGGCTTTA
+ACCGTAGGAAGGGGTGAAAGTGTGAGAGCAAAGATTACCACAACCATAGAGGAAGCCTTA
+TTGAACAAAGCCAAGGCACTTGCTAAACAAGAGGGTTTGTCTGGTGCCAATGCCATTATT
+GAAAGGGCTCTGGAGTTGTATTTTACCAGTATTCAATGTGAAGTGTGGGAAAAATCGTTG
+TCCAGCGGCTGGATAAAGAAGCTGGTTCTCAAAAGGGATTCTATTCTGTACGAAAACATC
+AAGTGCAGAAAAACCATGGAGAACTGCAGGCCGGATGATTACACACCTGAAAGCCTAAAA
+GCAAAAGGCTGGAAGAAGGTTTAGCAGCCGGGGAAAAGGCCTCTGTATTGCTCCTTGAAA
+CGTAAAAGCATAGGTTGCAGCCGTAAGCTTTGTTGAAACAGAAAGGGCAAATAAAGAGGA
+ATTTGAAAGGCTACTGCAGTTATCAATACAGAAATTTATTTGGTCAGTAGCATTAAGAAG
+TTTATGTCCAAGCGAAGCAGTAAAAGAACACTAAGAAATTTGAACTAAGGCTCGTGATGC
+CTGAAATCACGTAATTTGTCACACCAGGAATAGATAGGTTGGCGTTCCCTTGCGAGGTCA
+AAGAACTAAGGTTCTTAGACTAACGCTCTTAAATTGAGGTTGCCGGTATGAGTGGTGGAG
+ACATTGGAAAAGGAAAGGATAGATATTTATCATAAACGAAACACCTGCTTTGTTGGAATT
+GATATGCACAAGGACGCACATTGTGCAGTTGTAATTGATTGTTGGATGAATAAACTGGGT
+GAGGTTAACTTTGAAAACAGGCCATCCAGATTCCCTGCATTCGTTGAGGATGTAAGGAAG
+ATTTGCGGGATAAAGGAAATTGTATTCGGACTTGAAGATACCAGAGGCTTTGGCAGAAAC
+CTTGCTGCCTATCTGGTGGGCAGGAAGTTTGAAGTAAAGCACGTAAACCCTGCATATACA
+AGCGCTGTAAGGCTTGCAAACCCCATTATTTACAAGGATGACTCCTATGATGCCTATTGT
+GTGGCAAGGGTGCTCAGGGATATGGTGGACACTCTGCAGGATGCCAAGCATGAGGATATA
+TTCTGGACAATACGGCAAATGGTGAAAAGACGGGATTTGATTGTAAAAAGTAATGTGATG
+AACAAGAACCAGCTCCACAGCCAGCTTGCTTATAGCTACCCATCCTACAGGAAATTCTTT
+GCCATGATTGATTCCAAGAGTGCCTTATGCTTCTGGGAGAACTACCCGTCACCGGAGTAT
+ATATGGAAAACAACACCAGAAGAAATATATCAGACGATAAAGCCTGTGCATCAGGCGCTT
+AAAATACAGCGCATCCATGAGATTATATCCATGATTGAAAGGGATGGAGACACAAGAAAG
+GACTATCAGCCCGAAAGGGATTTTATTGTGAGAAACATCGTGAAGGATATCAGACACAAC
+AAGGAGTTGATTGCCGAAATTGACGATGAACTAAGAAAGCTGATACCTTTGACAGGCTAT
+AAGCTACATACAATGCCGGGAATCGACCTTGTTACAGAAGCACAGATAATATCTGAAATC
+GGAGATATTAACCGTTTCCCTGACTCAGACAAGCTGGCTCGGTTTATGGGCTTGGCACCG
+GTGCAATTCAGCTCTGCCGGAAAGGGTAAAGACCAAAGATGCAGGAATGGCAACAGGGCA
+CTAAATGCGATATTTCACTTTCTTGCAATCCAGATGGTAGCAGTATCGGCCTCAGGAAAG
+CCAAGACACCCGGTATTCAGGGAGTATTTTGAGCAGAAGGTCAAAGAGGGCAAGAACAAG
+CCACAGGCGCTTGTATGCGTGGCAAGGCGGCTTGTGAGGATAATCTACGGTATGATGAAA
+ACCAAGACTGAATACAGGCCATATGAGAAGACTGACGACAAGAACTGATTTCATATTCTG
+GAAGCAAAGCAATGGAAGATAATTCTTTTTTTCGTTGAGATATGGTAACAGGAATTATAT
+AATAGATATAGTCCTTGTAGTGAGGGAACGCGTAAGACTACACCGAAGACAACACTAGAC
+TATTTAAAAGACATTGAAGTAAAAAATGGAAACTACTATGCTTCAAAAGCAACTATTGAT
+GAAATTGGGAAAATTGAAGCAAAAGGCGTGGACTTTTCAAAGCTAGATAGTAAAGTAATG
+TCATTAAGAGCATCAACTGAAGGGGGAATGTCAAGAGTAATAAAATACTCGGATGGCAAT
+GGCATAAAGTTTATAATACATGAAGTAACTGATGCAAAAGGGAATATAATTCATAGAGAT
+TTTGATGCTGTAAGAATTGAATCTGGTCAGTTAATCAACAAAAAGTAGGGAGTGAGTTTA
+GTGACTAAAAGTGATATTGAAAAAGTATTGAGTGATATAGTTAATAATTTCTTAGAGAAA
+AAAATTGATGCTGACGAAACTATTGAGCAACTCATTACAAGAATTGATCCTTTAGAAGTC
+TATAAGTTAGACAATGAGCTTTTAATAACAGACTGTTATTTTGCAATCAAACATTTGACG
+GAAAATGGTTATGAGACAACTATAAGAGAGCTCCAATATTTTAGAGAGTGTTTTGCAGGG
+CAACGGCTTTATGACATCAATGAGAAAAATAAGTTTATTTTGGATTAATAGTTAATATAC
+TATGCAGGTCACACAGTTTCGGCTGGTGTGGCCTTTTTATTGTCCATGCTTGACATATCG
+TAATACAATGTGATACAATAAAATCAACAAGAAATACAGGAGGTGCAATAATGTCTACAG
+AAAAGGATAGTATGTTACGGGTAAGGCTTACACAAAGGCAGTCGGATGAATTGGACGCTA
+TCATCGATGAACTTTAAGCGCAAATGCCGGAAGCAAGCGTTACCACATCAAGCATAGCAA
+GATACGCTCTGGAGAAGTATGTAAGCGACCATATCGCCAAGCGTGATGGAACAAAAATTT
+TAATTGAAATCAACACCGCAGATGCCACAGAAGAGGACATAAAGAATCTCTACGACCTTC
+TTTCCAAGCTGTTTGACGAAACAAAAGAGAATTACTCACCAATGGTTCATTACATGGTTG
+GAGAGATATTAGAGCCTGTGATGATGAAGATGGCAAGCCTCATGAAACCAAAGAAGCCGG
+GTGTGAAGGCAGGTGAGTAAGAAAAAGTATATTGTACGCTGCCCTCATTGCAATCATGGA
+ATGTTTGATGCCGATTATGCTGATGTTGAAATCAAATGCCCGGTATGCAGAAAGGTTTTT
+GAAGTAAAGCTGGAGAAAAAGGCGGGGTAAAAAGTGAATAAATCTGGCCCAGAGCCACAA
+AGGGAGCGAATGACTCACCTATAGAGCCTGGCAGATAGTCTTAAAAACTATTTGTCAGGC
+TCTATTTATGTTCTCGGAGGAGGTGGAAATTTGAAAGTGACAATGATGGACGCGGCATTA
+AAATATGCAGAAGCCAATATCCCGGTTATACCTCTGCACTGGATTTGTGAGGGTGGCTTA
+TGCTCCTGCAAGGCAGGGAAAAATTGCGACAGCAAGGGAAAGCATCCGTTATATACCGGC
+TGGTACAATAATTCCACTACTGATGTTGAGCAAATAAAGAAATGGTGGACGAAAACACCC
+AATGCCAATATAGGCATTCCTACAGGTGCGAAATCCGGCTGGCTGGTGCTTGATGTGGAC
+GATGGCGGTGATGAAACTCTATCGGCTCTTGAAGCAACACATGGAAAACTTCCTGATACG
+GTTACCGCTGTTACCGGAGGTGGCGGTCTGCACTATATCTTCAAATACTCACAAGGCAGG
+AGTATTCCAAATAAGACCAAGTTTGCACCGGGTTTTGATAACCATTCAACAGGTGGACTG
+ATTGTCGTAGCTCCAAGCATTCATGTAAGCGATAATCAGTACCAATGGTTGAAAGGACAT
+TCTTCCTTTGACAAAACCCTGGCAGAAGCTCCGGAGTGGCTGTTAAAGCTCATGGAAAGG
+GAGGAAGTATTGCTTACACCCTTTGAAGGTAGAAGTATTGTAGCAGGGATTAAGGAAGGC
+AGCCGAAACAGCACCCTGACAAGCCTTGCAGGAACCATGAGAGCAAGAGGAATGACGGAG
+GAAGGCATCTATACGGCATTACTTGCAGAAAACAACGCAAGGTGCAATCCTCCGCTTGAT
+GAAGCGGAAATTAAGAAAATATATAGTTTAGGTTTTCAAAGAGTTAGTAGCTTGTAAAGA
+ATTAATATATACGATATACGCACAAAGCCGCTTGATTTTTGCAAAGGAGCTTTGTACAGT
+CATAAAGTATTTACGTATTGCCTGAACAATTCAGCTTTCAGGAGATAAGGAATATACATG
+TTGGATTTTTCTGGCTGTGGGTTATTGCAGCGGTGTCTGCAGTATTAATCACGTCAATAG
+TTGTTGCTATGATTATAATATAAGAAAAAGGAGAAAAGAAGAGAAGGAAAACGAGCTGGC
+GGCCGCTTGATTTGTAAAATAGGTACGTTCTACTTGCTTTTTCAGAATAGAAATAATATA
+ATAATGCTAGGAAAAGGCAGAAAAGTTTCCTGGCATTATTATAAGGCAACCACGGATTGC
+AAGCATTGGGATGATAATTTTGAGGTGATAAAATGGCAACTATAACGTTATATGCCGGAA
+AAATCAACCAAATGCCCGGATTGATAAATGAAGTCAAGAAATCTGTGGTGGATTACAAGT
+CAGAATTATCCGCATTGAGAAAGAAAACTTTGAACATCAACAGAAGTGTATGTAATTTGG
+ATGAAGTAATAAGTTCCATACAGGCATCTTCCCAGACTCAGGATAGAAAAATTGATTCAC
+TTGAGAAATTCTGCAGTGAAAGCGAGAAGTTTATATCGGAAGTAGTACGTATCGATGAAG
+AAGTGGCTGAGCTTATCAATAAACGGAAAGAAAATTTTTACAAAGAATATTATTATTTAA
+AACCGGAAAGCGAGAAAAGCGGCTGGGAAAAAATCAAGGACGGCTTAAAGTCGGTTGCGG
+AGTGGTGTAAAGAGAATTGGAAATCCATTGCCAAGATAGTGGCTGCCGCAGTAGTTATTA
+CCGGGTTGGGGATAGCGGCGGCATTGACAGGCGGTATATTGGGAGTCATACTGGCAGGAG
+CATTCTGGGGAGCATTGGCCGGAGGATTGATAGGGGGAGCGGTTGGAGGAATAGCCGCTG
+CGATAAATGGAGGATCGTTTCTGGAAGGATTTGCGGACGGCGCTTTAAGCGGAGCAATTT
+CCGGAGCGGTGACAGGAGCGGCATGTGCCGGGCTTGGTGCTTTAGGAGCTCTAGCAGGGA
+AAAGCATCCAATGTATGAGCACAGTGGGAAAAGCGATAAATGTTACATCAAAGGTTACGG
+CAACACTTTCTTTTGGTATGGATGGATTTGACATGCTGGCAATGGGAATATCATTGTTTG
+ATCCATCCAATGCATTGGTTGAATTTAACCGGAAGCTGCATTCCAATGCACTTTATAACG
+GATTCCAGATTGCTGTAAACGCGCTGGCTGTTTTCACTGCCGGGGCGGCATCGACAATGA
+AGTGCTTTGTTGCAGGTACAATGATATTGACTGTGGCAGGCTTGGTTGCGATAGAGAATA
+TCAAGGCAGGGGACAAGGTAATTGCGACGAATCCTGAAACTTTTGAAGTAGCGGAAAAGA
+CGGTGCTTGAGACATATGTGAGAGAGACAACGGAGCTTTTGCATTTGACAATCAATGGAG
+AGGTAATCAAGACAACCTTTGAGCATCCGTTTTATGTAAAAGATGTGGGTTTTGTTGAAG
+CGGGAAAACTGCAAGTAGGAGATAAGTTGGTTGATTCAAAAGGCAATCTTTTGGTGGTGG
+AAGAGAAAAAGCTTGAGATAACAGATGAACCTGTTAAGGTTTATAACTTCAAAGTGGATG
+ATTTTCATACTTATCATGTTGGGAAAAAAGGGATATTGGTACATAATGCAGACTATAACC
+CCAAAATGGGATTTGATGATTTGGACCTTGAGAAAGCTACGAACAAACAAAAAGGCAATT
+ATGGAGAGTATCTGGCAGATGATAATCTTATTAATAATCCAAAATTGAAAGAAGCAGGGT
+ATGATTTGGAGCGGATAGGAGGTAAGGTTCCGACCTCACCGGATGATAAAATTACAAAAG
+GGATAGACGGTATATATATAAACAAGAATCCTAATTCAAATATTAAATATGTGATTGATG
+AAGCCAAATTTGGAAAAGCAGGACTGAGTGCAAAGACAAGAGATGGAAAACAAATGTCAG
+ATTCTTGGTTAGTGGGTTCTCGCTCAAGAAATAATAGAATTTTAAAAGCAGTAAGTAATA
+ATGAAGATTTAGCATTTGACATAGTGAAAGCATTAAGAAATAACCAAGTAGAAAGAGTAT
+TATCAAAGATAGATGTAAATGGAAAAATAATAACATATAGACTGGATAGCAATGGTAATA
+TAATTGGACTTTGGCCTTAGATGATTGAAAAGGAGGTAACTATATGAGAGATCCGTTATG
+TGATAAAAATTATTTATTAAAAACAATAGAACTTAGAAAGAAATATATTTGTGAAATGAA
+AGGAGAAATTGTTCAATTAAAATCTGATATAGAAAAGGGGATTCAGAGATATCCTAGAGA
+TAATCAAAGTATAATTTTTGCTAGATTTGCAATAATGTTTATGTATGGTATGGACATGCT
+TTTAGCAAAATATTCCTTGGGCAATCACCCTGATACAATGATAGATGACTATTTAGACAA
+CATAACATATTTAGAGAATTGCGGTGAAGAAGAGGCCGGCTACATTAACCTTTTATGGAT
+GGTTGGACTGGGTATCCTTTTGGAAATGGATAAAGAAGTGTTAAAAAGACTGGCAAGAGT
+TATAGAAAGGCAAAGAATAGAAGACGCACTTATGGATTTTCTATTGAAATCCTGTGATAT
+AGGTTGGAATCACAGTACAACGAAATATGAAAAAAAGAACCCGTATGAAAAGACAGCAGA
+GATTATAAAAATAGCATTACACGACAAAGACAAGGAAGCGGCATCAAAAAGGCTTGAAAA
+ATACATGGGAAAAGAATGGTTCAAGGGACATTACGACTTTGGGTGGAGGAATGCCCATAA
+GGAACCTGGCTATTATGGTTTTTGGAGTTTTGATACAGCGGCACTGGCCAAGATACTGGG
+ACTGGATGACAGTGCGTTAAAAGACAACAACCATTATCCTTATGATTTGGCACACTATAA
+AAATGGAATGACCTTTGATTTGAGTTGGTATAGTGTACCAAAGGAAGAGGAAGATAAGGA
+AGAAGAAACGGTGGTATATGGTATACCGGGTAATCCTGAGTTGGAGAGAATAATACCTGG
+GAGATTCCACAGTTTTGTAAATGAGATAATAAATGATTATAAAACACTGCCGGACGAAGA
+ATTTTGGAAGAAATACAATTTGAAAGAAATCTGGTTTGATGTGGAGGAGTATAAGGAGGA
+TAATAAAGATAAGAATTTGCTAGGAACGATTATAGTATTCATGCTTGTGGACAAAGATTA
+TATTTTGCAGTTGGATTATAAAGAAGAGTTAATAGACTATATAGAGAATATACATAATTA
+CTGGGCCAAGAAAGAAGTTAAGCTTATAAGCTTTGAATTAGACAATGACCAGCAGTACTA
+TGCATATGTGCCGAAGGATGCGGAGGTTGGTTCGTTGTATGAGGTAAAACTGACAGAAGT
+GGAGAAAATAGAGGAGGTTTAGTGTTTATTGTGTAATAGTGTGAAGAAGATGAGTTGTTT
+ATGAAGAATCTGCTGTATAATTGGATATATATAGTTTGATTTTGGGAATCTCCTTCCTGG
+CGAAACAAAAACTATAGGACAGTATTTGGGAAGGAGTATTTTTTGTGTTATTTTTTTTGG
+GGAAGATAATATTGTATTGAGAATAATAAGAAGTTTTATTAGGATTGTTTATGGTTGTCA
+ATGTTAATATAATCAATGTTAATATAATCAATGTTAAAAGGTATAGGAACAGAACTATAG
+CAGGGGAGAGTCAAAATGTACATTTGGCAGTGAAAGATAAGCTGAAAAAAGAGGGGCGTT
+CATTTGAATTAATTCCTGAAGATCTTGATGTTTATAAAGAAGCATTGGATTTATGGTTGA
+GTCCAAATTTGGAAGAGGTTAAAAGCGTGATTGATAAAATGATATTGTATCATTCCGTAT
+TAGTTTCGGACATTGATAACGAACCGGAATTTGGTGATTACACGTATGGATTTTATCCAT
+ATGAGATATTGTTTTTAATGCATATAAGGAGGAAATTAGGTTTGCCGGTACCGGATAAAT
+TTGAAGACTTGCTGATGAACACACCGGAAGCGAAGGTGGTGATTAATGAGCCGGAGCCAT
+ATCCGGAGTGGGATCCTTTGTTGAGAGCCATAGATGAGTTTTACCGAAAGAATTATCCAA
+ATTACATTCCCAACAAGCATGGAAAACTGTTTGAATAGGAGGAAACTGTTATGGCAATGG
+AAGATATAGTTGGGATTATATTTGAAGACATTGAGGAAGTGAAACCAATTTTAAGTGATT
+CGGAAGGAAATGATTTGGAAGGAAATGATTTGAGTGAGGCGATATTGGAATACGGGATAT
+CGGAAGGGAAGTTTCTGTGTGTTGATTATGGTGGAGAAGAGGGGAGCGAGATAATAAATT
+ATATAATGGATTATGAATTCAGTCATGGAATAGAGCTTGCAACACAGGAGGAGTTGGAAG
+AGCTGGACGAGATGGAGTATGATGATTTGACAGATAAGATAAAAGAAGTGAACAAGATAT
+TGGAGAAAGCAGGGTATGGACTGTTTTGCTTTCCAACAGGAAGTGATTTTTATGAGTTGT
+TTATAGCGAAGTTGGAGGATAAAGAGAAGTTATTGGAGGAAAAGATAGTTGATGATGAGG
+AGTTGCCATTGGAAGAGAGGTATATTCAGTATTATGTGTAAGGGGATAATCTGCAGTATT
+TAGAGTTTTGGATAAGAATATGGCTTTTATAAAAATATTGGCAGTGTAAATATTTTTGTG
+TAAACTAATTTTCCTTCTATGTTAGTGTTTAAATATATTTTAAGACTCGAAAGTCTGCTT
+TGTCAAATTTTATAGATTCAAAAGAATTTCTGATAAGAAATTCTTACAAAAGAAAAATTT
+GACAAAGATGATGCGTATAAAATATTACAGAGGGGTTCAGGAAACCAGAGTTTCCCTGAA
+CCCCTTGATTATACTATATACGCCCTTCGAACATAATCTGTAGCTGTCCCAGTATCAACC
+TCCAGTTTTTGTAACGCATCGTCCATTTTGAAGTAATCTTCACTGTAGCTAAATATATGC
+TCTTTAAAAGTGACTGGTCGCCAGGAAATACTGTCCTTGATTTGTTTATCCTTCTATAAC
+TGCTATTCAGGCTCTCAATAGTATTGGTCGTATACATGATTTTACGTAGTTCCTCCGAAT
+ACTTAAAAAATGGACAAATAACATCCCAATTGCTCTTCCAGCTCTTCATAGCTGCCGGGT
+ATTTCTTCTCCCATTTCTCTGAAACCTCAAGCATCTGGTCGTACCCTGCCTTCTCATTCG
+GAGCCGTATATATCCGTTTCAAGTCCCTGGCAAATTCCTTTCGGTCTTTATCTGACACAT
+ACTTTAGCGTGTTTCTTATCTGGTGTACTATACACCTCTGATATTCAGTATTCGGAAAAG
+CCGCATTGATTGCATCCTTTATCCCTGAAAGTGCATCAGCACAGAGAATCAGGATGTCTT
+TAACTCCTCTGTTTTTAAGGTCATTTAAGACACTCAGCCAGAATTTTGAGCTCTCATTTT
+CTCCTACATAAATACCGATAACATCTTTCTGCCCTTCTATATCAATCGCCAGCACAATAT
+ATACGGCCTTCTTCCCAACAATGCCGTCATTTTTTACTGAAAAATGAATTGCGTCAATAA
+ATACTATCGGATAAACCTCTCCCAGAGGCCTTTTCTGCCACTCTTCTATCTCAGGTAGTA
+TTTTATCAGTGATCTTACTTACCATCTCGGCAGATACTTCAAATCCGTAGATTTCCTGTA
+TCTGCTCGTTGATTTCTCTGGTAGACATCCCCCGCGCATACATTGCTATTATTTTATTTT
+CAATTTCTGAAATGTCCCTTTTATACCTGGGAACAATTTTCGGCTCGAATTCTGCATTCC
+GGTCCCGCGGGATATCTATTTCCACTTGCCCTACACTTGACTTTAATGTTTTTGATGTGT
+ACCCGTTACGGTAATTTGATTTCGCTTCTTCAGTTGATTCGTACTTTTCATATCCGAGAT
+GTTCATCCAGCTCTGCTTCCAACATATTTTGTATCGTATCTCCGAGCAGATCCTTCAATG
+CTTCCTGCAAATTCTTTGCTCAAGTGATGTTGTACTCAGAAATGAGATTTCTGATAAGCT
+CTTTCTTTTCTGGTGTTATTATTCTTTTTCTTGCCATAAAAAACTCCTCCTATACTTTAG
+TATTCTATCATAGAAGGAGTCAATTAGTTTACATAAATATTTTACAGTCTCTTAGCTTGT
+AAAGAATTATAATATAATATATATGTACAAAGTCGCTTAATTTTTGCAAAAGATCTTTGT
+ATAATCATAAAGTATTTAGATATTGCCTGCACAATTTCAGCTATAGATTCAAACAAGTTG
+TTATGCGTTACATTCATTCGGATGTCTTTCAAAAGGTGATCGATTGAATTCAACTCGGAG
+CTATAAGGAGGCAAATACTTAAGGGTAATGTTCTTTATTGAATCCAATGGGAGTATAAAT
+AATTTCATGTATTAAAAATTTTTCAGTTCTTCCTGGCAAGAAATTTTAAGTTTTCAAAGT
+TTACAGAATGTAAATCCTAAATCACTTCAATATTATATATTATTGCCGGTTTTGCTAAGT
+TTTACACATAAATTTGATTTAATTCGTCTATAATTATTTATAATGGAGTGTTTTGCCCTT
+TTTCGCTCAATTATCAACGAATTGGTTGACGAAAACCGGTGCAAGGTATATGATAGCGGC
+AGGGAAATAGATTTCAAATATTACAGTGATAACAATACATTAACTTTTACCCTCGGAAAG
+GGTTGGCACAACGTTGGAATTGTCCTTGTGGATATGGCGGGAAATGTAAACAATATTCAG
+GAGATAAGGAATATACATGTTGGATTTTTCTGGCTGTGGGTTATTGCAGCGGTGTCTGCA
+GTATTAATTGCGGCAATAGTTGCTGCTGTGATTCATAATATAAGAAAAAGGAGAAAAGAA
+GAGGAGGAAAACGAGCTGGCGGCGGCTTGATTTGTAAAATAGGTACGTTCTACTTGCTTT
+TTCAGAATAGAAATAATATAATAATGCCAGGAAAAGGCAGAAAAGTTTCCTGGCATTATT
+ATAATGCAACCACGGATTGCAAGCATTGGGATGATAATTTTGAGTTAATAAAATGGCAAC
+TATAACGTTATATGCCGGGAAAATCAACCAAATACCCGGATTGATAAATGAAGTCAAGAA
+ATCTGTGGTGGATTACAAGTCAGAATTATCCGCATTGAGAAAGAAAACTTTGAACATCAA
+CAGAAGTGTATGCAATTTGGATGAAGTAATAAGTTCCATACAGGCATCTTCCCAGACTCA
+GGATAGAAAAATTGATTCACTTGAGAAATTCTGCAGTGAAAGCGAGAAGTTTATATCGGA
+AGTAATACGTATCGATGAAGAAGTTGCTGAGCTTATCAATAAACGGAAAGAAAATTTTTA
+CAAAGAATATTATTATTTAAAACCGGAAAGCGAGAAAAGCGGCTGGGAAAAAATCAAGGA
+CGGCTTAAAGGCGGTTGCGGAGTGGTGTAAAGAGAATTGGAAATCCATTGCCAAGATAGT
+GGCTGCCGCAGTAGTTATTACCGGGTTAGGGATAGCGGCGGCATTGACAGGCGGTATATT
+GGGAGTCATACTGGCAGGAGCATTCTGGGGAGCATTGGCCGGAGGATTGATAGGGGGGAG
+CGGTTGGAGGAATAGCCGCTGCGATAAATGGAGGATCGTTTCTGGAAGGATTTGCGGACG
+GCGCTTTAAGCGGAGCAATTTCCGGAGCGGTGACAGGAGCGGCATGTGCCGGGCTTGGTG
+CTTTAGGAGCTCTAGCAGGGAAAAGCATCCAATGTATGAGCACAGTGGGAAAAGCGATAA
+ATGTTACGTCAAAGGTTACGGCAGCACTTTCTTTTGGTATGGATGGATTTGACATGCTGG
+CAATGGGAATATCATTGTTTGATCCATCCAATGCATTGGTTGAATTTAACCGGAAGCTGC
+ATTCCAATGCACTTTATAACGGATTCCAGATTGCTGTAAACGCGCTGGCTGTTTTCAGTG
+CCGGGGCGGCATCGACAATGAAGTGCTTTGTTGCAGGTACAATGATATTGACTGTGGCAG
+GCTTGGTTGCGATAGAGAATATCAAGGCAGGGGACAAGGTAATTGCGACGAATCCGGAGA
+CTTTTGAAGTAGCCGAGAAGACGGTGCTTGAGACATATGTGAGAGAGACAACGGAGCTTT
+TACATTTGACAATCAATGGAGATGTAATCAAGACAACCTTTGAACATCTGTTTTATGCAA
+AAGATGTAGGTTTTGTTGAAGCTAAAGAATTGCAAGTAGGAGATAAGCTGCTAGATTCAA
+AAGGCAATGTTTTGGTGGTGGAAGACAAAAAAATTAAAATTACAGATGAACCTGTCAAAG
+TTTACAACTTTCAAGTTGATGATTTTCACACTTATCATGTTGGCTGTAATGGTGTACTGG
+TTCATAATGTAAAATATAATGATGGTTCGAATAAGATTAATAAATGGGTTGATGAAGAAG
+GAAATATAATATGGCCTCCAAATAGAGGCTTCGACGGTGAACCGGTGAAAGTAACGTTGG
+AGCCGGGAACGCGAATCGATAGGTATGGCTATGAAGGAGGTACATTTGCTTCGCCTGTGG
+GAACGCCGTATGACTGTCGTTCTTTAGCACCGGGAACGGAAACTAAACCATATAATGTCT
+ATGAAGTTGTCAAGCCGGTTGAAGCACTAAGCGGCAAAATAGCACCATGGTTTGACAAGC
+CCGGTGGAGGAATACAATATGAATTTAGTCAGTCAATTAAGGAAATGTTGGAAGCAGGAA
+TACTAAAAAGGGTGGGATCATAAGATGAATAAAAATGATTTAAGGAAAATGTTGACCGAT
+AGCAATATACCTAAAGATACATACTCTTTGGACGGCGGTTTGCCGAATGAAGCATATTGC
+CTCAATCAAAATGGGGATAGATGGGAAGTTTATTACAGTGAACGGGCTCAGAAGACCGGA
+TTAAAAATATTTGAAACGGAAAGTGAAGCATGCGAGTATTTCTATAATTCATTAGTTCAG
+ATGTTAAAGGACATGGGCGTATTATAATTACAAGTTATCTGTATAGGTCATACAAGTTTT
+AACCGGTATGACCTATACATGATTCGGTTTACGGAGCTCATCCGATTATGCCTGAGGGAA
+GCTGATAAAATATGCATTTAATTGACTTGGAGATTTCCAAAATACAATCCATAAGAATAT
+ATTTGCCATGTAAAAAAGAGGATATAAAGCCATTTGATATTGTGTCAATAGAATATATAA
+AAGAACAAATAGAATATGATTTATATGTTGATGATTTTGCAACAGAAGCGATAACATCGT
+TGAAAAATCAGCTGAAAAAAGCGTTGAATTTTGAGTTGCATATTCAAAACGAATATATAA
+ATAAAGGGATTGGGTATTACTATAATATTTATGTAAATAAATTGTGGACAACTGATGCTC
+AAAGCCTTGTTGATCCATCACAAAATTTTAGCCTTTGGTCAACTCCAACTCATATAGGTA
+TTGAAACTTTTATGTATAATATTGATGATAAAATATATATTGAAATAAGTCCAATTTACA
+AGTGGAACTGCGATTATCCTGAGAATGAAAGTGAATATGAAACTTTTGACAATTTTCTAA
+ATAATTACAAACCAATTGATATTGTTTCAATTGACAGAAGTGTTGCTGAGAGATGGCTAG
+ACTTTTGTTGTGATATGATAAAGATATTTAAAGAAAACGATAAAAAGTACTTAAAAGAAG
+ATAACACAAATTAGCTTTTTATATGGCAATTTTTTATTTGTACAAAGCTACTAACGAATC
+ATAAAAAACTTAAGCTTAAGGGATAGGGAGAATTTGCAGGTCACGTAATTTCAACTAATG
+TGACCTTTTTGTTTAATATATATTATATTTATATATTAATTCAATTATATTCAGAGACAG
+GAAACACATTACAAGTTGTACAAAGGTAGTGGAATGTTTTATGTTATATGACCACAGCAC
+TTTCTTTTAGTATGGATGGATTTGACATGCTGGCAATGGGAATATCGTTGTTTGAACCAT
+CCAATGCATTGGTTGAATTTAACCGGAAGCTGCATTCCAATGCACTTTATAACGGATTCC
+AGATTGCTGTAAACGCGCTGGCTGTTTTCAGTGCCGGGGCGGCATCGACAATGAAGTGCT
+TTGTTGCAGGTACAATGATATTGACTGCGACAGGCTTGGTTGCGATAGAGAATATCAAGG
+CAGGGGACAAGGTAATTGCGACGAATCCTGAAACTTTTGAAGTAGCCGAGAAGACAGTGC
+TTGAGACATATGTGAGAGATACGACGGAGCTTTTGCATTTGACAATCAATGGAGAGGTAA
+TCAAGACAACCTTTGAGCATCCGTTTTATGTAAAAGATGTGGGTTTTGTTGAAGCGGGAA
+AACTGCAGATAGGAGACAGGTTGGTTGATTCAAGAGGTAATGTTTTAGTATTGGAAGGTA
+AAAAGCTTGAAATAACAGATAAGCCTGTAAAGGTTTACAATTTTAAGGTTGATAATTTTC
+ATACGTATCATGTTGGCGAAAATAGGGTATTGGTTCATAATGCGAATAAGTATGTTAAGG
+GAACGCGTAGTACTGTAGGTAAACTTACAGGTTCATTGGATGGGTTAACATCAGCAGAAA
+GAAAGGTTGTAAATGATTTGCTTTCACAGGGTAAGAATGTTGAAATAATTCCGCGTTCCA
+ATGTTCAAGGGGTTAGCACACCTGATTTTATAATAAATGGGGTAAAAACAGAATTAAAAA
+CATTAAATGGAACAAGTCTAAATACTCCGGTTACTAGGATTACAGATGCGTTTAAACAAG
+GTGCAGATGCAGTTATTATTGATGCAAGAAATGTTGGAATAACTGCTGAACAGGCAAACC
+AAATACTCAATCGAGCTGCAGGCACTTATCAAAATAAAGTATTACCAGGTCAAGTTGAGA
+TTTGGACTGTTGACGGTATTATTAGGAGGTAATAATTTATGAGAATGCAATGTAAGTGTG
+GAGAAATATTATCCAATAGTATGGCTCCTAATGACATCCAATTAAGAGTATATACTGATA
+GGGAATGGGATGATATAATTAATATGGGTGAAATTGATTCAATTAATATACCACACCCTA
+AAATCGATGTATGGCGTTGTCCTAAATGTGAAAGAGTTTATGTCTTTGAATATGGTAATC
+ATAAAGCAATAAAAGTCTATAAGTTAGAAGAATAGGTGTCTTTTTAAGGTCACACAGTTT
+CGTCTGATGTGGCCTTTTTTCTTATCTATGCTTGACAATATGTATTACAATGTGATACAA
+TAAAACCAACAAGAAATACAGGAGGTGCAATAATGTCTACAGAAAAGGATAGTATGTTAC
+GGGTAAGGCTTACAAAAATGCAGTCGGATGAATTGGATGCGATTATTGGTGAGCTTCAAG
+CACAGATGCCGGAAGCAAGCGTTACCACATCAAGCATAGCAAGATACGCTCTGGAGAAAT
+ATGTGAGCGACCATATTGCTAAGCGTGACGGAACCAAGATTTTTATTGAAATCAACACTG
+CTGATGCCACAGAAGAGGAGATAAAGAATCTCTATGACCTTCTTTCGAAGCTGTTTGACG
+AAGCAAAGGAGAATTACTCACCAATGGTTCATTACATGGTTGGGGAGATTTTAGAGCCTC
+TGATGATGAAAATGGCAAGACTCATGAAGCTAAAGAAGCCGGAGGTGAAGGCAGGTGAGT
+AAGAAAAAGTACATTGTCCGCTGTCCTCACTGTAATCACAGAGTATTTGATGCTGATTAT
+GCTGATGTTGAAATCAAATGCCCGGTATGCAAAAAGGTTTTTGAAGTAAAGCTGGAGAAA
+AAGGCGGGGTAAAAAGTGAATAAATCTGGCACAGAGCCACAAAGGGAGCGAATGACTCAC
+CTATAGAGCCTGGCAGATAGTCTTAAAAACTATTTGTCAGGCTCTATTTATGTTCTCGGA
+GGAGGTGAGAATTTGAAAATGACAATGATGGACGCAGCAATAAAATACGCAGAAGCCAAT
+ATCCCAGTTATGCCTTTGCACTGGATTTGTGAGGATGGCTCCTGCTCCTGCAAGGCAGGG
+AGTGATTGCGACAGCAAGGGAAAGCATCCGTTATATACCGGCTGGTACAAGAACTCAACT
+GCTGATATGGAGCAAATAAGGAAATGGTGGACAAAAACACCCAATGCCAATATAGGCATT
+CCTACAGGTGAGAAATCCGACTGGCTGGTACTTGATGTGGATGATGGCGGTGATGAAACC
+ATATCTGCACTTGAAGCAACATATGGAAAACTTCCGGATACGGTTACTGCTGTTACAGGA
+AGTGGAGGTTGGCACTATGTCTTTAAATACCCTAAAGGCCGGAGTATCCCAAATAAGACC
+AAGTTTGCATCGGGTCTTGATACGCGTTCAACAGGTGGACTGATTGTCGTGGCTCCAAGC
+ATTCATGTAAGCGGTAATCAGTACCAATGGTTAGAAGGACATTCTCCCTTTGACAGAACC
+CCGGCAGAAGCTCCAGCATGGTTATTAAAGCTCATGGAAAGGGTGGAAGTATTGCTTACA
+CCCTTTGAAGGTAGCAGTATTATAGCAGAGATTAAGGAAGGCAGCCGCAATAGCACCCTG
+ACGAGCCTTGCCGGGAGTATGAGAGCAAGAGGAATGACAGAAGAGAGCATCTATGCAGCA
+CTGCTTGCCGAAAACAAAGCCAGATGCAATCCTCCGCTTGATGAAGCGGAAGTTAAAAAG
+ATAGCGCACAGTGTCAGCCGATACCAGCCAAATCCTCCGATGAAGAAGCATTACCACAGG
+ACAGACAGCGGTAATGCAGAAAGGCTGCGTGACCGGTTTGGTTCAATCATAAGGTATTGT
+CCGGCTTTCAAATACTGGTTGGTATATGACGGCTGTTGCTGGAGGAAAGAAACCGGAGAA
+CTTATGCAGTTTGCTATAAAAACAGCAAGAGACATGCTCGCAGAAGCAAGCCGGATAGAG
+GATGAGGCTGCAAGAAAAGAACTGGTGCGCCATGCCATGCAGTCTGAAAACGCAGGCAGG
+CTTAAAGCCATGATCGATGTGGCTTCAAACCTTGAAGGAATGGTAATTATGCCGGATGAG
+CTTGATTCTGATATATGGAAGCTGAACTGCAAGAATGGTGTGGTAGACCTAAAGACAGGC
+GAACTCCTTTCTCATAAGCGGGAGTACTATATGAGCAAAATCTGTCCTGTTGAATATAAA
+CCAAGCAGCAAGGCTCCCAGATGGATGGATTTTCTGAATACCATTACGGGAGGAAGCAAC
+GAGCTTGTAAGATACCTTCAAAAAGCTGTAGGCTCATCTTTAAGCGGGGATATTTCAGAG
+CAGGCCCTATTCGTCCTTTATGGAACAGGAGCAAACGGCAAGAGCACATTTCTAAACACC
+GTCTCTGACCTGTTGGGAGACTATGCAAGAAATACTCCGTCCGAAACCTTTATGGCAAAA
+AGGATAGAAGCGATAGGAAATGATATTGCAAGGCTTCAGGGAGCAAGGCTCGTTACTGCC
+ATAGAAATAAATGAGGGACAAAGGCTCTCTGAGGCATTGATTAAAAGCTTCACAGGCGGA
+GACAGAATCACAGCAAGGTTCCTTTATGGAGAATACTTTGATTTCCAGCCGCAGTTTACC
+CCATTTCTCGTAGTAAACCACAGACCTGTCATAAGAGATACCAGTCACAGCATTTGGAGG
+CGCATTAAGCTGATTCCTTTCACCGTTACCATACCCGAGGATAAAAAGGATAAGCAGCTA
+CCGGCAAAGCTGAGAGAAGAGCTGCCTGGCATATTGTCATGGGCAGTTGAGGGCTGCCTT
+ATATGGCAGAAGGAAGGACTAAATATGCCTGATGAAGTCAAAGAAGCTACAGATGGGTAC
+CGGCAGGAAATGGATACTTTCTCATCGTTCATTGAGGAATGCTGCATTGTGGAGGAGGGC
+AGGAAAGTCTCCAATAGAAGCATCAGGTACGCTTACGAAACATGGTGCCGGGAGAACGGA
+GATTATCCTCTTGGTCAAAAGCTGTTCAATGCAAAAATGACGGAGCGCGGCTTTGCTGTC
+AAACGCAGCGGAGCCAATGGCAGCAGGGACTGGCATGGCATTGGTCTTGCTGAGGAGGCG
+ATACTTTTGTGATTACTGACGACTGACGGCTTCTGACGTCAATTCCGTAAATTTTTATAT
+ATATTTTTTCTTATGTGAAATTTATGAAAAAAGAGTCAGTAAGAGTCAGTACGTCAGTAA
+ACTCTCAGTACCCTGATGAGAGGGGAGGGGGAGGTCAAATCTCTACAGTAAAGCATAAGG
+GCAACGGGCTGGCAACATCGCGTAAAAAAACGCAGGTTCAAACGGGGTATTAACCCCAGA
+CCATATTTACAAAAAAATATTAAGAAAATGGAGGATTTAAGCATGAGATTTATAGCAGAT
+TTGGTACATGAGAAAAAGCAATTGGTGGAGAAAGCAGAAGCTATTTTAAACGAAGCTGAA
+AAAGCAGGTGGAAGTTTGACGAATGAACAGGAGCGACAGTTTAACCGCTACACAGACAAA
+ATTAAGAGCATTAATGAAAGCATTGACGAGGAATTATTAAATATCAGAACCTCTGAGCCA
+ATTCTAATTACACCACAAAAAGCTGTATCTCCTATTGAAGAATCAAAAACACCTGTAACA
+AAAGCCGTATCAAAATCATTCAGAGGGATGTTCTATGGAAACGAAACTGTGAGCTTAAGC
+AACAATGGTTTTCATTCCATGGATGAATTCCTGAGAACACTTCACTCAGGCAGAGCCGAC
+AACAGGCTAATAAATGCCAGTATGGTGGAAGGGATACCTGAATTCGGCGGATATTCCGTA
+CCGGAGGAATACGGAGCCTTCCTGATGGATAAATCCCTGGAGAATGAAATCATCCGTCCA
+AGAGCAACGGTATGGGCAATGGGAAGTGAAACAAAGAAAGTACCAGCCTTTGACGGAGCA
+GACAGAACCAACAACCTATTCGGCGGCATCTCGGGCGAATGGCTTGAAGAAGGACAGACA
+GGCACACGAAAAACAGCCAAGTTAAGGCTGATTCAACTGAAAGCCAAGAAGCTGGCTTGT
+TTCTCACAGGCATCCAATGAACTTATTGCAGATGGGATGTCCTTTGAAGAAATGTTAGCT
+GGAGCACTCATTAAAGGCTTGGGCTGGTACATGGACTATGCCTTTATCAATGGAACCGGT
+GAAGGCCAGCCTCTTGGTATTATAAATGACCCGGCGCTGATTACTGTAAATAAAGAGGAC
+TCTCAAGAACCAGCTACAATTACCTATCAGAATGTTGTCAATATGTTCTCAAGGCTTGCT
+CCATCCTGCTTTACCAATGCGGTATGGCTTGCCAATCCATCGGTAATACCACAATTACTT
+ACCATGACTATCACCATTGGTACCGGTGGCGCTCAGATACCGGTGTTCAGGGAAGAGAGC
+GGGAAATTCACGCTTCTGGGTAAGGAGGTCTTATTCACTGAGAAATGCCCCGCATTGGGT
+GCTAAGGGAGATTTAATCCTTGCAGATCTTTCCCAGTATGCCATAGGCATGAGGAAAGAG
+ATCGCTCTTGACCGCTCCAATGTCCCAGGCTGGATGGAGGATATGACCGACTACAGGGTG
+ATAGTGCGTGTAGATGGTCAGGGAACCTGGGATAAACCTATAACACCGAAAAACGGAGCA
+ACGCTCTCATGGGCAGTGGCTCTGGAGGCAAGATAGTCTGCTGAAATTTCAGCCAAAGCT
+ACCATTGAATCCAGTTTTAGGGTAAATGAGTGAATGCTTATTTCATTGCCACAGGACTCA
+ATTTGAGCCTAAACAATACTTAGGGTGAAACCGCCCAAAATGAGAAAATAGGAAGCTCTG
+CTCCTGTTTAACAGACTTTTTAAAAGTGGGTAGTTCTCCTGCCTGCTGGAATTGCTTTAA
+ACCCTCTGAAACCCATAGAAATACTGCTTTCTAAAGCATAATTGACTTGCTATATCAGCG
+GTTCAGAGTGATGAATGTTACTACGGAATAAAGGCTTTAACCGTAGGAAGGGGTGAAAGT
+GTGAGAGCAAAGATTACCACAACCATAGAGGAAGCCTTATTGAACAAAGCTAAGGCACTT
+GCCGGACAAGAGGGTTTGTCCGGTGCCAATGCCATTATTGAAAGGGCGCTGGAGTTGTAT
+TTTACCAGTATTCAATGTGAAGTATGGGAAAAATCGTTGCCCAGCGGCTGGATAAAGAAG
+CTGGTTCTAAAAGGGGATTTAATTCTGTACGAAAACATCAAGTGCAGAAAAACCTTGGAG
+AACTACAGGCCGGAAGATTACACACAGGAAAGCCTAAAAGCAAAAGGCTGGAAAAAGGTT
+TAGTAGCAAGTAAAAAGGCCTCTGTATTGCTCCCTGAAACGTAAAAGCGTAGGTTGCAGC
+CGTAAGCTTTGTTGAAACAAAAGGGGCAAGTAAAAAGGATTTTGTAAAGGTTGCAGCAGT
+TATCAATACAGAAATTTATTGGTCAGAAGCATTAAGAAATTAGTGTCCAAGAGAAGCAGT
+AAAAGAACATTAAGAAATTTGAACTAAGGCTCGTGATGCCTGAAATCACGTAATTTGTCA
+CATCAGGAATAGATAGGTTGGCGTTCCCTTGCGAGGATTAAGGTCAAGGGACACTTCTTT
+ACAAGAAATGTCCCTAATCGAATCTAACGCTCTTAAATTGAGGTTGCCGGTATGAGTGGT
+GGAGACATTGGAAAAGGAGAGGATAGATATTTATCATAAACGAAACACCTGCTTTGTTGG
+AATTGATATGCACAAGGACGCACATTGTGCAGTTGTAATTGATTGTTGGATGAATAAACT
+GGGTGAGGTTAACTTTGAAAACAGGCCATCCAGATTCCCTGCATTCGTTGAGGATGTAAG
+GAAGATTTGCGGCACAAAGGGAATTGTATTCGGACTTGAAGATACCAGAGGCTTTGGCAG
+AAACCTTGCTGCCTATCTGGTCGGCAGGAAGTTTGAAGTCAAGCACGTTAACCCTGCCTA
+TACAAGCGCTGTAAGGCTTGCAAACCCCATTATTTACAAGGATGACTCCTATGATGCCTA
+TTGTGTGGCAAGGGTGCTCAGGGATATGGTGGACACTTTGCAGGATGCCAAGCATGAGGA
+TATATTCTGGACAATACGGCAAATGGTGAAAAGACGGGATTTGATTGTAAAGAGCAATGT
+GATGAACAAGAACCAGCTCCACAGCCAGCTTGCTTATAGCTACCCATCCTACAGGAAATT
+CTTTGGCATGATTGATTCCAAGAGTGCCTTATGCTTCTGGGAGAACTACCCGTCACCGGA
+GTATATATGGAAAACAACACCGGAAGAAATATATCAGACGATAAAGCCTGTGCATCAGGC
+GCTTAAAATACAGCGCATCCATGAGATTATATCCATGATTGAAAGGGATGGAGACACAAG
+AAAGGACTATCAGCCCGAAAGGGATTTTATTGTCAGAAACATTGTAAAGGATATCAGGCA
+CAACAAGGAGTTGATTGCCGAAATTGACGATGAACTAAGAAAGCTGATACCTTTGACAGG
+CTATAAGCTACATACAATGCCGGGAATCGACCTTGTTACAGAAGCACAGATAATATCTGA
+AATCGGAGATATTAACCGCTTCCCAGACTCAGACAAGCTGGCTCGGTTTATGGGCTTGGC
+ACCGGTGCAATTCAGCTCTGCCGGAAAGGGTAAAGACCAAAGATGCAGGAATGGCAACAG
+GGCACTAAATGCGATATTTCACTTTCTCGCAATCCAGATGGTAGCAGTATCGGCCTCAGG
+AAAGCCAAGACACCCGGTATTCAGGGAGTATTTTGAGCAGAAGGTTAAAGAGGGCAAGAA
+CAAGCCACAGGCGCTTGTGTGCGTGGCAAGGCGGCTTGTGAGGATTATTTACGGCATGAT
+GAAAACCAGGACAGAATACAGGCCATTTGAGAAGGCTGACGACAAGAACTGA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_014168.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1022 @@
+>NC_014168.1|provirus_27479_67296
+ATGACGCGCGCGGTTCCGGTTGCGGATGTTCGTGTGGAGGGCAGGCACCGCAGGGATTTG
+GGCGATGTGTCGGCGCTCGCTGCGAGCATTCGCGAGGTGGGGTTGATCCATCCGGTGGCG
+GTGACGGCGGATTTGCGGCTGGTGGCCGGTCAGCGGCGTTTGGAGGCAGCGCGGCTGTTG
+GGCTGGCAGACGGTGCCGGTCACGGTGGTGGCCTCCCTGGTGGAGGCTGCGGACTTGTTG
+CGCGCGGAGGCGGATGAGAACACGCAGCGCAAGCCGTTCACCCCGACCGAGGCAGAGGCG
+ATAGCCAGCGCGATAGAGGCGGCGCTGCGGCCCGTGGCTGCGGCGAGGCGTGCTGCTGCG
+ATCAAGGACCGAGACGAGAAGGGCAGGGCTCTGTCCACTTCCGCCGAATCGGCGGAAGTG
+GAGCGCCAACCCGAGACCAGGGACATAGCCGCGCAAGCGGTGGGCTACGGGCGCGACACG
+ATATCGAAGGTCCGCAAGGTCAAAGATCTGGCTGAGGACGAGGAAACCCCCGAGCCTGTT
+CGCGAGGCGGCGCGCTGGGCGTTGGGGGAGATGGACGCGACCGGCTCTGTGGCGGGTCCG
+CACCACAGGGTCATGTGCGCGGTGGAGGCCGAGGCGGCGCCCAAGCCGCATCCGGGGGTC
+ACGAAGTGGCTTGAGTCGAGCCAGGAGCTGAAGGACAAGGGCTACATGGTCGCGTTCTAC
+AAGGTGCTCAAGAAGTCGGGCGAGATGTTCCAGTTCGACCCCGAGCGCGTCGGGCGACTC
+GGGGACGAGCGCGACGTGGAGGTGGTCGAGCACCAGTTGAAGTCCACGCAGAAGTTCTTG
+GACAAGATGCGCGCCGCCCGGTCGGGGCTGCGCCTTATCAAAGGAGACCAGGGATGAGCA
+GACGGCGCGCGAAGAAGAGCGTGTGGAGCACCGCGCATTGGAGCCAGCGGGACCGCGACG
+AGCACGACGCTCTGGTGTACGAGGCGTGGGAGTCGTCCAAGCGCCAGGACGAGCGCACGG
+ACTTCTACCTCAACGGCCTGATCGACGCGGAACAGGCGCAACGGGGATGGGCCGTGGAGG
+TCTTGGCGCACTACCGGCGCAACGGCTGCGCGAACGGGTTGAAGAACCACATGAAGCGCT
+GCCGTGTGCCCATGTCGCACGATGGCCGGATTTTGAGCAAGCCCGCCGTGGTGGGAGCCC
+GCCGCACCGACGAGGACGGCACGCGGTACTACGAACAGGCGCTCATCTACTACGTGACCC
+TGCCCGAGCTGCGGGAGAAGCAGAAGGAGAGCATCGCGCTTTCGAAGACCTACGACGAGA
+CGACGGCGATGTTCGGCAAGCTCATCGCCCTGTGCGAGGCGGGCGGCGCGAACACGCCCG
+CCGAGGCTGCGGAGAACCTTGGCGTCACTGTCGAGGGCTGGCTGCTGGGAGCGGCGGCAT
+GACCGGCCAGAAGAAGGACGAGCGGTGCGCTTGGTGCGAGCGGGCGTTCCGCGCGCATGT
+GGCCGCTGGGGGTTCGTGGGCGAGCGCGCCGAGGGTGCGGGCGGCGCAGACGCGCACGCA
+TCCCGGCAAGGGCGGCGAGCCGGTGTGCATGGAGCACCGGGCCGAGTTCACAGGCGTGTT
+CGGAGTGCTCATATGAGCGGGCTTGTGCGGATCGAGAAGGGCCGCAACCACTTTTACGAG
+CTGGACGGCGAGCGTGTGGACGGTGTGACGACGATCCTCAGCGGCGGGATACCCAAGGCT
+GCGTTGATGCCGTGGGCGTTGAAGACGGCGGCGCAGTTTGCGGTGGAGAACTGGGACGAG
+CTGTGCGGGCTCGGGCAGTTCGAGCGCGTGGACCAGATCAAGAAGGCCCCTTGGCGCGAG
+CGGGACGAGGCGGCGAACCGGGGCTCTGAGGTGCATAGGCTCGCGGAGCGGCTGATGCGC
+GGCGAGGAGGTGACCGTTCCGGCCACGTTGTCGGGGCATGTGCGCTCGTGCGTGGACTTC
+CTGGACGAGTGGCAGCCGGTGCCGGTGTTGCTGGAATGCCCGGTTGCGTCCCGAGCGGAG
+CGGTACGCGGGCACGTTGGACGCAGTGGTGGACATTCCCGGCGAGGGGCGTTGCCTGATC
+GACTTCAAAACCTCCCGTTCGGGCGTCCACCCGGAGACGGGGTTGCAGCTCGCGGCCTAT
+AGGCACGCGGACTTCGCCCTGGCGGGCGGGGAAGAGGTCGCTATGGGCGGTCTTGGCGTC
+GAGAGGGCGTTCGGGGTGTGGCTGCGCCCGGACGGCTACAGCGTCCACGAGCTGAGGGCG
+GGAGCCGAGGAGTTCGCGGTGTTCCTCAGCGCCGCGCGCATCGCCCGCTGGGCGAAGACA
+TCGAAACAAGTTGTCGGTGAAGCTTTGGAAAGGCAGAAGCATTGAGCGAGTTAGAGAGAA
+CCGAGACCGAACCGGAGCAGCGGGCGCTCTCGAAAGTCGGGCAGTGGGCGCTCGACGCGC
+GCGAGGCGCACCAAGTGGCGCAGTCGTTGGCGAAGACGTCGTTCGTCCCGAAGTGCTATC
+AAGGAAAGCCGTCGGAGGCCACGGCGGCGATCCTCATGGGCTCGGAGATCGGGCTTTCCC
+CGATGACTGCGCTGCGCTCCATCGTCGTCATCCACGGCACCCCGGCGATGACTGCTGTCG
+CGTTGCGGGGCCTGGTGCAGTCGCAGGGCCATCGGGTGTGGATCGAGAAGGCGAGCGACC
+AGTCCGTCACCGCGAAAGGCGTTCGGCAGGGCGACGACATCGTGCATGAGTCCGTGTGGG
+ACATCAAGCGCGCGGAATCGCTCGGGTTGATGGACCGGGATCAGTGGCGCAAGCAGCCCA
+AGGCCATGCTGACCGCCCGCGCCACGAGCGAGGTGTGCCGCCTGGTTTCCGCTGACGTGC
+TGCTCGGTCTGCCGTACTCGGTCGAAGAGCTGGACGAGCCCGAACCAACGACGACCGTCA
+AACGCAAACGTCTTGAGCCGGTCGAGTCGCAAAGCTCAGAGAGAGCCGAAGCCGAGCCCG
+CCGCCGCTGAGGAGCCACAGGAAGAAGAGGCGGTCTGATGGCAGGCGACACTGTTATCAA
+TGTGGTTGGGAATCTCACGGCGGACCCGGAGTTGCGGTTCACGCCGACCGGGGCTGCGGT
+CGCGAACTTCACCGTCGCGTCGACCCCGCGTGTGTTCGACCGGCAGACGAATCAGTGGCA
+GGACGGGGAGGCGTTGTTCTTGCGCTGCAACATTTGGCGCGAGGCCGCGGAGAACGTCGC
+GGAGTCCCTTGTCAGAGGTCAGCGAGTGATCGTTGTGGGCAGGTTGAAGCAACGCAGCTT
+CGAGAAGGACGGGCAGAAGCGCACGGTGGTGGAGCTCGAGGTGGACGAGATCGGGCCTTC
+GCTGCGCTACAGCACGGCGAAGGTGAGCCGCGCGAACCGTGGCGGCGTCTCGCAGTCCGA
+CGAGCCGGATTGGCGGTGACGGCTATGGAGTCTTCCCCGGTGTCGTTGGAGCTTGAGCTT
+CGCGAGTTGATGAAGCAGCGGCGGCTGGCGTCGCTTGAGAAGCGGGATTTGCGGATCAAG
+GCGGACGACGAGCGCCGGGAGTGGAAGAGGGCGCACGCGGTGTGTCACGCCTTCTACAGG
+AGCAAGGGCTACGCGGTGGAGGACGCGAAGCAGGCCGCGACAGCGGATAAGGGGGTGATG
+GCGGCTCAGCAGCGCGCGGAGCATGCCGAGGCTCTTGCCGGGTACGCGGCGGACCAGTTG
+CAGGACTTGCGGCAAGAGGTCATTGCCGTGCAGTCCCTCATCAGTTTGTGGAAAACCCTT
+GTCGAGAACGGAGGGTGAGCGGTGAGCGACCAGATAAAGAAGGCCGATGAGGCGTTGCGG
+GCGCATGAGGAGGCGTGGGTGCGCCGTTACGTGCAGCTCGGGCATTCCCTGGAAGAGGCG
+AGGGCGGCGTACCGGGCGAAGTTCTGGGCGGGGGAGGTCGATCTGCGATGGTGAGGCCGA
+TATGCCGGTTCGAGGGCTGCCAGCGGGAAACCACAAGGAGCAGCTTGTGCCCCGCTCACG
+AGAGGCAGCTTCACAGGCGTGGCGAGGGCGGGTTGACCCCGCTGGGCGTGCCCTTGTGGA
+AAGGCTGCGTGGTGCCGGGGTGCGAGCGCAGGCGTTTCGGGAAGAACATGTGCGGGCTGC
+ATCTCAACCGTTCCCGCAAGGGCTTGCCCCTGGACCCTTGGACCCGGCATGACGAGAAGG
+TGTACCAGTCGGCGCTACGGGGTGTGGCGGGTGTTTTCGAACGCCGTGTTGCGGTGGAGA
+TTGAGGCCGGGGAGTGCCGCGCGGAGGCTGAGCGGAAGTTCCGCGTCGAGTTCCAGTTGC
+TCGCGTCCTTCCTGGATGACTTCGCGGGAGAGGGGGCGCTGCGATGACCGCCGAGTTCAG
+CAAGCGCGCCCGCGCTCTTGTGGAGTTGCGCTCCGAGGGGAGGTGCGAGGGCGAGTTCGA
+CCCGCGCGAGCGCTCGAAGAGGCCCCGGTGCCTTCGGGTGGCCGAGGAGATGCACCACCG
+CCGCACCAGGGGCTCGGGCGGCACGAGCGATCCCGCGTCCTCGCAGGTGAGCAATGCTTT
+GGCGTTATGCCGCAACTGTCATCACTGGGCGGGGCAGTGCTTCCGTCTCGCGGAGGCGCT
+GGGGATCTGCGTGTACCAGGCGCACCGCCCGGACGCGCGGCCCGTGTTGATTCGGGGCGA
+GTGGCGCCTGCTCTTGGACGATGGCGGATTGACCCCGCTTATCCGCGTGGGCGAGGACGA
+GTGGCGTTTCGACGCGCTCGGCGGCCACCGCTACCCGGCGTGGCTGGTGGACGGCGCTAC
+ACCGCTCGATGAGCGGTACGTGGACGTGAGCGGGCCGTTGGATGCGAACCGTTACGCGAC
+GAGATGGGCGGTGGCCTGATGTCGTGGTTCAAGGTGGATGACGGGTTCTACGCGCACCCG
+AAGGTTATGGGGCTCTCGGACGGCGCTCTGAGCTTGTGGACGCTCGCGGGCACCTGGTGC
+GCTCACCAGCTCACGGACGGCGTTGTCCCGCACGCGGCGCTGTCGATGCACAGGGGCACG
+CCTGAGCGGGCTCAAGAGCTCGTGGAGGCCGGTCTTTGGGAGCTGCACCCGAAGGGCCAC
+AAGTTCCACGACTGGGAGCAGTACCAGCCCACCAAAGAGCAGGTCGAAGCGGAGCGTGAG
+GCCGCGAAGGAGCGGATGAAGGCCGCTCGGGCCAAGCGCAAAGCCGCGAAGCCTGTTCGG
+GAGAACACTGAGGATGGTTCGCGCGATGTTCCGGAGAACACCGAAGACGGTTCGGAGGAT
+GTTCGGGCGAACACCGACCGAACTTCGGGCGAAGTTCGCCTAACCCCGACCCGACCCGAC
+CCGTCCTTATCTACTGACGTAGATAACTCAAGTACTTCGCCTTCGGCTCAGTGTTCACCC
+GCCGAGCTTCGCGCCGAGTTCGCGGCGTTCTGGACCGTCTACCCCCGCAAGTCGGGGAAG
+GCCAAAGCCGAGAAGGCGTTCGAGCGGGCCAGGCGCAAGACCACCGTCGAGGCGATGACC
+GAGGCCGCTGGGCGCTACCGGGACGACCCGAACCGTGAGGCGGGTTTCACGAAAGAGGCA
+GCGACCTGGCTCAACCAGGAGTGCTGGAACGACCCGCCGCTGCCGCCGAGGTTCGAGCGC
+ACCAGCGCCAAGCCTCCTCCCGGCCCGTTGGACGGCTACGGGGCCGGTGTGAAAAGCCAG
+ATCGGATGGGAGATGCTGAGCCCCACGCCTGACCCGCAGGCGGTCGCGATGGCCGAGGCT
+GCGGGCTACAAGCCGCCATCGAACGGGCACAGATTGCGGGAGGTGGGCGCGTGATAACCG
+AACAGGAAGTCGTGTTGGTGCTGCGGAAGATCAGCGCGAACGACAAGCGCAAACCGGATC
+AGTTCGAATTGGATGAGTTCGTTTCCGCCGCGCGCCGCCACAACTGGACGTACCGGGAGG
+CGTGCGCCCAGGTGGACGCGTTCTTCGACATCCCGCGCGGCGGGGAGAGGATCACCCACG
+GGCACATCACAGCCGGGATCAAAGCGGACCGCAGGCACCCGAAGCCGGTGGCGGACGTCC
+TGCAACTGGAAGGCCCGAAACCCGCGAGCGAGGACAACCCCGACCGGCAGCGCGTGCTGG
+CGATGGTGCGCGAGCTGAGCCGCAAGTTCTCGATGCCCGAGGAGACCGCCCGGTGAACCG
+CATGAAGCAGAAGGGGGACCGCGCCGAGCGGGAGGCGGGGCGGATCGCGGGGGCGTCTGG
+TTTCCCGTGGTGGGAGCGCATGAAAGCCGGGGCCGAGCGGGACCGGGGCGACTTGACGCT
+GTGCCCGTACGTGATCGCCCAGGTGAAGGACTGCAAGCGCATCTCGATCCCCGAATGGCT
+CAGGCAGCTCGCGCAGCAGAAGCGCAACGCCCGCGCCGACGTCGCCGTGCTGGTGGTGAA
+GCACTCCATCCCCGGCAAGGCCCCGGTCTGGTCGATGATCCTGCCCTACCAAGAGGGATT
+GCGCCTGCTCAGGCAAGCCGGATGGGGCGAACCCGTCACCGACGAACCACGCATCACCGA
+GGAAAGGACAGAGCTATGAGCGGAAACCCGATAGCGACCACACGCTACACCGTTCTCTCC
+GGGCCGGGGAGCGGCCCGACGCTGGGCGAGCTTCGCGAGCTGGTCGCGAAAACGCACGAC
+TGGGCCGCAGACTCGCGCGTGCTCATCGCCCGCTCGCGGATCGACCAGGACGACGAAAGC
+TGGCACATGGCGCTGCTAAGGGAGGCCGGGAAATGAGCGAGGACATGTGGCGGGACGCCG
+CCCAGGTCGCGGCGCGGAACAATGCGGGCAGCGGTGGGCGTGTGCCGCTTTTGGCGTTCG
+TGGACCGCAGTGACATGGCGCAGGTCGGTGTGCTCATCGCGGCCCTGGTGGCCATGGCGT
+GGATGAGCGCGGACGGGTTGGCGTGGGACATGGCGGGCGTGTTGAGCTTCGCGGGGGGAT
+TTTTGACCGCGACGTTGGTCAACGCGCTCGTGTTCACGCTGATGGTCGTGAACGGGCGGG
+CGGTCTTGCGTCGCCTTGCCGTTGAGAAAGGAGCCGGGGAATGAGCGCCCGCAAACTAAT
+GGCAGGAGCCGTGGCCGTCGTCGTGGTCATAGCCGCCGCTGGCTGCGGCGCTTCTAACGA
+GCAAATCAACCCGCCTGAACCGCAGGTGTGGCGGCTGCCCATAGCTGATGGCCGGAAAGT
+CGTGTGTGTCTCGATCAGCAATTCGAGCAACACGGCGATGTCCCTTTCCTGTGATTGGGG
+GAATGCGAAATGAGCGATGAGCTACCGATCGGTGTTGTGGGACGGCGCATCGTCTCGATT
+GCAGAAGGGGCTCGCAGAATTGTCGAGCCTTCCGCTTACGACTCGTCGCCGTTCGTCCAC
+GACGGCTTGGTGATCGGTCTGGACGACGGATCTGAACTGTTCATTCAGGACAACGGCGAG
+TACTACCCAGGGTTCTTCACACACTGGCTCGGGCAGAGCATCACCGAGGAAAGGACACAG
+CAGTGAGCAGGGCGAGCATCAGGAGGATCACCATGTGGAGTGACGTCGCGTTCACTGCCC
+TCCCTCCGGGGTGGGTGAACGTCTACAGGATGGACGACGGCACCTATGAGACCGAGCCCT
+GCCCCGGTGTGCTGCTGCAAGAGGCGACCCAATATAAAGAATGCTGGGACGAGGAAGTGG
+GCGGCAGTAACGTGCTTCGGACCCGTCGGTGCGAGATGGACCGTGAGACAAGGACCGTGC
+CCGCCGAAATCTGTGTTGGAAACTTGTCGCCAGCCTGCGATGTCTCCAACTATGTGACAA
+CCGCCACGGCTGAGGAATGGGAGGGCCAAGAGGCCGGGGAGGCCGGGGAATGAACGCTCA
+AGAGTTGAAAGAGTTCATCGATGAGCACATGGCGCAAGACTGGCTGATCTTGGTGAACGA
+GATGACCGGGGCCGCGCTCGTGGCGGACTTGGCCATCACGAGCGCCGAGGGCTTTATCAG
+GCTCTCGGGCAGGATCACGCCTGACTTTTACAGGTTCGACCCTGAGACTGGTCGGCTCGC
+GCATGAGCGGTACTCGCTTGAACTCATGAGAGGTTGGCGCGCGGTGAAGCCTGGCAGCCC
+GGAGTACGAGGCGGCGATGCGCTTGAACACTGCACGGATCAAAGCGCGGGCGGTGTTCGA
+CCAGTTGGGCGCGGGCGACATGACCATGATCGAGACACGTTGGCCGGTGATCAGGGCCGC
+GATGTCCAACGTTTCGGAGGCTGCGGCGCATATTGCGGCGGCGGATGAGTACGGGGAGCT
+TCTACGGCGGCAGGAGACCATCAAGGAGGCCGGGGCATGACGGACGGTGGTTTGGATTTC
+GGGGATGGCGTGACCACAGCCCCTACACAGAGGTGGGCCGAGGCAACGACGAACGTCTCC
+GAGCTGCGGGACGTGTGGGGCGAGCTGGCGAACCATAACGGGCGCGTCACCGACCTTGAG
+GCGGAAGTGGAGAGCGTCAAAGCCGAGGTGCGGGCGCGCATGCTGGAAGCGGCGTATCCG
+TCCCGTAAATCGCTCCTCGCCTACATGCGGCCCGCGCGTTGGGCGCAGCTCGCGGCGCTG
+TTCGCGAACCTCGCGCTTGTCTTGTGGTGGGCTGTTGTCAGCTGCGGCATGGGGATGTCC
+CCTTATCCCGGTGCGATTGTCTGCGGGATCGCGATCTGCGCTGCCTGGATCTTTTCGGTG
+GAGGCGTTATTCGAGGCGCTGGACCGCAAGGGGGCCGGGGAATGAGCGATGAGACCAAGC
+CGTTCAGGTTGCAGGATCAAATTTTAGTCCTGATGCTGATGCACCTGGACCGGATCGATG
+AAGCCTACTGCGCCACGCTCGACGGCTATAAGGTGACCGAGGCGCGGGCCGAAGATGTCG
+ATCTTCTCCGCATGTCGGCGTACTTGGCCGAGCACGCCGACGCGTTCCGCGACGACTCGG
+AGGCTGAGTCCGGTGAGATCCGTGTGGTGGAGGTCGCGAAGGGTTTGCGGATGCTCAAAG
+CCGGTGACATGTGGGTCACCGAGAGCATGGTCGAACAGCTTGGCAGGGTCGCGTTCGATG
+ACATCAAGCCCTTGGGCAAGGTCAGAATCCCCGTCGCGAAGCACTTCGGACTGGCGAACA
+CCTACGCCATCGGCCTTTCCAAGAGCACCGGATGCCTCTCTTTGGCCTCATCGGCTGGAA
+CCGAAAAACTGTCACGCAACTTGTGTTTCTTCGGAGATGAAAAGTTGGACGAGACGCAAT
+CCGAAGAGGCCCACATCTATGCCGCGCAGGAACGAGCTATAGCCGCCCTTCCCTTGATGG
+TGTTGGCGGACCAGGCATGAGCCGCGATGAGTTCTGGACCGGCCCAGTGTCGTTCTGGAC
+GATGACCGGGGCGGGGTTCGTGTGCGCCGCGCTCGCTGGGTTTTTCGCCGCGCAAGGGAA
+ATGGCCGCTGGCCCTGTATTTCGCGTTCGCGGCCATCGTCTACCTGTGCTGGGTCAAATA
+CCGGCGTGTGGACGACTCGCGCCGCGCGTTCGAGGACGGCAGGCGTTACACGGTCGATGA
+GGTCGCCCGGATGCGGCGAGTGCTTTGGGAGTCCCGACCACAGGTGTCTTACACATACGC
+GCCGGGTGAAAGCGAGGAGTCCGCATGAGCGTCACAACCTTCTGTTCTGTCCCGCATTCG
+CGTGAGGCGACCGAGGACGACCCTGCCGACGCGCTCAGGGAGCACGGCGGGCGCCTGGTG
+GTGTACGACTTGAACCGTCCCGCCGCGTTCGACGGGGCGTATTTGTGCGCGGGTCACCTC
+GCGCGCCTGGCGGACTTGATCGCCCAAACCCCGCATATTGTGGCGTTGCTGTTGTCGGAT
+CGGGAGAAGTCTTGCGCTTGGGGCGATCAGGAGGGCACTCGCCGCAAGACCGACCCCCCG
+GCTCCGTTGAGCCTCGCAGCCCTCGATGAGGCCGACAAGGAGTTCGCCGTGTTGCAGTCG
+TGGGCTGAGAACCATCGTGACTCCACGGGGCTTGTGCCGCCCCGTATACAGCATTTGTGG
+AAGCGCGGCGGCGCGGGGGAGGTGATCGGCGCGAAGTCCGGGCATGTGCGTCTCTGCCAC
+GCCCTTGTCGGGTACCTGTTGACCGACCCCAATGTGCTCGCAAGCCAGGAATGGGCCGGC
+GAGATGCTGCAAGAGCTGGCGGACATGCGCGCCCGCCGCCGTCCGCGTTGGCGGCTCGTG
+GACGAGCCGACGCCGACCGGGTACCCGTGCTTGAAATGCGGGGGCCGCACGATGCTGTTC
+CGCCCTCCGATAGACCAGTTCGACCCGTGCCTGGTGCAATGCCCCGGTTGCGGTTTCACT
+TTGGAGCGCGAGCAGTTCGACCGGATCACCACGGTCATCGAGGACGGGAAAACACCGCGC
+GGGAGGGTAGGATCGGATGCGTGAACGCGCTGCTGGACGTGGATGTTCCCGAGTTCGTGA
+CGGTGGAGCGGGCGGTGCGCGCCACGGGCCGATCCCGCCGCACTATCTACCGTTGGAAAG
+AGTCCGGGGCGGTGCGGTGGCGGATGTTCGAGGGGAAGTTGATGGTCGAGGTCAACGACG
+CCGACGAGGCCAAACTGCGGTGCTCGGACGCGCGACGGGCGAACCTGCGCCGCAAACGGT
+AGATGATCCCCGTAAGTATTGCCAAACATGGCGAGGCGTCGTAGGCTGCCCAAGCGATGC
+GGGTGTTAAACCTGTTCGGTGTTGGGGTGCTTGGCGGCGCTGGGTGAAAGAGAATGCTCG
+TTGAATCTTGGTGATGTGCGGAGTGTGGATGTGGCCGCGCTCGGGGACTTGGCGACGAGT
+CTCGCGTCCCGAGCGTCGTCGTTGGAGGAGGCGCGGGCGCAGTTCGCGAAGATCACGCAG
+TTCCCCGGCTGGTCGGGGACGGCGAAGGACGCGGCGGCGGGGAGCTTCCAGCGCGCGGAC
+GCGAGCTTGTTGGACGATGTGGCGCGGGTGTCGGCGGTGCATCAGGCGGTGTTGGAGCTG
+TCGGCGGACTTCGCCCAGTTGCAGGCCCGTGTGCGGGAGTTGGAGCGGGAGGCGGCGAGC
+ATCGGGGCGGTGTTGGGCGACGACGGCAAAGTCACGTTCCCGGAGGGGGCTCCGTGGCCG
+GATGCGACCCAGCAGCACCGCGCCCTCGTCATCGGCGGCGAGGCGTACGAGTTGATGACA
+GACGCGGACCGGCTCGATGAGAAGGCGGGCGAGGTTCTGCGCAAAGCTGTGGGCGGGGAG
+ATCAACGCCGCTGGCACGGGGAACGAGACACAGGCGGCGCTGGCCGGGGCGGCGCAAGGC
+ACGTTGGGCATGCCGGAGCCTCCGAAGGCCCCTGGGGGGCATGCGGACCCTTCGTACAAC
+GCGGGATGGTGGAAAGACTTGACCCCGGAGCAGCGGCGTCGGGTGCTGGACTTGCACCCG
+GAGTGGGTCGGCAACCTGGACGGGGTGCCCGCGTCCGTGCACGACGAGGCGAACCGCAAA
+ATGCTGCCGGGGGACATCGCCCGGTTGCAGGCGGAGGTGGACCGTTTGCAGAAGCAACTG
+GACAGCGAGTTCGGGCACGGCGCCTTCAGCAACACAGACTCGGACCTGTGGTACGCGCAG
+CGCCGGTTGGAGGGTTTGCAAGCGACCGAGAAGGCGCTGCGGGACAATCCCGGCACGAAG
+CTCCTGGTCCTCGACCCCGACTACGGGACCAGGGGCCGTGTCGCCATCGGCACGGGCGAC
+CCGGACACCGCCAACCACATCTCCATCTCGACCCCCGGGGTGAACTCCTCCCCCGGGCAG
+AGCATTGGGGAGATGACCAAAGAAGCAGTAGCTCTAAAGACTGAGACCGAGAACGTGCTT
+AAGGCCAATGGGCATGGGAACGAGACGGTCTCGACCATCTCGTGGATCGGGTACGAGCCG
+CCGCAGGCGCAGCTCGACCCGCAGCACCTCGACAAGACGGGCGACGTCGGACCTGGCGGG
+TTGCGGGACGAGCCGGGGGGCTTGTCCGACGTGGCCAGCGATGCGAAGGCGAAGGCCGGC
+GCGGCGAGCCTTTCGCAGTTCTACGAGGGCATCAGCGCCGCCTGGCATCCTGCGGACGGA
+GACTCCGCCACGAGCCCGCACATCACCGCCCTCGGGCACTCCTACGGCTCGCTCACCACC
+AGCCTCGCGTTGCAGCAGACACAGACGGGAGTCGTGGACAACGCCGTGTTCTACGGCTCC
+CCCGGTCTGGAGCTTCCTTCCCTTGACCGATTGCCGGTCGCTACGGGGCACGCCTACTCC
+ATGCAAGCGCCGAGCGACCCGATCAACTACGTCCCCAACCTCACCGAGCACTACGGCCCC
+AACCCCGTCGAAATCCCCGGCATCACGAGGCTGTCCACCGAAGCCGGGGACACCACCGGC
+GACGCTGCACCCGGCACGACGGTGCACCACGACGGCGCGCACGGTCACTCGGAATACCCG
+CGCAAAGGCGACAACGGGCAGTTGCGGATGCCTGGATACAATATGTCTGTGATCGTCGCG
+GGGATGACCGGGCAGGACGGTCGCCCCGACCTCACCAAGAGGGGAGAATAACCCTTAAAT
+GACGTACCCGGTGGAGAAGAGGAGTTGGTTGCGACGGCGTGCGGCGTGGTTGTGGGCTGC
+TGGTGTGGTGGTGCTTGTCGGGGTGGTGTTGGTGTGCGGGGTGGGGGTGTTTCGGTTTGT
+GGAGGTGTTGAAGGGCATGGATGACGCGCCGCGGCACATGGCACAAGAAAAGGTTCCGGC
+GTTCGAGGAGCGGTATCGGGACAAGGGCAGTGTGCAGCAGGCTGCGGAAGACTTGGAGGC
+GGTGATCGCTCGGGCCGCCGACAAGATCGCCGCGCTCGTCCCCGGCCTGACCTGGAAATG
+GCAGTACGATCCTGGAAACATCGGCTGTCCGGCCGATGCTGCCAGCGACACGAGGGTCAC
+ACGATTCGCGACTCGCCTAGCGGGTTTCGACGGCGCCATTCCGGAGGACGTGTGGCCCCG
+TGCGGTGGCCATCGTGCGCAGCGAGGCGGAATTCCTCGGGATGACGGCCCAGTTCAAGTA
+CCAGGACGCGGCCAAGCAGCACGACCTGGTGTTCTCCTCTCAAGACGGCGGGGAGATAAG
+AATCGCCACAGCCGTAGAAGCGTTCATCAGGGGCAAGACCCCGTGCCGGTTGATGGAGGA
+CTGGTACACCGACCGCAATATTCCTATTCCGGGCACGGGCAAGGAGCCGCGATGACAGCC
+GATGGGGCTCCCGCAGGAGCAGGCCAGAGGATCGAGGTTGCGCTCGAAGAGCTTCACGCA
+GGCGCGAGCCAGCTTCACGACCTCGCGCAGGAGGCGACGAGCAAGCTCGCCTCAAGCGAT
+CTGATGTTGGAAACCTCCTCGCGAGCGTTGAAAGGCTTGAAATCCGCAATCGAGTTCGCC
+GCCTACGCCGAATTCGAGACCGCGCGGGGCAAATCCGCTATCGAGACGATCACCGCTGCG
+GCAGAAAACGTCGGGTATGCCGCCGAGCACTACCACGGCACGGACGAGTCGAACGCCGCC
+AGCCTCGGTTGACCAACCCTCCTCGTTTTTCGAACACGTCAGCGTGTCGTGTTGACGTGG
+GTAATCTTCGAATGGCACACTAATGCCAGTAGCACCCCTATGCCTACTGTCGCCAGATCC
+TTTCGTTACATGAGCGTTGATCCTGGTAGGGCCGCTTCCCGCCTGGTGTTGGCGCACCAG
+GGCGACGGGGAGCGGTTCTTTGTTTCCGGGGTTCTTTGGAGGCCGCATGCCCAGTCTTGA
+CGCTCTGCGCGACGAGATCGACCGGGCCGTGACCGCGTATGTGGCGCAGTCCCGCGCGGA
+GGACGGCGACAGCCCCGGTTTGCCCGGTCCTTGGGTGGTGGCGGTGGGCTCCCAGTCGAT
+AGACGACGACGGCGAGACCATCCACACTATCGAGCCTGTGGGACAGCCCGGATGGGTCAC
+GAAAGGGCTTCTGCTGTCCACGCAGGAACTCTTGCGGGCCGAGTACCAGGAGCGCGAATG
+AGCGCCAGCCCGAACGGCATGGACGGGGATAGTGACGGCGGTAGGATCGGGGCATGAGCG
+ACACCACGGCCTTGCCGGTCAAGGGACGCACGCTGATCGTGGCAAATCTTCAAACCAAGA
+AGGCCCTGCAAATCGGGCTTGGACCGGAAGTGACTATCACCTCCACATTGAGAGTTCCCG
+ATGGTTTCGGGCCAAATGCTCCTGAACCGCGACAACTGCACATCGCCGTTGGGGGCGACT
+CTGAGGCGGTCAACTCCGCTCGGGCTGCTCTCTCGCCCGAAGAGGGCGACATGATCGCGG
+TGCAAGACAACACCGACGATTCCGTGCCAGCGTGGTTCGCGCTCTCTCGCGAGACGATCA
+CGCGGGCGGCGGACGGCCAAGCGCTTTGGAGCATTGAGGGCGTGAGCATGTACGACCTGC
+GGCGGGCAAGGGCATGAGCAAGCGGATAGCGCCGTCGAGGCCGGGGGTTGACTTCCTGAT
+CGACGGGGAGCTGCACAAGGTTCCCCGTTCTGCGATGCTTGAGCCTTATGGCGCAGCTCG
+GCTGCAAGACGGCTCGATGGTCTACAGGTTCATGGCCGAACGGCTCCCGCCAGGGCTCAC
+CGAAGCGGTGAAGAACTCGGCGCACGCGGTCAACATCCGAGAGCACGACGCCATCCGAGG
+GCACGGGACGCTCAGATACACCGAACCGCTGTGGGTGACAACTGTTGTCGAAGAACGCGG
+GGTCACCACGTTCAAGGCGGTGTTCACGCAGATTGAACGTCACATCCTCGGGTGGCCGAC
+CCGTGATTTGTGGGTTAGCGCCCAGGCGGCGCCTGTCAGTTGCAGACCGAGAGGCGGATG
+TAGCAGTCGGCGCGGCTTGTGGCCTCGCAGCCTTGTCGGGCCATTTCGCGCGCTCGGGAC
+GCGGAGCTGCTAGCCGCAAGCTCGTAGCCGCGCCTCCCGTTGACGCTGTCCCTGGTGAAC
+GCGATTGCGGCGCAACCCCTGAACGGGTATGTCCCGCACCGTGGCCCGCACTTGTCCTTG
+GCTGCGAGCATGGCGTAGTTTCCGCTGGAAGCGCCGGTGGCCGCAGTTGCGTTCCCCTGC
+CTGTCGTAGGCGATGGCGCCCCAACGCGCATGGTACGCGAAGGCCGGACTGGCGAAGCTG
+AATGAAGCGGCGAGGGCCACGAGGGCGGCGGTAAAGCGCATCATTGGGTTCTCCTAGGGT
+AAAGCCGAAGCTGAGATTTGTGTCCTCAATCACTTAGACGCACGGGATGCCCCCCAGGTT
+CCATTCGTCGGAAAATTTCAAGAACGGCGGCATGATCTCAACCTTATCGACGCGCTATCT
+CCCTGAGGGCTTAGCCGAGGAGTGACCGATGGGCGTCCCGCGCAGCACGACCAAGCGGGA
+TGCCGACCGCAAGACCATCGCCAGGGGCAAACCGCCGTGCGGTATCTGCGGCGGGGAGAT
+CGACTATGCCCTGCCGCACACCGACCCCGCCTCGTTCGTCGCCGACCACATCGTGCCCTT
+GAACAAGGGCGGCGCTGATGTGCTCGCGAACAAGCAGCCCGCGCACCGGGACTGCAACAG
+GGCCAAGAGCGACACCGCTGTCACCGACCTCAGACGGCGGTACGTCACAGAGAGAGCGTG
+GGCATGAACGAAACAGAGCCAAGGGCGACACTCACCGGACCCCCGACGACAAGCACCATC
+TTCTACCCCGCGAACAGCGAGCACCCCGCGTTCAAGATCGTCCTCGTAGAGCAAGCAGGG
+GCTTGGGAAGCCGAGAGCGTCGAAATCCTCGACAGGCATCCAGTCCAGGAGCCAGACTCA
+GGTACGTGACCGAGAGGGCATGGGCGTAGAGCGTCCGAGTGCCCACACGCCCACGACGAC
+AATAACAACCCGTCATCCCGGCGCAACGCCCTGACCTGGGGAAACAGAAAAATCCCTGGT
+GGAAACACCCACGGGGGATACCCCCCACGGTAGCCCTTCCGCACCTCGGCGGCATAGGCG
+GGTGCCCCCCCTTGGATTTTTCCCTTTGAAGGGAATAGAGCTTTGGCCCTTGGAAGGAGT
+CCGTCATGTCTCGTGGGAGCAGCCGGCATCAGGTGCTCGGGCCGGTCGCTCGGGCGGTGG
+AGACTGGCAGCGAGATCGACCGTTTGAACGCTTTGCAGGCGCGCTTGGCGGGGGCTATTG
+ATGACGAGGGGACGCCGCCTCGGGATTTGGCGGCGTTGACGCGCCGTTTGCAGGACGTGT
+CGGAGCGGTTGGACTCGTTGATGAGCGAGAAGGCCGAGCAGGTCGCGGCGATTGTGGAGG
+ATGAGCGGTGGGATGGCTCGGCTATCTGAGGTCGCGCGTCATCTGGTGGTCCCGGAGGGG
+ATCGTTTCGACGGAGTGGCCTCGGGTGCGGGCGAAGTGCTCGGAGCTGGGGTTGGGTTTC
+GATGAGTGGCAGGACGGGCTTGGCCGGTTGATGTTCTCGAAGCGCGAGGACGGTTTGTAC
+GCGTGCGACACGGTGGTGGTGTCGATTCCCCGGCAGGTCGGCAAGACGCATGTGATGATG
+TCGGCTTTGTTCGCGCTGTGTTTGCTGCGGGCGGGGTTGACGGTGTTGTGGACGGCGCAC
+CGGGTGAAGACGGCGAAGGAGACGTTCGGGTCGATGGCGGCTCTGGCGGCGCGGGATTCG
+GTGCGTCCGCTGGTGGCCCAGGTTGTTCGTGGCCGTGGCGACGAGGCCGTGTTGTTTGTG
+AACGGCTCAAGGATTTTGTTCGGTGCTCGTGAGGCGGGGTTCGGGCGCGGGTTCGCGGAT
+GTGGGCGTGTTGGCGTTCGATGAGGCGCAAATCCTCGGTGAGTCGGCGTTGGACGACATG
+TTGGCGTCGCAGAACGTGGCTGAGAACCCGTTGACGTTGTTCATGGGCACGCCGCCGCGT
+CCGAAAGATCCCGGCGAGGCGTTCACGATGTTCCGGCAGGAGGCGTTGGACGGGGAGTCC
+GAGGGCACGTTGTACGTGGAGCTGTCGGCGGATCGTGGTTGCGACGTGGAGGACCGGGAG
+CAGTGGCGCAAGGCGAATCCGAGCTATCCGCACCGCACATCGGAGCGGGCGATGCTCCGG
+TTGCGCAAAAACCTCTTGGAGGATTCGTTCCGGCGCGAGGCGCTTGGGGTGTGGGACGAG
+GTTTCCACGCATCAGGCGGTGGTGAAGGATTCTGTGTGGCGGGCTCTTCGGGCTGATGGC
+CCGGAGTCGTCGGTCAGGCCGCACGCCTTGGTGGTGGACATGTCCCATTCGCGGGAGGTC
+TCTGTGGGGGCGTGCTGGTTGGACGGGGATTGCGCGCATGTCGAGGAGGTGTGGGCGGGG
+GTGTCGGGCTCTGAGTGCGTGGAGTGGGTCGCGGCGAACGTGGGCCGGCGTGTGCCTGTG
+GGGGTGGATTCGGCTTCGCCGGCGTCGTCGCTCGTGCCCGAGCTTCGCCGTCGCGGCGTT
+CGGGTGGTGGTCACGAACGCGTCGGACATGGCCAAGGCGTTCGGGATGCTCATGGACCGG
+GTTGCGGCGGGTTCGCTCTCGCACGCGAACCAGGAGTCGGTGAATCAGGCGGTGGCGGGG
+GCGAGGCGTAGGCCGATCCGCGACGCGGGTGGCTACGGGCTGGACCGCAGGGACGAGACG
+GCGAACATCGCGCCGCTTGTCGCGGTGATGTTGTCGGTGCTGGTCGCGGTGACGCATGGC
+AGACGGAAGAGTGTTGTTTCGAGCGGTCGAGGGGGGTTCGTGCTGTGACTGTGTTCGCGG
+AGGCTCCTCGGGTGCGGGGTTTGACGGACGACGAGCAGCGGCTGTTGGGCCGCTTGTTCG
+ATGAGTTGACGCGGCGCGCTGGGCGCAACCAGTCCCGCTCGCGGCTGTACGAGGGCAAGT
+ACGCGGTGAAGCGGACGAGCACGATCCCACCGGAGTATTTCCGCATGGGGATTGTGCTGG
+GTTGGGCCGCGAAGGCCGTGGACATCCTGGCGCGGCGTTGCAACCTGGACGGGTTCACAT
+GGGCGGACGGGGATCTTGAGTCGTTGGGGTCGCGCGAGGTGTGGTCGGAGAACCTGTTGG
+GCACCGAGTCGGACTCGGGCGTGGTGTCCTCGCTGATCCACGGCCCAGCGTTCCTTGTGA
+ACACCGCAGGGGAGGCGTGGGAGCCGAAGGCGTTGATCCATGTCAAGGACGCGCTCAACG
+CGGTGGGCGACTGGAACCCCCGCGCGAGGCGTTTGGAGAACCTGTTGTCGATCACGGATC
+GCGACGAAGAGGACCGGGTGACCGGGTTCGCGCTGTACATGGACGGGTTGACGGTTTCCG
+CCGCGCGGGACTCCTCGGGCTGGGCTGTGGAGCGCTCCGACCACAAGTTCGGGGTGCCCG
+CAGAGCCGCTGGTGTACAAGCCGCGCGCGGGTCGCCCGTTCGGCTCGTCGCGGATCAACC
+GGGCGGTGATCGCGCTTTTGGAGCAGGCCACGCGCGTGGCGATCCGCATGGAGGCGCACG
+CGGACACGTTCTCCTTCCCGGAGTTCTGGATGTTCGGGGCGACCCTCGCGGATCTGGCGG
+GGGGCGAGAAGAACCCGAACCCGTGGCGGGTTCGCATGGGCCGCATCAAAGGCTTGCCCG
+ACGACGAGGAGACCGGGGTGCGCGCGGAGGTGCATCAGTTCCCCGCCGCTTCGCCGCAGC
+CGCATGTGGACATGTTCGAGCACATCGCGGGGCAGTTCGCGGGGGAGACGTCGATCCCGG
+TGGAGTCGCTGGGGTTGGTGAACCGCGCGAACCCGACGTCCGCCGAGTCGTATATCGCCT
+CTCGTGAGGATTTGATCGCGGAGGCCGAGGGCGCCACCGACGATTGGTCCCCGGCGTTCC
+AACGCTCCTTCACCCGGGCGTTGGCGATCAGGAACGGCTTGGACTCGGTGCCCGCCGAGT
+GGGTCACGATAGCCCCGAAGTGGCGTTCGCCCATTCACTTGTCGCGGGCCGCGCAGGCGG
+ACGCGGGCTCCAAGCAGCTCGCGGCGGCGCCGTGGCTCGCTGACACCGAGGTCGGCCTCG
+GGCTGTTGGGGCTCGATGAGCAGCAGATCCGGTTGGCGCTCTCGCAGCGCCGCCGCGCGC
+AGGGCTCGCAGGCCCTCGCTGCGCTCACCGCTCGGGCCAGAGGGACCGCTGATGCCGCTG
+GCGAGTGACGCCGAGCAGATGCGCGCCTCCCTGGTGGGGTTGTCGGGCATGTTGGAGGAC
+GAGGCGCGCTCGCTCGCGGCGGATGACTCGGGATCTCTGGCGGGGTCGGCGGCGAAGGCG
+TGGATCGGCTCGCGTCTGGCTGTGGGGATCGGCGGCTTGATCGAGGAGTACGCGGGCGCG
+GCGCAGGCGGTCGCGGCTGACTTCTACGACCTCGCTCGGGGGGCGCTCGCTTTGCCGGGT
+CGGTTCACGGCGTTTGTGCCCGATCCGGGGACGTTCGGCCCGGACGCGCTGACAGGTTGG
+GCCGCGTCGGAGGCGACGAGCTTCACGGCGTTCGAGTCTCTGGTCGTCGGCGGGGCGAGC
+AGGCGCGTGATGAATGCCGCGCGGGACACGACGATGGCGAACGCTTTGGCGGACCCGCAG
+TGCCGGGGCTGGATGCGCATCGGGGCGGGGGAGTGCGATTTCTGCCGGATGCTCATCGCC
+CGTGGGGACGTGTACACGAGCGAGTCCGTGCGGTTCAAGTCGCACGACCACTGCAAATGC
+CAAGCGGCCCCTGTGTGGGACGAGAGCAATGTCGTGGAGCTGCGCGAGAAGTACGTGCCC
+AGCGCCCGGTTCAAGACCGAGGCAGCGCGGCGGCGCAACAACGAGGCCGTGAGGGCGTAC
+CTCTCGGCCCAGTAGAGACCATCCCTGCCGCAACGGCGGGGACCGACCCGGAACGGGGAA
+TGAATCATGTCCGAACCCATTGTCGAAGCGGCAGAGGCGCCCGAAACGGAAGCCGATGAG
+CCCAAGCCCAAGCAGACGGAGACGGTCGATTTCTGGAAGTCCAAGGCGCGTGATTGGGAG
+TCGAAAGCCAAGTCGAACAAGTCGGCGGCAGACGAACTCGCAGCGCTCAAGGACTCGCAG
+AAGACCGAGGCGGAACGAGCGGCAGAGAAGTTGGCGAACGCCGAGGCCGAGGCCGCGACG
+GTCCCGGTCAAGGTCGCCGGGGCGCTCAAGGCGCACCTGGTGGCGTTGCACGGGATCAGC
+GACGAGGACGCGGAGCTGTTTTTGACCGCGCAAGACCCGGAACTTTTGCTCAAGCAGGCC
+GCTCGTCTCGTCGGGAACCAGTCGGGCGTGAAAGGCAACAAGGTGCCCCATGAGGGCGCG
+AACCCCCGGCCCAAGCCGAACTCCACGAGCGAGTTCCTTGGCGCTTTGACCGGGGCCGGT
+TAACCACACAGATTAGGGAGAACAAAATCATGGCAGCATTGCAGAGCACGGACCTGTTCC
+TGCCCACGCAGATCGCGGACGGCATCGTGGAGCGGGCGAAGACAGGTTCGACGGTCGCGG
+CTTTGTCCGCTCAGGAGCCGATGCGTTTCGGCAAGGTCGAGATCATCACTTTCGATGACG
+ATTTGACCGCCGAGTTCGTTGAGGAGTCCGCCCCGAAGGGCGCGGATTCCGCGAAGCCGT
+CGCATGTGACGGCTGTTCCGCACAAAGCGGTCGTGCAGATGCGGACCTCCGACGAGTTCA
+AGTGGGCGGACGAGGACTACCAGCTGGGCGTCCTCGGCAAGTACCAGGAGAAATGCGCGC
+GGGCTCTGGCCCGAGGCTTGGACCTCGGTTTGTACTACCGGACCAACCCGCGCACCGGCA
+ACGCGCTCACGGCGTGGACGAACTATTTGAACGCGACGACCAAGCGCGTGGAGATCACCG
+CTTCCTCGCAGCCGGACATCGACTTCGAGACCGCCGCTGGTCTGGTGATCGGGGACGGTC
+ACAGCGTCAACGGCGTGGCGTTCGACCCCAAGCACGCTTGGAAGCTCTCCACGGCGCGTT
+ACGCGGACGGGCGCAAGAAGTACCCGGAGCTGGGGCTTGGCGCGAACCTCTCCTCGTTCG
+AGGGCGTGACCGCCGCTGTGTCTTCGACGGTCTCGGGCAAGGCGAAGGACGGGGACGCGA
+CGGACAACAAGGTTCGGGCGATCCTCGGGAACTTCCAGTCGGGCATTCGTTGGGGCGTGC
+AGCGCAATTTCCCGTTCAAGATGCTTGAGTACGGCGACCCGGACAACACCGGGAAGGATT
+TGGCGGGCAACAACGAGATCTTGTTCCGAACGGAGATCGTGTACGGCTGGTACGTCTTCA
+CCGACCAGTTCGCCGTGATCGAGGACGCGGCTGCCTGATGCCGCGTCTTAGGAATCGGGC
+GAGCGGGGCGGTCGTCAACGTCGATGACCGTCTCGCCTCCCGGCTCGGCCCGGACTGGGA
+GCCAGCCGGCGACGGCGGGGCCGACACCACGTCGCGCCCTCGGCGCAGAACGCGAGGGGC
+GCATGCCAGCGGTGACGATAACCCCAGCTGATCTCGCGCCGTTCGCGGTGATCGAGGAGC
+CGAAGGCTTTGGCGATGATCGCGGACGCGCTGGCGATGGCGCGGTTGGTCGCTCCCTGTG
+TTGACAAGGACGATTTCCCGTTCGCGGACGCCGCCAAGGCGGTGATCCGTGGCGCGATCC
+TGCGGTGGGAGGAGTCCGGCTCCGGTGCGATCTCGCAGCAGACGGCGGGGCCGTTCGGGC
+AGACGCTCGACACCCGATCCCCGCGCCGGGGCATGTTCTTGCCCAGCGAGATCGAGCAGT
+TGCAGAAGATGTGCCGCAACGCTTCAAGCTCGGGGGCTTTCTCCATCGACACGGCCCCGA
+ACGGGGGCGGGGTGTGGCACGACGACGCGTGCAACCTCGCGTTCGGCGCTTCGTGGTGCT
+CGTGCGGGGCGAACCTCACCGGCGACGGCCCGCTGTGGGGCACGGCGTGAGCCTCCCGCA
+GCCGCACACGGTCCAGCACCGCCGCAAGACCAAGGGCGGGTACGACGATCAGGGGTACCA
+GATCGAGCCGGGTTTCTCGGAGCCGGTGGAGCGCCGCGTGATCGCGGTGTATTGGGAGCG
+GCCCGCCGAGGCGGTGGTGGGGGACTCCCCGGAGCGGGACCGCGACGAGCTGGTGGTTCT
+CACCGGCGAACCGGAGGCGTATGGGGACGGGGATCTCATCGAGGCCGCTGGTTTGCAGTA
+CAGGGTGATCGGGCCGCGCGATTGGCGTATGGGGCCGTTCGGGTTCAAACCGGGCGGGGA
+GGTGCGGTGCGTGCGGAGGGACGGGTGAATGGGGCGCATCGACTGGAACCGGGAAGGGTT
+TCGGGAGCTGCGCAAAGACCCCGCTCTCGTCGCCCATTTGAAGACGATTGCCGAGGACGC
+GAAGCGCGACCTTGACGCGGAGCTGCATGGGGCGCAAACCAATCGCGGGCAGCGGGAAGC
+GTCCGGTTACCGCGCCGACGTGGCCGTGGGCCGCACGCGCGCACGGGGGTATGTCGGCAC
+GGAGACGGCTCGGGCGATGGCCCACGAGCAGGCCCACGACTCGCTTTTGAAGTGGGCGTT
+CCGCAACGGCGGTCAGTCTCCGAAGAGGAAGGGTTGAGCTGTGGCGGTCTATCGGCCTCC
+GGTGGCGGGCGAGGTCCGCGCCCATCTCGCGCGGGGGCTCTCGGCTCGCGGCGCCTCGTT
+CGGGTGGTTCTCATCGAACCCGAATCCGAGGCCGACCGATGGGCGGTGGGGCGTGTGCTC
+GCAGATCGAGTTGCGGGACGTGCAGCGCGTGGAGTCCGAGTCGCTGTTGCGGCTGGTGGT
+GATCGACCCGGACGAGCGGCGCGGGGAGCGCTCGGCGTCGTTGGCGCTGGCGCTCATCGA
+GGCGGCGCACCGCACGGCGGCGTTCAGCTTCCACGAGCTTTACAGCGGGCCGGCCCGCTA
+CCAAGACCCTGACGACCCGAGGGTGTTCGGGCACGTCATGAGGCTTTCCGTCACCAGGGC
+GGGCGAGCCGTTCGCGTGAGACGCGCGGGCGGGTGCAACACAGGAAGGAAATCGAGATGA
+CCAACCCAACGACCCCGGCGACGGGGAAGGATTATTTCGGGTACGGGGACGTGCGGAACA
+TTTTCAAGCCGCAACCGGACTCGGAGAAGACCGTGGGCGGCCTGTTCGTCGGCCCCAAGT
+TCATCGACGTCGCGGAGGCGCTGGACTTGGACGCCCCGGTGCTCGAATCGCTCAAGCAGG
+CCGGGTATTTGACCGTGGAGGGCATCCGCGTCAAGCAGGACCGGCCCGGCAAGGCCATCA
+ACGCGTTCGGCGGCGACGAGCTGGACTACGGGCAGACCTCGTTCTCCCTGACGGTGGCGT
+TCGACGTGTTGGAGTACTTCAACGACGACGCGCAGCGCCTCGCGTACGGCAAGAACAACG
+TGACGGTGACCCCGGCGACCACGAGCCACGGCAAGCGCACCCTCACGAAGATCACCGCGA
+AGCAGTTGGACGAGGTGTCTTTGTTCATCCTCTTGGTGCAGGGCGACAAGCAGGCCCGCT
+ACCTCGCCCCGTTCGCGCGGGTGACGGAGGTGGGCGAGGAGAAGCACGTCCACGACGAGC
+TGGTGTCCACGCCGCTCACCGCGCGCTGCTTCCCGTACCAGGGGGCGGTGTTGCACCGCA
+ACGTGGACGACGGCATGAAGCTGCCCGCAGGGTTGGCCGCGTGAGCGCCGCGAAGGGCAG
+GGGCGCCAAGGCCGAGAAGCCCGCCCCTGTCCCCGGCGACCTGGATTTCGACTGGTCGAA
+GGTGTACCCGGAGGGCGAGCTGTTCGAGTACGAGTCGGGCGGGGTCAAGGTGGTGATCCC
+GGTCTTCGAGAAGTTCAGCGCCGACTGGTACCGCCGCAACCGGCGCCTGTCGAACGAGGA
+GAGGTTCTACCTGCATTTGGAGCGCTCCGCGAAACCGGAGACGTTCGAGGCGGCGGACCG
+GCTCAGCCACGACGGGTACGCCGCGTGGTTGACCGCCTGGGGCGAAGAAATGATGTCCCA
+ACTGGGAAAATAGCGTGGGCGGTGGAAACGCTGCACCGGCATCCCTTCGCGGCCCGACGC
+GACCTGCTCGCGCTCGGGCTGCGATGGGAGAACCTGTGGGACGGCACTCTCGACGTCCTC
+GACGTCGCCGCGCTCGCCGTCGCCGCCCCGCCTCATTCCGCTTTGTTCCACGCGCTCACG
+GAGGGCTGGGACGTGAACGCGCATTTGACGGCGGATCTCGTCTACCTCTCCGAGCTGGGG
+CTGTGGGCGCGCACCAAGGACGCGCAATCCGATTTCCCGCGCCACAAGCCCCAACCCGTC
+CCGCGCCCCGGCGCGGCGCGCGAGCACGGCCCGACGCAGGCCGATTTCGAGAATTTCCAC
+GACGCTGTAGACAGGAGGGCTCGCGGTGGCGACCAATCTCTCTGACGTCTATGTGACCAT
+CATCCCGGAGACCCGCCGCGTCGGGGAAGCGATCCGGGCGGCGTTTCGGGACGCGGAGCG
+CGAGGCCAAGCTCTCCTCCGAGCGCATGGGCCGCGACTTGGACCGCGAACTCGGGGACGT
+GCATGTCACGGTGAAGGTCGGCGCGGACACAAAGCGCGCCAGGCGCGAGGTGGACGAGCT
+CAAGACGCACGGGCAGCGCGCCGGGGAGGCGATGGGCACCGCCACCGGGCTCGCGTTCGG
+GAAAATGTTCTCGGCGCAACTGGGCTTGGTGAAGTTCGCGTCCCTCGGCGCGGCAGGGGG
+CCTCGCTTTGTCGGGCCTCGGCGGCTCCCTCGCCTCTATCGTCGGGGTCGCCTCCCGCGC
+ATCGGGGGCGTTGGCGCTGGTGCCCGCCGCCGCGATGGGCGCCGCGGCCTCGGTGTCGGC
+GCTCAAGCTGGGGGTGTCGGGGCTGTCGGACGCGTTCAAGGCGATGGAAGACCCGCAGAA
+GTTCGCGAACGCCTTGCAGAAGCTCTCCCCGGCCGCGCAAGAGTCCGCCAAGGCCGTGTA
+CGCCCTCAAACCGGCGTTCGACAGCATGAAGAACACGGTGCAGGACTCGCTGTTCGCCGG
+TCTCGCCCCGCAAATCACCCAACTCGGGCGGACGTATCTGCCAGTGGTGCAGCAGGGGTT
+CGCGGGCGTGGCGGGGGCGGCGAACCAGGCGGGCAAGTCCGTGGCGGCGTGGGCGCAGAC
+CCCTGAGGCGGTGGGGCAGGTCAACAAGCTTTTGGGCAACACCACGGCGGGCATGAACAT
+CCTCGCGACCGCCGCGCGCCCAGCGGTTCAGGCGGTGCTGGGGCTCGGGGCCGCTGGCTC
+GGACTCCCTCCCGCGCCTCTCCCAGGCCGTCGCGGACGTGTCGAACAGGTTCGCGGGGTT
+CGTGAAAAACGCCTCGGAGTCGGGCCGGATCACCGAGTGGATCGACGCCGGGCTGACCTC
+GCTCACCCAATTGGGGCACGCCATCGGCGCGGTCGGCTCGGTGTTCGCCACCGTGTTCAA
+AGCGGGCTCGGCTGTGGGCGGCGGCATGCTCGGGACGATCACGCAGGTTGCCGACAAGTT
+CAACGACTTCCTCAAGAGCGCGGACGGGCAAGCAGCCCTGTCGGGGTTCTTCACCGGCAT
+CAGCCAAGCCGCAGCGGCGCTCGCCCCGATCCTCGGCACGCTCGCGCAGATCGTCGGCAC
+GACCATCGTCCCGGCCCTGTCGAATTTGGGCACCGCTGTGGCGCCCGCCCTGAACGGCAT
+GCTGCAAGGCCTCGGGGCGGGGTTGAACGCGATCAAACCGGTGTTCGAGCAACTGTCGGG
+GCCGCTCTCGCAGATCGGGCAGGTCATCGGGGACGTGCTGGCGAAGACCCTCCCGATCCT
+CGCCCCGGCGCTGGTGCCGCTCGCGCAGGCGTTCGCGGACCTGCTCTCCGCTATCGCGCC
+GCTGATCCCGCCGATAGCGCAGCTCGCGTCCATGTTCGTCCAGGCCGTCGCGCCCGCGCT
+CTCTGTAGTCTTCCAAGCCCTCGCCCCGGTCATACAGCAGCTCATGGACGCGCTCAAGCC
+GGTCCTCGACCAGCTCGGCCCCGTCCTCGCGCAGGTGGCGCAGACGCTCGCGGGACTTTT
+GGTGCAGGCGATCCAGGAGCTTCTGCCGCCGCTGATGCCGTTGGTGAAGTCGTTCGCGGA
+CTTCTTGGCGGCGGTCCTGCCGCTGCTGCCCGCCGTGGTGAAGGTCGCCGCCGTCATCGC
+GGGCGCGCTGGTCAAGGCGATGGCCGCGACCCTGCCGCTCGCGGTTTCGGTGGTCAAGGC
+GATGGTGGACTTCTCCACGAAGATCGCGAACTTCGTGGTGCCGTGGGTGAGCAAGCTCGC
+GGACGGCTTCGGGTGGCTCGGGGACAAGGTCAAATCCCTCATCGGCTGGTTCAGCGGCGT
+GAAGGACGCGGCGGGCGAGGCCTCGGGCTCGGTGAGCTCGTTCGCGTCCGCCACGCCCGC
+GCCTTTCGCGTTCCCGCAGACAAGCGGCGGGGTTCCGGGAGGCGGGGAGCCTTCCGCGCT
+CGCGAACCGCCTGCGCCGTTCGGCCGGAACGCCGGAGGGCATGGACCGCGCGGAGGCGGG
+GCGGTTGGGCCAGTCGCTCGCGGCATCGGCCACACCCGACGCCAACGGGTCGCTGCTGGC
+CGACGCTTCGCGCCTGCTGGCGGACTACGCGACAGGGAAGGGCGATCAGGACGCGGTGGC
+GCGGGCTGCGGAACTCATCGACCAGGCGTCCAAGGGCGGGGCGTATGTACCCGACTCGGA
+CCCGCCGCCTCCTGCCGTCCCGCTGCCGCCTGTTCCGGCGCCGCTGCCGGTCCCTGCCGC
+CCCGGTCCTGCCTGCGCCGTCAGCGGGCAAGGGCGGCAAAGCGCCCGCGCTGGCGCCGAT
+CACGATGGCGGATTTGGACAAGTACGACACGCCGGGGTTGGAGACCGGCGCCCCTGTGAC
+CGTGGCGCCGGGTTCCCCGGCCCGCGCGGAACAGAGCGTGCCCGCGACGATGGGCGTGGA
+CGTGTACACCGGCATGGGGCAGACCGGGGGCGGCTCGGGCGCTCAGCAGGGAATCGACTT
+CGCGCACTCCATGACCGGCACCGCGTACTCGCAGCAGGTGTTCGGGCGGATCGGCATCGA
+CTGCTCGGGGATGGTGTCCGCGACGGTGAACGCCGCAGAAGGCAAAGACCCGTTCTCCTC
+GCGCATGTCCACCGTCAACGAGGGCGAATGGCTCAAGGCGCACGGCGCGGTGGAGGGGAT
+GGGCGGTCCTGGGGATCTGAGCATCGGATGGTGGAACAAAGGCTCCTCTGGCGGCAACAA
+CGGGCACACGGCGTTGACGCTCCCGAACGGGGAGAACGTGGAGTCCGGGGGCAGCCACGG
+CGTCGTTGCCGTGGGGGCGGGCGCGGCCGGTGCGGGCGACAAGCAGTTCGACCATCACAT
+GCACATCCCGAAGGAGCTGTTGGGCTCCGTGCCCACCGCTGCGGGCTACGCGCCCGCGCT
+CTCGGGCGCTTCGGGGGATTGGCGCTCGCGCACCGCCGACCGCGCGGTGCAGAACGCGCA
+GGACTCGGTGAAAGACCACCAGTGGCGCGTGGACCAGGCCAAGCGGCGCATGATCGAGGC
+GAAGACGCAGCAGCAGCGCGACATGGCGGAGCACGCCCTGATCGTCGCGGAGCGCGAGCT
+GGCGAAGTCGCACGAGAAGCTGCGGGACGCGCAGGACAAGCGCGCGGAGACGATGGCGAA
+GGCGCGGCAGAAGGGGCAGCGGGGCGGTTCGGACGGCGCGGAGGACTTCGGGCACTCCCT
+GGTCTCGGGGGCGCTCTCCGGGCTCGGTTTGGACGGCTCGCTCTTGGACAACCCGTTGGA
+GTGGTCCGGGGTGAAGTGGCTCACGTCGATGGTGAACGGTTTCACCAAGCCCGCGCAGGG
+CCAGCAGGGCCGCTACGGCTCGGACGGGGCCGCTCTGCCCGGTTTCGGGCCCCCCGCGTC
+CGACCCCGCCCAACTCGCCTCGCTCGGCGCGCAGGGCCTCTCGCAAGGCTTCGGCGCCGA
+TTCCGGCTCGCAGCCCTCCCCGGCCCAGGTGGACCAGTCGATCAACCTCACGGGCCAGTT
+CGGCAACCCGAACGACACGGCGCGGGCGATGCGCGCGGAGATGGACAACCGCAACCGGGC
+GTTCTCCATGAACGCGGGGAGGATGTGATGGCCTACCAGCGCACGGACATGACGCAGTAC
+CCGAGCCAGCACCCGGACCTGCGGACCCCGCAAGGGGACTACCCGCCGTTCGGGCGCCCG
+CTCACCGAGTACTTCCAAAGCTGGGAGAACGTCCCGCCCGTGCTGCGCTCGGACCAGCTC
+ACCGTGATCTACGTCGGTGTGCCCGACGAGCGCGGGGTGCGGGCGATGTGGCATTTGGCG
+GGGCCGCGCCGGGGCTTGGAGGGCGTCGCTTTGGCGACGGACCTCTCCGGGCTGGTCATG
+CCCGAGTTCGAGCGCGCGTGGCACGAGTCGGCGTGGATGACCGGCGCCGTGCCGGGGCAT
+TTGTCGTGGCCCAAGCGGCTCTTGAACCTCGGCGTGCATATCAGCGCGCCGCGCCTGCCG
+AGGACGATTCTGGCGGCGGACGGGCGCCTGGAGCGGCTGGTGGCGTCGAGCAGCGCTGAC
+CGCTACCGGTTGACGCACCAGTTGTGGTGGAACTCGTTCTCGATGGACGCGGACGGCGAC
+CTTTTGTGCTTCACCCGCACGACGGGCTTCCGCAATCTCAAGGTCCGTCTCGCGAAAGCC
+CCTGCCGGGACGTTGGAGACGGACCCCGCCGCGTTCGGCAACAACCGGATCACCGTGGAT
+CTGCCCTTGGTCGCCTCGGACCCGTTCTTCGCTTCGCCCGCCTCGATGGGGACGTGGCGC
+AACAACGAGGACACCGCCACGCCGCTGGACGCGTTGGAAGAATTGGTGCGAAAGGTGATC
+CCGGACGCGGACTTCACGTTCGCGAAGACCGCGCTGGCTCTGGTCGCGGAGGCGCTGGGC
+AACCTGATACCGGGCATCGACGTGGGGCAGGGGCATATCGCGGTTCGCAACGACGGCGAC
+GTGCCGGCGTGGCCCGAATACGTGATCCACTCCGGGTCCGGGGGGTTCTGCTGGCTCCCG
+GACGGGGACCGGATGGTGATGCTGCCGAGGCTGTTGCCCACGGACGGGAAAGTGCTCGTG
+TCCACCGACCCCTCCAAGAAGACCTTCACCGCTGAGAACGAGCCGGTGGACATCGGGTTC
+TTGGGCGTGGTGGCCCGCTCGCAGTTGTTGGACCTGGTGCTCAAACCGTTCTTGGAGGCC
+ACGGAGCCGTTGTGGCGGCGCGGCGCGGAAGTGTTTTTCACCAAACCGATCCCCCCGAAG
+ACCACCGTGCAATTGCCGGTGCGGCACTCCAACGAGAACGCCGTCATCACCGCCCGCGTC
+CCGCAACGCCACTACGGGCCGGGGATCTGATGCCGTCCTGGGCCGTCTCCCCGGAGTCTC
+TGGCCTCCACGGCGCTCTCCGTGATGACCACGCTGGTGGTGGGACCGGAGGACGACGGGG
+CTCCCCGCTGCGATTATTTGAAGCTCTCGGCGCGCAGGGACGCGCGCCTGGCGCAGCTCT
+CGCAGGCGCCGATGGTGCGGATTTGGGACCACCAAATGCGTCTTGTGGGGCAGGTGCAGG
+TGGAGTCCTTGAGCGCGGACGAGCTGCTGCGCGACACCGGGACGTGCCAGTTCCGGTTCC
+CGTTGGACTCGCATGTGGCGCGGTGGCTTCGCAACGGTCGCCGCCCGGACTCGGACGTGC
+ATGTGACCATCGACCCGATTCCCACGGAGCGGACGTGGCGGGACCGTTGGGGCGGCAAGG
+CGTCCTTGGTGTCGTTCATTCGCGCCGAGGACGGGCGGGAGTGGTGCGAGGTGAAAGCCG
+CGCACCACTTCGAACATTTGAAACATATTATCTATAGGAATAATCCAATTACCCCACCGG
+AGGCGCAGGGGGTCAGGTTTTGGCTTCTGCCTGGGCCGACCCGGAGCGTCGTGTACTGGA
+CGACGCTGCTGGCATTGGCGCAACAGTTTTTTCCGCCCCTGACCTTGGTGGACTCGTTCG
+CGGACCCGCTGCGGTGGGCGACGATCAACCCCCTGGATCTCTCCCCGTTGAACTGGCCGG
+TGCAGCCGCAGTTCGTCAACCCCTTGCTGGATCAGTCGATGTTCACGGTGCTGACCGCCT
+CGTTCCAGAACGCGCACGCCGCCACCGCCGATGTGCTCAAGGCGTCGGGCTGCCACATCC
+GCGCCTACACCTGGCTCCCCGAGGACAAGGACTCCCCGCACCCGGAGCTGGAGGCGCTGA
+TCGGACCCTTGGCGCGCCCGTCCCGCGCGTGCGTGGTGCTGGCCTGCGAGGATTTGTCCG
+GGGTGACGGGGCCGACCGGGACGATATTTGACTCGGTGCTCTCCTTCGGCGCGAAGCTCT
+TGGACGACTCGTTGACCGAGGTGCTGCTGCCGCTGGATCTGGACGGGGACGGGCGCACGG
+ACCCGTTCTTCCGCGCGCTCACCCTCACCGCGCCCGCTCGCCCGAAGGTGGTGTTCCGCG
+ACGGCGACCAGACGGGGGTGATCGAGTCCAGCTATTCGCACGCCCCCGCGACCGCGCACA
+CCGTCTCGACTGGGAAGGGCTCGCCGCCGCTGCTGAACGACGGGATTTCGTTCGGGGTCA
+AATATGGCTTGAGCCGTTTGCAGGATCTTTTGCAGGGCGGGCAGCTCGGCGGCACCTGGC
+AGGTGCCCGGCACACCGGGTTTGGACGAGCTGTACCAGGGCCAGCTGAGCAACCGTTTTT
+TGACGCACAAGGCGTGGACGGACGCTCTGCGGGCGTTGCGCTCGGGGGACTACGCCTACA
+TCGCCGCGCACGAGCAGTCCGCGGTCGGGTACAGCGTGGCGGGGGCCTTGGCGATCCAGT
+CCGGTCTGCACAAGAACCGGCCCCGCACCACCAAGCACGTCCGCGTCCGCAACGGCGCCC
+CGCACTGGGTGGGCCGGGACTACACGCTGGGCACGCGCGTGCTGCACGAGCACGGCGGGG
+TGCTGTTCGCGGACCAGACCGGCGCGTTGGGCATCCGCATGGACCCGGACGGGCTGGTGA
+CCAGGCCGGTGCAGATCGGGGAGGACGACGACGAGGAGAACCCCGTGGCGTCGGCGTTGC
+GGGCGGTGCAAGGGATTTGGGGCGCCATCGGGGCGTTCGGCGGCGCGGACGGGGGCATTT
+AGTGGACGACGAGGAAGAGGTCAAGGCGCTTGAGGCCGCGTGCCGCGCGGTGCCGCTGGC
+GTCGGGGGCGGTGCTGGATCTGCGGCTGTTCGCGAAAGAGATAGCCGAGCATCTGTTCGC
+GGAGGGCTGCCGCAAGAGAGCCGAGCGGGTGGAGCGGGAGTTCCCGGAACGGTTCCTCGC
+GGTCCCGGACAAGTTGTTGGGCGGCTGGTCGCAGCCGTGCGAAGTGGTGGACAAGAGATC
+GGAGGAACGCTGATGGCCGATGTGCCGCAGCCGGGGGACAAGGTGTATATGTTCTCGGCG
+GACGCGAGGATGGACTTCCAGGGGATCGTGCTCGACCCGGACGTGCCGTTGAACATGGCC
+GCGACCATGCAGATGGTCGGCATGAACGGGGTGGTGACCTTCCCGGTGCTGGTGGGGCGG
+CAAGGCCCGCCCGGGGTGGACCGCCCGATCATCAAATTGATCTACGACCCGCAGATAGAC
+GACGCCTCGAAGCTGCCGCAGCTGACGAACACCCCCGAGGACGTGCAGAAGGGGTATGTC
+ATCGGTTCGCTCTGCCACTGGTGGGACGGGCGGCAGTGGCGGGGAATCCAACTGGGCGTG
+CCGGGGCCAAGTGGCCCGGTGCCGATCATCTCGTGGTCGGTGGTCTTGTTGGACCCGGAC
+GGCTCCGAGGAGTCGAACGTGAAGGTCACGGGCTCGGACGCGGCTCCGGGGGTCCAGTTG
+CGCCTCAAGGTGCCCAAGGGTCCGAAAGGCGATTCGGGGAGCATCCGCCTTGCGAGCGAC
+TACGACGACGCGACGCCGCCCGCTGTCGGGGACCTGCTCACGTGGACCCCGGAGAAGAAA
+TGGGCGCCGCGATCTTTGGGCAAGGAGGACGTGGCCTATTACACGGTGCCGCAGAGCCAG
+TTCAAGGCGCAATCGCTGGTGGTGGGCGCGAACGTCCCGGTCGGGTCGTTCACGATCCCC
+AAGCAGTCCTTCGACTGGAAGCCGTGGGTGTCGGGGTGCGTGAAGATCACCGGGGCGGAA
+CTGGACTTGGACCCGTTCTCCTCGCGCATCGAGGTCCGCAAGGACTCGATGGACGGCCCG
+TTGTGCGCGGTGGGGTTCGGGACGCCCACGACGATGACCGTGGTGTCGCCGCATTTCTCC
+TCGCCGGGCAACAAGACGGCGGCGGTGAACGCGAACAACGACGCGATGCGCTGCGAGGCG
+GGCAAAGACGCGGTGTTCCACGTCGTGATCGCGATGGATCAGGGCATCGGCGGGGTGTAC
+TCGTACAACCCGGACTGGACGGAGTTCCATGTCGAGTGCAAGCGGGTGAACTAGGGTGCC
+GCGCGCGCATCAGACGGCCCCGGTGGAGATCGACAAGAACCCGGAGCACCGGCTGGGGGT
+GAACGCCCACAAAGACCCTGTCGATTTGCAGAAGATCGCGCAAATGCAAGTCCAAGGCTT
+GCTGAACGCGATCAAGCTGTTCACCGGGCTCGACCTCGCGGACCCCGGCAAGCTGTTGGA
+GTCCGTCGTCAGCGGCGCGGCGGGGTTCGCGGGCGCGGTCCTGAACGCTTTGACTTCGGC
+GCTCGGCTTCGATTTGTCGGCCAAGCTCCGCGAGTTCGAGCAGGCGCTTGAGGAAGTGCC
+GGTGCTCGGGGACATCGTGAAGGCCCTCACGGGCAAGGCCGGGGGCGCGGGGGATTTGGA
+GGCGTGGGCGCAGTCGTTGCCCGCGCAAGCGGAGCAGGCCGCGCACGACGCGATAGCGCA
+GGTGAACACGCTCGTGGGGGAGTTGGCGCACGGCGCGGAGACGGTCGGGCAGACCCTCGC
+GGACACCATCGGGTCGGTGGTGGACCTGCTCGCGGGCACGCACCAGCAGACCCAGGACAA
+CACGGCCGCGATCACGGCTTTGTCAACTATCGCCCCGACGAACGTGGTCACCAGTTTGGC
+GTCTTCGACGGACCCGAACGACATCCCCGCCTTCGACCGGATCCTGATGGTCCCCATCGC
+GGCGACGGCCTCGGCGGGGGCGCACACCCACACGTACAGCAGCGGCGGCACGGGCCAAGG
+CACCACCTCCACGGCGGGGGCGCACACGCACGCCATCGGCTCCGACGCGTGGGGGTACGC
+CCCGGAGGACAAGGAGCTGGTGCTGGTCTTCATCCGCTCCGACCGCAAACAATCGGTGAA
+CGCGGTCAAGGTCATCACCGCCGTGACGGGCTGGTCCCTCGGCGGCGTGAGCACCGTGCA
+GTTGAGCCTGCACGCCTACAGCCAGCCCGACGCGGCCCTGAAACTGTTGGCGACCACCAG
+CAACCAGAAAGACGTCATCACCACCGCCGCGCAGGAGTACGCCATCGGGCTCGGCAGCAC
+CTTCGACGTGCTCCCCGGCCACGTCCTCGCGATCGGCGTGTGGCAGCAGGTCAACCTCTT
+CGGGGCCACGCGCAAGCTCGCCGGCATCCCGCAAGTGGGGGTCAAGCCCCGCACCGGGGC
+GCCGGTCAAAACGATCCTCGGCAAGATCACCGGGCAGTCGTCCATCCCGGCAACGATCAA
+GCTCTCCGACGTCGCGTGGAACTACAACGCCGCCGTGTGGGGGGCCTTGACGCTCGCCTG
+AGCGTGTGCGGCTCGCGCCGCAGACGGGCAATCGCCGCATCGCGGCGCGGAAGGAGAAAA
+AGATTATGACGGATCCGTATGGGCTGCCGGTCGGCTCGGACGTGCGCCAGGGCGCGCGGG
+GGTTCCCCGAATGGGTGTACGCGCTCGGCGCGGCGTTCGGTTTGGACGCCTCCACGTATC
+CGGGGCACCAGGAGCGCGCGGGCCTCAACCAGGGGATCGACTGGTGGCCGAAAGGCAGAG
+CGGACATGACGGGGGCCTCCTACACCCCGGCGCAGCGTTTGGCGTTGGGGCGGTTCGCCC
+TGTGGGCCGGGACTCAGCCGGGGGTGGAGCAGGTGATTTGGTGCGACCCGGTTTCCGGGG
+TGAAGACGGGGTTCTTCATGGGGGAGCGGGTGGGTCCGGGCACCGCGCAGCCGGGGTACT
+ACCGCGACGACTGGTCCGGGCACACCGGGCACGTGCACACCAGGATTGTGCGGGCGCTCG
+CAGCGCCCGACGACATCGGACAGGAAGGGAACAGCATGCCTTTGTGGGGCGTGGACATCA
+GCAACAACAACGGGGCCGTTGATCTGGCGCAGGTCAAAGCGGAAGGCTTCGATTTCGTCG
+CGGCGAAGGTCACCGAAGGCACGGGGTTCAAGGACTCGTATTGGCCGCGCAACCGGGACG
+CCGCGCGCGCCAACGACCTGATCCTGATCGGCTACCACTACGTGCGGGACGGGGACGCGG
+AGGGTCAGGCCGCGAACCTCGCCGCGCACATCGGGGACACGAGCGTGCCGGTCGCCCTGG
+ACTTCGAGTCCGGCTCCGGGGGGTACGCGAACTTCCAGGCGGTGAAATCAGCGGTGGAGC
+GGCGGGGGATGCGGGTCGCGCTCTCCTACATCCCGCGCTGGTACTGGCAGCGGATCGGCT
+CCCCGGACATCTCGGACGCGCCGGGGTTGTGGGCGTCGGCGTACGTGAACGGGACGGGCT
+ACGCCTCCGTGCTGTATCCGGGCGACGAATGGTCGGGCTGGCAGCCCTACGGCGGGGGTG
+AGCCGAAAATCTTGCAGTTCAGCTCAAGCGCCCACGTCGCCGGGAAGAGCGTGGACGTGA
+ACGCCTTCCGGGGCGCCCGTGAGGAGCTGCTGTCTTTGTTGGGCGCCACCGCTCCCGCGC
+AGCCCACAGCGAGCCTCGACCAGTTGGTGCTTGACCAGCTCGTCGGGCCGGGATTCCACG
+GTTGGCCGCAGCTCGACAACAAGTCCGTCGTGGACTTCCTCGCCTCGTGGCGCGAGGAGC
+AGCGCACAGCGAACAAAGCCATGGCGGACGCTTTGGCGCTTCTCCTGAAAGGAACAACCC
+AGTGAACGTGATATCCCTCCCCTACAAGTGGCGCGTCGCCCTCTACCAGGTGCTCAAACT
+CGCGAGCGCCGCTGTCGGCGCGTTGTTCGTGATCGCGCCCTTGTTCGGGTGGGAGCTGCC
+GAACACGAAACTCGACGCCCTCGACCAACTGGTATTCGCCGTCGTCAGCCTCTTGGGGCT
+CGGGGCGGGTTCGGTCGCTACAGAGCACGCGAAGATCTCCACGGACGGGCCGCTCCCGGA
+CCCCCGCGCCCAGGCGCCGCAACCGGACCCTATGGCGGTCGCCGCGCAAACCGTCGCAAT
+GACCATTGAGGGCGTGCTGGCACAGTTGGAGCGCTTGGCGAAGCCGCAGGGCGAGTGATG
+CTCAAACAGATCCTCGCGGACATCGCGCCTCTCGGGCCGACAGGGCTCCTCTCTGTCATG
+GTGGTGTTGATCATGACCGGGCGCATGCTGCCCTTGCGGGAGGTGCGGCGGATGGAGCAG
+ATGCTCAGCGAGCACATCGCGCGGCTTGAGCGGGCCAACGCGATTCAGGCCGAGACCATC
+GAGCAGCAGCACGAGACGGTGCGGGAGCTGATGGAGGGAGCGCGCCTGTCCACGGATCTG
+GTGTCCGCGATGAAGACCTCGGGGGGCGTGTGATGCGTTGGCCGTGGCAGTTGCGCGAGT
+CCGTGGAGTTCGACGGCGAGGATTTGGACCGCAGGGTGCGTGAGGCGCAGCACGCGAAAG
+ACCGCGCGGACAAGCTGCGCGAGGAGGCCGCGCCGCTGGTCGCGCTCGCGCGCCGCCAAC
+GGCGGGAGAACGGTTTCGGCGCGGCCGTGGAACGGACGATGAGGAGACGGCATGCGTAGC
+AGGGAATCAGCTGTCGGCGCGGCGTCGGCCGCAGCGGTCGCGGCGGCGTCTTGGCGCTGG
+CTGGGATGGGGCAGGGTGGACGACGCGCTTTTGACCGCAGCCGCCCTCGCGTCGGTGCTC
+TTCAGCCTCATGTACTGGCGGCAGGCCCGGGGATACATGAACCGCGCCGGGAGGGCCGTG
+CTGTGGGTGTTGGCCGCTCTGTCGGCGGTGTTGGCGCAAAACACCCTCAGCGTGTGGACC
+GAGCAGGACTACCCAGGCCGCGATCTCGTCCGCACAGTCCTCTACGGGGCGCTGCTGTTC
+ACCCTCGCCCGCCTGACCGCCACCGCCCTCGCGTACCGCAAGAAACACTAAGACCGTCTA
+CACTCTCATCCGGCCGCGCGCCCGTCCCTCATCCATAGGGCGCGCGGCCCTCACACACCA
+AGGGCTTTCCCGTGGCCGCTATGCGGTGATGTTGAACAGCCAAGGGCGCTTCTCGTCTCA
+GTGGTGGAGGATTGATAAGAACGCTGCGGGGATGCTGATGTAGAAGACCGGCCAGCCGAA
+GTAGAAGACCATACCGGCCAGCGAAGCCGCTATGACACCTCTTCCGGCGTTCCGCCATCG
+CTCATCGACCCTGAACAGATAGACGCCGACTCCGAGCGAGACAAGGAGGATGAACCCGAA
+TTTTGATTCCAGGGTGAACCCCAGGAGTATGAGTGTCCCGCTGGCGAGCAGGCACCAGAA
+AAAGCTAATGGGGCTGTCCGCTGGTGGTGTCTTCTCGGTTTTTGTCTTGTCGTTCAAAAT
+GTCACGTTCTCTCTCAGCACGGCAAGCGCGACTGGCACGATAAGGCATCCGATGGCCGCG
+CCACGCCATAGAGGGGTTCTCTTGATCAGGGGCAGCAGCAACCCCGCGCAAGCCATGATC
+AAGCATGTCATGATCAGCGCGGGTCGTTGGCTTGCCGCTTCATGCGGAAGGAAGTAACGG
+ATCAGCGAGTACAGGATCTCGCAGACTGCGGTCAGGATAGGAGCGCTCCATGTCGCGGCG
+TTCCATGACACAGCGGGGAATCTTATAGTCGGCATCAGTTCACCACTGAATATGTGTCGC
+GTCTTTGGTGGAGAAGAGGGCGAGGAACATTCCGGGGATCGTGTAGAGAAACAGCCAAAA
+AACATATCTGAGCAGCAAAGCGGAGACTGTCGCGGCCAACATGCCCATACCGATTTTTCT
+TTGCTTACCGGTTGTGAGCGACATAGCGAGTCCCGACAAAAACAGAATCAGCACTGTTGG
+CACGTACCAAGCCATATGCAGGGCGGCGACCGCCATAAGCGCTGCGGACGTCAAGACCAG
+GGCCGCGAAACTTTCCGGGCCGTGAAGCCGCTGGGCAGGTGCTGTGTCGTCGCTCTCGCG
+GTCTCGCTGGTTCATTGCGTCAACCACACGAACCAGGCCAACACGAAGGGCACCCCGAAT
+ATGCCCAACGCCACCCCGCGCGCGGTAGGGGTCCGAACGAAGACCCACAACAACAGGGAC
+AGCGTTGAGACGATGCCGCACAAGAGCGGGAATGTTAGGGACTTGCTCCCTGGCGGCTGC
+AAATTGACCAGGAAGGTTATCGCCGTCAAGCAAGCGCATACTGCCACGGGCGCGCTCCAC
+GTCGCAGCCGCCCACGACACAGCGGGGAGTTTTATGGATGGCATCAGATGTCTCCCCTCA
+TCGCTGGAGGTTGTTGCGGCGCTACCGGGTTGAGCTGTGGCGGCGAGTCCCCATCCTCTG
+GGGCGAGGGTCATGGACTCGTCGGGAACGGGAACCTGCGGTCGATTGCTCGGGATGCCGG
+GGCCATCCCACTGCAAGCCGGGTTGATACTCCTGTATGGAACCCGTCGGGCCATTGCCGA
+CAGGGTGCGATTTCGGCAGATTTTCCATAGGGCCGAACTCGCTTCCCGTCGCCTGATAGG
+CGTATGCGGTCGTTGTCGTGCCGTTCCTGTCTTGGTAGACCTCCATCGAAGGGTAGTCGC
+CCACTTGCCCGTCAATGTGGACCCCGTTCGCTGTCGGTGTCAAGGTGATCTCGCCGTTGA
+CCGACAGGCCAGCAGCATGCGAGAAGAAGGGCGCCAATGGGTTGGTCGCGTCGTAGTGGA
+TGCGCACACGTCCGTCCGTTGTTTGCTGCACGTCAATAACGGGGTCTTGCACTTCCGTTT
+TTCCTTGGATATCGACTGATGGGTTTTGTCTGGCGGCGACGACGCCGTTCTCGTAGTCGA
+TGTACAGGGACACTCGGGTCTGGCGCGGGTCGAATTGTTCTTTCGGGCCGCGCGCGTCCC
+CAAGGTCGTTGGGCATGTTGAACACGTCTGTGGCGGGGATGTACAGGCCGACCCGGACGA
+TTCCTTGGCCGGGGACGGCCTTGATGCGGCCGACGTCGACGCGGGCTGGCACGCCGTGGT
+TGCGTCCGACCATGCTGTGGGTGTCCATGATCGCGGCCATCTTCCAGTCGGCGTCGCTCT
+GCGGAAGCCTGCCGTACACATGCTGGAACTGGTCCGGGTCCACGCCGTGGTGTGATCCAC
+GATCCGGGATTTCGCCGGGGTCTTGCTTGAACGGCTCGAATTTGTCCGCTTCTTTCTTCA
+CGCTGTCGAGTTGGTCGCCCAGTTCCTCAGCGAGGTCTTTGTCTGCGGCGAGTTCTGCGG
+CGTTCAGTTCGTCGGTGGTCTCGTATTGGAGGGCGGATTCGCGGGTGGCTTGGGCGTGGG
+CGTGCAACGCCGCTGCGGCTTCTTGTGCGTTGATGTGCTGGTTGGTGATCGCGGCCATGA
+ACGCCGCGATGAACGGGGCTCCGATGGGGCCGAGGGCTGTTGTCATCATGCCCTGGAAGA
+CGCTGGGGTCGAACGCTATGGTTCCGTCGAGCATGAGCGCCATTTGTTCTGTCTGCTCGG
+CGTGCGCGAGCATGGTTTCTTGGCTCGCGTTCAAGGGTTGGCCCATGATGCTCCGATTCC
+TGTACAGGGGATTGTGAGTGGACTGTAGCATTCCGGTGGGATTCCAAAAACGCGAAGGCT
+GTGTCCGTTCAGCCCGCTAAGGCCACGGTGAGCTTGGTTTCTGCTCCTCTGAACGGATTT
+AGCCGACTCACGGCCTCGGAAGTTTTATGGGTCGGCACCTGTGTGTATTGCGCCGTTGTC
+GAGATCGAGGCGTGGCGCATGATCTCTTGCACGACCCGTATGTCAACGCCTTCGTCTAGG
+AGGGTTGTTCCTTGCCAGTGCCGCAACTGGTGCGGCGTGGCTCTGACCCCGGCTCTGCGC
+ATGGTGAGGCTTATCGTCTGAGACACCGATTTGCCGCTGATGTGCATTCCGGGCCAGCGG
+CTATCACGGGGGAACCACCAGCCGCGCTCGGGCATCGTGGGTGCGATTGCCTGCAAAATC
+GGGTGCAACGGGACGAGGCGTTCCTTGTTGCCTTTGCCCAAGACTCGGACGAAAACGCCG
+TCCACAATGTCTTCGCCGCGCAGTTTCGCGATCTCGAAGGCCCGTAGGCCCGCGAGACAG
+TACAGGAGCACCATGAGCCGGGTCCGTTTGCGGTTCACGGTCTCAAGGAGGCGTGCCAAG
+TCTCTGTCCGAGACGGGCCGGGGCGCGCGGTCGGGGTATCGCACGGTGCCGACCTTCACC
+ATGGGGTCGTCTGTCCGGTGCTCATGGACTTGTAGCCATTTGAACCAAGCTTTGAGGTAT
+TGGGAGTAGGTCGCAAGGCTGGATTGGCCGAGGCTGGACTGCTGAGCGAGCCACCGTGCC
+ACGTCTAGGGCGCTCGCTTGGCTTGGCTCGATCCCGATGGAGCTGGCGAATGACTTGATG
+ACACGTATCCTTTCCGTGATCGTCCGTTGCGAGAGCCTGCGGGCGAGCATGAAAAGTTCC
+CACTCTTGCACGAGCAGCATGGCTACGTTGTGTGCGTGGTGGGTTCCGGCGACGTTGACG
+GGGGACAGCACGGCGGGAATATTAGCGTCCGTTAAGGAGCTATTAACCTCTTGTTGACCT
+TGGTTATCTATCCGAGACGGACAGGGTGCGGATTTTTTATCGTCTTGCAGAGGGTGGGGG
+ACCGCTCGCAGTCGGCGCTCATTCTGTCGGGGTGCCAT
+>NC_014168.1|provirus_1141631_1162952
+TCATTTTGGGGTTGGGAGGCTCTCCCTCGCGAAGATCGCCGAGGCCCGTTTGAGGATCTC
+GACCTCCATCGCCAACACCCGGTTCTCCCGGCGCAGGCGGACCAGCTCGGCCCGCTCGTC
+GCCCGCGATCCCCTCGTGCCCTCCCTCGCGGACCACGCGCTTGCCCTCCACGCCGTCGGC
+CTGGGCCAGCCACTTGCGCAACGTCTTCGCGTCCACGCCCAGCTCCTTCGCTGCCCAGGC
+CACAGGCCGCCCGCCCTCGCGGGCGGCGCGGGCCGCCTCTGTCGCCCTGCGGCGGAACTC
+CTCCGGATGCGCGGCCATCCGCACTCCCTTCCCGAGGCCCGAGGCCCCGACTCAAAGTGT
+CCGGAAAAGCGTAACCAGATCATTCGGCGGTGAACACCGCGAGCCAGGCGTGGTTGTGCG
+GGTCGCGGGCGTCGAGGATCGCGGTGGGGAATCGGGAGACGTGCGCGATCCCGAGCACGT
+CTCGGCTGATGAGCGCGGCCTGCGCCTGGGCGGCGAGGAACCGGGCCTCGCTACGCCCTC
+GGGCGAAGGCGGCGACCCGCACGCGACAGGTGGTGGAGACGGGCCAGTTCACGCTGCCGC
+CGTCGTCGCCCACGAGCAGGAACGGCCGGCTGGTCTCGGGCTGCCAGTCCTCGGGCAACT
+GGCCCCCGGCGTCGGCGTGCGGGACCTCTCGGCGCAGGTGCTCCCAGATCGCTTTCGCGG
+GGTCCGCGGGGACCCTCACCGCTTGCGCCTGGGGTCTCTCACGGCGACTTGCAGCCCCGC
+GTCTTTCGCGGCCCTGGTGAGCACGCCGTGTTTGGCCTCCACGGCGAGCCCTGCGGGGTG
+GGCGAGCACCACCGCGGCGGCCTGACGGTCGGTGGTGTAGGCGTCGACCTGCACCAGCTC
+CTCGGCCTGCGCGCTGCCTTCTGTGATTGTGGCGGAGAGCGCGATGACGGCGGGGTCGGA
+GCGGACCTGGGATGCGATCCGTTCGGCGGCTTGGTCGACGAGCTTGCCGAACCGGGTTTT
+GAGGAGCTCGCCGACCGCCTGCTTGTCCAAGGTGACTTTGACGTTCATGGCCGTGCGCTC
+ACCCCCGTTCCGTCGTCGCCTCGACCACCAGCGCCGCCCGTCTCGTGAACGGGCTTCGCC
+ATTCCTTGACCCGCGCCCGGCACACCAAGCCCCGCACCGTGATCAGGTCGCCGCCCTTGA
+TCGGGCAGCCCAGCGGCAGGCCGACCTCGAACCCCTCGGACGCCTCGGCCCGGCCCGCCT
+CCTCTGGGGGGCGGCGCAGCGCGAGCGGCGCGATATAGAGGACGGGCTGCTCGTAGGGCA
+CCCCGCCCGGCTCGGGGTCCCCGTCCGCGCTCCACCCCGATTGCCGGGTGATGACGACCG
+TCTCGGGCATCGGCTGATTCCCTCCTCTGGGCGTATGATCTGGGCATGGGATCAGAACGC
+GACCTGCCGGTCGAGGAGGACTACAAAGATTTCGGGCAAGAAGGCATGATCCAGCCCGAG
+CTGTACCAGTCGAATGGACGGTCTCCGAGGATCCTGCCGTTACTGCCCCCGTCTCCTGCG
+GGGCAGTCGTCCTTGGTGGTCGATGACGACCCGCTGGGCAAAGACATGGCCCTAGAGGGG
+CCAGGCGGCCGCGCGGTCGTCCACTTCCCACAACACGGCTGATCGCGTCACGCGGCTGAT
+GGTAGGTAGTACCTGTTGAGGACCTCGTGCTGCTCCGGGCCGAGGCTGGAGGCTCCTGGG
+GCGGGGAAGTACTCGTAGGGCCCCATCTTCTCGTGGACGCCGCCGAGCGGCGAGGTGACT
+GCCCGGGCGGCTTGTTCGCAGATGAGGGCGGCGACGGCGGGGGCGTCGTCGTAGCCGTGC
+GTGAATTCGACTGTGACTGTGCCTTCAGGCCAGCCGGACTCGCGGACGAGCAGTCCGGCC
+GGATCGGCGCGGTAGCCTGTGATCTGCTCTCCGTCGACGGTGACGGATTGGACGGAGACC
+AGGCGCAGGGTGGGCAGCGCCAGGACCCTCCCGCCGTCGCAGGCGACGTTCTCGGTCTGG
+GCGACGACGGGGGCGATGTGCCAGCGGCAGTGGTCGCGCACGGCGGCGGTCGCCGCGCGG
+AGGGACTGCTCGGCCCGGCCGTGGTCCGCCAAGAGGCCCGCGAACACCTCGGGGTCCACC
+AGCGGCGGCAGCTCCACCGCGCTCACCCCTCTTGGGGCTTGGGCGGGGCCTGTTTCGCCG
+CCGGCTTCTCGGATTTCCCGGTGAACAGCGGCTTGTCGAGGAAATCGGCGTCGCCGAGCG
+CGTCCGATGCGGTCAAGCCTTGTTTGGCGGCGTCCTCGTCGGAGAGCTGCACGATGCGCT
+CGATACCGGCAATAGTTGTCTTATACAGCTTCATATCACTCACCAGTTCTATTAGTTGGC
+CAAAAAAATCTTCGCGAAGGCGAGGGGGCATCGCACGGCGAGCGCGAGGCGGGTCTCGGC
+GCGGATCTTGACCCGGTTGTAGACGAAGTCGTCCTGGTCCGAGTTGGTGGACTCGACCCT
+GATCCCGCCCTTGCGGTAGAGGGTGGCGCCTTGGGCGAAGTTGCCCACCAATGGCTTGCC
+CTGCGCGACGACGGGGGTGACGATGGTGCGCAGCCCCCACAGCGGCGGGTCGGTCAGGAC
+GGGGCCTTGCCCGTACTGCCCGGTGAAATACCCGCCTGCGAGGTATTGGCCGTTCCCGTC
+GCGGGAGAGGCGGAATTTCTGGTAGTCCAGGGGGTGGATGACCAGGCCGTCGGCCTTGTA
+GTTGGTGGCGGTGGCGATCTTGGTCATGGCCCGGAAGATGGAGTCCGCGTCGTCCCCGGC
+GTTCGCGCTCTGCTCGTTCTGCAGGCCCGAGCGGTTGAGGATGCCGGTCAGGTCGGTGCC
+TTGGCCGGTGCCGTAGAGCAGTTGGCGCTCCTCGAACACCGACAGCGTGTAGAGCAGCCT
+GTTGTCGATCTCCGACTGCACGAGCGGGAGGTCTTCGAGGGTCTCGTCGGTGAGGTGGAT
+GAACGCGGCGACCTTGGTGACGTGGTCGGTGACCGGGGTGGGCTCGGTGAGGTGCATCTG
+GGGCTTGCGCCCGCCCTCGGGGACGGTGGCGAAGTCGCCTTCGATCGATCCCTCCAGGTA
+GTAGCGGATCGCCTGCCCGGAGATGGAGCCCGAGCCGATCAAATCGGCGACGACGGGGCG
+CTCGCGCTTCTGGCGCTGCAGGGAGCGGTCCACATCGGTCAGCCAGTCCCGGTACGGGCC
+GTCCGGGCCCCCGGTGACCTGGACGTCGTCGGCGGCCTTGCGCCCTGCGGGGACCCATTC
+GGGCGCGGTGGCGGTCGCCCCGCTGACGCCTTTGATCTCTTGCAGCCGCTGGCCGGCGTG
+TTTGAGGAAGTGCTCCCCGAGGCTGCGCGCGGGGGCACGGCCCGGGTCGAGCTGCCAGCC
+CGGGTGTGCGAGGGCTTTGCTCGCGTCGGGGACGAGCTGGTCGATGGCGCGTTGCAGCTC
+GCTGGACTCGCGCTGGGATTTCAGCTTGACGTCGAAGCCTTTGACTTGCTCGATCAGCGA
+GCGGACGCGCTCGGCGTCCTCGGGGCTGAGGTCACCGCCGGCGGCCTTCGCGCCGTCCAG
+GATGGCTTTGGCCTGTTCGTGTGCTTCGGCGCGCTCTTTGAGCAGCGGGTTCTCGGCGAC
+AGTGGTGGTCAATTCGTCTCCTCGGGATGGATGTCGAGCAGGTGGAGCTCGGCGGCGTAG
+AGCCGGGCGGGCGGGGCGGACTTCGGTGGCGCTTGCGCTTCGGGTTCGGGCGGCGGCTCG
+TCTTCTGGCGGGTCGTCTGCGGGGAGGACCGCGAGCAGGGCCTCCCCGGCTGCGCGGACG
+GCGTCGAGCGCGTCCCGCAGGGCGGCCTCGTTGCGCGCGGAAATCGCGCGCCCGGCTTTC
+ACATCGAGGACCTCGGCGTCGGGGTTCGCGCCGATCGGCACGACGGACACCTCGTGCAGG
+CGCAGCTCTTTGAGGTCCCACCCGGCTTTGACGCGCTCGGAGTCGAGGACGTCGAAGGCG
+AAGCTCATCTGCGCGAGCCGCCCGTCCTTCATCAGGCGATGCACCTGTGCGGCCTTCGGG
+TTGTCCAAGTCGAGGGAGGCTGTCACCAAGAGGCCCGTGTCGTCCTCGCTCGCGGTGAGG
+ACCTTGCCCACGCACAGCTCGGGGTCGCTGAAATCGTGCCCGTAGAGCAGGGGGATCGGG
+CGGCCCTTCTCGGCCCATTGGGCGAGGGTCTTGGCGAACGCGCCTTTGACCACGACGTCG
+CCGTGCAGGTCGCGGTTGCCGAAGCAGGAGGCGTACGCGGTGAAGACGCCCTCCCGCTCA
+GGCAGCGGCCGGATAGTCGTGTCGAACGCTTTGCGCCGCATCGCCGGCTCCCTCCTCGTG
+CGGGCCGAGCGGCGGTGGCGGGCTCGGCTCGGTGGTCTGGTTGAGGTTCCTGAGCAGCTC
+GTCCCCGCCCTCGACGGCGGGGAGGTTGTCCTTGGCGCGGGCCTCGTTGACGGTGAGCCA
+CGGGCCTCCCACGGCGGTGGCGGTCGCCTGGGCCTCCTGCTCGAAGGAGCCTTTGAGCTT
+CTCGCGCAGGTCGAACTCCACGTAGCTCGCGGAGCCGGGGGCGATCCTCGGGACGAGGAA
+GGCGTTGAGGCGCCCTGCGACCATCGAGAGGGTGGGGCCGAGGGTGTCGGTGTAGAGCAT
+CCGGGAGAACGCCTCGACGTTGCTGTAGTTGGCGTTGTCCAACAGGCCGACCATCACCGG
+GGAGATGTGGTAGACCGAGGCGACGGTCGCCAGGGCGAGCTTCTGGGCCTCGATGTAGTC
+CTCGTCCTTCGCGGAGAACCCGATCCGGCGCAGCTCCATCCCGTCCTCGAGGACCGGGGT
+GCCGCCGGCGCGGGGGCCGTTGTTGCCCGAGTAGGCGCCCTGGTAGTCCGTGACGAAGCG
+GTGTTTGGCCTCCGGGGACCAGCGCGGCGCGTCGGCGGGGCGGTGGATGTAGGCGCCGAC
+CCGGCCGCCGTTGCGCCAGGTCTGCAAGCGGTAGGCTTGGGCGGCGATCTGCTCGGCGAG
+GACGGCTTTGAGCGTGGCCACGGGGGTGAGCCCGCCCGTGGGGTCCAGGGGGTTCCAGCC
+GTGGAAGACGAGCATCTTCTCGCCGGGGATCACCACCAGCCCGGTGGCGTGCGGCGGGGC
+GATCTGCCACTCGGCGACCGCGAACGGCGTTATCTGGCGGCGGCCGGTCACCCACGCGGG
+CGGGATCGGGCGCACCACCCAGCCGGACTCCGAGGCGGGGTCTTGGTCGACGTACCAGAA
+CGCCTGGTCGTACAGGCTCAAATCGGCGACGAGCGAGTACAGGAGCTCGTAGCAGGTCTG
+CTCCGGATTCGGGCGCTCCAACAGCCGCGCGAGCGCCGTGTTCCGCTCGCGCTCCCGCCC
+CCCGTTGGGCTGCCTGCTGTAGGCGTGCAGGCCGAGCTGGGCGACGTTCCTAGCGAGGAA
+GTCGATGACCGTTCGCAGGTTCGGCTGCTCGGCCCACAACTTCTCCACCGGCTGGGCTTG
+CAGGTCCGCGAGCACGACCCGCACCACCGGCTCGGCGGCGGTCCACACCGCAGGCGGCTG
+GGCTGGCGGCTTGAAACCGAGCCAGGAGAGCAGGCCCATACTTCTGGCCTCGCTCTCGTC
+AGGTCACAGCACGGTCAGCCCCGAGTCCTCGTAAGCGCTGACGGGCTCAGCAGCAGGTAG
+GTTCGCCAATCCCCATGTCGCGGCAATGGCGGCGACGAGCGGGGCTGGGTCGACGGGTGA
+GTGTTTGCGGTCGATAAGCCACGCGTCCCCGGCCGGGCGGACAGCTGCTGTGGCGGCTGC
+TTGGTCCAGGCCAGGGTGCGATAAGTGCCGTATCTTGCCGGTGGCGAGCAGGTCGTGGAA
+CGCTCCGGTCGCTTTGCCGAGGTCCGGGCCGCGCCACGCTATGACGGGCAGCCCGGCGGC
+CTCCAGATCGGCTACAAGGGATGAGGCGGGCGCGCCGTTGGCCTGCACGATCACGGCTGC
+GATCTTCTCGCGGCGCTCCGCGAGCCAGGGGGCGACCCAGTCCGAGCCGGCGCGTTGGGC
+GGTGATCTCCACATGCGCCATCCCGTCGTCGCGGCGACCGGCGAGGGCGAGCGTGACGGT
+GGAGCGGTTCCAGGCCATGTCCAGGCCGACCACTCGCGGCGAGTCGGTTGCGATCGTGCT
+GTTGTCGTCGCGGGTGGAGTCCCAGGAGCCGGGCGGGAACGGGCCGGGCGTGACGGTGAG
+GGGCCATTGGCAGAGGACTTCGGCGGCGAAAACCGGGGCGGGGTCGGTGGCGTACGCGCT
+GGCGATGGCGCGCTCGGTGATCGTCACCCCGAGGGCCGGGTTCGCTTGCGCCCAGGCGTG
+GCGGTCTTTGGGGTCGCAGCCGGGCGGGGCGGACCACTCGAAGATCCCCACCGAGTCGTC
+TTCGGCCTCATCGTCGGGGGCCTGGTCCTCGACGTGGTCGGGTTTGCCGTCCGGCCAGTC
+GAGCTGGCGGTGGGCGATGTTCCTGAGGTGGGCGAGGACGACGGAGAGGTGGTCCCCGGC
+GTTGGAGAGGCACCAGACCTGCGCGTCGGGGCGGGCCATCGTGGTCTTGGTGACCGCCGC
+CCAGGAGTCGAAGGACTGGTGCTCGCGCAGCTCGTCCAACAGGATCAGGTCGGCGGTGAA
+GCCGCGGGCTCCGCGCCGGGAGGCGGCCGCGATCCTGTATTGCGCGCCGGAGTGCAGGCG
+CAGGCTCTTCTTGCCGTTGGTCTTGTCGACGTGCAGGACCTCGGACGCGAGCTCCGGGGT
+GCCCTCCGCGAGCTCGACGGCCTCGCCCCATGCCTTCTCGCTGTTGGCGAGGTCTTGGGC
+GGTGCCGACGACGACGCCGCCTTTGACGTAGACGCGCCAGAGGGCGAGGACGATCATGAG
+CAGGCTTTTGCCGTTCTGGCGTGCGGCGAGGGCGATCACGGTGCGAAAGCGCGGCAGCCC
+GTCCGGGCGGACCTCCAAGGCGTGTGTGAGCAGCCATTCCTGCCAGGGGAGGAGCTGGAC
+GGCGAGGACGTCGCGGGCGAACTCGATCACCGAGTGGCCGAGGCTGGCGTCGGGGGTCAG
+CTCCCGCAGCGGCGGCGTCCACACGCGAGGGACAGTGGAGCCGAGCAGCTGTTCGGCCAC
+ATCCGCCCTCCAGGTGCTAAGTCTTCGTCTCTGCCGCCTTGCGCAGCTGCGCGAGCTTGC
+CCCCGGAAGCGGGCGGTTGCGGCAGGCCCTTGCGCCCGAACGGCGTCAGGCCCAAGTCGG
+AGAGGATCTTCCCGAGCGCGGGGGAGGCGTTGTGGCAGACGCGGGCGAACTCGTCCAGCC
+CGCGAGCCTCGGCCTCGTCGATCAAGCGCGCCAGGGCGCGGGCGTTCTCCACCGCGCCCG
+CGTCGAGCGGGGTCAGGTGCGAGGCTGCGGCGACGCTGGCCTCCACGGCGGCGAGGACAG
+AGGCCATGCGAGTGGCTCCCATCGAAAGTTGATCTGTTGGCCGGAGGGCGGCAGTCTCCT
+GGCTGGCTTCGCCATGGCCGACTTGCGCGGGCAGAGCCGAACCGGCTACCTGTGTGATCG
+AAATATCAATCCGCCGAAAAAGGCGTGATCAGGCAAGTGACGAGTGTAAAGTAAGGATGT
+CAGCGGATATCGCGCTTGGCCGTGTTGGCCGTTCCGTCGTTGGCATGTACCCGGCCATGT
+TGTGGCCGAGGCAGGAGGGCTCTCTTGAAGTGGGCGCCGAAAAAGAGGGATCGGCGGCAG
+GCGTTGCGCATGCTGCTGAAGCCGCAGGACCATGGATCGGGACCTGTCGACGGGTCGTGG
+TGGCCGCGGAGCCGGGACTTGCACGTCGAGCTGCCTCGGCTGCTCCCGGAGCTCGTGGGG
+CAGTTGGGGCTTGTCAATCTGGTGTTGTACGACTTTGGCGGTTGGTCGACCGCTCCGGGG
+CACGTCACCTCGCAGGAAAGGGCTGTGAAGACGACAGGGGAGGCTCGTCGGCCGTTGAAC
+GCGGTGCGTGTGGTCGGTTTGAGCCAGAAGCAGCTCTTGCTGCTCGTGATCCCGCACGAC
+CTGCACCCCGACGACGCTCGCTCGATCATGGCGAGGGCGGCGGGACGTCACAACACCGAC
+GCCCCCGAGAGGCTCTCCCAGATCCTCTCGCCCGACGGCGCCCAAGGCACAGACGTGGTC
+CCGAGGCAGCGGTCGTGGGCGGGCGACGGCGGCGGCGATCTGGGCGAATGACCCTGCCGG
+GCCGCCGCCGCGTCCAGGCTCCGGGGCGAGAGCGCCGCAGGTCGGGCTGGTTGGCGGCGC
+GAATCCCCCCACGGGCGTACAATGAACCGTATTCCCGCTGATTCGGACGGCCTCATTCGA
+AGGCGTCGTCGCGGGGGTCGAGAGGCTCGCTCCTGCGGGCCGGTCAGGAGCGTCCATCGT
+GTCGCGACAATTATCACTATCACACCAATCGGGCGCAGTCCTCGATCCGATGCCGCGCCA
+TGGCGTGACATTGCGTCTGCGGTTGAAGCCGAAAGCCGAGCCGACCGGACATGTGGACGG
+GGCGTGGTGGCCCCGCTCGCGAGACTTGGCCGAAGAGCTGCCCGAACTCCTGCGGGTGCT
+CGGGGTCCGCTTAGGCCACGTCCATCGGGTGATCTATCGCGCCAGGGAATGGGCGATCGC
+TCCGGCCCAAGCCCTGATTGCCGGGAAACGAGTGCTGCTGGACAAGTCCTACTACCAACC
+GCCAGGCACCATACGCCTAGAAGGGGAGCGGGGAAGACGGCACACGCTGTTCGTGGTCCC
+GCCCTGGGGCGTCCCGCATCTCGCGCACGACGCGATGATGACAGCGGCCGCACCGAACGA
+CAAGACGACCGTCGCGGACCTGCTGGAGATCTCCGACGCCACCCCCGCCGACCTCGTCGA
+GCAGCGAGAGGAAGAAGACCGATGGGGCACCGACGGAGGGGCGTTGCCACAACCTAGCCA
+GCGGCGGTAGCGCGGACGACGCCCTCCCCCCTCGCGCGCACGCGCGAGGGGGGCTGGTCG
+GGGAGGGATTCGACGCTACCGCCGCCATGGCTGTCATGATCGACTTCGCCGTGATCTTGA
+GCCCCTACCCCCTGGGGGTGGCGAGTGGGTTAGTCCTCGAAGGCCACGACGGTCTCGTCG
+CAGTAGTGGTCGCGCTCGTCGCAGTAGTTGTGCCGCACGAGCCCGTCGTCGTGCTTGATC
+GTCAGCCGCGTCCCTTTGTCTCCGATGACGGCGAGGATCAGTCCGCCCGCGCCGACCTCG
+TAGAGTCGCACGGTGAGGGTCTTGCCGTCTTCCGTTTTGGCGTCGACGGACTGGATGAGG
+CCGTAGTCGCCCGCGTCCTCCAGCTGGGTCTCGTAGCGCCAGTGCTTGAAGCTCTCCTCG
+GCAGATCCCATGCCCGCATCCTATCACATTCATCGAATACATGTTCGACTATGGCTAGAA
+GTCCTCGCTTCTCGCCCAGGCCGCGTGAGCGGGTTGGGCTGCGCCCCTGGTTTGGTTGCA
+GCGGGCGTGGCTGGCGCGCAGGTTCTGGTAGTCGAAGGCCAGATGCGGGTGGGTGGCCCT
+GGGGTAGGCGTGGTCGGCTTGGAAGCTGTCGGGGTGCTCGGGCGGCGCGTTGTAGTCGAT
+CGGCTGGCGGCAGATCCAGCACGGGCGGCGTTCTGCCCGCAGTCGTGCGCGGAGTTTGGC
+GGCCTTGTCGCCGGACCAGCTGGCGGCCATCTTGGTCAGGCCGCGAGGCCCTGCGCGGGC
+CGCTGTGCTGCGAGGTGGGCGGCGATGACGTTGCCGGCGACTTGCCCGAGCTGGACTGGG
+ACGGCGTTGCCGAGCTGCTTGAGCGCGCTCTGCCGCCCGGCGGCTATGATCTGCCAGGTG
+TCGGGGAAGGTCTGCGCCCTGAGCCTCTCGGGGATGGTGAGCTCGCGTGCCCGGCCTTCG
+GGGAGTTGCACCATGTTGAACCGCGCCGAGCCGGAGTGGCTGGCGAGGACGGTGTTGGCC
+GGCAGGTCCGGTCGGGTGGGGTGCATCTTCCACGGCGGGTTGACGATCGGCTCGCGCCAG
+AGCGCGTGGCGGGTGTGGTGGGAGCGGTCGACGGGGCCGATCTCGCCGAGGTCGCAGGTG
+GCGTCGCGGAAGGTGCGCCACGGCAGGAGCGCGCCGGGGCCGTTCTGCTTCACGAGCGCG
+AGCTTGCGGGCGTGGGGCTTGTTCAAGGGCAGCCGGTCGTCCTCGGGGACGGGGTGGCGA
+TGCCAGTATTCGCCGGTGACGTATTGGGAGTGCAGCAGGGCCTCGAAGGAGTGGGTGGGC
+TCGGGGAAGGCGAAGCCCTCGGGGTTCTGGTCTTCGCGGATGCCGATGACCAGGACGCGC
+CAGCGCTGCTGGGGGACGCCGTAGTCGGCGGCGCAGACGAGGTTCGGGGTGACGGTGTAG
+CGCAGGCCGAGGGCGGGCTCGGCGAGGCGTTCGAGGACGCGCCGGTAGTAGTCGGCGTGG
+CGTGGGGAGAGCAGGCCGCGCACGTTCTCCATGAGGAACGCCTTGGGGCGCAGCCCTTGG
+ACGGCGCGGACGAATTCGGGGATCATGTCGCGCTCGTCGGCCTCGCCCCGCTGCGAGCCG
+GCGAGGCTGAACGGCTGGCACGGCGGACCTCCGGCGACGAGGTCGGTCTCGCCGGGGGCT
+GCGATCTCGCTCCAGTCGACGCCTCGGACGTCGCCCTCGATGACGGGGGTGTCGGGGAAG
+TTGGCGCGCAGGGTCGCGCAGGCGTTCTTGTCGAATTCGACCAGGGCGGCGGCCTGGAAA
+CCGGCCCGCTCAAGGCCAAGGGCCAGGCCGCCCGCCCCGGCGAACAGCTCCACGCTCGTC
+AACAGTTCGGGCATGGGCTGTTTCCTCCCCTGGTCGTGGCTGCTCGCAGCAGGTCGTGGA
+ATCGGTAAAGGTGCACGCCCGAGTTGTCCAGGCCGGATGGCCGGAGCTTGCCCCGGCGGC
+TCCAGGCCCGGACGGTTTGGGCTTTGACGCCCAGGACCCGCGCGGCCTCGTCGGCGGCGA
+GGAGGGTGTCGGGGCCGTGGGCGAGGATGTTCGGCGGGAGCGGTCTGCCCACGATGGCCC
+CCTTGTCGACACAGCTCGCCGGTGGCGGCTCTCTAGGTGGGTGGTGGGGCTCGGGGCGCA
+CGTCTCCCGCTGACCTCTACGCTACGGAGTTAGCACACATGTTCGCAATGGAACGGCGCG
+GCGATGTGAAATCGCCTGGTCGGGGGGTTGTGCTCGGCGGCGTGCTTGTGGATGAGTCCA
+GGTCATGAAGCCTTGTGGCGGGCGATTTCTTCCCATTGGGCCTGGTATTGGTCGAGCCAG
+TCCGCGATCTCGCCCTCGTCGGGCTCCCAGTCGCACACCGAGCACACGATCCGGTCGTAG
+TGCTCCTCGACCTCGTCCCAGCAGCGCCAGACGGTGAGGTTCTCGCAGCCGGGGCATTTG
+CCGCCGAGCCAGACCATCGGGGCGGCGACGCCGTAGGGCTTGGTGCGCTCGCGCAGCTCG
+CCCCATTCGCTCGCGAGCTTGCCGGCGTGGTCGAGCTCGCAGATCGTCTCTAAGCGCTCG
+TCCAGCCACTGGCGGGACTGCGCGACGTGCGCGGCCTGGGAGAGGTTCTCGCTTGGTCCG
+AGGCCGCCCAGGACACAGGCGAGGAGCTGGTGGGCGCGGACGAGGGATTCGGCGATCTCG
+GCGCACAGCTCGCTGGCGCGTTCGGCGGGGTGCCCGAAGCCCTCGGGGGTGGCTTTGCGC
+CCGAGGGTGTCGGGGCCTTGCGGGCGGGGCAGGAGCGCGAGGCGTTCGTAGTCGGCGGCG
+ATGAGGCCGAGTGTGCGGCGCAGTTGATTCCGGCAGCCACGGCACATGCCGTCTGCGACA
+AGTCTGCGGTCGCCGAATTTGTCGCGGCAGCCGGGGTGGACGCAGGGCCGGGCGCTCATG
+CGGCTTGCTCCTGCTCTGGTTCGAGGGGGAGGTTGTAGGCGAATTCGGTTCCGGTCCAGG
+CGAGGCTGATGCGGCCCCTCTTCCACAGCTCCCAGGCGGCGTGTTGGAGCGCCCAGTGCC
+CGAACGCGAGGTGGGCCGCGCGCCACTCGGCGTTGGTGGGCCCGGACTCGCGAGAGTTGG
+CCCAGATCTCGCGCATGAAGCGCTCCAGGTCCTCCGGGTCGATCATCGAGGGCTCGTGCG
+TCACAGGTTCTCCTTCGCGGCGTCCGTGCTGGCGGTTGGCGTGGCGGGGCGTGCGGTGAG
+GGTTTCACCGTCCCAGGCGAAGGCCACCAGGCCGTCGCGCCACAGGGCGAGGACCTCGGC
+GAGGGTGATGAGCTGCTCGAACTCGGCGAGGGCCAGGGCGAGGTCTTCCTCGGAGAGGCG
+TCCTTCCGCGTGGCGCCGGACTTCGGCGATCATGCGTCTGGCTTCTGGGTCGTGCGCGAG
+GGCGATGTCGATGGTCATGGTTCAGTGCTCCTGTGTCGGCTGGTTGGTGTTGTCGATGGA
+CTTCTTGTCGGCGAGTTCGAGGATTTTGGCCTCTAGGCGGCGGTCGAGCCGGTTCTGGCG
+CTCAGAGCGCTCGCCGGGTTTCTCGCGTTCGGCCCGGTCGCGGCGGATCGCTCTGGCGTG
+TCGGATGACGTCGGCGGCGGCGATGTGCTCGCCGGTCTCGCTGTAGTGCAGGGTCACCGC
+GTCCAAGAGGTCCGGCAGTCGCAGGTCGAAACGGGCGAAGGCTTGGGCCCAGGCGCGGGC
+CATGCCGGGCTCGGGTTTGGCGAACCAGCGGTCGAAGAGCGCGGCTTTGCCGAGGGCTTT
+CGCGGCGTCGGCGACCTGCTGGTCGCTGGGGTTGATCATTAGTCGAGCTCCCTTCCGGTC
+AGGTCTTGGGCGTTGTGGGCTTTGGCCTCGTAGTCGGCGGCGATCGCGAGCCAGCCGAGG
+GCCTTCTCCGAGGGGCTGCCCCTGGCGGGCTGGGCCGGGTCAGCCCGGTTTTTGACGACT
+TCGGAGACCAGCGACGGCAACAGTCCCGCCCCTGCGCGGGGTTTGGCGAGCCACAGGCGC
+AGGGCGTCCGCGACGTCGGCTCTGGGGGTCCCGGCGCGCAGCAGTTCGGCGGCTTTGACG
+GCGAGGGCGGAGCGGATCTGCTGGGGGTGCTCGCCTGGGATCGTCTCGCGCACCAGTGCC
+CAGCCCTTGATCGGCACGCGACCGGGCAGCGGCCCCTCGCGCCCGCCCGCGTCGCTCAGG
+TGAGGTGCTTTAGGAACGTGACTAGTAGATGTCTTTTCTTCTCTATTCTTTTCTAGAGGC
+GTGACGTCACGGGACGTTTCCTGTGACCGCTCGCGCTGACGGCGTTTGCGCTCGCGGTCT
+TTCTCTCGTCGTTCGAGCAGTTCGTCGCCGGTTTTCTGCCACCTCTCCCAGTTGCGGAAC
+CGGTAGACGCCAGGACTGGTCTCGTCGACGATCTGTGCGCGGATCAGCTCCGATATGTAC
+GACGAAACGCGGACGATCCCGAGACACATCGCCTGCTTTTTGTCGAACACGCCTTTGGTC
+TCGGCGTTGCCGCAGAACGCGAGCGCGCGGGTGAACAGTCGCTCCGCGTTCGCCGACAGC
+CCGGCCACCTTCGCGTCGAGGTAGTAGGTCGAGGACAGCCACACCTTCTCCATCGCTCAC
+GCGCTCCTTTTGGGCGCTTCGCGCCGGTCGTGGAGCGCGACGACGGCGTCCACGGCCCTC
+GCGCCGAGAGCGTTGTCGGCGCGGTCCTGCGCCTCCACGCTCGCGTGCAGGTACAGGTCC
+GCCAGCACGGCGACCGGGGTCCGGACGGTCTGGGCCTGCCCGGAGCGCAGCCGGTGCAGC
+TCCGCGCTGCGGCGGTCCCGTTCCAGGCGGGCGTGGTTGCGCTCGCGCTTGTCCGGCGCC
+CACAGGAGGTCTTCTGCGACGACGGCGGTCATCTTCGGCGGTGAGGGGGAGCCGGGCGGG
+TCCAGGCTCACGAGGTAGCGCAGCTGGAGGACCTCGACTGTGACGCCTTTGGCGAACATG
+CCGTGTTTGGTGGCGAGGTCGCGGGCGAGCGGGATCGTCTCGCCCGGGCGCGGCGGGCTC
+ATTCGGACCTCCGCAAAAGGGCGCCGGCCTTGTGCAGGGCGTCGGCCTTCTCGGCCTGGG
+TGAGCGGTTCGAGGACGCGGGCCTTGCCCTCTTTTCCGAGGCGCCCGCCGATCCAGCCGC
+GCCCGCAGTGCTCTTCGAGGTTCTTCACCAGCCCCGCGCCGAAGACGAGGACGTCGGGGG
+CGCGCTCGGGTCCGGTGGGGTGCTCGACGTCGACGACGTTGGCGCGGATGGCGGGTTTGA
+CGCCGTACTGGCCGGTCTCGACGTCCTCTTTGGCGAGGGGCTCGATGAGCAGGACGTGGC
+CGTGGGCCTTGTCCCAGTCGAAGCGGTAGGGGGTGGGGTCGACGAGCTCGGGGTCGTCGG
+GCTCTGCGGTGTTCGCGGTCGTCATTTGGTTCCTCATTTCCTCTTAGGCGGCGTTGTGGG
+ACAGGACGGCGGTTTCGCCGGCGCACTGGACAGGCGAGCTGGGGCGTGGCGCGAAGAACG
+GGCAGTGCTCGCACTTGACGGGGGTGATGGGGATCTTGGCGAAATCGGGCTCGGTTCGCG
+TGATCGCGTTGTGTCGGCGGCGCCGGTTGGCTTGTTCGAATCGGCGCAGGTGCTCTTGGG
+CGAGCTCGGGGTCACAGGGCTCCTCGAAGCAGATCGCGTCCTCCAGGTTCCCCGAGCGCG
+GCAGGTAGACGACCGCGATCTTGCGCACCTTCACGCCGGTCTGGTTGAGGCCGTGCCCGT
+AGAGGCTGGTCTGGGCGCGGTGCTCGGGGTCCATCTCCCCTTGGCGCTTGACCGCCGCGA
+TCCTGGCGGCGGACCCGGTCTTCCAGTCGATCACCGTCCCCGAATCGGCGTCCACCAGGT
+CCGGGGTCCCCGCCAGGCCGGGGACGATCTCGATCTTGCGTTCGGCGGTCCACCGTTCCC
+GGCCGAGCCGGGCGTTGTCCGCTACAGCGGCGGCGCCCAGCCAGGCGTGGATCGCGGTGC
+CGACGATGGAGGCCCACGGGTCCCCGCCCTCGTTCGCCTTCGGGGCCCCGGCCAGGCGCA
+GCGCCAGGCGGCGCTCGCACGGGTGCGCCAGCTCCGAGGGCCCGAGCGCGGACTGCTTGG
+AGCGCGGGTTCGCCCCGTGCTGGGCCTTGATCATCTGTTTCAGGTCGGCGAGCAGCCCGA
+CAGGCCGGATGGGGTCGAGGATCTCGAATGCTCCGAGGGCGCTCATTGTTCGGACTCCTC
+CCGGGGTTCGACCAGCCGAAGCTGCGGGGGGCCGCCGCCGGGGGCGAGCTCTGGGTGGTG
+GGCGAGGTCGAGGAAGAATGAGTTCAGGTCGCTGAGCAGGCGCCAGAGCTGGCTGAAGAC
+GAAATCGCCCGCCGTCCACTGCCAGTGCCCGTCGCGCAGGTCGGTCCAGACCGGGGCGTG
+GCGTTTGTGCAGCGCGTCCAGCTCCTCCTGCAACCGCGCGATCCGCGCCGTCCGGGCGGT
+GATGGCCCAGTCTTGGGGCGTTATGGCGCTCATCTCTTCTTCTCCTCTTGGTCGTGGGCG
+AGCTTGCGCTCGGCGTAGCAGGGGCCGCACAGCTTGTGCCGCGCCTCGCCCGCTGTGAGC
+GACACCGAGGCACAGCGGACTTGCGGGCCGGGCAGCTGGCCGCCGGAGTCCAGGTGCGCG
+CCCCAGTTCGCGACGCAGTCCTCGCAGCGGATCGTCTTGGACGGGGTTTTCGTCCTCGTC
+GCCCTCCACGCGCTCATTCGTCGACCGCCCGGAACACGCGCACGCGTGTGGTGCGCTGGC
+AGTCGGCGAACGCGATGGGCCAGTCGCGTTTGAGCTTCGCCTGGTCCAGGCCCGTGCGCT
+GGTGGGATTCCCAGGTGACGACGGCGCGCCCGTCCAAGACCCCCACATCCGCGTCGCCGA
+GCGCGGCCTTGATCTGCGCCTCGTGCCGTTTGGCGAGCTCGGCGTGCTCGGCGGCCTTCT
+CGCGGTGGTGCAGCATGAGGTCGAGGTCCGTCCGGTGCTCGGCGAGGTGGCGGGCGGTGC
+GCTGGCGGGCCGGGGCGGGGTCGGCCAGGCGCAGCGTCGGCTTGCGCTCGGGCTCGTCGG
+GGAGCGCGGGCGCTGTCGCTGTGCTCATCGTGTTCTCCAATCTGGTGGGTTGTGGCCGGC
+TCCGGCCGGGAGCGGTGAACGCCTCCCGGCCGGAGGGCCGATGGGGTTAGTCGAGGGGGT
+TCTCCGCGAGGCGGGGCCACGGGTAGTGCTCGTTGGGGTCGACGCGGATCACTTGGGCGC
+TCTTGCCCGCGCCCCAGAGGTTGAAGGCTTTGAACACCGGGGCGAGCGTGTCGCGCAGCG
+CCTTGGGATTGTTCGCCGACGCGAGCCCGGAGCGCAGCTTGCGGCGCAGCGTGTAGGCGG
+GGTGCCCGTGGCCGATCATCTCTCCGGAGGCGAGCAGGTGCAGGAACATGTGGCCGTTGA
+CGTGGTCCACAGCGAGGATGCGCCACGCCGCCGCGGCCCAGGAGGAGGGGGAGCCGGCGA
+GGTCGCGGTAGACCTGGTACCCGAGTCGGGTCGCGCAGGCCAGCTGTTCTGCGTGCTCTC
+TGGCGAAGGCGACCGTCTCGGTGTGGGTGGGGACGTGCCGCTGGTCGAGCATGATCACGG
+CACGCGCGGCGGAGGCGACCTTGGTGGCGTCGGGGACGCCGTCGATGCGCAGCGCGTCGG
+CGACGGTGCGCTTGGCCCCGGAGTCCATGACGTGCTGTGAGTCTTTCGGCAGCCCGGTGA
+CGAGCAGCAGTTTCAGGCGGACGCCGGATTTGACGATCGCCGAGAGGCGGTGCTGCCCGT
+CGAGCAGCGTGCCGTCGGCGGCGACCTGGACCGGGGCGGCGTTCTCCTTCCAGCGCCCCT
+CGGTCATGTCTCTGGCGAGGGCGTCGCGGTGGGCGGGGCGCAGGTTTCTGTTGCGCGTGT
+TGTGCCCGAGGAGCTCTTCGGCCTCCTCGGGGCCGATCCACCACCAGGAGGCGTCGGGGC
+CTGAGGCGTCGGCGAACGCGGAGGCTGGAGTCGGGATAGTCGTGGTCATGGCGATCAGTT
+CCTCTCGGGGATGGGGATGGGCGGTTCTTCCTGTTGGGGGAAGTCTTCGGGGGCGAGCTC
+GTCGAGCAGCTCTCGCGCGGAGAAGATCGTCTGCTGCAAGGCGCGGCGGACTCTGGGCTC
+CAAGCTCTTGCGGTTCGAGCCCCAGCGGTCGTCTTTGAGCAGGCGGCGGTACCCGTCGAG
+GACGGCGTCCTGCTGCACGCTCAGCCGCAGCTCCACATCGGGCAGCGGTTTGCGCTTGCG
+GGCGGCCTTGGGCTCGGGCAGGGGCTCGTCCGGCGCCCGCTCCCGCTCAGGGGGCTGGGC
+GGCTTTGGCCTCGATCACGGACTTCCACGCGGCGTGGACGCTGCCGTCCTCGTCCATCGA
+GGCCAGTGCCCGCTCGGCGGCCTCGCGGACCGCCTCCGGGGCGTCGGGGTCCTCGGCGGC
+CTCGCGAACGCTGCGGACCTTCGCGATGGTGTCGCGGGAGTAGCCGACGGCTTCCGCCGC
+TATGTCCCTGGTCTTCGGAATCCGCGCGTCGGAAACTGGTGCAGAATCTGCACCAGTTTT
+CGGCCTGCCTTGGGTGGCCTGCCTGCGTGCTTCAGCAACAGGTTTGAGGATCTTCTCGAT
+CTCACCGGCGATGGCCTCGGCCTCCACGGGGGTGAAGGGCTTGCGGCAGGCGTTCTCGTC
+GGACTCGGCGCGCAGCAGCCGCGCCGCGTCGTCGAGGTCGGCCATGACGGTCACCGGGAC
+GCGCTGCCAGCCGAGCAGTTTGACGGCCTCGACGCGGCGCTGCCCGGCGACCAGCTGGCC
+GTCGGGGGTGACGACCACCGGGTGCAAGAGACCGACGGTCTTGATGCTGTCGGCGAGGGC
+TTGAAGGTCGCCGAGGTCTTTGCGGTGCCTGCCCTCGACGGTGATCGCGTCCAGCGGCAG
+GGACGGCGCGCTCACGCGGCGGCTCCCAGGCCCAGTTCGCGTGCCCAGGCGGGCAGGAGC
+TGCGCGACCGGGACGGCGAGCGCGTCGGCCACCTTCTGGAGCTCGTCGAGCCGCCAAGGG
+CGCTGGCCCTTCACGGCCCGGCACAGGACGGGGTACTCGACGCCGATCTTCTCGGCGAGC
+TGGGCGCGGGTCATGTCGCGTCTGGCGAGCAGGGCGCGCACCTCGGCTGCCACCGCGTCG
+GAGAGGGTGTGGTTTTCGATGGGCATGCCGAGAGCCTAATACCTAATCATGATGTTTGCA
+ACTTCATTAGGTATGTGTCATGGCTCATAGGTGTAGCGAAAGTCCGGAATATGTTGTTCA
+TCGTCATTCCCGTCCGATACGGTGGGCGCATGGTGAAGAAAACGGAGAGCATCCCCCTCA
+CTGCCCTGCAGCTGGCCATCGTGCGCGAGACCCGCGCCGAGCTGACCCGCCAGGGGCTGA
+GGGTCTCGGCGCTCCAGGGCCCCCCGTCGCTGGAGGGGGGCACGTTCGGCGCCGAGCGCT
+ACGTCCGCGCCCGGCTCGGCGAGAAGCCCGCGATCCCGCTCACCCTCCTGGAGCTAGAGA
+TCGTCTGCCGCCGCCTGGGCCTGAAAGTCTCCGATCTCGTCGAGCGCGCCGAGCTCTCCC
+TCGCCGCCGGGCGCATCCCCGCGCCGCTGTGGCCGGAGGAGCGCCCCGAGCGCCAGCCCC
+ACTGGGGCGGCCCGAACCGCCCCGAGCGCGCAGAAACGCCGACGAATCCAGAAAAGTGAT
+AGAGAACACATACATGTCCTGACATCGGAGGACGTCCGCGAATCAGGCGGAAAACCGAAA
+AAACATCAGTGTAATTCGAGGTCAGGGCCACTTTTTGTCAGTGGCCCGTCCGATGATCTC
+CAGCATGAGTAAACAACCGACCACGCGCACCGAACCGAACCAGGACCCAGCCGCCCGCCC
+GAACGAGACCTCGCCCGAGCGCAGAGCGGTCGAGGAGACCGCCGCCGCGCTCGCCCAACT
+CGGGCTCGAAGCCTCCCCGCTATCGGCGACACGCCGAGAAGCGGAAAACGGCGACACGCC
+GACAGCACTTTTATCCACAAGCGAGCGGTTCCCTGAGCTGGGGGAACGATCCGATGTTCG
+GCGAGTCTCCCCAGAACCCCTCGCCGTGTTCGCCGGATTTCAGACGATTTCGGCGAGTTC
+CACACAGCCCTGTGGACAACTGCGCTTGACGATCGCGCCGAAATGCCTAACGTTCAATCA
+CATGCATGTGATTCAGCACTCGGAGGACGACGACCAGGCACTGCGGGAGCGCCTCGCCCG
+CCGTCCCTTCCACCCGTGGCGGGCGCTCGGGGCCGGCTGGCCGGAGGTCGTCGTCGACGC
+CTTCGCCGAGCTGCCAGACGGGGTCGGCTGGGAGCGCGAGGGGAGCTTGATCCGGCTCGA
+CCGCCGCCTCGACGGCGTGGTCCGGCGCAGATGCGCCGCCGCCGCGGCGCTCGCCTCCCT
+GGAGCGCGAGCGCTGCGGCTTCGCGGCCCCGTGCCCAGCCGAGGAGCGCGCGGCGGCGGA
+GGCCGAGGCCGCGCGCTGGCTCTTCCATCTCGCGGACCTGCTGCAAGCCTACGGCGACGC
+GCACGACCCGACCGACCGCGTCGAGCTCGCCCGCCTCCTCGACGTCACCGAGGAAGTCGT
+CAAAGCCCGGCTCGACGGCCTCACCCGCGAGGAGGGCGCGTGGCTGCACATCACGTTCTG
+GAGCGCCGCGTGAAGCCCGACCCCGCCAGCCTCCTCGCGTTCGAGCGCGCGTGGTGGCGC
+AGGGCCGCGAACAAAGACGCCGCTGTCCGCGAAGCGTTCGGGCTCGGCCCGATCCGCTAC
+TACCAGCTCCTCAACCAAGCGCTCGACGACCCCGCCGCCGTCGCCGCGCACCCGCAGACC
+GCCAACCGCCTGCGTCGGCTGCGCGAGGCGCGACCGGCGGCCAGGGCGCTCGGCGCGGCC
+TAGAGGCCCTCGCCTCGAACCTGTTAACGAGGGAACAGATTCGAGCTATAGTATCGAACA
+TTAGTTCGAATAACCGGCGTCGAGCCGGCCATCCCGAGGAGCACAGATGCCCAGACCCGC
+CACCCCGCTCGGCTGCTACGGCAAGATCAACACGAAAGAGGCCCGGCCCGGCCACTGGAC
+CGCCTCGACCTGGTTCCGCGACTGGGACGGCGAGAGCAGGCTGGTCAAATCCAGCGGCCC
+GACCAAGGCCAAGGCCGAGAACGCCCTCAAGAAGAAACTCCAAGACCGCCAGACCCCCGC
+CTCGGGCGACCTGGTCACCCCGGACACCACCGTCGCGGTCCTGTGGGCCGAGTTCCGCAA
+CCAGCTCGTCGAACGGCAGAAGGAGGGCTCGATCTCGGAGGGGACCATCGACCAGTACGA
+CCGCGCGGCGAAGAAGATCCAGAAGGGCCTCGGACAGGTGCGGATCAAAGAGCTCAAAGT
+CCAGCTGCTGCACAACTTCCTGCGCGCGCTCCCGAAAGGCTCAGCCCACCACTGCCGCAC
+GATCCTCTCCGGGATGCTCGCCCTCGCCGTGCGCTACGAGGCCCTGCCCACCAACCCGAT
+GCGCGACGTCCCCAAGACGACCGCCGGCAAACGCGCGCGCGGCTCCGAGTCCGCCCAGCG
+GCCCAAGGGGATCGACGACGAGACGGTGGAGCGCATCCTCGACGCGATCATGACCTCGGA
+CGCCCCGTGCCCGCAGATCGGCCCCGGCGGCGTGCCGACCCCGCGCAGCGCCTACGCCCG
+CAAGCACTCGCCCGACCCGACTCTCAGCCAATACGCCCAAGACGCCGACCTCGTCGACGT
+GATCACCTTCCTGCTCGGCACCGGCATCCGCATCGGGGAGGCGCTCGGCGTCCTGTGGAC
+CGACGTCGACTTCGAGAAACGAATCCTGACGCTCTCCGGAAAAGCTGTCAGGGTCAAAGG
+CCGGGGCATGGTCCGCGAATCCCACACCAAGACCGAGGCGGGCGACGGGCGGCCCATCGA
+GCTGCCCGGCTTCGTCCTGGACATGCTTCAGCGCCGCAAGGCCCAGCGCCATCTGATCGG
+CGCGAGCGGGTTCCGCCACCCCGGCAAGATCCGGACCGACGAGGAGCAGCTGGACTTGGT
+CTTCCCGGCCGCCAACGGGGGAGTGCGCGACATGAACAACACCCAGCGCCAGTGGCGGCG
+CGTTCGGGCCGCGCTGGAACTGCACTGGGTCGTCCCGCACGCCTTCCGCAAGACCGTCTC
+CACCGCCATCGACGAGGGCGGGCTCTCCGCGCGCGTGGCCGCCGACCAGCTCGGCCACGC
+CAAAGTCAGCATGACCCAAGACGTCTACATGGCCCGCTGGAAGCCCCACCCCGAGGCCGC
+GCAGCTCCTCGACGAGCGCTTCGGCGCGATGGTGAAAACGATACGTAAACATGACTTCAA
+CGAGGAAGAGGCCGTGGCGTGA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_014212.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1309 @@
+>NC_014212.1|provirus_1170297_1209132
+TTAAGCGGTGGGTCTGTCTTCCCTGGGGCCAAGCAGCTCGCCAACGGCCAGGGCAGCTTT
+TTTGCGCTGCGCCCTGAACAGATGTTGGTACGTTTGCTGGGTAAAAGCTACGCTGGCGTG
+CCCTACCCGTTCTGAGACTACCTTGGGATCAACCCCGGCCAGGGCCAGCAGAGAGACGTG
+AGTATCCCGTAAATCATGGAAGCGAATTTCTTTGACTTTAGCCCGCTTGATGATGGCTAG
+AAACTCCCGACGCAGGTTGCTCGGCTCGATGGGGGTTCCCACAGAAGTTGTAAACACCCA
+GCCCTCGTCAGTCCAGGCGTCCCCTATCCCCAGGCGATCCTTTTCTTGCTGCTCCCGATG
+TTGCTGCAATACCTCGAGCACATCGCTTGAAACGTCTACTGGACGGCTCGAGCGGTAAGT
+TTTAGGGGATTGAACAACCCGCTTGCTGCCGGCTTTGGTAAGGTTTTGCCGCACCCAGAT
+CGCGCCTTCCTGCCAATCAATGTCCGCCCACTTCAGCCCTAGCAGTTCGCCTCGGCGCAT
+CCCGGTCATGAGGGCCAAGAAGAAAAGGGCATACAAGCGGGAGTGCTGTGCCTCAGCCAG
+GAAACGCCAGACTTCCTCGGGCGTCCACACCTCGCCGGTGTAGCGTGGCGCCTGAGGGGG
+CTTGACCCGGTCCGCCGGGTTCCAGGGCAACAATCCCCAACGCACGGCGTCCTCGAGCGC
+GGCGTGCAAGGTCCGGTGCACCAGCCGGACGGTCGTTGGGGAGAGGGTTTTGAGCCGCTT
+GGGGTCGTTGGGGTGAATGCGCTTCTTAAGCAGATCAGCGTAAAGGTGAGTCAAGTGCAG
+CGGCTGTAAGCGCTGCACCGCTATATCCCCCAATATAGGGATTGCGTGTTTCTCAAGGGC
+GACTTTGTACCCGTAATGGGTGGTGGGTTTGACTCGGTGTTCTACTGAAGTCAGCCAGCG
+CTCACAAAACTCTTTGAGGGTGATCCGGTCGGGGTCAGGGAGCAAATTGCGGCCATAGGC
+CACCAGCAGCTCAGCCAGCTTCTTGGCGGCTTCTTTGCGGGTCTTGGCGTACCCCCGGTG
+GCGCTTACCGCTGATCATCAACGAATACTCGTAGCGCCCGTCTGCGCGTTTGTAGATGGT
+GCCTTCATTGTTGGCGCGTTTCATAGGTGGTTGTGTGGCGGGGGATGGGGAGGGGGGAGG
+GCATGGGTCAGTTCGTGGGGTCAAGTACTATCGAATCTTGGTCAAGACCCACACGCGTAC
+TTGTTCCAAGTTTTGCGATCTGTGTACCGATATGTGCTTCCCCAAAATTCAGCTAGTTCA
+AGTTGGGCGGTGCGCATAGCCGGGTTATAAGTAGCAATTACGCTGAAAGGGCTGGTTTGA
+CCGTTAAGCACTGGCTGGTAATCTATAAGAGCATCTTGAGAAGTAATGAACTCGTCGTTT
+TTGGTGAAGAAAGAAACTTTAGCAACAACTTTATCCAAGCTTTGGCCTGACACGTTTGTC
+ACCCTACCCTCGGCCTTTACAAAACTGTCGCCAATCTGACTCCAATGCCAATCCTCAATG
+TTGACACTCCCACGGCTAAAGCACGTGGGATTCTTGGTTCGACGAGGACTGCCTACGTTG
+TGTAGGTCTTACACCCTCTCCCCAAGCGTTTAGCGTCTCCGGGTGCCCCACGGCGACGGG
+GATAGCTCGTATCCCTTCGGCCCGGATGTTCAGGGCCGCGTTCAGGTCTCGGTCGTGCAC
+CGCCCCGCACTCACAGGTCCAAACCCTGTCCGAGAGGGTGAGGGCGGTGTGGATTGTCCC
+GCACTCCCGACAAAGCTTGCTGCTGGGGAAGTATCGGTCAATCACGACGAGATGTTTGCG
+ATACCAGACCGCCTTGTACTCCAACTGCCGCCGAAACTCACCCGGGGCCGCATCTAGAAC
+CGACTTGGACAGCTTGGTTTTCGCCATCCCTTTCAGGTTCAGGTCCTCGATGCACAGCCC
+GTCGTACTTCTGGACGAGTCCGGTGGTCAGCTTGTGCAGCCAGTCCTGCCGCTGGTTGCG
+AACCTTGGCGTGGACCCTGTTCAGCCGATGCCTGGCCTTTTCCCGGTTCTTGCTACCCTT
+CTGCTTGCGGGAAAGCTCCCTTTGCGCCCTGCGAAGCTTGCGCTCTGCTTTGCGGTAGAA
+CTTGGGTGGAGCTATTCTTGTACCGTCGGAAAGCACTGCGAAGTCTTTCAAGCCGAGGTC
+AATCCCCACCACATGCTCAGGGTTTACGGGGGGCAGGGGTACGTCGGGCATCTCGAACTC
+GGCGGTCAGGGTGACGTGCCAGTGCCCTTCGGTGTCGCGTTTGAATGTTGCGCCTTTGAT
+GACGCAATCAATCGGCTGGCTCTGGCGAATCTTCACCCCACCGACCTTGGGGAGGTAAAC
+CTTGCCTTCCTCCACCCGGACGCGCTGGGGAATGCGGAAGCGGGGCGGGTCCTTCTTTCG
+GGTCTTGAACCGGGGGAACCCGGCCCGTCGCTCGAAAAACGCCTTGAACGCCCGGTCGAG
+GTCTTGGAGGGCTTGTTGCAAGAGTTGGCTATCCGCTTCTCTGAGCCAGGCCATCTCAGG
+CCGCTTCTTCAGGGCGGTGAGTTCGGTGGCCTGCCCGTTGTAGGTCAACCCCTTCCCGGT
+GGCGGCATACGCCTCCTTGCGCCGTGCAAGGCCCCAGTTCCACACGAACCGCCGAGCTCC
+GGCCATACGCAGCAAAGCCTCAGCTTGGGCTTGGGTGGGTTCCATGCGGAAGCGGTAGAC
+CTTGCGGAGCAGCATTCAGTCCCTCGTCTTCTGGGCGGCGATGTATTGCTCGATGGTTTT
+GCTACTGACCATGCCAGCCGTGGAAACGAAATAGCTCCGTGTCCACAGGGCGGGAAGGCG
+GATGAGTTGGGGAAACTCCCGGCGCAACACGTGCGAGGTGTAGCCCTTCAGGCGGTGGGC
+GACCTGGTTAGGGGCCACGTCGGGGTCTACCGAAATGAACAGGTGTACGTGGTCGGGCAT
+GATTTCCAGGGCGATGATTTCCCAGCCTAGTTTAGCGGTCTTCTCCCTAAGCAGAATATC
+CAAGCGCTCGGCCAACGGTCCTACCAGAATCTTGCGGCGGCGCTTGGGCACGAAAACGAA
+GTGGTAACGCAGCAGCGAGACGGAGGTGTTCTTGTGTTTGTAGGCCGTAGGCACTATCAC
+AGTATAGCACACCTGCCGCCCACCATGCGATGTGCCCCTGCGGGGCACATGGGGGAGTCC
+ATGTATCCCATCCCTGAAGGGAAGGGTTTTATAGCTCCCCCACACCCCCTCGCTTCTATA
+AGATTGCTCCTAGCACCCAGCCCCAACGTTTCCCCTTGGGTTTACGAAAAGCGAAAACCA
+ACAACCCTATGAAAACGATTGGCCATAAAAGGTATAGCATATCTCCCTCCAAAGCTTCAC
+CTAATCTATTTTGAATTTACATCAATGTTCGTCCAACTTAGGGTCATTTGCCATTCAGCG
+TTTCAATCCTCACTCGAGCTTTCGCCCGAGCGCAACTACATTTTCCGCACCAGGGTAGCT
+GCCACCCCAAGGACGCGGTCGTTATCGGTAAGAGGAACCGGCGGGTGGTCGGGGTTATCA
+GAGTAGAGGTACCAGGAACCGTTGTAGCGCTGTAACCGCTTGACGATGACCCCATCCCAG
+TGGACATGCACCGCCACGATGCGCCCCGGCTCGACTGCTCCCCCGGTCCAGAACACCACC
+ACGTCCCCGTCCTTGAGCGTGGGCTGCATGGAATCCCCACCGACCCGCACAGCGAACAGT
+TCAGACTCCGGCTTGCCTTTGAGGTCCGGGATGTGGAGAGTGATGTATTCGGCGTTTTCA
+TTCCACATCGGCGGCCCGGCTCCGGCATCTACGACGGGGATACGATACCGCGTCACCGGA
+ATGGTAGCAGTGATTTCCGACCCGGGGAGCTGGATGCCTGTCTCCTGGGAAAACTCCTCG
+GGAGTCCATTGGAGAACATCCAAAATGCGCTCGAGGGTTGTGGGCTCCTTATATGCTAAA
+TAACGAACCATTGTGTCTACACTAGGGAGAAAACGCGCTCCTGCCCACCCCGGGCTTTTA
+CCTACTCGCTTAGAAAATTCAGCTTGACTAATATCTAGTTGTTTCAAACGAGCCTTGATC
+GCTTCTGCGGCTTCTATTATTGCCACCATACCCCCTCCAGTCAAATACCTTTGGTATTAG
+GGTAGCAAATAAATAACTACTAGTGGTATTGACGCAGCGATTCGTATCGACTACAATGTG
+TAGCGATGATAGGTGAACGCCTAAAAGCTCTTCGAGAGGCACGGCAGATGTCACAGTACG
+ATCTGGCCCGTGCTGCGCATGTCAGCCAAGGGCTAATCTGGCAAATTGAGGCCAACCGTA
+AAAATCCTGGCTTGAAAACGCTATTGCGGCTAGCAAACGCCCTATCTGTATCTCCTGACC
+AACTACTACCTGTAGTATCTCATGTAGGACAGGAGGCCCCCCGATGACTGACCCCACCCT
+CATCTGGCAAGTAGCCGAATCCCTCGGCTTTGGCCGCCGTGTGACCTACACCCCGGATGA
+GGTAGCAGCCATTTTGCGCATGGGCCGCAGGCAAACCTACGAGCAGATTCGCTCGGGGCA
+TATCCGGGCTGTCCGCAACGGTAGCCGCTGGCTCGTACCAGTCAACGCCATTGCGGAATT
+CGTTGGGGCAGGGCGGGAGGCCATCTCCCGATGAAATGTCCCCCGCTAGCGGGCGGGGGA
+GGAAGGAGGAGAAAACAATGTACAGGGACAGTATAGCACAACTCGAACGGGCCAGGGCAG
+AGCTGGCCGAGATGGGCAACCCATACGCCTACCCCGTGCGGGATTGGATAGACGATCATC
+TGCGGCATCTGGCCCTGCAGCGTTATCAAGCGCTGCAGGAGGAGGTCGCGGCGATTGAGC
+GGCGGTTGGATAGGGAGGTGGCGTGATGCCTAGCCCTATGCGGCGCCTCGAGAAGGCCCT
+ACGGATCGCTTTGGGCCGGGCGCACGGCGGCGATGCTGCATACGCCGTGCAAGTAATCGA
+AACCCTCGAGACCGACGCCGAAGCCCCCGACTACGCCCCCCGCCCCTATCAGGGGTGGCG
+GGATGCCCGGCGGCTCATCAACGAGATTGAAGCCCTCGAGCGCTCAGAGGGGGTTGAGCA
+CGTCCGCATCAAGCGCCGGGTTCCATCGGCCTACCGAACCGGAGAGTTTTATGTCTAAGC
+GCAGATTCGACTGGCCTGCTTTCTTCGCGGCCTTCTTTCTGGCCCTCATCGCCTGGGGGA
+TCGCCTTCGGCATCCCCTGGGGCCTGGATTGGATGGATCGGAGGCTGCCCTGATGTGGTG
+GCCCGACGACCTCCGCGATTTCCGCCGTTTCCGCGCGGTGTATGGCGCGGGGCAGTTCCG
+CTGGGGTAGCCCCGCCACCACCCCGGCCAAACGACCAGGGGAGACCAACACCTGCCAGAC
+CTGGACCGAGCGGCAGGTGTTGCGGCTGGCGCGGCTGGGGGAGCTTGATTCTGATCGGCC
+AATCGCGGCGAGCGCCGCTGGCAATGTGTAGCCCCAAGGGGGCAAAAGGAGTGTGTGTAT
+GCCGTTTGTGATGGAAAAACCGCAACAAAATGACTTTGGCACTGAAAGCGTGGTCTTCCC
+CCCCAACACCCCACTCGAGTTCACCCTGGAGAAGATCGAGGCTGGGCTTTACGAGCCCTT
+CAAGCCCGACGGTAGCCGGGATCAGCCTTATCCCCATTTCCGCTTCACCTACAAGGACGC
+TGAAGGAGACATCTACCAGACTCAGCCGATGCGTTTTCCTCGAGCGTTCCAGTTCAACGA
+AAAGGCCGGCTTTTGGAGGCATATAGGGGCCCTTTTTGGCCGCCCACTCACCGAAGAGGA
+CGCTGGAGCTGTGGAGATCGATCTAGGGCCGGGCTTCGACACCTGGGAGGACGTGCTATC
+CCGAGATAAGATGCCTAACTTGTTTGCCAAAAAAGACGAGGTGCGCCCGCTCCAGGTTAG
+GAGCATCAAGGTCCACGGCAAGGAACTGATCAGCTCCGATAGCAAGGTGCTTTTGATGTT
+CTCCACACAAAAGAAAAAAGACAAAGACGGCAAGCCCAAGCGTGACAGCAACGGGGATGA
+GATCGAGTACAGCAAGCTCGAAAGCGTATTTCCGATTTCCAGTGGTGAGAGCGGCAAGAA
+GAAGCGCCCCGTTTAGGAATCCCGCAAGCCCCTACCCGGAATCCTGGGTAGGGGCTTCTT
+GACGCTCGAGGGGACAACTATGGACCACAGCAAACTCACCAAACTCACTGGGGTGGGACC
+CGCCTTGGCCGAGCGGATCGCCAATCACTTTGGGAGTGAAGCCGAAGCCCTGGCGGCCTT
+GTCTGAAAATCCCTATCGGCTGATGGAAGTAGAAGGCATCGGTTTTCGCCGGGCTGACTG
+CATTGCCCAGGCGCATTTTGGGATTTCCCCTGATGACCCTATCCGGCACGGCTACGGCAA
+CGACTGGGTTTTGCGGCAAGCCGGGGGGCGGATGCCCCTCGACCTCTACCAGGCCAGACG
+AATGGAGATCGGACTCTTTGATCGTCGGTACGAGCTATGGGGAGCTTTTTGTGACATCCT
+CCTAGAACCTGATTTGCAAGATTCCCCGGAGTTTGCGCAGTACGTTTGGCTAGAGCCCGA
+GCTTAGGGCCGAACAAAGTTTGGCCCGCTTTTTGGTAAAGGCGACGCGACCAACCACTAA
+CCCTTTTATCATGCCTAACGGCATTCCTACTTATCTAAACGAGGCTCAGGTAAATGCGGT
+ATTGAAGATGTCCTGCCCCGGATTTGTCCCCGCTCTTTGCGTCACGGGCGGGGCAGGGAC
+GGGTAAGACCACGGTGATCGCTGAGGCAGTGAGGCGGTTAGGGGCCGGGGCAGCAAGAAT
+CATGACGTTTACGGGAAAGGCCGCCCAGCGGGTTAGGCAGGCACTCGCTGGGCGTGGTTG
+TGAGGATTTTGCCGAAGTCAGCACGCTGCATCGCGGATTGGATTACAAACCCGGGGAGGG
+ATTCCGCAGGGAACGCTTTACGGAGTCCGTTGTAATCATCGACGAAGCCAGCATGGTGCC
+CAATTGGCTGCTGGCCCAGGTAGTGACGCGGCTAGAGCCCTTGGCAACGCTGGTGCTAGT
+CGGCGACGTGGCTCAGTTGCCGCCAATAGACGCCGGGTTCCCCTTCAAAGACTTTATCGA
+CGCTGGGGTTCACACCGTAACTCTGACCCAAAACTACCGCCAGGAAAACCAGCGGGAAAT
+TTTTGAGCTGGCCGAAGCAGTACGAACTCGAGCCCTCCAGCCCCCACCTTTGCATGCCTC
+GATCTGCGCCACCAATCTTTCCGCCTACGAGTTCAACTACTGGTGTGAAGCCTTGCTCGA
+CCCAGATCAGCTACCCCCTTTGCTGGACTGGCAAGCCATCACGTACAGAAACGCTGACCG
+CGAGCGGATCAACCTGGAGTTGCAAAAAATATTCAACCCCCACGGGGGGAAAGCTTTCGA
+GTACTGGCCCCGCGCCCTCCCCAAGGAAGAACGAAAGCCGATCACGGTAAAGACGGGGGA
+CAAAATCGCGGTGCGGGCAAATGTTTACTCCCTGGAGGTGATGAACGGTCAGACCGGGAT
+CGTCCGGGATGTTAAGCTCGACCGCGAAACCTACGAACCGGTTTCGGTAATTGTAGAAAT
+TGAAGGACGAAGTGTAGAAGTTCCGTTGGAACTGGCTCCAGATCTCCTCGAGTTGGGCTA
+TTGCATCACCACTCACAAGGCCCAGGGGTCGGGGTGGAAGGAGGTGTTTATCTTGCAGCC
+GGGGGCAGTTGGGTTTGACTCCCGGCGCTGGTGGTATACGGCGATCTCGCGAGCTGAGGA
+ACAGCTCGCAATCCTCACTCAAATGGGAACCAGGACCTGGTGGGCCAATGCCACCAAGCC
+TATGCCCTTCGAGCCGAGCAGCTTGCTCGCGCGGTTCCAGCGTTACGCCTCCCAGCCGGT
+GGGGGTTCGTTGATGCCTGGGGCCATGGATACCCACAGCTTCCGCCGTCGTCTGGCTGAG
+GCCATGAGCGAGGCGGAAATCCAGCAAGGGATTGTGAGGTACCTACGGGCTACGGGCTGG
+GTAGTACTGGAGATCAAAGGCAACGCCAAGCGGGGTGGGACGGTATTTCAGACTAAGGGG
+ATCCCTGACCTCTATGCCGCACGAAAGGGACGCAGCTTGTGGCTCGAGGTCAAACGGCCC
+GGCCAGAGGCCGCGCCCCGAGCAAGAAGCGCTCCATGAACGTTTGCGCCAGGAAGGGTGC
+GAGGTGCACGTCATAGACGGGATCGAAGCGCTGGAGAAGCTGTTATGACCGGAATTTTAA
+CTCCTCCTACCACCTACGCCTTTTTCCAACACCTCAGGCTTCCGGAGGAGCGCGGGTTTT
+TGGAGTTTCGCGCTTTGCCTTCTAAAAAGCAGAGTTGGCAAGAGTGGCCCCCGCCCGAGA
+ATTTTGATGGGCTTTATGAGTTTCCTCGCGAAGAGATCTACTTCGGAGTTCTCTTGCGCG
+ATACCCGCAAGGGCAACGCCGCCCACGTACGGCGAGGCAGTGTTGCCTGGCTCGAGCTGG
+ATTTAGCAGGGAGCCTTTACCTTCCCGATTGGGACAAGAAGAGCGTGAAACAGGCACCCC
+CCGAGATCCTTCGCCGGAGCGCGGAGCAGCTTTGGGCGGACCTGGAACTCGAAGCTCGAG
+AGCTGGGACTACCCCCGCTGGCCGCCGTGTATAGCGGGCAGGGGCTACATGTGTACTGGG
+GGCTGGACACTCCCCAGGAGGGGAAGTGGTTGGAGGGGCTCAACAAAAGCTTGATCAAGC
+TGTTTCGCTCCTATAACCCCGAGGAGTCCGCCTTCGACCGCGCCAGAATCCTGCGGGTTC
+CCGGTACGTGCCACAGTAAAAACCCTCAGCGCCCACTGCCGGTCGAGCTACTGTACCTAG
+GCGACGAGCGCCTCCCGCGAGAACGGCTAGAGGCGATTCTGCAGGTCGAGGATCCTCCAG
+CACTCCCCCCGTCGCTGGAACGGGCCATGCGAGCCGGGCTCTCCCCCTGGGAGCCCTCCG
+AGCACGATTTACGACTACTGGTGGAGCACTGGCATGTCGGTGAGCGTAACCAAAAGGCCA
+TGGCCTTTGGTGGATGGTGCGCCTCCCACGGGGTGCCGGAGAAGGTGGCGCTGGATTTGG
+TAGAGCGGATTTGCCGCGAGGCAGGGGATGAGGAGCCCGCCAACCGCCGCAGCGCGGTGG
+CCAACAGCTACCGCCGATATCAGCAGGGGCTGTCGATTCTGGGGTTTTCCAGTTTGCGTA
+AGCTGGTGCCTGGCCTGGAGGGGAAAGGCCGAGTGAGCCTGGGAATGCTTTCCGCCTCCG
+AAAGCGAGGCCCTGGAAGGCGCCGTCCCTGGCGAGAGCCTATCCCTCCCTCCCGAGTACC
+GCCTGGACGAGGCGGGGCGGCTGGTAAAGGTCGAAGTACGCAGCACCCGTTGGGGGATCG
+TGGAGGACATAGAGCTACTGGCCCCCCGCCCCATTGGGGTGCGCGAGGTGTACACCGACC
+TGGCCACCGGCGAAAAGCATTTGCGGCTGTTCTGGCCCGACCTGGATGGCACGGTGGTAG
+AGCGGCTGGTACCGATGGGGGAGGCCATGACCCGGCAAGGGCTGTTACGTTTGGCCGCCC
+AGGGGTTGCCGGTGGACGAACCCAATGCTGCCCAGCTATCGCGCTTTTTACAGATGTACC
+TCTCCCACAACCGCTGGGCACTACCGCACCGGCGAGTCACCTCGCACCTGGGCTGGCAGG
+GAAAAACGTTCATTTTACCCGGCGGCGATGTAGAGGTGCTGGAGGTAGATTCCGAGCCTT
+GGCGCCCAAGGGGCAATCTAGAAGGGTGGCTGGAGGGCCTGAGAGCCCTTCTAAGCTGGG
+GGGTGACCCCGGCCCTTATCGCAGCAGCCCTCAGTGCGACGGCGCCCCTGGTGCGAGGCG
+CGCGGCTGGTCAAGAACCCCATCCTGGCGCTATCCACCACCAGCCATTCGGGGAAGACCA
+CGGCGGTGTACTTCGCACTGAGCATCTGGGGGAGCCCAGAGTACAACGAAACGCTCTACC
+TCGAAGACGCCACGGTGAACGGATTGATGGGTCGAATGATGGCCCGCCAGGATCTGCCGC
+TAGGTTTAGACGACTTACAACGCTATGACGACCGCAAAGTAGGGGAACTGGTGCACTTGC
+TTTCTGGAGGCGCCGAAAAAGCCCGGCTTAAGCGCGATGGCAGCGAGCGCCCGGCCCGGC
+GATGGCGAGGGGTGGCCTTGCTCACTGGAGAGGTGAGCGCATTGCGGGAGACATTGGGTT
+CAGGGGCGGTGAACCGGATGGTGGAGCTCGATGACTACCCTCTGGGGGTGGGCAAAGGAC
+CGGAGGGGGCCGAACGTTCCCGAATCCTGCGCGAAGCGGCTCAGCATTGGGGGCAGGCAC
+GCACCCCGCTGGTCGAGTTGTACGCCGACCTCAACGTGCGGGAGGTAATCGATGCCTTAG
+GCCGATTGGCCTTGGAGGCCGGCGCCCCGGCAGATATGACCGACCTGTGCGGGTTGGTGG
+GGCTAGGGGTACAAATCCTTCAAGTACTTGGAGGGTGGGAGGGGGAGAGCCAGGATGAAG
+CGGCCGTGACCTACTTAGCCCGCAACCTGGTGGAGCTGCGCGAGCGGCACGGCAGCCTGG
+CAGGGCGGGCGATGGAGGCGCTGCGCGACTTCCTGCGCAGTTATGCCGGAGCGGGCGATC
+AGCCGACCGATGAGATCCGGGTACGGGAGGAGCTACAGGCGTTTTACAAGGGGGGGAGCT
+GGTTCATCAACCCTAACGGGCAGGAGGTGGAGCGGGTCATGCGGCGGTATGGAGGGTTGG
+AAGTGCATCTGCCGGAGTGGGCTCGAGCTGGGTGGATTGAGGTGGAGCAGGTAGAGGGGA
+AACGGCGCTATAAACCGTTGGTTCGGTACAAGGGAGAGCGATATCGTTGGGTGGCCGTTC
+CTTTACTTGATCACGCGGAGGATGCTGATGATTGCTAAAACGTCACCACGTGGTGACGTT
+GTGGTGACGCTAGTGGTGACGGTTGTTTTTTTGTGTAGGACGAATAAAACACAATGTGTC
+ACCACCGTCACCACTCTTTATTTCATTTCTATACGCGCGCGTTTTTTTGTACCAGGGGGA
+CCCCCCTACTTAATTAAGTACTTAAGTACCCGGTTAGTAGGGGGGGCAAAAATTTTTGCC
+AAATTTTCTTCTATAAACTGCTTGTTTTAGTGGTGACAGTGGTGACGTTGGGGGATTTCC
+CCGTACAGAACGATAAAAAAGCGTCACCACTAGCGTCACCACAGTGGCACCACCGCAGTG
+ACGGGGGGATGTATGACTGAACCCACCCTCCTCCTCCGCATTGCCCGGTTCTGGGGTGTC
+TCCCTTGCTGACCTATGCCGCCAGTTGCAACCAGAACCGCCGTTGCGCCGGATGGTTGGA
+ACGCTATGCCAGGACTGTTTGAACGGTTTGGAAAGCCACGGCCTCCGCCCTCCGATACAT
+TTGCTCAAAGAACTGCGGACCAATCCCCAGAAAAAGCGCTACGCGCTCTTGCTTGGCTGG
+TTAGAGCAGTATCGGCGTTGGTGTGAGCTGAGTAAGACTCCCTGGACAGAACGCGGGGCC
+GTCCATCAAGAAAACCAGGCAGCCCGGGAAGACCTGGGCTGGCAGATTTACCTGGTGGAG
+TCGCTAATTCAGGAAACTCCCTACCCAAACACTGTCTCTAACTGGATAGAAACGCTCATC
+GGCCTAGAAAAGGAGGAACCTATGCCCATTCAAGGAAAAGTCGCAAACACCAGCTCGCGC
+CTGCACGACCTGGCTGAGATCGAGCAGGCCATTCACGAACTGCCCGGCCAGGTAGAACCT
+TGGGACGCTGACCACAAAATGCTCTACACGTTGTTGCTGGACATCCGCTGCGCCCTGCAG
+ACCTACGGTCCCCGGCACGATCCCACCAGCCTTGAGCAAGATCCCGTCGAAGCGCTCCCT
+GATTATCTGGAGATGTACCGGGAGTATTTGAGTAACTTGAAAGATTCAGACGGAGCTCGA
+ACTGACGACGAGATGCGATATGGGGCTCGGCTGGCCTGGCGAATCTGGCAGATGCTCGAG
+CGCCAAGGGGCTACCTACGAAGATTTAGCAAAGCGAGTGGCACTATTATCTGACCCTTCC
+GCGGCCTAGCCGCGAGGTACCGCCATGCTGAAGGTCCGACCCCTGAAAGCGACAAAGGAC
+ACGGGAGTAGCTAGCCCCTGGGGAGCGGCGGGGGCGACTATGAGGAGGGATTGATTGCGC
+TATACTGAATCCATACACCCCGCTCGAGGGGAAACGGCAGGAGGAGCTGCCATCCCCGAG
+GGCGTGTTGCTCATCCCTGGTAGACCCCAATCCAAGCTCGGCACCCCCGAGTTCGAGCGC
+TGGCGTATGCACGCCAGCCGGGCTGTGCTCGACCAAATCGACAACCCGCCTCTAATCCCG
+TCAAGTTTTCTCGAGCTGGCCCTCGACTTCTACTACCCCTTTGAGCAGCCCAGCTACACT
+GCTGACGACCTGGCCGAGCACCGCATCCCCCGCATCACCGCGGCAGCTGAGCCGGTGCTG
+ATCGCCCTGGTCGGGCTATTGTTCCAGCGTCGAGGGCAGATCAGTAGCCTGAGCGTCACG
+CGGATTGTGCGTCCTGCTAGCGCCCTCGAGGCGGAGTGGGGCGAGGCTTGGCGTAGGGGT
+GGGGTGCGGGTGCGGTATTGCGCGGAGGATGAGGGGCCGTGAGCAAGGAACCGCACCGTC
+CGACTCTTAAAAACCCACGGAGCCGACGCGGGGTGCCTCCTAGCGAGGAACAATGGGAAG
+TTTTCCTGGAGGAGCTGCGCCAGCACGCCACTGTCAAACGGGCAGCCAAAGCGGCTAAGA
+TCCACCACTCCACGGTGTACGAACGTCTGGCTAAAGATGAGGTTTTCCGCCGTGTGGTTG
+AAGAGGCCCTCGAGGTCGGCGCGGTTGCGCTCGAGCAAGAGGCCATCCGCCGCGCGGTCG
+AGGGAGTCAAGGAGCCCGTTTTTTATCAAGGGCAAAAGGTTGACACGGTAACCCGCTACT
+CCGATACTTTATTGATTTTCCTGCTCAAGGGGCTCAAACCCGAGCGTTACAAAGATCGGC
+ACGAGCACACCGGCCCCGGTGGCGGCCCGATTCAGGTGATCAGCATCGAGGTGGTGCCCC
+CCGATGACGCTTGATCGCGATTTGACCACTGTGACCCCGCAGGGCAAGCTGCGCTTCAAC
+CTGCACCGCGGCCAGTGGAAAGCTTGGCAAAGCTCAAAGCGCTTTGTGCTGGTGCTAGCG
+GGTACCCAAGGCGGCAAAACCAGTTTTGGCCCGCTTTGGTTGTACCGCGAGATCCAGCGC
+AAGGGGCCGGGGGATTATATCGTGGCGACTCCGACTTTTCCCCTACTCGAGCTAAAGCTG
+CTGCCGGAGTTTCGCAAGCTTTTCGAGCAGCACCTATTGCTAGGTCGCTACGTCGGATCA
+CCCAGCAAAAAATTTGTCTTCAGCCCGGAGGGCTTCGAGCGCACGTTTGGGCGTAGGCCA
+GGGCCGGACGACGCGCCGGTGCAGGTGTTTTTTGGCCATGCCCAGGACCCTGACTCGCTC
+GAGTCTGCCACCGCCAAAGCCGCGTGGCTCGACGAGGCGGGGCAAAAAAAGTTTCGGCGC
+GACTCCTGGCAGGCCATTCTGCGCCGCCTTTCCATTCACCAAGGCCGGGTGCTCATCACC
+ACCACGCCCTACTATTTGGGCTGGCTTAAGGCCGATTTACACGACCCCGCCCGGCAAGGC
+CACCCTGACATCGAGCTGGTCAATTTCAAATCGGTGGACAATCCCAATTTTCCTCGAGCC
+GAGTACGAGCGCGCTCGGGCTACCTTGCCGCGCTGGAAGTTCGATATGTTCTATAACGGG
+CTCTTCACCCGGCCAGCAGGCCAGATCTATGACTGCTTCGACCCCGAGGTGCACGTTCGG
+CCAGCCTTCAATGTCCCCGAGGACTGGCCGCGCTTCATAGGCCTGGACTTTGGCGGGGTT
+AACACCGCGGCGGTCAAGCTCGCCAAAAACCCGGCGTCCGAAGAATATTTTGTTTATGCC
+GAGTACAAAGCCGGCGGGCGTACAGCCCGGGAGCACGCTGAGGTTTTGCTGAAGGGCGAG
+CCCCGGGCGCCCCACGCGGTGGGCGGGGCCAAGTCGGAGGGGAACTGGAGGCTCGAGTTT
+GCCGCGGCGGGCCTGGGTGTGGCCGCCCCGCCGGTGGCGGATGTCGAGGTGGGTATTAAC
+CGGGTATACGGGCTGCTCAAGAGTGGGCGGTTGTACGTCATGGATAGCTGCCCCGACCTC
+ATCGACGAGATCATCAGCTACAGCCGGGTACTCGACGAGAACGACGAGCCTACCGAGCAA
+ATCGAGGACAAAGAGACCTATCACCGCGCCGATGCCCTGCGCTACATCGCCACTTATCTC
+GCGCGCGGCATCAATGACTGGCAAGTGAAAGGAGAGCACGCCGGATGAGCCAACGTTTTG
+ACGTGACCGGTCAGAGTGTCGGGTGGGCCGAACCGCCCCCCCTCGAGCTGCGCCTATCCC
+CCGACGCGGCCACCAACCCCCGCATTGAGGAGAGCTTGGCCAGCCTCACTGCTTTTGAGG
+CCACCCCCATCCCCTGGCCGCTGGACCCCGCTACCCTGATCGACGTTTGGTACGGGAGCC
+CCTGGCTGGGGGCCATCGGGCGGCTATTAGGGGACGCTCTGGCATCGGCCAATTACGACC
+TCGAGCCCGCCCCTCGCCGCCCCGACGGTACCCGGTTGGGCCGGGGGTCAGGGCAGACCC
+CCCACGATGAACGGCAGTACGACCAGGGCATGGCTTGGCTGGAGCGCGAGGACCTGGGCC
+AGGACGGGCTCAGTCTCTACAGCCTGCCCGAGCTAGCGCGCACCCTAGCGCTGCACCTGG
+ACCAGACCGGCAACGCTTTCGTGGAGGTGGTGCGCGACCGGGCCGGTAGGGGCCCGATCC
+GGCTCGCGGTTTTGCTCCCGCAGTTCGTGAGCTACGTGATCCGCCGGGAAGACGGCATCG
+CTAAGCCGATGCTCTACCAGCTCGATCCCTACTGGGGCCAGCAGTGGTTCATTCCCTTTG
+GCACCCGCCTTCCGGGTGCGCCCGAGCGCGAGTACCTCCATCAACGCCTCCCCAACAGCG
+TGAGCAACGTCTACGGGCTGCCCCCCTGGATCGAGGCCCGGCAGAGCGTGGAGGTGGACA
+ACGCCCACCGCGCCTACTTGCGGGGGTTTTTCCGCTCTCACGCGGCCCCACGCTGGCTGG
+TCGAAATCACCCAGGACCCAAGCTGGACCGGCCCCCAACCGGCGCAAGAGCAGGTGGACC
+AGGTACGGGCCCTCATCGTCAACTACCTCTCGGCCAACGCCGGGGAGATGGCCGGGCGGA
+ACCTAGTGCTCTCCTACCCCGGGGGAATCCTGCTGCGGGCCACCCCGATGGATCAAAAGA
+TCGATGATCCCACCTTCGGGACCACCGCCAAAAACGCCCGCGACGAGATCATGGCGGTGC
+GCCACGTGAGCCTCATCAATCTGGGGCTTCCCGAGGGCGGCTACCGGGCTACCGCCGATC
+AGCAATCCGACAACTTCGACCGGCAGGTACTCGAGCCCTTCGCGGCCCCCCTGCTGGCGA
+TGTTCAACCGGGTGTTGCGCACCCCGCCGCCCTCTGGGCTGGGCATTACCGACTACCGGC
+TGGTGGCCGAGTTCCGCGATGTGGACATCCTTCAGCAGCGCATCGAGGCAGTGATTAAGG
+CTGCAGGGCGCCCCGTGCTCAGCGGCGACGAGGCCCGTGAGCTGCTGGGCTACGAGCCGC
+GCGGGGACGACGAGGTGCTAGTGCCCGCCGGGCTGGTCCCGGCGGGCAGTTTGGTCCCCC
+CACCCGGCCCCGATGATGGCAGCCCGGAATAGCCCCCGCACCAGCCGCCGCCACCTAGCT
+GAGGTCGAGGCGGCGGTGGCTGAGTACGCCGGGTTGCTATGGCAGCGGGCGGCTGCCTGG
+CGGCTACGCTGGTTGCGCTTGGTGCTGCGCCGGATTCGCCCCGCCCTGGAGCGCTTGATA
+ATCGTGCGCACCCCGCCCGAGGCGGTGCTGCTGGAGCAGCTCATCCGGCAGGCAGCCCTC
+GAGTTCCCCATCCCCGACCTCAGCGACACCCTGACCGAGCTGGGGCGGAAGATCGCTCTG
+CAGTATGGCTTCCTCCCCAACGACCCGCGCACGGCGACGCTCGAGCGGGAGTTCAAAGCC
+CTGCTTGAGTCCGACCTCTCGAGCTACTGGCGCACCCTCACTGACCCGGCTACCCTGGCT
+AAACGATTGGCCGAGCTGCGCGATCAGAATAAGAGCACTGCCCAGATCATCCAGGCCGTG
+CAGCGGGAATACGGCGCTGAGTATTTTTCCGCCGAGCGCCTGGTCCGAACGCTCTACAAC
+TCGGGGGCTAACCGGGCTCAGTACGAGGCGCTGCTGGCCCAGGGCTACACCCACCTGCGC
+TGGCTCACCGCGCGGGACAACCGGGTGCGCGTAGCCCACGGCTCGTCGAGGTTTGACCAC
+CGCCGCATGGACGGGGTGATCGTGCCCATTGGGGAATTTTTCATCACCCCATCGGGCTCG
+AGGCTGCGCTACCCGGGTGACCGCAGCCTGGGGGCTCCGGCGGGGGAGGTGGTGAACTGC
+CGGTGTACGGTGGTGGGGGTGGCACTTGGGAACGAGAATGCTCAACTATCGCGCAATGAC
+TTGGATCTTCCCGCACCTCCCGCCCAACCCCGCCGTCAGGATTAGGTTCCAGTAGGCTCC
+CCCTGGCGAAGCTTTCTGCGTCTGCCCCGCAAAAAACTCCTCGAGATCGACCAAGAGGTC
+TTCGAAGTAGTAGAGGAAGCCGCTGCTATCGCTTCGAAGGTTCATGGCTTGCAGGGGCTA
+CCTCGAGTACCGGTAGTGCAACGGTTGCTGGATCGTGATGAACTTGCCCGTTACGTCCCG
+GACCCGGAGACTGGAGATCCGGCATACATCGGAGTTCAGAAGGGCAAGACCACCTTGCTG
+GCAGTCCTGGAAGAGTTTGGCCACATGATCGATCATCAAGCATTTTTTCGGGGCCAGTAC
+GCCAGCCGCGCTGCGCAACAAGGCCAAGGGCCGCTGGTTAGGTGGTGGGAAATTGTCTGG
+GAAACTCAAGCGGTTAGAGAGTTGCGCTCGTTAAGGCGCGCGTTTTACACCTTCGACATT
+GAAGGGCGGAAAAAGGTAGATCGGGGGTTTGTAGCCTACTTGCTTCAGCCCGACGAAATT
+TTTGCCCGTAGCTATCGCCAATTCATCGCGGTCTATTCCGGTGATCCGCGTTTGTTGAAG
+GCCATTGGTTCACCAAAACCACCCCCGGAAGCCCCTGTCTTTAGACATGGGGAGGAAGGG
+GGTGGCGAGCGAAGCTCGCTGAATGGTCAAAAGCGTGATAAACTGAGTCAAGGTATGTCC
+CTCCTGTCCGTGCGTTGCAAACTGATACCCGACGCGAGTACGGCCGAGAAGCTGACCCGC
+ACGGTGAACCAGTTCGCGAATGCCTGTAACTACACCCTCCAAGTCGCAAGGCGGGACAAC
+CTGTGGAACAAGTTCGCCCTGCAACGTGCGGTCTACCGGGAGCTTCGGGAGCGGTTCGGC
+CTCAGCGCCAACCTCGCGGTGCGGGCCATCGCTCGGGTGGGCAAGCGCAAAGGCCACAAA
+GTGGGCGGCTTCAAGGCTACCAGCGTGGACTACGACCAGCGCATCCTCTCGGTCAACCTG
+GACACCGAAGTGGTCAGCCTCTCCACCGTGGACGGGCGGGTGAAAGTCCCCATGCAGATT
+GCGGGGTATCAGCGCCACCTTTTGCGAACCGCCAAAAGCATCCAGGGCGGTCAACTGGTC
+AGGGGGCGGGACTCCTGGTACGTCCACCTGTGGTGCGAGTACGACGACCCGCCCGCCATG
+ACCCCAAACGGCTTTCTCGGGGTTGACCTCGGCATCGTGAACATCGCCACCGATTCGGAC
+GGAGAGACCTACTCCGGCTCCCACCTCAACTCGGTTCGCCACCGCCACCGGAGGCTCAGG
+AGGAAGTTGCAGAAGAAAGGCACCAAGGGGGCCAAGCGCCGCCTGAAGAAGCTCTCGGGC
+AAGGAGGCCCGCTTTTCCAACCATACAAACCACGCGCTCAGCAAGCGCATTGTCGCCAAG
+GCCCAACGCACCGGGAGGGGTATCGCCATCGAGGATTTGGGTGGCATCCGCGACCGGGTA
+CGGCTCAGACGGCCTCAACGGGCGGCCTTGCATAGCTGGGCGTTCTTCGACCTGGGCCAG
+AAGCTTCGGTACAAGGCTGAACGGGCGGGAGTCGTTCTGGTCCAGGTTGACCCCCGCAAC
+ACTTCCCGCACCTGCCCGGCCTGCGGGCACTGCGAGAAGCTCAACCGCGTTTCGCAGGCA
+CAGTTCGTCTGTCGGTCGTGCGGCCTCGTTGGGCACGCAGACCACTTCGCAGCCGTGAAC
+ATTGCCGTTCGCGGCTGGGCCGCTGTAAACCGGCCATACCTGGGGGAAGCGGAGAGTGCT
+ATCCGGCATAATCCTGTCCCTGGAAGCCCCCGGCTTTAGCCGTGGGGTGGTTTACGGCAA
+AACAAACCGGGTTTCGAGATCGGCTATACTATACAGTGGGCAGATCAGGAGTTCGCAGAG
+ATCGCGATCGAACTTGAGGACGTTTTCAGGAGGCTAGGATGGCTGAGATAACCGAAAGGA
+AGCGCGAAAAGCAGACTGCCGCGGCTCGCCGTCTTGAGCGTTTCCGCAGCATGGGCATTG
+ACGGGGCGGAAGCACGCATCTATGCCGGGTTGGGGGGGGGTCAATACCGCAGCGCGTCGG
+AAGGCCCGCGCCGATTCGAGCCGCCTACCCCCGAAGAACTCGCCACATACGAAGATTGAG
+TGTGCTATAGTTAACTCATACATCCCCCTAGGGGAAGGCCCACCGGGCACCTCGAGGGGG
+ATTTTTCTTTGCCCATTCACTCTTTTACCCACCGCATCCCGCTACAACTGCGGCAACTAC
+GCCAGGGCGTCGTGCTGGTGCGGGCCAGCAACGACACGGTGGTGGATGAGTACGGTACCA
+CCATCACCGTCGAAGCGCTGATGCGGGACTGGGTGCCGGCGTTTTTACAGCACCGCACCA
+TCAGCCTGCAGCACAACCTGCCGGACCTGCGCGGCATCCAGGGCAAGCCCTTCGTGGGGC
+TGGCCCGTCGGGTGGACTTTGCTCCCCAGCTCGAGGTGGAGGTGGAGGTGCTCGACCCGG
+AGACCCAAGCCCTGATAGATGCGGGCCGGATCACCGGGGCCAGCCTGGAGTTCGTGCCCC
+TCGAGTCCCGCACCCAACGGGTAGGTGGCAAAGAGAGCGAGGTCTACTACCGGCTGGCGT
+CGGAACCGGAGCTCGCCGGGCTGACCCTCACCGACCTCCCGGCGGTGCCGGGGGCGGAGG
+TCCTCGAGATTCGGGCCGAAGTCCTGGCCCCCTGGCAATTCGCGGTGGTGGACCCCGCGG
+TCTTCGAGGCCCGCAGCCTAGCCGACGCGACGCGGCTGATGTGGTTCCCCCACCACGACG
+CCCCAGGCTTTTATCACAACCCTCGGATTAGCCTCAGCAGAACTTTGGGATCAGCCGAGA
+ACTTTCTAACCGAGCGCAACACCGGCCACCTTTTGAGATGCAGGAGGTTCAGGATCACAT
+CCCGTAGGTACATCAGCCCCGCCGCCCCCTTGCGGCTGCGGGAGGCATCTTCTCCCAACA
+CCGTGTCTCGTTTATGGTGTAAGCGATTCTCTACCTCCCAGTGTCCCCGCCACAGGGCAT
+ACAGCCGCTTGGCCGGGGCCTGTAGGCTGGTCAGGGCATAGGCGGTCTCCTCCCGTAGCT
+CCCCGCTATTCTTGCGCACCACCCGCCGTCGCATCCGCAAGGCCATCCGCGAGCCCCGCC
+AGCCGCTCACCCCCTCCGGCAGGGGGAGCCCTTCCAGGTGCCATATCCAGACCTCTCCAC
+CCCGAACCTGGTGCTGGATGTAGTGGTCGGTCGCCTGGTAGTTGGCAAAGGCCCACTGGA
+TCAGTTCCTTGAGCTCTGCCTGGTTCCCTTTGACGCTGAACAGATACCCCCCTTTTGCTC
+CACCACCACTGCCGCCAACTCCTGGGTGCACAAGGCCGCATCCCCCGTCAGTACCCAGTC
+CACCCCCAGCCCCTCCATGTGTACCACCAGTCCCTGCGCCGCCGCTGCCTCACCGTCGGC
+AATCGCCTGGCTCCCCAAGGAGAGCCCCAGCCCCTGAACCAACGCCGACAAAAAGACCAG
+CGCCTCTTCCCCTCGCCAAGCACACCGGGTGCCCCGGAGGTGTTTACCGTCCACGGCTAC
+GGGCAAGGGTTCATCGCCCTCCTTGCCCAGGGCCTTGAGTACCTCCCGAGCCCAGGATAG
+TAAGGCCTTTTGCAAGGGTTGTAGGTCCTTGCTCAAGGACCAAAAGAGGCGGTAGAGGGT
+GGCTTGCCCGGGTAGTTTGCGCTCACCCCGGCGGGTACGGATATGGACCTCGTCCAGCAA
+GAAGCGTCGCTGGTCTTGCACCCACTGGCTGACGGCCAGGATATTGTGCCGTCCCGAGCC
+CACCGCCATCAAGCAGATCAGCAGCAGGTCTTGCCAGCGATGCTGGGTCTTCAGGTACTC
+GCGGGGATCGGGTATCTGGGCTAGGTATGGCAACGGAGAGGGAATGGAAGCAGTTTTCAT
+ATGGCTTTATGATAAAAGCCTGACGACGCCCGCACGCACGCGGTGGACCCGGACCTGCTG
+AGGCAAGCCCTGGCTGATCTCGAGGCCGGGCGCTTCGAGGTATCCGCCGCCGCAACCCTA
+TCCCGCGAGGAGGTGGCACGCCGCGCTCGAGCCCACCTGGAACGGCACACGGCCCTAGGC
+ATCGGTATGCGTACTACGGAGGAAAACATGGAACAAACCCAATCCCAGGCTCCTACCCAG
+GAGCGCAGCCAGCAGGTTGACCTCAACATCAACCTGGACTTTCGCACCCCCGCCGAGCGC
+GCCGCCGGCGTGGCCGAGACCCCCGCCGAGCGCGCCGCCCGTGAGCAGCGCGAGCGCCAG
+CAGCCCACCGCCCCCAACCCCGCCGAGCGCTGGCTTCAGGCCCGCTCCGCCCAACTCGAG
+GCCGAGGGCACCCCGTCAGCCCAGGCCGAGGCCCAGGCCCGGCAGGAGCTCGAGCAAAAC
+CCCGAGCTGGCCCAGCGGCTGGCCGAGGCGGGCCGTGAGCCCACCGTCGAGGAGCGCGCC
+GCCCGCGCGGCCGCTCAGGCCGTGACCGAGGCCCTGTCCCGCCTGCCCGAGCCCCCGTTG
+GCGCTGGTTACCGACGGCGGCATCTCGGTGCGCTCGCGGCGCCCCACCAGCGATGAGCTG
+CTGTCCGAGATTTTCGCCCGTTCGGTAATCCCTCAACTGCAGCGTCGCCAGCCTACCCCC
+ACCGAGCGGCAGGAAATTGACAACATCCTGCGCCGCAACGGGCTCGACGTGCGCGCCATC
+ACCGTTGAGGCCAACGGCACCGTGATCTACAACGAGCTGGCCCGGCAGTTCGTGGTGCGC
+CCGGAGCCCGATATCATCGCGCGTAACCACTGGGCCAGTGTGCCGATGGGCGGGACCAAC
+AAGCGCACCTTCCCCCGCTTCGACCGCGGCGGCATCTCCCACACCTGGGGGCGCACCTCC
+ACCACCGCCATTACCGAGAGCGACCCCACCCTGGACACGTTCGAGGTCGAGGTCACCGAA
+CTCAACTCCAAGGTGCCCGTGCCCGATAGTTTTTCCTTGTTCAACGCCCAGGGGCCCAGC
+TTCATCCAGCGCGTGCTGCTCCCGGCCATGCGAGGAGCGGCCCAGTACGAGGAGGACCGC
+GCCTTTTTCCTCTCCAACGGGGTGAGCCCTAACCCCACCAAGATCATCGGCCTGCGCAAC
+AAGACCGGCGTGACCGTGGTGGCTTCCTCGGCCAACGGCGACGCCTTCACCCAAGACATC
+CTCACCAGCCTGCTGCGGGCCATGCCCGTGCGCTACCGCAATGACACCAGCCGCCTGGCC
+TACTACTTGCCGGTAGCCCTGGCCGATGACTACGGCGACATCCTGGCCGCCCGGCAGACC
+TCTGGAGGCGATACCTGGCTGCAGCGCTTCGCCAATCAGCCGGGGCCCATGCCTATCGGG
+GTCCACCGCGGCATCCCCATCTACTCCGTCTCCCATTTGCCCACCAACGAGACCCAGGGC
+ACCAGCAGCAACGCCGCTACCATCTACCTGGTGCACCGCGACATCCCGGTGATCGGGGAC
+GCGCTATCCATTCGCATCGAGCCCTATCGCCGGGAAAACTTCATCGACGTGCTGCAGCTG
+CAAGGGTTCGTGGGGCTGGGGTACCAGTGGCCGGACGCTATCGTGCGCCGCTCCGGTGTG
+CTGCCCAAGGTTTAGGAGGTAGCGCATGGCTAAAAAGAACGAGAGTGCCGCCGAAAACCT
+CGAGTCTACCCCAGCCCCCACTGGGCTGGTGCCGGTGCGGCTCAAGCCGGATTCGCCGTA
+TGGCCGGGTGGTGGTGGGTACCGTCGTGGTCGAGCGCTCTAAGTCGCCGGGCGCCGACTG
+GCCGCTGATTCCGGCGGAGGAACTCGAGCGCCTGGCCGAGGAGTACGGCCTCGAGGCCGT
+ACCCATAGACGAGGAGTAGCGTGGGCTGGCTCGCCCCATACGCCGACGACCTGCTACGCC
+TGGCAGGCTACCCTTCCCCCCACCCCCTGGCGGGGGATGCGCTGACCTATGCCGAGCAGG
+CCATCGAAAGCTACACCCGCCGGGTGTGGGGCTCGAGCCAGCCCTTTACCCAGCGTGTGT
+TTACCACGGCCAAATCCTACGCCCTGCCCCTGCCCCCAGATGCTACCAGCGTCGCCACCG
+TCAACGGCAGCCCAGCTCCGACTGGGGTCACCTGGAGCATTACCGCGCTGGGGCTCGAGG
+CCACCGACGCCGAGGGCCGACCGGTGGCCTGGGCTCCCGGCGTGTGGACGGTGGCCGGGC
+AGCGCGGCAGCGCAGCCATCCCCCAGGGAGTGCTCAAAGCCGCCAGCCTGCTGATCAATG
+CCTATTTGAGTCTTTCCGACGCCCAGCGCAGCCAGATGGCCAACGCCAGCCGGGGCGACC
+TGAGCTACTCGATGCGCTATGCCCAGCTGAGCGTGCCCGAGGCCGAGACCTATTTGGCTC
+CTTACGCCAACCGCATCGCCGGGGGGCTGTTGTGAACAACGTGATCGCCAAAATCTACAA
+CACCAAGCAGCGCCTCGAGGCGGGCTTCCTCACCGACGAGACGGGCAGCCTGCTGCTCGA
+GCAGCCCGCCCAGCTTTCGAGCCCCACCCGCCCCTGGGAGCGTGCAGCTGCGCTGGAGGG
+CGTTTTCTCGGCCACGCTCTACGTGCAAAGCGCCGAGGATCTGACCCAATCCGACCTCGC
+CGTCACCGAGGAGCCGATTAGCGGACAAACGCGGCAGTGGCGCGTGCTCAGCCACGCCAA
+CAGCGGCCCCGAGTGGCGCTTGGAGCTATCCAGCCGGGAGGTGCGCCGTGGCCCTTGATC
+CCAGCGTTCGGGCCAAGTTGCGCCGCAAGCTCACCGCAGGGCTGGCGGGCGTGGCCGTGG
+CGCTGACCAACGAGGCCAAGGTGCGGGCCACCCGCCACGTGGACACCGGGGAGCGCCGTA
+ACTCCATCGCCCACGCCGTGCTGCCCAACGGCTCGGTGATCTGGGGCCTGCCGGGCAACG
+CCAAGAACGCCGCGCTCGAGCTGGGCTTCCGCCCCCACTGGGTGCCAGCCGGATATATCG
+GAGTATGGATGCGGCGGCATGGATTGACGCGCGGCAAGCTAACCCGCCGAGCCGCAGGGC
+TCTACGTGGGCGGGCCGGGCTCGAGGCTCGACAGCGGACCCGGTGGGGCCAGCGGCACCC
+GCCGGATCGGCAACAAGAACGTCTTTGGGCGCTGGCGCACGCGGGGCGAGGTTAGCCGCT
+ACCTCGCGCCGGGGAAAGTAGGCCACAGCGTACTGCGCCACACCGTTGCTACTCGCCTGC
+GGGTGGTTGCGCCTGCTGCGTTTATCAGGGGGTACCAGCGTGGCTAGCTTGCAAGCCGCC
+GCGTTGCGGCAGTTCTACGCCGCCCTCGAGACCTACCCCCCGCTGGTGGCCCTCACCGGC
+CACGTCCCCGGCGCGACCAGTCTGGGGGCGGGCGCTCGGATTATTGGCGACTCGGTGCGG
+TTGCGGCCCCATCCCATCCCCGGCGTGGTGCTCGGGCTGGGGAACCGCAACCAGGGGGGC
+AAGGCCACGACACACGAGGCTCTGCGGGATTGGGAGATCAGCCTGCTCGTTTGGGCTGAG
+GACGTATTCCAGGCCGCGGAGATCGCCGAAGCGGTCGAGGACTTCTGCTCCCTGGCCCGT
+TGGGAGACTGGCCCGGTGCGCCAGGCGCAGTGGGTCTCGAGCCAGCAAATGGAGCTTTCT
+CAGGACCAGGAGTATATCAGCGTGCTGATCACGGTGCGCTTACGCATCGCATAGGAGGAC
+ACATGGGACGTTCGGCGGTAGACACCAACAAAATCGGCTTTTCGGCGGGGGCCCGTATGT
+TCGAGGGCCCGGTAGGGGCCACCGAGGCCTCCCTGCGCCCGTTGGGGCTACTGGGGGCGG
+ACGCCACGCTCAACATCGGCCAGACCACCAAGCAGAAGCAGGACCGGGCCCCGCTGGTAG
+TAGTCAAGCAGGCCATCAACCAGCAGTCGGCGCAGATTCAGGTAGTGCTCCACGAGATCA
+CCCAGGATAACCTGCGCCTGGCGTTCGGCCTGCAGGACTCGGACCTCACCGCCCTGGCCG
+GGGGCGACGTGGTGGTGACCGACGAGCAGGTGGTGCTCGATGCGAACGGGAACGGGGTGC
+TGGCCAATCCGGTCAAGACGGGCAACGTGCCGGTGGTGACCAACGTGGGCGGCACCACCA
+CCTACGTGGCCGGGACCGATTACATCTTTATCCCCCGCGACCAGTTCGGGCGCAGCGTGA
+TCTACCGGCTTTCGACCGGCGCGATCCCCAACGGGGCCACGCTCGAGGTGGATTACACCT
+GGACCCGCACCGCGCGGGTGGAGTTCCCCATCGGCTCGCGTACTACCGTAGTCGAGCGCA
+AAATCAAGCTCGAGGAGGAATACAGCGACGGGCGCAAGCTGGTGGCGGTCTTCTATCGCG
+CCGTCTTGAGCATCAACGGCAACATCACCGTCAACACTGACGGCGAGAACGGCATGAGCG
+TGCCGGTCACGGTGGATGGGCTCTACGACCCCACCCAGAACAAGATCGTCTCGATTTACC
+TGGAGGGCTAGTGGCTAGCCAAGCCAAGCTGATCGAGGAATTGCGCGCCCGCGTGGCCGA
+ACTGGAAGCCCGTCTGGCTGCGCTCGAGCCCGCCCCCGGCTCCACATCAGGGCAGCCGGG
+GGAGGTGCGCGTAGGCGGGCAGCCGGTGCGGCTCAGGCCGCTTTCCCCAGCCCAGTGGGT
+GCTGGCGTTGAAGGAGCTGCCCGGTTTCCTGCTGGCGTACGCCGTGCAGGAAGCGCGGGG
+CCAGGAACCCGAGGAGGCATTGCTCGAGCGGCTGGTGAACACCGCGCGGCAGTGGGTGGT
+GGCCTGCGCCATAGACCCCTGCGACCCGGCGATGCTCACCATCCCCGAAGCTCAGCAGGT
+GCTGGTGGAGGTGAGCCGCCAGAACGGGCTGGACGCGCAACTGGCGGAGTTTTTTCGCCA
+GCGACTCGGCCAAACTGCTGGATCAGGCAGCGCGGCGCTACGGAGTCCGCCCCAGCCAGA
+TGCTCGGGCTAACTGATTCGCGGCTAGCGCTAGCATTTGACCTGGGGCTGGCCGATCACT
+GCCTGCGCTGGGAGCTCGAGGAGGGATTAGGCGAGTTTTGGTGGATTAGCGTATTGCGCG
+CATTCACCGGCAAATAGGGGGGACTGTGGCCGAGCAGCTGAACCTGGGAGACCTCATCTA
+TCATCTGGGATTTGCCAACCAGGATGAGTTTCTGCAGGCTCTGCAACGAGTGCTTGAGCA
+GGCTGAGGCCAAGGCCAAATCGGGCGGAGGCGCCGGAGGCCGCGAGTTCGGGGAGGCGTT
+CGAAAACGAGGCCAAAAAAGCCCTCGCCGGAACCGGGTCGCAGCTGGTGCGCTCGCTGGG
+GCTGGACGCCGTTGGGGTGTTCCTCGGCAACGCCCTGTATAACGCATTCCAAAATGCGCT
+GGGCGCGACCAAACAGTTCATCGGGCAGTCCGTAAACGAGTTTGCCCGCTATGAACAGGG
+GTTAGTCCAGCTGAGGCTGGCTGGCGAGGAGAACCTGGGGGCCGCCGCCGCCAAGATCAA
+GGAGATTGCGGAAGCTTCGAAAGTCTTCAGCGAGACCGACGTAAGCCTCACCCTGGGTGA
+GCTGGTCAAAGCTGGATTCGACGCCAGCACCGCGATGGAGCTGACGGCTAAATCCACCAA
+CCTGGCCAGCGCGGAAATCGACACCGCCACCGGCAAATTCCTTGACCTCACCAGCTCGGC
+CAAGTCGGTCTCGGACATCCTCTCTGGCCTGGACTACAACGTCAGTCAGGCCGGGCGGGT
+CATTGACGTGCTGGGCAAAACCTCGCAGGACTCCAAACTGTCGCTCTCCGACCTGGTCCC
+GGCCATTGCCAGCGTCGCGGGGACGGCTAGAGGGGTGGGCCTCGAGGTCGAGGACCTGGG
+GGCGACCTTCGCCGCGCTCAAAGATCGGGGTATCCCCGCCGCCGAAGCGGCCACCGGGCT
+GCGTTCAGTCATCAACTCGCTGATTCAGCCCCCGGCTACAGCTAAAGACGCGTTTGAAAA
+GTTGGGGCTCGTCTTCATCAAAGCCGACGGGAGCACCCGCAGCTACGCCGAGGTGCTGCA
+AAACCTCAACCGGGTGGTAGCCGCCGGGCCCAGGGGGGTTCAGCTATTGGCCCAGGGGAT
+GGACACCTTCGCGCTCAACACCGCCGTGGCCCTGGGCAAATCCTCGAGCGCCATTGGCGA
+CTTCAAACAGAATCTGGAGAACGCCAGCGGGGCCACCGAGGAGCTGGGGAATACCCTGAA
+AAACACGGCCCTAGGGAAATTCCAACAACTCGAGGCCGAAATCGCTAACACCCGGCGAGA
+GATTGGGCAAAACCTGCAGCCCGCCATCGCCCTGTTCCTGGAGAACGTGGCAGGGCCGTT
+CGCCCGCTGGGTGGGGAATATCGCCGCCGGATTCCGCGCCGCTTCCGTATCGGTGCGGGA
+CTACCGCCAGGAGATCGAGGCTGTTCGGAACGGCACCGCGCCGATTAACACCCAAACTCG
+CCTACTGCGCGAGGCCGTGCAGCAGCTCGAAAAAACCACCAGTAAAGAAGGGCAGCCGCT
+AAAGGTTGGACCGATCACGGTAGGGCGCTTTTTCGTGACTGGCTCGCTCGAGGGCGACCT
+AAAGCTGCTCGAGGAACAGCGCAAAAGACTGCAGGAAGCCGAAGCGAAACTGCAAGCGGC
+TAACGCCAAAACGCCGCCCCCGCGTAAGGAGCCCCCGCCGTCCCCAAAACCGCTCGCCAT
+TCCCGACGAAGACCCGGTGATCAGGCAGGCCAGAGAGCTGCAGGACCAGCTAAAGATTCT
+CCAGTATCGCTACACCCTGGGCCGACTTTCCGCTGAGCAATACCGCGCCGAGTTAGAGAA
+GCTGCAACGCCAGCTGCAGGCTCTGGAGAAGGCGGCCACCACCACCGAGCGCAAATCTGC
+GGTGCTGGGCGGGCTAACTGACATTAGGAAGACCCTTGAGGATATTTCCAGGTCAGATTT
+TGAAACTCGCATAAAGGCCCTCAGCGACGAACTCGAGCGGCAGAAAAGGCTTTTTGCCGA
+TACCCGTGATATCAACCAGTATGCGGGCGCGTTGGCGAGCGTGGAGAAAAAAGCTCAAAC
+TCTGGGCAAAACCGCCACCACGGAGCAGGCCAAAAAAAGCGTCCGCGAACTGCTCGACCA
+GATCGCCACAGGCCGGAAGGAGTTGCAAAAAACCCTCGAGGAAGGCGGCACCCAAGCGGC
+AGAAGTTCTCTCGGAGCAGGCCCGAGCTCGCCTGCAAGCCATCTATGGCGATGGGATACA
+AGCCACCATCGCCGCCGTGCGCCGCAGCTATCCCGACTTCAAGAGCGCGTTTGAAGACCT
+GCTCAAAGACGGCTTGAAGTTTGACGATGCCCAAATGCTGGCCGCCCTGGCATTCCCCTC
+TAGCTTTTTGGAAGGGCTGGCAGAGACCTGGGGGGAGGGGCTCAGCACCGCCGCCCAGCG
+GGCCGGGGAACGGGCCCTGGATGAGTTTTACCAGATCCCTGAGCGGCTGCAGAAACAGAC
+CGATGCGGTGCTGCTCCGGCTGCGGGTGAGCGAGATGAGCCCTGAGGAGCTGTTGGGGCT
+CTCGCCGCAACTGCTGGAAAAGTATGTCAAGGAACTCGAGCAGTACGGGATAGACGCGGA
+AAACGAGATCGACCGGCTCAGGACGGCCATCGCCACCCTCACCGCTGATCCCGCCGTAAT
+TGAGCGGGCCATACGGGAGAGTGCTGAGTACGGCGACGAGATTGTAAAAACCGGGCGCAA
+GGTGGCCGACGGCACCGACTACGCCCGCACCGGGCTGGATGAGTTCAGGAAGTCTCTGGA
+GGCCCTGGCCGCCGCGGCGGGCACCCCGCTAGCGGCCATCCAGCAGCTAGCCGTGCTCGA
+GGGGAACCTCAAGGACGCGCTGGCCCTGGGATTCAGCTCTCCCCAGGAAGCCGAGCGGGC
+TCAAGCCCAGCTCGAGGTCCTCTCCGGCTTGCTCGACAAGCTTAGCAATTCTCTGCGAGT
+CACCGAGGCTCCCCTCGACCGCTTCGTTCGCAAGCAGGGGGAGGTACGGGACGGCTTGCA
+GGTGACCATCGAGGGATTCACCTACTACCTCGACACCCTCGAGCAGTTCGCGGCCCTCGC
+AAGCAATCTCCCCGATGATGCGCTCATCGGGCTATTTAGCGGCCTCGAGGCTGAGGCCGA
+GCGGGGCAACGAGCAAGCTAGGGCGCTACTCGAAACGCTGCGGCAGATCATCCTGGCTAG
+GGGCCAGGCGTTTGGCGAGGCCCCCAACCTGGGGGCCACCGATTATCGCAAGCTCGAGCG
+CGAGGGTTACGGCATGGATCAGGGCCGTGAGGCGTTCGAGAAAGACCGCCAGAAACGAGA
+AGATGATGCTCAAAAACAGCTTGAGCAATTCGAGGCCCAGCTCACCGATATCGCGCTATC
+CTTTCCCAAAGCCCTGGTAAGCGGGATTCTCTCCGGGGACGTGGCGGGGGCCCTAAAGCA
+AGCGCTGGGCTCGGCCACCGACTTCTTCCTCAACAAGATGCTGGAAGCCATCCTGGGGCC
+CATAGCCGAAGAGTTCTCCAAAGTCATCGCCAAGCAGGGACTAGGGGCGGCGCTGGGCGG
+CTCATCCATTCTAGGGGCATTAGGGCCCATCGGGCTGGCGGTGGGGGCCGGGCTGCTGCT
+CTTCGACTTCCTCTTCAACAAACCCCAGCCCGCATCAGAAAAAGCCGCCGCTGAACGCTC
+GAGCTTGCAATCCTCAACCCCCTCCATCACCTACAACGTCGAGGCCGTCCTGAACGCCAC
+GCTGCAGGGGGATCTCAAAGACCCGGCGACTCGGGCCGAGTTGCGCGGCCTGATGCGCCA
+GGTGGCGCTAGATGTGCTCAAGGAGGTGCAACTCGTCAAATGAGCAGCTACACGCCGATT
+ACCATTACCCCGCTCAATCCAGCAGGCCCTGCCGTGATTCTGCCCATGCCGGAGTCGGTG
+GAGAGCACTGCCAACACTGTTACCTTCGAGTTTCTCGATCCTATGGACGCGTCGGGGCAG
+CCGGTAGATCTGCCAACACTGGCGGCGCCGGCGCTCACTGGATCACCTGAGCGCATACAG
+CACGACATCCGCCGGGACGGCAAACGTCAGGTGCAATCTGATCCTCCCGCTCGATTGGTT
+GGAGTGCAATGGGCGGAAATTGAGCATTACAGCGCTGTTCAGCGCAGTTATACAGCGATT
+GGCGCGCTTGTGCTGGCGGCCAAACGCTACAACAAAAGCGCCAGCGAGGGCGCCAGTATC
+AGCCTAATCCTCTACCGGGCGGACGCTATCTGGACGGCTGAGGGGGTGCTGGAGCTATGA
+ATCTCGGAACTTCGCCGCTCTTGCCGCCTCGAGTACGCCGCTACCCGATGGACATGAGCA
+ATTTCGAACTTCCCAACGTCAAACGCTGGTGGACGCTGGAGGATTACGCTAAGGTGGGGC
+TGTTTGGGGCATATTTTCACTCTGGCGCGGGGGAGATTCGCGCACAGGCGTTTTGGGGGT
+TGTTCCGCTCCGACCCCAAACCTTATGCTTTTCATCTCACCGATCCGGTCACTCTTTTCC
+CGTATACCTTGGGATCAAACCCGGACATCCGTGTTACCAAGGGCCAGGTTCCCAGCCCTT
+TGGGGGGGAACGAAAGCTATTTTGCTGTACTGGCAACCCCGCCGTTTGGCGGCAGCGGTT
+ATGTGGTCGGGCTGGTGAGAGAACCGGTGAGCTATGTTCCGACGGAGAACTACCGGATAG
+GGCCGAACATCGCGCGAACCAGCCCGCCCAAAACCGGAGTTATTACCCCTATCGGGTTCA
+ACGATGCCCAGACTCATTTGCTGGTTGCTGTGCCGATAGATGACCGAATCCTCGTAGAGC
+GCCTAGAGTTGATACGGGATCCGAATACTCAAGAGCTAACGGGGATGCAGGCTGTGGGAT
+ATACCGAGTGGATACACGGGTATACGGCAGGGTCGGTTTACCTGCGCCAAAACTACGCTG
+CTGGCCTGGGAGGAATCATGACGACGCTTGCCGGGGAATTGGTGGCGTTTGTAATCAACC
+TCGACAGCGACGGCAACGTTATTAGCGGGCTTTCTGGTTTGGTCAATGTAAAATCCCCGT
+TCAATAACAATGCCGTTCATAGCTGGAACGCGGATGACGGCACGCTGATATTTTCCCAGG
+CGGGTTCTACATATGTAGGGCGGGCGTTCCAAACCGCTGTTTACGACGTCATTGACGTTT
+TGCAGCCTTACGATCCCCACAACAATCGTTATTTGTTGGAATCCGCCTCCATACCGTGGC
+TGCCATTGGTAGGGGCCGGGCCACAAACCCTGGCTCAGCGCTATTACTTTGATAAAAATA
+GCTGGGCGTATTTTGGCATGCTCAGCATGTTGCCGCCTGCCAGCTTGGGGTGAGTATGCC
+ACTGCCCCGCAACGATCCAAATCACACTAGCGACAAAGCGCTGTACATCCTGGACGGTAT
+TCTCCTTCCAGGAAACGGATTACTGCCCATCTGGCGGGGGAACCGGCTGGATCTCTACAA
+CGGCTCGCTGTTCGGGGTAGACAACCAAGCGCTGCTGGGGGGCCCGAACTACTGTCTTGC
+GTTCGACCTGCACCGCTCTGAGCTACGATTGTACGAGTTTGACCTCAACCTGCCGCCTGA
+CCTGATCGCTGATCCGGTGCGCCTGCAGCTCGAGGAATCCCTCACCGGTCCGGTGGTGGA
+CGCCAGCATCAGCTTTACCCTGTTCAACCGCGGCCAGCTCAACGTGGATGCGACGTATAG
+CATCGGGTCGCGGCTCGAGCCCTACACCTCGCTGTACCGGTTTTTTATCAACACCATAGA
+CCCCAACCGGGGCCTGGTGGACTATACCGGGGAGACCTATCTGCGCCGCCTGGACCGCAT
+TCCCGCAACCCGCCAGGTCCTGCTGCCGCCCAATGGAGGGCCATACACGCCCAAACAATG
+CTTGCAAGCCATTCTCGACACCTACGGCGTAAACTATGCCCCACTGCCGGAATTGCGGCT
+GCTTGGAGCCGAGGGGCCATTCGTCATCGACACCCCCGGATATGCGTACTTCCCCCCCAA
+AGCGGAGGATAAAACTGAGCCCCCGTCGCTCCTCGAGTTGATCCAGCGGGCCGTCGCTCC
+GTTTGAGGGTTACTATTTACGGATCAACCCGTTCACCAATAGTTTGATGCTGGTGCCACC
+CCCCTGGGCTCCCGAAGCCACCGCGGGGCCTACGCTGGCGAACGCCGATGTTTTGGAAAT
+AGACCCCGGCGAGATTGACCCCTCGACGGTGGTGAACCGCTGCACAGTTAAGAGCCAGGG
+ATTCAGCTTTACGGCCAGCCCGGTAGCGGTGATGGAGCCCGCCTCGTTTGGATTCCGCGG
+GTCGCTCGATCCGAGCAAAGGGGCCGATCCGCTGTTTACCGTCCTTTATCCAACCCCCGC
+AGAGCTAACCGGGAAGAAACTGAATGACGCTCCCATCGTCTACGGCAAAGAGACCCGGCG
+CGGGACGCTGGCCATCTGGCCCCTGCAAGCGCAAACCGTCCTGGGGGATCAAACCCTGCA
+AGTGAACTGGGTACTAACTACCTGGATTTACGAAGCGGGAACCGGCCAGTACGGGGGGAC
+TACCGGCTACCCCAAGAGCGGCAGCAAAACCATCCCCCTGGACGGCTCGAGCGTCGAGCT
+ATTCAAAGAGAGTGTGCAACTAGGGGCCCCGCTTTCCTACGGCCACGTTTGGGTTTACGC
+GGCGTGGGATGCCCAAGCCCAGGGGGTGCGCCTGGACTATGACCTTTACTTGTATTCTCA
+GAGCATCGGGTTTGGCGGGTCGGGGATTATAGTCTATGGCGTGCGGGTGGAGCTGAACGG
+CCTGGCGCGGAAGCTGGACAAGGGCGATGTTGTTGTGGCCACCTTTGGCGAGGTTTACGA
+CTCGGCTCCAGGATTGTCTCTTAGCCAGTCGCGGTACGGGCTACGACAAAAAACTCTGGA
+CATCGATTATCAGCTCACCCCCGATCAGGCTATGGCTATAGCGCAAAATCAGGTAGAAAA
+AGGACTCAACCCCAAACAGATTTATCGGGTGCGCCAGGCGGCGAACATGCGGGTGCGACC
+TGAGCACCTGGGAAGGCGCGTGTATATCCCCCGACCGGACGGGGCTCCGGGGTTGCTGGA
+AGGGACGGTACGGGCCTGGCGCTACCTCGAGGCCCACAGCACGGGCGGGGTACAGGCGGA
+TAGCGAGTTCGAGCTGGAGGTCACCCGCAACGTCTTTGGCGACGTGACCAATTTCACCCA
+ATACGGCGAGGCCATTTACGGTCTGAGCGCGTATTTGTAAGGAGGAATCATGCCGACCTA
+TAAACCCTACACCGAGATCAGCAGCCTGCTGGGATCGGGAGGCGTCAGGCGCATCAAGGA
+GTACCACCTGGACCGCCATGCCGAGGCGCTGGCCAACCAGCTCGAGGCGCTTTGCCGCTT
+TCTGTTCTCCGCGGGCGGGATAGCCGAGGCGGGCAGCGTGACCCTTAGCGGGTTTGACCT
+CCGGGTGCAGAATCGGCTGGGCCTCACTCTGGATGCGCTAGCCCCAGTACGGGTACTCGA
+CGAGATCCTGACTCTGCCCTCCACCCCGGCGACCGGCACCAAATGCCGGGTGGTGATGGC
+AGCCATCCCTCAACTGGCGAGCCCCGCTGACAGCTACACCGACCCCACTACCGCAGAGGT
+GGTTTCCCAGCCCATGAGTGTGGGGCTGGGGGCGCTCTTGTTTGTCGAGGGGGATACCAC
+CAACTACCCGGCTATCCCCAACGGGGCCGCCCCGGTGGCGCAGTTAACCCGCACCTCTAC
+GGACTACACTCTCGATTTAATCGAGAACACCCCGCCCACCTTCCGCTGGTGAGGATTGAA
+ATCGCTGGAGCGTGCTAAACTGAACGTAGACACCCCTTTCAGGGGAAGCGGCCCCTAAGC
+CGCACCTGAAAGGGGGTTTTGTTTGCGGATCGTTTTGGACCCCGGACACGGCAATTTCCC
+TGGGCCCGGCTACGACCCTGGGGTGGTAGGCCCCCCGCCGTTACGGCGCCACGAAGCGGC
+AGCGGCGCTCGAGCAGGCCCTCTCCTGCCGGATGCTGCTCGAGCAGGCGGGGCACGACGT
+GTATCTCACCCGCAACGGGCAGGGTATCTCGGGCAAGCCGGACTTGGCCTGGCGGGTGCG
+CTTTGCGGCCAATCTGCGGGCCGATCTATTCGTGAGTATCCACTTCAACATGATCGGCGG
+GGGTGGGCTGGTCTACCACGCGCCGGGGGCTGCTTCGGAGCGCTTCGCCAGGGGGCTGGC
+CCGGAGGGCCGGGCTCTCGAGGGTGTGGCCCTCGAGCGATTCGCGCTTTGGCGGGCTCTA
+CATAGACGCCTTCCCGGACGCCCGCCCGGCCGTGCTGTGGGAAGTGGACGGCATCGAGCG
+CGCGCCGCTGCCGGGGGCGCTAGGGCGGGGCGCCAGACTCCGGCTGGCAGCGGTGCTAGT
+CCAGGCAGTGAAGGACTTATAAGGGGGAAACCATGCAGTTTAGCGGAATCTTTTTAGAGT
+TAATCAAAATCGCAGCGGAGCTGGCCGACCTCGACGAGCCGGGGGAAAAGAAGCTGGCCG
+ATCTAACCGAGCGGTGCGTGAGCTTGCTCGAGGTGGCCGATGACGCGGCAGTGTCGTTGT
+TGCCGCCTGGATTTCGGGACATCGCGCGATGGCTCATTGACAATCCCGGAGTGGACTCGT
+GGGAGCGGGAAATATCCAAATCCATCGCAGAAGCTGCCTACCAAGCCTGGAAAGCGCTGC
+GGGAGCTATTGGGCAAGGATCAGGCCAAAGCGGTGCTGGGGTAGGTATGCGCGCAAAGTT
+AGCGTTGGCGGCGCTGTTAGCAGTGGGGCTGACCCAATCCGCCAATCCCCCTAAGTCTGT
+ACAGCTTGAATGCCCGGCGGAAGTGAACGGCCCCATCGTAGAGTGCAAACTCACAGTGAC
+GGGGCTGCCGCTGGGATCCAGCGCCGTCAAGGCGATTTTGTACCCGGCGGACAAGACCTC
+GACGGTGAGCCGCCAGGTGCGGGTCAACCGGGTGGCCGCCAATGTTGCCGCACAACCGAC
+GCTGCTTAGTAGCTACTGGCACCGCAAGATCCTGAGTTCTGGCACTGAAGGAGCTCCTGG
+AGTAGATCAGACTGAGATCCGCGACATGCGCTACCTGCCGCGTCAGCTAGTGGCGGGGAC
+ACTGGCCGAGTGGGAAAACGGATTGCCGCAGAACTTCTACGTCAGCCAGGTACCTCCCGA
+ATACCAGGGAGCCGACTTGCTGGTAACCCGCAACTATGGCACCTATGGCAGCGCTGGGTA
+TGCCAACACCTGCTGGACCCGCTTCACCCTGAACCGTTCGGCAAAGGTGATCTTGTTGAT
+GTTCTCAGAGCGTCCAGCTTGGGTGGACGATACCTGGACCGTTGGCCCTGCGGTGGGATA
+CGGCAGGAAAGGGAGCGACAATGTGCTTTCCACCACCGAAACGGCAGACAGCTATTTCAA
+AGTATTTCGGGAGGGGAGTCACTGCCTGCCGGGTCAGGGCGCACCGGGACGCATTTATCA
+AATCGCTTTCATGGAAGCGGATGGCTCGCCCAGCAAGCCCCCAGCGGTTCCGGCAGGATT
+GCCTGTTCCCCAGCCCAACACCTACTGCCCGCAATGGGTGCATGACCAGTACAAAGACTG
+GCATCCCCAGATTGATCCGGTCTACTGGTGTTATTTCGGCCACGAACACGGCTCTGATCC
+TGCACAATTCCCAAAAATCAAGGCGCTCCTAGATTCGGGAGCGATCAATTTGACCTTCGG
+GCGCGTGGAACAAGCCGGCAACGCCACCCCGATGTGCGTCTCCTGCCATCAACAAAAGCT
+CGGGCGAAGCAGGGTTGAGGCCCCCCGGGAATCCTACAAGCTGTTCGCCCTAGACGACCG
+GCAGGGTCATTTGTGGCTGATAAAGTTCGAGCTCTCCTCGCACAACCGAGCCCGGCTCTG
+CCAGCGTCATCACGAGTATGGAATCTGGGCAGTAGATTCCAATACCGGAGAGCTATTGGC
+GGCGCTGCAGTTCGCGAGCGACTTTGGCCCGGCCCTCAACGCCAGCGTGGGCAACAACAC
+TCGTTATAAACCTGATCTCTGCCCAGAAAACGTAGACATACCCATGAACAACGATCAAGG
+CCGTCACCGCATCCCCTTGATCAGCGCTGCTGGGTACGAAAACTGGACTCCCCACTTTCC
+GCCCCAGCTAGGGTTCTATGGTTACGGACGGAGCTACAACCTGGATAACCCCATGACCCG
+TTGCTCGGACGAAGTGGATGCAGATGGATTCTACACCTGCAACCAGGCGGTGCGGGCGCT
+GGATCCCAACAACTACAACTGGGGCGACAACCGCTGGTTCATCATCCCCGGCGGGGATCA
+ACCGGACGGGGGGTTCGGTATCCGGGCTTCCACGGCCATCGCCAGCGGTACTTTCTGCAC
+CGACGTGCTGGGAACCACCCTACGGGACTGCACTGCTCCCGATGCCGTGCAACAGTACAT
+CAAACCCGGACTGGACATTCTGCACAAGGATCAGTTCCGCTGGATTCCCTACGACCCCTG
+GTGGGTGGAGTACAAACCCGTACCCAGCGGATTCGTGAACTTCGACACGCACAACCTCGA
+GGGAGCCCTGAGAGCGCCTAACTAAGGGAGACATGTTCGCAGACACGAGCACCTACGATT
+TTCGAGTCATCCGGGGCGATACCTGGGAGTCCCCCATTTGGCTTGAGGACCCACACGGAT
+TGGAGGACCTCTCCGGGGCAACGGCCCGCCTGCAAGTGCGGGATGCGGCCAAAGCGCTCA
+TCCTGGAGGCCAGCACGGCCAACGGGCGGATTCAGCTACCCGGCCCGGTGGTGCTCGCCC
+AGGACGCTCCGGCGGGGAGCCGGACTCTTCAGGTGCTCCCGCTGCCCGGCCCCCTGCTGG
+GGAACTACCAGGCTCGGCAGACGCTGCGCTTTGCGGGGCTGCCGGTGCGGCTCGCTGCGG
+ACGCGCAAGAGGGGGATACCGCGCTACAGATCGAGCCGTTGGCGGCTCCCCTCAACGCCG
+GGAGCCAAGCGCCGATGGGACTGGTGCTAATCCGAATAGAGGCCAGCGCGATGGACCTCC
+CTCCGGGAGAGTACGCATACGACCTCGAGATTTCCTGGCCGGGTCCCCCAACCACGGTCG
+AAACCCCCTTGCGGGGCAGGCTACTGGTCATAGAGGACATCAGCCATGTCTAGGGTGGTC
+GCGATCGAACCCCAACGGCGGGTGTACGCGGTTGAGCAGGGAGTGCGGATGGTGGCAGTG
+GGGGTGCGCCCGCCCCGAATTGCAGTCTCAGGCGGGAGCGGCGGGGCCACCTACGAGCAC
+TTGCAAAGCAGCCCGGCCAGCGTGTGGACGGTCAACCACAACCTGGGGTTTTACCCCGAC
+GTGCACGTCTACACCCTGGGAAACCTGGAGATCCTGGCCGAAGTGCAGCACGTCTCAGTC
+AACCAAACGCTGGTTTACTTCGTCGCGCCTACCGCAGGGCGGGCGCGCTGTAGCTAGGGA
+GGGAATATGTCAAAGATCGTCGGCAGCAACCTGGACTTCAACAACGTCGCCAAAATCGTC
+AATCTGCCCAATCCCACGGCGCCCCAGGACGCAGCTACCAAAGCCTATGTGGATAGCGCG
+GTGGAGGGGCTGGCCTGGAAGGACTCGTGCCGCGTCGCAACGCAGGGCAACATCAACCTT
+GCGTCTCCAGGATCGACCATCGACGGCATCACGATGGCCGCCGGAGATCGCGTACTGGTG
+CGCGCCCAGACGACTGCCGCCGAAAACGGCATCTACATCTGGAACGGCGCGGCTGTCGCG
+ATGACGCGCGCCCCTGACGCCAACACCGCCGCCGAACTCGAGCAGGCCGTGACCACCGTC
+GAAGAAGGCACCAGCGCGGGGGCCACCTTCCGCCAAACCTCGGTGAATTTTGTTCTGGAT
+ACTGACCCGGTAAGCTGGACCCTCTTCGGTACCGCCGCTCCCAGCGCGTCGGAAACCCAG
+CAGGGCATCATCCAGATCGCCACCCAGGCCCAGACCGACGCGGGTACCGATGATTCGAAG
+GCCATCACGCCGCTCAAGCTGGCCAACTGGGCCGGGCGTAAACGTAAACTCTCCCAAGCG
+ATAGGGGACGGCAGCGCCACCCAGTACAACGTGACCCACAACTTTGGCACCCGTGATGTG
+CTGGTCACGGTGTACCGCAATGCGACCCCGTGGGACGATGTGCTCTGTGACGTCGAGCGC
+CCCGATGCTAACACGGTGCGGGTGCGATTCGCCGCTGCCCCCAGCGCGAACCAGTTTGTG
+GTGGTGGTGATCGGCTAGTGGAGCAGTACAGCCCGCTCAAAATCTTGTCTCTATCCGCGC
+TCCCTGCCGCCTCGGACTACGCCGGTGCGCTGGTTCGGGTGGGGGGCAGCCTCTACTGGT
+CGGACGGCGCCAACTGGCAGCAGCTAGCCCCGGCGGGCGGGGGGGGATTCAGCGGCGTGC
+GCCTTACTGCAGCTAATTTCAGCGTGGCGAATGATACCTGGACCCTGGTTTCGTGGGCCA
+CCCAGGTTTTCGACCTCGGAAACTACTGGGCCTCCACTCAACCCACCCGGCTCACCATCC
+CTAGTACCGGCTACTACCTGATCATCGCTTCCGCCGAGTGGGACCCTGACAGCGGTTCCC
+GCGGCATTCGACTCAAGATCAATGGTGCGACTGTCTATGACTTGGTGATAGACGATACCG
+GGCGGGCGCAACCCAGACGAAACAACGGCAGCATCTTGCTGGCTTTGACAGGGAGCGATT
+ATTTGGAGGTGGAACTCTATCACAACAGCGGCGACCCCACTGAAAACGTCATCCAAGCCG
+AAGTCGGCGCAGTCAGGATGGGATAGCGACTGGAGGCAATGTGGGCAACTGGCAAATCGG
+GCTCGTCGTGTTGGCATCGGTAGTAATCGCGTTCGTGCTGCTGTGGGACTCGTTGTCCAA
+ATCCCGCGATATCCCCCAGGGCTGGCTGTGGCTCATCGCGTTGGTGTGGGGGTCGGTGCT
+GGGGGTGAGCGACTTAATACGGCGGTTCTCGGAGCAGAAGAAAAACAAGGGAAAGGAGGA
+CAACAGCGATGATTGA
+>NC_014212.1|provirus_1746722_1764354
+TCATATGGCTTTATGATAAAAGCCTGAAGTATAGGAGTGGCGGAGGCCGTGCAAGCCGAT
+ACGGGGCAGCCCTGCCCGCTCGATCAACCGCCGAAATGCCCGCATGACGTTTCGGTAGGA
+CAGGGGGGTTCCCCGCTCTGATGGGAAGATCAAGCCGTGATCCTTCCACCTCCGGGCGGT
+GGTGCGCTCCTCGAGCTGGTAGCCCTGGTGCTGGTGTAGCAGCTCTTGCGTCGCAGGGTC
+AAGGTAGATGGGGGCGCTTGACCCCGGCGTTTTGGTAGGCCCCAGGCTGCCATCCTTTCC
+AAGAGTATGTCGGATGTATAGCCGCTCGCCCTGCCAGTCTTCCCAACGCAGGGCCATTGC
+CTCCCCTATGCGGATGCCGGTAGTGAGCATCAGATAGAACATGGGGTAAAGCCGGTGAGC
+CCTTGCGGCCTCGAGGAATGCCGCCGCCTGCTCTCGGTTCCAGGCTCGAGCGGGCCGGAC
+GACTCCCCCCGCCGGGGGGTCTACCGCCTCGATGGGGTTGGCCTCGAGCAATCCTAACCG
+CACTGCATCCCGTAGCGCCGCCCGCAAAAATTGATACAGATGGCGACGGCTCGAGGGCGA
+CAGGTCCGCTAGCTCGGCAAAGCGAGCACGGATAGCCAGCGCGGACAGCCGGGCCATAGG
+GATATTTGCCAGCGGGGCTAACATGCGCTGATACTCGGCATATTTGCGCTGCGTTGAGAG
+GCGAATATTGCGGCTTCGAACGCGCTCATCCGTCCACCGCTCGAGCCATTCTCCCAAGCG
+CAACCGGCTAGCCTGGATCACGCCATATCCCGCTTTGGGCAATAGCCGGGCAAGCCGCTC
+AGCTACCTCGCGCCGAGTTCTGCCGTACACCCAACGCTTTTGCTGCTTGCCATCCAGGCC
+ATAGCCCACCGTGACGAAGGCCGCCCAGCGCCCGTCCTTGCGCTGGAAGATGGAGCCTTC
+GCCTTTGCCACGCCGGGGCATGTTATCCTTTAGTTCAATGGCGATTGAAAATAAAAATCA
+TAATAATAACCAGCAAAATCCACAAATGCACTGGAACTTTTTTCATTACACTCAAGACCG
+GTTTACTTAACTGCCAATATCGTTTTGCAAGCAAAACAAAAGAAGGTGCGACGGAATACT
+CTAAACTAAGTTGACTTAACAAATCGGACTGACCCAAAGACGCTTTATATAAAATGGCAA
+GTTCTCTTTTCCCCCACAACTTCACTTTCGCATGCTGCGCTTGAATCTTTGCGCTCTGCG
+TAAAACCCGGACCTGTTGTGATTACAATTGCGTATTTAGCCTTCCAAACAGGCATAGCCC
+CAAGAACTGCCTGAACAGCATCATTTCCAACTTTACCCTTCCAATGCTTAACCTGAATAG
+CATAAATGCCAATCGGCGATTGAGCTATTATATCGGCTCCAAAATCATTACTTGGTGGCG
+TAGTTTTCGCCTTCCAACCAGGAATTCGATTAAACATTTCCGTTATTAAACGTTCTACAT
+CAACAGCGGAAGCATTTAAAATGCGTTGAGCATAAAACTGCTCAAAATCATTTGGGTCAT
+ACATCCGGTTTTTCACAGCTTGCCCCCAAGCGGATCATGGTAGTAGACACGGCCAATCAC
+CCGCATCTCGGATGGCCGCCACGGCCTGTACTTGGGATTGTCCGACACTAGCCACAACTC
+GCCATCGTCTAGCCGCCGCACGCGCTTTATGGTGTGTCCATCGCCGGGAATTTCGAGGAC
+ATACACCCTCCCCTCGCGCAAATCGAGGTCTGAGGGATCCACATACACCCTGTCCCCATC
+GTTGAGCGTGGGGGCCATACTATCTCCTTCAACCTGGTATAGCAAACTACCCCTGCGCCA
+CACATCCGCCAAAACCGGCATACCATCAGCATCAACGGGCCGCCCGGCGCTGGCAAGGCC
+CCGTACCAGCTCGATAAAAAAGCGCACCTTGCTGACGCGCTCGCCGGGTTGCAAGGACGT
+GGGAGATTCCAAATCTAAAAGAGGTTCTAGCCCGGTTTGTTCTTGCCAATCCGAAGCCCG
+CCAACCCAGCGCTTTCAACAAAAGAGAAAACTGCCTAACCGTAAGTGTAGAAGGGTCTTT
+TTTGCCGTTCTCGAGCCTATATATGAGAGCTTGATACAACTCTCCCCCTGTTTCGTTCTC
+GATATCCACCAAAGATTTCCCTAGCATAGCCCGCCTGGCAGCAATAGCCCGCCCCCACGC
+GGGCTTTTCTTTTTTCGTGACTTTGGGCATACAGCCAATGCTATGGTTAGCGACTAACAT
+AAGTCATTCACCCCCTGTCAACACTATGAACGCTATGACTTGACAAGTCATGAACTTTGT
+GTTCATACTTGGCATTAGCCATGAACGAAAAGTTCATAACCTCAGGGAAGGCGGCAAAGA
+TTTTAGGGGTAGCGACAAGCACGGTCACCGCTATGTGCGAGCGGGGCGAATTTTCCGGGG
+CATATAGACCCGGCAAGTGGTGGCGCATTCCGCTAGCCGAAGTGCAACGCAAGCGGCAGC
+CCCGTAAGCCGGAGGCCCCCCGTGAATAACCCCAAAATCGCCTACCGCGTGGACGAGGCG
+GCAAAGCTTTTGGACGTCCACCCCAGCACGGTTTACGAGCTGGTACGCGCCGGGTCTATC
+CCCCACAAGAGGCTAGGCCGTCGAATCATCATCCCCGCCCGGGCGCTCGAGGAGTGGATT
+AACTCCCCCGAGCCCTGGGCCAGCTACGACTACGCCCATAGGAGATAACCCCGGCTTTCG
+CCGGGGTCAGAAAGGAGTGTGTATGGATAGTGTAACACAGAAAGCACGGCTCGAAGAAGA
+GGCCATCTCCCTATATCGGGAGTACATAGAGAAACACGGTTATGATCCCGAGCGCGCTGC
+TGCGGCGGCGGCGCTGGAGGTGGCCGAGGGGCAGCAGGCCCTCGAGGCGCTGGAGGCCGG
+CAATGCTTCCTAGCCGCATCCAAATCCAACGCCTCGAGAGGGCCTTGCAAATATCGCTCC
+GCCGGGTTCATGGCGGAAATGCTGATTGCGCTGCGTTCCTTTGGGAGCTGCACGAAACGG
+ACTATTACGCCCCACAATACGCGCCCCGGCCCCATCGGGCCTGGCAGGACGCTAAACGCA
+TCATCAACGTCCTCGAGGCCCTCGAGGCCCTCGAGGCCGTCGAGCATGTGCGCATCAAAC
+CTGTTCGGGACGCCTACCGCACGGGGGAGTTCTATGCGTAACAAGCGCTTCAACTGGCTC
+GCCTTTTGGGGGGCCTTTTTCCTGGCCCTGGTGGCCTGGGGGCTGGCTTTTGGCATCCCC
+TGGGGCCTGGATTGGGCCGACCGGAGGCTGCCGTGATGATCCGCTGGCTAATTCGCGGCT
+TTGTGCTGGTGGTGGGGCGGATTGCCCTGCCCATCATCAGCCCGGAGCGGCTAGGAGGCA
+GACTATGAAATGGAGCGAACACGCACAGGAGCAAGCTAGAGCATCGCGTGATCCACGGGT
+CACCGAGGCTTTTCTGCGCATCCAGTCCCCCGGGCACCGCGCGAGGATGGTAGAGCGGCG
+CCTTGAAACGCTGGGCTATTCCGTGCTGCTCAATCAGCGCGGTCCCGAGCTGTGGATGGC
+GGAGTGCTACTACGTTCGGGGCCAGGGTAGCCGACTTTTTGCCCGCCCGGTAGCCCGACA
+GACTGGGAAAACGCGTCTGGGCGCATTATTGGCTATTTGCGGGGAGCTGGGGGTGGTGGT
+GTGACAGTATCCATTGAGGACATGATTACTGCTGTACGCCGTGAGCTGGCGCTGCGGAAA
+AACGTCTACCGCCGCCGGGTAACCGAGGGCCGCATGAAGCCCGAAGAGGCTGCCCGCGAG
+TATGCAACCATGCTGGCGGTCATGCTCACGCTCCGGGACGTGCTCGAGGGCGGGGTAGTC
+GTCGCCAAAGATGTCAAAGATGTTGAAGACTTCAGTGCGAACGCGAACCTACCCACCGAC
+CCCCGCCCCACCGACCGCCTGACCCAACTCGAGCACAAACTAGAGCTGCTCGAGCGGACC
+GTGTCCGCCCTCATCAAGGATTACGCGGAAAAAGTTCTACAGTGATGGACCTTTACCCAT
+TTGCGGGCTTAGCCGCCTGCAACCCTGGCCGCACCGCCCGATTCCGCCGGGCGGGGCTGC
+TAATCGCCCTTACCTGGACTCCCTCGAGGGAGTGGGAGGCCAAAATATGGGGACCTAACG
+GAGTAACGGCTAATCAGCTCGAGGGCATTGCTAAGGCCCTCGAGCTGGACTTTTACGCCA
+TTGAAAGCTATCTATCGGCAGACTTTCAAAGCTACGTGTACGTCATCACTGGGGGCCGCC
+ACATCGCCCCCGAGTTACAGCGTCAATATGATGAACTCATCTCCCAACGCCGCGACACCT
+TCGCGCCCATATCCTGAGTTTAGCCCCAAGCTCGAGGGCTTCCCCCGCCCAATCAGCGAC
+CGGCTGGCGTATCATCTGAGCTACGGAAACCTTAGCCTGCCCCCGGATGATCCCCGCTGG
+GGGCTTATTGATTCGTACTTATCAAGTGAGGCCTTGGCCGTCGGTTGCCAAATAGCGAAA
+TCCGCTAACGCGATATGGCATCGGCGTATTGAGGCTAGCTGGGTGGGGCCGGGCTTGTCA
+AATGCTCCATATCTCGACGCTACGTCCAGCACGCAATTTTTGGGCCTTCGGGCACGACTG
+CTGATTAACCCGGGAACCCTCAAGCTCCGCATAGGGGGGCTATTGCAATCCGGGCTAGGG
+GGGGAGAGCGTGCGGGGAATTATCCGGCGATTGAGTAAAAAAAGCCGGAGTAGGCTACTC
+GAGCTAACCCGCGAGCTGGAAGCGAGCGATATTTACCCCGAGCTAATGATTACGCTGACG
+TACCCGCGCGATTGGGAGGGGGCCATATCGCCCGAGCACGCCGAGGCTCTTTGGCAATTC
+CGCCGCGCCTGGGGCAGGATGAACGCCCACCGCTACCGACCCAAGGGGCCAGGCTGGGCC
+GAGCGCTGGGCCGAGCTGCGGGCTGAAGTCCGTGCGCGGCTTTTGCGGCTGCGCGAGGTC
+GGGCCGGATGGCAAAAAAGTAAAGGCGCACCTCGAGGCCTTCCGCAAAAGATTTGAACGC
+AAATTTGGAACATCGTGGGGGTTGATTTGGAAGTTGGAGTTCCAGCGGAGAGGGGCTCCA
+CACATCCATCTCTTTTTGTGGAACTGCAACGACATCGACCCTACGGAACTCCGGGCCTGG
+ATAGGCCGGGCCTGGGCAGAGATAGTTGCCGGATCAGACCTGAGCGCATATTTCGATCCA
+CAGAAACTAGCGCTATATGACGCCTACCGCGAGCAGGGGGGAAGAGAATTTGCCGAAGCT
+ATGCTCGAAGGCATGGGGCTAAACGCGGGCACTTGGAATCACATTAGGGCGGGAACTGGC
+GTGGAAGTAATTCGGGAAAAACATTGGGGGTATTTGGCTAAGGAGGTGCAGGGTGGGATG
+AATAAAGCGTATCAACACGATGTGCCACGCAGGTATCGCAACGTGGGCCGTTGGTGGGGA
+TACTGGCGTTATAACCGTGCCGGCTGGATTGAGCTATTTTACGATCTCGCCAGCGCTTCT
+ATGCAGGAAATCAAAGAGGCTATTGTAAAGCCGTTTGAGGCCGCCATAAAAACCCTGCCT
+AAGGCGTGTACGGATTTCAAAAAAAGAGCAAAGGCCGCACTTACCCGTTTTCTCAAAACA
+GGATCATTAGCCGCGCAAAAAGTCGATTCTGACGGCGTAGTTACCGAGGGGGCCTACGGC
+TATCTCACTGTATGGGGCCGAGCCGGAGTACAGGCCGCTATAGGGGCGCTATGAGCAGCT
+ACCGCAAACCAAAACACAAATGTCCAGCCACCGGCAAGCGCTCCTACCCCTCCCAACTCG
+CCGCCGAGAACGCCGCCATCCTCTACCGAATGCGGCTAGGCAGCGGGGGCCGTCCCTACG
+TGTGCCCGCATTGTGGATGCTGGCATCTGACCACTCAGCCCCGCCACAGCAAAGATAGGA
+TGGCAACATGCAACAAATAAGAATCCTCTTGCTGATAGCCATAGCGGCTTACTTCGCTTT
+CCAGTTTCGGGGGGCTTCCCCCACCTCGAGCCCCGCCAAAACCCCAGCCCCGACGGATAC
+CCCGCCCTGCACCAGCCACATCCTTGAAGCCGCCGCCAGCACCCGCGAGCTGCGCCTGAA
+GGTGAGCGGAACCGCCCAAACCCTCCAGGTCGGATACGACGGCGGCATGATGGTGAAAGC
+TACCGAAGAGGTGTGCAGCGGGGGAGAGTGCCGCGTCTTTACCCCCGCTGCCCCTAAAAC
+CGTTCAACTCGATGGTTGCCCGGCCATAAACCTGCCCTAATCGCAATACTATTGATGTAT
+ACTGTTACTAATGGAAAGCGAACTAACTAGACGTCCAGGAAGACAACTCACTATGGGCCT
+CTTACGCAAGCGGGACCGGCTGGATATCCGCCAACTTCCGCTTTCTGACCTGCTCTATAC
+CCTCTGGGGCGACCGCACCGCCGCTATCAGCGTTGCCGAATATGCCGGGGGCGACCTGCG
+CAACCTGCAAGGCAAAAGCGCCATGGAACTGCTCGAGCTGCCCGGAGTGGGGGAGGGGAG
+GGTTGCCAAAGTCATCGCCCTGTTTGAAATCATCCGGCGGGTGGTACAGCGGTGAAACTA
+CGCTCCAGCCTGGCAATTCAAGACAAAATCCGACAAAAACACCAAGTCCGGCTTTACGAA
+GTCGCAGAAGCGATCCGTGATCCTCGCCGGTATACCCGCAGGGTCGAGATCGAAGCCGAG
+GGAACGGTTTACATCATTGTGGGGAAAACCAAATCGGGGCGATTGCTGCGGGTAGTATAC
+ATTGCCAAAAAAAATGGCAACTGGTTGAAAACCGCCCTGGATGCCTACCCACGCGACCGA
+AAGATGTACAATAGAAAGTAGCCATGGCGAAGCTCAAGGTACCCAAGTTCAAAAGCCTGG
+ATGAAGAAATGAACTTCTACGCCAACATTGACCTATACGCCGAGGCCCGCGAATTGAGCC
+CCGATGAGGAAAAAGCCTTGGATAAAAGCCTTGGCATCCGGCGTAAACCTCACCCCGCCG
+CTCGAAAGCTCGCGTTGCACCTAAGCAAAACCTCGGGCGGGGATTGACGCCCACCGCTAC
+GTAAACCTGGCAGGGCTCACCTTAGCCCTGCCATAGCTTTTTTGCGCCGGGGCTGAAACG
+CTATCGGTATGGCGGAATTCCGGCGTATCCAGATAAATGCAAACACGCCGCTAACCCCAG
+GCTTTTACGAGTTCGTGGGTGAGGTAGAAGGTAGCCCAGAGCGGGCCACCAAAAGCGACA
+TCCAAAGCTACCTGCGCGGGGCTACCCGGCTGCCCGACCTGGAAGTTCTGGACTGGGCCA
+GGGTCAGCGGGAACACCTGGCGGGTGCTGGTGCAGGTCAAGACCATCCCTAAAACTCAAG
+CTCAAAACGACGGCATGGTGCATACCGCCGTAGCTCCGGTGGTGGTGTGGGTGGTGGGGA
+TCATCGTCACCGCGTTGCTGGTCGGCTACGGCATCTTCAAGTTCAACCAAACCAAGCTCG
+AGATGTTCCAGCTCATCCCCGAGCCCGATCGGAAAAGCGTCGCCATCGCCCAGTCGCTTA
+ACTTCGGCCTGATTGCGGTGGCAGGGCTGGCAGTACTGTTTTTGGTGCTGCGCAAATGAA
+ACGTAAAGAATTGCGGCTCGAGCTGCCCAGCCTGGATTTACCCCCGGCAGAACCCCCCGC
+TGCCGAACCCACCCCCATCCCGCCCGGCGAGCTGGACCCCTTGCTAAAAACGGCGGTGGA
+CTCGCAGCCGGAGGTTAAACCGGCCCCCCAGCCCACCCCCGAACCCCAACCCACGCCCAA
+ACCCAACCCTGCGCCCCAACCTCCATTGCCCCGCAAAGGCTACGGCCCCCTCATCGTAGG
+AGGGGTGGCTTTGTTGATCGGTTTGAGCGCCGCATTGCTCGGAGGCAAACCCAGTGGAAA
+CGGAACCCCTCAACCCCGACCCAACCCCCCCCAACCCCCCAGCCGAAACGATTGGGCCTG
+ACCTCGAGCCCCCCTCGCCGGAAATTCCCGAAGTGGAAAACCTGGAGGGGCTCGAGGCCG
+AACCCGACTCCTCGCCCCCGCCTCCCGCCCGCATCCCCTTCCGAGGAGCCGAGCTGGCCG
+CCTTCGCAGGCATCCTCGGTATGGCGCTGGCCCGGCCCAAAAGCATGGGAGAAGTCAGCG
+TCTTTGGCGAAGCATTCCATGGGCCTATTCGGCTTTCGCTGCCCGCCATGGGCCTGGACT
+TTTCCACCTCGGTAGCCGAAGCCCTGGACTCGCTGCGGGTAGGGGAGGCCCTGGCCGCCT
+TCGGCATCTACAAGCCGGGCGGTTGGGGCGGGGATTTAGGCGAACTGCCGCCGCTCTTAC
+GGCTAGCCCTGGGCGTCGCAGTAGTCGGGTACGCCGGATTTGGAGGGATTCGTGCTGTTC
+AAGAATATCGAGCTGCGCAAGCTGCCCAAATGGGCACTCCCGGCAGCGGCCCTAATCGGG
+TTCCTAGTGCTGATGATGCGAACTAACCCCAAACCCAAAGGGGCCAGGCCATCGGGGCGT
+TACTTTTACCCCATGAATCCCTTTGTGCTGCCCCCCACCACCGGTTGGATGGATACCGAA
+TACCACGACTACGGAGTGCGCGACCACCGGGGAAGCGGCTACCTGGTGCGCCCTGGGTAC
+TGGCATCCGGCGGTAGACCTCAACAACCCCGGCGGGGGGGATAGCGACTGTGGGCAAAGC
+GTTCACGCCATCACCGACGGGGTGGTGATCGTAGCCGGGTGGGCTCCGGTGATCGGGGAA
+CGGGCGGTGATATGGCACGAAGGGCCGGGAGTGTGGTCGGTGTACTGGCATCTGCGCAAC
+CTCGAGGTCAAACCCGGTAGCGTGGTTATGGCCGGGCAAAAAATTGCCGAAGTGGGGCGA
+ATGGCATCCGGCGGGTTCTGCCACCTGCACTTCGGCGTGTACTACGCTCAACCCCCAAGC
+TGGGACTACTTTCCCAACGAACTGAACGTGCCCAAAGAAAAAAGCGTATGGCTCAAGTAC
+TCGGTGGACCCGCTGCAATTCCTGAACAAAAACAAAGCCCAGCTACCGCCTAAATGGGAG
+CGTGACTAATATGGAAAAAGCCCTCAAGCTGGTCAAAGAAAACCCCCTGGCTCTGGCCGC
+CCTGGCCTATGGCCTCTACTCGGGCCTGGGCCGCCTCAAGAACCTCCGCGAGCAGCAAGG
+CTGCCCCAAGTGCGAAACCGCCCAAATGTATTTGGGCTTCGGGCTGGCGGCTTTCGCGGC
+CTATACCCTGTGGCAGGACTACCGGGCATAGTGAACCGCTCCGCTTTGCGCATCATCATC
+TCTGGGAAAACCCGCTCCGGGAAGACCACTCGAGCCCGCGACCTGATCCGCGCCCTGCGC
+CGCAAAGCCCGGCGGGTGGTGGTGGTGAACTTCAAGCCCGAGCTATGGGAATACGCCCAA
+GGGCGCTATACCGTAGACGACGCGGGGAAGAGCGCCGCCCTGGTGGGAACCGCGCTGAAA
+AAACACCGCGATGTGTGGTTTTACCTGCGGGCTCCCCGCCGCCAAGAATTCATGGATGCC
+CTGGCCTGGCACATTTTGCAAGAAAACGACCTGCTACTGGTCTGCGATGAAGCCCACCTG
+GCCTGGCAACGGGGCCAGCTCAGCGAAAATCAGGTGCGCGTCTTTACCCAGGGGGCCGGG
+CAGGGGATCAATACCCTGCTCATCTCGCAAACCCTGGTGTCCCAGGCCGGAAACATTGAC
+CCTTTGCTGGTCAAACAATCCAGCCACCTGGTGTCTTTTCAGCTCACCGAAAAAAACGAA
+GTAGACCGGCTCAGCGAGTACATCCCCGAACTGGGCGAAAACGTCCGGCGGTTAGCCAAA
+GCGAACCTGCCCACCCCCGGCGCGCCCGGAGAGTACGTGGTTAAATCCTTCGACACCGGA
+GAGGCCGGAGTAGCCGCGCGTTCGCCCAGCGATCCAAAACGGCTGCTTTGGATTCCCCTT
+ACGCACGACAACAGCACCGGAGTTTATCGCTTTCTGCACGGCGACTAGGCAGGGCTCACC
+TGAGCCGCGCCGTTGACACCGAGGTAAAAACGCCTCCAAGCTCGAGCTATGGCAGATCGA
+GCCCTTCCGCAAATCGACACCAACCCCTTGCAGGTGGTGCAAGACCCACGGGTGGTTTCC
+GGGGCCATGGGAGTCCTGGGGGCCAACCTACTGCGAAAAGCCCTCTTTACCCAGCAGCGC
+AGCGTGTTTGGGTACGCCGCCAAAGGCAGCGATGGCCGCATTCGCTATTACGAGAACGCC
+GATGAAGCCAAAAAGGGCGACGCCGGGAAGCAGATAGCCAGCGCCTACCAAAGACGCATC
+TTTCTGCACCTCGGCTACGTACTCTTTGGAACGCTGGCTATGAGCTACGGAAAGGAAGCC
+CGCAAAGACGATGTGCTCTCGAGCACCGATGACACCACGCTGATGGTCAAATACGCCGGT
+TTGGGCTTCGCCGCCTCCGGCTTCGCCAACCTGGTAATGACCCTCTTCAACATCGAGTAA
+AGGAGTGATATGAACCCTAGCGCAGGACGCCCCACGGAAATCATCATCAACGACCCTAAC
+GCCTCTTTTTTTGCCGGCCCCCAACGGCTTCGGCTGTGGGAGTATCTCGTACCGGTAGGG
+GTAGAGTTGAAAATTCAAAACCCCTTCCGCCTCATCGCCAAGCTGTACGGGGCCGGAAAC
+GTGCAAATCCCGGCCTCATCCAAACTGTACCTGGCCCGCATCCGCCGGGGAGATTTCGAG
+ATTGAGGACCTGGCCGAGATTCCCTATGCCCCCTACTTCTCTCTCACCATTGACCAGCAG
+CTCGACGCCAACTTTGCCGAGCGGATCACCCACGTGATTGAAAACACCGGGCGCATGGGC
+TACGCCTTCGATGAAGGCGACCGGCTAGCCATCCTCATTGAAAGCACCCTCGCGGTGGAC
+ACCACCAACCCTAACAACCGCATCCAGTTCACCGGTCTGGTGAACAACTAAGGAACGCCA
+TGGGACTCATTGACTCGCTCACCAACCCCCTAGCCGCCGTCGGGGCCGGGGTGAGTAGAA
+TCGCCTCCGTTTTCCGCGACGCGCCCGAAGCAGGCCCTACCCCTACCCCGGCTGCCGCCC
+CCGCTGCCCCCGCGCCTGCCGCCCTGGCAACAACGCCTTGGCGGCAACAGTACATTGACG
+CAAACGACTTTCAAGCCGGGGAAACCTGGCGTAGCGGCGACTATATCCGTCTGGCCCAAT
+TTCTGCTACCAGAAGGCACCGAATGGCGCCTGGAACGAGGCCGCCCTTACGGCTTTTATG
+TGAAGGCGGTGCAGGACCTAGCCGGGCAAAACCTGGGAGCCCCCGCCGCGCGAAACGTGG
+TCATCAACGACTTACAAAAGAGCACCCAAGCCGGCCAGGCTACTCTACCCGCCACCTACC
+ACCCCGATGTAGCGGTGTGGGCTACCACCGGCAGCGGGCGGGTCAAATGCACCATCACCA
+ACGTTGACTACACCACCAAAACCATCACCTTCACCGAACCCGCGGGGGTCAACGGGGCCA
+GCGCCATCCAGGTGTACTACCTCTCCAACGACGGGGATTGGCGCATCCGGGTCGCCCGTG
+AGCTAGGGGTAGATACCAGCATCGTGGCGATCCTCAATGACTCCTTCGCCGTCGCCCACG
+CGGTGGACCAGCTCAACCGGCGCACCGCTCGCTACTGGCCGCAAGATACCGTGCTGGTGC
+AAAAACAACGGCTGGTGCTGGAAGTGCGCACCACGGTGAAAATGGTCTGGACCCCGGAAG
+CTGAAAACATCCTCAACTTCTATGCCTGGATGCGCCAACTCAAGGTGCTCGACGATCAAC
+GCCTGGGCCGGGTAGCGGAAGGTGTGCAGCGCAGGGGGTTCTGATGAATCCGCTCGACTC
+CATCATCAAAGGCGTCCTGGGGGTCTTTGATCAGGTCTACTACTCGGATGAGGAAAAAGC
+CCGCGACCAGCAGCAAAAAGAGCTTGCCGAGGAAAAACTGCGCCTCGAGGCCGAACTACG
+CAAACAGCGCGAACAAACAGCGCAAAACGTAGCTATCGGTGCAGGGGTGGTGGCCCTGGT
+AGGCATCATCACTTGGGGCGTGGTCGCATCTAAAAAAGCTGCGTAGGGTGGGTAGCCATG
+GCTGATAACGTCGGAACCACCATCGCCATCACCGCAGTCGGGCTAGCGGGGGTCGCCGCC
+GCTTTTGTGATCGTGGACCGGTTGACCAAGGCCCAGCAGCCCTTCCAGAATCCAGGCCAA
+CTGCCCGCGCAAAACCCCGGCAATACGCCCGCCCCAAACCCTGGCAATACGCCCGCCCCG
+AACCCCGGCGGCTCTGCTCCCCCTGCCAACCCCGGCACTCCGGGGACCGGCGGCAGCTAC
+ACCTATGGCGACCGCTGCAAGGAACTGCAAAACCAGCGCAACACCTACGAGGGGCTGCAA
+CAAACTGCCCAGCAAAAGATGGATGGCGTCATGGCCGAAGTGGAGGCGCACCGCCGCGAC
+ATCACCCACCACAGGTTATGGTGCATTACGGATTGCAATTGGCACCTGGAAGAGCGCTCC
+AAGCGCATAAACGCCTACGTGCGCGGCGAGCCAGTAAGCGGGTACTGGAACGAACAACAA
+CTGCTCGAGGCCGCTGACGGAGCTGGGGTAAACCTGCGCGAGTACCGCAAGCGCTACCTC
+AAAGCCAAATCGGAATACGACTCCTACGAGCAGCAAATCAAGGATATTGATGCCGAGCTG
+CTGAAACTCTCCAAGCAGGGGGTGCGCTGTTGAACCCCGTAGAAATCAAACAGTGGGCTG
+AGCTGGGGATTAGCGTGCTCGCCTTCCTGTCGTTCGTGGCGTTGGTGTTCAAAGTGGGCC
+TGCCCCTGGTGCAAGCGGTAGAGGCGATGAGTGGGGAATTTCGACTGTTGCGCCAAGCCC
+TAAGCGGCGAACAGATGGAAAATCTGGTACGCGAAATGCGATCCACCCGGCATAGCCTGG
+AGGGTATGAACCGGACCATGCGCCGCCTGGAAGGGGTTCTAGAGCGAAAAGGCTTTACCT
+TCCGCATGGAAGACGAGGTGATGCCGTGAACTACTTGGTGTTGGGCCTGGGATTGGGAGT
+ATTCGCCATTGGCGGGTATCTCTTCCTCGAGGCAAGAAAAACCAAACCCCAGCCCCCCGC
+CCCCGACCCGATCCTGAGCAATCCAGACAACCGCGATGCCTACGACGATTACCGCAAGGG
+GGAAAGGGACTCATGGGGATGAAATGGCTGTGGGGAATCCTGGTAGCGGGGGCAGCGGGA
+GCGGCCTTATGGATCTACGCTCGAGGCCGAAAACCCGCCGCGCCTGGGCTCAAGAACTGC
+GCCCAGGTGATTACCCCCTGCGCCGATGGCTTTATAGCCCCCACCCCCTGCGGCTGTGCC
+AGCCACGGCGGGGCAGCGAGAACTACCCCGCCCCCCTTGCCGCAGCCCCAAACCCCCACT
+CCCCAGCCGACCCCTCCGATCACCATCATGCCGGTGCCTAGCGAACCTCCGCCGGGGGTC
+GGCACCACCCTGCCCCACTGCAACCCCGATGAACTGTTTCAAAACGGGCGGTGTGTACCC
+AAATCCCCTCCGATGGATCAAGCGGCGCCGCCTCCGCCCGCGCCACCAGCGCCTATCCCC
+CCAAAGGTTATAGACGCGCTGAAAGGCATCACCCCACAACCGGCTACCGAAACCAAACCG
+CGAAACGTGACCCTACCCGTAATAGCCGATATCTACTGACGGAGGAACCATGGACACCAA
+ACCCTGGTACATGTCAAAAACCGTATGGGCCGCCCTGCTCACCGGGCTACTGGGAACCTA
+CCAAGGTTTAGATGCCGCGCTCAATGACGCCCTGCCGAACATCCCCCAGTGGGTGTTCTA
+CGTGCTGACCGGGCTGGGCCTGTACGGGCTGCGCACCGCCGATAAAAAGATCGGATAACC
+ATGGAACAACAACCCAGCACCGGCGAACTCATCAAGATGGGCTTCTGGCAGGCCAGCGGG
+CAAGCGCTTTTTTGGGGAATCGTCTTGCTGATACTGGGCATACTGGGCAGCTTCGTGAAA
+ACTCCCCAGCCCACCGCACCAGCAACCTCGGAGAAACCCAAATGTTCGGCCTAGATATAT
+CCAACATCCTGGCGCAGATTCGGGGGCAGCTAGCCCCCGAACTGGAGCGTTTAAAGGTTG
+AACTGGAATGTAAACTGGATGCCCTCATCTCTGCCGTGCTCTCCGGACCGCGCGGGCAGG
+AATACGAATTTGGCCGGGGGAAGCCGGAGGTGCGCGGCCACGATCCGGCTGTATTCCCGG
+CCATCGTCAAACTAGCAGGAAAGCAGCGGGCCAATCTGGCCGCGCTGCTCTCGAAAACCG
+TAACTCGAGGATTCGCCGCCAACATCGGGACCAATCCGGCCATTTTGCGCTTTTGGAAAG
+AGCAAAGCCCCGAACCATCCGCCCCTTTTACCCTACTGCCTGGGCAAACCGTGGACTTTA
+GCTGGTTCTTCGACGAAATCAGCGTGGAGGAAGCCACGCCGGGGCAACCCGTAGAGGTAG
+AGGTGTTAGCCCAATAATGAAGCGCACCGTCCTCACCACCCATCGCGGCAAATCCTATTT
+GCCGGAAATCGCCCTGTGCCTGGGGCCGCAAATCATGGGCCAACCAGGAAGCGGCACCTA
+TGCCGATCTATACGGGCGGGTGTGGGCCTCAACGATTGAGCCCGATGGGCTGGTACACCT
+CTGGCAGGCCACCGCCTCCGACTGGCAGGAAGTGCCCATCCCGCAACCCCCGCACGATCC
+CCGGACCATGCGGCATCACTCATTGGCGTTCGACCAGTCCGCCCGGCACGTGCTGGCCTA
+CGAGATAGCGGGGCAAATCTACATCCGGCAATGGGATGCATTGACCAACCAATACGTTAT
+GCGTGGCCCCTGGCCGGGAGTAGATCCGGTAGTTATAGCCGATGCGACGGTGAATTATTA
+TGTGCCGGATAGCGATGTTTTGCTGTTCTATTTGTCCTCGGATCGCTCCAAGTTGTATAT
+GCGGGTACAACGCGAGCTATATGGCACGGCCCATCTAATACAGAGCTTCCCCAACCCACA
+AATACTTGACCAAGCAGTGTCCATCCCCTATCAATTTGAACTACTGGGCTCAAGCGTGAG
+CGCCCCAAACGATTTAGGATTAGTGGTGCGCTCCGACTTGTACCCCGTGTATTTGCCCCT
+GGACGCCCTGACTACGGCATCCGTCGCAACCCCCAGCGCGGGCAACTATTACCCTGTGGT
+GGTGGTTCGTGACCTCGGTACCGATGCTCTGAGCACAGCATCCTTTGCCGTACCCAGCGC
+GGGCAACTATTACCCTGTGGTGGTGGTGGTTCGTGACCTCGGTACCGATGCTCTGAGCAC
+AGCATCCTTTGCCGTACCCAGCGCGGGCAACTATTACCCTGTGGTGGTGGTTCGTGACCT
+CGGTACCGATGCTCTGAGCACAGCATCCTTTGCCGTACCCAGCGCGGGCAACTATTACTT
+GGTGGTTGTGGGACACGATCTCACTCAACCCCGCTACAACTCCCCCGACACAATCACCGC
+AGCTAACATAGCGGTCCCAAGTCAAGGAGCCTATAATGTTGCCTAGAATAATCATCCGCG
+AGCTAAACGCCCCCAGGCCGCAAATTGGCGTATCCCTGCAACCGCAGGAGATGCACTGGC
+AAATATTGGGGCCGGATGGCCGCGTCATCCGGGAGAGCGAACAACCCCTGCATAATCTAG
+TACTAAACAATGCCAAGGAGCTAGCGGCGACCTATCGCTTCTCCACCCTCAACATGTACG
+CCAAAGTCGGCACGGGCTCGTCAATCCCGAGCGCTACACAAACAGCCCTGGACAATCAAG
+TAGCAGATACTAACTCCATCCCCAGCGGCGAGAGCGACAGCGTCACCTACGTTTCCCCCG
+GAGTCTATGACGTGCGCCGAGTGCGTGAGTTTACCGCAGCCCAGGTAAGGGGAAACAATC
+TGACTGAGTGGGGATGGGGGCCAGTTAGCGGCATTGGAAACCTGATGAGCCGGGAACTCT
+TCAGGGATGCCAACAGCACGCCCATTACGCTCACTTTGGGCACGGATCAAAACCTTCGCC
+TGATATACAAAACCCGCATTACCATATCCCCCGCGCCTAATACCGCTACCCCGGCATCAA
+TCACCATTGCCAATTTGGGAACCTACAATGGCAACTTTTGGACCAAGAGGGGGAACGAAG
+ATGCCGGAAACGGCGACTTATACCTAGCAGAGCTGGCCGCAATAGGGGCAGGAAGCCCTC
+TAAACACTGACACTGCCGGGCTATGTATAGCCGGGCTGTCGGCCAACCTGAACACGGCAG
+AGCCGTATATACATGTATATCGTGTAAATGATTTTGGCTTGTCCTACGCCCCTTACACCG
+CAGCCAGTAAAAAGCGCACTACCCAAACCGTCACGGCGGATATTTCGCAGTGGAACACTA
+CCTTATGGGGGCTGATGATCGGAGCAAACATAACCGGATTTGATAACGTCAGCCACGCCG
+GAGTCGTTTTCAACTTTGGTGCGAGTTTTGTAAAAGACAGCCTGCACAAACTAATTATCA
+ACCCTTGGGACATAGTGACCTGGACATGATTCCTAACGTTTCGACCCGCCCATTTATCGA
+GCCCCCCTTAATCCCCCTGCCCGCCCTGCGGGTGGACTGTGCGCCAACGCCCCGCGTGTT
+GTATTCGCATTTCCCGCAGCGGGTATCCCTGGGCTCGATCCTGTATCTCGATTTATACGC
+CTATGCGTGGTACGCGGGGGGCGGCTATCTAACCCTCAACCGGGGCCGTAAGGGGCTAAG
+GCGCACGTCCCACGGGGTAGAAGATGGCCTTGGCTCAACTCGCACGTAATCCCTGGGTGT
+GGCTGGGGGCCATCGGGGCGCTTATCCTGCTGCGGCCTAGAGGGGGCCTCGAGGCCAACG
+CCAAGCCTGCACCCACCCCCAGGGATGGGGCAGGGTGCGGCTATCCTCGCTCCGACCTGC
+CACCCGCCGTCGCAAAAACCAATGCCGAGCTGATCGAGCGGACCTGGGGGATAATCCTGG
+CCGATAATGGGCGGGTAAACGATTTGGCCCAGAGTTACGGCTACGAAGCCCCACCAGGGC
+AATACGCCCGCGACCTGGCCGCCGCGCTAGTGGGAGCGGCACAGAGCGCCGGAGTGCCGC
+TGGATTTGCTCGTGGCACAATCCAGACGGGAATCAAACCACGTGCCCACCGTTGTAACAA
+ACACGTATTTGAGCATCGGATGGGAGGATGCCGCCATTCGACGGGCAGTTGCAAATAACT
+GGGCCATTGGGCCACTCCAGGTCAAGCCGGGAGTATTCCCCGAGGTCGGCTTGCCGTCCC
+CGAGTCGCTGGCTGGGCGACCCGGTGAGGTGGAGTAGTCAAGCCCGGCTCAGGGATGCAG
+TATTAGCCGGAGCACGATATTTAGCCAAACAAAAAAGTCGCTACGGTACATGGTGCGCCG
+CACTACACGCCTATACCGTAGGGCCTACGGCATACGCCAATGGGGCCAGGGCAGACGGGT
+ATGTGAGCCAGATTATTGCTTGGGCCAACGGGTACACGGAGCTGCGCACATAA
+>NC_014212.1|provirus_1893193_1914973
+GTGACCAGCCTTGATCGCATCTATCAACGTAATCTGAGCCCAACCCAGGCCCGCCACTAC
+GCACGGCTGTGCGAGAGGAATCACAACACGTTTGGAGCGCAAATCTACCACGATGTGGCG
+GAAGCACTGGAAGCTGCCGAGCGTATCCGCGCCGCGATGAGGCTGCAAGGCTACCTCTGC
+CCCACCTGCGGTAACACCGGGAGGCTCGATGACATCCCCTGCTTCCACTGTGCTGCTTGA
+GCCAGCCATGATGACCCCGGATCAGATACTGGCCACCATTGAACGGGCGTCTCGGCCTGT
+ACTGCTTTTTTATACCCACGACACCGCCTTGCGGGTGCGCTTCCTGGGTCGCACCATGCT
+CCCTGACCTGACGGACCCCAGCGATCTGTGGGGATATCGGCCCGGCGAGCAAATAGAACT
+ATTTGGCTGTGGAAGAAAAACAATCAATACATCAAGACTTACGACATCGAGCCGCAGCTC
+GAGGCCACCTACCCCAGCGAAGACACCGTTTGGCGCTGGCTGAAGATGCACCTGGCCGGC
+CTACCCCTTCGGGGAATCGGTCTGGCTGGCCTCGAGCTGATTGAACGACGTATGGCAAAG
+GAGAACCCCCATGCCTAGTGCAAGAGCCCTGGCAATGGCCAAAGCCAGCCCTCAGCAGAA
+CCTGGACGAGCTCTTCGCGGCCCTCCAGGCCGCCCAGGGCCGCCCGCTGGATCTCCACAG
+CTCCGGCCTGGAAGTGCGGGCGTGCTTCCTGGGCCTGGAGGACGGTAAACCCCGCTACGG
+CCTGTACTGCTTGGCCCTGGGCGACTGGCTGAACGTGGCAGAAACCACGCTGCGCACATA
+CCTGAGCCAGTCCGGGCCCTATACGTGGGAAAAGGAAGATGAATAACCCGATCTACGAAG
+CTATCCAGCGAGAGCTGGCCTCCTGCCCGGGGATGAATTTCAGCATCTGGGAACTCCTGG
+CCGCGTTCGAGCTGGAGGCTACCCGCAACAACTACTACCGCCTCTATTACTTTCTGCGCC
+AGCTTGAACAGAAGGGGCTGGTGGGGCGCTGCCCCGGCTGGGCCCCCGGGGGCGGAAGCC
+CTATCTGTACGGATTAAAGGAGCCATATGGACGAGTTTGAACTGGCCCGCCAAGTGTTTC
+GAGTTCTTTGGGAGGCCGGCCCCCAGGGTCTGGATCGCGACGCCCTGGCCCACGCCCTGG
+GCGTGCCGGATCGGGAGATGCGGGAAGCGGTCGAGCTCTGCGCCAAACTGGCGGCAAGGC
+CCAGCGTGCCAGGGGCCAGGCCGGAGGTAGTGGGATTTGACCCCATGACCCGGCGCTACC
+ACATCGCCAACTCGGTGGAGCAGGCCGACCGAATCATCAGCTACGCCCTGAGTTACATCA
+ACAGCGGCCTCGAGCGCGTGCGGGCCTACTGCGAGGCCCGCACCTTGCGCTGGGGGGAGA
+TCGAGACGCCCCAGGCTACACAACAGGCCCTGTTCGAGGCCGAGCGGAGGCTAGAGAGGT
+AAACCCCCCACGCCCCGCCACGCCGTGGCGGGAAGCCGGGGGCTTTCCGAGGGAGGACGC
+TCTGCTGGGCAGGAGCAGGAGGTGGACATGGAACTCACAGAGATCGGATGGCTAGGCCTG
+GTCGCCCTGATCGTGGGCTGGGTGGCTGGTGGGCAGGTGGTTGGAGGCGGTATCAGCGTA
+AGTGCCAGCGTCCTCCTGACGGCGGCCCCGGTGCACATCTACGTCACCCCAATCACCGTC
+TGGAGGCTGACCCACAACCAGCTTGTGGAGCGGTTGTGGGGAACCGGCTTTACCCTGGGC
+GGCACGGTGGTTTACGTGGATCCCCGGCCGCCAGCGACCCAGATGCCCGAGCGCGACATC
+AACAGCCTGCGAACCATGATAGAGCAATACGAGCTGGGGCACATCCTGGGCTGGAGGCAC
+TACGGGCTAGAATACCTTCACCAGATAGCCCACGAAGCCTGCCGGTACGACCCCAAAGCC
+CTGTGGGCGGTGCACTGCCGTAACGACCACAGACCCCCACAAATCCTGCTGCCGCATACC
+GGCGCCATCCGGGTGGTGCTGCCATGAACGCGCATCTGCGAAACACACTGATTGCGTTGC
+TGGCGCTCGCCTACCTGGCGACCCTGGTGATGTCGGCCGGCCACCTGACCAAGTGGTTTG
+ACCTCAGCTTGGGCGAGCTGCCCCGGTTTTTCTCTATTGGCCTGGCGGTGGGCCTGGAGC
+TGCTGGCCTTTACCCTTAGCCTGGCCAGCACCCTCGAGCCCCGCCTGCGCTGGAGCCTGG
+CTGGTGGTCTGTTCTTCTTATTGCTGGTCTGGCTGGGCAACCTGCTGGCAATGGCCCGCG
+TGGCCAACGCCCCCGGCTGGGAGGTGTTCGCCCAGAGCCTGTTTGCCCTGGGGCCGCTGG
+TCGCGGGTAAAGCCATTGGAGAGCTGCTACGGCTGGAGCGGCCCGGACGGCCACCGTCCG
+CCGACCTTTCAACAAGCGGACAGAGGGTCCACGTCCAGACCCACGTTCACACCACTACGG
+TCCACCAGGCGCTCCAGGTCACGGACCGGATGAGTTCATCAACCCAGCCCGGAAAACCGG
+ACGAACGGGTGGAACAACTGCTGGCCGTTCTATCCGGCCAGCCCCTGGGACCTTCCGCCC
+TGGCCCGGCGGACCGGACTACCCAAGACCACGGTCTACCGGCTGACCGCCCGACTGCTCG
+AGGCCGGACTGATTGCGCAGACCCCGGGCGGATACGTCCGCACAGAGGTGGAGCGTGGCC
+GGTAACCTGGAACGCTGGCGGGCGGAGCACACCGCTAAATACCTCTGGTGGGTGGCGCAT
+GGCGTGCGGGGCTGGCAGTCCGACCGGATCAGCTACGCCCCAGAAACAGACCGTTTGGCC
+GCACGACCAAAACAGCCTGGATACCTGGTCATCCAGGTGATGGCGCTGCCCGAGATCGGT
+ATCGACCGCCATACGCTGCGGCTGTGGCGGTCGGACTACCAGGCCCTGCTGGATCGGACC
+GATCCGGCTATCAAAGATGAGTGGGCGGCGTTCCTTCACCGTGCCCGATGGTCTAGCCTG
+TGGTATTTCGACGCGAGGAACAGGCGGATTCGTCCCGGGAACGAGCACCGCGGACTGACC
+GCCTGGACCCTCGAGCTGGGTCGACTGGCCGAGGTACTGCCCGGCGGAAAACCAGCCACC
+CAGCAAAATATCTGATACCATTATTTGTAACGTAACCCGCCGCGTACTACGCGGCGGGTT
+TGGAGTCGCGCGTGGACGAAACCGAGAACCACCTCAACCGTTTGTTGGAACACCTGATCC
+GGGCCATGCGGGCCAACCGAAAAGCCGAGCGGGAGGCCGAACTGCGGGAGGCCGAGAACA
+TTCTGAATGCCCGCAAGGTGATTCTGCAGATTCCCAAGCCCAAAGCACCGGCCTGGTGGC
+AGAACGAGTGGGTTTTTCGCTTCATAGCCACCCTAGTGGGCGCGACCCTGGCAGCCCTGG
+GAATCAACTGGAAGTTTTAAAGGAGGCCTATGATCTTTGACAAGAAAAACCCGCGCCGGG
+CCGCTTTGATCCGGGGGCGGATCCTGGAAGTGATCTATTTCGCGGCGATGGGAGACGCGC
+TAAATCCTGACGACCCTTACAGTATGAGCCGCGGGGTGCTTCAGGCCGCGCTCGAGCAGC
+TCAACGAGCTGCCCGCCGAAACCGACCTGCACGCTGCCCTGCGCTACTGCGCTGAGAAGG
+GGTATCTGGAGGTGGCCTGGCGAAAAGACGGCTCGGGGAGCTTCGACAGCGTGCGCCTGA
+CCACGGCTGGCATCGACCTGTACGAAGGAAGCATCCACGACAAGGCCGTGTATTTTCACT
+CGAGGCGCTGAGATGGAGCGTCTGGATCGTATAGAGGCGCAGATAGGCGATCTGCGGGAG
+GAATTGCGTGGGCTGCGGTTGGCCCAGACACTCACCAATCGGGAGCTGCACGAAACCTTG
+GGTGTGTTGCGAACCGTGCTGGAGCAGGTCAGTCGACAATCCCGCCCACCCCGCCTGCAG
+ATCTGGGCGACCATTGCCATCGGCCTGGCGAGCTTTGGGCTGGGTTTTACCGCCCACTGG
+CGCATCTCAGAGATCGAGGAGGTGAGGCATGTCCAGTTTGTTCTACCCCCGCGAGCCCCG
+GTGCAAAATTTGCAACAGTCCGATTCGCGATGAGATTGACCAGATGCTGCTGGGCAATCA
+ACTGACCGAGCATGGCGAGCGCTGGTGCCTGGAGGCGATTGTGGAGTGGGCTCGGGAGAG
+AGGGTTGAACACCAGCATGGCGGCCCTTTCGCGGCATAAGAACAACCACCTCAATCCGGC
+CGTTCAGGCCGCCCTGGAGACCGAGCGGATGGTGGAGGCCATCAGCGCGGCCACCGGCCG
+TAAGCTCAGCGTGGCCAGGGCCTATGCCAACGCGGTGCTCGCCAAGACCCTGCGGATTCT
+CGACGACCTGGAGTGGGACAGGCTGGACACCGACCAGAAGTTACGCGCTGTAACACACGG
+CCTGCGGGCCGGCGAGGTTTTGTCCAGACTGGAGCGAGCCGACGTGCGGCAGGAGGTGGC
+GACCAAGGTCGAGAAAACTCTGTCGGAAGCTGGCATCAGCCAGGATCTGCTGCAAAAGGT
+GCGGGAGATTTATGGACTGGCCTAATACTGGCTTGTTGCTGCCGTATCAACGGGCCTGGA
+TCGAGGACCAGAGCCGCTTCAAAATCGGGCTGTGGTCGCGGCAGGTTGGTAAGAGCTTTG
+CAGCCTCCCTGGAGGCCGTGCTGGACTGTGTGGCGCACCCGCGCAGCCTGTGGGTTTTTC
+TCTCGCGGGGGGAACGCCAGAGTAAAGAGCTGGCCGAGAAGGCCCAGAGGCACCTGGAGG
+CCATCCAGGTGGTGGCTGAGATGTACGACGAGCCCTTCGACGCCGAGTCCACCCAGACGG
+TGATCCGGCTGCCCAACGGTTCTCGCATCATCAGCCTACCAGCTAACCCAGACACCGCCA
+GGGGCTACTCAGGCAACGTGCTTTTGGATGAATTTGCCCTGCACAAGGACTCCCGCGAGA
+TCTGGGGAGCCCTCTACCCCACCATCACCCGCTCCAAACGGTACCGGCTGCGGGTGCTCT
+CCACTCCCAAGGGCCAGCAAGGCAAATTTTACGAGATCTGGCAGCCCGAGCCCGGCGGAG
+ATCTGTGGAGCCGCCACCGGGTGGACATCTACGACGCGGTGCAGCAGGGCCTGGAGGTGG
+ATCCGGAGGAACTGCGCAAGGGCCTCAAGGACCCGGTTCTGTGGCAGCAGGAGTACCTAC
+TCGAGTTCGTGGACGAGGCCTCTGCCTGGCTGCCCTACGAACTAATTACAAGCTGCGAGA
+GCTCGCAGGCCCGTACCGATGGAGCACTGGAAGGAGATCTGTACCTGGGCATGGACATCG
+GCCGCCACCGCGACCTCAGCGTGATCTGGGTGGCTGAACGCGTGGGGGACGTGCTCTGGA
+CACGCCGGGTGATCTGGCTCGAGCGCACCCCCTTTGCCACCCAGCGAGAGGTTTTATACA
+GCCTCTTGCCACAGGTGCGCCGAGCCTGCATCGACGCCTCCGGCCTGGGCATGCAGCTGG
+CCGAGGAGGCGCAAAGCCGCTTTGGCAGCAGGGTGGAGCCGGTGATGTTTACCCGCGCGG
+TCAAAGAGGATCTGGCCGTTACGCTGCGACGGAAATTTGAGGATCGCCTGATCCGCATAC
+CCCCCGACGACCGCATCCGTGAGAGCCTGCACGCCGTGCGACGCATCACCACCAGCGCAG
+GCCACATCCGCTTCGATGCCGATCGCGATGATGCAGGCCACGCCGACGAGTTCTGGGCCG
+CAGCTTTGATGGCCCACGCGGCGGCCAGCCCCAGCGGGCCCATCACCTTCGAGCGGGTCG
+GCTGGGGCCGTATGAGCCAAAAAGGAGCCTGGTAATGTGGCTGACAGAGCAAATTGCTAA
+ACTGCTGGGCCGCAAACCCCCTGTTGCGCCGCTGCCACACCCTGTCAGCGGGCGCGTCAT
+CAGCGGGACTTCGCGGGGCCTGGAGCCGGAGGGCCTGGCTGCTATCCTGCGGCAGGCCGA
+ACAGGGCGATCTGACCCGGCAGATGGAACTTTTTGAGGAGATCGAGGAGAAAGATGCGTA
+TTTGGCGAGCCTTTTGCAAACGCGCAAGCAGGCGGTGCTGGCCCTGGACTACGCGGTGCT
+ACCCGCCGACGATTCGCCGGCGGCGAGGCAAATCTCGGACGAGGTGAGCGCGCTATTGCA
+GCATATCAACTTGCAGGACCTGCTGCTGGATCTGCTGGACGCGATTGCTAAAGGTCTGAG
+CGTGATTACCATGCGCTGGGAGTACGATCGGGACAGCCGGCGCCAGCTGCCCACCGAATT
+CACCTGGATTCATCCGCGAGACCTGCTCTATGATCCGCAAACCGGCGAACTGCGTCTGCG
+CACCCAGGATGGCCCGCAGAGCATTCCCTACGGCGCGGCCCTGGTGCATCACTACAAGGC
+CAAGTCGGGCGCGCCGTCCCGCGCCGGGCTGCTGCGCAGCCTGGCCTGGCTGTACCTGTT
+CAAGAACTACAGCATCAAGGACTGGATTACCTTCCTGGAACAATACGGCCAGCCCCTGGT
+GCTGGGCAAGTACGATCCCACCGCCAGTAAGGACGAGCTCAACGCCCTCAAAGAGGCGGT
+GGCGGCCATCGGGCCGGAGGGCCGCGGGGTCATCTCCAAAGCCACCGAGATCGAATTCAA
+GGAATCGCAACGCTACGGCACTGCCGACGCTTACAGCCGCTTCATCGAGCTAATGGAGCG
+GGAGATGGCGGTAGCCATCACCGGCTCTCCGCTCTCGAGCTTCGATGGCAGCGGCGGCTC
+CAATGCGATGGCGCTTACCCTGGATAAGATCTCCCAGCGGCTGACGCGTTCGGATGCCAA
+AGCGGTCTACAGCACCTTGCGCCGCGACCTGGTGGTGCCCTTCTGCCATTACAACTTTGA
+CCGGGCCGACCTGGCCCCCCGCCTCGAGCCCATCCTGCGTGAGCCGGAGGACCTGAAGGT
+GGCTGCCGAGACCATCAAAACCCTGGTGGATGCTGGCGCGCCCATACCGTTGCGCTACAT
+CCACGACCGCTTTCAGATCCCGGTGCCGCAAGCAGACGAGCCGGTTCTGGCCCCCTCCAG
+GGCGGGGGTGACCGGGCGGGGCGTCAGGCTGGCATCGGGGGATGCCCGCGGGGCGCGGGG
+ATTTATCAACGGGCAGCTGTACGTGGACGGGCTGGACGAGGTGGCCCGGGCCGAGGCGGC
+GCCGATTCTGAATGACCTCATCGAGCGCATCGCAGCTATGGCAAACCGGCACCACAGCTA
+TTCGGATTTGCGGGAGGCGCTGGTACGGGAGTACCCCAGCCTGGCCAAGCCGGTGCTGGC
+CGAGCTGATCGAGGGCAGCCTGGTGCTGGCCGAGCTGGCCGGGCGCGCTGCAGTAGACGA
+GGACATCTGATATGGCCTGGAATGTTGATGCTGATCCGCTCCAGCCAGCCGAGGCCACCG
+ACTGGTTCCGGCGCAAGCTCAATCTACGCAAGGACGAATACAGACAACTGACCGACCGCG
+CCCGACGGCGAGCCTTCACGGTGGCTGGCGTGGCCTCCCTGGACCTTCTGGCCGAGGTAC
+ACCGCAGCCTGCTGGAAGCCCTTGTGCAGGGAACCCCCTACCAGGCCTGGGCCCAGAACC
+TGGGGCCGACGCTGGCGGCAGCCTGGGGGACGACCAACGGCTACCGGCTCAAACTGGTCT
+TCCAGCAGAACATCCTCTCGGCCTATGCGGCCGGTCGTTACGCCCAGCTCACCGACCCGG
+AGGTGCTGCGGGCCCGGCCATACTGGATGTTCGACGCGGTGCTGGATAGTGCGACCACCG
+AGACCTGCCGGCAGCTCAACGGGGTCGTCCTGCCCCACGATCACCCGCTCTGGGCAAAAA
+ACTACCCCCCGCGCCACTTCGCTTGCAGGAGCGGGATACGCAGTCTAACCGTCCGGGAAG
+CCCAGGAAAGGGGGATAACGGAGAACCCGCCGGAGGTCCAGGCCGAGGCAGGATTTGGAT
+TGCGTTCCGACCCGTCGGAGTGGGGGCGCGACTGGGCCCGGGGGGTGGCCACCAGCGCCA
+GCAGCGCACGCTGGCAACCGGCGTTTGCCGGCACACCGCCAGACTGGCGCACATACGGCC
+GGCCCGAGGCCATTCCACGGGATCGGTTGCCCCCAGACCTCCTGGTACCCTCCATCAGCG
+AGGTGGGTGAAGCCGGCTTCCGCCGTGCGCTGGCGCGGGCCTGGGGCGGCCTGGAGGTGG
+TGGTGGCCGATCCCACCGGGGCGGGAACCATTCTCAACGCCCGGGTGCTGCTGGAGCACC
+TTAGCCGCGAACCGCCGGATGACCGGGAGCGCTACTACGGCCTCTTGCCGGATGTGGTGG
+CAAACCCCTACGAGATCTGGTTGGTACCGCTACAGTCGGATCGTGGGGCGGTAGCCTTTC
+GCAAGTATTACCTCAAGCTCTATGGAGACAAAGAGCGGGCCTTCCTTCTGGTGGTGGAGC
+AGCAGCGGGGAAGCACCTGGACCGCGTATACCCACATCTACAGCAGCAAGAAACGGTATA
+TCGCCGACCGGCGGATTGGTTTTCTGCTGTGGGGGAGGGATTGACACTCCCACGGCTAAA
+GCACGTGGGATTCTTGGTTCGACGAGGACTGCCTACGTTGTGTAGGTCTTACACCCTCTC
+CCCAAGCGTTTAGCGTCTCCGGGTGCCCCACGGCGACGGGGATAGCTCGTATCCCTTCGG
+CCCGGATGTTCAGGGCCGCGTTCAGGTCTCGGTCGTGCACCGCCCCGCACTCACAGGTCC
+AAACCCTGTCCGAGAGGGTGAGGGCGGTGTGGATTGTCCCGCACTCCCGACAAAGCTTGC
+TGCTGGGGAAGTATCGGTCAATCACGACGAGATGTTTGCGATACCAGACCGCCTTGTACT
+CCAACTGCCGCCGAAACTCACCCGGGGCCGCATCTAGAACCGACTTGGACAGCTTGGTTT
+TCGCCATCCCTTTCAGGTTCAGGTCCTCGATGCACAGCCCGTCGTACTTCTGGACGAGTC
+CGGTGGTCAGCTTGTGCAGCCAGTCCTGCCGCTGGTTGCGAACCTTGGCGTGGACCCTGT
+TCAGCCGATGCCTGGCCTTTTCCCGGTTCTTGCTACCCTTCTGCTTGCGGGAAAGCTCCC
+TTTGCGCCCTGCGAAGCTTGCGCTCTGCTTTGCGGTAGAACTTGGGTGGAGCTATTCTTG
+TACCGTCGGAAAGCACTGCGAAGTCTTTCAAGCCGAGGTCAATCCCCACCACATGCTCAG
+GGTTTACGGGGGGCAGGGGTACGTCGGGCATCTCGAACTCGGCGGTCAGGGTGACGTGCC
+AGTGCCCTTCGGTGTCGCGTTTGAATGTTGCGCCTTTGATGACGCAATCAATCGGCTGGC
+TCTGGCGAATCTTCACCCCACCGACCTTGGGGAGGTAAACCTTGCCTTCCTCCACCCGGA
+CGCGCTGGGGAATGCGGAAGCGGGGCGGGTCCTTCTTTCGGGTCTTGAACCGGGGGAACC
+CGGCCCGTCGCTCGAAAAACGCCTTGAACGCCCGGTCGAGGTCTTGGAGGGCTTGTTGCA
+AGAGTTGGCTATCCGCTTCTCTGAGCCAGGCCATCTCAGGCCGCTTCTTCAGGGCGGTGA
+GTTCGGTGGCCTGCCCGTTGTAGGTCAACCCCTTCCCGGTGGCGGCATACGCCTCCTTGC
+GCCGTGCAAGGCCCCAGTTCCACACGAACCGCCGAGCTCCGGCCATACGCAGCAAAGCCT
+CAGCTTGGGCTTGGGTGGGTTCCATGCGGAAGCGGTAGACCTTGCGGAGCAGCATTCAGT
+CCCTCGTCTTCTGGGCGGCGATGTATTGCTCGATGGTTTTGCTACTGACCATGCCAGCCG
+TGGAAACGAAATAGCTCCGTGTCCACAGGGCGGGAAGGCGGATGAGTTGGGGAAACTCCC
+GGCGCAACACGTGCGAGGTGTAGCCCTTCAGGCGGTGGGCGACCTGGTTAGGGGCCACGT
+CGGGGTCTACCGAAATGAACAGGTGTACGTGGTCGGGCATGATTTCCAGGGCGATGATTT
+CCCAGCCTAGTTTAGCGGTCTTCTCCCTAAGCAGAATATCCAAGCGCTCGGCCAACGGTC
+CTACCAGAATCTTGCGGCGGCGCTTGGGCACGAAAACGAAGTGGTAACGCAGCAGCGAGA
+CGGAGGTGTTCTTGTGTTTGTAGGCCGTAGGCACTATCACAGTATAGCACACCTGCCGCC
+CACCATGCGATGTGCCCCTGCGGGGCACATGGGGGAGTCCATGTATCCCATCCCTGAAGG
+GAAGGGTTTTATAGCTCCCCCACACCCCCTCGCTTCTATAAGCCGCTTGCGACCCCCAGC
+CTAGGGGGAAGTCGAGGAGGCCACTTGGAAGCCCGTAAAAACGATCGTAGAGGCAAGAAG
+GAAAATCTATCACAAAAAGAGGAGGTGGGACGTGCACAAGGTGGCACAGATCGCGCTGCT
+GGCGGTGCGGCGGGAACTCCCAGGATTCATAAGCAGCCCGGGCTGGTGCGTGGCGTTCGC
+CTTTGAGTGCATCGCCCGGGCATATGACACCAACCGCTGGCTGCTCTACAGCCGGATGCT
+CGATTCCGTGCAGGCCGACCCCGACCGCAGCCGCTGGGCCCACGACGTGGAGCTGGCCAT
+CGACCGCCTGGACTGGGATGTCACCAAAGCAGACCGGGACCCGGCCGGGGATGACCGCAA
+AGGCCTCTTGCGAATAATCAAGCCCGGTGACTTACTATTCAGTAGCCAGCTCCACGATGA
+GCCACCGAAATCCCGGCGCACCGCCACCGATCGGGAGGGCCACCTCGCCATCTTCGTCGG
+TGAGGTGGAGGGTATACCCAGCGTGGCGGAGAACACCCGCGCGGATCGGGGCAGATGGTT
+TGGGCGGAGGTCAGCCCTGCGCCTGACCCCACTGGCCCACTGGGATACCGTGACCACGGT
+GGGGCGGATCCCCAGCGGGTGGCGGCCGTGAGCGTCTCGGGCTCGTTTGGTGATCTCGAT
+GGCCTGATCCGCCGGCTGGGCCGAATGGCCCAGCCAGCCTTCGCTGCGGGCCTGGCCAAG
+AGCCTGGGGCAGGCCGCCCTGAACCAAATTGACGAATCTTTTGCGGGGCAGCGCGACCCC
+TGGGATCGGCCCTGGAAACCCTCCATCCGGGCCGAGACCACCGGTGGCCAGACCCTGCGC
+CAGAGCGCCCGGCTGCAGCGCAGCATGACCTCGCAGACCGCCCTGACCACCGGCCCTGCC
+GGATTCGAGGTGGGCACCAACGTCCAGTACGCTGCGGCCCACCAGTACGGAGCCACCATC
+AGACCCCGGAAGGCCAAGGCGCTCAGGTTCAAGCTGGGAAAGCGCTTCGTGCAAACCAAC
+CGGGTGGAGGTTCCTCCCCGGCCCTTCATTCCGGAGCCTGTGCTATCCCCCCGCTGGGAA
+CGGGCGCTCGAGGCGGCGGCGGGGGCGTACCTCGACCGAGGGTTGGCCTGATTCGAGCGA
+TCCAGGAAGGGGGTAAACCACCCCACGTCCCGCCACGCTGTGGCGGGACGTGGGGTGAGG
+AGGTGAGGCAATTGACCGAGACCTTGTTGGAGCGCCTTCGGGCTGAGCTGCCCCGCAGGG
+TAAAGCTTGAGCTGGGCCCCGATGCGCTCAATCAACACGAGGGGCCGCTCAAACTGGTGC
+TGGTGCCAGGGCAGGACACGTTTACACCACCGGATACCCGGGCCATCGCCCCTGAGGCGC
+TGGCCAGGGAGACCCTCCCGCAGCCCCGACCCCGGCCGCCCTACACCAGGCTGGCAGGCT
+ATACCCTGCACATCTGGGCGAAGAGCTACCAGGCTGTGGAGGACATCCTCTCCGAGTGCG
+TGGCGGCCTTGCGGCGCATCTGCGGTAGCAGCCTCGAGCTGCTCCCGAGCGGCTGGGACG
+AGGACGAGACCGGCCAGGCGGCGGCGCTACCAGCGGACAAGCGCCGCTATCAGCTGCGGT
+TCAGGGTACTGGTGGAGGTAGGGGCGGCAGAACCGGGCCTGTACGTCCGCCTCGAGCGGG
+CCCTGCTCGACCAGGCGGAAATTCTTCCCTGAGAGGAGCGTTATGGCAAAAGCAACCGAT
+AACAACAACGGCGGGCAAGCTGCACCTGCCCGAAAGACCGTCGAGGAGCTGGCTGCGGAG
+GCCGGTACCCCGGACTGGCTGCTGGCCGCGGCACGGGCCAAACACCGCTGGGTGATCGGG
+CAGGAACTGACCAAAGCGGCCTTCGAGCGGGGCATCCAGGAGGCGGCCAACGAACCCATA
+GGAGGTGAGGTATGACCGGCCTGCCGCGCGTGGAGGTGAGCCCCCAGGACTTCGGCATCG
+GCGCGGTGCCGGGCAACGGTGAGGGGGTGCACGTCAAAATTGGCATCGCCTCCATCCTGC
+CAGCAGGCGAGATCATAACCGTAACCAGCCCGCAGGGGGCCCGGGAGCGGGTCGGCGGCA
+AGCTAGGCGAGGCCGCCGCCCTGGCCTTTGGCGAGGGAACCCGGGCGGTGATCTGCCTGG
+CCGCCAACCCCAGCGTGCCCGGGACAGCGGGCGCTGTGACGCACACCGGCAGCGGCACGG
+CGGTACTGTCTCTGACCGGAACCCCCCGGGATGACTACCGCCTGCGCCTCAGAATCACCC
+GCGCGGCCCCGAACCTGGCTGCGGCCACGGCGGCGTTTCAATACTCGCTGGACAACGGTA
+ACACCTTCAGCGCCGAAATCGCCGTGCCGACCACCGGCCTGTACACCCTGCCCGATACCG
+GCCTGACCCTCAACTGGGCCGACGGCTCCTTTGTGGTCGGTGATGTGTACACCGCGGACT
+GCGTTGCGCCGAGCTACACCACCACCGATCTGGTCACCGCGCTCAACATTTTGTTTGCCC
+GCACCGAGCTATCCTACCGCTTCATTCACGTGGTGGGGGCGGGCAGCCCGACCACCGCTG
+CTACGCTGAACACCCTGCTGGAGGCCCGCGCCGCCGACCCGAACAACCCCCGCTTCATCC
+ACGCCCTGATGGACACGGCGGACCAGGCCGACGCTGCCCTGATCGCCGCGTATGCCGGCA
+CCACCAGCGTGCGAGTGGGTGCAGGAGCCCGCTATGCCGATGTGGTGAGCCCGATCACCG
+GCCTGGTGATGAAGCGGCCGGCCGCATGGGTGGTCGCTGGGCGGTACAGCGGCCGCCCGG
+TCGAGGAACACCCCGGCCGCTACGCCAGCGGAGCGCTGCGCACGGTTGTGAAACTCCACG
+GCGATGAGTCCATCACCCCCGGGCTGGACGCCGCCCGGTTCACCACGCTGCGCACCATCA
+GCGGGGGATTTTACATCACCCGGGGCCGCCTGTTTGCCCCGCCCGGTTCGGACTATGAAC
+AGGTGCAGAACCGCGAGGTGATGGATGTGGCCTGTGAGGTTGCCTACCGGGCCTGGCTGC
+GCTGGCTAAATGAGCAGATCCAGGTCTCCGCGCAGACCGGGCGCATCCTGGAGCGGGAGG
+CCCTGCGGATTGAGGCCTATGTGGAGGGGTTGGTGCGCACCGCGCTGCGGGGCAAAATTT
+CCATTGACGAGGTCATCGACCAGCCCGCTGCCTACGTCCGCATTGACCGCACCGAGAATA
+TCCTGTCCACCAGGACCATCCCCTACGACATCAGTCTGGTGCCACTGGGCTATGCTGAGC
+GGATCACCGGCAAGGTGCGCTTCTTCAACCCACAGCTCCAGCCAGTGGCCTAGGAGGTAG
+ACCATGAGCGTGACCGTGCGAAATGGCAAGGTGTACGACAACTCGAGCATCCAGCTTGAC
+CTGGATGGCGAACGGATTCCGGTCAACGTCGAGTTGGAGTACAACACCGGCGAGGTGTCG
+GAAGAGTATATCTACGCCGGGGGCAAGCCGGTGGGGCGCACCCCCGGACAAATGGCCCCC
+GCCGATGTGACCATCCGGATGCCGCTGGACCAGTGGCAGCAGTTTCGCAGCAAACTGGGG
+GCTAAATACAAGCGCAAGGAGTTCAATGCCGTTGTGACGTTTGTGGACGCCGACGATAAC
+GTGGTCAGTGACAAGCTGAATAGGTTGCGCATCCTCAACGACGCGCTCTCGGCCTCGCCA
+GGCGCCGAGGCGCTTATGCAGGAGCTAACCTGTAAGGCGCTGGATGTGGTGCCTGGCGAT
+CAAGCCACTTTCTGATTTCTGAACCTGCTAGCCCCACCCCGAACGGGGTGGGGCTAGCTC
+TTGAGGCATCAACATGGGAAAAACCATTCTTAGTGAAGACCTCGAGGGCCAGCTGCCCCC
+CACCACCCTGACCGCCCTCCGCGCCACACATGGCGACCGCTTGTTCGCCCTGGTTCGCCA
+GGGGCGGGTGCTGGTGTTCCGCCCGCTCACCAAGGCCGAGTACCGCATGATGCGGGCGGA
+TCTAGACAAGGCGTCTGCCAGCCCGAAGCTGGCACTGGACACCTACGCCATCGGCGAGAA
+GTACGCCAAGCTGGCCCTGTGCTACCCCGACCGGTCCGAGTTCGAGGCCATCCTGGACGA
+CTACCCAGGCCTGGCCGATGTGGTCAGCCAGGACTTAGCGGCAATTGCCCAGATGGCCGA
+AACGGAGTTTCTTCAACAAATCGATTGAACTGCTAAACGACGCCCTGCGGCACCGCGAAC
+AACCCTTGGTAGCGGCCCGACTCCTGCTGGCCTACCGCCGAGGTGAGGATTCCCCCGAGG
+CGCTGGCCGGTGCGGCGTTGGAGGCCGCGGTGCTGCTGGGCCATTTTGGGAGGATCCAAT
+GAGGCGGCTGACATGGTTTTTTGGGTTACGCAGCAATTTTGTAACCCAGTCGCGCGCCAT
+GTCTAGAGGGCTGACGGGGGTTCGGGCAGCCCTCCAAGAAGTGGGCGGTGCGGCCCCGGC
+GACCGCCCGAGCGGTCGCCCAGAGCCTGAGGCTGCCCATCGGCGCGGCGCGTCACCTGGT
+GGGGGCGCTGACCGCTGCGGGGGCTGCGAGCGCGCACCTGGGACGGATCAGTAGCGCGGC
+AGCCAGGGCCCATCAATCCCTGCAGGGCCTGGTCGGCCGGCTGACCAGCCTGCCTGGCCT
+ACTGGCCGCTGGGGCGGTTGGCATGGCCACCAAAAGCATATTTGACGCCATCGGCTTCAA
+AGAACAGCAGTTGATCAGCCTGCGGGTGATGCTACGGCCGCAGGTGGGGCTTGACGCCGG
+TCGGATGGCCCAGCAAACCTACGCCATGCTCGCCCGCTTCGCCGCCGAGACGCCCTTCGA
+GACCCAGGAGGTGATCGCCGGCGGCAAACAGCTGCTAGCCGCGGGTGTGGCGGTGAAAAA
+CCTCCAGGGGCTATTGAAGGATGCCGGCGACCTGGCGGCAGGGATGGGAGTGCGCCTCGA
+GGAGGCCATCGCCCCCATCACCCGGCTGCGTGCCGGCAATTTCGGCGAGGCCTTTGAGCG
+GCTTCGCGACTTCGGTATCAGCCGGGAGGCCCTGGAGGCCAGGGGCCTGAAGTTCGATAA
+AAGCGGCAGCTATGTGGGCTCGGTCAACAAGGCCATGCTGGCGGTGCGCCAGGCCATCAA
+GGAGCGCTTTGGCGGCCTGATGGCCGAGCAGAGCCAGAGCATCTTCGGCCTGATCTCGAC
+CCTGAAGAGCCGACCCTTTGAGCTATTCAGCCAGATGAGCGTGGACCCCCAGGGACCCCT
+CAAGCCCTTCAAGCAAGTGCTGGCCAACCTGGCGGTCCTCACCGACTTCAGCCGGGGGCC
+GGGGGCGGCCCTCTCCAAGCGCTTCCAGGCCAGCCTGGCCGGACTGATAAAAGCGGCCTT
+CGGCCCGCTGGCGGCTGCCAGCGAGCCCAAACAAGCCGGGCAGGCGATCCTGGCGTTCCT
+CGACCGGAGCACCGCGCTGGTTCGGCGGGCCCGGCAGATCTTCCCGACGGCCCTGGGCTA
+TGCCCGGCAGTTCTGGACCGGGATCCAGGCGGGCTTGGCGATTCTGCAAGGGGTCTGGCG
+CACCCTCGAGCCCGCCGCCAGCCTGCTGGGCCGGCTGGCCCAGGGGCTTAGCGCCAGCCA
+GGCGGGCATGGGCGCTGCCAGCGGTAGCGGCCTGGCCCTGGCCGGCACCCTGGTGCTGCT
+GGCGACCGGCCTAAGGCTGCTCAATGCCCTTACCTTCGGACTGGTCGGAACCGTGGCGCG
+GCTGGGACTGGTCTGGCTGGCCACCGGCCTCAAAATGTCTGCAGGCTGGCTGGTTGCCCT
+GGGGCCGGTGGGCCTCCTGATCGGCCTGATCGGCGGGGTGGTTGCGGCGGTGGGGCTGGC
+CTACCAACGGCTGGACTGGTTCCGCAACGGTGTCAACGGTGTCTGGAAAGCGGTCGTGGC
+TGGCGGCAGCGCATTCATCGCCTGGATCAGAGCGCTGCCCCAGACCATCGGCGAGACCCT
+GGCTGGCCTACCGGCGCTGATGCACGAGACCGGCGCCCGGGCAGTACAGGGGCTCTGGAA
+CGGGCTGAGAGCCGCCCCTGGCAGAGTCTGGGAGGCGGCCAAAAACCTGGCTCGGCAGGC
+GGTGGGTGGAAGCCGTGAAGCGTTGCAGGTGCGCAGCCCATCCCGGGTGTTTGCCTCGCT
+GGGCGAGCAGAGCGGGCTGGGTTTGCGGCAGGGCCTGTTGGCCATGCGCGGCGCGGTGGC
+GGGCGCTGGACTGGCCCTGGCCGCAGCAGCCATCCCGGCCACGCTGCAGATCCCGGCCCC
+GGCCGCAGCCCTGGGGGCGGCGAGCCCCCACCGCGAGGTGCATATCCACATTGGCCAGAT
+CGTGCTCGGTCAGGCGCAGACCCCCAGCGAGGCCAAAACCCTGGTGGTAGAGGCCATCCT
+GGAGGCGTTGGAACGGGCCCAGATGGAGGAGGGGGCCTGATGGAACGTGACCAGATCGTA
+TTCGTGGGCACCAGTGGGCAGCGCTTTGCCATCAAGCCCCAGCCCAAGGGGCCGAACGAA
+ATCCAGGGGGTTGTGGCGGTATCGGTGCGCCGGGCTCTGAAGGAGCAGAGCGCCGAGATT
+CCCCAGAGGGGCATTGAGTACACCTACCTCGGCTACGACTACGCGGAGGTCACGGTGGAG
+GTGCGGGTCTGGCGGGAAAGTGAATATGACAAACTACAGCGTCTGATCCAGTTATTCCGC
+CCCAAAGGAAAGGACCAACGGGCCCCCGAGGTTTATCAACCGGTTCACCCAATCCTGCGC
+CGGCACGGCATCACCCACCTCTACATGTTTGCTGTGGAGGAGCCGCCCTACGACCCGGTA
+AAAGGCTGGATGGCCACGCTGAGCCTGCGGGAGTGGAAGCCGGCGTACAAGCGGGTGCAG
+ACCAATGGCACGCGCATCGGAGGCGGCAGTGCCAGCAGCGCGGATACCGGAGGCGCCGAC
+GCCGACCGCGACGGCGTGCTTACCTCCCAGCAGCGTGCCCAGGCCAGCCCGCCCAGCAGC
+AGGGGGGTGCGGCCGTGAGCTTTGCCACAGTCGACGAGCTTCCGATTAGCAGCGGTACGC
+TCACCGTGCCCCGGATAGGTCGCCCCATCGCGGAGCTCCAGCTGGCCGCGAACCGCCTGC
+TGCTGGCGGGTGAATCCGTGCAGATGCGGTTCGCCGATGGCACCACCTACCGGATGGTGG
+TACGCCGCAGTGGCGTGCGCGGGGGCCTGGTGGAGGCGCTGCTGGTGGGCGGCGCGGATC
+GGCTGAACGCCTGGCTGCCCAGCCGCGATTACCAGGGCGTGCCGGCCGCACTGGTGGTGC
+AGGATCTGCTGCGGGAGGCCGGTGAGGCCGCTGGCCTCCTCGAGCTACCCACCGTGTTCA
+CCCGCTGGGTGCGCCGCGCCGGCCCCGCTCATGAGGCGCTACTCCATGTCATGGCCCGGC
+TACCCGACCGGGCCTGGCGCATCCGGGCCGACGGCCGGGTCTGGGCTGGGCTCGAAGCCT
+GGCCGGCTGGACCGGAAGGGGTGGTGGTTGAGGCTGCTCCGGCCCGGGGCTGGTACGACC
+TGCTGCCGCTGCCCAGCCTGGAGCCCGGGGTGCTGCTGACGGCCCAGCTAAACGGTGAAC
+AGCGGCTGCTGGGGAGGGTTGAGCGCGTCGTTCACCAGATTGGCCCCCGGCTGCGCACGG
+CCGTGTACACAGGAGGGTGACGTGCAGGAGCGACTCAAAAAAGCCATTCAGGGCCTGGCC
+CGGCCACCGCACCTGGACTTTCTAGCCCTGTACCCAGCCACGGTGCTTAAGGACCATGAG
+GACATGCACCTGGACTTGCAGGCCGACGACGAGCGCCTGGGTACCCTGACCCGGGTGCCC
+ATCTGGTTGGGCCTGCCGGGGGTTACGGTGCGGGTGGCGGCAGGGGCCCGGGTTCTGCTC
+GGATTCCATCAGGGCGATCCGGAGCGGCGCTACTGTGACCTCTGGGGGGGTGGGGGGCTG
+CGTGAAATCATCCTCACGGCCAGCGTGAAGGTGGTGGTGGACGCCCCCCTTGTCGAGCTG
+GGCGGGAGCGCGGGGGCCAGCGTGCTGCTACAGGGGCAGCCGCTCACGTTCGTGTTCAAT
+ACCACGCCGGTCGCAATGGTGCCGACCGTTGGCACCGTGCAGGCCGGGGGATCCACACGG
+GTAAAAGGGGTGCAGTAGTGGACGACTTTGGTACCGACCTGTCGGTTTTCCCGGACCTTT
+CCTGGACGCTCAAAAGCGGCTACGACAATCTGGCCGAAGCCGCCGTGCGCTGCCTTATGA
+CCGCCCCCGGAGCGCTCTTTTATGCCCCCGAGTACCGCCTGGATCTCAGGCGGTTCCTCA
+ATGAGGCCATCACGCCGGAGGCGCTGCTCGAGGTGGAGACGCTGGCGACGAACGCGCTCG
+AGGCCGATCCCCGTATTGTGTCGGCCGAGGTGCGGGCCAGCTGCCCCGGCCCGGGGGTGC
+TGAACCTCGAGCTGCTGCTAACGACCGAACGCGGCCCGTTTGCACTGGTGCTGCGCATTG
+ATCAGGTGACCGTGGAGGTGTTGCGTGCCTAACCTCAGCCAGCTGTTGCAGCCACGGAGC
+CGTGACGCAGTCCTGGCCGACCTGATCAGCATTTTGCAGACCAGGGGCTACCCTCCCACC
+GACTGGGTTGAGGGCAGTGTGCAGCGCACCCTGATCGAACTGGTTGCGGCAGGCTTGGCC
+GACCTGGAGGCTTTGCGATTGGAGATTGCCAAGGGCGGGTTTCTGGATCTAGCCAGCGGG
+GACTACCTCGACCTACTGGCCCGGAGCGCCTACGCCCTCGAGCGCAAGCAGGCCACCTTT
+GCCCGCCAGACCTTCCGCCTCACCGCCGCGCCAGGCTTTGGGCCCTACAGCATCCAGCCA
+GCCCAGCTTTGGGCGGGAAATGCCGCCGGCCTGCGCTTCAATAACACAGCCGGTGGTACG
+CTCCCGCTGGGGGGCACCCTCGACCTGGAGTTCAAGGCCGAGAGCCCGGGGGCGGCCTAC
+AACCTGCCACTGAACACCGGCACGCTGCTGTTCACGCCCTTACCGGGGGTCACGGTCAGC
+AACATCGGCGTTGTGGAAGCGGCCATCGATCGGGAAACCGACGCGGCCTTCCGGACCCGC
+TGCCGGCTGCGCTGGGCCGAGATCGGCCTAGGGGCAACCCGGGCCGCCTACGAAAGCTGG
+GCGCTGGCCAGCACCCCCAGCATTACCAAGGTGCGCATTCTAGATAACAACCCCCGCGGA
+CAGGGAACGGTGGATGTGGTGGTCTGGGGGGAAGGGGGCCTTGGGGCGGGCGCGGTGGCG
+CAAGTCAACAGCTATATCCAGCAACGCAAACCCCTGACCAGCAACGTCGAGGTGTATGCC
+GCCACCCAGGTCAGTATCGGGGTGACGGCCACCATTCGTCTGCGAGCCGGATTCCTGGCG
+GCCGTGCAGGCTGCGGTTGCCAGCCGCCTGGCGGACTTCCAGCGCGGCCTGGCGATCGGG
+GCCACGGTGTACCGGTCGGCGCTGATTGAAGCTTTGTTTGTTCCAAACGTCGTCGATGTG
+GCCCTGTCGGCTCCGGCTGCGGATACCAGCCTGGGTCCCACGCAGGTGGCCACCTTTACC
+CTGACCCCGACCTGGCTGGAGGTGTAGATGGCAGGAGAGGAGATTCCACTGGTGCCGGTC
+GCCCTGTACCAGGCCTGGCTGCCGGAGCTGGCCCCACCCTGGTTGCAGGGGCCTCGCGGG
+CATGCCCTACTGGCTGGCTGGGGCCAGGCGCTCGACCAGCACGCATCCCTGCTAACGACC
+GCGATACTGGCCCGCTTTGTCCAGCAGGCCCCCGAGGATGCCCTCAACCTGCTGGGGGCC
+GAACGCGGCCTGGGGCGGTATCCGGAAGAGGCCCTGGGCACCTGGCGGGATCGGGTGCTG
+GGGGCTTGGGAATTCTGGCGCTGGTCGGGGACTGAGTTCGGGATGCGCACCGCGCTCGCC
+CAGCTGGGCTACGACGCGGCGGTGGTGCCGGTGTGGACCTACGACGCGACCCGCTGGAGC
+GAATTCGACGTGTACATATACCCCATGACCCGTAGCTACGACGGCTCAACCGCAGAGCGA
+AACCGAATCCTGGGCGTGATCAACCAGGTCAAAGCGGCCCACACGCGGTTGGCAAAACTC
+ACCTATGTGAGCTTCGGTCCACTGACCTGGGATCCTCCAGGCCTCACCTGGGATGCCCCC
+GCAGTATGGGGCGATACCCCGGTGCAACTGTTTCCGTAGGAGGCGTATGCCAAAAACACT
+GAACCCGATTAGCGTCTTTCCGAGCAGCATTGTCAACTTCCCGCAGGCCGGAAACAACGA
+GCCGGTGGCCATCGGACCTTTAGAGGCGGCCATTCAGGCGGTGCTGAACCGCACCGAGCA
+CCTCCATCAGAGCCGCCTGGAGGTGGAAGGCCCCGGCGTCAAACGCCTCCGGCGGGTGGC
+CACCCTGGCGGCGCTGCAAAACCTGACCGGCATGGCCGATCTGGACGTGGTTGCTGTGGA
+CGGCTACGGCCTCTACCGCCTCTTCGACCCCAGCGCCCTCACCGCCGACGGGCTGTGGGT
+GTTGAGCGCGGCTGGCGGTGGCCGCTGGGTGCACAGCAGCTACCTGATGCGCGGCATCAA
+CAACGGCTGGGCCATGCTGGACAGCAGCGGTCGGCTGGCCCAGGACGTGCGCGATGGCTC
+CATCCTCACGCAACACATCGGCAACGGCCAAGTAACGGGGCCGAAGCTGGCCACGGGGGC
+CGCCGTTGCAAATCTCGGCTATACCCCGGTGAACAAAAATGGGGACACCATGACGGGGGC
+GCTGACGGTGACCGCCAACGTTGGCGAGGCGCTCAGCCTCAAGGGCGGGAGCAGCAACCA
+CGTATACCTCGGGTTTTACGCCCGCAGCGCTAACCAGAGCGAGCGTTCTGGTTTCATCGG
+GTACGGCAGCTTCGGGAGCAACAGCCTCGACATCGTCAATGAGATTGGTGGGCATGTGTA
+CATAGCTTCTGCTCAGATGGTTGTGAACAGCAACCTGAGTGTTTTTGGGCAGATCAACGG
+ACGTTACAACCACGCCGAGCGGTTTTCCGTGTGCGCTAACGCGGGCAGCGACATGGTCTT
+GTCCCCAAGCGTTAGTGGGATTATTGCCGAGCTCAACTTAACCTTACCGGCAGGCCGAAA
+GTTGTACTTGCGGCGGCTGCGCCATGCTGGCAACAACAACTTTCGCGCGCATATCTTCAC
+GACCGGGCCGGGCAGCAACCCCTACCTAGCCCCAAACACCTCGGAAGAGCTGAGTTTAGA
+TTATGAACTGAAGAATGTAGCAGAAACGTTTACGCTTATGCTAGCGGTATTCAATGCATC
+TACTAGCAATCAAACAGTTAGCCGAACCTGGTCTGTCTGGGCCGAGCTGGAGATCCGTTA
+A
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_014364.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2212 @@
+>NC_014364.1|provirus_2121424_2157334
+TTAAGAACTTTTTCTATATCTTCCTTCATTTAGTTTTATGCTTAAAAGGTCATCATATTT
+ACAATAATAATGATTGAAGAAATCTTTATATGTAATAAGTATTTTATCAGGAATAAGTGA
+GAGATCATAATTTTCAATGTAACCGATAATTTCAGGGTCTTCTTCCTTTATCTCCCTATA
+GAGGGACCTCCAATTATCAGTCAACCCTTCTTTTTCAGCAATATCACGTAATAAAATATA
+TGAATCTGGCATATGTAAAATCTCAAAGAATTCTGAAATATTTTTTCCAAAAGCTCTTTC
+AAAAAATGATCGATTTCTTCCGACCTTTCCCTTTGTGGAATTCAAAATTAGCTGTATAGC
+ACGTATGTATTTTCTATTCCAGTTCTTTCCGATATATTTTCTAGTCTGATATAATTTTTG
+TTCATCATTGATTGGAGAATAACGCATTGGAAAAGAATATATAATTAAATCAAATTCTTC
+ACATAATTTAATATTTAATTCTAATCGATTCCATAAATCTTCTGGTTTATCTTCAAAATT
+ATATAAAAGATAATTAGATAGATTACGTATTTTATATTTTGCAGATAACCTAATTGCATT
+GATATAAATATCTCGTAATGACCAATGATCAAAAGCAATTCGTAAGGGTTGGATAGCAAT
+TTTCGAAAGTAGTCTCATATTTTCTTCATTACATAATCTTGAATCAATACCTTGATTAAA
+GTCAACTGTCCTTTTTTTATAAGTTATTTTCCTAATATCAAAATTCCTATCGAGTTCTTC
+AAAGCATTGAATTAAAGAGAAAGAATTCGGAACGAAATTGTCGGTTTTAAAATATTTATC
+TAAGATATCCGAAGCAATTTTTTTATTTGAAAGATTTAATTGCTTTACGAAGTTTAATAT
+TTCTTTCCAGAGAGCAACTGAATATTCAAAACTGTTAGTCCCTTTTTTAAGCAACAAATA
+AAAACTATATAGTTTAGTCTTCTGCTTTAATTTAGCACCACGAAAGAATCCTACTTCAAT
+AATATCATTTATGATATCTTTAAAAAAAGGTGATGCTAGAACATTATTATCTAATAAAAG
+AAGCTTTCGACGAATATAATACTTACTATCTATCTCTTTGACAGTTTTTTTTATATCAAT
+ATATGAGACATAATCCGGTTCAATGATTGGTACAGCACAGAATTTGCATTTTCGTATACA
+ACCTCTAGTGGCATAGGTTATATAAGAGTCCCATTCAGGATAAGTATAAGATATTTGATG
+AAGAATGGAATAATCTGGAGTAACAAGGTCTATATTGTCATTAGTTGTTAAACCAATTCT
+TTTAGAATCAGTTAACAAACCATTTACTACCTGTACACCAGTTATATTTTCTATTTCTTC
+TGATAAAACAGAAGCCATTACACCACCAACAAACATATTGCTACTGTTCTTAATGTAAGG
+CTTTAATTCCTTTATAGAAGAAATAGTTATATCCCAGTAGAAAGTGAATAAAGTTGTAAC
+ATAAATTCTATCCCATTTCAGATCATCTATAATTTTATTTTTGCGAGCATCACGAAAAGC
+CTTTCTTAACCAACTTTCAATAGTTGGAAAGAAAAAACCAACATTATTTTCAATTGCCTC
+TAAGTATATCGTTCTACCAGTCTTTAGATAATAAAAGACATTATCCAATATTGTTTCCGG
+AATAATATCATTCTCAATTTTGGTAAATCTATCTACTAAATAGACAGAAAGTTGTTTTAA
+ATAAACCTCTTTAATGTTACCTTTGACAAAGATAACTTCATCACCTAAAGTTTTATGATA
+AGAAGATAATTTCATTAACCCAAGTGGTGGGTATTTGTTTTTATATCTAGGTTCGTATAG
+AAGTATTCTTTTCATTTTAGCTTCATTTTTATTGCAAAGATTAAATTTTCAGCCACATCG
+CTTGTCATCGTCTCATTTATTATAGCAAAAACTTTTGATAAAAGTTTCTTTTCTTTTCTA
+TCTAATTTGCTTAGATCAGAGACAGCATATTTTTTCTTTTCGTGATTATCCTGGCTTTCA
+TTAGTGATAATAGTATTAGTGCTAATTCGTGGCGGATAAACTTTCTTAATGCCGTCTTTT
+ACAATTTTTGAGCTAATTCGTTCTATTCTATGGTCAAGGTCATTTCTTTTCTTTTCTAAT
+TCCTCATGTGTTTTAACAAGAGCATCATATGATGACTCTTCATGCTTTTTGTTTATAAAA
+CTATTTGTTTGTTTATTTTCATCGTATTTGCTCTTTTGTGCATTATAGTCTTCACTTGCA
+TTATTCAGAGAATTAATGTCAGAAGCAAGTTTGCATAAGCTATTTAGGTCTTTAATGTAT
+TTTCGAGTTTCTCGCATTAAAAATCGAAATTCTGGAGAATCTTCAAAGTAATTACGTTGT
+GCGTTAGGTATAATCGTATTCTCAAAAATATGTAACTCACCAATAAAATAATTAACAAAC
+CTTTCTTGAGGCTCAAATAGTTCTCTTAAAACATCGCTCCTTCCGATCTGAAAATTATTT
+TGCCTAAATTTAATACCTGGATAATTTAGTTTAGGAATTAGTTGTAGTTTTCTTGTCAAC
+GCATACCAGCAGAAAGCAATAATTTTTGAATCGTTATATATGACAAAATGATTAATATCA
+ACTATCTCATCATGTTTCTTTTTTTTGTTTGAAGCTATTTTATATATGTCAGTACCATAA
+TTTTTTTTGACTTCTTTCTTATTTACTATAATATAATATTCTTTTAATTTTAGATTATAG
+TTATCAAGGAAATTTCGTATTTTAGTTTTAAATACAAATTTTGAATCAAATTCAACTGGA
+CAAACTTGAGAAATATATTCAATAACTTTTTGCTCTTCCAATAATTCCTGATTATTAACA
+TCACTCAAAATAACTTCGAAATAGTGTTTGTCCGTATCTTCTTTTTCTGTAAAAGACTCG
+GTAGTGTTATTTATAAGATCTATGGCCTCAATCATTTTATCAGCGCGTAAAGAATCACGT
+ATCTTTTGAGCATCCCATCGCAAAATGGAAGCAGTATTTTCTCCATAATATGAGCTTTTC
+ATAGTCAGGGTAGAACAATAGGCTATGCCGGCGAGTCTTCCTATTCCACGAAATCCAATA
+TTTGAATCAATCTTTTTAGTTGATGCAGCAATACTAGTCAGGGTCGAATAAAAAAGACTA
+CTTTTTAAACCAATTCCTGTATCATAAATTGAAATAGCTTTTTCTTGTTTTTTTATTTCT
+ATATATATAGGATTGTTGATGTAATTGTCAAATATTCCTTTTATTTTACAAGCCTCAATT
+GCATCAACCGAATTTTGAATGTATTCTCTATAGATTATTATTGGATCTTGATACATACCT
+ATCGTTAATACATCTAATAAATGCTTTCCTATTTTTATCTCGTCTTTATCCATTCTTTTG
+GTCCTCTATTTATCAAATTGGTAGAAAAGTGGTTTGGGGAATTTAATCATCAAAGGAGAA
+GGAAAAATCGGATTTGTAATAATGTACTCGCCTTGAACCAATCTTGTCATAATATTCTTA
+TATGTGGAATTGATAAAACTATAGTCTTTATTACTTATTTCAATACTATTTGTTCTACCA
+TAACAATTAGTTGAACAGTTTCCTTTTACACCAGCATTTATTGAACTTCGAAATTGCTCA
+GCACCGAATAATACTAAACCTAACGATCTTCCCCTCTCTGTAATATCAAGAATATAACGA
+AGCAAAGGAGAGTTTTTTGGTACATTACTTCCTGCATGCTTATTAAGTTCATCTACAAAG
+ATTATGATACGGTCAGGAAAATCTTCTTTTAAATCTACCCCTTCAAGTTTTGCTTCATAG
+ATGTTTTTCAGAACATCACCAAAAACAAAAGATTGCAAAGTTTCATCTAATTTTGCAATA
+TCAATTACATAAACATTATTTTTCTTTAATTCTCGTAAGGAATCACATAGATGAACCTCA
+TTTTTTTCTTTAATTGCTCTATCAGAGAATAAAGGATTTTTTAATGGCTTTGATATTAGT
+CTTTTGTATTTTTTCCAACTACTAACCGCAATTTCCTTGTTACTTCTATTCTGCTGGCTC
+GAGACACAAAAATCACTAATTCGATCACGAAAATTGTCCCATGTGGAAATATTTGAGAAT
+GGTCCATTATCATCAAGAATTAATTCATTAATTGATTCCATAGTCCTTGTTTGATCATCA
+AAATTCGCAAACAACAATTCTAAACTTTCTTTATCATCCTGAACTGTATATTTAAACGAA
+TTATAAATCCCCTCATTCTTTTGATCGTTTATCAATTCATCAGTTGCATATGTATTTCTT
+ATAATTGCGTTTGAATGGGGATAGAAATACTGAACATTTGAGAACGGTGTAGCATTGATA
+GAAAGATCAGAATATAGATTTTTGTCAAAAATATCTAATGTTTTGTTTTCTCTATCAATA
+CACAAGAGATCCTTTCCTTTTACATTAAAAACAATAAATGCTATTGATTCATTGTCGGTA
+TTAGTTCCTGATATATATTGGTCTTGCAATGACTTTAGTAGAAACATGCAATAGCTGGTT
+TTGGCAGCAAGCCCAGAAATTCCAGATATATTCAAATGAGCCCCTTCTGGTCCTATTAAA
+AACCTTCGGTCTAATTTAACTGGAATGAATTTTTTTTCTTTATCCATTTTTTCATACATT
+TCGATGTAGCCACAAGAAATTGGATACTTTATGTCATTAAGTCCTAATGCAAAAATAATA
+TCATCTTCACTTGCTAAGAAAACTTTTGAACCGTCTAGAACAGGAAGATATATTCCTTTT
+GTATTTCTTAATACTTTGCACTTGACATAATTCATACTGAGTCGCTTGGTCAATAATTTA
+GCATCAGTATTGCCAAAATCATTACTGACAAACGCGCCTAAATAATTAGGAGTGTCAGTA
+ATATGAAAGACATCTTCTACTATACCATATGTAATACTGTCTTTCTGATTATCCACTCTT
+ACAACATCAAAGGCTTGGAGCATAATATTTGTGTTCGTCCAAAACACAAATTCATCATTA
+GTACATGGTTGTTTCTCAGTGGCTGTAATTTTCCCAATAGCAGTAGAAGTGTCCATTATA
+ATACCTCTATTAAAAAATATTCATAAAATAATCATCAGAAATGAAAGTATTTTTAAGGAG
+CCTTTCTGTAAGATGGACTGGATATAAATGATTGGGCCATCGGTCCTCAATACCATATGT
+AGTAGGTAATCTTTCATTGATTATATTTGCTGAGATCATATCTATTTCTTCTGAATCCAT
+TAAATAATTCTCACCATCTTCTGGTACAACCTTCTCGATTTTTACAATACCGTCAAATGG
+ATTATGGTTATAAGTCTTTTCACGGATTCTAATATACCAAGTGATAAAGAAAACAGGCCC
+TTTAGCCCCTTTGGACCTTTTACTTTCGTATTTATATGAAGGCGTTCTATGATATAGTGG
+GAGGTCCGCAATTAAAGATGCTTGTGTTTTTTTCCTGTTATCTTTTAAGAAATCGGGATT
+AAATGTTTTTGATACACCAATAACTCTTTTGTAATTATTTAATAGCAATGAGAAATCATT
+AAAGTCTCCATTTTTCGAATCGATATATTCTATTGAGCCATCTTTTATTAAGTAATTATC
+AACATAACGAAGTCCATCATCATTTACTAATATGTTAATCATTCTTTTTTCTTCATCAAG
+CATAAATTCATGTATTTTTGATATCCCTAAATTCTCGTATGGAATATCTTTTTGCAGATG
+CAAATCTTGATTATAAAGGAGTACTTTATTGATAACGATATTTTGTTTTTTTAGCGTTGA
+AGAATTATTTATTTGAGTTCTTAGATATTCTATCGCCGTTCTTTTATCTTTACAATCATC
+GATCAAAGACACAATTGCAATATTAGGTAGTGCAATTACATTGTATCTATTTAACCTTTT
+ACATTTTAAAATTCTTTTATTTCTTTCACAACAAGCAACACCAACTTGTCCAGCAATTAT
+TGGATAGATACTCTTTTCATATTCTATGCTTGTCAACTTGTAAGTCTTTCTAGAGCCATC
+AACAAAATATTTGAATAATGATTCACCATCCCGGAGAAATTCTTTTTTCATTCTTGATCT
+TAAATCAATGGGATTTGTATAATCAATTTCTTCACCTAAGTTTCTTGTTGAGAATGGAAT
+TTGCTCTTCTGATGAACTATGAAAAGCTATTGAATGTTCATCATTATAGCAGAATTTGTT
+TATATTATAGATTTTACCAATCGTCAGCTTTGCTATAATAGAAAGCGCTCTATCTATCAT
+TTTTAAAAGTCCTAATACTAATTTAGGGAGAATAATTTAAAACCATCCCTCCCAAAGTTC
+TTAATTTCTACACTACCGCTTACTATTTAAGTTCTAATAAGTTTTTACACTTACATTTGT
+TTATTTTAAGTGTCATAAGTATATAAATCAATATCTAATAGCTGCTAATCTGGAAAATAC
+AAGATTTTACATCTTTGGGACCCTACGCCTCCCTCTTAATACTCTGTATAGATCGATCTG
+CTAGGCTGGAAGTCAATGCCTTCACCGTTTCTAAGTCCTTCTCGTCCAACATTTCCAAGT
+CAGCCACGATATTTGCATATCGCTTTGGCGGCTGCCAGTTATCCGGATTTTTGCCGGTTA
+CCAGGTATTCTACGGTAGTATCCAACGATTGGGCAATTCTTACCCCATCATCAACACGCG
+GTAATCGTTTTCTTGCTATCCACCCTCGGAAAGTTTCAAAGCTAATATTCGAGTGATTAG
+AAACCCATTCTTGAGTAGTATTTTGCCGCTTTATTTCTTTTTTGACTATGTCCCAAAATC
+CCATACATCTATTATCGTCTAAAAATGTTGTCAAATGACGCATGTTTTTCTTGACAAAGT
+TGTTAAACGGCCATAATATGCAGTTATGAAAGTTGCTAAACGACAACAAGATAGTCGTTA
+CAAGGTGTCTATTCCATTCAGCGAAGATGAGAGAAACAGATTTGTTACCTTCCTCGAATC
+TACCGGCCGAAAGGCTGGACCCTATCTAAAAATAGAAATGATGAACCGTGTAAGGGAATG
+GGAAGCTATCCAGTCCGGCAAAACACAACTCAATACAAAGCCATTTGAGAAAGTAGGGGA
+GTAGTCATGGGCATAAAAGATGCCGCTGGCCAGTTAAAAAAGTCAGAGGCCGTGAGATGA
+ACATTGACGGCCGCCTTGAAGCGATGCTTGAGATTATCGAGCAGACACTATCCGAGATCA
+AAGAGAGAGAAGAGCACCTGGCTGGCGTATCCCATGAGATCGAACTTGCGACCAGAGATA
+TCGAAGAGTTACGAGGGATCACCGGCAGCTTAGCCGAGATTGTCGAATCAGGGAAACGGA
+TCGAGTGGATGACAACAACCGAAGTGGCTGACGAGCTTCATGTGAATAAACAGACCGTAA
+GAAGGTGGGCAGATACCGGGCTGCTTAGATGCTACCGGATCGTTAAAGAAGGGCATCGGC
+GCTTTGACCGCCGGGAGATATACGAGGACGTGAAGCGGATGGGAGATGAAGGTAACAAAC
+AATGAGATCAGAGCAGAAACAAGGAGAACAGAAATGGCGTTAAACGAAGACAATCAGCAG
+CTTATAACGCTCATTAACGAGCTTGATAGCAGTGGGTACCTAATCAGAAAGATTTCTGAG
+CGGCCTTCATTGTGTCCTGTAAGAGAATTCGAGCTTCTTATTGAAGAAAAGTCCAAGAAA
+GATGATCTCCGCGGTTTGAGTGCTGCCGCGATAGAAGGATAGCGTTCGTTTACGAGGGGT
+GAGTGAGGTTCGGTCTTTACTGGCCTGAACCTCAGATCAAGGATCTTTGAAAATCAATGA
+CTTGTGGATAGGACCTTATCTGCAAATCACGGGGTAGAGAAGGGAAAAAGAGCAGGTGAG
+GGCGTTGGTAGCACCCTCACTAATCCGCGTTCACACACAACGCAAATCACAGACAAAGCT
+GCTGCTCAATACATCATATCGGCAGCTTTATAGAGGAGATAAATCGTTGAATAGTCCTAT
+TTCGTACATCGGAGGAAAAAGCAAACTTGCGGATACTATCATCAACTTTATCCCGGAACA
+TCAAACCTATGTCGAGGTATTTGCCGGTGGTGCGTGGATATTCTTTAGAAAGAAGTATTC
+GAATGGGGAAGTGCTCAACGATAAAGATGGCGATCTGGTATCTCTCTATCGGGTGATTCA
+GAACCACCTCGAGGAGTTTTTACGGCAGTTCAAATGGATATTGACCAGCCGCGAAGTCTT
+CGATGACTTCAAGGGCCAGATGGAAAAAACCGGCCTTACAGATATCCAGAGGGCCGCACG
+GTACTACTACTTACAGCGTTTGTGCTTTGGGGGGAGGGTACTAAACCGAGCTTTTGGCGT
+GGATTCCACCTAAGCGGGCGAGCAACGAAACCGGCGGAAGCGGTTAGAGAGACATTTCTG
+CATCAAGGCAGCTATGCCAGCCTGGCAAAAATAGCAACCAGTGAGTCTGCCGGAAGGCAG
+ATGAGAGGATACGCAGTGAGCAACGTTACGTTGGGAGAGCCTGAAAAGGTCATAGGTTCG
+TCCGGTTGTCAAATCTCCAGATCGCTCACCTCCGGGCCAAACCGGACACTGGTTAAAGGC
+TGGATGGTTTCGCATCCCGTTCAAGACGGCCTTAATAAATGTCTACCAACGGGAAGAGTC
+TACGTCAGTAGCTACCGAGCGCCGGGGAATCGTGGCGCACCTTGGGACTGTGGCGGAGAG
+GTTTATCGCACGTCGGATTAAGTTCCGGTCGAGTCAACGGTGCGAGAGTGGAGACTCGTA
+ACGCAGGTTCGAATCCTGCCGGTCCCAATACGGCGCCAACCACACGCCGAAACCACGAGG
+ATGTGGGGGAAACATGTTTCACAAACGGCTCTCTCCGGAGAATGACCTCCGGGGAGAGGA
+TTTCATCAAAGATCAATGCGAGGTGCAAAACATGAGCAGTACAGACATGAAAACCGCTAC
+CGAACCGGTAGCGGTTAGAAAAAATAAAAGAAAGGTTGTGATGAATCACCCGAAAAGTAG
+CACTATCCGATTCAAAAATCAGGAAATACAGGCAATTGATGAACACCTTGAGTCTATGGA
+CCATCTCATCCAGGACCTCTTTAAGAACGGTAACCGGGCAAACCGGGACCTCTTTGCCAT
+GAGGCTTGCAACCCTGGTGCGGGTGATCCGGGAGACCCTCAACGAAGGGGTGCTTGAGTG
+AACGATCTGCAGAGCCAGGACGTGGTTTCCGAGAACAAGATCATCCAATACATGGAAGCT
+TCGGGAGTCGCCTCTAACCTCAACGATCATGAAAAACGGCAGTTTATCGAGGTGGCCAAG
+GCCTACCAGCTGAACCCCTTCAAGCGTGAAATATACTGCGTGGCCTACGGGCAGGGAGAT
+AACCGGAGGCTGTCGATCATAACAGGCTATGAGGTCTATCTCAAACGGGCGGAGCGAACC
+CAAAAGCTTGACGGGTGGGGTGTTGAAACGGCCGGATCGATCAGAACTCGCTCTCTCAGA
+GCCATTGTCACCATTCACCGGAAGGACTGGCAGAATCCCTTTGTACATGAAGCGTGGTGG
+ATTGAGTACAGGCAGAACAACCGGATGTGGAACGAGAAGCCGGTAACCATGATCAAGAAG
+GTGGCCATTGCCCAGGCCTTCCGGTTTTGTTTTCCCGATGAGTTTGGAGGCATGCCGTAT
+ACCGCAGATGAGCTTTCCGACGAAGAGACCGGATACCGGGATGTTACCGAGGAACATAGT
+GAAATACAGAAAACTCCGCCGCCGGTGCAGGAAGAAGCTACCAAGGTTCCGGAGCACTCC
+GAGGCTATCCCTGAGGATCCGGATGCAAAGGTCAGGGAGGATTTCAAACACAGGCTTGAC
+GGGGCGTTTCTCGGGAAACTGATTACCAGGGACGAGCGGAACACGATGGTTGCAAACAGC
+AAGAAACACTCGGGGAAGACGCTCGACTCTTACATTCGGATGGTAGAGAAGAGGCTCTAT
+GGTCAGCAGCAGAGGGCAGGGCAGGGGCCTTCTGGATCGGGCTCCGGGGATCCGCAGACG
+TCGGTGCCTGAAGCGCCGGAAATCTATTGAGGAAAGGTGCATGGAATCATGAAAGAACAC
+GGAATCATCTTCAACGCCGATATGGTCCGTGCTGATCTTGCCGGAAAGAAATGGCAGACA
+AGACGGCCTGTTAAACACCAGTTTTGTCGATCAGAATACGAGCCGGAGCTCATATCGTGG
+TGGGAACAGAGAAAGCATGAAACGATAGAGTGTTGTGGTAGTTTCAGTGAACTTCAAAAG
+CATGGCCCGTATGGAGGCGTCGGTGATGTGCTTTGGATCAGAGAGACATGGAGAATAGGT
+GCATGGAAATTTCAACCTCATTCTTTTGCGATTGATTACAAAGCAGATAATTATCCTCGT
+CAGGAATGGTTAAGCTGTAATGACGAGCTTATGTTTCTACGGTTATTTGCACAGACGGAG
+AATGATGCTTACAAAAGAGAAATATATCCTAATGGAAATGGTATCTATGATTGGAAACCT
+GGACATTCTCCTGCAGTATGGCGCCCGTCAATCCACATGCCGAAATGGGCCTGCCGGACT
+AAACGCCGAATCACCGGCGTGCGATTACAAAGAGTACAGGATATAAGCGCCGAGGACCAG
+GAAGCCGAAGGATGCGGCCATGAGTTTGCGTTTGTCTGGGATGCTATCTACAAAGAGCGA
+GGCCTCGGCTGGGATGCAAACCCCTGGGTTTGGGTTTACGAATATGACAATACGATCAAT
+CGGGCGAAAACGTCATGAGTAGTCCCCGGACAATCATCATCCCCGCGGCCGAGCGTATCA
+AAACCGGCGAGCGGGGAGTCGTTTCTTTTCGTGCCGGTGAGACTTTCGAACAATACCTTG
+TGCACCTGTTCCGCTACCAGGAAATCGAAAGACGCTCTCCGGCCCCTTACTACTGGCTGG
+CGATCGATGTACCCCACCGTCCCCGGACAACCGGGCACGGCAGCCAGAACCACCATATCA
+ACGGTCATTGTCAACAAATCTCAGTGGAAACCGGCCAGCCCTTCGGGGATGTAAAGCGGC
+TTGCAAAGCAGTTCGCCGTTACCATGGGCTACCCGATCCTTGAGGACGAGTCCGGGGAGC
+CCATACTCGACCTGTGGGGAGATATCCAGGGGATCAGCGAGAGGAACTGCAGTACAGAGG
+ATGCAGCTATTTTGATTGAGGCGATCCACCAGATAGCGGCGGAAATGGATGTGGAGCTGA
+TCGAAGTATGACAGAGCGGCAGGAGGCTATAACGTCAGCTGATATGTGGTTTAGCCGGTA
+TATCCGGGCCCGTGACAGGTGGCGGTCGGTGACAAGCGGATGTAAACGTAATCTGACCTG
+TTCGCACCTGTTCTCACGAAGATTCTACGCTACCCGCTGGGATGAGATGAATGCTTATTG
+TCAGAGCGCAGGGGAGAATGAAGAGCATGACCGGAATCCGGGGAAGCTTATCTGCTACTT
+CATTACGCTTCACGGAGAAGATGCGTACAAAGCGCTTTACCTGAAATCGAGGTCCGGCGT
+GAAGATTACAACGGAAGAGATTCGGACGATTGCACAGTACTACCGGAAGAAGTACGAGGC
+GATCACACAACAGAACCATGACTTTTTTGGCGTTCTTTAGGGAGGAACCATGGCAAACGA
+TATTACCAGTTTCACGGCGGTCGGAAGGCTTACCCGTGATGCAGAGTTGCGATATACGAA
+CAGCGGAATACCGTTGTGTAAGTTCAGCATAGCATCGAATTACAGCAGGAAGGTGCATGA
+TAACTGGCAGGAGGAAGTCAGCTATTTCGATTTCACCCTATTCGGGAAACGTGCTGAGGC
+GCTTGCTCAGTATCTCACCAAAGGTCAGCAGGTGGTGGTTTCAGGACAGCTGAGACAAGA
+CCGGTGGGAGGACAATGGGGAGAAGCGAAGCAGGGTAGCGTTCTTTGCCCAGGATGTACA
+GCTGATTGGGGGAAAACCTGCCGGCCAGAGCAACCAGCAGGGGCAGTATGGAGAGGCCCC
+CTATCAGGGACCGCCGCAGAACCAGCGGGGCGGCTATTCCCAGCAGCCTCCACAGCAAAG
+GCAACAGCAGAATTCCCGGCAGGGTCAGCAACGTCGACAGGGGCCTCCGCCTAACTCCGG
+GTATCAGAAGCCGACAGGCGGCTATGATCAGTGGGGCTACCCGATAAACCCCGGACCGAA
+TAATCAGGGCCCGGATCAGGAAATGGACTTCGAGGACGACATACCCTTTTAAGGACAGGA
+CATTATGGGCGCAAAAAAAAGGATGATAGATCCGGGGATCTGGACGGACCCCAAGATCAT
+GAAACTTTCCTCGGTGTCGGTACTCATCTTCATCGGGATGATCTCGAATGCAGACGATGA
+GGGAATCATCGAGGCTGAACCGGATAGCCTGTACTTCAGGCTGGCACGAAAGGACATCAC
+CATCGATATGATCAAAGAGGCCCTGGAAGACTTCGGGGCCTATGGTCTTGTCCGCCTGTA
+TGGCGGATACGCCTTTTTCCCGAACTGGTTCAAGTATCAGAACCTGAAAGGACGAAAGCC
+GCAGGAGACGAAATTCCGCCGGCCGCCGAAAGAGTATCTGACAGACGAATACCGGAATGA
+ATGGCTTGAGACCTTCAGGAGGGGAAGTGAAGCCCCGTATCCCTTTGAGACCTGTTTTTC
+CAGCGGTGAGTCACCGGTGAGCAACCGGGAAATGGAGGACAAAGAGCCTGCGACAACCAG
+TGAGTCACCGGTGTGCTACCGGTGTGCTACCGGTAGTGCACCAGTGACCACAGAAGTGAA
+GGGAAGTGAAGTGAAGGGAAGTGAGACTAGTATGCCTGCGGCAGCTTCGGCCGAGCCTCA
+GCCTGAGCGGGACGGGGAGGTTTCACCATCGGAGGAGCCGGAACCCGATTCCCCGGAGCC
+TGTTTTCAAGCTCGAATGCCCGGAGCCGAAGAAGCGCAAGGGGAAACCTCCTACCGCCGG
+GAAAGAGCCGACAGACCCGCTGTACCACTCGATCAAGGATTCCTTCCTCGCTGTTGTCGG
+GGACTTCTCGAACTGGGGCAAGGAAGGCAAGGCGATCCACGGGATCATCGAGAAATGCTC
+ACGCGCCTCACCGGAAGACCCTTCGGGCTGTGCCGAGCGGATGATAGGCGAGTTATGGCG
+GCTAAAGAATTCGGGGGATCGGTTCTACCGAGATCAGCCCTTTGTGCCGTCCACCCTCAA
+CGCCTCGGGAATCTGGGACCGGGTTGCCGAGCAGCTGAAGGTCACGGCCGACGAGCTGGA
+AGGTGTGAGGATGTGGGAAGCGCTTGATCCCTACGGGGTGAGAGGCAAGGCAAAGCAGGC
+GGTGGGAGGATAGGCGTATGCAGTGGAACAGCAAAACGTTTATGGCGATGTTGCAGCAGT
+ACTACGGCAAGCTTTCGCCGATCCACGCGGGAGCGCTTGTCGACTGGCTCGATAGCAAGC
+AGTTTTCGGGGGAGTATCTCAAGCGGCTGTACCAGGAGATAACCGAAAGCTACTCAACGA
+AGTACGGGCGGCCTTGTGATCTGGCAGTTGTGAAGGAAACGCACATGGCCCTTGCGCCTT
+CGTATGTGCCCCCTGCCCGGCAGCTTGAGAGTGATCAGCGGATGATTGGGGAGCGGATCG
+TTGAGCGGGAGGAAGGAGCAAAGCTGTTTGCGAGCATCATCGAGAATCTGACGAAGAAAA
+AACGGAAGGTGAAACCGGAGAATAAGTCGAGGAGAGTGCGGAATGACATTCACAGATAAG
+TACCTGAAAGAAAGGATTCCGGCGGTAAAGACGGTTTTCAAAGGGGATGATCCTATTGAA
+AAAGAAATGGTACTTGAGATAACGGACTATGACCGAGGGATCATTGAAATGAAAGCCGGT
+AATGCGTATTACCGGTTTCGGCATGTTGATCTTGAGCGAGCCGTTACATCGATACAGGTG
+CGGCAAGAGGTAAATGCATGAGCGAGTATGGTGTAAGAAAAGTTTGTGGGAATTGTAGGT
+CCTTCGAAAAGTGCTTTGCCGAATCAGAGGAGCTTATCGGAATCTTTTCCTCCGGTTGTC
+TTGCGGCTGATAAGGAGGAGACGCGGCAGATGCCTGCGTGTGGAGACTTTGAGCCGATGA
+TGAAGCCGGTACCGCTGTCCGGGGAGTAAGGGTGCTGGTGTTGGGAGGGGCAATGAGCAC
+GATGATATCGGCGGATTGTAAAGATCAGCGGGTGGCTGACTCTATCCGCTGGCTCTTGTA
+TGAGCTTGAGAAGGCGAAAGACGGCGAGGTGGTGGTGTCGTTCTTCGTGAAAAGCGGGAA
+GGTCCGCGGTGTGGAGAAAGTGGTCAGGGATAAGAGTATAAAACAGGAGTAAGAGCATAC
+ACGGAACATGTTGTGTGAGAATTGGGAAAAAAGCTACCTGTATATTATTTTTACAGGTTT
+CCGCTATTACATTATGGCTGTATTATGTGTATAAATTTTTTAAAAAAAACCAAATTAAAA
+GGATGGATAGAAGAATGAAGAAAATCTGGATTATTCCTGTGTTGCTCCTGTCGATAGGCC
+TCGCCGGATGTAGTATGTTCGGAAACGACGGAGATGATGACGACGATTCCTTCATTGTTG
+GTTACTGGGTTCAAGAGTCGTTCTCTCTCCCCGATACTGATGTCTATGAATTTGCCTCAG
+GTGGGACTTGTGCTGTTTATGCAGACTATGCAATGAGAACCGTAGATCTTGAAACGAACT
+GGTCTTTATCTGGCGATACATTGACCATCATGGGAATTACAGGAACAATAACGAAGGTCA
+GTGAAAATGAGTTTCAATGGAATACTGAACTTGGTAGTCATGCTGTTTACTATCGCAAGG
+GCTACGAGCCTGGTGGGTTTGCATTGGATGGACCATTTACCGAGCTCACTTTAGGAACCG
+CCTATGAAGGGGAGTTTACCGAAGAAACTGATTTCGATGTGTTTACTGTGGCGGTAGAAG
+ATGGGGCAAGCTATGAGATTTTCTGGGAGGATAAATATGATCATGGTGCTTCCTCCTATA
+GTGGAGCCATAGTGGTTTCTGCATATGAGGCAGATAAATCAACCGATTATTTTACGGGTG
+AAAGTACTGGATATCCTATGCCAATGGCTGTTACCGCTAGTGGGACTACCATTTATATCA
+TTACCCGTCGTCCGGTTTCTTTAAAGCTGTCAGGAACCTACAGCTTGAAAGTAAGAAAGG
+TGACACCATAGTAGGCATATTTCCTAAGGCTCTGTGACAAAGAGTAGATATCGGGCATAG
+ATTCCTCTATGCCCGTTTTTTTATAGTTTCCCCCTTGATGCAAAAATTCTTCCGTGATAG
+AATTTTTTTTGTTAGATAACCCAAGGTAAGGATGCTTACCCTGGCCGTTCCGGACGGATT
+CCGGTCGCTCTAATGGTGCAAGAAGCAATCAGGCGGCGAAGTATCTTACGTTAAACACTG
+TGACAGGTGTCTTTCGTGAGCTACTTCGTCGCCTTTTTTTGTGCCCTTTGGCTTTGACAG
+AGGAGAGGACGAGAGACTATGGGAAGGCAGGATAGACGGAAGAGTTCAACACAGCGCGGG
+TATGGAGCAGCCTGGCGGAAGATCCGTATCGAGGTCCTCCAGGCCTGGGGCATCCCGAAG
+CGGCTATGGCCGAAGTATGATGTGGACCACAATCCCGCCTATGACCGGAGAATCGAACCA
+GATCACCGAAAGTACCAGCTCATCCCTCGGCTTCATGCAGATCACAGCAGAAAGACTGCG
+AAGTTTGACAACGGCTTTGGTAACCGGAAGAAGAGAGAACCTCGTCCTGTCTCCCCTATC
+ATCAATCAGAGCACAGCCCGCCTTACGGAGGGGGGATGTAAATCTCTGAGGGAAAAATGC
+CCAAACCACGCGCCTATACAAGAAAACACTCTGTCAGCAAAGGCAAAGGGGGTATAGGCC
+ATGAGTCGAGGCGGACACAACAAAAAGCCGACTATTTTAAAGCTCACCCATGGCACCTTT
+CGGGAGGACCGGGCCAACGAGAAGGAGCCGGAAGTCAAGGCACTTGATGAGACGCCCAAG
+GCGCCGAGCCACCTTAACAATTTTGCAAAGAACAAGTGGAAGGAGCTTGCCCCGGTGCTT
+GCACAAACGAAGGTTCTATCGGAAGCGGACCTCACCATGCTGGAAGCCTTATGCGAGGCA
+TACGGACAGTACCGGGAAGCGCAGTATGCGGTCTACCACTACAAAGATGAGGAGTCCGGG
+AAAACCAAAAAGCGCAGTTTAGCCCAGTACATGAGTGGGAAAAACTCTCAAACCATGCCT
+GAGTACACGGCCATGCGGCAGGCGTTGTCCATGGTCAAAACCATATCCGCAGAGTTCGGG
+CTCTCGCCTGCAACCCGCTCCCGTGTGAATGCAATCGACACACCTGAAGAAAAGGACCCT
+ATGGAAGCTCTTTTAGAAGGGGCCGGATGATGTGGAAACGACTGGTACTTGTGGGGCTTT
+TGATGAGTAGCCTTTTTACCTACCGGCAGTATGCCCAGGATGTTGCAAGCGGGAAGATCG
+TTACCTGCAGGTGGGTGAAGCTTGCTGTAGCCAGGTGGGAAAATGACCTCTTACGGCAGA
+ACTCTCCGGAGTTCCCCTACTACTTTGACGAAGAATGCGCCAACAGGTATATCAGCTTTG
+CCCAGCAGCTTGAGCACACCCAAGGCTTCAGCGGGAAGATCGTGCTTGAACCCTGGCAGC
+AGTTTGCCTGGGCGAATATCTTCGGGTGGAAAAGTACGGCCACGGGCCTGCGGCGGTTTC
+GAAAGGCATACCGGGAGGTAGCACGGAAGAACGGGAAGACGGTCGAAGGGGCTGCAATGA
+TGAACGCCTGCTTCCACCTCGATAAAGAGATCGGGGCGGAAGAGTTCTTTCTGGCGGTGG
+ACCGGAACCAGGCGAAGAAAGGCTATGACGAGGCGGTACGCCAGAACCTTCGAAACCCTA
+CGCTATCGCGGCTTACCAAGGAGTATAGATCCTCAAAGCGCCTTGTGAAGGTCAATGATC
+CTGCGGCCTTCATGACTCCGGTCTCAAGAGATCACAAGAGTCAGGACTCATGGAACCCTC
+ACGCGATCTTAGTGGATGAGTACCATGCCCACGCGACCAATGAGCTGATCAACGTGTATG
+AGTCGGGCATGGGAGCCAGGCGCCAGCCCTTAACGATCATCATCACCACGGCCGGGACGA
+ACATCAACGGGCCTGCCTATCAGGAAGAGCGCACGCTCGTTACCAAGATCCTTGAAGGAA
+GTATCGAGCCGGTTCCGGAACACATCTGGGGGATCATCTACAGCCTGGATGAGGGGGACA
+GGTGGGAGAATCCTGCGGTGTGGATCAAAAGCAACCCGAACATGGGAGTGAGCTTTTACC
+GCGACTACCTTGAAAAGCGTATTGCAGAGGCCAAGGGCTCGCCCCGGAAAGCCAGCGATG
+TTTTGACCAAGAACTTCAATATCTGGCTGTCCTCTCCCACCCGGTGGATGGACCACTCGG
+TATGGATGCGGGGAAGTGCTCCTGTTGTCGAAGAGGAGCTTGTAGGCTCTGGTGCAAGGG
+GCGGGCTTGACCTATCGATGACAACCGACATCACGGCCCTGTGTTGGGCATTCGGTGAGA
+AGGACGGACGGTATCCGCTACTCTGGCGGTTTTTCATACCGGAAGAAGGATTACTTGATC
+GCTGTCACCGTGACCAGGTCGACTACCGCTCGTGGATCGATGAGGGGTGGATGATTGCAA
+CACCGGGGCAGACGGTCAACTACGAGATCGTGTTAGAGGTCTTGCGGCAGGATGCGAACA
+CCTTTGGCGGCCGGTCAATCGGCTATGACCCGTGGCATGCCGGAGAGTTTGAGCGGGAGC
+TTGAGGGAGAGATCGAGCTTGTCAAATATCCTCAACGGTATTCGGGGATGACGGTTCCTA
+CTCAGCTGTTTGAGCGGATGGTGATCGACGGGAAGATCGCCCACGGAGACAACCCGGTTG
+CCTCCTGGATGATGAGCAATGTGGAGCTGAAGGACGACCGGCAGGGGAACATCATGCCCA
+TGAAGCCGAAGCGGGATTCCTACGGCAAGAGGATCGACGGGATCGTGGCGGCCATCATGG
+CGCTTCACCAGGTGACCGGAGGCCAGGTGGAAAGTGCGTATGAAGCGCGGGGGCTTCGAA
+CCCTATGAAAGCGCATATCAAGTTTCGCAACAGAGTAAAGGCTTTTTTCTCACCGCTTTC
+CGGGTTGGATGAGTTTCTCGAGGCTCTAACTGCCGGAGGACGCTCATCATCGGGGATGAG
+TGTAAACGAGGCGACGGCAATGAGCGTGTCTGCCTTTTTCTCGGCGGTCCGGGTCATTAC
+CGAGAGTATTGCCTCCCTTCCGTTGGAGCTTTACGAACGGCTGCCGGAAGGGGGCAAGAG
+GAAGGATGAAGGGACGAAACTCTATCACCTCCTTCACACCCAGCCGAACAGCTGGCAAAC
+CTCCTTCGAGTTTCGGGAGATGCTCACCTATCACATCATCATGCGGGGAAACGGGTATGC
+CTACCTTTCGAGGGGACGGGACGGGCGTATCTACGAGCTGATTCCCATGCATCCGGATAA
+CGTTACAGTCCGGCAGGATGATACCTACCGGCTGCATTACACCTTCCAGTCAAAGCGCGG
+TTCTGTTGCCTTAGAGCAGGGAGAGGTGTTGCACCTGCGGGGCCTGTCTCTTAACGGCTA
+TACGGGCGTGAGCCTTTTGACCTGGGCCCGGGAAGTACTCGGCGGAGCCCTTGGCCAGCA
+GGAGCATGGAAACCGGCTATGGAAGAACGGGGCGAACCCGGGTGTGGTCCTGCGCCATCC
+GAAGACCTTATCTGATATCGCCTACGAGCGGCTGAAAACGGACTGGGAGGACAAGTATGC
+CGGGGCCCGTAATGCGGCCAAGACGGTGATTCTCGAGGAAGGTATGGAGATCGAGCGGCT
+TTCGATGACAAGCGAGGATGCCCAGTACATCGAAAGCAGGAAGTTCACGCGAAGTGAGAT
+CGCCGGGATCACACGGGTGCCGCCGCACATGATCGGAGACCTTGACCGGGCCACGTTCTC
+GAACATCGAGCACCAGGACCTTGCCTTTGTCAAACACACCCTGCGTCCCTGGCTGGTGCG
+GTGGGAACAGGCCTTATCCCGTGATGTGATCAGAGCACCTCGGCGTTTTGCCGAGTTCAA
+CGTGGACGGGCTTGCACGGGGAGATTTGAAAAGCCGGTATGAGTCCTATGCCATCGGCCG
+GAACTGGGGATGGCTGAGCGTGAACGACATCCGGGCAAGGGAGAACATGAACCCGATCGA
+GGACGGGGATGAGTATCTGCGGCCGCTTAACATGCAGCCGGTGGGAGACGAGGTGCCGAA
+GGCGCTACAGGAAAAACAGTCGGGAGAGAAGAGCGATGGAGCATAGAAGCTGGTATGAGA
+TGAAGGGAGAAGATGAAGGGCCTATCACCATCGACATCTTCGATGAGATCGGCGGATGGG
+GTGTGTATGCTGCGGACTTCAAGCGGGAGCTTGAGGCCCTGGCGGAAGGCAACAGTCGGG
+ATATCGTGGTGAACCTGAACTCTCCGGGAGGGGACGTGTTCGAGGGCATTGCCATCTATA
+ACACCATAAGCGCCTACCGGAGCCGGGTGAGCGTGAGGATCACCGGGGTGGCGGCGTCCA
+TAGCATCGGTGATCGCCTTATCGGGATCCCGGAGGATCATGGGGGAAGGGTCGTTTTTTA
+TGATCCACAACCCCTATGCCGTTGTCATGGGAGAGGCGGATGTACTTCGCTCCCGTGCCC
+AGACCCTGGATAAAATCGCCCTCCAGATGGTGGGCATTTACGAACGGCACAGCAGCCTTT
+CGAAAGACGAGATCGAAAAGGCAATGGATGAGGAGACGTGGTACGGACCTGATGAGGCGT
+ATGCCGCAGGCTTTGCCGACGCCATAGAGGATTACGGCGAGATTGCGGCCAAGGCCTTTA
+ACTGGAGGGCCTACCACTATCACAGCGTCCCACAGGCGTTGTGGGAGATGAGGAAACACA
+GACAGGCACCGAGGAGCAAGCGGGAACTTGAAGTACGGCTTGTTGCCCTTGGGTTTAGTA
+GAAATCAGGCGCAAGGGATTATCAGCCGGGGGTACGGGGCCCTGCAGGGGGATCCTGCAG
+ACGGCCATGAGCAGGGGGATCCTGCCGGGGAAGTGGCCAACGGGTTTTTGGAGCTTGCGC
+AGATGTTCCGGCAAGGAGGAAAAGCATAAATGGATCCGGAAATTAGAGCGGCAATTGAAG
+AGCAGAAAAAGGCCTGGAAAGCGTTCCAGGATGCGAACGACCAGCGGCTTTTGAAGATAG
+AAGCCGGGGATGTAAAGGGGCTTTCTGATATCAACGTGAAGATCGACAGGATCACTGCGG
+CGATGGAAGAGAATGCGAAGGTTATCGAGCGGGTCGGAGAGATCGAGAACAGCATCAACA
+AGCTGTCTCTGGGAACCGGCGGTGGCAAGGCCAAAGGGACCGGTGCCTTTAGCGCATACA
+TGAGAAGCGGAGATGAAAGCGGGTTTCGTGCGGATGCCACGGTACAGGTCGATCCCGACG
+GCGGGTGGCTGGTGCCTGAGAACATACGAAAGGAAATCGGACGGATTGCCCAGGGGATTA
+CCGCCATGCGGAACCTTGCCTCTGTGCAGGGAATTTCCGAAGGGGCAAGTTATACCGAGT
+TCGTCACCACCTCCGGAGCCGGGGCCGAATGGGTGGCGGAGACCGAGAAGCGGGAGGAGA
+CCGCCACGCCTTCCCTTGCCCGTATCGATACGGTAGTACATGAGATGTCGGCGAATCCCA
+AGGCGAGCCAGAGGCTCCTTGATGATGCCATGGTGGATATTGAGGCCTGGCTGTCTGGGG
+AAGTGGCCATCGCCTTTGCAGAGCTTGAGGCTGAGAGCTTTATCACCGGAAGCGGGGTCA
+AACAGCCCCGGGGGATCCTTTCCTACGATGCGGTGGAGGATAAGAACTATACGTGGGGAA
+AGCTCGGGTATCGTACAACTGGGGCGGCTGCCGGCTTTGCCTCTTCGAATCCTGAGGATG
+CCCTGGTCGACCTTGCTTATGCACTAAAGAGTAAGTACCGAAACGGGGCCACCTGGCTCA
+TGAGCCGGACAACCTTGGCTGCGGTACGAAAGTTCAAAACATCCATGGGCTACCTGTGGC
+AGCCCTCCTTTCAGGCTGGCGAGCCTTCCATGCTCTTAGGCTACCCGGTGGCTGAGGATG
+ATGCCATGCCTTCTCATACCACAAGCGGGGCCTTTCCCATCGCCTTCGGTGATTTCAAGG
+CAGGCTACCGAATCGTGGACCATATGGGCATTCGGGTACTTCGCGACCCCTACAGTGCAA
+AGCCTTTTATCAGTTTTTACACCACCAAGCAGGTAGGCGGCGGTGTGAAGAATTTCGAAG
+CGATCAAACTCTTGAAGGTCGCAGCCTAAGGAAGGAGGAAGGAGAATGCGGGATATACAC
+CATACCATCGCCATGGAGACTGCCATCGTGCCGGCGCTCTTGAGCGCGGATGGCACCCCT
+GTAGAGGTAGATCTGCAGGGGTATGACGCGGCCGAGGTGGTACTTTCCATCGGGCCCGGT
+GGCATTAGCTTCACCGAGGATAACAAGATCGAGTTTATCCTTTCCCACAGTCTTGACGGG
+GTGACCTACACCCCTGTTACCGCCGGGGATCTGGACGGACTGGAAGGGGACATAGAAGGC
+GGAGTGATCCTCTCGCTTACTGAGGAGAAACCGGAAGCAAGTATGCTGTGTCTCGGGTAT
+GTCGGAGCCCTTCGGTATCTGAAGCTCTCGGCTGTCTTTAGCGGCACCCACGCGGAAGGT
+ACTGCGGTGAGTGCCGTGGTGATAAAGGGCAGGCCGAACCTGGCATAGAAGGATGAAACT
+TTCTTTCCGGCGGGGGCCTTTAGGGGCCTTTTGCCGGGAGAAATAAAAGAAGGACGTAAG
+GTAAAGATGAGTGGAGAGCTAACCAGCTGGCAGGCGGTAAAGGCGCGTCTTGATCTTGAG
+GATAACCAAGAGGATAAGGCAACCGGTCTTATTGCCGTGGCGTCCCGTCGGGCTGAGAGG
+TACACCGGACGGCTTCTTGCAGGTCGGGACGGGACACTGGTGATGGACGGAAGGGCCTCA
+GATCATCTTGTCCTGCCTCAGTACCCGATTAACCGTATCGAGAGCGTGAAGGTCGACCCG
+TACCGTGTATTCGACGGTGAACCTGTCACCGACTATTTCGCAGACCTTGGGGCGGGGATC
+CTGATACGCACCGCCCCTCATCTATGGCCTTTGGGGGTGAAGAACATCCAGGTTACGGGC
+AACTTCGGCTATGGAGCGATCCCTGAGGACCTTGAAGAGTCGGTGATACAGCTGGTCGGC
+TACTGGCTTGGTTCCCAGGGTATCAGCTGGCTGGGTAAAGGGGATGCGGCAAGCGGAGAG
+TATCAAACCATGTATGTGGGGGTGATGGACCTGCCATTTCAGGTTCGTAATGTGTGGGAC
+TCCTACCGGGAGGTGTCAGTGTGAGCTGGGCGAAGAGGAGCAGCAGTGGCCAGAGAAGTA
+CGGTCAGACGCCGGAAGACCGTGCGCTCGTATGCAGGGCTTACCATCTCGGCGGCAGGGA
+ACACGATCGGGCCGCTGACCGAGAAGGCCTATGAGTATGCCCTCGAGTTTTTAGATAAAC
+GGGTGACGGACAGGACCGGGAACCTTCGAGCCGGCATGAGCTATGACGTTAAGGGTCATA
+CCGGAGCGGTGAAGAACGATGCTCCCCATGCCTTCATTGTTGAGTACGGCACAGAGGAAA
+GGGCGACAAAGACCGGTGAGAACCGTGGCCGTATGAAACCACATTCCTTCATGCGGGCCG
+GGAAGAACAAGGCCCTGAGGGAGATACGGAAGATATGGAAAGAAGGATTGAGGAAGGCGC
+TTGATGAGCAGAGCACCGGAAGTTGAGATCACAGAGCAGCTTCGAGCCGACACGGCCCTC
+ATGGAGCGGATCAAAGCAATCTATGACACCGAGAGCCGGGTTTTGCTAAAGATACCGTAC
+CTGGTGGTGAGCCTTGTAAGCGACACGAATGAGAAGGTGTATCTCTCATACTACGGGGGA
+TCAGCTGCCATACAGATCGATATCTATGCAAAGGATGAGAGAAGCTCTGACCTCAGGGCC
+CTTGTCAAAGATGCGGTTCGAAGGATTCGCGGGGTATCGGGGGCCTTGAAGTTCTCCTCG
+GTGGTTGTCACAGGAGATGCGTTTCTCGGTATTGCCCCCAATGGGCTCTACCGCTGGATG
+GTGGAGATCAGAGCGGATTACACGGAAGAAGGAGAGAGATGAGAGATGATGAAGAAAGAG
+CGACTGATTGGAAGTGACGGAAAGCTTGTCACCGTCAATCTTGCATCCGAGGTTACAGGG
+GACGGGATAAAGAGCCTTGATGAACTTGCAGGAGGCCTTGCGGATAACGGGAAAGGTTCC
+GGCTGGTGGAGTATCACGGCAAAGGGAGAAGAGAGCGGTTTTTCCTCGGCCCTTGATGTC
+GGGGAGCTGTTCTGGGATGACGGCACGCTTATCCCGAAAAGTGGGGACAAGTGTGCATTT
+TTAGAGGAAAGCGAGAAGGCCGACATCAACAGCTTTTCGATCGAGGTGAGTAGAAGCGAG
+ATCGATGTGACGACCTTGAGTGACAAGGTCAAACGCTACCGGTCGGGGAAAACGGATATG
+ACCGGCAGCCTTGAGGGGATCACCAACCTTGATATCACCGATGCGGCCGGCTACATCATC
+AACAACTTCATCAAGGTTATCAGGCAGTCGGTAAGCGGGACCATCATCAAAAACGATGTG
+GACGGCTCGCCGATCTACATCAAGGGCGTGATTCAGAAGTCAACGGATAAGGGAGAAAAG
+GAAGCCTTTATCTGGGCAAAGGTCATCATCCTTTCTTCCAGCCTCGGAGCATCGGGGGAA
+GATGCACAGAACTTTTCAAGTAGCTTCAGAATCGCTCCCGGAGATCCTGATCCCACCCTG
+TACATAAGAGAGGTGGGGTAAGGATGGCGGAACCTATCACCATAGCCCGGGACGGGGTGT
+ATGTCCCCTCCTGGGGCAATAAGGGACGGAAGAAGGATGAGAGAATAACGGTGCATTACC
+GGTTTCTCACCTTTGAAGAGGAAGAGAAGATCTACGGCCGGGCCAGGCGGGAAGCCGGGG
+AAGTACCGGAGAAGCAGGATAGCAGGGCCTATGATGCGTGGTATGTGGAGTACCTGTCAC
+AGGCTTGGCTGTTGCGGGTGAAGAAGATGATCACGGAGATCGAAAACCTGTCGGTGAGTA
+TCGACGGCCAGGTGATCGAGGTTAAGGATGGTGAAACGCTCTTCTCAGGTCTCCCCTTAG
+TCGAGCTTGCAAACGAGATTTTGCATGAGCTCAAGGGCCTGACTTCTGTTGATAAAAAAA
+AATAGCCCTTGGAATCGGGCTGTGGATGAGGGGACAGAGCACGCAGAAGGTACGCCGGGA
+GATTGGGGACGGAAAGCTCGGCGTGGTGGTGGACGGGAAGCTGGTAACGATCCTGCGAAG
+TGAAGTGAACGAGTACCTTGATGACTGGTTCTGGAGTGCATTCAGCCTGTGGTACCGCTA
+TAAGCTTTTCGGCGCTCTTCCCTTCTCAGGGGGATGGGCGGAATTACCGGCTTTCATCAT
+CGAGATCATAGAAACGGCAGAGGCCGCCTATAGGAACGGGTATGGGAACAGCACTCATTG
+ATGAGTTAAAGATACTCCTTCGCGCAGAGACACGGACCGCGGTAAAGGCCATGCGCGATG
+CACAGAAACAAACCGACTCACTTGAAGGCCAGCTCAAGAGCCTTGCAACAGGGGCTGTGA
+AAAGTTTCGGAACCTATGCGGCCGCTGCACTGTCGATCAAGAAAGTCATCGATATCTCGA
+GGGAATCGGGCCAGGCGGCAAGTGACGCTCAGGAGACCATGAGTAAGTATGCGGTGGTCT
+TCGATGATGTGAGACAGGCAAGCATGGCAACGGCCAGCCAGCTTGCAGAGGACTTTGACC
+TTGCCTCCTCCACGGCTCAAAAGCTCCTCGGTAATACCGGGGACTTACTCACCGGCTTCG
+GTTTGAGTTCAGATGCTGCCTTAAAGCTCTCCGATACAACAAACCGGCTTGCCATCGACC
+TTGCAAGCTTTTCGAATGCTCAAGGGGGGGCTGCGGCGGTCAGTCATGCCCTGGTATCGG
+CGTTCTCCGGAGAGCGGGAGGCCTTAAAGAGCTACGGGATTGTGATCAACGAGGCCATGG
+TCAAAGAAAAGATGGCAGAGAACACGGCCAAGGGCTTAACCTTTGCCACCGAACAGCAGG
+CGAAGATCCAGGCCACCTTAGACCTTGCAACCGAGCAGTCGAAGAATGCCATCGGGGACT
+ATGCGAGGACCTCAGACAGTGCGGCCAATGTGACGAGGGCCTTGGGGGAAGAGACCAAGC
+GGCTGAAAGAGAACTACGGAACTCTGGTCAATGAGGGGCTGACCCCGGCAAAGGCGTTCT
+TTCGTGACCTGCTTGATTCGATCAACGACAATATCGAGAAGAACCGAGAACTGTCGGCCG
+CCCTTGATGCGATCTACGGCAGAAGCGCGATAGGTGATTCCGTCGAAAGCCTGCAGCAGC
+TTGAGGCGGGCCTCCAGGACCTGAAAGAAAAAGAAGCTGCCCTGCAGGAGCTTGTCAAAA
+GCGGCAGGGGTGATGTGGCGGCCCAGGCGAAAGAGGCTCTATCCGGTATCCAGGGGCAGA
+TTGAAAGGACCGAGCAGCTGATCCTTGCCTCCTCACGGTTTTTGTCGGCTCAGGAAGCAA
+TCAGGCTCGAAGAAAAGCGATCCCTTGAGGCGGCGGCAAAGCTTGCAGCCGTTCGGGAGA
+AAGCTGCCAAAGACAACGAAACGGCGTTGAGTGAGCTTGCAAAGCGAGAGCTTGAAGCCA
+TGGAGCCGAACGAGAAGCAATTGAGGCTCCTGCAGGATGAGATCGACAAGTGGGCTGCCG
+TTCGTGACGCCGGGGTGGCCGCCGGTCAGGATATGGCTGAGGTCCAAAGGCTCCTCAATG
+ATCTTATCGATGAGCGAAACCGAAAGCTTTCGGAAGGCAAGACCAACTGGTCACAGCCGC
+TTGAAGGGCTCTCTGAGTGGGAACAAGAGTATAAGGACATTTTGAATGAAGCCTCCCTTG
+ACCGGCAGCAGATGGAACGGGACGAGGAAGCCCGTCTTGCTGAGATACGGGAGAGCTTTG
+GAAAGAGCCAGCTGCAGGCCCGCCTTGATGAGATACGCCTGCAGGTGGATGCGGCCAAAC
+AGGCCGGTGTGGATGAGGTGGATGTTGAGAAGTGGAAAACCGAGCAGATCATCCAGCTGT
+ATGCCACAAGGGCCCAAGAGGCTATGGCCATCTACAACCAGCTAAGCGGCATGCTCTCTG
+ATATCTACAGCCTCCAGGGGAATCTCTCGGATGCTGCGGCCGAGAAGGAAATTGCAAACC
+TCGACAACCAGATCGAGTTCAAGAAGGCGGCCGGGGAAACATACGAAGACCTTGAAGCCG
+AGAAGACGGAGAAAGAGGACAAGCTTGCGCGGAAGCAGTTCGAACGGGACAAGAAGAACA
+GGAAGAGTGAAACCATAGCATCGGGAGCACAGGCGGTTATCAATGCCTATGCATCCATGA
+ACCCGATTGCAGCCTCGGCTATGGCCGCCGTCATTGCAGGACTGACCGCCCGCAAGGTGG
+CGCTGATCAATCAGCAGCAATACACGGGCCTTGCAGACGGCGGTATTGTGCCGGCACAAG
+GAGATGCCGGAGGGCTGTACCGGCTGGGGGACAAGAACAAAGCTGAGACGGTCATCCCCT
+TTGACATCCGGAACCTCAAAAGCGGCGGGACGACGGTACAGGTGCATGTGGATAATGTGT
+ACGGTCCCGGAGGATCGGAGGCCTTTGCAAAGTACATCGTCCAGACGGTAAAGCGCGGCC
+AGTCATCCGGCCGTGTCGAGAAGTGGGGAGCCTGACGATGAGCTGGCAAATTCTCATTGA
+TTACGGGGACGGCTGGGTCGATATCACCGGCTACGGGGGAGATAACCTTGTCAGGGACTC
+CCTGAAACTCACCGAGAAGCTTCATGACGATGATTTTAAGCCTGCTTTAGGTTCAGCCAC
+GTTTTCTTGTACCCTCACCCCGGCCCTTAGTACCCGGCTTTTGCAGTGTACCGGTACCAT
+CCCGTGTGAGATCTATCATGACGGGGTGATCTGGTTTCGCGGCTTCTCCCGGCCGGTGAC
+CAAGTACAAGGTCACCGATAACGACCGAACCATCGACTTCGAGATCTATGACTATGGGTA
+TCTGCTTGAATCCACCCTGCAGGACGACGTAATGATAACGGACGGGAAGATCTGTGACCC
+GGAAGACCCCGATCATTCGATCGTCCACCTCCTATTGTCCTCTGCAGGCTACCCTCAGCA
+GTACATCGGTATAAGCGAAACCATAGACGAGGTTATCCCGAAGCTCACCTTTGCTTCCGG
+CGACAGCTATGCGGACGATCTTGCGGCGATCCTCTGGGATTACCATCACCTCTACAATGT
+ATCACCTAACGGGGTGATCGACATCTACGACTGGGCCGCCTCTTCCGTCGAAGCGGACGG
+GGCCTTCAGTGAACAGAATATCATAGGATCTCTGGAGGTTGAAAGAAAGGATTCTGAGGC
+CGACCAGGTACAGGTAACCTTCAATCAGTATGAGAAGCTTACCGGCCTTACCCTCTACTA
+TGAGAAGGTCAGTCGATACGAATCGATAGAATCGGATAGTGGTCAGGATGCAGAAGGGCC
+TGGCCTCTGGCCGGCAGAGGGTCCCTACCGTTGTGACTACAACCTTGCCGTCGACAGTTC
+GAATTATGAAGTAGCGGCTGCAGAGAACCAAAGCGTCGAGGTTCATGGATACGTCCCCTT
+TAGCACGGGGTGGAGAATAACGTTTTTCGACTCGCTGTATATAGCCGGGGACCACTATCT
+TGATGTGGCACTACAGGAGCATGCAACCACCTATTCCGACCTGCAGTACAATCTCTCTGG
+CGGCCAGGTTATCAATGAGATCAAGATAACCGGCGACCTTCATATCATCTATAAGGACCA
+AAAGAAAACCTCCGTCTTTTCAGGGCCGAACAGCACGGGCATACTGAAAAAGTATTCTGC
+CACCTACCTGTATGACGATGAGGCTGCCTCTTTCCTTGCAAACGCTCTGTTCTCGTCGAT
+TACGAACGGAAGACTTCATTACACGTTTAAAAGTCTTACCGAAAAGAGCCTTGGAAGCTA
+CGTTACGGTGAGTTCCCTTTCCCTCGGAATCTCGACCCTCATCCGTATCACCGCCCGAAG
+CTGGGATGTTGAGACGGAGATCTGGGAATACGAGGGTGTGAGCGTGGCCCCGCTTGAAAC
+CATCCTCGGGACGATTATTGCAGGGCAGATCGTGGTACCGACAAATCCGGATGAGGCGAA
+GAGTGTGGCCGAGCGGGTGGATGTGGGCCTTGAGTCGGACGGAAGCATCATACAGCCGGT
+CAACGGCAACCAGCTGGTGGATATCGACACCACGGTGGCAGGGCTCTATATGACGGCAAG
+CGCTCTGGGCTTCTTTGATGGAGAGGAGTGGACAGCAGTCATTAATAATGATGGTACCTG
+GTCCTTTCTCGGGGACGGGAATAACTACATCAAGTGGGACGGCTCACGTCTTGAGGTCCA
+CGGGGACCTCTTTCTCTCCGGTGACTCAGAGCTTCGGGGGAAGATTACCGCAGGCAACGG
+TATTGAAAGTGACGACTACGAGCAGGGTGTTTCCGGCTGGAAGATTGGAGGGGACGGGGA
+TGCCTTTTTTAACAACGTGTGGCTTCGTGGGGACCTGTACGGCATACTCCATGACCTGAC
+TATCGATGGAAACCTGATTCTCTCAGACGGGGCGATTAAGGCGGGGGATACCATCCTCGA
+TGCCTCGGGGATCAGAGCCAATGCGGGACGGGTCGGCAACTGGCTGCTCTCAGCTACCGC
+TATACGCTCGGATGAGGTGGGAAAAGCGAGGATAGAGCTTGATCCCGGGGACAACCGTAT
+CGAGGTGTGGGGTTCAAACACAGCCGAGCCTCGGGTTGCCATGGGATACCTTGGGGGCTT
+ATCCGATCCTTCGAACAGAGCAAAAAGCCTTGCCTCTACCATCTTCGGTTTCTGGACCGC
+CGACGGGGATTCGATTGAGATCAGGGGCGAGATGCGCCTTGTTAACGGTCAGTATGTGCT
+CCAGGATGATGCGGCTTTAGAGATCCAGGACAGTAGCACCGGTAAGGCTATCCTTCGGGT
+GGGATCAAACGCGGGGACTCAAGGGGTGCATTTCTTCGATGAGGCGGAAGCGCCTCTTCT
+GTCTCTGGTGGCCGATGGTATCAAGGCCGAAGCTTCAGACAGAACCCTTCATACTATCGT
+ATTCAGCAAAGCCAGCTCTTCGTTTACCTCATATCCTTCCGGTATGCCGAATAAACGTGG
+GGTGTCATTGGAATCAGATGGGCTGATCATTATTGCAAAAGCAAAAGAGAATGTAGTCCT
+TGGATACATAGATGTTAATAAAAAAGTTTTTGACTGGATCGGGGACATCAATTTCGACAT
+AGCAGGCAGCGGCGGAGTAAACCGGTATATCAAGGCCGACGGTCATATTGCGTTGACATT
+CCGTGTTGGCGACACCGAATCAGGGCTTGCGCTTGGGGAAGGGTTGAATCATATATCAGT
+CATACCTGCCATGATATGTAATTCAAATGTTATTGTTCGTCAATCAATGGATGTTTATCA
+GACGCTGACAGTTGGGAAGGATAAAGCAATCTTTCAGATCGACCCTGAGCATAATATTTT
+CACGTACAAGGGGGTATCGGTATTCGAGGCTTCTCACCCCATAGGCTCTCAGTACACACA
+ATACGCCTCAAGCGCAAGTAACGACTTATCGGTTGCCTTCCCGAATAGCGAGTCCCCCGC
+TTACCTGTTTGGAGGGACCTGGGAGAAACTGTGGGACGGCGAAGGCATAGACTTTCATAC
+CGAAGGTTACAACGGTTCAGGACGAACAAATGGGCTGATGCCCGATAATCTGCAATACCA
+CTGGCACGCTGCTTATCAAGTGTTCGCTACCGTCGATGGGGGAAAATACAATGTCGGTCA
+AGCGATCAGCCCCACTTCAGGAACACAGAGAAATGTGGGTGGCCCCATATCGGACGGCAC
+CCACGGAGCCCCACGGCTGGGCGAGCGGACCTCCGACCGCAACCGGCTCATGAGGATATG
+GAGGAGAATTGCATGAAAACCTATGCCGTAATAGATGGATCAATGATTACCACTGTGGTG
+CAAAGCGCCGATGAGGCGGCCAAGCTTGCAGAGCTGTTTCCGGAAAAAACCATCAAGGAG
+GTTCCTGCAGGGTTTACCGGAAACAAAGGCGATGATATCCGCTTCTTCGATGAGGATGGA
+AAGCGGCTTTCGATAGCAGCCGCAACAGAAGCCGGGCTTGTGCCTGAGGTCGGAGAACAT
+GAGGCCGCTATTTGGGAAGGCGGTAGGTATGTGCTTACCCCTGACTATACCGGTGTTCCC
+TACTGGAAAAAGGCCACAGGAGCGGCGGTACACCTGTCCCTCGGCCGAAAGCCCGATGAG
+AGTATGACCGATATAGAGCCTTCGGACCCGCAGGCCGTGTGGAACGAAACGGGCTGGACA
+GTTCCCGAGGAGGTGCTCTCCGAACGGGTTCGCTTAGAACGAGACAGGCTGCTTTCAGAA
+AGCGACTACATCATGATGGCCGACTATCCCCTTACCGACAAATCGGACTGGAAAGCCTAC
+CGGCAGGCTCTCAGGGACATTCCATTGCAGCCAGGCTTCCCTCAGGAGATTTCCTGGCCA
+CAGGCACCGGAAAAAAGGAGTTAAGCCAATGGGCGATAACGACAAAATCGATATGGTCTT
+AAGCATTGTGACGGAACAAGGCCGGGACATCAAAGAGATCAACAGTAAGCTCACCGACTT
+TTTCATCAACCGGGAAAGTACGTGCCCTGTTGAGAAACGCCATGAGAAGAAGATTGAGTA
+CCGAACAGTCATTGTCGGAATGGTGTGCGGTCTTGGTGGTTCGATTATCGGGGGATTACT
+CCCCGTTGTTTTGGGAGGGTGATATGTATTATCAAAACAGTATTGAGATGCCGGAGCGGG
+TACAGAAATGGGGATGCTACGCTACCGTAATTTCTGCGGCAGTAGCAGGAAGGACAAAAC
+GTTCTATCTCACAAGAGGATTTTGTTAATTGTGTGATTGAGTCGGAACGCCGTCGATACC
+TGACTGAGGACCCGGAGGCGCCTGGAACCTTTATGTATGTGGCAGACCCGACAGGGATCT
+TCCGCCTCTTCGGCCTGAATGTACGCTACCTCGGGAAAAAAGACGCGGACTATATATGCC
+AGCCGAACGAGATAGAAATACTCTTGTGGCGACGGTGGAATGAAAAAACGCGCAAGTACA
+TCTACCATTTCACCCTGGGTAACGGCCGTGGCATGACCGTCTATGATCCATGGGCTCCAT
+TCAGCAAGACTGCAAGCGAGGGGGAACTTCGGTCGAAGCGCATCTTTCTCGATCTTGGAG
+AAGTAGCGGCATGAAAAAGCTCATCGTAAAGCTGTGGAAGGCTCTGGGAGAGAAAGGAAA
+GGTGGCGACAATCATCGGTTTCCTTTTTGCCTTCCCGGTGAACATCAAGTTTGTCATCGA
+CTACTTCTCCGGGATCTTTTACTCAAGGGGACAGATGGAAATGGCCCTTGTTACCAATGT
+GCTGGCCATGGTGTGGCTGATCCTGCCGTCGGTTATTTCCATTCATAGCCCGAAGATCAG
+TATCGAGGTAAAGGATTGAGATGCGCAAAATTATTAGCATTATCCTTACTCTTTTTGTGT
+GTTTTTCCGCCGGCTTCCTCCTGGGCACTTACCGCTCAGGAGGCGGCGATAGTGGACGAG
+CTGCAGAGTACGATAGTCGAGGCAAAAAGCGAGATACAGAGTATCAAGCACTCAGCGATG
+AGTATGAGCGAGCAGTTGAGGCTTACGAGGGAGAGCTCGCAGAGCTTCGAAAAGAGGTGG
+CAGGCTACCAGCGAGAAGCTGGAGGACTTACAGAGCGAATCGGAGGAGCGCAAAACGAAA
+GTGTCGGCATTGCAGAGCGAGCGGGACGGGCTGAGGACGGACTATCAAGAGCTCTTGATC
+TATTGCGAAGGCTTAGAGAGGCGGAACCGGCGGCAGGGAATGGCCCTTAAAGCCGGGGGC
+TCTGCCCTGGCTCTCTCTATCATCGTCAATGTGCTGCAGACTGTGTTTTGATTGGTGTGT
+TTGGTGGAGTATAGGAGTTGAACCCTTCGCATGGCAGAATTATAATACTCCCAAGTCATT
+TCGTTGGTTATCTGCATGAATTTCATGTTGATAAAGGAAGTTATATGTAATGCTCTTTTT
+CTCAGATTTCCTTTAAAAAAAGGCATCATGATGTAAATAGTTACATAACGTATTGACTTC
+TTTATCGTGATGCATTATGTTACATCATGAAAGCGGTTTTAAAAAAACCTAAAGGAGTCA
+AATATGGAAACAGTAACAGTAACTTTCAGCATAGAAAAACCAGATTTAGCCGATTATAAT
+CAGCTATACCCGAAAATGCCTTGTAATACCGAAAAGAAGCAAAATCTTTTTGAAGTCATT
+ACAGATGCAAGGAACATTTGTGGTGCATTGCAATTCACAGAATCTACAGGTTCATCACCT
+GTTGCTTTTTATGAAAAACAAATTCAGTCAATGATTGATTCGGGAACTCTTTCTGAACTA
+GATTGGAATGAGAAACAGTTTGTAGGAACATCAACGAGTGTCGTTATGCAAAGCAATGGT
+TGGAATAAAACTGGCCGAAAACAAAGATTCTCAAAAGGGATCTTTAAAAGTGCAGAACTT
+TATTCGCGATAGGGCATTTACCAAGGGTATTTCTTAATTCTCTGGTTGTTTTTCTATACC
+GCGCGAAAAAGAACACTACATATAACAGCGAATATGCGGTTCCGCTTCGCTGCACCCAAA
+TGCGGCGTTGCCGCACTTCGCATATTTCTGAAACGTTAGATGTAATAAATGTTGGACATT
+ATTGAGGAACAAATGGGGCAAGCACTTACAGAAAAAGAAAATGAACTTTATAAAAGGATT
+GATGAAGTTACTCATTATATTTGGGATCCTATTGGCGTGAATGGCTGTCCTGGTGCAAGA
+GATGAGTATTATTCATATTTACCCAAGATTTTCGAGCTTGCCCAAAAAGAGAATTCAGAA
+TCTGAAATTGCAGAATATCTAAATTATGTACAATCTGAGAGAATGGGTCTTAAATCTGAC
+ATAAAAAGATGCAAGGAGATTGCTTCCATAATTATTGACTGGAGCGAAAATCTTGGAATA
+TTGGGGTCTTAACCAACCCCGACATTTACTACATCTAACAGCGAATATACGCTGCGGCTT
+CGCCTTGGCCTTCGCCATATTATGCTGCCAAAAACATCATATAAAACCAGAACGTTAAGC
+ATAGTATGTATTTATTCTCTATTCAAAAAGAACGTTATGGTATTGTTGCTTTCGATAAAT
+CTGATCCATTCGACTATATTATAACCTTACAAGTAAGGAAGAATCCTGATAGATTGAGGT
+CAATCACCATGAGAGGGGGAGCCCGTTTTGCCTAATAAAATAAACAGTTTCCTGGACGTC
+CTAAAGGCTGGTGCCTTAGTTTTGTTCTCCGGGATTATATATGCAGTTGCTATCAAGTAC
+TTCATCATGCCATCAAAAGTCATAATGACCGGATCAGAAGGAATTGCTTTAGCGACATCT
+TATTTTTATAGCTCAGAGCGACTATTTGTTCTCTTATACGCAATTTTCCAAACAGCGCTC
+ATCATTTTTTCTTTTGTAAAAATCGGATGGATATTCAGCACCAAGACTATACTGACAATA
+CTGACGATCATTGTGCTTCTCCTTATCTTACCGGATATCAAAGTGGCATCGCCAGAGCCA
+GAGAATGAGCGTCTCCTCCTTGTGCTCTTTGGTGCTATCATTGCTGGGATTGGGAAAGTC
+GTCTCGTTTCTTAATCGTGGCTCTACTGGAGATGAAGATATCGTCAGTGTTTACTTTTCA
+GAAAAACTGAGAAAACCAGTTGGTAAAATCAGTATTTTCGCCGGCGTTATTTCTACCGTT
+TATGGTTTGATTCTTAATTTTGTCAATTCCCACGATATTTCTATTGTGGCCAATACGCTG
+ATCTATACAGTTATCTACATTTTTGTTGGTGCATTTACGGTCAACACCATATACAAAAGG
+TACAGATACTCCAATATCATGATTAATTCGGAAAATCCTGAAGAGGTTATCAAAATTATC
+AAGTCCATATTGCCAGAGCGAACTTATACAAGGATCAGTGGGACTGGTGGGTATTCCAGC
+AAGGAGAGAACCTTGATATCGATTATTGTAACCCAGGAAGAACTTCCCCAGATAATCCGT
+TCCATAGAGCAGATGGAGGGGAACTACTTTCTTTATCACTCAGAAATAGATGGAATCAAA
+GGTCGTTTTACATATTCCAAAATACGATGAAAATTGGATTCTTGCTTCAGTAAGAGAATC
+GTAATATACCCATAATCATTTGACACGGGTACTAAGCTTAACAGCTGTTGATACGCTCCG
+GCGATACAAAATATACTCGCTTGACAAATGGCGATGCTTTGCCGGGGAGCTATGCCCCGG
+CTTTGCTTGTCAAAAAGTTTTTCTGAGCTTCCGCGATTTGCCGTAAATCCTCCGGCAAAT
+AATCGGTATAATGGTCGGTCATTTCCTGCGAGTCGTGTCCGGTGAATTTCCGTATCACAT
+CGTCAGATACTCCGTTATGACGTAGCAGGGTATTGAAAAATCGCCGAGCTGAATGGAAAG
+TTATATTCCTTCCTTCTCGCTCTATTCCCATCTCGTCCATTCTCTTGTACATCCACTCTC
+GCAGCCGGTTCGCCGTGAGCGGTGTTTCTTGCCGCGGGTGATGCGAGAATACGAAGCGCT
+CAGGGCCTGTCATATAGCAATTAAGCTCTTCTCTCAGCTCTGGCATAATTGGGATTTCCC
+TTATACCTTTATCTTTCACCGGAGTTCGCTTTTTAAGCTTGCTGTGGTACTGCTTTGAGA
+TTTGGAGATAAGAGAGTGTGACTGTTTTATCTCCCCGGACAATCTCAGAGTCAATCACAT
+CATCGGTGAAAAGTCCGCATACTTCGCCGATTCGCAAGCCAGCCATAAAAGCAACTTTCA
+TCGCTGTATAGTAGATTCGATCTTTGTCGCTTGATATTCCCGAGTCTTCGAGAAGCTTTT
+CCACTTCATCTATACTCAAGGCTCCGTATCTATTCTTGTCGACCGATAAAGGCCTGACCA
+TGCGCCAGGGATTGAAATATGCCGCTGTCGTGTCCCGCATCTTCTGGATCCGTTCGTACT
+CTCCAAGGATGGTTGAGTAGACGCTTTTCCAGTTGTTCGCTGTTTTATGACTCACCTGGT
+TAGCCCACTTGAACAGAAGGTCCTCGCAGTCCAGCGGGGTGATTTTCTCAATCGGTTTGT
+CTCCGTGGTATGGAAGGATATGGTCTCTGGTTATCTGGGTAGCTCCGTTGCAGTAGTTCT
+CTGTTATCCCTGGTTTTTCTTTCGAAGAGCGGGCGAGAATTGCCCGGACGTAGCTACTAC
+GCCTATAATCCCAGAAGTACCGACTCTCTACCCATTGGGCAAGAGTTACGACCTTTTCCT
+TTGAAAGGCGGTTTTTCTCAAGTAGCTCCTGACAGTAAGCAACTGCTTCTTTGCGGCTTT
+TGACTTCATCTTTCTTTCGTGTGTAGCCAATCCCGGTGCTTTTCGCCGGTAGACGCTTGC
+CGTCAGTTCCGTATGCTTGATAATACCAGACTGTCTTGTTCTTGAGTGTTCGTGGAAACA
+GGATGTATTCGTTGTCTCTAAATCTTGCCAT
+>NC_014364.1|provirus_2329685_2350621
+ATGGCAACTGATTTCTACCATCTTTTCAAGCGAAAATATCAAAACAAAGCAGGCAGAGAG
+TACTTCTACTGGTGGTATTGGTGGTACGACCCCGATACCGGCCGACAGCTCCAGAAGCCC
+GCAGGACGGGCCGAATCCGTCAGGAAACATGCTCAGGAATATATCAACAATCTCCCTATC
+CCAAGCGGTAAAGCGGATACCGTTCGCGCCGTTGCAGAGGGTATGTTTGAGGCGGGCTCC
+CCTTACCTACTCCGACGTGAAGCCAAGGGTTCGGGGATGAAAGAAGGTACCCTCAGAGCT
+TACTCAGGCTTCGTCAGGAACCACATTGTCAAAGACTGGGGAAATACACCACTTAACCAG
+ATAGAAGGCGCTGACATCGAAGATTGGCTCATGGAGAAGCCTTTTTCAAACTCCACACGG
+AACAGCATCATCGATTGTTGGAACCTCATCTTCCGGGAGGCAAAGAGGTCTAATCAGGTC
+CGCCGGATTCCCACAATAGAGCGCTTTGCCCGGAATTCAAGGCGGTATGACACCTTCCGG
+GATGATGAGCTGTTCGCCCTATTCCCTGAGAAGCGCGAAGACCTTATAGCTCTGTACAGT
+GATCCTGAGAACGACTATTACGAAGAGATTGAGTACTACGGGCTCATGTTTGCCGTGATG
+CTGCTTACGACGGTTTCCGGGGGCCTGCGATCCGGGGAGATACGGGCGCTCTGTAGGGAC
+CAGGTATTCATCAATCAGTCGGGTATCGTGGTTAGTAAGGCTCTGGACAGCAACAACAAG
+GTAACGCTTCCGAAGAAAGGGAAAGATGATAATCCGAAATGGCGGGCTGTACTGTTGCCG
+GAAAGAGCGATCCAGGCCCTCTCATGGTGGCTTGAAGTGGCCCCACCCTCCGGGATGCTG
+TTCAAGTACGCTGATAAGCCGGTTGACCGCAATCTGCTGCTTGATAGGCTCAAGCTGGGC
+ATGGAGCGTGTAGGGCTCAAGCTGGGCATGGAGCGTGTAGGGCTCAAGCTGGGCATGGAG
+CGTGTAGGGCTCAAGCTGGGCATGGAGCGTGTAGGGATCAAGCCGGAGGGGCGGAAGCTG
+AAGGTCCATTCTCTCAGGTACACGTACAACACGAGAATGGAGACTTTACTATCAGAGGAG
+CGGTTATTGCAGTTCATGGGGCATGAATCGAGGCAGATGACGCTCCACTACTCCCGGCCG
+TATTGGCAGGAGAGGCTTGTTGCGTATGGAGGTGACAAGGAGAAAGTCGAGCAGTTCTGG
+AAGTGAGAGATTTTAACGATAGAATCGCTTTAAGCAATTTACTTTAGTCTTTTGAAAGCC
+GAATCGCTCATTTGCTTTTCCATCTTTCTATTACAATTGGGACATAGATACTGTTTTTTC
+CCATCTATCTTCCATACATAATACTTTCTTTTAAATGGAGTTGAACAAATAGCACAACGC
+CTCGGCTTTCGGAAGACAATAGCCAAAATAATTACAATGACAATTATTACATATTCCATA
+TAATAATGTTAATCCGGTTTTTAAGTTCTGTAAATAATTTAGTGTATAAAAATAATTGGT
+AAGTGTTAAGCAACTCTAATCTATTGAGAAGATATTTACCAAATTTTTATATTTTTAAAT
+ATTGCTACTCCTACAGGAGGTGTAATTGAGATATTTGGAGTACAGTATTTATAGACCGTA
+ATAAAAGACGACGACTACTGCACTCAATTAGTTAGTATAAAATATTTCTAAATCGCAAGC
+CTTTCTTTTTTTAATTCTTTAATATAAATCTTAGGTCCAATTCCGAAAATCTCCAACTCT
+AAGTAATCATCAAGTATTTTCTTAATCTTAGCAGAAGTAATAAACTTACTATTTTCATCA
+ATATTAATATTCTTAAAATCATTATTCTTTAAGGCTACCATAACGTAATCACCAATCTCT
+AAATCATTCTTTATATCTCCCTTAGTTACTTCTTTTACAAGTTCTGCATTTAGATATAAT
+TTAGTAACTTCGTCATTATTCGTTAATGCCACAAAAGTATCATTCGTTATATATTTGTCA
+ATTTTTACTTTCAATTTTCTATATCCCATTTCTGGATGCAATAAATAAATTTTCATATAC
+ATGCCTTGCTTCTTAAAAAAAACCTTAATACCATTTTTTACAGTAAATGGTGGGAAATTT
+ATTTCTGAATCTTTATCAATCCATCCAGGATTTCTCTCTACTTTGATCCAAAACGTAATA
+GAAAAATTATATTTATTATTCATTTTTCATCTATTCCTATGTTTATCATTTCGTTCAATT
+TTTCTTGTGTCAAAATATCACCTGTATATTTCTCAGCAGAGGCTCCTTTGTTTTCTTGTT
+TTAACAAATTAGCAATAGCTGTCCAACCAATTAAACCTGAAGCAAAGGCATTGACAGCTG
+TATTGGGATTGATTAATAGCAGCCCTCCAATTGATGAGATCAATACAAATCCAAACCCTT
+TCCACCAAAATTTTACCTTAGTATCTCCTATGGAATAGAAAATATATTTAAAGAAATATG
+CAGCAAATGCTCCGAAAATTGAAGCAGCAATTTTAAAAAACACCCAAGCGTTTGGATCTT
+TACCTTCACATAGCCATTCAAAAACTATTTTCATTTGTTCCATGAATTATTAGCCTTTAT
+TATCACGAAATTATTCTTTTATAAGAATTACTATATCATTTACAAAGATCATGATATTTG
+CCACTCCTACTACAAAAAATTAAAGCATTGTAGATATTTTTACCTCTGTATCTATGTTTT
+GTCGTTTTTGGACAATCGCATTCTCTCCATATTGTTTCTTGAAATATTCTTTAAATTCCT
+CTGTTTTTCTTAGCTCTTTGAATAAGGGCCATTCAATCAGCTCATTTTTACCAATCACTT
+TTCTCTTATTATTATCCTCTTTTATCATTCGTATGGCTGTTCTAAAATCTCTTTCTATAA
+CAGCCTTTGCTATTAAATACTCTTCTGTACATAATGACCAATCAATTTCTGATAGTATTT
+TCTTTGATTCTTCATCTCGCTCTTGCCATAAATATGTCTGAGATAGATTTATTTTTAACA
+TTGTGTCTAATGCCAATATTCTAATTTTACCAAAACTATTTAATGCAAAATTTAAAATAT
+TTTCAGCAATGTTATAGTTTTCCTCTTGTATTTGTTCATATGCAATGGTATTTAAATTTT
+TCTTTATGCTATCGTCTGGATCAAGTATATTCCATACAATATGCCCGAGATATACAACAA
+TTAGAAATATAACATCACATGAATGCTGGAAATATTCAGGTGAAACAGATAATTTAGATC
+CAACAACTATAGTATCACTATTTCTTCCAACTTTTTCTAAATACGACTCATTAACAGAAC
+CATCACAATGGGTAAATAAATTACGCCTTTCAGTGATCTCAATAAACTCCTCTATTAGTT
+TTTTATCACTTCTCAGATTTATGTTAAGTTTTTTCTCAAACCACTTAAGATGATCATCAT
+GTGAACATCGAATAACTGAATCAACTTCTTTTTCAATTAAATATGTAATAGCCTTCTCTA
+TAGAATCAAATTTTTTAATATCTGCAAATGTTAACTTCCTATCTGAAGTATTTAATATTT
+CAGGCTGTTTATTCAGAACATAACGTATCAAGTTACCTATGTAGAAATCAAATTGACTTA
+TAAGAGATATAATATAATTCCGTGGTGCTATATTTAAAGATATTTCTAATTTACTTATTT
+TTTCTTTTATACGTATAAATCTTGTGAATTGGGATTCTGGAATTCTATATCCTTCACCTT
+TCTCTTTATCAGATATTTTCTCACATTTAGTTTCTAAGAATCTGTTATATTCAATCAAAA
+GGTTATTATGTAATTGTTCATACAAAGTAGCAGAAATTGGCAATGTATTCTTGATGGCAT
+CAATCGCACTTACGGTCTTGTTAAGGATATCAATAATTTCCATAAACTACCTTTTCTGTG
+TAATAAAGATTTGATCTTCCGTTCACCTCAAATATTCAAGATATTGACCTGATGCCAAAG
+TGTAGGAGAACAACGATTTTACTGCCGTTGTAACGTCTCCGCAGAAAACGTGACAATGGA
+CAAGCCAACTTTAACTAGTTGTTCTATAGAATTATTTTTACATGATATTCTCCAGGAAGC
+CAAGCAAATCATTACTCCACTTATTGTAAGTTTTTACTCTACTATACAAGGGTGTTGAGA
+ATAAGATATCCGTTGGCCATTTTATTTTAGCTATAGAATAGTAAGGTATAACTTTTTTGT
+ACATATCATTCATTGTCGCTCTATTTAAATGTATTGTACAATTTCTTGTAATCTGCAAAT
+GTTTAATACTATTACTATATGATCCTACAAGGGAACTAATCTTTACTTCATGTAATGCAA
+TTGCAATATTTAAAATTGAATCAAAGGATCCCCAAGTAGGCTCTTGGAACGAAGCACTTA
+TAGCTCCATAAGGATTTTTTCTCTTATTTATTTTATATAAAATATTATAGACTATCTCTT
+TTTCATTTTTTGTATTTAATATACTATTTCGATGTTGATAGCTATTATTAACATCGAAAT
+AACCTGTGTATTTTGATATCCAATATGATCTCCAATACGAATTCCATGCCTGCCAGAAGT
+AATTAATTATTCCATCTATTTCAAAGCGATTATTACATGATTCATTCTTGTTTAATAAAA
+AGGTACACTTTTCAAAAGAATTATATAAGGATAGATAGTTCTTTCTTAAATTCATACTTT
+CTGTAAAGCTTTAATAAAAAATTTTGTACGATTTATTCTATTGCTTACACTATGAGTTGT
+CTTTAAGCTTGATTTTACAAATTCTGAATATTCACCATCTTCAACTTTTTCATCTACCTC
+ACTTAGCATATTTATTATTTCACTAATTGATTCATTAGTATTATTACAGAATTTCCCTAT
+AGGTAATAATCCATCGATTATTTCTGAATTAATATTTTTTATGCCCCAATTATTATACAA
+TAATGCTGCAAATAAACTATAAAAATTAAAACCACTTAAAAGTTCTTTTTCTAAAAGATC
+TTTTAACTCTGTTTTGATGAAATCTAATGTTAGAAATAATTTACTTTTTATCTCATCTCC
+ATATATGAAATCTTTATCATTGATTTTGTAAAGATTATCAAGCTTTGAGACGCTCCTTGT
+GACAATGCCTTCTATAATCAATTGACATAATTCTGTGAAAAGATCTGCATCTATCATCCT
+AGAAATATCTCTTTGAGATAATATTTTATAATCTTCAAGTATTGGTGTGTATCGTTCAAT
+AACATCTTTAATAAACCATTTAAAATATCCTTGATAGGTAGCATGTCTTTGTTCCGGTTT
+ATTCAATGGCAAAGTATAAGAATTTATTCTTCTGAAAATTTCAATAACCTCATCTCTTGA
+AGCACCTACAGCTGTGTCTACTGAAATCTCATAAGATAAGAAATTTGATTTATCATCATC
+TGACAATTCTGAAAATATTATATTGGGATATTCAGAACTTATTTTTGATAGTTTAAATTT
+GTTATCTATAAAATCTATAATAGAAGTACATCTTTGTTGTCCATCAATAATTTCCCGTAT
+AGACCTTTTAGTTTTCAAATCTATCTTCTGTAATAAAGTAATTTTAGGAAAAGGAAATCC
+TTTTATGATAGTATCAATAAAGAAGGATCTTGAATTATTAGGCCATAAACCTCGTTCCCT
+TTGATACTCTTTGTTAATTATTAATTCCTCGTCTGTATAGTATTTATATAGATCAGCTAT
+ATTCATTGTATTTCGTATAATTTTCATTCTCGCTCCTTATAAAGGACTTCATTTACCATG
+ATATTAAAGTATGGTATTAAATCAATTTCTGTATACTGATCACATGAACTGTTTGATGAA
+GTGTCATAACGTTACCCACACAACACAAAACAGCAACGTAGCGATATGCACCCAATCTGC
+TCAATGTTATTGTTAAGTTTTTCCCTTTGATAATGTAAATAGAAAACCGCTCAAGGCACC
+TCCAATATCATTAAGCAGCCTAGCATGATCGCCATTTAATTCGTAACTTCCTGGAGCAGC
+ACCATGGGCGGAACCAAAATGTGTTCTTAGGCTGCCAATAGCACTGAAAATGCCCTTTAC
+ATTCCCCAATAGTCTTTTTAGATCATCATTTACTTGCTCATCTGGTGAAAGATTTAATAC
+TTTCATTGTTTCCGCAATTAAACTAGAAATATCTCTCCTAACAGGTTGTGGCTGCTCTAA
+ATCTGATAGTATCTTTTTACAAACTGCTTCAAGATAACTACATGTTCTTGTGATGGAATC
+GGCGGGATCAGTTTGAATGCAGTTTCGTGCTTTCAACCAACTTCCATACAAATTGTGATC
+ATCAGTCTCTTGAAGTACCTTCGTTGTATGTTTAAATATCAGATTAGATTCACTATTAAG
+CATCTTATCTATAACGGTATAATTATTAGCTGGCAGCTCCATATCATCCAACTGGGATGC
+GAGATCTTCCAGCAACGAATTTAATGACTCTTCGCTTGATAATGATTCAAGCCATTCGAT
+AGGCGCGGAAGATAGTTCCTGTATACTATAAGTACGCCAATCAACCGGGATATGTTCGAG
+TGAATCTTCTATATCCATATAAGTAGATCTATAGGCAATGGCAAGTTTTTCAGAATTACA
+AAATAAGTACCCGTATACCCAATCGTCTGGACCAATCATCCCCAGATGTTTTTCTTTTGA
+ATGACCAGAGATAGAGACATCCTGCAATGTCTCTTTTATTACAACCCCAAATTCCTGCAG
+TTTTGGATAGATCTTATCTCTTTTGGATTTTATTGCTAATACTCTTGATCTAATGTCATC
+TATCGTAGGCATTTTAATAATCCCCCAAGTAAACTTACCAGCGCATAGATTAAGTTTTTT
+GAGTAGAAAAGGATCCACAGTCTTTTCTGTATATAGACCCAATAAAAAGTTAATAATCTC
+CTTGTATTTGATAAAAGCATGAACGGGTAGTTTTGGGGCATAAGACCAATCACAATTCAT
+ACTTATATCTAAATCTTTATATGAATAATTGTAACCCCACTGTCTTCATAGAGCAACAAA
+AAAACTCAACTTTCTCTAACAGCTTGCTATCGTGAGAACTTTATAATCTTGCATTCGATA
+GCCTTTACGCCTCTCGCTTAGCTCTTTGAGCAGAACGATCAGCCAGGCTGGAAGTCAGTG
+CCCTAACTGTTTCCAGATCCTTCTCATCCAATGCTTCCAAGTCCTCTACGATATCTGCAT
+AGCGTTTCGGTACTTGCCAGTTGTCCGGATTCTTGCCAGTTACCAGATATTCTACGGTAG
+TATCAAGCACCTCAGCTATTTCTACGGCTTGATCCGCATTAGGCATTGTTTTTCTTGACA
+TCCACTTCCGAAAAGTTCCAAAACTCACGCCGGTTTTATTGGCGACCCATTCTTGAGTTG
+TCTTTTGCTCTTTAATTAAGGTCTTTAGCCTTTCCCAGAAATCCATACTTCATTATCGGC
+TATAAATAGAGCAAATTGTCACAAAAAACACTTGACAATGTTCCTTTATTGCTCGATTAT
+GAATGTATGAATAGAGCAAAAATGGAACATAAGAGTCCGCCAGCTGTGAAAGTTAATCTA
+ACTGAGGATGAAATTAAAAGAATTGATAAGGGTCCCTTAAAAGCAACTTCAGGGAGAGGT
+CGTGCAACTTGGGTTCGTAACCTCATTACCAAGGAACTTGACCGTTACGAATCCATCCAG
+TCCGGCAACACACAACTCGACTCAAAACCATTTAATCAAAACAAGGAGATGAAATGACGT
+ACATGAACCAGACCGAAGCGGCGAAGTACCTTCACGTATCGCCCAGCTATGTGAGCAACC
+TGACCAGACAAAAAATGATACCTCACAAGCGGATCGGCGGGAAAGTGATCTACACAAAAG
+AGCTTCTCGACCGGTGGATACTTGAAGATTCATTACGAAGCGTCGGGATAGACCCGAAGA
+AAAGCCGCCTGAGCGACACGGTTTTAGGAGAAGAGCCTTCAACTACGGGGGATGAGTAAC
+GGGCCTACCCGGCCGGAACCTCAGATCGGTGATCTTTGACAGATAAGAGAAGGGATTAAG
+AGATAAGGATTTAGTGCTGTCCTGTATAGGGAAACCATTTGGAATGCTGAGAAAGCAGCC
+TCTGACCAGGCCATTACCACTTGTGGGGTTCGAATCCCCGAGGGCAGCAAATCATAATCT
+GCTACCGGTCAGTAGACCGGCAATCTACTCCGTGAAAAGCGGGAAAGGAGGAAAGCGTGA
+CAGACAAAACGAAGCGCATTATAGCCTATGCGCTGACTGCGATAGCCGCCGCAGTTTTGG
+CGTTTGCCGAGCTGTTTGGCTGGGACCTGCCGGACTGGGGAACAATCATGAACGTAATAG
+TCATCATTGCATCTCAGGTCTTCGGCATTGAGTGGATTCCACCCAAGCGGGCAAGCAATG
+GAACCGGCGGAAACGGTTAAAAATTTCAGATGAGATAACGGCTAAAAACAGGCAAACGAG
+ACGCAATCGTTAACTGCGTTGGCGCCCGGGAAAATTAGATAGGGCTGACCGGGGGCAACC
+AGTGAGACCGCAAGTAGACGGGCATAATTGAGGCGAAAGCCGAGTGAATGATCAGGATGG
+CAACCTGATTGAAAAGCGTGTTATGTCGATAGCCTAAGCTCCGGGTCGCGCCGGACACTG
+GTTATTGTTGATCTTACGGTATAGATGTGTTGGCCACCAAGTACCAGCAATGGTGATTTA
+TATCGCACTATCAACTACCGAGCGCCGGGGAATCGTGGCGCTTTAAGTGACCGGATGACC
+AACCATATACCTTTTCGATATGGCGGTAAACAGCACCTCCCCAAGGCGTAACGGTCGTCC
+GGTTTCTTAACTCCCTCGTATGGGGGAGAAAAACAATCCGTGATGCCGGAGAAATAATAG
+CATCTATATTTTCGCGGCTGTATGCCGGGATTCAAACAGGTTGGATCGGTAAACACCAAT
+TTTCCTACCGGTCCAACAACTTTCAACCTTTTTCAAGGAGGACATGGTAATGGAATTGGA
+AGAAAAAGAAAGCTTGCAAGGTTTCATAGGAGTGAAAAGGATCAAAGCACGACCGATGAC
+CAGGCGTGGATACAACGGCTATCGTGGCTGGCAACTTCCTGCGGATGAAAATGGAGATGA
+TGAAGGGATGCTTGTCGAGTATGTCGATGGCGGTAAATCCAATCATCCCGCACATGAGGG
+CTATATCAGCTGGTCACCTATCGATGTTTTCAATCGTGCATATCGGCCATGTGATGCCCT
+TACGTTTGGCTTTGCAATCGAAGCGGCAAAGGCCGGAGAGAAGATTGCCCGAAAAGGCTG
+GAATGGAAAGGGCATGTTTGTCTTCTACCAGAAGGGCTACCCGGAAGGAATACCGATCAA
+CAAAAATACCGCAGAGGCAACAAGATTGCCGGAAGGAACCGTCTGCAAATTCCGGCCGTA
+TCTCATGATGAAGACAGCACAAAACGACTTCGTGCCATGGGTTGCATCGCAGACCGACAT
+CTTAGCGGAGGACTGGGAGATTATCGAGCAGGGAGAACAGAAATGAGTATTGAAACAAAA
+GAAAAGGCCGCTCCAGGCAAGGATACGGCCACAGAAAACAACCACACCAATACTACCATG
+ATTGGATTCAGGCAGCAAGAACTTCACGAGATCGAGGAAAGCCTTGAGGAGATGGACCAC
+AAGATACAGGAGCTTTTCCGTTTCGGAACCGCCCATAACCGGGACATCTTCGCCATGAAG
+CTATCTGGTGAGGTACGGAGAATCAGAGATCAGTTGAACGAAGGGAGGCTGATGTGACGA
+TCGAAAAGACAAGCCAGATCAAGGCAGGTGATAACCTTGTGATGGTGATCTACGGCAAAG
+GCGGTGTGGGAAAGACAAGCTTCACCGCCTCAGCTCCGAACGTGATCCTTCTCGACTTTG
+AGAACGGAACCAAATACCTGGGAGCCCGCGGCTTCAATGTAGATGTGATCAGGCTCAAGA
+GCTGGCCGGCAAACGCTGAGAAACAGAAGCTTGCGGCCTTGGTTGCACCCTACCACACCA
+TCGCTCTTGATCCCCTTGGGGAAGCGATGGAGAAGCTCCTCAATTCACCGGCGTTGAATG
+GCCGGAAGTTCCGACAGGCAGACGGATCGTTGACCATGGCAGGATGGGGCGAAGCTAAGG
+CACAGATGCGAAGCTTCATTAAGTGGCTCCGGGATTCCGGAAAGAACGTGATCATCGTCG
+CTCACGTTTCGGAAGAGAAAGACGGGGAGATGATCACCAACCGCATACAGGTTGCAACAA
+AGCTCAGGGAAGAGATACCGAACATCGTGGATGTTATCAGCTACATGGGAGTGAAGATGG
+TCGACGACAAACCTGTTCGCATCCTCTACACACCCCGGCAGGGAGACCAGTTTGACTCAA
+AGGATCGAACCGGCCGGATTCCCTTGACTGTACAGGTCAGCGAACATGATGGCTTTAACG
+ACCTGCTCAAGGCTATGGAGATCGGGCAGCAGAACATCCCTGAAAACAAGATGCCGGTAC
+CGGAGGCAACACCTACCACATCCCAGGGGCCGCAGGACGAGAAGCATACGGAAACCACAC
+CAAAAGACCCGGACGAGGAAGCGCGAACACAACTCAAGTACCAGCTTGACGGTGCCATTG
+TCGGGGAGCTGGTTACCAAGGCCGAGCGGGATGAGGTGCTTGCAAACAGCAAGAAGTACA
+AGGGCCAGGTGCTTGAGGCCTACATCAAGAGGATCAGCGATGAACTCTTCAATCTCCAGC
+AGAAGGCAGAAAGCGCAAACAGCACCGTTGCACCTGAGCGGAAAAATCAGCAGGCAGAGA
+AACCGGAAGAGGTTTTGGAAGAACAGCCGCAGGACGACGAAGAGTATGCGGCAGAAGAGG
+CCGGACAAGCAGAGCTCGAAATCTGGTAGGACAGGAGAAGGACATGAATATTACGGACAT
+AACCGTTGAGGATATCATCGAGGAACAGGAGACGGCAGAAGAAACGGGACTTGAGAAGCT
+CAAAGGCGATATTGATGAAGTGATCAGTCGGATGGAAGAGCTTTCCATCCAGAGTGACGA
+ACAGCTTGCAGAAGCAGGTCAGTGGCTTGTGAAGAACAAGCAGACACAGAAGATCGTCAA
+GGACCACTTCGAGCCTGAACGCAAAGAGACCTATGCGGCCTACAAGGCTGTGACCGATCA
+GATCAAGAAGTACACCGACATCCTGACCAAGGCTGAAAGAACCGTCAAAAAGAAGATGGG
+AGCATACCAGGCGGAACAGGAACAGCGACGCATCGAGGCAGCAGAGAAACAGCGTAAAGA
+AGCGGAGAAGGAACGGGAGCAGCCAAAGGAAAAGGGAAATTCTGCACCTTCTATTCCCCT
+TCCCCCTGAGAAGAAAGAAGAGCCGGTGAAGATTGACGGGGTTTCCTTTTCGGATAACTG
+GACCTTCATCATTGAAGAGACCGACAAAATCCCGAGGGAATACATGATCCCGGATGAGAA
+GAAAATCCGCCAGGTGGTGAAGGCGTTAAAGGCTGATACCAATATTCCCGGTATCAAGGT
+CTACGCGGAAAAGACCGTCAGTGCCAGGACATGAGACCATGACAATTGAGGCACGAATAA
+ACATTGACTTTGCCCCTGAGGAACACACCTACCGCGTTGACGGCAGGAAAGTTTCCAGTG
+TGACAAGCATCCTCAAAAGTGAAGGGTTCATTGATACCCGGTGGTACAAGCCATCGGGTA
+CTTCTCGCGGGGAAATGGTCCACCAGGGAACGGAGGCAATCGACCGGGGCCACCTTACCA
+TTGCACAGTTCCCACCATCGGAAATTATTCCCTACCTCAAAGCCTGGCAGGCCTTCAAGG
+CTGATATCGGGGTGAGCGAGTTTGTGATCATCGAGCTTCCGATCGGCAGCAAGGTTATGG
+AATACGGGGGAATCCCGGACCGGGTTGCAGTGATCAACGGGGAGTATTGGCTTCTTGATA
+TCAAGAGCGGAGCACATGAGCTATGGCACGGTCACCAGCTGGCCGCCTACAAGATAGCCC
+TTGAAGAGACCTTCGGACTGCCGATTGCAAAGCGTCGGGTGGTGCACCTGAAGAAAACCG
+GGAAGTACTCAATTTGTGGGGAGGACAAGAAGATCGGTTCCTTTGACCTTCCGGTCTGGG
+AACAGCAGTGGATTGCGATCGCGACCGCTCGGCTGATCAAACAGCGGTACGCAAAGATAA
+AACCGGAGACTGTATGAGCCAGAGAGCAATTGTCATTCCAGCGGCCGAACGGATGAAGAC
+CGGAGAGCCGGGAGTCGTTTCCTTCCGCGTCGGTGAGGTATTCCATGAGTACCTTGTACA
+CCTTTTCAGGTACCAGGAGATAGAACGCAAGTCACCATCACCCTATTACTCACTCAAGAT
+CGACACTCCAAAGCGGCCGAGGACAACAGGAGAGAACAGCCAGAACCATCATATCAACGG
+TCACTGTCAACAGATAGCCGTTGATACCGGCCAGCCATTTGAGGACGTGAAGAAGTACGC
+GAAACAATTCGCGCTCACCATGGGCTACCCCATCCTTGAGGACGAGAACGGCGAGCCTAT
+ACACGACCTATGGGGAAAACCGCAAGGGATCAGTGAGTCTGATTGCAGTACGGAAGATGC
+CGCGATCCTGATTGAAGCGATCCACCAGTTAGCGGCGGAAATGGGAATCAACCTCATCGA
+GGACTAAGGAAGCACCATGGGAAAAACAACAAAGCAGAGAGCAAAACCGGTACGAAGACA
+GAAGACACGACGGCAAAAGGCCGTAGATGCGGCAGACCGGTGGTTCAGTCTCTACATACG
+ACAACGGGATGGGAACCGTTCAGTGACAAGTAACTGTATAAGGAACCTGACCTGTTCACA
+CCTGTTCTCACGAAGATTCTACGCTACCCGCTGGGATGAGATGAATGCCTATTGCCAGAC
+GGCAGGAGAGAACCTTTACCACAACCGGGATGCAGGACCTTTGACCAGTTACTTTCTCGA
+TGTGCATGGAGAGGAAGCCTACCGGAAGCTGTATGAAAAGGCCCGCTCAGGGGCCAAGTT
+CAGAACAGACGAGATCGAGGATATCGCTGCTTACTACAAGAGCCGGTTTGAACGGCTTAC
+ACAGAAGCAGCGCGACTTTTTCAATGTTATTTAGGGAGGGACTATGGCAAACGATATTAC
+CAGTTTCACGGCAGTAGGACGAGTGACCCGTGATGCGGAATTCCGATACACGAACGGTGG
+AACACAACTGTGCAAGTTCAGCATTGCGTCGAATTACAGCAGGAAGGTACGGGATAACTG
+GCAGGATGAAGTCAGCTATTTCGATTTCACCCTATTCGGGAAACGGGCAGAAGCACTTGC
+TCAGTATCTCACCAAAGGTCAGCAGGTGGTGGTTTCAGGACAGCTCAGACAAGACCGGTG
+GGAGGACAATGGGGAGAAGCGAAGCAGGGTTGCGTTCTTCGCCCAGGATGTACAGCTGAT
+CGGGGGAAAGCCCGCCGGTCAGAGTAACGGGCAGTATGGAGAGGCCCCTTACCAGGGTCC
+GCCGCAGAACCGGCAGCAAGGCTACCAGCAGGGGCCTCCGCCTAACAGCGGCTACCAGAA
+GCCGACAAGCGGCTATGACCAGTGGGGACACCCCATAAACCCCGGACCTAATAATCAGGG
+CCCGGAACAGGAAATGAACTTCGACGACGACATACCGTTTTAAGGACGAATTACCATGGC
+ACGACGCAGAATGATCGACCCGTCAATTTGGAGCAATGAACAAGCGCAGTGTTTATCAAC
+ATCGGCGTTCAAGGTGTATGTGTTTCTCATTTCACAGTCCGATGATGAGGGGTACCTGAA
+GGTATCCCTCGTCATGTGGCCCTCATTGATTAACCCGGTTGACAGGAGCTACACGAAAGA
+ACAGCTGGTAAATGACCTCAATGAGATTCTTGCCGCGGGGCTGGTGGAAGCCTACAAGTC
+GGGTGATGAGGTCTATGTGAAACATCCTCATTGGACACTGTACCAGACCATACAGAAGCC
+TTCAGGAAGCAAATACCCGAAAGATGGCGAAAGAATCTACCGCATAGAGGAATATCGTAA
+TGATATCGGTACGGTACCACATGAATATGATACCGATACAATACCGGTAAACGACCACTC
+TCATTTCGTACCGCCTAAGTTAAGTAAAGAGAAGTTAAGTAAAGATAATACTAAGATACC
+TTCGGTAGCATCGGCAGAGCCTCAGCCTGAGCAGGGAGAAGCGACTAAACCGGCAGAAGA
+GCCGGAGCCGGAAAGCTCTCCACTTCCCCCACCCGATTCGCAACCCGATCCAGAACCTGA
+CATCGAACCGGTTCTTGAGCTTGAATGCCAGGCACCGAAGAAGCGCAAAGCCAGCAAGGG
+GAAAGCACCTACCGCCGGGAAAGAACCGGCAGACCCGCTGTACCACTCGATCAAGGATTC
+CTTCCTCGCTGTGGCCGGAGACTTCACGAACTGGGGCAAGGAAGGCAAGGCGATCCACGG
+GATCATCGAGAAATGCTCACGCGCCTCACCGGAAGACCCTGCCGGGTGTGCCGAGCGGAT
+GATCGGGGAGTTATGGCGGCTAAAAAATTCCCGAGATCGGTTCTACCGAGATCAGCCCTT
+TCTCCCCTCCACCCTCAACGCTTCGGGAATCTGGGACCGGGTGGCGGAGCAGCTGAAGAT
+CACGGCGGACGAGCTGGAAGGTGCGAGGATGTGGGAAGCGCTTGACCCCTACGGGGTGAG
+AGGTAAGGCAAAGCAGGCGGTGGGAGGCTAACAGGTATGCAGTGGAACAGCAACTGGAAC
+ACGAAAACGTTCATGGCGATGTTGCAGCAGTACTACGGCAAGCTTTCGCCGATCCACGCG
+GGAGCGCTTGTCGACTGGCTCGATAGCAAGCAGTTTTCGGGGGAGTATCTCAAGAGGCTG
+TACCAGGAGATAACCGAGAGCTACTCAACGAAGTTCGGCCGTCCCTGTGATCTTGCGATC
+GTGAAGGAAGCTGACGAGCGGCTGTACCCGCATTACTTTCCACCGGCGAACCTGCTTGAG
+GGGGACGGGAAGATGATTGAGGAGCGGGTGGCCGAGCGGGAAGAGGCGGCACAGTTTATG
+CATAACCTGATCGAGAACCTTGTGAAGAAAAAGCGGCGGGTGAAGCCAGTGAAGAAGCCG
+AGGAGAGTGCGGAATGACATTCACAGATAAGTACCTGAAAGAAAGGATTCCGGCGTTAAA
+GACCGTTTTCAAAGGCGATGATCCTATTGAAAAGGAAATGGTACTTGAGATAACGGACTA
+TGACCGAGGGATCATTGAAATGAAAGCTGGTAATGAGTACTACCGGTTCCGGCATGTTGA
+TCTTGAGCGAGCCGTTACATCGATACAGGTGCGGCAAGAGGTAAATGCATGAGCGAGTAT
+GGTGTAAGAAAAGTTTGTGGGAATTGTAGATCCTTCGAAAAGTGCTTTGCCGAATCAGAG
+GAGCTTATCGGAATCTTTTCCTCCGGTTGTCTTGCGGCTGATAAGGAGGAGACGCGGCAG
+ATGCCTGCGTGTGGAGACTTTGAGCCGATGATGAAGCCGGTACCGCTGTCCGGGGAATAA
+AGGTGCTGGTGTTGGGAGGGGCAATGAGCACGATGATATCGGCGGACTGTAAGGATCAGC
+GGGTGGCTGACTCTATCCGCTGGCTTTTGTATGAGCTTGAGAAGGCAAAAGACGGCGAGG
+TGGTGGTGTCGTTCTATGTGAAGGGCGGGAAGGTTCGGGGAGTGGAGAAAGTGGTCAGGG
+ATAAGAGTATTAAGCCGACATAGGACATACACGGAACATGTTGTGTGAGAATTGGAAAAA
+AAACTGGCTGTATATTGTTTTTATAAGTTTACGGTATATACATTATGGTGGTATAACGTG
+TATAAATTGTTTTTAAAAAACCAAACTAAAAGAAAGGATGGAAGGATGAAGAAAATCTGG
+ATTATTCCGGTGTTGCTCCTGTCGATAGGCCTCGCCGGTTGTAGTATGTTTGGAAACGAC
+GGGGATGACGACGATGATAACAATACCTCCGCTCCCTTTACTATTGTTGGTTCCTGGGTT
+AGGGAGTCGCCCTCTTATTCCGATACTGATGTCTATCTATTTGCCTCAGATGGTACGATG
+ACTCTCTATAGCGATTATGCAATGACAACCGTAGCTTCAGTATGGACCTGGGCATTATCT
+GGCGATACATTAGCCTTTGATGGTGACACACCCTTGCAAATGACAAATATCAGTGAAAAT
+GAGTTTATCATGGGTTCTTCTACCTATTATCGTAAGGGGTTCGAGCCTGATGGACATTCT
+GAATCATTGCCTGTTGGTTTCTGGGTTATGGCGTCTCCCTCTTATTCCGATAGTGAAGTC
+ACTCTATTTGCCTCAGATGGGACTTATACTCTTTATAAAGACTATGCAGTGGCAAATGTA
+AGTGAAAAAGGGACCTGGTCATTATCAGATGACAGTTTAACCGTCGACGCTTCTTTAACT
+AACGCAACAGAAACAATAACGGTTGTTAGTGAAAATGAATTTACATGGAATGGATGGACC
+TTCTATCGCAAAGGCACCGAGCCTGATGGACATAATGATCTAATAGGTACGTGGGTTCCA
+TCTTTTTACTCTATACCTGATACCGAAGTACATCAGTATAAAGCTGATGGAACCTTCACA
+TACTATAGTGATTACGCGATGCAGAAGATCTATCGTGAAGGTACCTGGACGTGGAACTCT
+GATCATACAGTCCTTACAATAGTCTTCACACGCTACGCCAATGGTTCTCAAGACTCTCAA
+GTTAAGTTTCTCAGTGGTAATAAAATCCAGTATGGTGCTGAGTACTTATATCGGAAAGGA
+TCTGAACCCTGTGGGAATGTCTTGTCCGGTTCTGCTACAACGCTGGCTGTCGATACAGCG
+TATACAGGTGAATTTACTGATCTAAGTGCTAAACTTTTTTGTGTAACGGTAGAGGATGGG
+GCAAGCTATGAGATTTCCTGGGATGATTCTGATGAGGGTAGCGGTTCCTATACTGGAGAT
+ATATCAGTCTCCGCATATAAAGCGGATAAGGCAAGCAAGTATTTTGCAGAAGAAGATCGT
+GGATATTCTGTTCCCCAGAGTCTTTCCGCTAATGGCACTGTCATGTATATCGTTGTGGTT
+CCTTACCTTGAGTTTTATTTTAGTGACTCCCTTGGTACCTACAGCCTAACCGTAACAAAG
+GTGACACCATAGTAGGCATATTTCCTAAGGCTCTGTGACAAAGAGTAGATATCGGGCATA
+GATTTCTCTATGCCCATTTTTTTTGTCTTCGTGAAGGGCGGGAAGGTTCGGGGTGTGGAG
+AAAGTGGTCAGGGATAAGAGTATTAAGCCAGCGTAGGACATACACGGAATATGTTGTGTG
+AGAATCCTGAAAAAGAGCTACCTGTATATTGTTTTTATTGGTTTACGATGTATACATAAC
+AAGTATAATGTGTATAGTGTAAACTATAAAACAAACCAAAAGGAAGGATGGAAGAATGAA
+AAAAATCTGGATTATTCCGGTGTTGCTCCTGTCGATAGGCCTCGCTGGTTGTAGTATGTT
+TGGAAACGACGGGGATGACGACGACGATGATACCGCTGCTCCCTTTACTATTGTTGGTTC
+CTGGGTTAAGGAGTCGCCCTCTTACCCTACTACTCATGTCTATGAATTTGCCTCAGACGG
+ATCTTGTAATATTTATGACAACTATGCAATGACAGGCGTACCGTATAAAACAACCTGGTC
+ATTATCTGGTGATACTTGGAGCCTTGATGACGACTACTCAGCTACAATAACAATTATCAG
+TGAGAATGAGTTTACCGTGAACGACAGCACTACCACCTATTATCGTAAGGGCTACGAGCC
+TGGTGGGCATGTTGATGAAACATTGCCTATTGGCTCCTGGGTTATCGACCGTTGCTCTTT
+CCCTAATACTAATGTCTATCTATTTGCCTCAGATGGGACTGTTATTCTTTATGCAGACTA
+TGCAATGACAACCGAAGATGCTGCAAGTACCTGGTCATTATCTGGTGATACTTTGACCCT
+TGATGGCGACTCAGCTACAATAACAATTATCAGTGGGAATGAGTTTACATGGGATGGATA
+TAGCTACTACCGCAAAGGCTACGAGCCTGATGGGTTTGCATTGGATGGACCTGCTGCCTC
+TCTGAGTTTAGGAACCGCCTATGACGGGAACTTTACCGATGGAGCTGATTTCGATGTGTT
+TACTGTGGCGGTAGAAGATGGGGCAAACTATGATATTACCTGGGATGACTCTTTTGACGG
+TAGTCACCACTATAGTGGAGACATAAAGGTTATTGCATATGCGGCAGATAGAGCAACCGC
+TTATTTTTTTGACAAAGATAATGGATATACTCACCCTGAGACTATAACCGCTAGTGGAAC
+AATCATCTATATCATTGCCCGTCCGTATGATTCAGACTCGGTAGGGACCTACAGCCTGAC
+GGTGACAAAGCAGTAGCATATTGTTGTTATCACCATGAACTAAAACACATGACGGGCATA
+GATTCCTCTATGCCCGTTTTTTTATGGTTTCCCCCTTGATGCAAAAATTCTTCCGTGATA
+GAATTTTTCTTGTTAGATAACCCAAGGTAAGCATACTTACCCTGGCCGTTCCGGACGGAT
+TCCGGTCGCTCTAATGGTGCAAGAAGCAATCAGGCGGCGAAGTACCTTACGTTAAACACT
+GTAACAGGTGTCTTTCGTGAGCTACTTCGCCGCCTTTTTTTGTGCCCTTTGGCTTTGACA
+GAGGAGAGGACGAGAGACTATGGGAAGGCAGGATAGACGAAAGAGTTCGACACAGCGCGG
+GTATGGAGCAGCCTGGCGGAAGATACGCATCGAGGTCCTCCAGGCCTGGGGCATCCCGAG
+GCTCCATGCAGATCACAGCAGAAAAACTGCGAAGTTTGACAACGGCTTTGGTAACCAGAA
+GAGGAAGGAACCTCGTCCCGTTTCCCCTATCATCAATCAGGGCACAGCCCGCCTTACGGA
+GGGGGGATGTAAATCTCTGGGGGAAAAATGCCCAAACCACGCGCCTATACAAACAAACAC
+TCTGTCAGCAAAGGCAAAGGGGGTATAGGCCATGAGTCGCGGCGGACACAACAAAAAGCC
+GACTATTTTAAAGCTTACCCATGGCACCTTCAGAGAGGACCGGGCCAATGAGAAGGAGCC
+GGAAGTCAAGGCACTTGATGAGGCGCCCAAGGCACCGAGCCACCTCAACACTTTTGCAAA
+GAACAAGTGGAAGGAACTTGCCCCGGTGCTTGCACAGACCCGTGTACTCTCTGCGACTGA
+TCTCACCATGCTGGAAGCCTTGTGCGAGGCATACGGACAGTACCGGGAAGCGCAGTATGC
+GGTCTACCACTACACAGATGATGACGGGAAGAAGAGGAAACGAAACCTTGCCCAGTACAT
+GAGTGGGAAAAACTCTCAAACCATGCCTGAGTACACGGCCATGCGGCAGGCGTTGTCCAT
+GGTCAAAACCATATCCGCAGAGTTCGGGCTCTCGCCTGCAACCCGCTCCCGCGTGAGTGC
+AATCGACACACCTGAAGCAAAGGACCCTATGGAAGCGCTTTTAGAAGGGGCCGGATGATG
+TGGAAGCGACTCGTACTTGTGGGGCTTTTGATGAGTAGCCTGTTTACCTACCGCCAGTAT
+GCCCAGGATGTTGCAAGCGGGAAGGTTGTCACCTGCAGGTGGGTGAAGCTTGCTGTAGCC
+AGGTGGGAAAATGACCTCTTACGGCAGAATACTCCGGATTTCCCCTACTACTTTGATGAG
+AAATGCGCCAACAGGTATATCAGCTTTGCTCAGCAGCTTGAGCACACGCAAGGCTTCAGC
+GGGAAGATCGTGCTTGAACCCTGGCAGCAGTTTGCCTGGGCGAATATCTTCGGGTGGAAA
+AGTACGGCCACGGGCCTGAGGCGGTTTCGAAAGGCATACCGGGAGGTTGCAAGGAAGAAC
+GGGAAGACGGTCGAAGGGGCAGCAATGATGAACGCCTGCTTTCACCTCGATAAAGAGATC
+GGGGCCGAAGAGTTCTTTCTGGCGGTGGACCGGAACCAGGCGAAGAAAGGCTATGACGAG
+GCGGTACGCCAGAACCTTCGTAACCCTACATTATCGCGGCTTACCAAGGAGTACCGATCC
+TCAAAACGCCTTGTAAAGGTCAATGACCCTGCGGCCTTCATGACCCCGGTCTCAAGAGAT
+CACAAGAGTCAGGACTCCTGGAACCCGCATGCGATCTTAGTGGATGAGTACCATGCCCAC
+GCGACCAATGAGCTGATCAACGTGTATGAGTCGGGCATGGGAGCACGGAAGCAGCCCTTA
+ACGATCATCATCACCACGGCCGGGACGAACATCAACGGGCCTGCCTATCAGGAAGAGCGC
+ACGCTCGTTACCAAGATCCTTGAGGGAAGCATCGAGCCGGTTCCGGAACACATCTGGGGG
+ATCATCTACACCCTTGATGAGGGGGACAGGTGGGAAGATCCTGCGGTGTGGATCAAAAGC
+AACCCTAATATGGGAGTGAGCTTTTACCGCGACTATCTTGAAAAGCGTATTGCAGAGGCC
+AAGGGCTCGCCCCGGAAAGCCAGCGATGTTTTGACGAAGAACTTCAACATATGGCTTTCC
+TCTCCCACCCGGTGGATGGATCACTCGGTGTGGATGCGGGGAAGCGCTCTGGTCATTGAA
+GAAGAGCTTGTCGGACGAGGGGCCCGTGGCGGGCTTGATCTATCGATGACAACCGATATC
+ACGGCCCTGTGCTGGGCATTCGGTGAGAAGGACGGGCTGAGGAGGGACTATCAAGAGCTC
+TTGATCAGATACGAAGGCTTAGAGAGGCAGAACCGGCAGCAGCAAACGGCCCTTAAAGCC
+GGGGGCTCTGTCCTGGCCGCCTCTATCATTGTGAATGTGCTGCAAGCTGTGTTTTGA
+>NC_014364.1|provirus_2666253_2703772
+ATGGGACGAGCAAGGAAGCCTTTCAAGTATTATTTCCGTCAGGTTAAAGGAAAGAATATC
+TGGTATTATTCGATTTCCCCGGTTTCTGGTGTGCCTTTCGAGTTATGCGAGGACCGGAAA
+AGTAGCCATATAGAGGCTGAACTTGACGGTTCAGGCAAGCCAAAGAGATCGAGTGAACAA
+AAGATAGTACGCTTTTGCCTTAACAGAATACGCGAGCTGAAAGACGGTTCAGAATCACAA
+TCGCCAACGCTCGCGGAATTCCTTCGTCCATACTTCACGCCAGAATGCCCGCACATTACC
+CGCGTTCTATCAGACGGCAGGCGTTATTCTGACACCTTTCGTAAAGACCAACGATCACGA
+ATAGACCGTCTGGTTCTTACGCACCGAATAGCCGAATTCAGAATGGACGAACTGACTCCG
+GGAGATATCGAGGACTTTAAAAAGGATCTTCGAAGGTCAGGAACAGGAACGAGAACAATC
+AACCTTACCGTCGGAGCGATAAGGACAGCTATCAATGAGGGGCTTCACAGAGGCGACATA
+AAAAACGATCCAACCGTCGGGGTACATAGTATTAAATCCGACGAAGAGGAAAGAGGAATT
+TTCTCAATCGAAGAAATTAGAAAGATGTTTTCCTTTCCTGGTGGATTAAGATTGTGGGGA
+TATGATACCGGATACCACGGATCTCCGTCTGGGGAGAAGGTATTGCCGATTATTCCTTAC
+ACTCTTGCACTCTTGATGTTTGCAACCGGTGAAAGGCCATCCGCCATATTGCGACTTAAT
+TGGGAAGATGTAGATAGTGATATGATCACGTTCAGGGTTACAAAGGCGGCAGGGGCCAGG
+AGTATACCCATTGTCACGATGGCAACAAAGGCGCTTCGTGAGCTCTCTGATTCAATGCTG
+CATGTGGCCCCTGCCGATCCTGTTTTCTGTCATGACGACACTGGCCAGCGTTTAACATAT
+GCGTTTTTCCCAAAACGTTTCGCCCACATGATGGCTACGCTTGACCTGCCGACTAATGAT
+GCTGACGGACGAAAGCGAACGCCCTACTCACTTAAAAGTTCTTTGATTACTCACCTCATT
+GACGGCGGAGCCGATCCTATCCTTGTACGGGAATATGTAGGACACTCACACGGGACGGGT
+GAAAAACGGCTCACTAAGGTACAAAGTAGGTATAAAAAAGCCCAACGAGAGAGGCTTAAG
+ATATTGCTGCCGGATATTGAGGTTCTTCTTTCTGCGGAATCTGTTGTAATAACAGAAAGT
+TAAGGAGTATCCTCTTTGGCCAAAAGAAGTAGTCTCCAAGCGGCTGTTGGTATCCCTCTC
+TCTCCCCCTACCCACTTTCTAATTGTGCGAGGGTTGACCCCTGCAATCTTGGCAGCCTGC
+GAACCAGTTAAGCCTTTTTCCTTGAGCAGTGCCCTGAGTTTTGCCGGTGACGGTGCTGTA
+TTTTCAGCAATTGCCCATTCTGAGTTGTCAGGGTAATTATAAGAGAGCTCACCCGGCTTG
+TCTTTATTGCCCTTTCCTATGTATCTATTTGCCAGGATATCAATTTTACCATTTTCAACT
+TTGTAGTATATTTCCTCCCCCTCTTCGTCGTGTACAAAAATCTGCAAGTCGCCACGTTGG
+AAGATGATGAAATCACTTTTCGGTCTTAATTTATCTTCTACCATATTCGCCTCCTCCCCA
+TTGAGGGAGAGGCGGGTCATAAAGACCCTGCCTCAGCGAAGCTATAATACCGGCCGTTAC
+CAATGATTATATGGTCAAGTACCGGTATCCCAAGTATTTCGCCTGCATCATGCAGCCTTT
+GTGTTATTTGCTCATCCTCTGGACTCGGCAAAATCTGTCCCGATGGGTGGTTGTGAGCAA
+CAATGATTGCCACAGCATTGTCAACAATCGCCGGATAAAATACCTCACGAGGATGCACAA
+GCGTCCTGTTTGCAAGCCCTATTGTGACAATATGCTGACCGTTTACCTGGTGCGCACCAT
+CAAGCGTCAGTACAATAAAATGATCCTGCCGCTCGCTGGCATAGCGGCTCAATAAGTCGT
+ATGCATCTACTGGATTGTTGATTTTGGTTTTCTCGTTCATCGGTAACTCCTTGGTTCCGG
+TATTTCAGCCTTCCCATACGGGCGGCCTTGGTTGATCTCTCAATCAACCTTACTTTTATA
+GTATAGGCCCATTGGGCCTATGTGTCAACTATTTTTATTATAAATTATTTAATTTTTTAG
+ATATAAATAGTATCAGTGTCGTCATCATACCCTATCAATAATTCATGATCATTTTTGACA
+AAACGATGCATATCAATTTCGCAATCTACAATTTTAGAGCCAGAAGAGTGATCAACCCCT
+CATACTTCTAATTATAAATATTGCACCGCTTTCCCGTATTCTGGACCGCCATTGATAGAT
+GTCGTCCAATCGTTATTGATACCGATCTCCTGCTCTATTCGTTGCAGAGTGTCTCTACTA
+TCTATGATCATGCCTTCATTCAATATTCTGGTAATCGTAGATTTGTTGACGCCGATCTTT
+CTTGCAAGATCAGCTCTTGATAATTCTTGTTGTTCCATGTAATCAATGATCTTCTTCTGT
+GCTATCGTCACCGCCAGCATCTCCCCGGAGCTCCTCAAGATAGTCAACAAGTGCAAACTG
+CTGACCAATATTGAGTGACCTGAGCTTTTTTATAATATCCCCGCGGTTAACCCCAAAATA
+TTCAAACTGTGCATCTATCTCGTCTTCCGTATCCGCAAGGACCGCTCCAGGAATAACAGC
+GCCAGGCTCATAAGCTGTTGACAATGCATTATTAAGCATCAGATTCACTTCTCCATCTGA
+AAATAGCTCACGAAGCGTTCGCTTCTCCCTCTTCATGAGTTCCTCGTACCTGTCGGCAAC
+TATAGTGATTGCTCTCGATGCTCCACCATGACGTTTGACAAGAGGATCAAGCTTCTTCTC
+AAGTACCGAATTCCAATAGATCGATGTTTTCCCGCTCATGCTCGTTTCTCCTTTTGCTTT
+ATAAATAGACAGCCCCGCCGAAGCGGGGCATGATTGGTTAAGCCTCTATGATATAATAAT
+CAGGTCTACCAGCTTCGTTGTGAGATAGGTAATATATACCATCTTCCTCTTCGTCAATCC
+ATTCTTGAGCCTGAGCCGCAGAATCAAATGTAATCTCTTCCCATCCTGATTCATCCCTTG
+CCCACTGGATTGGCTGATATCCATAGTAATTTCCGATAACCAAAACTTTACATTCCCCGG
+TATACTCAGGATCTGCTTTAATACTATCAGGATCTCTATGACCCCATGCAATAGATTCCA
+TAATCGGATCATCAGAATTGCTTATCCACTCGCTTACTTGTTCGCTGACAAAGGCCTCGT
+AATCTTTTTTAGTATTTCCAAGCAAATCATCTTCTTCAACTTCCCATAATGAGTATTCAT
+TGATCTGATCTTCATAATAGTAAATTCTACCAGTTTCAGGGTCTTTGTAAAGCGTGGAAG
+AATAGTTATCAAATTGATTAGTATTTTGATGTTCTTCGGCTAAGATTTCCCATCTTTCCC
+GAACTTCAGCCTGATCGATTTCGTCTGTGCTTAACTTCTCAACTCTTATTTCTGTCATTT
+CTTTCTCCTTCGCCTTCCCTTCCGGGTAGCGTTTTGGTTTTGTTAAGGTCTCAATCAACC
+TTACTCTTGCATTATACCTCTATATAGCGGTACAGTCAACAGAAAGTTTCAAAAAAAATG
+TTAATTTTCTTTGTTAATTTATTATGGTATTTTATTGCGAAATGAGGAAATTCAGAAGAT
+TGCCTGTAGGATGTTCACAATAATAGAGACAGCCAGGACAGAGCCACCGGCTTTAAGGGT
+CGTCTGCTGCCGCCGGTTCTGCCTCTCTAAGCCTTCGCAATAGATCAAGAGCTCTTGATA
+GTCCTTCCTCAGCCCGTCCCGCTCGCTCTGCAATGCTGCTACTTTCGCTTTGCGCTCCTC
+CGATTCGCTCTGTAAGCTTTCCAGCCTCTTTTCTGTATCCTGCCACCTCTTTTCGAAGTT
+CTGCGAGCTCTCCCTCGTACGTCTCAACTGCTCGCTCATACTCATCGCTGAGTGCTTGAT
+ACTCTGTATCTCGCTTTTTGCCTCGACTATCGTATTCTGCAGCTCGTCCACTATTGCCTC
+TTCCTGAGCGGTAAGTGCCCAGGAGGAAGCCAGCGGAAAAACACACGCCAAGAGCAAGGA
+TAATGCTAATAATTTTGCGCATCTCAATCCTTCACCTCGATACTGATCTTCGGTCCGTGG
+ATGGAAACAACCGACGGCAGGATCAGCCACACCATGGCCAGCACATTGGTAACCAGGGCC
+ATTTCCATCTGGCCCCGGGTGTAGAAGACTCCGGAGAAGTAGTCGATGATAAACTTGATG
+TTCACCGGGAAGGCAAAAAGGAAACCGATGATTGTCGCCACCTTTCCTTTCTCTCCCAGA
+GCCTTCCACAGCTTTACGATGAGCTTTTTCATGCCGCTACTTCTCCAAGATCGAGAAAGA
+TGCGCTTCGACCGAAGTTCCCCCTCGCTTGCAGTCTTGCTGAATGGAGCCCATGGATCAT
+AGACGGTCATGCCACGGCCGTTACCCAGGGTGAAATGGTAGATGTACTTGCGCGTTTTTC
+ATTCCACCGTCGCCACAAGAGTATTTCTATCTCGTTCGGCTGGCATATATAGTCCGCGTC
+TTTTTTCCCGAGGTAGCGTACATTCAGGCCGAAGAGGCGGAAGATCCCGGCGGGGTCCGC
+CACATACATAAAGGTTCCAGGCGCCTCCGGGTCCTCGGTCAGATAACGACGGTTTTCAGC
+CTCAACCACAGCGTTCACAAACTGCTCTTGTGAAATGACTCGTTTCGTTCTGCCTGCTGC
+TCCCGCAGCAATTGAAGTAGCGTAGCATCCCCACTGCTGCACCCGATCCGGCATCTCAAT
+ACTGTTTTGATAATACATACGTCTTCACCCTCCCAAAACGACGGGGAGTAGTCCCCCGAT
+AATCGAACCACCAAGACCGCACACCATTCCGACAATGACTGTTCGGTACTCAATCTTCTT
+CTCATGGCGTTTCTCAACAGGGCACGTACTTTCCCGGTTGATGAAAAAGTCGGTGAGCTT
+ACTGTTGATCTCTTTGATGTCCCGGCCTTGTTCCGTCACAATGCTTAAGACCATATCGAT
+TTTGTCGTTATCGCCCATTGGCTTAGCTCCTTTTCTCCGGTACCTGTGGCCAGGAAATCT
+CCTGCGGGAAGCCTGGCTGTAGGGGAATGTCCCTGAGAGCCTGCCGGTAGGCTTCCCAGT
+CCGACTTGTCGGTAAGGGGATAGTCGGCCATCATGATGTAGTCACTCTCAGATAACAGCC
+TGTCTCGTTCTAAGCGAACCCGTTCGGAGAGCACCTCCTCGGGAACCGTCCAGCCCGTTT
+CGTTCCACACGGCCTGCGGGTCCGAAGGCTCTATATCGGTCATACTCTCATCGGGCTTTC
+GGCCGAGGGACAGGTGTACCGCCGCTCCTGTGGCCTTGTTCCAGTAGGGAACACCGGTAT
+AGTCAGGGGTAAGCACATACCTACCGCCTTCCCAGGTGATAGCCTCATGTTCTCCGGCCT
+CAGGCACAAGCCCGGCTTCTGTTGCGGCTGCTATCGAAAGCCGATTTCCTTCCTCATCGA
+AGAAGCGGATATCATCGCCTTTGTTTCCGGTAAACCCTGCAGGAACCTCCTTGATGGTTT
+TTTCCGGAAACAGCTCTGCAAGCTTTGCCGTCTCATCGGCACTTTGCACCACAGCGGTGA
+TCATTGAGCCATCTACTACGGCGTAGGTTTTCATGCAATTCTCCTCCATATCCTCATGAG
+GCGGTTACGGTCGGATGTTCTTGCCCCAATGCGAGGAGTACCGTTCGTACCATCACTTTT
+GGGGCCCGATGTTTTGCCTTGAATTGTTGTATCAACATTGGCAGCCGCATTGATATCCTC
+AGCTTTTCCTGGTACGTCTTCAGTCGTGTATCCATAGACAAAAATTTTAGGATTACTTCC
+GCTTGTATTAGTTCCTACACCATTAAGTGTGATAAAGCCTTGGAGATTATCGGGCATTAG
+CCCATTTGTTCGGCCAGAACCGTTGTAACCTTCGGTATGAAAGTCTATGCCTTCACCGTC
+CCACAGTTTCTCCCAGGTCCCTCCAAACAGGTAAGCAGGGGACTCGTTAGTCGGAAAGGC
+AACCGATAGGTCGTTACTTGCGCTTGAGGCGTATTGTGTGTACTGGGAGCCTACAGGGTG
+GGAATTTTGTTCTACATCGAGATTCCCTTTGTGGTAAATATCATATCCTTTGTAACTCAG
+GTGCTCGTTATTGACGATAAAATCCTGTCCGCCTAACTCAACGATAAGTTCAAGTGAAGC
+AACTATCTTTCTGGTGGTTAATTTTTCACAGTAAAACCCACCGTTGCCAAATAACGACAA
+TCCATCGGGGTTAGCTTCTGTAACATAAAGCTGTACATAACCAACATCATTATCCGCGGG
+GAATTTCAGAACATCTCTAATCCACATGGTATTTGTATGTATTTCGCCGTCCCAGACAAA
+GTTTGCGAGATCTATATATCCGTACACTCTCTTGGACCCAAAACGTGTAAATGTAATCAA
+TCTTTGCGGCTCAATTGAAAGAGAAGGTTCATCCGGCATGCCGGCAGGATAGGAAGTGAA
+AGCAGAGCGGGCCTTACCGAAGATAACCTGTTCTCCGGCAGCCTTGATACCATCGGCCAC
+CAGAGACAGAAGAGGCGCTTCCGTCTCATCGAAGAAATGCACACCCTGTCGTCCGGCATT
+CGATCCCACCCGAAGGATCGCCTTACCGGTGGTACTGTCCTGGATCTCTAAGGCCGCATC
+ATCCTGGAGCACATACTGACCATCAACAAGGCGCATCTCGCCCCTGATCTCGATCGAATC
+CCCGTCGGCCGTCCAGAAACCGAAAATGGTAGAGGCAAGGCTTTTTGCTCTGTCCGAAGG
+GTCAGAAAGCCCCCCAAGGTATCCCATGGCAACCCGAGGCTCGGCCCCGGCAGCCCCCCA
+CACCTCGATACGGTTGTCTCCGGGATCAAGCTCTATCCTCGCTTTTCCCACCTCATCCGA
+GCGTATGGCGGTGGATGAAAGCAGCCAGTTGCCGACCCGTCCCGCATTGGCCCTGATCCC
+CGAAGCATCGAGGATCGTATCCCCCGCCTTGATGGCCCCGCCCGAGAGGGTCAGGTTTCC
+GTCAATGGTCAGGTCATGGAGTATGCCGTACAGGTCCCCACGAAGCCACACGTTGTTAAA
+AAAGGCATCCCCGTCCCCTCCAATCTTCCAGCCCGAAACACCACCCTGCTTGTAGTCGTC
+ACTTTCAATACCGTTGCCTGCGGTAATCTTTCCCCGAAGCTCTGAGTCACCGGAGAGAAA
+CAGGTCTCCATGAATCTGGAGGGTTCCGCCGTCCCACTTGATGTAGTTATTCCCGTCCCC
+GAGAAAGGACCAGGTACCATCATTATTAATGACTGCTGTCCACTCCTCTCCATCAAAGAA
+GCCCAGAGCGCTTGCCGTCATATAGAGCCCTGCCACCGTGGTGTCGATATCCACCAGCTG
+GTTGCCGTTGACCGGCTGTATGATGCTTCCGTCCGACTCAAGGCCCACATCCACCCGCTC
+GGCCACACTCTTCGCCTCATCCGGATTGGTCGGCACCACAATCTGCCCTGCAACAACCGT
+CCCGAGGATGGTTTCAAGCGGGGCCACACTTACGCCCTCGTATTCCCATATCTCCGTTTC
+AACATCCCAGCTTCGGGAAGTGATACGAACGGTATTTGATATGCCGAGGGAAAGGGAGCT
+CACCGTAACGTAGCTTCCAAGGCTCTTTTCGGTAAGACTTTTAAACGTGTAATGAAGTCT
+TCCTGTGGTAATCGAGGAATACAAAGCGTTTGCAAGCTCGGTTGCCGCGTCATCGTCATA
+CAGGTAGTTGGCTGAATACTTTTTCAGTTTGCCCGTGCTCTCCGGCCTTGAGAATACGGA
+GGTTTTCTTTTGATCCTTGTAAACAATATCGAGATCACCGGTTACCTTGATCTCATTGAT
+AAGCTGGCCGTCTGCAAGGTTAAATTGGAATTCCGAATAGGTTGTTGCATGGTTTTCCAT
+AACAAGGTCATAGACACCGAACAACTGTCCCATCCCTAAAATATCTATCCATGTGCTGTG
+TCCAGGCTCCGGACCGAAAGAAACCCACGTATACCCATGGAGTTCCAGTTTTTGGTTTTC
+AGCTCCGACTATCTCATAATTTGAACTACCAATATCGAGATTGTAGTCACAGCGATAGGG
+ACCATCTGCCGGCCAAAGCGCCGGACCTTCGGCATCCTGGCCGCTATTTGATGCTATCGA
+TTCCCATTTATCAACCTTCTCATAGTAGAGGGTAAGCCCGGTAAGCTTCTCATACTGATT
+GAAGGATACCTGTACCTGCTCAGCCTCAGAATCCTTTCTCTCAACCTCCAGAGATCCTAT
+GATATTCTGTTCACTGAAAGCCCCGTCCGCTTCGACAGAAGAGGATGCCCAGTCGTAGAT
+GTCGATCACCCCGTCGGGGAATACATTGTAGAGATGATGGTAATCCCAGAGGATTGCCTC
+AAGATCGTCTGCATAGCTGTCGCCGGAAGCAAAGGCAAGCTTCGGGATAACTTTGTTTAT
+CGTTTCCCGTATTCCGATGTACTGGGAAGGGTAGCCGGCCGATGCCAAGAGTATGTGAAC
+AATAGAATGGTCGGGATCATCAGGGTCACAGATCTTCCCGTCCGATATCATCACGTCGTC
+CTGCAGGGTGGATTCAAGCAGATACCCATAATCATAGATCTCGAAGTCGATCGTCCGGTC
+GTTATCGGTGACCTTGTACTTGGTCACCGGCCGGGAGAAGCCGCGAAACCAGATCACCCC
+GTCACGATAGATTTCACACGGAATATCTCCGGTACACTGCAAAAGCCGCATTGCAAGGGC
+CGGAGTGAGAGTAGCCGAGAACGTGGCCGAACCTAAAGCAGGTTTGAAATCATCGTCATG
+AAGCTTCTCGGTAAGCTTCAGAGAGTCTCTGACAAAGTTATCTCCACCGTAGCCGGTGAT
+ATCGACCCAGCCGTCCCCGTAATCAATGAGAATTTGCCAGCTCATCGTCAGGCTCCCCAC
+TTCTCGACACGGCCGGATGACTGGCCGCGCTTTACCGTCTGGACGATGTACTTTGCAAAG
+GCCTCCGATCCTCCGGGACCGTACACGCTGTCCACATGCACCTGTACCGTCGTCCCGCCG
+CTTTTGAGGTTCCGGATGTCAAAGGGGATGACCGTCTCAGCTTTGTTTTTATCTCCGAGC
+CGGTACAATCCTCCGGACTCTCCCTGCGCCGGCACAATACCGCCGTCTGCAAGGCCCGTG
+TACTGCTGCTGATTGATCAGCGCCACCTTGCGGGCGGTCAGCCCTGCAATGACGGCGGCC
+ATGGCCGAGGCCGCAATCGGGTTCATGGATGCATAGGCATTGATAACCGCCTGTGCTCCC
+GATGCTATGGTTTCACTCTTCCTGTTCTTCTTGTCCCGTTCGAACTGCTTCCGCGCAAGC
+TTGTCCTCTTTCTCCGTCTTCTCGGCTTCAAGGTCTTCGTATGTTTCCCCGGCCGCCTTC
+TTAAACTCGATCTGGTTGTCGAGGTTGGAAATTTCCTTCTCGGCCGCAGCATCCGAGAGA
+TCCCCCTGGAGGCTGTAGATATCAGAAAGCATGCCGTTTAGCTGGTTGTAGATGGCCATA
+GCCTCCTGGGCCCTTGAGGCATACAGCTGGATGATCTGCTCGGTTTTCCACTTCTCAACA
+TCCACCTCATCCACACCGGCCTGTTTGGCCGCATCCACCTGCAGGCGTATCTCATCAAGG
+CGGGCCTGCAGCTGGCTCTTTCCAAAGCTCTCCCGTATCTCGGCAAGACGGGCCTCCTCG
+TCCCGTTCCATCTGCTGCCGGTCAAGGGAGGCTTCATTTAGAATGTCTTTATACTCTTGT
+TCCCACTCAGAAAGCCCTTCAAGCGGCTGTGACCAGTCGGTCTTGCCTTCCGAAAGCTTT
+CGGTTTCTCTCATCGATAAGATCGTTAAGGAGCCTCTGGACCTCAGCCATATCCTGACCG
+GCGGCCACCCCGGCATTACGAACGGCAGCCCACTTGTCGATCTCATCCTGCAGGAGTTTC
+AGCTGCTTCTCGTTCGGCTCCATGGCATCGAGCCGGCGCTTTCTGTACAGCTCAAGGGCT
+TGTACATTGTTCTTTGCAGCCTCGGCGGCAATTCGGTTTTGTTCGGTTGAGATGCTCGCA
+AGTTCCTGTTCAGCCTGTTTCTGCTGACCTAATGCCCTGATCGTTGCAATGATCTCGGCG
+ATCTTCGCTTCCTGGTTTGCAATGATCGTACTGGAAGCCTCATTCTCCTGGCCGTAGTAC
+CGGTCCTGCAGATCCATGAGCTTTTCCTGTTCAAGGGCAAGCGCCTGCTGAGCCTGCAGG
+AGTGCTTTTGACCCCTTGGTATCGACCGTTCCTCCTGCCTTCTCATAGGCATCGAGGACC
+TCTTTGATATCAAGAAGACTGTTGCGGGCGTTTGCCGCCTCGGTGACGATATCGGTCAGC
+CATCTGACAAAGGGCTCCATACCGTCGGATATCGATCGGCCCAGACTCTCCTTGTAATCA
+CCGACGGCATTACTTAACTGGGTAACCGCAGCAACACCGTTTTGAGCTTTTGCCTTGGCA
+AGTTCGAAGCCGTCAGCCATGGCCTTCTGAACGATTGCATGCTTCTCTCCATCGCCGGTG
+GCGGTCCTCAACTGCGGGATGTATCGCTGGAGCATGGTGTAATCGTCATTCATCGCCAGA
+GCAACAGCCTTCATGGATGTTTGCAGGTTGATCCCGAAGGCGTTTGCAAGCCCGATCGCT
+CCCTTCGATGCTTCTTCAAGCTTATCGCTTGCAACTCCCTGGCTTTTTGCAAGCTGCATA
+ATACTCAGGATAGCCTCATCACCGTAGGTCGTGACACTTTGGATCCCCGAAGCTATCTCC
+TTGAGGCCGGGTAACAGATCATCGGCAGACTCTCCGGTCGCCCTGATTGCCGCGGCAAGA
+GCATCCTCGGCTTCTATCTGTACGCCGTACAGCTTGACCGATTCCTTCATCTGCTGCATC
+ACCGCCTTCACTGATACGGCCGCAGCAGCATAAGCGCCGAAACTCTTTGCAGCCCCCACT
+GCAAGGTTTTTGAGCTGGCCTTCCAGTGAGTCGGTTTGCTTCTCTGCATCGCGCATGGCC
+TTTACCGCGGCCCGTGTCTCTGCGCGAAGAAGTATTTTCAGCTCGTCAATTACTGTTGAT
+CCCATACCCGTTCCTATAGGCACCTTCCGCCGTTTCTATGATCTCGACGATGAAAGCCGG
+TAATTCCGCCCATCCCCCTGAGAAGGGAAGAGCGCCGAAAAGCTTATAGCGGTACCACAG
+ACCGAAGGCACTCCAAAACCAGTCATCAAGGTACTCGTTCACTTCACTTCGCAGGATCGT
+TACCAGCCTTCCGTCGACCACCACGCCGAGCCTTCCGTCTCCAATCTCCCGGCGCACCTT
+CTGCGAGCTCTGGCCCTTCATCCACAGCCCGATTCCAAGAGCTATTTTTTTTTATCAACG
+GAAGTCAGGCTCTTGAGCTCGTGCATGAGCTCACTTGCAAGTGCAACAAGGGGTAGATCG
+GAGAACAGCTGCTCTCCGCTGTCCACTTCAATACAGTTTCCCTCGACGCACACGACAAGA
+TTATCAATACCGGTAATCATCTTCTTTACCCGAAGTACCCACGCTATTGTCAGATAGTCG
+GCATACCACCCTTCGTACGCTGCCTCATTATCCTTATCCGGCACCGGCCCGGCTTCCCGA
+CGTGCCCGGCCGTAGATCTTCTCTTCCTCTTCAAAGGTGAGAAACCGGTAATGCACCGTT
+ATTCTCTCATCCTTCTTCCGTCCCTTATTGCCCCAGGAGGGGACATACACCCCGTCCCGG
+GCTATGGTGATAGGTTTCGCCATCTTTATGCCGCCTCTCTTATGTACAGGGTGGGATCAG
+GGTCTCCCGGTGCTATGCGAAAGCTACTTGAAAAGTTCTGTGCATCTTCTCCCGAGGCCC
+CAAGGCTGGAAGAAAGAATGATGACCTTTGCCCAGATAAAGGCTTCCTTTTCCCCTTTAT
+CCGTTGACTTCTGGATCACGCCCTTGATGTAGATCGGCGAGCCGTCCACATCGTTTTTGA
+TGATGGTGCCACTTGCCGACTGCCTTATAACCTTGATGAAGTTGTTGATGACGTAGCCGG
+CTGCATCGGTAACATCCAGGGTAGTAAGCCCTTCAAGGCCGCCTGTCATATCCGTTTTCC
+CTGATCGGTAGCGTTTGACCTTGTCACTCAAGGTGGTCACATCGATCTCATTTTTATTGA
+AATCAATCGAAAAGCTCTGGATATCAGCCTTCTCACTTTCCTCTAAAAAGGCACACGCAT
+CTCCTGACTCAGGCACAAGAGAACCGTCGTCCCAGAACAGCTCGCCATTTTCAAGGACCG
+AGGCAAAAGCGCTTGTCTCTCCCACTGCCGTGATACTCCACCAGCCGGCGCCTTCTCCGC
+TTGCCACTTCTCCTCCTACCAGTTCATCAAGACTCTTTGCCCCGTCGCCTGCAACCTCAG
+AGTCAAGTTTGACGGTGACAAGCTTCCCGTCACTTCCCACAAGTCTGTCTATTTCCATAT
+CATCCTTCTCCTTCTTCCGTGTAATCTGCCCTAATCTCCACCATCCAGCGGTAGAGCCCA
+TTGGGGGCAATGCCGAGAGACGCATCTCCTGTGACAACCACCGAGGAGAACTTCAAGGCC
+CCCGATACCCCGCGAATCCTTCGAACCGCATCTTTGACAAAGGCCCGAAGATCAGAGCTT
+CTCTCATCCTTTGCATAGATATCGATCTGTATGGCAGCTGATCCCCCGTAGTATGAGAGA
+TACACCTTTTCATTCGTGTCGCTTACAAGGCTCACCACCAGGTACGGTATCTTTAACAAA
+ACCCGGCTCTCGGTGTCATAGATCGCTTTGATCCTCTCCATGAGGGCCGTGTCGGCTCGA
+AGCTGCTCTGTGATCTCAACTTCCGGTGCTCTGCTCATCAAGCGCCTTCCTCAATCCTTC
+TTTCCAGATCTTCCGTATCTCCCTCATGGCCTTGTTCTTCCCGGCCCGCATGAAGGAATG
+CGGCTTCATACGGCCACGGTTCTCACCGGTCTTTGTCGCCCGTTCCTCTGTTCCATACTC
+AACAATGAAGGCATGGGGAGCATTGTTCTTCACCGCTCCGGTATGACCCTTCACGTCATA
+ACTCATGCCGGCTCTTAGGTTCCCGGTCCTGTCCGTCACCCGTTTATCTAAAAACTCGAG
+GGCATACTCATAGGCCTTCTCGGTCAACGGCCCGATCGTGTTCTCGGCCGCCGAGATGGT
+AAGGCCTGCATACGAGCGCACGGTCTTCCGGCGTCTGACCGTACTTCTCTGGCCACTGCT
+GCTCCTTTTCGCCCAGCTCATACCGAAACCTCACGGTAGGCGTCCCACACATTACGAACC
+TGAAAAGGCAGGTCCATGACCCCCACATACATGGTTTGATACTCCCCACTTAATGCATTC
+CCCTTATCCAGCCAGCTGATACCCTGGGAACCAAGCCAGTAGCCCACCAGCTGTATCACC
+GACTCCTCAAGGTCCTCAGGGATAGATCCTTCCTCATACCCAGCACGGTAGGACACCTTG
+ATATTGCGAAAGCCGCGTACCCAGCATGAGCGGCGAAACAGCCTGCCGGTCTCATCATCC
+CGTGTGTACTCAGTAAGCTCAGTACCGGTGTCAAAGACTCCATAGGTATCAAACCACACT
+CCCGTGACACTCAGGATCGGATATTGCGGTAATTGCAACGTCCGGCTGCCGGTTCCCGAT
+AAAATGACAACATGGTCGTCTGCTGAAAGCTTTCTGCTTGTGTAGGTTTCTGCCCGCCGG
+GATGCCACGGCGATAAGGCTTTCTGCCTCATTCTCCTGGCTCTCCTCAAGATCAAGCCGC
+TTCTTCACCGCCTCCCATGTTGTCAGGTTATTCATCTCTTACGCCTGGCCCTTTGCAGCT
+GCCTCGCTGATCGCAGCTTTCAGCCTGTCCTCTCCCCACCGTTCAAGGGTGGACGGAGCT
+CCCACCTTCAGCTGGGCGGCAAGGTCGACAAGACCACTCTTGTCAAGCTCATCAAGCTTC
+ACCGTCTCAATAGTTTCCTCGTTTGTTTCAACACCCTTTTCGTCAAGGAATTTCGCATGA
+CCTGCACGTACCAGGTCCTTTGCAACGTCATCCGGTGCCGAAACCTTCCCCGGTATGTAC
+GAGAAATCCTTCCCGACAACCGAAACCAATACTTCAATGTCTTTCAAATCTTCTCTCCTT
+TTCCTACCTTGCAAGCCGGATGCCTTCCGGCTTGCAAAAGGGGCTCTATGCCGCCGCCAT
+TGCAAGGTGTTTGATCGGATGCGTACCCGCATCAACCAACAGCGAACCGTGGCGGAAGAA
+CGCGATAAACCCAACCTGGGCATACTCGGCGTACCGCTCGGTCAAACGCAGAATGATGCC
+GCCTGTTACATCCCGAATCTTGAAGGCCGACATATCTCCGAACAGCACCGCTTTCTCTCC
+GGCTTCCATCCCCGCCATGTTCTGGTTGATGATGTACTTGTACCCGTTGATCGTATCGGG
+TTCTCTAAGCGCAACACCGGGAAGCCACAGGGGCCTGCCCTGGCTGTCCTTGAGTTTCTT
+GAAAGCCTTGAGCGTACCGTCGTTGAACATAAGTTCTGCATTCAACCGGTAGGAAGGATC
+GATCGAGTGAATGAGATCTATGACCTCATCGTAGGAAAGAGCTCCCGCCGCTGCTGCGGT
+CTTTCCGAGTACCGAGCCTGTGACAATGCCCTGAGGCTGCTCGCTTCCGGTTCCGGTGGT
+AAAGTAGGCGGATGTGGCCCTGCCGATACGCTCGGCAATCTTGGCCCGCAGGTACGCCTC
+GATATCAACACCGGAGTCCTGCAACAGCTGATAGCTCACCCGGATGATTTTCGATGAGAA
+CATGTAGGCATACAGGTTTTTCGATCCGAATGTCAGATCTTTCTCGCCAGCGGCCGTGTT
+CTCCGAGAGAATTTCCCCCACGTTCTCGGTATCGTTTCCCGTCGGAATCTGTATGTCACG
+GCCGTTGGTGGTGGTGATCACCTCGGCCCGGCTCTGACGGGGACCGTTGAACTGCTTCAT
+TGCATCCACAATCCCCGAGGCCATTTCATCGGGCACCGTATACCCTCCGGTGCTGTCGGT
+TCCCACACTCAAAGCACGGCCTTCAACCTCTTTGTGGTGCTCCATGAGAATGGAGCGGTG
+CTCAGCACTCACCCCGGAAAGGCCGTTACGAAGGTAGGAGTCAAAGGCAGATCGATAGGT
+ATCGTGTTCCTCTTCCTGCTGCCGTCCTTCATCCTTCTTACGGGCATCCTCTTCGAGCAT
+CCGCTCTTCAATGGCAAGCTCCCGTTCGGCTGCCTCAATGTCGCCGGTAAGCTTTTCAAC
+CCCGTCAAGCCGCTCGTTGTACGAGCGAAGCTCTTCTGAGGTGAGCTTTCCGTCTTCGTT
+CGCCGCTTCTTTTTCTTCGCGGTATTTCCTCGTCTCTTCCCACAGGGTTTTGCGTTTCTT
+CCTCATCTCAACAATCTTGTCGAATCTCTGTGCCATAATTCCTTATCTCCTTACATGAGC
+ATGCCGAGCATCTTCTCGCGCTCTGTATAGTTGCAATCAGCCTCAGACCGCTTGCGCTCT
+TCCGGGTGGCTCGTAGCCGGCGCGGTTAGCTCTTCGATCTTGCTGCCGATATGTTCAAGT
+TTCTGTCGCTCCTCTTCGCTGATATCCCCTGATACCGACCTCAAGGTCAGTTCCTGTAGC
+TCCTCCGGATCGAAATCAAGTCCCATTGACCTAAGGTCAACGGAGGTCTGCGGATAGGCC
+GGGAAGGTCACCGGTGATACTTCAATCAGCTGCACTTCCACCAGCTCCCGGACCAGCCGG
+TTGTTCTCGTCCTTGGTCCACTTGTCCCGTATGGTGCGGAACCTAAAGGACATCTGGTCC
+ACATCCCCACGCTCAACCGAAAGCATGAAGTCCCGTGCCCACTGGGTATCGGGAGGAGAT
+GCCTCAAAGGAAAGCCCGTCCGAGTCCTCGATAATGGACAGGGTCCCGGCCTTCCGTGAG
+CCCAGGACATAGTTGTTGTCATGGTTCCACAGGGCTTTCACGTTGCTCTCACTCAAGGTC
+TTGGTAAAAGCTCCGGGATTGATCTTCTCCCGAAAGCCCCCGAGGTCCTCCGAAAGCTGG
+TTGTAGACCGCAGGACGTCCTACGATCTTCCGACTCTCTTCTCCTTCCTGCCGGCTTCTC
+AGCTCAACGGGAAAGGTCAATACGTCATGCTTTATCATCCCTCATCTCCTAATGATCTGA
+TTTCGGCTTCAAGCCTCCGGGCCTCCCAATCCTCAAAGCCTCCTGAGTCAAACAGCCGTA
+TGGAGCGCTCCGTATAGCCTTCAGCATCAAAGCAAAGCCCTGCACGCCGTAATGAAGGCT
+CTAAGGCAGAGAGCTGTTCGACGAAGCTTTTTCCCTCATCCGCATAAAAGGCCCGTACCG
+CTTCCGCATCACCTACCACTTGCATTTCGCTTTTCTTCATCCAGGCCGAAAGGCTTCGCG
+CCTCACGCCGTGCAATCCGGCTCACTGTGGATCGCAGATACTCTAGGGCAATCTCCCTGG
+CCGCTTTCTGTCCTCCTCGCTCCTGACTTCCCGCAGAAGGGGCGGAGAGCGGAACAACGT
+CCCCTGCCTCGGTGATCATGGCGTTGTTCATCTGCACGACAAACGAGTCGCCGTATTCGG
+ATTCGATCGGATTCTTGTTCTCCATCTGCCGCCACTCGTTCGGTGTGATAATGCCGTTGC
+GCCTCTCTATCTCCAAAGCCTCGGCCCTGCTTTTCTTATCTCCACGAAGCAGGGAGTCAA
+AGTTGAACTCCACAAACACCTCAGGCTCTCCGGCGAAAAGCTTGTAGTTCATCTCCTGCT
+CAAAGCGCACAAGCCAGGGGCGAAGCGAGTGGACCAGAAAGGAAATGTTCAGGTGTTCGA
+TGTTCGAGAAGGTTGCATGCTCAAGGTCGTTGATGAAGTGGGCGGGAACTCGCAGGATTC
+CGGCGATTTCGCTTCGGGTGAACTTTCTCGCCTCGATCGCCTGTGCCTCTTCAGGGCTTA
+CCGAGGTCTTCTCCCACTTGATCCCTTCCTCAAGTACTGCGGTGCGGTGTGCATTCGAAA
+GCCCTCCATAGGCCATCTGCCATGCAGTTTTTAATCTGGTCTTTGCTTCCGGTGTGAGCT
+TTGACGGGTGACTCAAGAAGCCCGAAGGATGGGCACCGTTTGAGAAAAAGGTCCCTTCAT
+ACCGGTCAAGAGCTGCTGCATATCCCACCGTTTCTTTTGAGTAGTCAAGCAGTCCCCGGC
+CTTTGATGCCGTCCCCAAGGGCCGAGATGTGCAGGACCCGGTACGAAGGAAGGCCGATGC
+GCTGGTTTCCAATTGTGGTCACATACACGATTGACTGCCGCTCGGTGTAAACGACCGTGG
+TCTGTTCAGGGGCAAGGGGCCAGAGTGCAACAGGATACCCGTCCCGGTCAAACTCGATTT
+CCGCATAGTGGTTTCCCCGCATGACAAGCTGCTTCATGGCAAGCTCGCGGTAGTTGATCC
+CACTCATAAAGGGATTCGGCCGTACCTTGAGTATCCGGTAAGCCGGGTGATCTGTTGCCC
+GCATCTTCCCACCGTTTCCCGTCCTCCGGTAGGTCTCAAGGGAAAGGGAGCCCACCGATT
+CAGAGAGCACCCGCACACAGGCAAGCACCGAAGCAACGCCCATGGCGCTCTTCTCGTTGA
+CCGCCACGCCCGTGCTGGTCGGCTCCCCCTCAAAGTAGGAAACAACCTCAGGGGAGGATA
+AGGGAATTTCCGGATTCTCAAGGCTTCCCCGCATCTTGGCTATTGCCTTTAGTCCTCCGA
+TTGCACCGCGAAGGTCAGAGAACAAGCTCATAGGACAAGGACCTCCTGGCTGTCGTATAC
+CGATCCGTCCGATCCGTTTTCCACCACCTGGTGAAGCGCCATGATGGCAGCCACGATCCC
+GTCGATCCTCTTGCCGTAGGAATCACGCTTCGGCTTCATGGGCATGATGTTTCCCTGCCG
+GTCGTCTTTGAGCTCCACATTGCTCATCATCCAGGAGGCAACCGGGTTGTCCCCGTGAGC
+GATCTTCCCGTCGATCACCATCCGCTCAAACAGCTGAGTAGGAACCGTCATCCCCGAATA
+CCGTTGAGGATATTTGACAAGCTCGATCTCTCCCTCAAGTTCCCGCTCAAACTCTCCGGC
+ATGCCACGGATCGTATCCGATCGACCGGCCGCCGAAGGTGTTCGCATCCTGCCGCAAGAC
+CTCTAACACGATCTCGTAGTTGACCGTCTGTCCCGGTGTTGCGATCATCCACCCCTCATC
+GATCCACGACCGGTAGTCAACCTGGTCACGGTGACAGCGATCAAGTAATCCCTCTTCCGG
+TATGAAAAACCGCCATAACAGCGGATACCGTCCGTCCTTCTCACCGAATGCCCAACACAG
+GGCCGTGATATCTGTTGTCATCGACAGATCAAGCCCGCCACGGGCCCCTCGTCCGACAAG
+CTCTTCTTCGGCAACAGGAGCGCTTCCCCGCATCCATACCGAATGGTCCATCCACCGGGT
+GGGAGAGGACAGCCATATGTTGAAGTTCTTGGTCAAAACATCGCTGGCTTTCCGGGGCGA
+TCCCTTGGCCTCTGCAATACGCTTTTCAAGGTAGTCGCGGTAAAAGCTCACCCCCATGTT
+CGGGTTGCTTTTGATCCACACCGCAGGATCTTCCCACCTGTCCCCCTCATCCAGGCTGTA
+GATGATCCCCCAGATGTGTTCCGGAACCGGCTCGATACTTCCTTCAAGGATCTTTGTAAC
+GAGCGTGCGCTCTTCCTGATAGGCAGGCCCGTTGATGTTCGTCCCGGCCGTGGTAATGAT
+GATCGTTAAGGGCTGACGCCTGGCTCCCATGCCCGACTCATACACGTTGATCAGCTCATT
+GGTCGCGTGGGCATGGTACTCATCCACTAAGATCGCGTGAGGGTTCCATGAGTCCTGACT
+CTTGTGATCTCTTGAGACCGGAGTCATGAAGGCCGCAGGATCATTGATCTTTACAAGGCG
+TTTTGAGGATCGGTACTCCTTGGTAAGCCGCGATAGCGTAGGATTCCGAAGGTTCTGCCG
+TACCGCCTCGTCATAGCCTTTCTTCGCCTGGTTCCGGTCCACCGCCAGAAAGAACTCTTC
+GGCCCCGATCTCTTTATCGAGGTGGAAGCAGGCGTTCATCATTGCAGCCCCTTCGACCGT
+CTTCCCGTTCTTCCTTGCTACCTCCCGGTATGCCTTTCGAAACCTCCTCAGGCCCGTGGC
+CGTACTTTTCCATCCGAAGATGTTCGCCCAGGCAAACTGTTGCCAGGGTTCAAGTACGAT
+CTTCCCGCTGAAGCCTTGCGTGTGCTCAAGCTCCTGGGCAAAGCTGATATACCTGTTGGC
+ACATTTCTCATCAAAGTAGTAGGGGAACTCCGGAGTATTCTGCCGTAAGAGGTCCTTCTC
+CCACCTGGCCACGGCAAGCTTCACCCACCTGCAGGTAACGATCTTCCCGCTTGCAACATC
+CTGGGCATACTGGCGGTAGGTAAAAAGGCTACTCATCAAAAGCCCCACAAGTACGAGTCG
+TTTCCACATCATCCGGCCCCTTCCAGAAGGCACTCCATGGGGTCCTTCGCTTCAGGTGTG
+TCGATTGCATTTACGCGGGAGCGGGTTGCAGGCGAGAGCCCGAACTCTGCGGATATGGTT
+TTGACCATGGACAACGCCTGCCGCATGGCCGTGTACTCAGGCATGGTTTGAGAATTCTTA
+CCACTCATGTACTGGGCTAAACTGCGCTTTTTGGTTTTCCCGGACTCCTCATCTTTGTAG
+TGGTAGACCGCGTACTGTGCTTCCCGGTACTGTCCGTATGCCTCGCATAAGGCTTCCAGC
+ATCGTGAGGTCCGCTTCCGAGAGTACACGGGTCTGTGCAAGCACCTGGGCAAGCTCCTTC
+CACTTGTTCTTTGCAAAATTGTTGAGGTGGCTTGGCGCCTTGGGCGCCTCATCAAGTGCC
+TTGACCTCCGGCTCCTTCTCGTTGGCCCGGTCCTCCCGAAAGGTGCCATGGGTTAGCTTT
+AAAATAGTCGGCTTTTTGTTGTGTCCGCCGCGGCTCATGGCCTATACCCCCTTTGCCTTT
+GCTGACAGAGTGTTTTCTTGTATGGGCGCGTGGTTTGGGCATTTTTCCCCCAGAGATTTA
+CACCCCCCCTCCGTCACTCGGGCTGTGCTCTGATTGATGATAGGAGAGACAGGTCGGGGT
+TCCTTCCTCTTTCTGTTGCCAAACCCGTTGTCAAACTTCGCGGTCTTTCTGCTGTGTTCT
+CCATGGAGCCGGGGGATGAGCTGGTACTTTCGGTGATCTGGTTCAATAGCCGGGTCATAG
+GCGGGATTGTGGTCCACATCGTACTTCGGCCACAGTCGCTTTGGGATGCCCCAGGCCTGT
+AAGACCTCGATGCGTATCTTACGCCAGGTTGCTCCATACCCGCGCTGTGTTGATGTCTTC
+CGTCTATCCTGCCTTCCCATAGTCTCTCGTCCTCTCCTCTGTCAAAGCCAAAGGGCACAA
+AAAAAGGCGGCGAAGTAGCTCACGAAAGACACCTGTTACAGTGTTTAACGTAAGGTACTT
+CGCCGCCTGATTGCTTCTTGCACCATTAGAGCGACCGGAATCCGTCCGGAACGGCCAAGG
+TAAGCATCCTTACCTCGGGTTATCTGACAAGAAAAATCCTATCACGGAAAAATTTTTTTA
+TCAAGTTAAAATGTAAAAAATATATTAAACTTTTCTTAATCTATTCAAAACGTCATGATA
+ATATTCACGCTCCCAGTTTTCCCAATCATAGAAGTATTGATCAATTCCACCAATAGCATC
+TACACGTATATGATCTCTTTCATAACGTCCACCACCAAGCATTGCATATGCGGGGTGTGT
+CGGCAAATCGTGTTTCTTCAGATATGCGAATATCTCCCATGTTTTCCATAATGAAAGCGG
+TGCTGCCGTTTTTTTTGAAGTAATCCCATGAACAAAATACCGTATTTTTCTGGTGTTAGA
+TTCTTGCATCCTTATCCCAGTTATGCGTCGCCCAAATTCTTCAAATAAATAATCTCCTTT
+TTCTTTAAAAGGCTTCGGACTATACATATTATCTGGCGTGTATTCAATCTCATATTCGTA
+ATATCTAATGCTAAAACGTTTTAAGAATGCATCCCTAACCGGTAGGCAATCAGGATTAAA
+GAATGGCTTTTCTACAATCCAGATGAACGGTACATCTATGCCGGCACATACGCACAGATG
+TGCCAGAACAACTGAATCTTTACCCCACGACACAGAAACGTAACAGACTTCTTTAGCAAT
+TCCTTGAATATCAATGATTGCCTGATCTATTTTACTTTGTTTTAAATCAGCTGCCCGTAT
+ACCGTCCGCTTCCTCTAATTCTTTCCACAGCTTCAAATCATGCGATGTATTCCTTTCGCT
+TTTAATCAACATGTAAATACCCTTTTTCGTCTTCCCTGATCGGCACGACTACAGATAAAT
+CATTTACATTGCGGGTAATTGTAGATTTGTTCACGGAAAAGACTCGTGCAAGATCAGATC
+GTCTCATAGGCTTTTGTTTTAATAATTCTTCAATCTTCCGACAGCGTATATATTTTGTTT
+CAAACATCGAATATTTGCCACGATCAGACTGTTTTAATTCCCTAAGAAAATCTAACATGG
+TATTGCAATCTCCATAAATGTATCAGGATGCCAATATGGTGGGAATGCTCCTCCATACGA
+ATGGCGGAAACCATACCAGTCTTTAACGGCTTCAATCGGCATTGTTTTCATCAGAACTTT
+TTTACCTTGGTGCATTGCAAAGATAGAATTATCTTCCTCTTGTTCTTCATACTCCCATCC
+TCCGATAATTCCATAACCGACATTTCTTAAATGACCAAGCGAAGGAATTTTTTTCAACAA
+CTTATTGATTTCTTTCCTATCGCCGCGAACGAACCAGCATATTTTATCTATAAGCCGAAT
+ACGGAGCGGAACAAATCGTGATTTATATGGCCCTGACGATGTTAAGAGTTTTTTCCGATG
+TAATGGATGCAGCATAAGAGCGGACAAATCTGTGTCAAATCGCTTTGATTGATGATCGCT
+CCATTCTGCTTTGACCTCTCCAAGTATCGGATCAGAGCAACAATATACGTCGTGTCCACA
+AATTGTCCGCTGTGCAAGTGGTATAGGAGGCCTTTTGATTTCAGAAAGAGAAACATTACG
+TGTTAATTTTCGAGCATGTTTCATTCCTAACCGCATGGATAATTCGTATTCCAGAAGCGA
+GTCGATAAATGGCGCATCACCGCAGAGCGGTGATAACAGGTGCGCCGTAACTTTCCAGTT
+TTTTATCATAACAATTCAACCTTTGAAGGAAACGCTTTTGACAGCCATCTTTTGAATGCG
+TCTGTGTTTGCCTGCACGTGATCGATATATTCCTGTACCAATTCATCAGGGCCCCTTTCT
+GTTCCAAACCAGTCTGTCAGTCCATCAATCCAAATTGATGATTTTAATTTTCCATGGCCT
+ATACGTGCGCTTCCACCGATGATGCCATCGTTGTCTTGCCATAACTTAATGGCATGCAGG
+GCTGATCCAACCTCAAGCGGAGAGACATTGTAAAGCGTTATGTCGTGATAAAACAAAGCT
+CCAGGTATAATGTTCTCTCCAGAGTAAATCATAAGGTTAGATTTTTTTTCTGCTATCTCA
+CCGAGTATTTCGGTAGCATCTTTCATGCGAGACGCATCGCCACGGGTATATTGATATTTT
+GAAACAAAATGTTGTGCGGGCTTTAAAACACCATCAGGTAATTCGTAATCGCCAGAAAGT
+TTTTCAATTACCTCTTGATTTTCGGCACAGCACAGAAGTCCACGAGAGACAAATAGCGAG
+CCACCGACTACCTGATTTTTCAAGCTTCCTCCGAGCAGACGATACAACGGGGATACTTCT
+TGAAGCTCTGCAATAAGCGGAATATTATCGTTCGTTGATGACTCGGTAAGGCTTCCTCCG
+GTCAGCATATAATTCGCCTGATCGATGGTGAGCTTTCCGCGAAGTCCACATTGATCGATA
+AGATATAGCGCTCCAGGTTGTCTTATCATTTTGTGCCGGAGAGCGTTTCCGGAAAGAACA
+GGGATTTCAACAACGTCGTTGTCATAAAAAACCTTTTCGCGGTTAATGATAGACTCATTC
+CCGGAGACTCCCATCATGTGAGTAATAGGAGAAAGCGCTTCTGAGAGAAAATGTATTTTG
+CATATTCCAATCTGTTTCATTACTTCTCCACCTTCTTTGTATTCCATAAGTTCCGAGAAT
+AAACCAAAATAATATTGTATTTTTTCTCCATGATGTAGAGAAAGTGCTTTTTCCACTCTG
+TAGGCTTCGTTTCCATGCTTTCGAGAAAATAAGCCAACTCTTCACATGATGCAACTTTTC
+CCGGATCGGCCTTGATAAACTCAAGGATAAGATTAACAAATTCTTCGAAATCCCCTCCAC
+ATTTTTTCACTGATGAAACGATTCCGTTCCCGATTCGCTCCCATAGAGTTTTACGATCGA
+AATCATCAGAGAAGAGCTTAGGTAAACTCGAACAGAACTTGATCGCTTCCTCCTTGATTA
+CCTTCTCTTCCATTTCCGGTAGACTTTTCGACGTATCTACCAATCCCGCCAGCTTTTGAC
+GAAATTCTTGTGCTGATAACAAAGTCATTTTTTGCCTCTTCCTTTCCCGGGCATAACCAT
+GCCGCGAGCTCTCCCAATGGGGAGGAATAGATTTTAATCCACTCAACGAGTGGGCCTTCT
+GAACCATACAGATCGATAATGTTTTTATAATTGATAAACTCATCAGGATTTTTTAATGCA
+ATTTTCCCGATAGCAGCAGCGACAAGTTTTGCTTTTTGTAAATATTTTTTTAGCGTTGCT
+ATCTCAACGCTGATTTCCTTTTCTTCAAGAAGTACGGAAAAAATGTTCTGATCATAATTA
+ACCGGCGCGCGGAAAATAAGCTGCTTTTGTCCAGAATCGGCAAGTACGATAGAAAACGGC
+GGTTTCGGAGGAGATAAACATATCCGGCGCAAAACGCGCAGATGTTTTTTTGTCATGGCT
+AATTTTTTATTTTCAGTCAGTACCCACGAATACATTCGCGGTTGACCAGCGCGTCCTATT
+TTAGTTGTACCGTCTATCTGAGTAACTTCATAAATCCCTGATAAAGATTCAACGCAGCAT
+CCGCAAACATAGTCGGAACCAGGATATTTCACAATATCGCGATTTGTGAAAGTTTGTTTC
+ACATATTTTTTCTTGGTGTATGTTCCATCGCATGGCATTCCGCAATAAAAGCATCGATGT
+TCCCCTATATTATATTTATTTGGTGCAAATAGATATGATGCTGTTATCATATTTCAGAAC
+CTTTAACATTCTTATCCCTGACCACTTTCTCCACTCCCCTGATATTCCCGCCTTTCACAT
+AGAACGACACTACCACCTCGCCGTCTTTTATTTTCTCAAGTTCATATAAAAGCCAACGGA
+TAGAGTTAGCCACACGCTGATCCTTACAGTCTGCCGATATCATCATATTCATTGCCCCTC
+CCAAGGCTGAAGCCTTACTCCCCGGATAGCCCTACCAGCTTCATGATCGGCTCAAAGTCT
+CCACACGCTGGCATATGCCGTGTCTCTTCCTTATCAGCCGCAAGACAACCGGGGGAGTAG
+ATTCCAATAAGCTCCTCAGATTCGGCAAAGCACTTTTCGAAGTTTCGGCAATTTCCACAA
+ACTTTTCTTACACCATACTCGTTCATGCATTTACCTCTTGCCGCACCTGTATCGATGTAA
+CAGCTCGTTCAAGATCAACATGCCGGAACCGGTAATACGCATTACCAGCTTTCATTTCAA
+TGATCCCTCGGTCATAGTCCGTTATATCAAGGACTATTTCCTTTTCAATAGGATCATCCC
+CTTTGAAAACCGTCTTTACCGCCGGAATCCTTTCTTTCAGGTACTTATCTGTTAATGTCA
+TTCCGCACTCTCCTCGATTTCTTCACCGGCTTCACCCGCCGCTTTTTCTTCACAAGGTTC
+TCGATCAGGTTATGCATAAACTGTGCCGCCTCTTCCCGCTCGGCCACCCGCTCCTCAATC
+ATCTTCCCGTCCCCCTCAAGCAGGTTCGCCGGCGGAAAGTAATGCGGGTACAGCCGCTCG
+TCAGCTTCCTTCACGATCGCCAGATCACAGGGTCTCCCGTACTTCGTCGAGTAGCTTTCC
+GTGATCTCCTGGTACAGCCGCATGAGGTAATCCCCGGACAGCTGTTTGTCGGCAAGCCAG
+TCTCCAAGTGCTCCCGCGTGGATCGGCGAAAGACGCCCGTAGTACTGCTGCAACATCGCC
+ATGAATGTTTTGCTGTTCCACTGCATACGCCTATCCTCCCACCGCCTGCTTTGCCTTGCC
+TCTCACCCCGTAGGGGTCAAGCGCCTCCCACATCCTCGCACCTTCCAGCTCATCGGCCGT
+GATCTTCAGCTGCTCCGCCACCCGGTCCCAGATCCCCGAAGCGTTGAGGGTAGACGGGAC
+AAAGGGCTGATCTCGGTAGAACCGATCTCGGGAATTTTTTAACCGCCATAACTCCCCGAT
+CATCCGCTCGGCACACCCCGCAGGGTCCTCCGGTGACGCCCGTGAGCATTTCTCGATGAT
+CCCGTGGATCGCCTTGCCTTCCTTGCCCCAGTTCGAGAAGTCCCCGACAACGGCCAGGAA
+GGAATCCTTGATCGAGTGGTACAGCGGGTCTGTCGGTTCTTTCCCGCTTGAAGGCGGTTT
+TCCCTTTCGCGTTTTCGGTTCCGGGCATTCAAGCTTGAAAACAGGCTCCGGGGAATCGGG
+TTCCGGATCCTCCGGTGGTGAAACCTCCCTGTCCCGCTCAGGCTGAGGCTCGGCCGAAGC
+TGCCGCAGGCATACTAGTCTCACTTCCCTTCACTTCACTTCCCTTCACTTCTGTGGTCAC
+TGGTGCACTACCGGTAGCACACTGGTGAGTCACCGGTGACTCACTGGTTGTCGAAGGCGC
+TTTGTCCTCCATTTCCCGGTTGCTCACCGGTGACTCACCTCTGGAAAAACAGGTCTCAAA
+GGGATACGGGGCTTCACTTCCCCTCCTGAAGGTCTCAAGCCATTCATTCCGGTATTCGTC
+CGTCAGATACTCTTTCGGCGGCCGGCGGAATTTCGTCTCCTGCGGCTTTCGTCCTTTCAG
+GTTCTGATACTTGAACCAGTTCGGGAAAAAGGCGTATCCGCCATACAGGCGGACAAGACC
+ACAGGCCCCGAAGTCTTCCAGGGCCTCTTTGATCATATCGATGGTGATGTCCTTTCGTGC
+CAGCCTGAAGTACAGGCTATCCGGTTCAGCCTCGATGATTCCCTCATCGTCGGCATTCGA
+GATCATCCCGATGAAGATGAGTACCGACACCGAGGAAAGTTTCATGATCTTGGGGTCCGT
+CCAGATCCCCGGATCTATCATCCTTTTTTTTGCACCCATAATATCCTGTCCTTAAAAGGG
+TATGTCGTCCTCGAAGTCCATTTCCTGATCCGGGCCCTGATTATTCGGTCCGGGGTTGAT
+CGGGTAGCCCCACTGATCATAGCCGCCTGTCGGCTTCTGATACCCGGAGTTAGCCCCCTG
+TCGACGTTGCTGTCCCTGCCGGGAATTCTGCTGTTGCCTTTGCTGTGGAGGCTGCTGAGA
+ATAGCCGCCCCGCTGGTTCTGCGGCGGTCCCTGGTAGGGGGCTTCTCCATACTGCCCCTG
+CTGGTTACTCTGGCCGACAGGCTTTCCGCTGATCAGCTGTACATCCTGGGCAAAGAACGC
+TACCCTGCTTCGTTTCTGTCCGTTGTCTTCCCACCGGTCTTGTCTCAGCTGTCCTGAAAC
+CACCACCTGCTGACCTTTGGTGAGATACTTAGCAAGTGCCTCAGCGCGTTTCCCGAATAG
+GGTGAAATCAAAATAGCTGACTTCCTCCTGCCAGTTGTCATGCACCTTCCTGCTGTAATT
+CGATGCTATGCTGAACTTACACAACGGTGTCCCGCTGTTCGTATATCGCAACTCTGCATC
+ACGGGTAAGCCTTCCGACCGCCGTGAAACTGGTAATATCGTTTGCCATGGTTCCTCCCTA
+AAGAACGCCAAAAAAGTCATGGTTCTGTTGTGTGATCGCCTCGTACTTCTTCCGGTAGTA
+CTGTGCAATCGTCCGAATCTCTTCCGTTGTAATCTTTACGCCGGACCTCGATTTCAGGTA
+AAGCGCTTTGTATGCATCCTCTCCGTGAAGCGTAATGAAGTAGCAGATAAGCTTCCCCGG
+ATCCCGGTCATGCTCTTCGTTCTCTGCTGCACTCTGACAATAAGCATTCATCTCATCCCA
+GCGGGTAGCGTAGAATCTTCGTGAAAACAGGTGTGAACAGGTGAGGTTCTGTGTACAGTT
+ACTTGTCACTGACCGGTTACCGTCCCTCTGTCGTATGTAGAGACTGAACCACCGGTCAGC
+CGCATCTACAGCCTTCTGTCTTCGTACCGGTTTGCCTTTCGCCTTCGTCATGCTGTTATC
+CCTTCAAGATCAAAAAGTGTAGGCGTTGCCGCTTCAATATCAGCCGCCTTAAGATAGGAC
+AGCCCATCCTTGAAACTCTGCGGGTTTAGCTCGTACCCGATACCATATCGGCCCATTTTC
+ACCGCCATGTACGGAACGGTCATGAGCCCGCCGAAGGGATCAAGCACAACTTCTCCTTTG
+CTGCTGTACCTGTTTATGATCCGCTCCACGATGTCGAACTGCAAAGGGCAGATGTGAAAC
+TCAAGGTCCTTTCGGGCCTGCTCCCCGTTGAGCGTTCGCATACGGTTCACATCGTCCCAC
+ACATCAGGATGCCAGCTCCCAGGTGCTACGACCATGAACCCGGAGGGCAGTTTCTCACGC
+TGTTGGAGCTTTTCTGCCAGGTTGATATGGTCGTGATAGTCATAGACAGAAGCACGGGAG
+AACTCTCTATAGGTTTTCTGCATATCGCCTACCGATACCTTTTCAAGCTCTGCACTTGTA
+AGAAGTCTGTCACCGGATGACCGCCAGAATTGATGAGCATCGATCTGCCAACGGGATCGC
+GGGTATTCTTGTTTTGTTTTTTTGACGGTCTCATCTGCGTAGGCCCTGGATGTATCGGTC
+GGCAGCTTCCGAAATAATAGGATATACTCCGGGCAGCCGACGCCCATCTTCGTGCCGTCC
+TTACATTGTTCAGTCCATCCGAGACGGTAGGTCTGGTTATTCTCGCGGACCACATCGGTG
+ACAACAGTAATTCGGCCCATGTACATAAAGCCGTGCTTCATAAAGTGGGATACGGTAAGA
+TCGCTGAAAGGATCAACTGTCGGCATTCCGCTTCCGGTAGCATTACCGAAAAGGATCCTG
+TCTTTCACATGGATAGCAGCGACCCGACCGGGCTTGAGAACTCGCATAAGCTCCGGAGTA
+AGATAGTCCATCTGCTCAAAAAACTTGTCATTGTCCACGTTGTGGCCAAAGTCGTTATAG
+GTCGGAGTGTATTCATAATGATTTGAAAACGGGATCGACGTATGAATAAGATCGACTGAG
+TCGTCCGGCCGGTCTGCGATCGCTATGACATTGTCGGCATTTACAGCCGTCCAGTTTTTC
+CCCTTCTTGATGATCTTCTTTTCCCAGATCGACCGCTCAAGGCGGGTGACAGCATCGAAA
+GAGTTGAGCCCGTATTTCCGGACGATCTCAGTCATCATGTCTACAAGCCGCCGGTGCTGT
+TCCCATTTGTGCATGAGTGTTTCATATATTGACCGCTCGCTTTCGGTGTAGATGATATGG
+ATCTCCACCTGCTCGCTTTGGAGAAAGCGGTAAATACGGTGTACCGCCTGGATGAAATCG
+TTGAACTTGTATCCGATCCCGAGAAAAATAGCCTTGTGGCAATGGTACTGAAAGTTTGCT
+CCTGAGCCGCTGATTTCCGGCTTGGTAGAAAGGTACTTAAACTTTCCATCGGAAAAACCT
+ATGGCGTTCTCCGCCCGTTCTTCTTCTTTTTGGCTTCCGTAGATCCAGCGGGACTCCGGC
+AAAGCCTTCTTGATTGCATGTCTCTCTGCTTCCAGGTCGTGCCAGATGATGTAGTGACTA
+TCAGGATCCGCGTCGATGATCTCCCGCATTTTCGCTACTCTGACATAAATACTTTCTCTC
+TTTTCCCTGCTGGCATCTTTTAGGCCGGTGGTTGCATCGCGGAACATCTTTACCTGTCCG
+TCATCCTCAGTACCTGCGGTTGAGTGGTCCACCTTGAGTTCATGCTCTATTACTTTAAGT
+TGAGGCAGGTCATACCCGGTATCATCATAGCCAAGGTCTGAAGGTTTGGTGATGAAAAGA
+GCCCAGGTGGAAAGCCAAAGCCAGAATTCTTCCTCTTTATGAGGGTGAAGCTTAAGATTG
+TTTGCCTTGGTACTATCTCGTTTGAAAAAGCGGGTAAGTGCCTGGCCCGTGTCCATGATC
+TCCAGATACCCGGCGTAGTGGATCAACTCCTTGTATTTGTTCGGCGAAGGCGTGGCGGTT
+GCGACGTACTTATATTTTACCCCTTGAAAAAGGTTCAAGAAGGTCTGATAGGTCTTTGTG
+CCATACCCGCGAAGTACCGATGCCTCGTCAAGGCTGGTGACAGTGAAAAAGCGCGGATCA
+ATATCACCATCTCTCACCCGCTCATAATTTGTGATCAAAAGGCTTGCATCTGCGCCTTTT
+ACCTCATCCATGGTTCGCACATAGCAGAGTTTGACTCCGAGCTTTCGCTCTGCGTCCTTG
+GCAAACTCGTGACGGACTTCCAACGGAGCTACAATGAGCGATTTACCTCCTTCGTGTTCG
+ACAATCGTCTTGCAGATAATAAGCTGCTGAATGGTTTTGCCGAGTCCAAAGCTTTGAAAC
+AAGGCCCGGCGTCCTCCTCTCAACGCCCAGTTGATGGAATCCCTTTGATGTGGCTTGAGT
+TTCGTTCCGTCGAGAAACTCGATATTGCCAACTTGTGCATCAATACCAGAGTCCGGTGCA
+ATGCACATTTTATCTTTCAAGAAATCTATGTATGGTTTCATTCTTAGTCCTCGATGAGTT
+CAATTTCCATTTCCGCCGCTATCTGGTGGATAGCTTCGATGAGGATCGATGCATCCTCTG
+TACTGCACTGTGTTTCACTGATCCCCTGGATATCTCCCCACAGGTCGAGTATGGGCTCCC
+CGGATTCGTCCTCAAGGATCGGGTAGCCCATGGTGACGGCAAACTGTTTTGCAAGCCGCT
+TTACATCCCCGAAGGGCTGGCCGGTTTCCACTGATATCTGTTGACAATGGCCGTTGATAT
+GGTGGTTCTGGCTGCCATGCCCGGTTGTCCGGGGACGGTGGGGCACATCGATCGCCAGCC
+AGTAGTACGGGGCCGGGGACCGTCGTTCGATCTCCTGGTAGCGGAACAGGTGCACAAGGT
+ACTGTTCGAAAGCCTCACCCACCTTGAAGGAGACAAGGCCCCGCTCGCCGGTTTTGATAC
+GCTCGGCCGCGGGGATGATGATTGTCCGGGGACTACTCATGACGTTTTCGCCAGATTGAT
+CGTATTGTCATATTCGTAAACCCAAACCCAGGGGTTTGCATCCCAGCCGAGGCCTCGCTC
+TTTGTAGATAGCATCCCAGACAAACGCAAACTCATGGCCGCATCCTTCGGCTTCCTGGTC
+ATCGGCGCTTATATCCTGTACTCTCTGTAATCGAACACCGGTGATTCGGCGTTTAGTCCG
+ACAGGCCCATTTCGGCATGTGGATCGATGGATGCCATTTATTTTGTTTAATGTCGTCAAC
+CGAAAAATAAACAGTTCCGTAATGTTCAATAACATTGGAATCAGCCTTATATCTAATTGA
+TGTGCCAGAAGTTGAACCAGACCAGATAGATATAGGTTTCCATGTCTCTCTGATCCAAAG
+CACATCACCGACGCCTCCATACGGGCCATGCTTTTGCAATTCACTGAAACTACCACAACA
+CTCTATCGTTTCATGCTTTCTCTGTTCCCACCACGATATGAGCTCCGGCTCGTATTCTGA
+TCGACAAAACTGGTGTTTAACAGGCCGTCTTGTCTGCCATTTCTTTCCGGCAAGATCAGC
+ACGGACCATATCGGCGTTGAAGATGATTCCGTGTTCTTTCATGATTCCATGCACCTTTCC
+TTAAAAGATTTCCAACTCTTCAGGCTCCGGCGTCTGCGGATCCCCGGAGCCGTTACCCGA
+TATAGGAGGCCTCTGCCCTGCTCTCTGCTGCTGACCATAGAGCCTCTTCTCTACCATCCG
+AATGTAAGAGTCGAGCGTCTTCCCAGAGTGCTTCTTGCTGTTTGCAACCATCGTGTTTCT
+TTCTTCCCTGGTGATCAGTTTCCCGAGAAATGCCCCGTCAAGTCTGTGCTTGAAATCCTC
+CCGAACCTTTGCATCCGGATCCTGGGCGGCAGCCTCGGAGTGCTCCGGAACCTTGGTAGA
+TTCTTCTTCCTGTACCGGCGGAGTACCCTGTTCCTCGGTAACATCTCGGTATCCGGTTTC
+TTCGTCGGAAAGCTCATCTGCGGTATACGGCATGCCTCCAAACTCATCGGGAAAACAAAA
+CCGGAAGGCCTGGGCGATGGCCACCTTCTTGATCATGGTCACCGGCTTCTCGTTCCACAT
+ACGGTTGTTCTGCTTGTACTCAATCCACCACGCTTCATGTACAAAGGGATTCTGCCAGTC
+CTTCCGGTGAATGGTAACAATGGCTCTGAGAGAGCGAGTTCTGATCGATCCGGCCGTTTC
+GACACTCCACCCGTCAAGCTTTTGGGTTCGCTCCGCCCGTTTGAGATAGACCTCGTAGCC
+TGTTATGATCGACAGCCTCCGGTTATCTCCTTCCCCGTAGGCCACACAGTATATTTCACG
+TTTGAAGGGGTTTAGCTGGTAGGCCTTGGCCACCTCGATAAACTGCCGTTTTTCATGATC
+GTTGAGGTTGTTGCCGATTCCCGAAGCTTCCATGTATTGGATGATCTTGTTCTCGGAAAC
+CACGTCCTGACTCTGCAGATCGTTCACTCAAGTACCCCTTCGTTGAGGGTCTCCCGGATC
+ACCCGCACCAGGGTTGCAAGCCTCATGGCAAAGAGGTCACGATTTGCCCGGTTGCCGTTC
+TTAAAGAGGTCCTGGATGAGATGGTCCATAGACTCAAGGTGTTCATCAATTGCCTGTATT
+TCCTGATTTTTGAATCGGATAGTGCTACTTTTCGGGTGATTCATCACAACCTTTCTTTTA
+TTTTCTCTAACCGCTACCGGTTCGGTAGCGGTTTTCATGTCTGTACTGCTCATGTTTTGC
+ACCTCGCATTGATCTTTGATAAAATCCTCTCCCCGGAGACCATTCTCCGGAGAGAGCCGT
+TTGTGAAACATGTTTCCCCCACATCCTCGTGGTTTCGGCGTGTGGTTGGCGCCGTATTGG
+GACCAGCAGGATTCGAACCTGCAGAGGTTAGCGCTTTCATGGTTGCAACTCCATGCCCCA
+TTTTCTGCCTGAACGCTGCTGTCAGACACACTCATCGGAATAGGGTCCCGATACGATACC
+GTTTCGCTACAGTCCCAAGGTGCGCCACGATTCCCCGGCGCTCGGTAGCTACTGACGTAG
+CCTCTTCCCGTTGGTAGACATTTATTAAGGCCGTCTTGAACGGGATGCGAAACCATCCAG
+CCTTTAACCAGTGTCCGGTTTGGCCCGGAGGTGAGCGATCTGGAGATTTGACAACCGGAC
+GAACCTATGACCTTTTCAGGCTCTCCCAACGTAACGTTGCTCACTGCGTATCCTCTCATC
+TGCCTTCCGCAGACTCACTGGTTGCTATTTTTGCCAGGCCGGCATAGCTGCCTGTGAAAA
+GGGCATCTCTAACCGCTTCCGCCGGTGGTGTTGCTCGCCCGCTTGGGTGGTATCCACTCG
+ATGCCAAATACCTGAGATGCAATGATGACGATTACGTTCATAACCACTCCCCAGTCCGGC
+AGGTCCCAGCCAAACAGCTCGGCAAACGCTAAAACTGCGGCGGCAATCGCGGTCAACGCA
+TAGGCTATAATGCGCTTCGTTTTGTCCTTCACACTTCTCTCCTTTCCCGCTTTCGCGGTG
+TAAATTGCCGGTTCACTGACCGGCGGCAGTTCTATGAAACGACCTTGATACCGTCCAGGC
+GTTCAAGGAAATACTCTGCAACCCTCTGCACCGCTTCGATCTTCCACTTCCCCCCGTCTG
+CCTCGAACAATGCCAGGGTGGGAATCTTCCCTTCTTCTGCTTTCATGCGGAAAAGTAGCT
+GGCTCTCAGGCTGGTCGATCTCCCGGAAGGTCCGGTACGGTTTGAGTGATACAATCGGCT
+TAAATGACCCGGATTCTTTCAAAGCGCCACTCATTCCTCGCCTAAGCGATACTTCCTGAG
+TCATTCCGTCATCACCGGAGACAACTTCATCGGTTACCGTCAGGCGCGAAGTAAACTGCA
+AAAGCAATTCTTGGTCCTCAGTCGGAACCAATAAGGATCGGAGCTTGATTTGAAATTCTT
+CACTTACCATGAACCGGCTGAAAGGGAAGGTCTCAAAACCGTCACTCAGGTTGACCTCGG
+CATAGAGATCACGCTGACGTTTACGTCCGGCAAGTTCCCCGTAAAGGCGGACCTTTTTGT
+AGGACACAACGTGAATGAGTAGCTCTTCTCTGTTTTCCAGTTCCTTGTCGATCGGCTCAT
+CAAGTAAGTCGACAAGCCCCTGGAGCGTTTCGAGCTTCAAGCCCTCCGGGTGAGGTTCAA
+ATAGAATAGGTTCGAGATTCGGGGATGCATACTTGATCCCGTCTACTTCCAGCTCCAGGC
+TTTCCTCCCGGAGTTTTGCAATTTGCTGTACGGCTGTTCCGTCCATTTACTTTGCCCCCT
+GCATTTGTACGATGTTCTCTTCCATGGGAAGGTCCTGCTGTCGCGGATCGGTCGTGTAGG
+CTTCCATTGAGCCTCCGCTCTTTGAGAACAACACGAACGATTCCGTCGGTTTGATCGGTG
+CAAGTTTTGTTTTCACACCGCAGATTGTGTTTGCGCTGCTCCGGTCCTTTGACGGTTTCA
+CCTTCACGCTGACGGTGACTTCCCGGGTGATCTGGGCATCACAGTTATCGTCTGCAATGT
+TGTCCATGATCTGCTGCCAGGCTTCGTCAAAAAGATCGATGACAGCGCCTTTGTTGAGGG
+TCTCTATCGTGACCCGCTTGTAATCTTCTGCCATTGGTCCTCCTTCAATTTTTGATTTGT
+AGGATTGCAGGACTGGGATTTGAACCCAGGGCGACGGGGATATGAGCCCCGCATGTTCCC
+ACTACACCATCCTGCTTTGTGTCATTTACTCGAATGGTTTTATATCGAGTTGTGTCTTTC
+CTGATTGGATGGTTTCGTATCGGTCAAGTTCCTTGATGATGAGCTTGCGAACCCATGTCG
+CACGACCTCTTCCTGATGTTTCTTTTAATGGGCCATTATCGATTCTGTTGATTTCATTCT
+CAGTTAGAACGACTTTCACAGCTGGAGGGCTTTTATGTTCCAATTTTGCTCTATTCATAC
+ACTCATAATAGAGCAATAAAAGAACAATATCAAGTGTTTTTTGTGACATTTTGCTCTATT
+TATTGCCGATAATAGAGTATGGATTTCTGGGAACGGTTAAAGACCTTAATCAAAGAACAA
+AAGACAACTCAAGAATGGGTTGCAAATAAAACCGGCGTGAGTTTTGGAACTTTTCGAAAG
+TGGATGTCAAGAAAAACAATGCCCAATGCGGACCAAGCCGTAGAAATAGCTGATGTTCTT
+GATACTACCGTAGAATACCTGGTAAAAGGTAAGTCTTCAGATACCTGGCAGCCTCCGAGA
+CGTTACGCCGATATTGTAAAACTGCTCGAAGAGCTTGACGACTCGGAACTTGAGGCCGTA
+AAAGTCCTGGCCGAGGGGTACGCCTCCAGGAAGCGAAACAAACCCCAGAAAGAAACGTGA
+AGCCAGGTAGCTGAAAAACCCTTCTCTAATCTGTCAAAGATCACCGATCTGAGGTTCCGG
+CCGGGTAGGCCAAAACGTCACTCAACCCCTCGTAGTCGAACGCAAGATTTCTTTCGCGGT
+AGCGCCCAGGCCACAAGATTCAATGCCGACAAATATGGCCCTCAATAACAGACACAAGAT
+AATCGGGAAGAGTTCCAGCCGAATGCTGGGCCATGAGCTCAGCAAGCACACCGTCGCCTA
+CATCCGGACACGTTAACAATGCTTCCAGGTACAGCGCCCGCGTCTCCGATGTGATCTCAA
+GCCACTCCTCGATCTGCTCTTCTGTCCACATTCGCTTGCTACCCTCAGTGTGGTTAGAAA
+AACCAGCCATAGGCTGCATGTGACGAACAGAGGCAATGGTCTTGTAGCTAACTCCTTTCA
+GCGCACTTGCCGCCTTCATGTCATACAACCGTCTTCGATTGTTAATTGTGTTTGCGGTAA
+TATCTCCGAGCTCCTCTATGGCAGTAGCTAATGATCTGAATGCGGATTGGATTCTTTCGG
+TAATAACTTCATTCTCTTTCATGCTACTCCCCTACTTTCTCGAATGGCTTTGAGTCGAGT
+TGCGTTTTGCCGGACTGAATGGCTTCCCATTCCTTTACGCGGTTCATCATCTCTACTTTT
+AGATAGGGCCCAGCCTTCCGGCCAGTAGATTCGAGGAAGCTAACAAATCTGGCTCTCTCA
+TCTTCGCTGAATGGAATGGATACCTTATAACGACTATCTTGTTGTCGTTTAGCAACTTTC
+ATAACTGTATATTATGGTCGATCAACAACTTTGTCAAGAAAAATATGCGTCATTTGACAA
+CATTTTTAGACGATAATAGGTGTATGGAATTTTGGGATATAGTCAAAAAAGAAATAAAGC
+GGCAAAACACTACTCAAGAATGGGTTTCTAATCACTCGAATATTAGCTTTGAAACATTTC
+GAGGATGGATAGCAAGAAAACGATTACCTCGAGTTGATGATGGGGTAAAAATTGCCCAAT
+CATTGGATACTACCGTAGAATACCTGGTAACAGGAAAGAACCCCGACAACTGGCAACCTC
+CGAGACGCTATGCTGATATCGTTGCAGCCTTAGAAGTGCTTGATGATAAAGACATCGAGA
+CGGTTAAAACATTAGCGGTTAGCCTGGCAGAGAGAACAAACATTGAATATCGCAAAAAGA
+GAGACGCTTAACGTAAAAAGTTGTAACATTATTCCTTTTAGACGTTAACATTTTTTACAA
+AAAGTGAATCTCTCATTGATTTAATCGAGTAGTCGTTTTAACATATTCAAAAATAGAGTA
+TTGGGAGATATAAATGAGAAAGAAGTATGCAATACTAAGTGAAGACGAGCTACACGAAGA
+TATCAAAATCATACCACCGAATGATGACAAGATTATCGAAATAGCCGATAGAGATGGTAA
+TACGTATTCAGTCAACATGAAAGAGCTTTCATGTACCTGTGAAGATTGGGAAACTGATAG
+ACATAATTTCTGCATCGGCGATCCGAGAAGATGCTGTTTTCATATCAAGAAAGCGTTTAG
+AAGAAATAATGCTATAGAAGAGCAAAAACCTGTCATAAAGGCTATTTTAAACGAATATCA
+CACTGTAAGACTGAATATGCTATTCGGAATGCTTGGAAGCCAACCGGTAGCAATCTTCTA
+TGATGATGAATCACCATGGATGGATGTATTCACAGAAATTGATCAAAACAAACAAATTGG
+TAGATCTGGATTTAACTATAAAGAAAAACGCTGGGCATATAACGAAGAGCCTGTCAATGG
+CGATAAAATAGCTTCGTTTATTGTAAATAGTATATAATTCCAAACTCTTCAAGTAGAGGC
+TATTTAAACATCAGGAGGACATAAATGAGTTTTGTTGTTTTTATCATCTGGGTTGTGCTT
+GCTTTTCTTTTGGCTTCGAGTGCTAAAAGCAAAGGACGTTCTTACGCAGGGTTTCTGGTA
+TTAGGGTTGATCCTATCGCCAGTTATCGGATTCATTATTTTGCTTGTGATGGGAGAAAAT
+AAAGACATTGTGCAGCAGCAAAATATAGAATCCGGTATTACAAAAAAATGCCCTTATTGT
+GCAAATGAAATTAAGAAAGAAGCCATTGTCTGCCAATATTGCGGGAGAGACCTCCCCCAA
+AAACCGGAAGAATAATCATGAGCGATATAGATAATAATGCAAATGATAAAAAAGCCAACA
+AGTCTAAAAAAGTAACACTTGTTTTGATCCTAATAATCATTGTTGCAATTCCGATCTTTA
+CCGGTTTTATAGTAATTCAGCCAGTTGGGGCATTGCCTGACGGTATCACAATATGGTACT
+TCCGCGCTGGTCTAAACTTACCCTTTATCACCTCGCCAGACGGATTTTCTTTGAAACAGA
+CTGGCCAATTGTCTTTAATGAGTAGAATGGTATCTATGTCAGCAATAACAACGGCGATTA
+AAGATAGGATTATTATTCGTTTGCCATATAGTAGAACTCTATACAAGATTTCAACAGGCG
+GGCAGGAGTTTGGCCAATAA
+>NC_014364.1|provirus_2976748_3014759
+ATGCCAAGGAAAACTGAACAATTCTCCATTATTCTCCGTCCTCCATCAAAGGTGTATCAT
+TTCAAGTTGGCAGGGTGGTCCAACTATAAGAGCACTCAGGTGTTTTTCGATCAGCACCGG
+GAGCGTTTTCAGAAACACCTAAACTGCAAAACAAAAGCCGATGCCCAAGAAGTGGTCAGA
+ATGGCAATCACCATTCAGGAAGAATCAAAACGGCCTATGCCATTATCTTCCCAGGTGAGA
+CTAATAGACCTGCTGAAAGATGCCTACACTTGGGACCGATGTCCACATGTCCGGCGTCTA
+CGGGACGAGGGAAAGGCTATCACAAAGCGCCATGTCCAAGACAGTCGGAACATTATCAAA
+TCCCACATCCTCTGTTGTAAAGATTTTGTGAATAAGCCAATTGCCAAGATGAGAAGATCA
+GACGTTCTGGAGTTCCGGTCATTCATGTTGGATCGGGTAGGACCAAGAACTGTCAACAAA
+GCACTTTCGATTGTAAAGGCGGTTATTAGAGAAGCAATCTTCCAGGAGGTGATCGACCGA
+GATCCTACAATCGGAGTAAGCAAGGTGAAGCTTACCGAGAAAAAAGAACCTGGCGTTTTC
+ACTAAAGAGGAGCTTCTATTGATGTTTCCGGAAAAAGGGATTGGCCCATGGAAAAGCATC
+ACTGATCATACGGTCTTCCTTACCGCTGCAAGCACCGGGATGCGGAGGAGTGAGATACTG
+GCCCTACGGTGGGAGAACGTGAACCTGGAAAAGCAGTTTATCAATGTGGTCGAAGCTTTC
+AAAGACTACCGGATGATAGAGATCGGCAAACCGAAATGGGAGCGTTCCCGGGTGGTCCCG
+ATTCCCAAGAAACTGGTCACCAGGCTGAAGGATCTGAGAGATCAATCACCATACGCAAAA
+GATTCGGATTATGTGTTTTGTTACAAGGATGGTACTCACTTGGGTGGAACTTGGTGGAGT
+AAGCATTTCCGCTCCGCTTGCATTGCTATTGGAGTGATCAAAGCTAAAAAAAAGGTCAAA
+GAAAATGAAGATCCTAACCCACGGAACCTTACTCCACATTCCTTCCGGCATACACTAAAT
+ACACTGTTACTAAGCAACGGATACGATAGCGGAAAGATCAGAGCTACTCTGGGATGGACC
+AGTGAAAAAATCCAGGACAATTATACTCATTTTTCGATAGACCACCTGAACGGTCAGTCG
+GATATGGTAGAGAGCTTTTTTGAAAAGGATAAAAAAAATGGAACCAATTAAAAACGATAT
+CATTCCGGGAAAACATTTTTTATAGCCTCTTTCCAAATTTCGCTTAGATAAATATCAAAC
+CTTACTCAACCTTTCACTTCCTAAATTGCAAAATTTTACCCTGTGTCTTCCGCCCTTCCC
+TCTTCGTTTTCCCAGCGCCTAGCCATAACCAGAAGATCATCAACTCGATCCTCCGGGAGC
+CGCAGGGCCAACTTTGCCAACTTCAATGCCTTGGGATTTGCATTCAGTTGAGCCCCCAGA
+ATATCTTTCGACTCCTCCCCGCTTATCAGGTACTCCACGGAAACGCCCAGGGCTTTGGCT
+AGCAGAACAGCCCTATCTGACCGGGGGATAGAGGCCTTTGCACTCATCCAAATTTCTATT
+GTCCTGTAATTGATGCCAGTTTTCTTTCCAAGTTCTTTAGCAGTGAAGCCATGAGAGACC
+ATTAATAGTTTTAGTCGTTCAGTAAACTTAGAAGCAGTCATACCTCTTTCATCGGCAATA
+TTAGTATGTTTCTGGAAAAAAATACATATAAATGTGTGTTTTTGTTTGACAAACACATAT
+TTATATGTAAAATAATCTTCATAGCACATAAAAACATGTGTTAAGGAGATTGTATGAGAG
+ATATCAGGGTTCCTCTTGATGAAGAAATTATCGAAGAAATCAAAACAGGCCCCCTTTCTA
+TAACAGGAGGACAGGGAGCCGCTTCCTGGGTACGTCAGTTGATCCTGAAAGAACTGGAAC
+GATATCGGTCCATAAAGAATGGCAACTCTCAGCTCAATGTAGAGGCATTCCATAATTGAT
+CAAGGTTGAAGAACGCAATGGATATCGTAAATAGAAATGAGACTATCACCTTCGATGATT
+CTATCGAAGGTGTAACCAAAACTCTGGCAGAAGCTCTGGCTATGGTTGTTTCAAAAGGGA
+TCAAGCCGGTGGTGATCGAAAAGCAGGATACCATAGTTGATGTTAAAGGCGCTGCTGAGT
+ATCTGAAAGTATCTACTGCCACCATCCATCGGATGACTAAAGATCGGGAAATTCCCTATT
+TCAAGGTGAAAGGCAATAACCGGTTTTCGATCAAAGAACTGGAGAAATACATATCAAATC
+AAATGATCCATCCTAACAAAAGGAGGAAGTAGAGGGACTACAAGAAGGGCGCCATTGTAA
+ACCTGATTAATGTCTTGCGGCTTGAGCGCTACCGCGAAAGAAATCTTGCGTTCGACTACG
+AGGGAGTGAGTGAGGCTCCTGCCTTCACCGGGCGGAATCTCAGATCAGGGATCTTTGACA
+GATTAGAGAAGGATTTTGCAGCTACCTGGCTTCATGTTTCTTTCTGGGATTTGTTTTGCT
+TCCTGGCGGCGTACCCTTCAACGAGGATTCTTACGGCCTCAAGCTCCGAGTCGTCAAGCT
+CTTCGAGCCGGTTTACAATATCGGCATAACGTCTCGGACGGATATAACCAATAAATAAAC
+TACAATTAAAATATGTAATGCAATATAAGGTCTAATCTATCTTTCTACTAAGTATTCATC
+AAGCATTGAGTTAATCACCTTAGATACAGTCTTATTGGCACCATAAGGTGAATCACCCGA
+AGCAGTACCCTCTGCCAGAATAAGCCCGGAAGATATCTCCACCCATCTTATAGAAAGATC
+AGTTATAACATTATGGACAACATCAAAGTAATATCTATATTTAAAGTGGACAGCTATTCT
+CTGAATATCCTTACCTATAGCATCAGCACTATATGTTCCTTTTTCTACATAGTTAGGGTC
+AATTCTAAGTATTTCGATATTCCTTTTATCAAATTCTTGAGAGATTACCTTCCCGATATT
+TAATGGATCATCAAGTTCTGGGAGGAAGAAAACCACATCTTTTTGTATCTGTTGACGAAA
+AGATGTGTCATAGGTGGCACAGCCAAACAGTAAAAACGTTAAGGATATGAACAATAGATA
+TGCTCGTTTCAATTTTGTGCTCCATTTTTATTCTTATGACCAATTATAGATGAATTGAAG
+AGAAATTCAACTGTGCTTTTACGATTACATTTTTAAAGATCTTTGTTAATCTGGAAAATA
+CAGGATTTTTCGCTACCCTGACCTACGCCTCTCTCTGGGCCCTATTCTGTTTTCTGGCTA
+CATAGCCTTCAGCAAGTACTCTCATAGCCTCAAGTTCTGGCTCATCGAGCTCCTCAAGCA
+GATTGAAAAGATCGGCGTAACGGTGGGGAGGCTGCCAGGAGTCAGCTTCTTCACCCGTTA
+CAAGATATTCAACAGTGGTATTGAGTGCTTTTGCAATTGCAGTGGCTTGCTCTACATTCG
+GTAGACGTCCCTTTGCCGTCCACCCTTTGAGGGTGTTGTAGCTAATGCCAGCTTTCCATG
+CTAACCATTCTTGAGTCTTCTTTTGATTTCGTAACTCTTCTTTTACTCGGTCAATGAAAT
+CCATACTCTCTTTATCGGAAAAAATACTCCATTTGGATACCATTTTTCTTGACAAAGAAT
+CCGTTCGGAGTAATAATAGCAATATGAAAGAATCCAAACGGATACCTGATGATCGTTATA
+AAGCATCTATCCCATTCAATACAGAAGAGAAAAGTAGGTTCATCTTTTTTCTAAAGGCAA
+CCGGCAGGAAGGCTGGACCCTACCTAAAGGTAGAGATGATGAATCGCGTAAAGGAATGGG
+AAGCCATCCAGTCGGGAAAGACACAACTCGATATAAAACCATTCGAGTAAATGAGACAGA
+GCAGGATCGTGTAAGGAGAACATACGGGCTCATATACGAGGGAAGAGCGACGTTTCGGCC
+TACCCGGCCGGAACCTCAAATCGGTGATCTTTGACAGATAAGAGAAGGGATTTAGAGATA
+AGGATTTAGTGCTGTCCTGTATAGGGAAACCATTTGGAATGCTGATAAAGCAGCCTCTGA
+CCAGGCCATTACCACTTGTGGGGTTCGAATCCCCGAGGACAGCAATCGGAGCGAAGCCTT
+GTTTGCATGCCGAAGCGCAATAGTGCAAATGTCGGGATTTAACTCGCCGGAGACGTAACC
+GGCACAATCTACTCCGTGAAAACGGGAAAGGAGGAAGGCGTGACAGACAAGACGAAGCGC
+ATTATTGCCTATGCGCTGACTGCGATAGCCGCCGCAGTTTTGGCGTTTGCCGAGCTGTTT
+GGCTGGGACCTGCCGGACTGGGGAACAATCATGAACGTAATAGTCATCATTGCATCCCAG
+GTCTTCGGCATTGAGTGGATTCCACCCAAGCGGGCAAGCAATGGAACCGGCGGAAACGGT
+TAAAAATTTCAGATGAGATAACGGCTAAAAACAGGCAAACGAGACGCAATCGTTAACTGC
+GTTGGCGCCCGGGAAAATTAGATAGGGCTGACCGGGGGCAACCAGTGAGACCGCAAGTAG
+ACGGGCATAATTGAGGCGGAAGCCGAGTGAATGATCAGGATGGCAACCTGATTGAAAAGC
+GTGTTATGTCGATAGCCTAAGCTCCGGGTCGCGCCGGACACTGGTTTTACCTTATTTCCG
+CAAGGAAGCAGTCTGGTCGTTACTGTACAAGTGGTTTGCCTTATTGGTTTAGCAAAGTGG
+AAACGACAAACCAGGTCTATAGACTGCCTTAACGGGTTAAGGTACCGGGCGCCGGGGAAT
+CGTGGCGCTTTTAAGTGACCGGATGACCAACCATATACCTTTCCGATATGGCGGTAAACA
+GCACCTCCCCAAGGCGTAACGGTCGTCCGGTTTCTTAACTTCCCCGTATGGGGGAGAAAA
+ACAATCCGTGATGCCGGAGAAATAATAGCATCTATATTTTCGCGGCTGTATGTCGGGATT
+CAAACAGGTTGGATCGGTAAACACCAATTTTCCTACCGGTCCAACACCTTTCAACCTTTT
+TCAAGGAGGACATGGTAATGGAATTGGAAGAAAAAGAAAGCTTGCAAGGTTTCATAGGAG
+TGAAAAGGATCAAAGCGCGATCAATGACCAGGCGTGGATACAACGGCTATCGCGGCTGGC
+AACTTCCTGCGGATGAAAACGGAGATGATGAAGGAATGCTTGTCGAGTATGTCGATGGCG
+GTAAATCCAATCATCCCGCACATGAAGGCTATATCAGCTGGTCACCTATCGATGTTTTCA
+ATCATGCTTATCGGCCATGTGATGCCCTTACGTTTGGCTTTGCAATCGAAGCGGCAAAGG
+CCGGAGAGAAGATTGCCCGGAAAGGCTGGAATGGAAAAGGCATGTTTGTCTTCTACCAGA
+AGGGCTACCCGGAAGGAATACCGATCAACAAAAACACCGCGGAGGCAACAAGATTGCCGG
+AAGGAACCGTCTGCAAATTTCGGCCGTATCTCATGATGAAGACAGCACAAAACGACTTTG
+TGCCGTGGGTTGCATCGCAAACCGACATCTTAGCGGAGGACTGGGAGATTATCGAGCAGG
+GAGAACAGAAATGAGTATTGAAACAAAAGAAAAGGCCGCTCCAGGCAAGGATACGGCCAA
+GAATAACAACCACACCAATATTACCATGATTGGATTCAGGCAGCAAGAACTTCACGAGAT
+CGAAAAAAGCCTTGAGGAGATGGACCACAAGATACAGGAGCTTTTCCGTTTCGGAACAGC
+CCATAACCGGGACATCTTCGCCATGAAGCTGGCTAATGAGGTACGGAGAATCAGAGATCA
+GTTGAACTCAGGGAGGCTGATGTGACCATCGAAAAGACAAGCCAGATCAAGGCGGGCGAC
+AACCTTGTGATGGTGATCTACGGCAAAGGCGGTGTGGGAAAGACAACCTTCACCGCCACA
+GCTCCTAACGTGATCCTTCTCGACTTTGAGAACGGCACCAAGTACCTGGGAGCCCGCGGC
+TTCAATGTGGATGTGATCAGGCTCAAGAGCTGGCCGGCAAACGCGGAGAAACAGAAGCTT
+GCGGCCTTGGTGGCCCCCTACCACACCATTGCTCTTGATCCCCTTGGGGAGGCGATGGAG
+AAGCTCCTCAATTCATCGGCGTTAAACGGCCGGAAGTTCCGTCAGGCAGACGGGTCGTTG
+ACCATGGCAGGATGGGGAGAAGCGAAGGCGCAGATGCGCAGCTTCATCAAGTGGCTCCGG
+GATTCCGGTAAGAACGTGATCATCGTTGCCCATGTATCGGAAGAGAAAGACGGGGAGATG
+ATCACCAACCGCATACAGGTTGCAACAAAGCTCAGGGAAGAGATACCCAACATCGTGGAT
+GTTATCAGCTACATGGGCGTGAAGATGGTAGACGACAAGCCTGTTCGCATCCTCTACACA
+CCCCGGCAGGGAGACCAGTTTGACTCAAAGGATCGAACCGGGAGAGTTCCGCTTACGGTA
+CAGGTCAGCGAACACGACGGCTTTAATGACCTGCTCAAGGCTATGGGAATCGGGCAGCAG
+AACATCCCGGAAAACAAGATGCCGGTACCGGAGGCAACACCTACCACATTCCAGGGGCCG
+CAGGACGAGAAGCAAACGGAACCCACACAAAAGGACCCGGACGAGGAAGCGCGAACACAA
+CTCAAGTATCAGCTTGACGGTGCCATTGTCGGGGAACTGGTTACCAAGGCCGAACGGGAT
+GAGGTGCTTGCAAACAGCAAGAAGTACAAGGGCCAGGTGCTTGAGGCCTACATCCAGAGG
+ATCAGCGATGAACTCTTTAATCTCCAGCAGAAGGCAGAAAGCGCAAACAGCACGGTTGCA
+CCTGAGCGCCAGAAAGAGAAAGAGGATCAGCCGCAGGAAGAAGAAGAGTATGCGCCAGAA
+GAACCAGAGCCCGAAGAGCTCGAAATCTGGTAGGACAGGAGAAGGACATGAATATTACGG
+ACATAACCGTTGACGATATCATCGAGGAACAGGAGACGGCAGAAGAAACGGGACTTGAGA
+AGCTCAAAGGCGATATTGATGAAGTGATCAGTCGGATGGAAGCGCTTTCCATCCAGAGTG
+ATGAACAGCTTGCAGAAGCAGGCGAATGGCTTGTGAAGAACAAGCAGACACAGAAGATCG
+TCAAGGACCACTTCGAGCCTGAACGCAAAGAGACCTATGCGGCCTATAAGGCTGTGACCG
+ATCAGATTAAGAAGTACACCGACATTCTGACCAAGGCTGAAAGAACCGTCAAAAAGAAGA
+TGGGAGCATACCAGGCAGAACAGGACCGGCTACGCATCGAGGCAGCGGAAAAACAGCGTA
+AAGAAGCGGAGAAGGAACGGGAGCAGTCAAGGAAAGACGGAAATTCCGCCCCTGTTATTC
+CCCTTCCACCGGAGAAGAAAGAGGAGCCGGTGAAGATTGAAGGGGTGTCCTTTTCGGAAA
+ACTGGACATTCATCATTGAAGAGACCGACAAAATCCCGCGGGAATACATGGTTCCGGATG
+AGAAGAAAATCCGCCAGGTGGTGAAGGCGTTAAAGGCTGATACCAATATTCCCGGTATCA
+AGGTCTACGCGGAAAAGACCGTCAGTGCCAGGACATGAGACCATGACACTTGAGGCACAA
+ATAAACATAGACTTTGCCCCTGAGGAACACGCCTACCGCGTTGACGGCAGGAAAGTTTCC
+AGTGTGACAAGCATCCTCAAAAGTGAGGGGTTCATTGATACCCGGTGGTACAAGCCATCG
+GGTACCTCTCGCGGGGAGATGGTCCACCAGGGAACGGAGGCAATCGACCGGGGCCACCTT
+ACCATTGCACAGTTCCCACCATCGGAAATTATTCCCTACCTCAAAGCCTGGCAGTCGTTC
+AAGGCTGATATCGGGGTGAGTGAGTTTGTGATCATCGAGCTTCCGATCGGCAGCAAGGTG
+ATGGAATACGGGGGCATCCCGGATCGGGTTGCCGTGATCAACGGGGAGTATTGGCTTCTT
+GATATCAAGAGCGGAGCACATGAGCTCTGGCACGGTCACCAGCTGGCCGCCTACAAGATA
+GCCCTTGAAGAGACCTTCGGGCTGAAGGTTGCAAAGCGTCGGGTGGTGCACCTAAAGAAA
+ACCGGGAAGTACTCGATCTGTGGGGAGGACAAGAAGATCGGCTCCTTTGACCTTCCGGTC
+TGGGAACAGCAGTGGATTGCGATCGCGACCGCTCGGCTGATCAAACAGCGGTACGCAAAG
+ATAAAACCGGAGACTGTATGAGTCAGAGGGCAATTGTCATTCCAGCGGCCGAACGGGTGA
+AAACCGGAGAGCCGGGAGTCGTTTCCTTCCGCGTCGGAGAGGTATTCCATGAGTACCTTA
+TCCACCTTTTCCGGTACCAGGAAACAGAACGCAAGTCACCTGCCCCCTATTACTCACTCA
+AGATCGACACCCCGAAGCGGCCGAGGACAACCGGAGAGAACAGCCAGAACCATCATATCA
+ACGGCCACTGTCAACAGATTTCCGTTGATACCGGCCAGCCTTTCGAGGACGTGAAGAAGT
+ACGCGAAACAGTTCGCGCTCACCATGGGCTACCCCATCCTTGAGGACGAGAACGGGGAAC
+CCATACACGACCTATGGGGAAAACCGCAAGGGATCAGTGAGTCTGATTGCAGTACTGAGG
+ATGCGGCAATCCTCATTGAAGCGATCCACCAGATAGCGGCGGAAATGGATATCAACCTCA
+TCGAGGACTAAGGAAGCACCATGGGAAAAACAGCAACAGGGACAAAGCAGAGAGCAAAAC
+CGGTACGAAGACAGAAGACACGACGACAAAAGGCCGTAGATGCAGCAGATCGGTGGTTCA
+GTCTCTACATACGACAAAGGGATGGGAACCGTTCAGTGACAAGTAACTGTACAAGGAACC
+TGACCTGTTCACACCTGTTCTCACGAAGATTCTACGCTACCCGCTGGGATGAGACGAATG
+CCTATTGCCAGACGGCCGGAGAGAACCTCTACCACAACCGGGATGCAGGACCTTTGACCA
+GTTACTTTCTGGATGTGCATGGAGAGGAGGCCTACCGGAAGCTGTATGAAAAGGCCCGAT
+CAGGGGCCAAGTTCAGAACAGAAGAGATCGAGGATATCGCTGCTTACTACAAGAGCCGGT
+TTGAGCGGCTTACACAGAAGCAGCGCGACTTTTTCAATGTTATTTAGGGAGGGACTATGG
+CAAACGATATTACCAGTTTCACGGCAGTCGGACGAGTGACCCGTGATGCGGAATTCCGAT
+ACACGAACGGTGGAACGCAGCTGTGCAAGTTCAGCATTGCGTCGAATTATAGCAGGAAGG
+TACGGGATAACTGGCAGGATGAAGTCAGCTACTTTGACTTCACCCTATTCGGAAAACGGG
+CGGAAGCACTTGCTCAGTATCTCACCAAAGGTCAGCAGGTGGTCGTTTCGGGCCAGCTGC
+GGCAGGAGCGGTGGGAAGACAACGGACAGAAGCGAAGCAGGGTTGCGTTCTTCGCCCAGG
+ATGTACAGCTGATCGGGGGAAAGCCCACCGGTCAGAGTAACGGGCAACGGTATGGAGAGG
+CCCCTTACCAGGGTCCGCCGCAGAACCGGCAGCAAGGCTACCAGCAGGGGCCACCGCCTA
+ACAGCGGCTACCAGAAGCCGACGAGCGGCTATGACCAGTGGGGACATCCGATAAACCCCG
+GACCTAATAATCAGGGCCCGGAACAAGAAATGAACTTCGACGACGATATACCGTTTTAAG
+GACGAATTACCATGGCACGACGCAGAATGATCGACCCGTCAATTTGGAGCAATGAACAAG
+CGCAGTGTTTATCAACATCGGCGTTCAAGGTGTATGTGTTTCTGATTTCACAGTCCGATG
+ATGAGGGGTACCTGAAGGTATCCCTCGTCATGTGGCCCTCATTGATCAACCCTGTTGACA
+GGAGCTACACGAAGGACCAGCTGGTAAATGACCTCAATGAAATACTCTCTTGCGGCTTGG
+TAGAGGCCTACCGGTTGGGTGATGAGGTCTATGTGAAACATCCTCATTGGACACTTTACC
+AGACCATACAGAAGCCTTCAGGAAGCAAATACCCGAAAGATGGGGAAAGAATCTATCGCA
+TAGAGGAATATCGTAATGATATCGGTACGGTACCACATGAATATGATACCGATACCGTAC
+CGGTACGAGAGGAGTATGATACCGATACAATACCGGTAAACGACCACTCTCATTTCGTAC
+CGCCTAAGTTAAGTAAAGAGAAGTTAAGTAAAGATAATACTAAGATACCTTCGGTAGCAT
+CGGCAGAGCCTCAGCCGGAGCCTGGAGAGGCGACAAAACCGGCAGAAGAGCCGGAGCCGG
+AAAGCTCCCCACTTCCCCCACCCGATTCGGAACCCGATCCAGAACCTAAGCCGGAGCCCG
+AACATGAACCCGACATCGAACCGGTTCTTGAGCTTGAATGCCAGGCACCGAAGAAGCGCA
+AAGCCAGCAAGGGGAAAGCACCTACCGCCGGGAAAGAACCGGCAGACCCGCTGTACCACT
+CGATCAAGGATTCCTTCCTGGCTGTTGTCGGGGACTTCTCGAACTGGGGCAAGGAAGGCA
+AGGCGATCCACGGGATCATCGAGAAATGCTCTCGCGCCTCACCGGAAGACCCTGCCGGGT
+GTGCCGAGCGGATGATCGGGGAGTTATGGCGGCTAAAGAATTCGGCGGATCGGTTCTACC
+GAGATCAGCCCTTTGTTCCGTCGACCCTCAACGCTTCGGGAATCTGGGACCGGGTAGCCG
+AGCAGCTGAAGATCACGGCCGATGAGCTGGAAGGTGTGAGGATGTGGGAAGCGCTTGACC
+CCTACGGGGTGAGAGGAAAGAGCAAGCAGGCGGTGGGAGGTTAAGCGTATGCAGTGGAAC
+ACCAAGACATTCATGGCGATGTTGCAGCAGTACTACGGCAAGCTTTCGCCGATCCACGCG
+GGAGCGTTAGTCGACTGGCTCGATAGCAAGCAGTTTTCGGGTGAGTATCTCAAGCGGCTG
+TACCAGGAGATAACCGAGAGCTACTCAACGAAGTACGGGAGGCCCTGTGACCTTGCGATC
+GTGAAGGAAACGCACATGGCCCTTGCACCTTCGTATGTGCCCCCTGCCCGGCAGCTTGAA
+AGTGATCAGCGGATGATCGGGGAGCGGTTTGTTGAGCGGGAGGAAGGCGCAAAGCTGTTT
+GCGAGCATCATCGAGAATCTGACGAAGAAAAAGCGGCGGGTGAAACCGGAGAATAAGTCG
+AGGAGAGTGCGGAATGACATTCACAGATAAGTACCTGAAAGAAAGGATTCCGGCGGTAAA
+GACGGTTTTCAAAGGGGATGATCGTATTGAAAAGGAAATGGTACTTGAGATAACGGACTA
+TGACCGAGGGATCATTGAAATGAAAGCCGGTAATGCGTATTACCGGTTCCGGCATGTTGA
+TCTTGAGCGAGCCATTACATCGATGCAGGTGCGGCAAGAGGTAAATGCATGAGCGAGTAT
+GGTGTAAGAAAAGTTTGCGGGAATTGCAGAAGTTTCGAAAAGTGCTTTGCCGAATCAGAG
+GAGCTTATCGGAATCTACTCCCCGGGTTGTCTTGCGGCTGATAAGGAGGAGACGCGGTAT
+ATGCCTGCGTGTGGAGACTTTGAGCCGATGATGAAGCTGGTAGGGCTGTTAGGAACGGAA
+GATGAGGGCCGGTAATGGGACGTAAGCTTGCCATTGAAACACATCCACAGCGGCACGAAA
+TAGAGCAAATGCTCTTGAATAAAGTACCGGTGTCCCACATTAGCGAGCAATTCGGTGTCA
+GTCGCGGTGCAATTGCCCGGTTTCGAGACAGCTTTGAAGGCAGTTTCAAGGCAATTGCGA
+CGAAACGAAGTGAATTGCTTACAAAATCGGTTGATGATCTCGAGGAGTTCCAGGAGGACC
+TTCGGGGTGCGGAGAGTATCTGGAACACCTTAAAGCGGATCACCCAACGGGCATGGATGG
+TCCTTGACGCCTGCCATGCGTACCTGCAGGACCCGGACGATCCAGGCAAGTATGACCTCG
+GCCCTCGGGGAGAAGATATCACCGTTGTGCTGACCGAGTACGATGATGAGGGGAAGCTGC
+AAAAGGAAAAGCGAAAGCTCTCGGATGTGATCGCGGAGATTGAGGGGACGGGGAAGAACG
+TTGCCGAGATCAACTACAAGATCGCGGATCCCCGAAAGCTGATCCTTGATACGGCCAATA
+CCCTGAACAAGCAGCTTGAGCTTATCGCGAGGCTGCAAGGAGAGCTACAGGACGTGACGG
+TGAACATCACCCAGACATCTGAATGGAAAGAGATACAGACGACCATCCTGCAAGTGACAA
+AAGACTACCCAGAAGTGAGGGAGAAAATTGCCAGTGCCTTTACCGCCGGGGATGCTCCGG
+CAGACGTTAACTGAAAGCCTTCGGGCGACACTCGCTCCAAGGCAATACCTCCGGTCTCTC
+GGGTTTACGCCGTTCCTGTGGCAGGATTGGGCCCTTGACCAGTCGCTTCGCAGACTGCTT
+TTGAATTGCTGCCGACAGGCGGGCAAAAGCACGGTCATAGCTGCAAAGGCGGCACACAAG
+GCGAAGTTCTTTTCAGGCAGCCTCATCATTCTGGTGTCCCCTGCTCTGCGGCAGAGCAAG
+GAGCTGATGCGCAAGGTAGAGGACTTCATTGCACTGGACAAGAGCTTTCCTCCGGCAAGT
+GAGGAAGACAACCAGCTGACCAAGGAGTTTAAGAACCGTTCCAGGATCGTGGCGCTTCCG
+GGAAGTGAGAAGACGATCCGAGGCTTGAGCGGCCCGACCTTGATCATCATCGATGAGGCG
+AGCCGAATCCCGGATGAGCTGTACAAAGCAATCAGGCCCATGATGGCCGGAGCAGATACA
+GAGCTGGTACTCATGACCACGCCTTTTGGAAAACGTGGTGTGTTCTATGATGCGTGGTCA
+AGAAGTAAACGCTGGACAAAGATCGAGGTCGTCGGCCGGGACATTCTCGGACGGTTTCCC
+AACGAACAGGTTTACGCACAGCTGAGGCGGAAAGACGGGATTAAGGCCTGCTATTCGCCC
+CGCCATAGTGTTGAGTTTCTCGGGGAGGAGCTGGAAGAGATGGGCGAATGGTGGTACCGC
+CAGGAATACGGCGGAGAGTTCATGGACCCGATCGATTCGGTTTTCAATATGGAAGATGTA
+CGGGCGGCGATTATCAACGATACACCGGCCATAAGCTTTGCGCCGATTATCGAGGAAGAC
+GTACCGGCGCTTCACTTTTAGGGACATGGGAGGGGAATAATTGATCCGAAACATTGTATC
+TGTTGACCTTGGCCAGCAGTTTGACTTTACCGCAATCAGCGTGACGCAAACACGTGAACA
+GTGGACGACGGGGCCGAACATCCCGGCTGAGTGGAAGGCGACAAGCGGGGATAGGCTTCT
+GACCTATTACTACTATCTGCGGTACCTGGAACGCATGAAGATGAAATACCCGGACGTTGT
+CCGCGAGGTCAAGAAGATCGTTACCGCGCTTGAGAATGACCAAACAACGGCGCTTTTGGT
+GGATGCAACGGGCGTGGGCCTGCCGGTGGTTGAAATGATGCGGGAAGACCTGCTTTTGCC
+GATACCGATCATCATTACCGGCGGTAACAGTATCTCAGAGCAGAACGGAGGATTCCATAT
+TCCCAAGCGTTTCCTTGTTGCGGCATTGCAGGGACTCTTTGAGACCGGCCGACTGAAAAT
+CGCTTCCGGTATCGGTTGCCTTGCAGAGTTCATGCATGAGATCGAAAACTTCCGGGTGAA
+GATCACGCAGAGCGGGAACGACACGTATGAAGCATGGCGGGAGAGTGACCACGACGACCT
+TGTGATCAGCGTTGCGATGGGAGCCTGGTATGCGCAACGGGAAAGCATCAACAACATTCT
+CATACGAAAGAACGATAAGGAGGTGCTGGATGAGTACGATCCTCTCGATAGACTGTAAAG
+ACCCAAAGGTCAAACGATCGATCCAGTGGCTCCTGGCTGAGCTGGGAAGCCTCTCATACG
+GGGAGATCATGCTCTCGTTCACGCTCCACGACGGACAGGTGAAGTCGATCGACAAGGCGA
+CGAAAGAAAAGCAGAGGAATGCTTGATCCGGGAATTCCGGGAGGTATAAGATATGGATAT
+GCAAAAACCATTAGACAAAAAGATCAAATACGGATTGTGGATCGCATTCGGATATGTGTG
+CGGGGTGCTCCTCATCCTTGCGCCTATTCATGAGTTTGGCCATTGGGCCATCGGTAACCT
+CATAGGCTATCGGACCTATTTCTATGGCTGGACCTATGTAAGCCATGACGGATATCCGGA
+CACACCATGGCAGGGATACGTCGAAATGGGAGCAGGCCCAACCTTTGAGATTGTGGCCTA
+CCTTGTGATCTCGGCACTCCTGGCGTGGAAGCGAAAGTATGGTGGAGCCTTTTTCTTCTT
+GGGCCAACAGCTCTATTTTCCGATCAGGTTCTTTCACGATGATGAGTGGTACTTTCTGTA
+TGCGTATGGGAAGGCATTGATCCCGGCGAGCATTGTATTTGCCGTGATCATGTGCGTGGT
+GATCTGGGCAAACATGGAGCAGGACAAGGTACGGGCTGCGAAGCTTGCACGGGAGAAAGC
+GAGAAAACAGAAAACGAACGAGCGGCCCCTTGTCAAAGAAAGAGCTTTGAGATAGAATTT
+TTCATAACATAAGGGCGGGAAACCGTCGCGATCCGGCCGTATGCCGGTCGTCTACCTGAA
+TACCACAGGCGGCGAAGTATCTGAGTTGACATTGTAACAGGTGTCGGCGCAGGTACTTTG
+CCGCCTTTTTTTGTGCCCTTTTGGTGGCACTGGGAGGGATTATGCCGATTAATGCGCTTC
+GCAGGCGATGGAACGAGGGAGTTGTGGCAGACAACGCCTATGACAAACAGAGCGGTGATG
+CTGGCGGTGGTTACACCTGGCAGGAACGACGGCAGCTTAGAAATGATGGTGCTGAAGACG
+TCTCCAACGAGCAGATGGGAAGCATCCTGAAACAGGTATACGGTGACGCTTCGGAAGAGA
+CCTTCAAAAAGGCCGTGAAAGAGTATGACCTCTCCGATCTCAACCCTCAGCGGCAGAAAA
+ACTTTCTTTATGAAAAGCTTCAGGAAAAAATCAGGCAGGACCGGGAAAACAGCGCGGAGC
+GGGTGTGGTAAGAGGCTGGCATGGCTGAGGAAAAGAGCGCACAAGAGATCATCCAAACCT
+TCGAGCAGCTCAAGCAGGAACGATCCACGTGGGAAGATGAGTACCAGGAGATAACCGAAC
+AAATCTTTCCCCGTCGAAGCGTATGGACGGACAACAAGGGCCGCGCTTCCCGTTCAGGCG
+GGCTCATCTATGACGGCACCCCGATCTCCGCTCTCAACCTCCTTGCAAACGGGCTTGTCG
+GCTATCTCGTATCACCGGCAACTCGGTGGTTCAAACTCAGGCCGACACAAGATGAACTGC
+TCCAGATACGTGGGGCCAGACAGTGGCTTGAGATCGTTGAGAACCTCATCTATGACGAGT
+TTAACAGGTCCAACTTCTACGAGGAAATCGTGGAGTACTTCCGCGACGGCGGCAGCATAG
+GGATCGCAACCATTTATGTGCAGGAGGACATCGGCCGCCGAATGGCCAATTACTCATGCA
+GACACCCGAAGGAAATCTACATTGCCGAGGACCGCTTCGGGTACATCGACACCGTGTTCC
+GCCGATTCTTCCCAACGGCCAAGGAACTCGAAGAAGAGTTCGGCCGTGAGGCGTTATCGG
+ATGGCGTGCAAAACCTCTGTGAACGCAGTCCCTATGAGCGGGTGGAGATCATCCACGCGG
+TTTACCCTCGTAAGAAGCGCAATCCCAGAAAGAAAGGCAATCGTGACATGAAGTTTGCCT
+CTGCCTATGTGGAAGGCGGAAGCAACCATAAGATCAGGGAACGGGGGTACGAGCGGCTTC
+CGTATGTAGTGTGGCGCTGGTCGACAAACTCCGATGAGGTGTACGGCCGGGGACCCGGAT
+ATGATGCGCTTGTCGATGTGAAACGGCTGAACAGGCTGAGCCGGGACATGCTCAAACAAA
+GCCAGATGGCCGTTGATCCTCCCCTTGCTGTTCCTGAGAAGATGCGGGGAAAGGTCAACT
+GGGTTCCTCGGGGACTCAACTATTACCAGAACCCGAATGAGGTTCCTGTTGCCCTGAATC
+CCGGTATGCAGTTCCAGGTCGGCCTTGATCGGGAACAACACATGCAGCAGATCATCGAGA
+AGCACTTTATGACCGACTTTTTCCTCATGCTCGAACAGGCACCGAAGGAGATGACGGCAA
+CCGAGGTAATGGAGCGGCAGTCGGAGAAAGCGGCGGTACTCGGTACGGTGATCGGCCGAA
+TCAGCAGTGAGTTTCTCGACCCGATCATCGACATAACCTTTGATATTGCCATGAAAGGCA
+AACGGCTTCCCCCTCCACCGCCGGAGTTTGCCGAGGCCATGTACAAGACAAACGGCGGAA
+TCGAAATCGATTACCTGGGGCCGCTTGCACAGGCACAAAAGAAATTCCACGTTACGCAGG
+GAGCACAACAGAGTCTCAACGCCGTTGCTCCCATTATGCAGATCAACCCGCAAGTCGCGG
+ACCTCATCAACTGGGATCAGCTGACAATGGAAATACTCCACGCCTATGGCATGCCGCAGA
+AAGCCATTGTCGACCTTCGGGATGTGCAGAAGATCAGGCAGCAACGAGCGGTGCAACAGG
+CTGCGGCCATGCAACAGCAGCAGGCACAGCAGCTTATCGATAAGTACCCCATGGACAAAC
+AAGCCCCGCCGGACTCTCCCATGGAGGAAATCGGTAACCAACTCCGTGATGCCCTGAAAG
+GCGGAAATGGAGGTGCGGCGTGATCAGATGGGGAGAGCCGGTTTCACCGGAAGCAGAGCG
+TATCAGAGAGACCTACCGGAGGACCTTTTCCACCCCGGAAGGGAAAAAGGCACTGCTCTA
+CATCCTCACCGACCTGGGCTTTTTCGATGCGACGAAGGACGAAGCCGCACAGGCCCTTCG
+CAATTTTGCAGTCAGACTGCTTGAGCAGATGGGAATACTGCATGAGGCCAATGCAGAAAC
+ACTGGTGGCGCAACTTCTCAAGCTTGCGCCCTATGACTTACAGACTCACCGGAAGATCGG
+TGAACGGGAGGACTTTTCATGAGTGACATTATGGACCCTCAGACGACTGGGGACAATCCG
+AACAACGATAACGGTGCCGGTGCGAATGCTGGCGCCGAAGGGGCCGGAGAACAGCAGCAA
+GCGCAACAGACACAGCAGACAACGACTTCGGACCTTCCCAGGTGGATGTATCAGCTTTCA
+GGAGACCTGCAGAAAGACGATCGCCTGTCCGGTTTTACGAAACCCGATGAACTGGCGAAA
+GCGTATCTCGATTATGCGGGGAAAGCCGACAAGCTGATTGAGCTACCGGGAGAAAAGGAC
+GCGGAAGGATGGAAGAAGTTTTACGGCAAACTCGGCAGACCGGAGACACCGGAAGGATAC
+GACTTTTCCGGTGTGAGTATCCCGGAAACCATAGAAAAGAGTGAACTTGCCGACTTCCGC
+AACATGGCGCACGAGCTTGGACTATCGAAGGCCCAGGCAGCGAAGCTACTCGAACACTCC
+ATTGCCGACCTCAACAGCATCACCACCAAAGCCGACGAAAACGCGAAGGCTGAGGCACAA
+AAGAAGCTTGATGAGAAGAAGCAGAAGATCGGAGCCCTCGTGGAGAAATACGGGGACAAC
+TTCGAGGAGATTGTCACGAAGGCTCATCGTGCGTATGAGGCAGTCGGGAGCAAGGAACTC
+GGTGAGTACCTTGACTCAAGCGGACTTGGTGACGACCCGGTGATGGTCGGCGCGTTTCTT
+TCCATTGCGGAGAAGATCGGGGAAGACACGCTGTTCGGCTCATCCCATGGAGGTGGTCGT
+GACGAAGGCGCCGACTGGTATCCCAACACAAATTTTGACTCATAACGGGAGGGCATATGC
+CTACTATACCCCAGAAAAGTGAGCTTACGCTTGTCGAGCTTGCAAAGCGAATGGACCCCA
+AAGGCAAGCAGGCGGAGATCGCCGAGGTACTCGAAGAGACCAACGAAATTCTCGAAGACC
+TTCGGTTTGTTGAAGCCAACAACGTAACGACTCATGTGTCGTCTATTCGTAAGACCTTGC
+CGGAAGGTTCCTGGCGTTCGATCGGTGGATACACCAAGAGCACCTCCAGTGCTGTTCGTC
+AGATAACCGAGGACGTGGGAATGCTTGAAGCCTACTCCAAAGTAGACAAAAAGCTTGCCC
+ATCTTTCCGGCAATCCTGCGGCGTTCCGCAAGCAGGAGGACAAGGCCTTTATCCAGGGAC
+TTGGAATCCAGATGGCAACCGCATTCATCTACGGCGCCAGGGCGATCGATCCCGCATCGT
+TTAACGGTCTTGCTGTTCGGTTCAACGCTTACGGCATGCCGAACGTAACCAATGCAGGCG
+GCAACGGTGTAAACGAAGGTGTTACCAGCCTTTGGATGGCGCAGCACGATGTCGGCTCGT
+TTCACGGATTCTATCCCAGGGGCAGCAAGGCCGGTCTTGATGTAAAGGACCTCGGGGAGG
+ATACGGAAACCACGGCGGAAGGAGAACGGCAGATTTACCGGTCGCACTTCACCTGGGACA
+TGGGAATCATGATCCGCGATTATCGTGCGATACAGCGGGTTGCCAATATTCCGGTTTTCA
+ATGATTCGGAAAAGTTCGTGAAGTTCGACAACTTCATGATTGCCGCCCTCAACAGGATGC
+CCAAGCGCGGCCGTGGTGCTGTTATCTACGCGAATCTCGACATGTTCACCATGTTCGACA
+TTCTCGCAAAGGACAAGAGCAATGTCGCCTATGGCTCTGCGGAAGTGTTCGGCAAAACCG
+TTACGACCTTCCGTGGTGTTCCCATTCGACTCGTTGAGGCAATTTCTTCCGATGAAGACG
+TTGTCACCGAGACTGCGGCATAAGGAGGTTTACACAAATGATTCTTGATAAACGACTGAT
+GTTCAGCGAGAACCAGGCTATCACGGCCACTGCCGTGAGCACAAACTCGCTCACCTTCGA
+GGTCGATGATCTTGGCACGGGCGAGCCGGTTACCCTCTGGACGCAGGTAACCGAGGCCTT
+TACTGCTGCCGGAGATGCGAGTCTACATATTGATCTCCAGCATTCCGATGACGGGAGCAC
+CTGGAAAGACCTTGTGCCCTCCAGGGCCTTTGCGCTTTCCGATCTTGGCCTTGGGGCGAA
+TCCCTTGAAGATCAACGTACCTGCCGGGGCAAAGAAGCACATGCGGCTGAATTACCCGGT
+AGCAGATGGTCCCATGACCGCGGGGAAAATTACCGCCGGGCTGAAGCGATAGGAGGTGCA
+ATGATGAAAGTAAAATGCCTGGTATACACCTATCACCTGGGGCGTATCTGGCGCGAAGGG
+GTCGTCTATGATTATCCCGACGACAAGACTCCGCCGAAACGGCGTTTTAAGGTACTCGAA
+GCGCCGAAGGAAAAGGCGAAAGAGAAACCCGAAAACAGTGATCCGGAAAAAGAGAAGCTC
+ATCGCCCGTGCATCCGAACTGGGTATCGGGCCACCTTCCACCCTCTCCCGTTGGGGCGTG
+GATAAGCTGAAAGATGAGATCGGCAGGGCTGAGGCTGCCCTTGCTGCGGCAAGTGTCGGC
+GGCAGTGGAGCGTAAAGGGTCGCCATGACTGCGCTGGAACTCATCAACATTGCCTTGACT
+CGGATGAATGAATCGAAATTGACGAGCATCACGATCGACACCTATGTTGCCGACCTTTGC
+AGGCTCTTTCTCAAACCTGTTGCCGATGAGGTGACCCTTGAGGAAGACTGGCAGTTTGCG
+CGTAAGCGGGAAGCTTTGAGAACGGACGATGAGGGTGAGAACCAGACAGATTATGGATAC
+ATGTACCGGCTCCCTGCGGACTGTCTTTTTCCGAGGCAGCTCCGCAGTAAGGGGCAGTAC
+GAGATAGAGGACGGACGGCTTTACACCGGGGATGAAGCGGCAGTGCTCATCTACACAAGA
+TCAATGGTTGAGATAGCGCATGATGACGAGAATGGGCTCGATATTCCCGTACTTGTGACC
+TCGTTCCCGGTGACCTTTGCCCAGGCGGTTGCTTGCCGTCTGGGGAGCCAGATCGGCCCA
+AAGATATCGGACAATTTCAATCTCGCCTCCGCGCTCGGCCAGGAATACATGGTCATGCTT
+GAAAAGACCAAGGCCTTTGACGGCATGCTTTCTCCGGCCGAGGATGAGGCGGTAGAACTC
+TGGAGTGATATTCAATGAGCCGCCAGAGAATCCTTGTGACAGATTTTACCCGTGGGATTG
+TCTCTCCTCGGATGGTTCCCAGAATCGACCAGACAAAGGCGGTGTCAGAACTTACCGGCT
+TTGTCGTCCTTCCCGACGGTGGAATTCGGCGCCGGGAGGGGACCATCTATGCAAGGCGAG
+GGCTTGGGGTGCTTCCGACAGACTGTGAAGCGGTTCCGGCCTTTACCACCTTTGACAAGC
+GGATTACTGGAACAGAAACGCTACACCTTGCATGGATCAATGACGCACCACGCCAGCTCA
+ATGTACAGAACATGACCAATCGAACCATACAGAGTGTGGCAAGCGAGAGTCTTGAGGCTG
+GAAAGCCTCTTCTTGATTCGGGGAAATTCAACAACGATCTTGAATCCCTGTACGCGCAGA
+ATATTCACCTGTGGACACCTGGGGCCAGTCATGTACTGGACCTTGAGACCTGGGCCCTTG
+CAGAAAAGACCAGCCAGGAGATCAGCACGATCTATCAGGCACGAATGATCGCGGTAAACC
+GCACCTGGGGAACGGTCTACATGAGTGTCGCGTACATCTATCTTGATTTTGATTCGGACG
+GACACCTTGAGCTTATTCCCGATTTCTACGGATTCGAGCATCCCCGGTGGATCGTTGCCT
+TCGGTGGGGATGTGTATATCGGAACGGACAAAAGCGAGTGGATGCTTACCAGTGGGTATC
+CCTACTTCACCGATGACCTTGGCGGACTGATGATGCAGAAGATTAGCGGGATCGGGGCCG
+ACCTTGCCGTTGTGTTCGGTTCCTCGATCATCCTTGCAAAGGATAGACGGCTTGTCAGGA
+TCGTGTATTCATCGGCCGGGGAATTCCAATCCCAGAGCATGGCGGAGCTTATCGACAACA
+CGGATATCATTCAGATCGATGTGATTGAATACGGAAGCCATCGGTACCTGGTCTTTATTG
+ATCGGGATCGTCGGCTTTGGTGTTTGACCGAGTGCCAGAACACCGGCGTTGCTGCATGGC
+AAATCCTTGCCGAGCATGTCGGCTGGGTGAAAAGCTACGGCCAGGACCTCTATATCGCTA
+TTGAGCGGGACGGAGACTGGAACGTCGAAGTCATTCCCATGGACAACCTGAATTACCCAG
+GGAACCGGTCACAGGGGCTCAAAGACGTGCTATTTGAGCGGAGGGTATACGGCGATTGCG
+GGGGCTTTCTCCGCATTGATCATGATCCTTCGACCGGCTACTCGGTTACCGGCGACAGAT
+TACCGGAACGTCAAACCATGGAAGTCTACCTCCCGGAAGGCCAGTACATCGGCCAAAGAG
+ATACCGATGCAAACGGCCTCCTCATTGGATCGGCCGAAGAGATCGCAACCTGGGCAGGTT
+ACGACGGGAAACCGGTCTACCTCTATTGCTACCAGAGCGGGAAAACATTCACCTCCAGGG
+TGAAGACGCTCCCGCTTGAAATGGGAACAGCAATGGGGCCCGGCCTGGGCGCTCTTCGGA
+GAATCAACCGGGTGATTGTCAGAGTATTTGAATCAAAGGCACTCAGGGCCCGTGCCAATA
+CCGGGCGATGGGAAACATGGGAAAGTGAGGACTTGTTTTCCGGAAATGTAGAGCTTCCGA
+TCGACTGTGCTCACAGTGATCTCGTGCAGCTTGAGATCGAGGCAATCGGAGATAAACCGC
+TGCATATTCACTCAATCCAAATCGACGCAACCATGGGGGACGAATGATGATAGAGCCTGT
+CATAGTGCAGCACATGGTCGCCGAGGCAATGGGAATTGATTTCACAAACGTTGCCGTATG
+TATTCAGCAAGGATGGCTACAGGCCGTCATTGCCGGGGCGGCTCTCGTAGTAGGGGCCGT
+TGCCCAGTATCAAAGTAATAAAGCAGCAAAAAAGGCAGCGAAAGAACAAGCAGAACTTGC
+CAAAAAGCAGGCCGCCTTTAACAAAAAACAGGGCCTACAGCTTTACGGTGATGAAGGACT
+ATACAGGCAGCAAGCCAGCGAAGCCTTGGCTAATACCCAGGAAGAATACGATATAAACAA
+AGAGCAAATCGAATTTTCCTGGGATCAGGCGCAGCAATCCTACGACCTCAACCTCTCCAC
+CCTTGATCACAACAGATTGCGTGCGGATGAAAGCATTGATGATCAGAACTTGAAAAATCA
+GGCTGCTCTCGGTGCCTTTGGCGTCCGTGGCGGTTCCTCCAGAACAAAAGCCAACAAAAC
+GATCGCAGATGCAAGAGAAAATCTTTCCTTTGAATATGGCCAGAACAAAACACAACTCAA
+CATGAGCCTCGAAAGCGCTCAAAAGCAGACTGAACTTGCACAGGAGCAGCTTGACCTCGG
+GATGCAGAAGGCACAGCAGTCGTATGGGTACGCAATCGAACAGGCAGACATGGGCAAAGA
+GGCGGCCCTGAAAGGCTATGAGTTTGCCTCAGAGGGAATCAGCAACCAGTTGCAATCAGT
+ATATGACCAGGCAAATTCCTGGTCGGTTATAACCGCAGGTCTAAGCGGTCTACAATCCGG
+CTTTCAAATGGCATCGGCCGTTAACACTTTTGGACAACAGTATTTAAACGACGATGATAA
+AGTCAATTTTTGGAAAGATTGGTGGGCGTGATAATGGAGGACCATAATGCCTAATGCGTT
+TGATGCCATCTTAAAGGCAATGGAAACAACGGCTATGGGGCTTCAAACATACCAAAGAAT
+TGATGCTCCACGAGTCGAATATGAAGCGACGAAACTCCAGAGCCAGATAAAACTCGGCCT
+CGATTCTTTCTCTCGTGACGCGGAGAAACTGCCGTATGGACAGATACAACAGGCATGGAC
+CGAACGGCAGGAACAGATTACCGACATGATCGGGCAACAGCCCTCGGAAATCCAGTATGT
+CATGAAAAATTGGTGGCAGAACGCATCGACTAGCTACCAGTCAACCATGAACGGGCTTGT
+TGATCAGAAGTACCGGGCACAAGAACTGACTTCGCTTTCCGAGCAAATTGACGAACTTGC
+AAAGGACGGAAGCGATGAATCAATTGCAAAAATCAAGAAGCTTGTCGAATCTGCCAATGG
+AAGTGGGGTTATCGATCCTGGGACGGCGTACAAGCTGAGTTTTGAGTCAATCGCGAAGGT
+CAACTACAACGCCGCCAAAGCCAACGCTTTGCAGATCATGGATAAGGACGGTGTCAGTGC
+AGCCCTTGAGTATGCCATGAACGGAAACGAGAAGCTCTCAAACGACATGCGCATAGCGCT
+ACGAAACGAGATCAAGACCATTTACACCGACCGGGAGAATGGAAGGATTCAGCTTGATAC
+GCAGGCGAACGACGATGCCTCTTCCCTTGCTGAACAAATCCTTGATGGTGAGAAGCCCTT
+GTCTTCAATGGACCAGTTGATTGAAAGCGATACTCGCATGAGCGGCAGAAGTCGACTGAA
+TTGGCGTAATTGGATGATCGCCGTACAAACCCAAAGGGACAAAGAACCCGATCCCGAAAT
+GGCCGCTTATGCAAAGACTGCTCTTAACAAGGTTATGGAGGACTGGGAGAAGAATGGACC
+GAAAGCTGAACAGAAGAACATGCTTTTGCAGCTTTTGACAAATGGCTACATCAACAAAAA
+CACCTATGATGATTACCTCTCTACGATTTCCAAGGATCCCATAACAGAGCCGGAGTTTGA
+CGACGGAATCAAGCTCATCAAATCAGCCTTGAAAGATAACGACGAAGGCATGGAGCAGGC
+CCTTGCCGCCTTCAGGCAGAAAGTCTATGCAAATCGTTACATCGGCGATGAGCTCAACCA
+AAATCGGTGGACCGGCCAGGAGCTTGCCCAGGTTGCGCAGAACATCGCAGCTCCCACCGT
+CTTGAACGAAATGAAGATGGATCAGTTTCACGTCGGAGGATTTAACCTTGACGGTTCCTT
+CTTAAACTCCGTTGAAGAGAACATCCTGAACGCTCAGAACGGAAGGTTTCTCGGTTTGAC
+GGAGGAACATGCCCAGATGTTCAACCAGATTCAGGAAGGCCAGGAACAAATCATCTTGCA
+GCTCCTGCCGGACGGAACCACGATCAACAAGATCACCAGGAACAAAAACGGTCTTCCCGA
+ATTCCACACGACAGTCGGAACATTCATGTTTGCAATCCCAACAGATGAGAATGGGGAGCC
+AACGTCAAAAGACGAGGTCCTCATCTATCACCTTGGTGGCGATCAATGGGCGGAGTATGA
+CCGAAAAGCCGTCAAGCAAGAAGCCGACCAGCGCAATGTTTCCGATGCTACGGCCCTTGC
+CTCAGCAGAGAAAGCCTACCTTGATCAGGAAGATACTCCGAGGCAAGGCATCCCTCGGTT
+TACCGTCAATGACGATTACTCTCCCTTAGAGAAAGAGCTTGACCTCATGCGGCAAGAGCT
+CCTTGTCGGTGGCGGATTTAGTCAGTATGGGAGGCAGTGGGACTCTACCGCAACCCGAAG
+AATCAAAGAGATTGCAGAGCGTCGGGGGCTGCCGACTTCGACCGTCGTCCAGGCGGCAAA
+GAGCGTCGGATATGTTGATGAGGATTTCAAGATCGGCGTTTTTCGATTCTGGCCTTTTGG
+AGGTCGAGAGTGAACATCCTTTGGAAGAAACGGGAACCGGAAAACACACGGGGTGCTGCA
+ACCTCCCCCTGGAAAACCGACGGATTCAGAATCGTGTCGGGCACAATCAATTCTCTTGAT
+CAAATGAGTCAGGAAACCGAACCCACCCCAGGAGAGGCGGTCGAGAAGCTCAAATACAAG
+GATGCATTCCAGCAAATCCTTGAGGGAACGCTCGGCGATGGTTTCTCCGATGAAAGCCTT
+CAAAAGCAGTTCTACCAGGTAGCAATGGCCGCCAAGAATCCAGAGGAAGAGATGGCAAAG
+ATGGCAACATCCGCCTTTCTCTCCCAGCGTTTGAATGCTCCACCCGATGTTGTGTACAAG
+AACTTTGATTTCTACACCGAGAAGTACATGACCACAAAACAGGCGCCGCTCTCAGCTTGG
+GCCGCGATCAAGAATGAAGCGTACACCAGCCAGCTCATGATTGAGCGTGGAAAGATCGGC
+TATGAACTCATGTTTGACCCGGAGAACCAAGAGCTTTGGGACAAGCTGCTTGATATCAAT
+GAGAAGGTTCCGCCACAGGATAACCAGAAACGCTCTGTGCCCATTGAACTGGTAAAAGGT
+GCGGCGAAATTTCTTCCCTACGTGGCGACCGGAGCAATCGGCTCTGCCGATGAATCGATG
+TTCGGTGCAGGGCTTGGCGCTGTCGCAGCCGCTTCGCTGGCCTCTGCCGGGACACTTTCC
+GGGGTGCTGACCGTACCCTCTCTCATCCTCTCGGGCTACCAGATTGGGAAAAAGGTCGGG
+TCAATGGATGAGTATTTCAAGATAAGCGCCGGAAATACCTATGCGGACACCATGCAGAAG
+AAAAGCGCTGACGGGAAAACGGTTCCCGTGGGCATTGCCAGGGCCTTTGCCTTGGCCTCC
+GGGACACTTGCCGGAGCATTGGACACCATACAGCTTGATCGTTTTGTAGGCGGTTCCCAG
+TGGTTGCGTAAGGCCGTACCGCAAGCCGTCAAGAAGAGTCTGCAAGACAGCTGGTTTTCA
+GCAATCCTCGGGAACCCCGTTGCGAAGTTTGCCGGCCGATGGGGATCCTCTGTAGCGGAA
+AGCGTGGTTGAGGAGACCTTCCAGGAGACCATCGAAATGATGGGAACCGAGGTTGCCGTA
+ACCGTTGCGAATTGGGCAAAGAATACGAACATCCCACAGGCGACAATCGACGACTGGAAA
+GATATGTGGATGCAGACCATTCGCGATACGGCGAAGGGAACCACCCTTCTCGCCCTGCCC
+GGCGTTACGGCCGAGAGCTTTGCGGCCGAACACCAGAAGCGACAGTCGGCAAAGGATCGA
+GAGGCCGCCCTTGCCAGCGGAAACGCGGATATCGATCTCGGGAAGTTCAACGACTATGCG
+GCCATTTTTGAGGAAGAGGATCTTCAGAAGAGCACTGAGAAACTGGTCGCCTGGAAAAGC
+GCGGAGCTGAAAAAGGCGGAACAGCGGCTTGCCTCCGACCCCACTCAGGAAAACTTTGCG
+ATGCATGAACTACAGTCGCAGGAACTTGATAGAGCCGAGCTTGAGGCCTCCGTCGCAAAG
+AAAGTGAGCGAGCCAAGAGTTTGGGAGATGACGCAAGACCAGTGGATAGCGCAAAAGCAG
+AGGCTCTCAGACCAAGAGCTTGAAAGCCTCAAGACTTCCATTGCCGCAGGCTTTCCCGGA
+TTCACGGATCAAGAGCTTGAGGTTTCCGCAATCGCAATGGATACCATTGCAAGAAACTTC
+GGACAGACCGGGACCGCTTTACTCGATACCATGCTGACGATCGTACCGGCAGATGAAGGG
+CAAGCAGCGGTTGAAACACTTTTCCCGGGTAAGAGCGTATCGCAGACAAACAGTGCCGCT
+ACCTTTTTCCGAGATGCAGAGGGGAAGCTCCTTTCTCCGACAGAGGCCGCAAGGGGACAG
+GCTAAGGCCTTTATCGCTTCCCTCTCTTCTCCAGATTTGTCGACCTTTCTGCATGAGTAT
+TTTCACTTTGCCGATGTCATGCTCATCTCTCAAAGCCCGGAGCACCGACAGCTCTTTTCA
+AAAGCGCTTGGAAAGGATTACTCACAGTTTACCGATCAAGACCGCGAATACCTTGCGTAC
+ATGTTCGAGAAATATCATCGAGACGGTACGGCTCCCACTCCTGAACTCAAAAGCTTGTTT
+GCCAGGATCGCAACGTCACTCAAGCAGTTTGTAGAACGGATGGTCGGCCTCAAGCCGATG
+AATGAGGATCTACGCAAGGCCTATGATGCGCTCTACTCCCTGAGGTCGGAGGATATCAAG
+AACGACAATCCCGATCTCAAGGAAAAAGTGGTACCAATCAAAAGGTATGCACTTTTTCAA
+GCAGAACCAAACGAACGGGAAGGCTTTCAGAGGACACTAAGAGAGGCATTTGAATATAAA
+GGCCAAGGTGTTATTAAGCTTTCAAATCGAACGCCTGAAGCTTTAAAAGCATCTGGAGCA
+AAAGACCTTCCTATAGTCCTTACAAGAAAGAGTCTTGAGCATATCAGAAAGGACCATCCC
+AATATACCAAAATTGGTTTTGTTATCAATGCTTGATGATATTTCCGATCCGGTAATGGTA
+TTTGATAGTGCTTCGAATACTGAAAAAAGAAAAGGATTTGTCATTGTAACTAATCAGATA
+GTTGATGATGCGCCTGTAGTTATTGCTATGCATTTGGAGGTTGGGAAGCCTCAATGGCAA
+ATACATAAAATAGCTTCCGAGTATGAAAAAAACAGTTATAAAACTGTCTTTTCGAAATGG
+GTAGATCAAGGTCTGCTTCGGTATGTAGATAAAGAAAGAGCCCTGAATAATCCACACATC
+TCCGCCGGGCTCCGCTTGCCCCTGGAGGTAGATAATTCAAGACCCCTCTTAAATAAGGTA
+GTACTGAAAACTGACCTTGTCAACAATAAGCAAACAAAGCCACTTTTCCAGGCTCTTTCT
+CCCTTGCAAAAGCTCAAGCAGAAATGGGACCAAGAAATCGAAAAAGCGGAACAGGAGCTT
+GCAGAGGCAGAAGACCGGGTAAAGGCCGGAGAATCATTTTCCGTTGTCGACAAGGCCCTT
+GAGCATCTGCTTTCCCTCCAGGAAGAACGCGAGCTTGCAATCCGGGATTACGAAGCGAAC
+CGGATGACGGACCATGATGCGTATTCGGATGCCGTAGAAGCCTCGGTACAAAAGACGGTG
+GAAAACGGCGATTGGGTACCGGATTCCCAACTGAAAGATTATAGCTCGCAGAATTGGGCC
+CGTGATGAAATCGAATACCGGCAGCAGGCCATAGAGGATGCTGGAAAGTATGCCGACAAA
+GACGAGTATATCGCCTCTCAGGTTCTTTCCGACAACCTCGAAGACGGACACACGCCGGAG
+TACTACGGGAACATCTTTGATGCCTCCCGCGAGACAGAAGCGAATCTGACCGGCCGGGAA
+GCAAACTATCGCTTTATCAAATCACTTTCTGCAGATTACCTTTCCTCTGAACTCCTTGAG
+GCTCTGCACGTGTTTGGAAGCGATGGCCTTTCCGGCTGGCATCCTATAGTAAAGAACGCA
+GCCCTTAGCCTTAAAAAAGGCAAGAAGCTTTCACAGGCCCTGTACAAAAAGGTTATGGAT
+CAGATCAAGGCCGATCCCGAAGTCTACCGGATGAGTTTTGCCGAAGCAGCTCAGGACACC
+GAAGGAATGCGACAAATTCAGTGGGAAATCGAGCACTCAGAAGAAACAGAACTCGAGAAA
+CAGCTCAAGGCAAACCGTCAGCTGCGCAGACAAAACGAAAAGCTCAACAAGTCGGTTGAG
+GCCTTAAACCGCGAAATCGACCTAACAAATAGTGTCCTCGGCGATTACAAGCGAAAGCAA
+GAGGGATTGGAAGAGGCTTTCCGTTCTGCTCGGGAAGAAGCGCGAAAGGGTGACGTTGAA
+AGTCGAAAACAGTGGGTAAGCCTACTCTCTGATGCAAGAAAGGAAGCGTATCTGCAAACG
+CGCAGGGCCGTAGCTGATACGAAGCAGAAAATCCGAGATATGCGGGATGCAAAGGCCTTC
+TATGAACGAATGATAAAAGCCATCATGCGACCGGCCGGACGCTCAATTGCCTATGATCAG
+CAGGTCCAGATCAGGGAAATACAAGGCCGGTATGTGGCCAGGTTTACCCGACGAGAAAAG
+GAAATGCGGCAGGCATACCGGAAGCTCCTTTCCGACGCCGGTATCGATCCACGAATCAAG
+GAAGCCATACAAGAGAACCTGAGTAAGCAAAGCCTTCGCGATCTATCTCCGGAAGAAATA
+GAGAGCCTGCACGCTGAGATTGCGGCCCTGAGAACAAAAGGGCGTGAAATTCGGGAAGCG
+CAACTTGCCACTGAGCACATCACCAGGCAATCAGCCATCCAGAACGTGCTCGAAACACTG
+GGCTTTGAAAAGCCGGAAGAAGGGCTCGGGCTCAAGAAAACAGAACGTGGACGCAATAGC
+TCTATCTTGCAGAAAGAACGCCTGACCACCCTCCTTCCGTCTCATATCGCGGAGATGTTT
+GACGGAGGCAAGAAAGGCTCGTTTTACCGCTGGTTGATCGTTGAGGTTGAGAAAGCAAAA
+TCCGAAGCAATCAACAATAAAGACCGAAGGATGAACGCCGGGTATGAAGAAATGAAAAAG
+CTCGGCATCAAACCGAAGGACTTGATCAAAGAGCGGAGCATTGACGGGCTCACCTTCCAG
+GTTCAGGAAATCATGGGGCTATACGTCTATATGCAGAATGAATCCGAACGTGAACGACTT
+CTGTATGGGAATAGGATAAAACCGGAAACCATAGCAAAGGCAATCAAAACGCTTACACCG
+GAGCAGAAAGCGTTTGCCGATTGGATGATCGACTCTTTTGAAACCGACTATTCTCGTTTT
+GAGTCTGCATTCATCGCCGACCAAAATACAGCAATGGGGAAAGAGAAACGCTATTTTCCC
+ATGATGGTGAAAGACCTCCAATTCGATACGAAAGCACAGGAGATTGCCTCTGATTTACTC
+TCCCGCAGCCATGCCGTAAAAAGCTTTGTTTCAAGAGGATCAACACATAATCGAATCAAA
+ATAAGCAGAGAGCACCAGCCCTCCATGAGGCTTGATGCCTTCAATATCTGGGCAACAAAT
+GTGGATCGCCAGGAGGACTACATCAATAACGGTCTCCTTGTTAAGCGGCTGCATGCAATC
+TTCGGTAACCGGGAGGTCCAGGAAGCCATCATACAGCGCTATGGTAAGGATGCGGCAAAC
+TGGCTCAAGGATCAGATCAACGAGATTGCAAAGCCGCTTGCCGGAGTTAAGTATTACGAG
+CCGATCATGCAGCTTTCGCAAAAACTCCGTTCACATGTCGGCTTGGCCGCTCTTGCCTGG
+AACGCACTCACCCCCTTAAAGCAGTTTCCTTCCCTTTTCCTGGCCATGGGCCGGGTTCCT
+GCAGGAGAACTCCTTGCAGCAAGCGGAAGGCTTATCGCTTCGGGTACCGGGCTGGTTAAG
+AAAATGCACGAGCTTGATCCCTATATGCGGGCCATGGACTACGACCCGGTGCTTACGGAA
+ATGAGGGAAGCGGACAAAAACCGCTATGAAAGATTTGTCACCAAGACTGGAGAGCTTGGG
+ATGAAAGGAATCTTTGTCGTCGACAAAGCCGTTAAAAGCATTATCTGGGATGCTGTCTAC
+GAGCACAATCTGAAACAGGGGAAGACACAGGATGAAGCGATACACGAAGCACGCAGGGCC
+ATCATTGAAACGCAGCCAGGCGGATTTCGTGAGGACTTACCCGTTGTTGCCCGTCAGGGT
+GAGTTTTTCAAATGGATGACGCTTTTCAGCTCTCAGTTGCAGAAGCTATACAACATGACA
+ACCTATGATATTCCCCAAGCCGTCAAGCAGGGGGACATCGCCACGGCACTTCGTATGAGT
+ACCGGGTATATCATGGCTGCCGTTTTGATCGGGATGATTAACAAGAAAAGCACGCCGGAA
+GACGCCAAAGATGCCGGAAGCATGGTCCTTGAACAACTGGTCACATCGATCCCGATTCTT
+GGAAGCCTCTTTGTGCAGGGGGCAAAAGGCTGGTCGTCAAGCAATCCCGTGACGGAAACG
+GCCAACCAAGTCGGAAAGGTTATCAACGCAATCGGAAAAGATAAGTCGGATGAGCAGGTC
+ATGAAAACGGTCATGGATGCTCTGGAACAAGCTCTTTTCTTGGGAGGACTGCCGACGGTT
+CAGGCAAACCGGATGATCGATTTTGCCGAGACCGGGGATCCCTGGGAAATTGTGGGAGGA
+CGGAGCAATGAGTAACGTTGAGCTTGAACTTAAAGGCCTAAGAGCTGCATCACTTACCAA
+GAAGGAGTACGAACAGGGGTACGATCGGAGTGATGCAGACGGTAATAGCATAGTCACGAC
+AACACCACAGGCACCGGAGAACCTTATCGTTTCAGCACGAAATCGAGTGGTTTCGATTAC
+GTGGGACAGGCAGGAAAACCTCACTCCCCCTCACAGTTACATCATCGAATGGTCCCTTGA
+TGAGGAGACCTGGAATAAAGTCGGCGATACCACCTCCAATCTGTTTATTCATGAGGGATA
+CATAAAAACAGTCGATGATGCTGCGGTCGATACCCGGAATTTCTACCGAGTGAAAATACT
+GTTGGCCAGTGGTATATCGGGCCCCTATAGCGAGATTGCTTCTGTTCTGTGTGAACCGGT
+AAAACAGACCGACTTAATTGGTTCGCTTGCCGGGAAGATTGATGCCGGGGCCTCTGCAAA
+CGATATAGCTCAGATGCTACAGGGCTATGCAAAAGAAAAAGGCGTTACCCTTACGCAGGC
+GTTCGGCAACTGGGAGAACCTGAGCGATGCATCCGTGACCGTTGATGAAGGAGGACCGGG
+GGAAACAACAAAAAAACTGTCCTTCATTATGAAGAATGTAGTTATTGCCGATCTTATCCT
+CGGTTCCCTGATTAAAGGTGAACACATCGAAGCACATAGCATTGACGCAACACACCTGAA
+AGCCGACATCCTGAAAGTACTTTTCAGCCTGACCTCGCCGAATATCGAAGTCACCGATGA
+GGGACAAGCATACAACTTGAATAATTATGCAAGGCTCCTGATAACTCCCTATACCATCAC
+CTGGCAGACGAGAAGTTCCATTGACTCTCCCTGGACCAGCCGAAGAATGCTCGGCAATAA
+CGAAGGAGATGATCTACTTGCCGATATAGCGCGTTTCCGAGGCCTCTTTCCATTAGATAG
+GGGCTTTGACCGATCTATTGGTTTTGGAAGGCCGGTAGGTTCACTCACCTACTCGTTTGA
+CAACATACTAACAGATCAAAACGGTGAGAATGCTTTTAGTGGAAAACAGACCGCATATAC
+AACGGGGAAATTTGGAGAAACACAAGCGGGAGCTATTGCCGCATCTACTAGTGCCGATTA
+TGCGGGGATGGTAGAGAAAGTATTTTCCCGGTCAATTACTGATTATTGGACATTGGCATT
+CTGGCTAAAGGAAACAGCCGCTCCCGTCTGCACGACAAAAGTCATTGAGATCAAAGAATT
+AACGCAAACGATAATAAGAAATACACAGGCCATAGGCGACGTGTCTTTTTCCAAAAGTGG
+AAATTACCTTGCGATTGTTTGTGCAGGAAGCCAAGGCCAGGATAACGGAACCTTTATCTA
+CAAGAAAAACGCAGGGTCCTTTTTCCTTTTAACAAAACTTGTACCATCTGCATCAGAGAG
+CTACCAACCTACAAATATCGCTTGGAGTGCCAACGATCAGTACCTTGTGATCACCGGTAA
+CTATGCAGGGCACATGTACAAAAGGAACGAGGATACCTTCAACTTACTCGGCCGCCTTGA
+GGGGATAGACAATACATCACGATCGGTTTGTTTTTCGAGCGATGGGAATTATCTTGCTTG
+TTCTTCCGGGTCAGGAAACTTGCTAAAAGCATATAAAAGGTCCGGCGATGTTTTTTCCAG
+GTATTCTCTTTCCTACACCATAAACGCAAATGCAAAAGCCCTTAGCCTTTCAAGTGACGG
+CACGTATTTGATGGCGACGGTTTCAGGATATGGTGGTGAAATTGACGGTCTATACCTCTT
+TAAGAACAATGGCTCCGAATATCGGTTACTCACTATTATTCACCATTATGATATCGATAA
+TAGCTATTTTTACTCAGTAGAATTCTCTCACAACGACAATTACATTGCTTTCGGTACTCG
+TCACGGTGTCATGATTTATAAACGTGTTGGGGACAATCTCCAGAAAGTGACAGATGTAGA
+GGCTGAAAATGATAGTGTCATTTATTCGGTACACTGGAGCCCCAATGACAGATACCTATT
+TTTTACGGGAGCAACAAGACCGTCAATTTACCGTCGAGATGGAGATGTCTTTACAAAGAA
+ATCCGATTTAGGAATATTCTCAGAATTTTACCAGTCCCCTTGTGCTGGTCTATCGGCAAC
+ACATTTTGCCTATGCAGACAGAGTCGATAGTACTTCAACCACACATGAAAAGGTTTACAT
+CTATGCGTTTGAGGAGAATGACAACTGGTGGCTTGAACCTTCTTTGCAGAATGTACCGAA
+GCTACTCTCGTTTGAAACCGATGAGGATGTTTTATCCGTTTACCGGAAACCCCATTCCAT
+AGTCCTTGCAAAGGCCGTAACCAAAACATCTCAAACACTCACCATCGATGAGGTAAAGGT
+TTGGAACTTCATAGCTTTACGAAGCAATGGCGATGGGACAATCAGCTTCATGCTCAATTC
+GCAAAAGGTCACATTGACGGTATCGCTTAAAGATACAGAGAGCTTGAAAATCATCTTTTA
+CCTTCTGAAAGAAAATGGTCTCAAGATCGATGACATGATCTTCTTTACCGGTCTACTGAC
+TGACGACTTCCTTCAGACCTATCGAAATTCTGGCTATCCCTGGGCTGATGCGGAATTCGG
+CGACACCTTTATAGGAGCTTCCCCAGGAAAAAAAATCCGTGTTATCGACAAGGTCGTTTT
+TGAGAAAGAGATTGATGCGGCCATACCCACCCCCGTTGTGGATCACGAATGGAACGGTAC
+GCAGTTATCGATTACCGATGAAAGCGGTCAGGGGCCATATGTCGATCTCAAGGGACCCGA
+AGGCCCTCAGGGGCCCCAAGGTAAACAAGGAGTCCAGGGGCCTACCGGACCGACCGGTCC
+TAAAGGAGACAAGGGGCCGACTGGCCCTACTGGACCGAAAGGACCAACCGGTCCCAAGGG
+AGAACAAGGCCCCACGGGTCCCACAGGACCCCGCGGAGTACAGGGGCCGACAGGGAATAC
+CGGGCCCGCCGGACCAACAGGACCACGGGGGCCTCAAGGAAATCCCGGAATAACAATTCC
+CGATATATCAGGCCTTGCCGAAATTACATCGATCGACCCGTCAAAAGATAAGCTGATTGT
+CTATGACGCAAGTACGGGTACGCATAAATCAATGCGGATATCAGAACGTTTTCCCGTAGG
+CTCCCAGTACACACAATATGCCTCAAGCGCAAGCAATGACCTCTCGGTTGCCTTTCCGAA
+TAGCGAGTCCCCCGCTTACCTGTTTGGAGGGACCTGGGAGAAACTGTGGGACGGCGAAGG
+CATAGACTTTCATACCGAAGGTTATAACGGTTCAGGACGAACAAATGGGCTAATGCCCGA
+TAATCTCCAAGGCTTTATCACACTTAATGGTGTAGGAACTAATACAAGCGGAAGTAATCC
+TAAAATTTTTGTCTATGGATACACGACTGAAGACGTACCAGGAAAAGCTGAGGATATCAA
+TGCGGCTGCCAATATTAATACAACAATTCAAGGCAAAACATCGGGACCCAAAAGTGATGG
+TACGAACGGTACTCCTCGCATTGGGGCAAGAACATCCGACCGTAACCGCCTCATGAGGAT
+ATGGAGGAGAATTGCATGAAAACCTATGCCGTAACAGACGGCTCAATGATCACCGCTGTG
+GTGCAAAGCGCCGATGAGACGGCAAAGCTTGCAGAGCTGTTTCCGGAAAAGAGCATCAAG
+GAGATTCCTTCCTGCTTTAGCGGAAGCAAAGGAGATGATATCCGCTTTTACGATGAGGAT
+GGAAAGCGGCTTTCGGTAGCAGCCGCAACAGAAGCCGGGCTCGTGCTTGAAGCCGGAGAA
+CATGAGGCCTCTATCTGGGAAGGCGGTAAGTATGTGCTTGTCCCCGACTATACCGGTGTT
+CCCTACTGGGACAAGGCCACAGGAGAGGCGGTACACCTGTCCCTCGGCCGAAAGCCTGAT
+GAGAGTATGACCGACATTGCCCCGCCGGACCCTGGGGCCTTGTGGAGTGAAACGGGTTGG
+ATGGTCCCTGATGAGGTGCTCTCCGAACGGATTCGCATGGAACGTGATGCGCTGCTTTCA
+GGGAGTGACTACATCATGATGGCCGACTATCCCCTGGCCGATAAATCGAAGTGGAAAGCC
+TACCGACAGGCTCTCAGGGACATTCCCCTACAGCCAGGCTTCCCTCAGGAGATTTCCTGG
+CCACAGGTACCGGAGAAAAGGAGTTAAGCCAATGGGCGATAACGACAAAATCGATATGGT
+CTTAAGCATTGTGACGGAACAAGGCCGGGACATCAAAGAGATCAACAGTAAGCTCACCGA
+CTTTTTCATCAACCGGGAAAGTACGTGCCCTGTTGAGAAACGCCATGAGAAGAAGATTGA
+GTACCGAACAGTCATTGTCGGAATGGTGTGCGGTCTTGGTGGTTCGATTATCGGGGGACT
+ACTCCCCGTTGTTTTGGGAGGGTGAAAAATATGATTATGAGCTGGAATCGACGAGAGAAA
+AAACTCGTTTGTGGAAACAGAAAAATACCTTGTTCCTGCATTGTTCGCAACGAGCTTAAT
+GGATGGAGACCGCTGGCAAATAAACCGGCACAGGATGAGGTCGTAAGGTCTCTACCGGAG
+AATATTCCGTACATGCCACGACCGTTTCCGGTCGGACGTTGGAATGTTGGCAGACCAGTG
+CCTCGATCTCATCCGTATAAAGCCCCCTATTACATCCCGACTGATGCCTTCCAGATGCTG
+CCGAGATGGGAACTTGACGACGATGGTGGATATCTTCGGGAAACGGAGGATATGGTCCGT
+GACGAAGATTATGGACTTCATTGCTCATCATCAAACACAACACTCGGCTGTATCAGAATC
+ACCAAGGAAAAGGATTTGCTCTGGATGGTCGAGAAGATCAATAGAACGCTTGATACAGGA
+GAAAAGGTGTATCTGGAGGTAGCGGCATGAAGAAATTCTTCAAAAGTTTTTTCAATTCCA
+CGAATGACATAAACGAGAGTACGGTTATCGGGTTTGTCGTTGCCATTTTGTTTGTTGCGG
+CGACCTTCCTGAATATTGTGGATGCCGAAAAATACCAAACGATCGGCTGGGTATTGGTTG
+GATTGTTTACCGGATCAACGGCGCGAAATATCGTTGACACATTGAAAAGGTCAAAGGGCA
+ATCCCTAACGAGGTGAAGGATTGAGATGCGCAAAATTATTAGCATTATCCTTACTCTTTT
+TGTGTGTTTTTCCGCTGGTTTCCTCCTGGGCACTTACCGCTCAGGAAGAGGCGATAGTGG
+ACGAGCTGCAGAATACGATAGTAGAGGCAAAAAGCGAGATACAGAGTATCAAAAGCTCAG
+CAATGAGTATGAGCGAGCAGTTGAGACGTACGAGGGAGAGCTCGCAGAGCTTCGAGCGGA
+AGTGGCAGGATACGGAAAAGAAGCTGGAGGGCTTACAGAGCGAATCGGAGGAACGGAAAG
+CCAAAGTGTCGGCATTGCAGAGCGAGCGGGACGGGCTGAGGAAGGACTATCAAGAGCTCT
+TGATCTATTGCGAAGGCTTAGAGAGGCGGAATCAGCGGCAGCAGACGGCCCTTAAAGCCG
+GGGGCTCTCTCCTGGCCGCCTCAATCATCGTGAATGTACTGCAGGCTCTGTTTTGATCTT
+GCTAAGGGGGAAGAGTTGCATCCTTCTCATGGGAGGATTATAATACTCATGGGTCATTTC
+GTTGGTTATCTGCATGAAATTCATGTTGATAAAGGAAGTTATATGCAATTTCTTTTTTGG
+CTAAAGATATATGAGAAAGAGCCCGCCGTCCATGGGCTCCGTTAAGAAATTAGGAGGATT
+AGATGAAAGATATCTCAGAAATAAATATGAATCTTGATGAATATAATTTTTATACTTTTC
+AATTCGTTGATGAACTTAGATATTTTTTTACCCCTGAACAAGTTTTTAATAAAAATGACG
+CATTTAATAATTTCATTGAAAATTTAAAGGTAAAATTTAGAGACTGTGGATGGGAAGGAG
+ATGGAGAACTTAATATTGGTTGGCTTCCTCCATTTCTTGATGAATCTATTGATCCTAATT
+ATGGAAATATATATTGGCATATTAAACAGGATAATAACGGCTATTCTTTTATTGCATCAC
+CTTCTACTTTTTATTCTTCACGAATATTGGATCAAAATAAAAAACGTTTTATAGGTAGCA
+AGATTCTTGAAACTCAATCTATTACGGAAATTACAAGTAAAATACTTATAGGGAAAACCA
+AAGAGATTCAAGATATTATTAATGATTTAAAATTAGAAAGTTATCCAGATATCATTTTAA
+AAACTATACTCATTAGCATCCAAAGTGATCTCGTTTCATCCTTTATATCTTTTATTGAAG
+ATGTATATTTACAATTTATCATTCATTTTTTCGAGGAGAACAATAGAGACAATTTAAGAC
+TAAGTAAAATCGATGCTAAAATTGATATGAAAAGTATTAATTCAGACATTGATTATAGTG
+ATAGAGAGCAATCATTAACACTTCGATTAATTATGAAATCTATTTGGGAAAATTTTAAAT
+TTTGGCCATTTAAAGAAAAATATAATGAGATCACAAAAGCTATTGATTTCCAAATTGATC
+AATCATCTCGTGATATGCTTTTTAAGCATGTATATTTACGAAATTGTATCCATCACAAAA
+ATGGACAAGTTCAGAATGATTTACAAAAAATGTTAGGTAGAAATAATATAAAGGTGTTAA
+ACAATCAAAATAGAGAAATTGTGTTGAAAGAATGGGATTCTATAGATTTATCTATAAACG
+AAATATCAATTTTTAAAGAAAAATTAGAAGACTTCATAAGCAAATATGAGGTACATATTT
+TACAAAGAATGACAAGTAGATCAATACATCATAGTTTTAAAAACCCAATTGTCAGGAAAT
+TTGATTTATCAGCAAAGAAAGACACTGATTAA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_015761.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1407 @@
+>NC_015761.1|provirus_847397_862760
+TTACTGATAGGGATGCTTCTGTTTTTCTTCCCCCTTCGTTCTTACAAAAGTAATTCGATA
+TTTGGTCACCTGTAAGCCGGTAAGATTTATTGCTTCTCGCCAGCGTGCGCCTGTGCTTAA
+GCATATCTTGACTACCAGTGCCAGAATTGAGTCCTGACGTTTGCAATCAGCCAGCAATTC
+AACAATCTGCTCATGGGTAAGCCATGCCATCTCTTTTTCTGCGATGATGAATTTTCGCAT
+GTTCTCCAGTGGGTTCGGATACGACTGTGACCGAAGTGGACCGGGAAAACTAGCTGTGCC
+GGGTGAGAGTGGGCGAGCTTGAAACCAACTGGATTAACTGGCTGACGCTGCGTGCCGGTG
+GTGCCCGTACATGGTGGTGTCCGTCGCCGGATGAGCAGGTGGTGGTGCTGAGCATGGGCG
+GCAATCTGGAAACCGCTTTTGTGCTGCCCGCCATCTACTCCAATCAGTTTGCGCCGCCGT
+CGGATTCTGTGGACGGCTGCGTGACGGAGTACCCGGACGGGGGCTGGTTTGAGTACGAAC
+CCGCCACCGGGCGGTGGCATGTCCGGGGTATCAAATCCATGGTGATCGAGGCGGCGGATA
+ATATCACCCTCAAAACCGGTGAGTTTGTGGTGGAGGCTGACACAACACGCATTAACAGCG
+AGGTGGTGATCAACGGCGGCGTCACCCAGGGCGGCGGCGCAATGAGTCTAACGGGGTCGT
+GATGGATAAACACGGTCACACTGGCGTTAAGTCAGGCGGGGATACATCGGGAGGTCCGGT
+ATGACGTTGTATATCGGTATGAGCAGGAATGACGGGCAGGTAATTGCAGATACCGACCAT
+CTGCGCCAGTCGGTGCGGGATATTCTGCTGACGCCGCAGGGCAGTCGTCTTGCTCGCCGG
+GAATATGGCTCCCTACTGTCTGCCCTGATTGACCAGCCGCAGAACCCGGCACTGCGCCTG
+CAGATTATGTCTGCAGTCTATGTGGCGCTGAACCGCTGGGAGCCGCGCCTTACGCTGGAC
+TCCATCACCATCAACGGCAATTTTGACGGCTCTATGGTGGTTGAGCTTACGGGACATAGT
+AATAACGGAGCACCGGTTTCCCTTTCCATATCAACAGGAGCAGACAATGGCAGTCATTGA
+CCTTTCCTGGTTACCGCCGCCGCAGATAGTGGACGTGCCGGATTTTGAGACGTTGCTGGC
+TGAGCGCAAGGCCTCTTTTGTGGCTCTTTATCCTGTGGATGAACAGGACGCGGTGCGGCG
+CACGCTGGCGCTGGAATCTGAACCCGTCACCAAGCTGCTGCAGGAAAGCACCTACCGCGA
+AATCCTGCTGCGCCAGCGTATTAACGAGGCTGCGCAGGCGGTGATGGTGGCCTATTCGAT
+GGGAAATGATCTTGAGCAGCTGGCAGCCAACTGCAACGTGAAACGTCTGACGGTAGTGCC
+TGCTGATAATGATGCAGTACCGCCGGTCGCCGCAGTGATGGAAGATGATGAGGCGCTGCG
+CCAGCGCATCCCTGCAGCATTTGAGGGACTGTCCGTTGCTGGCCCTACGGGAGCCTATGA
+ATTTCACGCCAGAAGTGCGGACGGACGTGTGGCAGATGCCAGCGCAACCAGTCCGGCCCC
+TGCCGAGGTGGTACTTACCGTGCTGAGCCGGGAGGGTGACGGTACAGCAGTAAAAGACCT
+GCTGGATGTGATTGAAAAAGCCCTGAACAGTGAAAGTGTACGCCCGGTGGCTGACCGTCT
+GACGGTTCGTAGTGCGGAGATCATCCCGTACCGGGTGAAGGCTACCATTTTTCTTTATCC
+AGGGCCGGAAGAGGAGCCTGTTATGGCGGCGGCAAAAGCCAGCCTGCAGAGGTACATCGC
+CAGTCAGACGAGGCTGGGACGTGATATCCGCCGCAGCGCCATTTATGCCGCGTTGCACGT
+GGAGGGCGTCCAGCGTGTGGAGCTGACGTCCCCTCTGGAGGATGTGGTGCTGGATAAGAC
+GCAGGCGGCATCCTGTACTGAATGGAGCGTTACCAACGGGGGCACGGATGAATAGTCTGT
+TGCCGCCGGGTTCGTCGCCGCTTGAGCGCCGACTGGCGCAGACCTGCAACGGGATTTCCG
+ATCTGCAGGTATCGCTGCGTGATTTGTGGAACCCGGCAACCTGCCCGATCAGATTTCTGC
+CTTATCTTGCCTGGGCGTTTTCTGTTGACCGCTGGGATGAGAGCTGGGCAGAAAGCGTCA
+AGCGCCGCGTTGTGCAGGACGCTTTTTATATCCATCAGCACAAGGGGACAACCAGCGCCG
+TGCGGCGCGTGGTGGAGCCGTTCGGCTTCCTGATCCGCATCATTGAGTGGTGGCAGACCG
+GCGAAACGCCGGGGACGTTCCGTCTGGATATTGGCGTGCAGGACCAGGGCATAACAGAAG
+GAACCTATCTGGAGCTGGAGCGCCTGATCGGTGATGCCAAACCATGCAGCCGTCATCTGG
+TTGGTATGTCCATCAACCTGCAGACAGGCGGCCCGTATTTTGTGGGTGCAGCCACCTACA
+CCGGCGAAGAAATCACGATCTACCCGTACATCAACGAAACCATTATTTCCGGCGGCACCG
+CCTATGAGGGCGGAGCGGTCCATGTTATTGACACGATGAGAGTGAACCCATGAGCGCAAA
+ATTTTACACCCTGCTGACGGATATCGGCGCGGCGAAACTGGCAAGCGCCACCGCGCTCGG
+TGTCCCGTTGAAAATTACCCATATGGAGGTGGGTAGCGGTGGCGGTGTGCTGCCCACACC
+CAATTCGCAACAGACCGCATTAGTGGCTGAGGAGCGCCGCGCGGCGCTGAATATGCTGTA
+TATCGATCCGCAGAATAGCAGCCAGATTATTGCTGAGCAGGTGATCCCGGAAAATAAGGG
+CGGTTGGTGGATTCGTGAAGTTGGTTTGTTTGATGAAACCGGTGCGTTGATCGCTGTGGG
+TAACTGCCCTGAGAGCTACGAGTCACAACTGGCAGAAGGGAGCGGACGTACGCAGACCGT
+GCGCATGGTACTGATTACCAGCAGCACCGATAACATCACCCTGAAAATTGGCCCTGCTGT
+GGTTCTGGCAACCCGCAAATATGTGGATAACAAGGTGCTGGAGCTTAAGGTGTATGTTGA
+TGACCTGATGGCAAAGCACCTTGAAGCTGTTGATCCTCATTCGCAGTATGCACCAAAAGA
+CAGTCCGACACTCACCGGCACGCCAAAAGCGCCGACTGCGGCGGCAGGCAATAATTCGAC
+GCAGCTTGCAAATACGGCCTTTGTGCAGGCTGCTATTCTTGCCATGATTGGTGGCGCACC
+GGCAACGCTGGATGCGCTGAAAGAAATTGCAGCAGCTATCAATAATGACCCGAATTTCAG
+TACCACCATGAACAATGCGCTGACACTGAAAGCACCGCTGGCAAATCCGGCCCTGACCGG
+AACGCCCACGGCTCCCACTGCAGTTCAGTCAACGAACAATACGCAGATTGCCACTACCGC
+GTTTGTGAAATCTGCCGTTGCCGGGCTGGTCGGTTCCGTCGCCGGAGGCGCTGGATACAC
+TGAATGAACTGGCGGCTGCGATGGGAAATGATCCTAACTTTACGACAACAGTGATGAACG
+CGTTGTCGGGAAAACAGCCACCTGATGCCACGCTGACAAATCTCAGCGGGAAAAGCATTT
+CAGGGCTTCTCGAATACCTCGGTTTTCAAAAACGTCAGAATAATGTGGGACATTGTTAAT
+TCAAACGATACATACAACATTTATTTCATTGGAAAATAATAGTTAAGATTGAATTAAAAA
+AATACCATTCACACATTTTTATTTATATAAAAATATCAAAAAAAATTAGTCACAACAAAC
+ATCATTTATTTTCATCCCTGCCATCAATCTTAGATTGAATTTTAGCATGTCAAATGATAT
+ATTATAAATCGTTCATTATATTTTAAAGGGTTAAACAAAGAATGAGTGATAGTCAGGGAT
+TTCAGATTATATTTATTTTTACATGTTTGATATTCGCAATAGTATTATTCTCTCATAGAA
+AATTTAGTTATATTGATCGTGTAACTGAGAATGACAGAAACACCAGGTTGGATAGTTTGA
+GATTTTTAATGTCATCATTTGTTGCATTTCATCATTTTATTTTTAGCTATCATCTTGTCA
+ATAGTGGGCAGTGGATAATCCCAAACCATCCAATTGAAGAATTTGCTGGAAAGTTCGGCG
+TTGCTATTTTTTTTATGATTTCAGGATATTTGTTTGTTAAGTGTATAGAAAAAAAAGTAA
+ATTGGCTAACTTTCTTTATAAAGCGGTTTTTTAGAATTTGGCCTGTATGTGCTTTGTCCT
+CGGTAATTTGTATACTAATTGTTATATATATTGAAATTAAAAATAATATCCCCCTCAATA
+CTGATGGCATAATGCAATGGTTTGATGGCGGTCTAATCATAGATACACGTCCCAACCTGG
+GCTACGAACATTCAACCTTAATAAATGCAGGTGTTACCTGGACATTATATTATGAGTGGG
+TGTTTTATTTCTCGTTGCCTTTTATTTCTTTATTTTCTTCTAAAAACAAAAGCTCTCAAA
+TTTTACTATCAATAGTCTTTTTATCTATATACATATTTAGTAAGTATGATTATTTATTGT
+CATGTTTTATACTGCTTTTTGCGCTTGGTGGTATGGCAAAAAAAATAAGAGAACAAATAT
+CAAATGTTAATCAACATACTGTAAACATACTGGCAGTCACTTCATTTATTTTATGCTTCT
+ACTTTGGTTATAAAGAAAATCCATTTACGATATCAATGATATTTCTGTATTTTGTTTTTT
+TCCTTTCAGTTTGTCTTGGCGCTGATATTTTTGGAGTGCTTAGATTAAAAGGAATCATTA
+GGCTTGGTGATGTCAGTTATAGCATATATTTGCTGCATGGGATATTTTGGTTCATCATGA
+ACAAGCTCATATTCAGCGCAGGGTTTGAGAATTCACAAGCCATATACTATACAGCTTCAT
+TTTTAACATGGATTTTCATATGCGTATTCTCCAGCATCGTGTATGCATTGTTAGAAGTGA
+AATTTATACATATTGGAAATATTATATGTAAAAAAATCACAAATAGTAACATTCAGTAAT
+CTAAAAGATATTATATATAAAAAATTAACACCAGACCTCCTAAGATCTGGTGTTAACACA
+TGATGTTATGAGCACTTAATTGAAAGACTGAAAACCATTAATTACTTCTTGCGGAAATAT
+AACTGTAAATGATGAATATTTAGTATTAAAAATAAACATTAAGCACATTGATTTTATCTT
+GGTTTTTGCCAAGTACTATAGCAGATGGATGAGATTGTAATTAACTGGTGGCGGTGGATA
+CTTCCAGCACACACCAGAAATTAACTAAACTGTTCCCCGGTAAGGCAGGCCATACAGGTT
+TTGAAGTATCTACACGCATCAACAAGACCCGGTATTTCCTCCACGCAATCAATGCAACGG
+ACTCATCCGCAGTCGCTATCTCCGCATCAACAGCATCCTGACGCCATTCAATCTCAGTAT
+CGGCTACTGTCTTTAAACGCAATTTTTCAGATTCTGCACGAGAGACTAATTCATCATGAG
+TCGGGGCAAGAATATCAACCCATGCAGGCATTCCATCGCAGTCCACTCCGAGAATTTTAC
+CCTCAGGCGCGGGGCCAGAATATTCAATGTGGATTGATGCAGTGACTTCAACTAAATCAT
+CAGGCCAATTTCCTGCCTGTTCATAGAAGAACTTCAATACTTCATCATAAAAACCGATAT
+TTGACGCGCTAAATAAAATGATCATATCAATATCCTATAGCGAACCAGAACCCACCACCG
+TTTGAGTTGAAATCAGAGTCATTAGCGACATAGAAGCCAAATCCTGTTCGCGATACCCCT
+GTCGACGAACAACCAACCCCTTTACCAGATTGTGACGTTGCGTCCAGACTACAAATAACG
+GAAGCCGCTATTGGCGGAAATGTAATGGTAAAGGTTACATTTGTGTTTTCCCAGCTTGAG
+TCGGCCCGACTTTACCCCATTGAAAAATAAGCCCTCCGGGCAAATACTGATATCCGGTCT
+CGTTTTTTGATACACCAAAAGCGTTCATATCCGGAACTTGATTTGCTCCAGTACCAATTA
+TTTTGAGAGCAGCGCTTCCCAGTTGAAGTAACGTTCTGACCTCATCAACAGTATTTTTGG
+CGATAATATCGCACCCAGTTTTGTCAGTGTGGTTATATCAGCAGAATTGTTACTGTTGAA
+AAATGGCAGTTTGTCCTTCGCTATTTCCAGCCCGGATAATGCAGTCAGCTGTTGTGAGTA
+ATTCTGTTTGTTTCCCAGTGCTTCTGTTAAACCGACGTTTAAGAAAATGCTGTTTTCCCG
+TCTGGCTGGCATTATTTGGGCTTTTGCATAAGGGAAAACAAATGTTAGTCGGCTATGTGC
+GCGTATCAACAAGTGAGCAAAACACAGCGCTGCAGCGTGATGCACTGGAACGCTCAGGAT
+GTGAGCTAATTTTTGAAGACAAAATGAGCGGAAAAACAGCAGACAGGCCCGGGCTAAAAA
+GGCTGCTCAGGACGTTATCAGAGGGAGACACGCCGGTTGTATGGAAACTCGACAGGCTGG
+GACGAAGCATGCAACACCTTGTGACCCTGATAGAAGAACTCCGACAGTGCGGAGTTTAAT
+TTCCGCAGTCTGACTGACAACATAGATACCAGTACGCCAATGGGGCGGTTTTTCTTTCAC
+GTTATGGGGGCACAGGCGGAGATGGAACGCGAGCTGATAGTGGAACGAACCCGTGCGGGA
+CTACAAGCTGCAAGAGCTAAAGGCAGGATTGGAGGGCGAAGACCAAAACTGACGCCAGAG
+CAATGGGCGCAGGCAGGTTACTTGCTGAAGGTGAAACACGGCAGCAGGTTGCTTTAATTT
+TTGATATGGGTATCTCAACGTTATACCGCAAATATCCTGCGACATTGTGTGATTAACAGG
+ACAACGCCGCGCAGCTGTCTGCGTGACGTAATCAATACAACACAGGGCGAAGCCTATTCC
+AATCAGGAGGTTCGCCGCTATGGCTCAGGATTACCACCACGGGGTGCGCGTTGTTGAAGT
+CAACGAGGGCACCCGCTCTATCACCACGGTGAGCACCGCTATCATGGGCATGGTCTGCAC
+CGGCGATGATGTTGATGCGTCCGTGTTTCCCCTCAATAAGCCGGTCCTGCTGACTGATGT
+GCTTACCGCCAGCGGTAACGGGTGAGTCAGGAACGCTGGCCCGTTAGCTGGATGCGATTG
+CCGACCAGTCAAAACCCGTGACGGTTGTTGTGCGCGGGCCGCCATAAAGAAGTGGATTCC
+GGCGAGTGGAAAACCGGCGAGAGCAGCAGCACCAAAGTCAGCAGTATCAACAGCTACGCG
+AAACTGACCATTAATGGTGAGGTGCTCTATGAGGTCGATCTGGTCAACATGGTAGAAATC
+GTTGGCGGCGTGGACCTGATGGAAGAACACCGTAATGCCCTTGGCCTCTGATTAACCTTA
+ACGGCGCGGGCAGCCGCGCCAGTATTTCATTAACAGGATACGAACATGAGCGACAAGCTG
+ACTGAAAAGACCGTAAAACTGGATACTCCCATCATGCGCGGTAAAGCTGAAATTACCGAA
+ATTGTGCTGCGCAAGCCTCAGTCCGGCGCACTGCGTGGCACCCGTCTGCAGGCCATTATG
+GATATGGACGTGGGCGCAATGATGACTGTGATTCCACGAATCTCCACCCCGACGCTGACC
+GCGCAGGAAATGGCAGAGCTGGACCCCGCCGATCTCACCGCGCTGTCGGTAGAGGTGGTG
+ACTTTTTTGTTGAAGAAGTCGGTGCTTGCCGGTTTACCGACAGCCTGACGATTGATGATC
+TTGTGGCGGACATCGCCACCATCTTTCACTGGTCGCCATCCATCACTGACGTTATGCCGC
+TGACTGAGGTGCTGGCGTGGCGGCATAAGGCAATTCAGCGAAGCGGGGCCAGCGATGAGT
+GACAATAACCTGCGTCTGCAGGTGATTCTTAATGCGGTTGACAAGCTCACCCGCCCATTT
+CGATCCGCGCAGGCCAGCTCAAAAGAGCTGGCTGCAGCCATTCAGCAAAGCCGCGCCCGT
+TTAAAAGAATTAGATGCTCAGGCGGGCCGCATTGACGGTTTCTGCAAGGCCAGCGCGCAG
+CTGGCAGTCACCGGTAACAGCCTGAAAGCCGCACGCGAAGAAGCTGCGAAACTTGCCACG
+CAATTCTCTGCCACCAACCGCCCGACGGCGGCGCAGGCACGGCTGCTTGAGCAGGCAAAG
+AACCGCGTTACGGAGTTACAGAGCAAATATAACGGTCTACGTCAGTCAGTGCAGCGCCAG
+CGTCTTGCGCTCAATGAAGCCGGACTGGACACGAAAAAGCTCAGTAGTGCGCAGCGGGAA
+CTGCGGCAGAATGCCGACGAAACCCGGCAGGCCCTGGACCGGCAGCAGAAATCCCTTAAA
+CGCCTGGGCGAACAGCAGGCGCGAATGAACGCCGTCCGCGATCAGTATTCGCGCCGTCTT
+GAGGTGCGGGATCGCATCGCCGGGGCAGGGGCTACCACTACGGCTGCAGGGGTGGCAATG
+GGCGCACCTGTTGTGGCGGCAGTTAAGAGCTACGCCAGCATGGAAGATGCCATCAAGGCC
+GCCAGCGAACAGCTGCCGATGGAGAACGGCGCTATAGACTATGCCGCGCTGGTTGAAGGT
+GGTGCTCGCATGGGTGTGACCAATCAGGACGATCCTTACGAAGAGCAGAAACGTGACCTG
+CTGGCTTTTGCATCCACGGCGGCAAAAGCGGCAACGGCCTTTGAGCTGCCCGCCGATGAG
+CTGGCGGAAGGATTGGGGAAAATCGCACAGCTCTATAAAGTGCCGACGCGCAATATTGAA
+CAACTGGGCGATGCGCTGAACTACCTGGACGATAACGCCATGTCAAAGGGTGGGGACATT
+ATCAACGTCCTGCAGCGTATGGGGGGCGTGGCTGACCGCCTTGACTTCGAAAGGCTGCTG
+CGCTGGGTTCAACATTCCTTTCTCTTGGGGCTGCCCCGGAAATTGCCGCCAGCGCCTCTA
+ATGCCATGGTGCGTGAACTGTCCATTGCCACCATGCAAAGTAAGCGCTTCTTTGAAGGCA
+TGAATCTGTTGCAACTCAATCCGGCGGAGATTGAAAAGCAGATGACCACCGATGCCATGG
+GCACCATTCAGCGGGTTCTGGAGAAGGTCAACAATCTGCCGCAGGATAAACGCCTGTCAG
+CCATGACAATGATTTTTGGCAAAGAGTTTGGCGATGATGCGGCAAAGCTGGCTAACAACC
+TGCCGGAGCTGCAGCGTCAGCTGAAACTCACATCAGGCAGTGGTGCTAATGGCTCGATGC
+AGAAAGAATCCGACATTAACAAGGATTCATTGTCTGCGCAGTGGTTGCTGGTTAAGACTG
+GCGCGCAGAACGCTTTCAGCAGTCTGGGGGAAACGTTGCGTCAGGCGCTGATGGATATTA
+TGGGCATGGTTAAGGGCGTGACCGGGGCGCTGCGTCGCTGGGTGGAGCAGAACCCCGTGC
+TGGCTGGCACGCTGATGAAAGTGGCGGCGGCTACGGCGGCTGTCACTGTAGGGCTGGGTA
+CACTTGCCGTGGCGGTAGCTGCCGTGCTGGGGCCGATTGCGGTGATTCGGTTTGGCCTGT
+CTGTGCTGGGTGTAAAAACATTACCTTCCGTTGCTGCAGCGGTAACACGTACTGGCGGTG
+CCCTGTCATGGCTGGCAGGTGCGCCACTTTCCCTGTTGCGTCGGGGTATGGCGTCATCCG
+GTGGCAGTGTCGGGTTACTGAGTGCCCCGCTTAATTCCCAGCATCGCTCAGCCGGAATAG
+CGGGTAATGCGCTGAAAACGGTAGCAGGTGTGCCGCTTGCCGTGTTCCGTGCCGGTATGT
+CAGGCATCCGTAATGTTATCGGTATGGTGATGAACCCGCTGGCGGCGTTGCGGGGTGGGC
+TGACAGCTGCCGGTGGCGTGTTGCGTTTTCTTGTTTCTGGTCCGCTGGCATTACTTCGCG
+GCGCGCTGTTTGGCATTTCTGGCCTGCTGGGCGCGCTGCTCAGTCCGATAGGGCTGGTTG
+TGGCTGCGCTGGCTGGTGTGGCGCTGGTTGTGTGGAAATACTGGCAGCCCATCGGTGCAT
+TTCTGGGGGGCGTGGTGGAAGGGTTCAAAGCCGCTGCTGCGCCCATCAGCGCCGCCTTTG
+AGCCGCTCAGACCCGTGTTTCAGTGGATTGGTGACAGGGTGCAGGCCTTGTGGGGCTGGT
+TCAGTGATTTACTTACCCCGGTTAAATCCACTTCCGAAGAACTGAACAGCGCAGCTGCAA
+TGGGGCGTCGGTTTGGTGAGGCGCTGGCGGAAGGTCTGAATAGGGTGATGCACCCGCTGG
+AGTCTCTTAAATCCGGTGTGTCATGGCTACTGGAAAAGCTCGGTATTGTCAGTAAGGAGG
+CGGCAAAGGCGAAACTGCCCGCGCAGGTTACGCAGCAGCAGTCCGCCACAGTGAACAGTG
+ACGGCAAAGAGGTGCTGCCGCCAGGCGGGTTCCCGGCTTACGCGGGGATGTACGACAATG
+GCGGGATCATTCCACGCGGGCAGTTTGGCGTTGTCGGAGAAAATGGCCCTGAAATTGTGA
+ACGGACCGGCAAATGTTACCAGCAGGCGGCGTACTGCTGAGCTGGCCTCTGTCGTTGCTG
+GCGTGATGGGGGTAGCTGCGACACCTGCAGAAGCGGCTCCGCTTCATCCGTTCAGTTTGC
+CTGCGAGGGCATACCAGCCCCCGCTTGCTAAGGCAGATAGCCCGCCGCCGGTTATTCGTT
+ATGAGATAAATGCGCCCATTCATATTGTCGCTCAGCCTGGGCAGAACGCGCAGGATATTG
+CCCGTGAAGTGGCACGCCAGCTTGACGAGCGGGAGCGCCGGGCCAGGGCAAAAGCGCGCA
+GCAATTTCAGCGATCAGGGGGGGATGAATCATGATGATGGTACTGGGTTTATATGTATTT
+ATGCTGCGCACTGTCCCTTATCAGGAACTGCAGTATCAGCGCAGCTGGCGACACGCCGCC
+AACAGCCGGGTGAACCGCCGTCCGTCAACGCAGTTTCTTGGCCCGGATAATGATTCACTG
+ACACTGTCCGGGGTTCTGCTGCCGGAAGTGACCGGCGGCAGACTGTCATTACTGGCGCTT
+GAACAGATGGCTGAACTGGGCAAGGCATGGCCTTTGATTGAAGGCTATGGAACCATTTAC
+GGCATGTTTGTTATTGAGAGTCTGAGCCAGACAAAGACGGAGTTTTTTGCCAGCGGAATG
+CCCAGGCGCATTGAGTTTACGATCACCCTCAAACGGGTTGATGAGTCGCTTTCTGACATG
+TTCGGGAGCCTGAGTGACCAGCTCAGCAACCTGCAGGACTCTGCTGTTTCTGCGATTGGG
+GGGATTAAAAACACGGCTGGAGGGTTGCTGCAGTGAACGTTAATTCTGATCTTCTGAATC
+TGAACAGCAAAAGCCCGGCTTTCAGTATCGTCATTGAAGGTAAGGACGTGACGACCGTGC
+TGGATACCCGCCTGATGAGTCTGACACTGACGGATAACCGGGGCTTTGAAGCGGACCAGC
+TTGATCTGGAGCTGGACGACGCCGACGGGCTGATCGCCCTGCCGCGACGTGGGGCTGTGA
+TTCAGCTGGCGCTGGGCTGGAAAGGCCAGCCGCTTTTCCCTAAAGGGGCTTTTACCGTAG
+ATGAAATTGAACACAGCGGAGCCCCTGATCGGCTGACCATCAGAGCGCGTAGCGCAGATT
+TCCGTGAAACCCTCAATACACGGCGCGAAAAATCATGGCATCAGACAACGGTGGGGGAGG
+TGGTAAAGGAAATAGCCGCACGGCATAACCTCAAAATGGCGCTGGGTAAAGACCTGACGG
+ATAAGGCGCTGGATCATCTGGACCAGACCAATGAAAGCGATGCAAGTTTTCTGATGAAAC
+TGGCGAGACAGTATGGGGCGATTGCTTCCGTTAAAGACGGGAACCTGCCAGTTATCACCA
+TCACGCGCAAAGTCGGTGACGGTCATCGGTTCACCCTTGCTGATCGTGGTGCCTATACCG
+GTGTTATTGCCAGCTGGTTGCATACGCGTGAACCCAGGAAAAAAGAAACAACCAGTGTTA
+AGCGTCGTCGAAAGAAAACCACCACACCCAAAGAGCCGGAAGCAAAACAGGGAGATAATC
+TGGTGGGAACGGATGAAAACGTGTTGGTTCTTAATCGTACCTACGCCAACCGGAGCAATG
+CAGAGCGCGCAGCAAAAATGCAGTGGGAACGCCTGCAGCGCGGCGTTGCGTCATTCTCGC
+TGCAACTGGCAGAAGGCCGGGCAGATCTATATACCGAAATGCCGGTGAAGGTGAGCGGCT
+TTAAGCAGCCGATTGATGATGCCGAATGGACCATTACCACCCTGACGCATTCTGTCAGCC
+CGGATAATGGATTTACGACCTGTCTGGAGCTTGAAGTGAGAATTGATGATTTCGAAATGG
+AATGATTATTCGCAATGGAGAACTTTTAAGTTTGCAAAATGGAATAATACGGTATTATTA
+TTGTGAATTTAGCAAAAATGGGGAGAGCTCGAAAAATGATGATTTGCCCACTGTGTGGAA
+GTGCCGCCCATACTCGCAGCAGTTTTCAGGTATCTTCATTGACCAAAGAGCGTTACAACC
+AGTGCCAGAACATTAACTGCAGCCATACTTTTGTTACCCATGAAACTTTTGTTCGTTCAA
+TTGCAACGCCAAAAGAGTCGAATCCGGTTCGGCCGCATCCAATGAAATCAGGACAGGTGA
+CGTTCTCTCTTTGACGCTGCCGCCATTTTGTCGCCATCTTTAAAAAACAGTGCTTCTAAC
+ATCATGATTTTAAACGGCATAAAATTCAAACAACAAAAAACCCATCAACCTTGAACCTAA
+ATGGCGGGGTTGATGGGCTCCACAAAATGGGGACATCAAAGAAAAGCAGTGGCAATAGGT
+ATGACTGAGGCTTTAACGGAAAGTTCTACTTATCTGCAAAATTTTTTCACTTAAAGGCAA
+ACTTCAGTTTTATCCTAATCCCGGCCAGATGATAACAATGAGCGTCCCCGCCAGTGTCAG
+CAGAACGTTGGCGATAGCATAAGTCCCGGCATAACCCAGCGCCGGAATATTGCTGCGCGC
+CGTATCGCTAATGATTTCCATCGCCGGGGCACAGGTACGGGCGCCCATCATGGCGCCGAA
+CAGCAGCGCCCGGTTCATACGCAGGACATAGGCACCGAACAGGAAGCAAATCACTACTGG
+CACCAGGCTAACGACAAGGCCTGCTATTAGCATTTGCCCGCCGACCGCGCCCAGACCATT
+ACTGATACCGCTGCCTGCGCTTAAACCGACGCCTGCCATAAATACCATTAAGCCGAACTC
+TTTTACCATGTTAAGCGCGCCCTGAGGAATATAACCAAAGGTAGGATGGTTAGCGCGCAG
+GAAACCGAGCATGATCCCGGCGAACAGCAACCCGGCCGCGTTACCGATGCCGAAACTAAA
+ATTGCTGAACTGGAAGGTAATCATCCCGATCATTAAGCCGATGATAAAAAAAGCGCAGAA
+GGCGAGCAGGTCCGTCACCTGGCTATGAATCGAAATAAAGCCGATGCGATCGGCGATGGT
+TTTTACGCGTCGGGCATCGCCGCTCACCTGTAACACGTCGCCTTTATTCAGCACCACGTT
+ATCATCGATAGGCATTTCGATCTGGCTGCGGATGACGCGGTTAAGGAAGCAGCCATGATC
+GGTCAGCTTGAGTTGAGCGAGACGACGACCGACGGCATTGTGGTTTTTCACTACAATTTC
+TTCCGTTACGATGCGCATATCAAGCAGATCGCGGTCAAACACTTCCTTACCATTACGGAA
+GCTGGGGTCGAGCCGGGCGTGCGCATCCGGATAGCCGACCAGTGCAATCTCGTCGCCCAT
+TTGCAACACCGCGTCGCCATCCGGGTTCGCCAGAATGCCGTTACGGCGAATACGTTCGAT
+ATAGCACCCTGTCTGGCGGTAAATACCCAGTTCGCGCAGGTTTTTACCGTCAGCCCAGGC
+CACCAGTTCCGGGCCCACCCGGTAAGCGCGGATAACCGGCAGATAAACTTTGCGATTGGC
+ATCGGTATCCAGGCCACGTTCACGGGCAATTTGCTGGGCGCTGGTTTGCAAATCCTGATG
+CTGTAGTTTAGGCAGGTAACGTGCGCCCACGATCAGGCTGACCAACCCGATGAGATAGGT
+CAGGGCATAGCCCAGACTGAGATTATCGAGAGCGGAGGAGAGCTGCGCGCTGGCGATGCC
+GGAATGTCGCAGGGTATCGCCTGCGCCCACCAGAACGGGCGTCGATGTCATTGAGCCCGC
+CAGCATACCGGCCGTCAGACCGATATCCCAGCCAAATACCTTACCCAGGCCTAAGGCAAT
+CAGCAGGGCGCTACCGACCATGACCAGGGCAAGCATCAGATAATTTTTACCGTCGCGAAA
+AAAAATCGAAAAAAAGTTGGGGCCCGCTTCAACGCCGACACAAAAAATAAATAGCATGAA
+TCCCAAATTTAGCGCGTCGGTGTTAATACTAAAGTGTTGCTGCCCTAATAAGAGAGAGAC
+CACCAAAACGCCAATGGAATTACCAAGTTGGACTGAACCCAGGCGTAACTTGCCAAGACA
+CAGGCCCAAAGCAAGGACCACAAATAATAACAGGATGTAATTCCCATTTAACAAATCTGC
+GACGTTTATATTCACGGAGACTAACTTCTTGTTTACGAGTAAGCTGTTGAAAGAAATGGT
+AATTTACGCTACTGTTTTTATCATGCGTTAAGGGTGTAATCGTATTGCATATAGCATCCA
+AATAAAACAACACAACAATATATCCTGCTAGTTTAATCTTATTGCGTACTAACGGCTATA
+AGAATCGTGCAGGTGTGTTTTTGGCATGGAATGCCACATGACTTTATCTGACTGGATGCC
+TCACGGCGGAAAGCGTGTTCGATAGAGAGAGTGTCAGGAGGAACGATTGAAACATAAACA
+GAGGTGGGCAGGCGTTGTCTGCTGCTTTGTACTCTTTATTGTGGTGTGTCTTTCATTAAC
+TATGCACGTGCAAGGCGCTTTTCGCGCGACCGGGCATCCTGAAATTGGGCTGTTATTTTT
+TACATTGCCAGGTGCAGTGGCGAGTTTTTGCTCTCATCGGCGCGAGGTGATCCGACCGTT
+GATCGGGGCGATGCTGGCGGCGCCGTTTTGTCTGGTGCTCATGCGCTTTGTATTTATGCC
+CACTCGTTCATTATGGCAAGAGCTTGCGTGGCTGTTTAGTGCGGTATTCTGGTGTGCTTT
+AGGCGCGCTCTGCTATCTGTTCATCAGTAGTCTGTTCAGTCAGAGGCGGAAAAAGCACCG
+ATAA
+>NC_015761.1|provirus_1007223_1045009
+TCACTTTTCCCCAATAACCGGACGATCCAGTGTCGGGCTGATTTGTACCTTCCTGTCGTA
+GATAAGCACCTGGCTTTCTGTTTTGTGGCCGCTGAAAATCTGCTTATCCCTGCTACTACC
+CTCAAAATCTGAAATAGCTTTTGCCTTGATATCATGGAATGTGTAATCCAGCTGTCGGCC
+CAGTTCACTTTGTGCGGCGCGTACAGCTTTTAACCAGCGATTATTGAACGTCTTGTGGAT
+GAACTGACCACGATTGTTGTTGTAGAGAACCAGCGCGTCAGGTGACAGTTTTGGACATTC
+TGTCTGTGCTGTTTTCAGCGCTTGCTGAAGGCGAGGTGTCCAGACCTTAATCTGTTTTTT
+TCCGGTCTTTCCTTGCTGGATAAAAATACCCTTATCAGAAACTTGCATCCAGCGCAGAGC
+GAGTACGTCAGCTTGCCGGGCGGCGCACAGGTAAGAAATTTCCATTGCAGCCCTGACAAC
+GTGATCAGCATGCTTATAAATAGCCAGGTAGTCTTCGTCAGTGATGTATTGCTCGCGAGC
+CTTGAGAGAGAATTTACTGACGCCAGCACACGGATTTCCCTTAACGTAACCGCGTTCATA
+TCCCCAGCGGTAAACACGTGACATACTGCTCATCTCCTGGTTGGCCTGGTTTTTACTTTG
+CAGTCCACGACGATCCATAAACTGACGCACATCTTCTGGCTTTATTACATCAGCTTTAAC
+TTTACCAAACACGGCAAGTAATTTTTTCTGATGTTGTAAATAATCCCGCTGGGTTCGTAT
+TGCAAGCTCGGTGTAGTAGGCGCTTTTAAGAAACATTCCCCAGAGCTTTTCAAACGTCAT
+TACATCTGAGTAATTGCGCCGTTCTTCCTCGTACCGTTTCCATAATGCCGACATAGTGAG
+TGTGATTGGCCCCAGTGTCACAGTTTCCCGCGACGTGGGTTTGTAGTAGTAACGCGTTTT
+TGTTTTGGATACGCGCGGCGGCAGTTTGTTATCTCCAGGATCCTTTCTTCTGCGCCCCAT
+TTAAATAGCTCCGAAATCGGGTTTTTCTTCTGTTCTGGTCTGTACGGTGATCTGTCCGTT
+CAATACAGCGTTAATGTGCGTCCAGGTCACCATCGGGCGACCTTCCCGGTCGGGTATGTA
+CGAGACGCCGCCGCGGTCAAGGATTTCCCTTTGTTTGGATGCCTTCTGATAACCGGTAAA
+CTCAATCAGTTCTGCGTCTGTTAGCAGATCGTTTTCTCTGGTCATGTTGGTCTTTCCTCA
+TCATCCGGTAACCGCATTGTTTAAGCATCCGGATCTCCTTTCTGCGCCAGCAGGTAGCAG
+AGGCGGCGGATTAAAACCTCAATCCGGTTGAGCGGGACGGCCTGCTGTCGAGCTGGTTTA
+CGTGCGAAATCAATCATTCTCACCCTCGTTTGCCTTATCGCCGGCCAGCGGAACGTTTAT
+CACCTTCTGCGCGTTAACTTTTCCACCTCATTCCGGTCTTCGTATGCCCCGGACGGCTAC
+TTCGTGGGCGTCCTGCCTCGGTGGTTCGTTGTTGCTATGGAATAAGTAAAGCATCATTTT
+ACTTCTTAGTCAACTTATACGGAATTAAAGCGTAAAGCAAAGCTGTACAACAAGCATGTT
+CATTTTTGGACTATGTTTAGCAGCTCAATATGTATATGATTAAAAAAACATCAGTAAGAG
+GTGGTTATGGAACGCGATGAGCTGGAAGAAGACCGTGCGACATTCATTGCGGGTGAGATT
+GGCGGCGCAGTGGTCGAATTGATAATCGACGGCGTAGTGATCAGCCGCGATGCAACAGTT
+AAACGTCTGAAGGAGAAGAGGAGGTGAGTCGGGAACGTTATTCACAAAGGTGTATTACGG
+GATGCAGCAGCTATGGTGAGGAAAGGGCAGTAAATACCCGGCGCGGTGGCCGGGTTGGAT
+TCATAAACTAAATTACTGAAGCATTGACGCAGCGTTTAACATCTTCTCATAATAAAAATT
+CATATCTTCTTTACTGTACGCGTTTATAAGGTTATCTGCATGTTTTTCAAGAAGATTTAT
+TTGCTGTTTTGCTGTTTTTTCTTGTGCTGTAGTTTCCGCTGCATAAATAACAAATGAGTC
+AATATTATATTTGTAAATTTCACATGCTTTTGAAATTGTTAAAGCACTCACAGCAGCCTC
+ACCCATTTGTTTTTTAAAATTTTCTGAACGGAAATCTAAAGTTTCAGTCAGATGGTATTT
+GCCGTTCTTAAGCAAGAAATCTGCAACTAAACCTTCGTCATCGCTTATAGGATAGTTAGC
+AACAATCTTGTGCTGATAAAGGTCTTCAGAGTATTTGCTAAAGATTCCGTGCTGCATGAA
+GGTTGACTTTATTTCAAAGAAAACTTTTCTTTTCAGTTGCTTGTGAGATTGTTTCTGTGG
+ATTTACTAACCTATTCATCAAATCAGTAATTTTTGTTTCGTAATTATCATTGCTTTGAAT
+GGTAAACATACCAAAAGAAGATAGTGATAACGATCCCTTAAAAAGGCAGGGAAGAAGTTC
+AACGTCATTTATTTTGTGTGACAAATCAAAAAGTGAGTTTGAAAGATCTTCCAAGTAATT
+TTGTGAAAGACCTTTATCAATTGCTTTAAGCTTTGAAACTGAATTAAGCATGCGTACGTC
+TATGTCGGAGTCGTGGTAAACGATCAAGCCAACGTTAATCGTTTCACCTTTCTCAAGATT
+AGGCGTAACTCTGATTAAGCTGTATTTGAAGGTTTTCAAGAGGTTATCTCCAGTCTTATA
+GCGTTTATTCGCTCAATTCTTTCCTCACTATCCCACCACTTCAGAAAATATTCTTTATGC
+ATTGGTGGCATCCATGCGACAGGCATGGACTCTAGTATATCAGAGATTGTAGCAACTCCA
+ATTTTCTCAATCTTGTCAAGTATTGACAATGCGCACATTCTTAATTCTGGTGTATCGCCG
+ACAAATTGCTTAGCTATAGACCAGTTTGTTGATGTGCTTGAGTCCGTAGGAAGTGTGTGC
+GGGGTGCTACGTGGCCAACCGATAACAAAAGAACTCAAGCTAAAATCGAACGTTTTTACT
+ATGATATGACCGCGCGTATTCTCCATGTAAAGATAATTATTGAGATGGCGATCAATGTTG
+TACACGAATTGGTCAAATGCATAAATTGCCCATAGCTGTTTTTTCAATGACTCAGAGGCG
+TTTGCCAGCAAATTGATCCATTGCGGGCCGTTAAGTCCTGACTTCCATGCAGAAAACTCA
+ATGCGAGAGCCAAATACATACTCGCCATCAGCAATACACTTAAGAACCTTACAAACAGGA
+GTTGCAATACCACACCTTTCAGCCAAATTTGTGCAAAACCACTCTGCAGCAGGTACTTGA
+GTTGGGTTTTGTACAGGAAAAGGAGGTGCAGTTTTCATACTTTTAACCGCATACTCCATC
+TCATCAGTGGCAATGGCAAAACCAGAAAGATGCACAGTACCCAAGTTCGATGGGGTATAT
+TCATTGAACTCTAATTCAAATAAACTTCCTTGTTCCGGGTCCGGTTCGCTATTGTTTGGA
+TCTTGTTCTTCTGTCATCTGCTTTTTACCCCACAAAGAAGACATGTAAACCTCATGAAAT
+TAAATTATCTCTATAATATTCTTAGCTTTTTTCTATTCCGGTCTCTCATGGCGAGCATAG
+CCAAGTTTTCTCCCCATGCTTCATGTTCGTAAGCGGGGCAGTTCTAGTTTGTTAGGCTTC
+GAAATGTGTGGTTGAGCAGAGCCTAACTAGGGTAGTTACTCCACATCGCCCTTAATCCGC
+CGCCCCATATACTTGGCGTACAGTTCATCGAGCTCCTTCAGGCGCAGGGATACGATTCGC
+AACATGTTCTGTTGTTCTTCTTCCGGTAACTGGCGATAGAGCTCAAGCAGGCGCTGTTCG
+TCAGGTTTAAGTCCGTCTTTCTCTCCGACATCCTCACCAAGCAGCCACGGAACTGATACG
+CCAGCAGCATCAGCAATAGCTAATGCGGAGCTTTTGCTAATTCTTCCTGTTTTGAACCAA
+CTGGAAACTGCTTGCTTGCTGACACCAGCTACCCTGGCCATCTCTGTTTTAGAGAAACCC
+TTCTTATTTAACTCTGCCAGCCTGGAGATCAGGCCATTCGTCAGTGTGTTATCGCTCATC
+GCCTCATTGTAAATGATTGCTTTACTTGTAGGTAGGCATGCTATGTTTGACTTGTTGGTA
+AAATGATGCTTTACTGTTGTCATCTAAGGAGGTCCTATGACTGGTATTGAAAAAGCAATT
+CAAAAATTTGGAACAGGGGCTGCTCTTGGAAGAGCGCTTGGATTTTCAAAAATGACAATT
+TCCAACTGGAAAAAGACCGGGATTCCACCCGATCACATTCGTTCAGTTTTCGAACTTACA
+GGTGTTACGCCACATGAGTTACGGCCTGACTTGTATCCAAATCCAACAGATGCATTACCA
+AGCCAAGAGGCATCAGCCAAATAACCATAGAGGATATTTACCCATGGAGAACGCAATTGC
+ACGAAAGTTAGACCCACCAGAAATCAACCCGATTGAGATAGAGAGTGTCCTGCTCAACCG
+GCTTGCATCAGTAGGGCAGAAATCATACGCCGAGCATATGGGCATCAGCGAGTCGACAGT
+CAGCAGGCGTAAAGCTGAGGGATATTTCTGCAACATGGCGAAAGAGCTGGCTTTTCTTGG
+GATTCAGGCCGCGCCACCGGAAGCGGTACTGGTATCCAGAAACTATCTCACAGCAGTAGA
+GATTCTCGCTGATGCCGGGCTAAAGGCTGAACGAGCCAGGCCGGATGCGCTGGGGTGGGA
+CTGAAAATGGCAGCAACCAAAAAGGCGAAAGCCGCGGTGAGGGGTCACCAACGGCTTTCA
+GGTGGAATTAACTGGATCAATTCACAGGAGTAATTATGGCAAACACTGCCGAAGTAATCA
+ATTTTCCTGTGCCTGACGTGGCACCTAAGGAGCCGCGCGTGGCAGATCTCGATGATGGCT
+ATACGCGCCTGGCAAATGAACTTCTGGATGCCGTGATGTGTTCTGGTTTGCCGGAGACTG
+AGCTGTGCATCCTGATGGCCGTATGGCGCAAAACGTATGGATACAACAAGAAAATGGACT
+GGATCAGCAACGAGCAGCTAGAGGAGATGATTCAGAAGCATCATACCCATTGCTCGACAG
+CAAAAAACAGTCTGATCAGGAAGAAGGTTCTGATTCAGGAAGGCCGCAGGGTTGGTATGA
+ATATCCATATTTCCGAATGGCAAACTAAAAATAACGGATTCTGCAAAACATTAGCCAAAC
+CTGCTAAGAAAACCTTAGCGGAAGTTGCTAACGCACCTAAGCAGAAGTTGCTAACCACAA
+AAGACAAACTAACAAAAGACAATATTAAAAGATCTACGTCCGAGAATTCTGACGAATCCT
+CTGACAATCCAGGAAAGAAACCTCATGTTCTAAAACCAGAAGCGGCGATTCAGAGAGGCA
+ACAAGTGGGGAACTGCTGAAGACCTAACTGCTGCCGAGTGGATGTTTGACCTGATAAAAA
+CCATTTCTCCATCAGCCAGAAAACCTAACCTGGCAGGATGGGCTAACGATATACGCCTGA
+TGCGTGAATGTGACGGACGAACACATCGCGACATGTGCGTGCTGTTTCGCTGGGCGTGCC
+ATGACAGCTTCTGGGCTGGCAATGTCATTAGTCCGGCAAAGCTCCGCGAAAAGTGGACTC
+AACTCGATATCAACCGCAACAAGCAACAGACTGGCACAACTGCCTCTAAGCCAAAACTTG
+ACCTAAATAACACTGACTGGATTTACGGAGTGGAGCTATGAAAAACATTGCTGCGCAGAT
+GGTTAATTTTGACCGTGAGCAGATGCGCCGTATTGCCAACAACATGCCGGAACAGCATGA
+CGATAAGCTGCAAGTTGAGCAGGTTGCTAAGGTCATCAATAACGTGTTTAGTCATCTTAT
+GGCCGCGTTCCCTGCTACCACGGCTAATCGCAGCCAGGCCGAGATGAACGAAATCCGGCG
+CCAGTGGGTTCTGGCTTTCCGTGAGAACGGCATCACCACCATGGAGCAAGTTGCGGCCGG
+AATGCGTGTCGCCCGCCGTCAGGAACGTCCGTTTCTGCCATCGCCGGGACAGTTTGTAGC
+GTGGTGCCGTGAGGGGAGTGGAGCACTCGGGGTCAGTGTTGACGACATCATGGGCGAATA
+CTGGCGCTGGAGAAAGCTGGTTTTCCGTTATCCGACAGGTGAGCAGTTCCCATGGAGAGA
+TAAAAATCCGCTGTATTACCACGTCTGCCTGGAGCTGCGCCGCCGTGGAACTGAGGGGCA
+ATTAAGTGAAATGGAACTTATCCGGGCCGCTGGCGACATCCTGCATGACTGGGAAAAGCG
+AGCTCTTGCAGGTAAACCCATACCGCCTATTCGTCGCGCTTTAGCCGCGCCGTCGCGGGA
+TCGCGGTCTAACGCCAGCCGAGATGCTAATGGCTAAATACAAACAACGCAAAGACGCCGG
+TCTGATTTAACAGGAGCAACCAATTGAGCATTCTCACCATTCTAGATGTCGGTCTTGCCT
+TAATGGGGTGGCTGTTCATCATGTTCAGAGCGGGTCAGTGGTTTATCTCCGTTGCGCTAA
+AGCAATGGGATAAGCGCAGAAAGCAATCTCGTCGGCAAAAAGCAGTAAACGAATTTTACG
+ATGCGTTTGACCTGTCCAGTATCGAACCTGGTACAACGGTTCGCCTAACGACTAAAGGCG
+ATCTGACAATCATGATGTTTCGCCGGGAGGCCGCCCAATGAGCAACATCGACAAACAGGC
+GCGGGAGCAACTGGAAGCCGCAGAACGCAGCATGGCAGAACAAAGCGCGATTGTAGCTGC
+TGCTGAAAAACTGGTCCGTTGCAAAGGTCGTTATCACAGCGAACTGAACTACCGGGCGCT
+TGCAAAACTGTTTGGTGTCATTACGCCGGATTTACCACCACTTGAGCATGAAAACGTTCA
+ATGCGCAGACGCTGCTGAAGGGTTTCGTATCGCGCTGGCATCGTTGGAATCCATGACACC
+AGAAAAGCGGGCGAAACATGACGCCAGTATAGAAGCATTCAAAGAGATGTTGCCGCAACC
+AGCACCGGTAGACAAAGAATTTATCCCTAAAAACCTGGACAAGGCGTTGGGTGTTGTTGG
+TGTTGCGTTACCTGAATCAAAGGAAGAGTTTAATTTCCAGATAGAGCGCTGGATACAGCG
+TCTCATTGATCGGGTTATTCGTTATGCCGATGAATTCAAAGAGCAGCCAGCGCCGGTAGT
+GCCGGATGAGTGCCCGGCTGAGTTATTGGCGTTCTGTGAGCAGGTGATTGATAGCCGTAT
+CACCGCAAACGCAAAAGCTGATGAGCTATGGAACGACTGCCGCGATGCCATGCTTAATGG
+CGATACTTTTCGGGGAAACTCAATTTCGTCAACCAATAATTTTCGGGGAATCGCGGAAAC
+GTCAACCAACTCTCAGGTAATTCCGGATGGCTGGATAAGCTGTAGTGAGCGGATGCCTGA
+GCAAGGTGCTTACATTTCAGCGGTGTCAAGGCATGGTGAATACGTAGCCGGGCAAGTTAT
+TGACGACTGGCTAGATCTGCATGATGGAACATCATTCGGACTTGATGAGGTGTATCTATG
+GATGATGTTGCCTCCACTGCCAGCAGCACCACAAAAGGAGGTTAAGTGATAGGCGTCAAG
+AGCAAGAGGGAGAGGTTAGCATAAACATTAATCAAGGCTCTTATGGGCTTTTTATTCTAT
+TATAAACGGACTTTTTTTGAGGGTGATACCATGAAGCCGAAGAAGCTAAATGCTGAGCAG
+CAATATCAAACAGACCTTGAATTGGTCAAGAAGAAGCCCGCAAATCGTACCGAGGCAAAA
+GCTCATTTGGCAGCGCAGTTACGGATTAGCAAGTACAAGGCGCAGAACTCTTCCAAAATT
+CGCGTTGGCAGTTTCAGGGGAAGAAAGAAGGTGCATTTCAGTAAGGCCGAAGAAGATGCC
+AGGGCGGCACTAAATAAAGCAAATGCCATTAGATTTTCTGAAGGGGAGGTTGAATCCGTT
+GATACAGATCGAATCTCTGAGAGTAATAAACGCTGGCGTGGGAGAACTGCTGACTAATGT
+CTGACTGGAATATTGCAGCACAATCAAAAGACAAGCAGGACAACGAGGCGCTCAGTTTTA
+CCTACGAATACGCGTTTGCCCCGGAAAACCGCTACAAATACTAACCCGTTGCGGCGGGTT
+GGCGGGAGGGTAGATTATAATTAAAGCCCACCCAGATGGGCTTTTTAGCAAGGTTTATCC
+GAGAGCGCCGTAAAACCCCGTTCTTTTAGGTCGGGGATATAAGGCGTGCGTGCCCTTGAT
+CTTCTAACTAACCAAGAATTCCCTTCTTTTAGGGAGGGGAGTGTCAATCAGGAATGTGTA
+TTATAAATCCACTTATGTCCCAGGTATCCATCGGGACGTGATACCCTAATTCTTTCAAGC
+GATTAAATGTTGGCTGGAAAACGGATAGATAATCATCTTCGTTTAGACCCTCAAGATCTA
+AATCGTCGAGCTCGACACTGAAACTAGAGTGTCCTAGCTTTATTTTTTTACTTATCTCGG
+CGAATGTTCTCTTAAAAATGATTCTGGAAACTTCTTCTTTTGCTTTTTGTATGATAGCGA
+CGGCCTCTTTGGCTGAAATCTGTTTATCAGCAGGGATTTCTCCTACAAAACTACCTTCTA
+ATCTTTGAACAATCTCTGCGTTCATTGATCGGCCATTTCCCTTAGCGGCAACTTCAATTT
+TCTCTTTTAATTCAATTGGAAGTCTAATACGCAACTGCGGATCTTCTCTGCTCATTTTTC
+ACGAACACCTTAGAAAGTTCACAATATGTAAATTATGCCCCACCGTGGGGTTGACAGCAA
+TGACGCACGGTGTGACAATCAAATTGCCCCACCGTGAGGCAATTTAAGGGGGTGGAGATG
+GAAAAAGCAAAAGACATGTATCAACGCAAGGTTCGTTTTCCAGAGGATGTAAGGAAGGCG
+ATTGAAAGAAATGGGGAAGAAGAGTGTCGGCAGTTCAACACGGAACTTATTTATCAATTG
+AGGAAAGTGTACGGACTGGTTAGAGAGAAGAATGCTAGGACATAAAAATGGCGAAGCCCA
+GCAGTGCGCTAACACTAACCGGGCCTCTATCGAAGATAACCGCAAAGGAAATATCGACAT
+GCCTAATTTAGCAATAAAACCTACTGAATGCACTATCAACGTCCCGTTTTACGGTTCTGA
+GCTTTATGTGGTTAACCATAACGACGAGCCGTACACCCCAATGAAACCGATCGTTGAGGG
+TATGGGCATGGATTGGAAAAGCCAATTCATCAAATTAAAACAGAGATTTAAAACCTGCGT
+GGTGGATATCACCATTCAGCTACCCGGGGATAACCAACGGCGTAGTGTTATCTGCCTCGC
+CTTGCGTAAGTTGTCCGCATGGCTAAACACAATCAGCCCAAACAAGGTTCGTCCAGAAAT
+CTGCGAGCGCGTTATTCGTTATCAGGAAGAGTGTGACGATGTGCTCTATGAATACTGGAC
+TAAGAGGCAGGTAATTAACCCGCGCAAATCGGAAACGAACGTTGACGATCGTACTCCATT
+GCGCGGCCTGGTAAACCGCATCATGGGTAAAACCGGTATTCACTATCAGACCCTTTACAA
+AATGATCCACCGAGAGTTTGGCGTGAATCATATTGATGAATTGACAGGGAAACTGATTGC
+TGAGGCGATGGAATACCTTGCGGGGAAAGTTCTGGAAGGTGAGTTATTACCAAAAGACCA
+AGGCAGATCCACGCTTTCATCCGCAATCCCCAAACATGGGCCTGGTAGGGTACTGCTTAA
+CCTGAATGAAAACGGTCAGGTTAAGGACACTTATCCGTTAACTGAGGATCAGGTAGTCAT
+GTCATTTGATGCATTTGTCAGCTATTTCAGGAAAAAGGGATGGGTAGTGGCCCCAAGGGA
+TGAGGTAGCAAAAGGAATAATGGGGGCAATACAGGTTTTATCGTAGCAAAAAAGAAAAAC
+CGCCAGTTGCTGCTGGCGGCCTATGTCACAAACCCTATCATCACATAAGGAATGTCGAAT
+GACTTGTAAGAATGTAGCAAAGCTCGGATCTGTTGTCACGGATAAAACCATTGATAGCCA
+GTACCTGCTTGAGATGGTAAATCACGCTCGTAAACAGTGCGGTGAAAAAGAAGTCCGCAA
+CAACGACTTTATTGGACGTATTAAGGATGAGCTTGAAGGTGAGCACTACGAAATTTTCGT
+AGTTCAAAAAGCAAACAAAACAACCTCTGAAAAAATTGTTATGTCAATTAAGCAAGCCCT
+TCGAGTGGCCGCTCGTGAATCAAAAGCGGTGCGTCGCTCCCTGGTCGATAAACTGGAAGA
+CATGCAATCCATCCAGATTCCTGCGCAAAGTAATTCCGGTCTTTCTGAATACCGTCTTGC
+AAAGGCCGAACAGTTGAAAGCGCTGGCGCTGGAGAAAAATATCGTATCCGCTCGTAAGTT
+GATGGTGATGCTGCCCCGTCTTGACCCTATGTCCCACCAGACGCTGGCGGCTTCGCTGAT
+TAATCCGATTATCGGTTATGACGCGATCCCCTTACCAGTGATTGAAGAGCATTACTACAC
+CGCAGCGGAAGTGGGTGAGAAAATCGGTGTCAGCGCCAATAAAATCGGTCGCATCGCTAA
+CGCAAACAACCTTAAAACTGAGCAGTACGGCAAGTTCTTCCTGGATAAATCCGCGTACTC
+CAGTAAGCAGGTCGAGGCGTTCCGCTACAACACAGAAGGGATCGAGGCGCTCCGCCATTT
+GATTCAAGGTGTTGATGTGGCATAAGAATCACAACTCAGAAAGTCTAACCCGCCCATTGC
+TGGGAATTCCTCGGCAATGGGCGGGTTTTCCGCTTAAAATCTGATATGAAACAACATGCT
+AGCTTTTGCAAAAAGTGCTATTCACCTCTTGAATATTCTTTCTAACATGTATACTGTGTT
+TATATACAGTAGTTAAATGTAGAGGGAATTATGAGAATTGAGCTTGTTATCAGCCGGACA
+AAACAGCTTCCGGAAGGTGCCGTTCCTGCACTTGAAAAAGAATTAATTACCCGTCTCCAG
+AATCAGTATGAAAACTGCAACTTAACCATCCGTCGAGGCAGTCAGGATGGTCTGAGTATC
+ATCGGCGCCGCTGATGGCGATAAAAAACGTATACAGAGCATTCTGCAGGAAACGTGGGAA
+AGCGCTGACGACTGGTTTTATTAACATTGCGCTTAATGCTGGCGCGCATTTTTCAGAATA
+CCGCAATTTGCGTATCCCTTTGATGCTGCTGCCGACAATTTTTAACCGCGTCTGTACATC
+GCCTGAAGGGAGAACAAAAATTGAGTAATTCAGCTTTGCAAAAGTCAGAAGATAGCTGGT
+ATGACATTGTAAGAAGATCTGATGGCTGCGTGGTGTTTAGCTTTCCATCATCAGGCAGGC
+ATCTTATCTATCGTGTAAATGGCATGGTATCTATGCGTCCTTTGCTGGATGATGAAGAAG
+TTTTTACTCCCAACGGTTTTGTGCATTTTATTCGCCGTCTCGGCTACCGGGTAACACCAC
+CTTCTGATAATATGAAATCAACGGCCTGAACAACCGTTAACCTTCTGCGCCACGGAGAAC
+ACCATGGCGCACGAATTACAACTCATCAAGCAGTCATCTGGAATTCTGATCCCCGCAACG
+CCGGAGACCAGTGATATTCTGCAATCAAAAATCAAACTCGGCGCCGTGCTGGTGGCTGAG
+TTCCGTCAGGTGAGGAATCCTGCATTCCATCGCCGCTTTTTCGCGTTGCTTAATCTTGGG
+TTTGAATACTGGGAACCCACCGGCGGCGCCATTTCTGCCAATGAGCGCAAACTGGTAAAC
+GGTTATGCAAAGTTTCTCGCTGCATATGGCGGGAATGAAAGCGCATTACTGGATGCGGCT
+GAACAGTATCTGGAACAGATTGCAAACCGCCGGGTAACAAACGGGATTAGCCTGTGTAAA
+TCATTCGATGCCTACCGCGCATGGGTGACGGTTGAGGCTGGTCACTATGACGCCATCCAG
+TTACCGGACGGCACCCTTCGCAAACATCCCCGCAGCATCGCTTTTTCCAGTATGGATGAG
+GTCGAATTTCAGCAGGTGTATAAATCTGCGCTTGATGTTCTCTGGCGCTGGATTTTATCA
+CGTACATTCCGTACTCAGCGCGAGGCCGAGAACGCTGCCGCCCAGCTCATGAGCTTTGCG
+GGGTGATGGCGATGAAATACTCCTGGTTCCATCATCACGACTGCACAACCGAGCAGGCCG
+ACACGCTGATATCGGATTATCAGAAGCGGGGCGTAAGGACAGAAAAGAGCCTGAACCCTG
+ACTTCATTACCTGGACTGTCAGCGCGAAATTACCTGAATATGCACACCGGGAGCGGACGC
+CAAAATCCTTACGCCAAAAGGTCTGGGGGTGAACATGGCTATTTATCGCAGTAAAAAGTG
+GCTTGCTGGTGGTGCCAGTTTGACTGCTCCCCGGCCTGAAGGCCGGGGTTTCCCGGAGGT
+ATTCTGATGAAGCCTGAAGTTATTGAGTCCCTTCGGTGGCGTACCGAATCCTTCACAATT
+ACATCCGTATTCAGCAAAATGTAGGGGAAAATAAGTGAAAAATTTATCCTGGATACGCCA
+GCAACTGATCACGGCGACGGCAGATCTAAGCGGTGCAACAAAAGGGCAGCTTATGGCCTG
+GCTGGAGAACGCACAATTTGACACGAAAACCTATCCCCGAAAAAAACAGCGCATCCGTGA
+TGAAGTGACCGGGAAAATAATAACGCTGAATAACCCTCCGATTCCGGGTAAGCAATCACT
+GGCGAAAGGAAGCGCAATTCCGCTTGTGCAGCCGGTAGAATACGCCACTTCCTCATGGCG
+TCGGGCGCTTTTGTCACTTGATGAACACTACAAGGCCTGGCTGCTGTGGAACTACAGTGC
+AAACACTTGCTGGGAGCATCAGGTTGATATAACCCGCTGGGGCTGGAGTGCGTTTGCGGC
+GCAACTCGACGGAAAGAAGATGGCCGGTAAAACACAGGAACGACTCCGGGCGTTAATCTG
+GCTGGCGGCACAGGATGTCAAATCTGAATTAGCCGGGCGTGAGGTTTATCAATATAAAGA
+GTTAGCGGGACTGGTAGGCGTTAGCGAAAAGAACTGGTCAGAAACCTTCACCAGACACTG
+GCTGACCATGCGTGCGGTATTTCTGCGTCTTGATCAGGCGTCTCTTTTGAGTGTATCGAA
+GACGCGATCGGAGCAGGTCGCATTCAATCAATACGCACTTAATTGACACAAACAGGCATC
+CGGGGCTATATTCCCGGAACGCCAGCAAAATCTGGCGTCGGGATTGGCGTCCCGGATGTT
+AAGAGGCGACACCAGACGCGCCAGCGTCTTTTTTATTGTCGTTTGCACAGTCACATCTTC
+GCATTATGGTGGGCTGTGTGGGGGCGGAGAAATCCGCGCCGGTTCCTCTTACCCGGTTAC
+GCCAACCCTGCACAGTTCACCACCCATCGATTGGCGTCGTTGGTGGTGATTATCTCAGTT
+AAGAGGGAATTACCATGACAACTCAAATTTCTGCCGAAACTCTTGCTCCGATTACCCATC
+ACCAAATCCCCGTCATTACCACTGAGCTGTTGGCGCAACTTTATGGAACTGAAACAAACA
+ATATCAAAGTAAATTTCAGTCGAAATTCAGATCGTTTTGTATGCGGGAAACATTACTTCA
+AGATTGAAGGAGATGAACTTCGCGCTATGAAGCACGAGGTTACTCAAAGTAACTCTGTGA
+AAATTGCCCGTAATGTTCGATCCCTCATTCTCTGGACAGAACGCGGCGCAGCCCGCCACG
+CGAAGATGCTCGAAACCGATCAGGCTTGGGAGGTATTCGAGAAACTGGAGGATTACTATT
+TCAGCCGGAAGCAACCTGTTCCAGCACGTCAGTCCCATCCCGCGATTCCATTTCCAAAAG
+AACGGCGTTTCATTGTAACAGTGTTCCCTGACGGAACTGCTGATACCCAACCTTTGCCTG
+ACGACGTATTTGTCGGCAAAATATCGAGCATATTAAGTGATCTTCGCCAGATGGGGTGGA
+TAGTGATTAAGCGTGACCGGCTGGTTGAAACGCTCGCGACATGGTGACTGCAAAACTGGA
+TTAAAACGGCTATATTTCGTGTAAATCTGATATTGTTGTTATAGTTTCAATCGTCGACCA
+AACAAATTCAAGCCTCGCCAACGTGCGGGGCTTTTGCGTTTTAGGGGGCTCTCATTCGCG
+GGCCTTTTCTATTCAACAGGCTTTGAATTGTGGCTTCTTGTGCACGTCGCCACAAGAGCC
+TGAATCGTATTGCCGCCAGTTGCGCATAACGTTCTGGAATCATACTCACGTGACCAGTGG
+CATAACCAATTTTCCAGGTCATCCACTGAGTAATCTTTACGGGCCAAACCCTCTGCGATG
+GTTACGACCTCATCACTCGGTGCTGTAAGCTCATATCCGTTCAGCAACAGGAATACGTAA
+CCTGCCATCATAGCGGTGCGTTTGTTTGCGTTTGCGAATGGATGATTCTGGATCAGGCTT
+TCAATTAGAACAGCAGACAGACGAAACATATCGTCTGTCTGCTCATAATATCGAATGGTA
+CTTGGCCGGGACTGGGAAGAACTGAGGTTGTTCGGATTCAGTACGCCTATCGGTTCATTG
+GGCGTCTGAATCTCAATCAGAGACCTGTTGATGTAAACGATATCTTCAATGGAAAGATAA
+TTGACTCCTTCAACATACTCTATCGTCATCCGTTTTTACTCAGACCTTTGAAAGTTCTTC
+CATCGCCTTCTCGTAACGAGCAAACCCAAACTCAAAGGCGTTTTTAACTTGAGCAGTATG
+TGAACATGCTTTGCTGATCGCTGCACGAGGTTTCGCCACCGTGGATTTGTCACGAGGCGG
+AATGTACAAGCGATCTGCCTTTTTTAATGCGTGACCCATGATTATCACCCTCATGCACGT
+TTGGCAGTGCTTTCTCAAATTGTAAATTTTAGGATGTAAACACATCCAAAGAATTTATGA
+CTACTTTAAGTGGTTGAGGACAATTTAATACCATTCGTCATATTTGAGCAATGGGCCTAT
+GTCTGAAGATAGAAGCAAGTTCGACGAAAATTGCATTGGACACTTTGCAAGTTAACGACA
+TTTTCGCAGAACTACCCCTCATGTAATAGTAAACTATTGTCACGTTCTCAGGAGATAGTC
+TGAGCCTATGACTCGACTAGAGTGAACACAATGCCGATAAATAGCACTTTTTGCACAAAA
+ATCATGTCCTGGTTGGAATGCACAACGCCCAACATTGCTGTGGTATTACGCCCCCAGTGA
+CTGCTCCCCGCCCTTCAGGGCGGGGAGCAGTCACGGAACATTGTTACAACGAAACGCCGT
+TCTTTTGGAAATGGAATCGCGGGATGGGACTGACGTGCTGGAACAGGTTGTTTCTGGGTG
+AAATAGTAATCCTCCAGTTTCTCGAATACCTCCCATGCCTGACGACGTATTTGTCGGCAA
+AATATCGAGCATATTAAGTGATCTTCGCCAGATGGGGTGGATAGTGATTAAGCGTGACCG
+GCTGGTTGAAATGCTCGCGACATGGTGATTGCAAAACTGGATTAAAACGGCTATATTTCG
+AGTAAATCTGATATCGTCGCCATAGCTTCAATCGTCGACCAAACAAATTCAAGCCTCGCC
+ATCGTGCGGGGCTTTTCTGTTTGTGCCGTCCGGAATAATCCCACTGAGTTTTGTCGTTAA
+TCCACCGGGTGGCCTTCCTGCTTCACACTGAGCCATTCGAGCTATCGAAAGAGAGGTTTT
+GACTGCTCCACGACCTTCAGGGCGGGAAGCAGTCGATTCTTTTTCTTAATTTAAATGAGA
+GGTTGAATATCATGAAGAAGATTTTTTTTGCTTTTGCATTGGTAATGATGGCTGGTGCGA
+GTAATGTCTATGCAACGGTTAATAACTGGTATCTGAAAGACACTACGAAATATGAGAATG
+TTAAAATTACGAATGTTTTTTATGCTCCTTATTTACACTCGCCAAGGATTTGTGCATATT
+TCACTGCATCATCAGGTGGTTCAAATGTTACTGGGTGCGCGGTGGCTGATAATGGCTATT
+ATCAGAAGAATGCAGGACAGACATCACCTTTCATGGAAATTTTTGATACTGTAAAATATT
+TTTATACAACAGGTGAGAAAATATCTGTTTATATAAGAATAAATGCATTTTCGCACTTTG
+ATTCAAGCGTGTCACAAAATGAAATCGTGGCTATCGGGACCTGTAATCAGTGGTGTTTTG
+GAGAGATAATTAAATAATTTTTATAATATACCATAAGGAAATATGATGACAGGTTATTCT
+CGTTTCTTAAGGCTGGGGGTATACCTTATGTTTGCGTATAGCCCTTTTTCATCTGCTGTC
+GATTTTGTTTATCGTGTGGACTCGAGACCTCCGGATGTTATTTTTCGGGATGGCTTTAGT
+TCTCACGGTAATAACAGAAATCTTCAGCAACATATCAGAGGTGACTCCTGTGCCGCCGGT
+AGTCGGGACAGTAACTATATTGCGACCACCTCAGATATTAATGAGACTTATAATATAGCC
+CGAGTATATTATTCTAGGGCAACATTTAGTGGCAGATTGTACAGATACAGAATCCGTGCA
+GACAATAGTTTCTATAGCCTTCCGCCGTCTGTCGCTTATATTGAGTCACGTGGTGTCCAG
+TTTAATCATTTTGAGCGAGTGATGATGCGGTTGCAAAGTGAGTATGTAGCCGTAAATTCT
+ATCCCAATTGAAAATATCCAGGAAGCAGTTGAGCTTGTTTACGACAGAAATACAAGCCAG
+GTAAGAGACGGGCCTGGAACATCAAATTCCCGTTATTTACGAGTGAGTACACAATCAAAT
+CCAGGGGTAATACCCAACTTACCAGTACCACAGGTCAGTACCCGGGAAAGGATTAGTGCA
+TTTGGTACTTTAATCAGTGCTTGTTTTTCAATGAGAGGAGTGCGCAGGGATGATACACGT
+ATTAATTCTAATTACTATGAAATGGAGTTTTACGACGCGCGGGGAGTTTTAACGGAATTA
+TTGAAGTGACTGCTCCCCGCCCTGAAGGCCGAGGTTTCCCGGAGGCATTCTGATGAATAG
+AGAATTTGACAAGTGACTTTCAGGAAAATGTCTCGCACTAGCGGGGCATTTTTACCCGGC
+TTTTCGCGGAAAGCCCCTTCCTTTTAGGTAGGGGATATAAGGCGCTCTCGGATAAATCAG
+CCCGTGAAGCCTGATCCTATTTCCCCTCAATTCTGAGAGGACTCACAGCAATTAAGAGGG
+GGATGAATGTCCGAACCTGTATCCAGTGCGACAGTGTTGGCTGGTGGAGTAATGGGGGCC
+AGTGTATTCGGCCTGGCAACCGGAACCGATTATGGTGTGGTATTCGGCGCTTTTGCCGGC
+GCGGTATTTTATGTCGCCACGGCAACCAACATTGGACGCATCAGGCTGGTCGCTTATTTT
+ATTACATCATTTATTGTGGGAGTGCTTGGCGCCGGGCTGATAGGTACTAAGCTTGCGGCA
+ATAACGCATTATGAAAAACCACTGGATGCTCTTGGCGCAGTGATTATTTCTGCAATGTGT
+ATAAAGTTTCTCACTTTTCTTAACAGTCAGGATCTGAACAGCCTGTTCAGTATTCTTTCT
+CGTATCAGGGGAGGGGGATCAAATGGTAGCAAATGACCCTTCTGCAGTTCTGAATGCCGT
+AATTTGTGGGGTAATAGTAATCGTTCTGATGTTTTACCGACGCGGTGATGCGGCACACCG
+CCCCCTGATTTCGTTACTGGCCTATGTCATGGTGCTGGTATATGCCAGCGTCCCTTTCCG
+GTTTGTTTTTGGTTTATATGAATCATCCCACTGGCTGGTGGTGATGGTGAATATCCTTAT
+CTGCGCCGCTGTGCTGTGGGCTCGCGGTAATGTGGCGCGTCTGGTCGATGCACTGAGGCA
+CTGATGGATCAACAACAATTTCAGCAGGCGGCTGGTATCAGCGCCGGGCTTTCTGCGCGC
+TGGTTTTCGCACATTGATGCGGCAATGAGCGAATTCGGTATTACTGCGCCACTGGATCAG
+GCCATGTTTATTGCACAAACAGGACATGAATCAGCAGGATTTACTGTTCTGAAGGAAAGC
+TTCAATTATTCGGTGGAGGCGCTGAAAAAGACGTTTGGTAAACGCCTTACGCCTTATCAG
+TGCGAAATGCTGGGGCGTATTGATGGTCGCCAGGTTGCCCACCAGCCACAAATAGCCAAT
+CTGGTTTACGGTGGTCGCATGGGGAACAAAGACACCGGAGATGGCTGGAAGTATCGCGGG
+CGTGGGCTTATCCAGATTACCGGGCTGGAGAATTACACCAGATGTGGCGTTGCCCTGAAA
+CTGGATCTGGTGGCGAATCCGGGACAGCTTGAGCTGGATCGTCATGCCGCCCGTTCCGCA
+GCGTGGTTTTTTGTGACTAGAGGGTGTCTGAAATACTCCGGCGACCTGGTACGCGTTACG
+CAGATCATTAACGGAGGGCAGAACGGCATCGGTGACAGGCGAGAGCGCTTTGAAAAAGCA
+AAATCGGTGCTGGTATGAATCTGTTACCTGTATTGCTTAAAAAATTCTGGAAGCCATTAG
+CAGAAATACTGCTGGTGGCTTTTTTGTTATGTGCTGGTGCGTACTGGTGTTATTCACGAG
+GTTATCAGAAGGCGGATACATCCTGGAAATACCAGTGGGCGCAACGAGACCTTACCGATG
+CGACCGCTGCATTGCAGCGTGAAGTAACCGAACGAGCGAAAGAACAGCGTCGCCAGCACG
+CCGCAGATGAAGAACGGAAAAGAGCCGATGAAGAACTGGCAAAAATACAGGCCAACGCTG
+ATGCTGCTGAGCGTGCTCGCGGTGGGCTGCAACAGCAGCTCGCAGCAGTACAACGGCAAC
+TTGCAGGAAGTGAAACCGGCAGGCTTTCCGCTCTTGCCGCAGCAAGCCAGGCAAAAGCCG
+AGACCGGAATACTGCTCGCCCAGTTGCTTGGCGAAGCTGACGATCTGGCGGGAAAGTTCG
+CAAAAGAGGCTGATGAGCGTTATGTCGCCGGAAGCACATGCGAACGTACCTGGGACAAAG
+TGACCGGGCAGAAGTGAAACCTGGTGACTGCTCCCCGGCTTGAAGGCCGAGGTTTCCCGG
+AGGCATTCTGATGAATAGAGATTTTGACAAGTGACTTTCAGGAAAATGCCTCGCACTAGC
+GGGGCATTTTTACGTCTGCAGTAAACGCGCTTCACACGCGCGACTTATGAACACAGAACC
+TTTCAGGATGACCCTTGAGGATGCCGGTTTGGTAATCGGTGCCTTTCTGTGGGCCGGAAT
+CCTGTGTGACAAGGTTCATCACTAAAAGGTAATCACTGATGAATTATCAAACAGTTATTG
+TCAATGGTGTGTCCGTTCGTGTTGATGAGGGGGGACGCTACAACTTAAACGATCTCCATG
+CAGCAGCAGTTGCAAATGGCGAGGCAACTGAATCTCAACGTCCCAGTAATTTTCTGAGGA
+GTGCACAGATTAAACGGTTCATTTCAGCACTAAAAGCCAAAGCTCAAAAAAGAGCTTTGA
+AAGAGATTCAACCACTTAAAGTAATAAAGGGTGGGGTTGATTCTGGTGTGTGGGGTGTTG
+AACTACTGGCAATCAGATATGCAGCATGGATTAAGCCGGAATTTGAAATCGAAGTTTATG
+AAGTTTTCAAAACGGTTGTCCGTCTCGGCGTTGGTGCTATGTCTCGCCTGAACAAAATTG
+ACCACATCATCAACACGGAAACCAAAGCGATAAGCCAGTGCGCAAGTCAAATGGCTAAGT
+GGGGCGTTGGTGGGCGGAAAAGATTGCTTCACGTTGCTCGTGAGCGAGTAGTGAATGAAG
+TGCAAATGTATTTACCCGGCATGGTGTGATTACAGCCGGTTAATCCAGTTTGTGCATTAC
+GACAGTACTGCTGGCCTGTCTGTCACTGTTAGCCAGCTGCGTGCCGAAGCAGAAAAACTT
+GCCACCCGCCTGGACGCCGCAAAGCACACCGCAAATCTTGCCGCTGCCGTCAGAAGCAAA
+ACAGCCGACGCCACCGCCGGAATGCTTGCCGACATGCTCGGAGATATTGCAGCAGAAGCT
+AAACGATATGCTGCAATCGCTGACGAACGTTACACCGCCAGGATAACGTGCGAATGGATA
+CATGGCTCTTTAAGAGAAGAAAAAAATATGTTGAGTCGGGGAAAGTCATATTGATTTTTG
+TTAACATTACTATTTTGGTAGGGTGGTAATTGATATAATGAAGAATTCATTACTACGAGA
+ATTTCATTATGAGAATAAATATTGATTACCTTAAGGGCCTAACTGGACTTTTTTTAGAAT
+CCAATCAGCACTTTTTAACCATATCTGAATTAATTGAATCGGGTTATGACATTACTACCG
+GAGAGGGGGCATTTCATGCACTGCTGCTTGCAGAACAGGGCTATATAAGTAATTTGAAAA
+ATGAAACTGGAACCCCTGAGTCCATCGGTTTGTTTGTCACCAGGAGTGGAGACTTTGATT
+ATACAAATTCAAAGCTTAGATTAACGACTGATGGTATGGAATTTGCATTGTCTCTAGATA
+AGGACGATGTTTTTGAGCGCTTGAAGAATCTTAGTAATGAACCTATTTCAGTAATAAAAG
+ATGTTGGTGTTGAATTATTGAAAGGATATGCAAAAAAGAAATTTGGTTTGAGTGTTTAAA
+TTTAGTTAAATTCCATGGTGATATTTACATTAACTATCCGTCATAATTTAACACTTAATT
+TCTGAATTATGGCAACACGAGGTGTAAATGGCTGAATTAAATTATGAGGCAATTGGGCGT
+TGCAAAGTACTTGGCGAAAGTATCAGACGACTTGATATAGACCGCAACAAGTACATCCAA
+GAGTTACGCGCTGAAGTATCTAGATTAAGCAAAGGTAACTCGAATGCTACTCCACCAGTG
+ATAGTTATCTTTGATATAAATCTGATTAATACATTATCGGAGAGAATTGCCATTGCTGAT
+AGTGATCTTATGTCAGCTGTTACAGAGTTTAACAACTGGTGCCAGGATGCAGGAGAGAAA
+CCTGTAGTTCTTAAAGAACCTTTCCGTACATAACTGCTAGATTATCACTACCACTTATTT
+ACATAGCCTCGCATATGCGAGGCTTTTTTATGTGCAGAACACGAGCACCACCATGGATTT
+TTGTAAGGATGAACCATGCCAGCACTAATTCCTCGAGCCTGTCGTAAGCGCGGCTGTCAC
+AGTACAACAACAGATCCATCCGGATATTGTGAAGGCCATAAAAGTGAAAGCTGGAAGCAA
+TACAAGCCAGGCCAGTCCCGACATCAGCGCGGCTACGGTTCGAAGTGGGACATTATCCGT
+GCGCGTATCCTGAAGCGTGATCAATACCTGTGTCAGAACCATCGACGGCAGAAGATAGCT
+AAGAAAGCGACCAGCGTTGATCACATCATTCCAAAAGCTCATGGCGGCACTGATGATGAT
+TCGAATCTGGAATCGTTATGCTGGGAATGCCATCGGGCCAAGACAGCCAGAGAGAGACTG
+AACTGATGGTGTATATCCACTGCACATATTGTGGTTCAAAACTGCATTCAGTCGCAGTCG
+CTAACTGCCCAAAAACATAAGGAGGTCAGTATGTTTATGTTACTGCTCAGCGGTAACCGA
+TATACCCCTGATACCTTCATTTCCGTCAGGCAGGTGTATGGCTCGGTGATGCAGAACGCA
+GGATTATCAGTGGTGGTCAGGTCTCTGCGGGGAGAGGCCGTCAGCAGAGGGCTTATGCTT
+AACGTGCCCGTCAGGATTGTCGGTGGAGCGGTCCTGAGTGGTGGGGACACACTGGTTAAA
+CCGGTGAAAAGTCTCCACGGTTTTCTTTTAGTGACAAAAGAGGTGTGAGTTGACGAATAC
+AGTTAATCCCCTGACAGTACTGGACATCAGAACGCTGGTCGGATTTAAACAGATAACGCC
+TGGTGAGATTACCGGGGAGCCGGTGGAGGCCCTGAAACGGTGCGGCATTACTGCTTTCAG
+GGACATTGTGCCAGGAAAGTCGGTTATCCGGACAGGCAGTATGATGGTGCAGGGCAATAC
+ATTTTATGGCCTGCAGGCGCAGACAGAGAAAAACATGTCTGCAGCAACATTCACGCTGGA
+ACTGCTCCCCCGAATGCTGGATCTGAAGGTGCAGGCCATACAGGTTGGTTTCCGCATGAG
+TCAGAAGCCGGTAGTACTCTCGCAGGTGAACACTACTATGTTATCGATACCAAGAAATGG
+GACTGCGCCCACAAGGGTGAATAGTGTCAGAACAGCAACGGAGGAAACCAGCGCGTACTA
+TGAGCTGGTAATAAGCACGGACAGTCAGGGGGTAAATGCAACTGTACAGGTGTATGTCAG
+CCGCCAGCCTGTGGAAAACCTTACTTTGACAATGGCTGGCAGTCACGGTGAATACCCTCT
+TGCACTGACGGTCGGGTCAGTATTCAGCCCGGTGAAAGAGGATGGTTTCAGCTTTATGGT
+CGGAGATATTTATATTGCTCAACTGGATTATAACAGCGACCACACGGTAACGCCGCATCT
+GCTGGGTAATCTTACGCTGGAGCCATTTAAAGTAGCCTCTTACGAGGGGGACCGGCACAG
+CAACACTCACGGTGAGGATATTGTCACTGCACTGAACACGCTGGACCCGAATAATGATAT
+GGGGGTGCTGGCGGTGAAGCCGGTGGCGCAACCGGCCAGCGTGACGTTTGAGCTGCCGGA
+CAGTACAGGGAAGGCGATACTGGGCGTGGCGCTGAATGTAGTTTATCGGGACTCTATAGC
+GCCGGAAAACCGGCTGCGTTATCAGATAACCGAAGGCACAACACAGCTGCCGGTGGAGAT
+TATCACCGAGCGAAGGGCGGATGTGACCGGGTTTACCACATTTAGTAAGTTCATGGCATC
+CCCTGTGGATGGTGGAGAATGGAATGCCGAAAATCTGGCGTTCAGTATGAACCTGTTAAA
+CAATCCTGGCGAGGGGCGTTAAACAGAAAGTTTCCTGCAGGCATCACGAAGTGAAACCCG
+GCTCCGGCAATCATCAAAATGCCTCCGGGAATCCCCGTCCTTCAGGGCGGGGAGCAGTCA
+ATGGGGAAATTACCGGGAAGTGAAATCTGCATGAAAATGGAATACCAGGAAGGAGGTGCT
+GAGTCCCGTCTGAAACTACGTGTGAATAATGAGCAGACTAAATGGAATGTGTCCTAAATA
+TGATTGAAAGCGTTGCATTAAAGATATTAAAACCTTGAGGATATTTAAGTATCAGTACTG
+GATGGATGATAGTGAGATGATGTGAGGTATATTTTCAAAAGAAATTAATAGCTGCTGTAT
+TTTTGATATTAATAATATAAAAGGAAATGAAATATGCCGTTAAGTTTTTCAAGTTTAAGT
+TTAAATACCTTTGATGGGAGCGGGAGCATAGATACATATACGTTGGATATGCTCGACAGT
+ATACGTAATGAAGCCAGACCTGCTGATGGCGGGACTGGGTCGACTGAAATTCAGGTGCAA
+CTATCTGATGTGCTATACCAGGTATGCCATCGGCCCGATAAAGGCTTATTTAACGTGGTT
+CCGTTGTGTGAGCCGGGGCTGGATCGTTTTTCTTGTCAGGTAAGGGAGGGCAATGCAAAA
+AAGCTGGCAAAAGAATTAAACATTTCATGGAAGATTGATTTATGTAATTTTCAGGTTGAA
+TCAGGAAGTTTTGCATGTTCTGAAGAATATTTAACATGTCCGATAACGATGGCTATTCCA
+ACAAACGGTATTTTTGTTAAAGCATCATCACGGTCAGATGTTTGTCACTTATTTGATAAA
+GAGGCATTCTTCAATGTACTGTCCCTGGAGTTAAGACACCCTTTGAGTCAGGAGCCTATC
+CGTAGTGATATGATAGTTAGAAAGAGCGAATGTTATTTTAATACCGAACGTGATTGTTTT
+ACCTTAAGATAGAATCTGATTAAACATTATCAGATGAACATGAACTTTGTACGGACAGGC
+GGAGGCGGCTGTCTTCACAGCTTACGAGTCTGAGGAGTAAGAGACCCGGCAGCGAGAAAT
+CCCCGCCACCTCTGATGTAACAGGTACTTCAATGCACCCGTACTTAACCCGCTGGGCGGG
+TTGGCGGGAGGGTAGATTATAATTAAAGCCCACTCAGATGGCTTTTTAGCAAGGCTTATC
+CGAGAGAGCCGTAAAACCCCGTCCTTTTGGGGCGGGGATATAAGGCGTGCCCTTGATCTT
+CTAACTAACCAAGAATCCCCTTCCTTTAGGGAGGGGAGTGTCAAATTACGCCCAGGCCAG
+TGGCAGGATGGATGACAGAACACCCGGGAAATGTTCTCTGGCATGACGTTGCATATCATA
+CGCCACAATGCTGGTACAGGTAAAGGCATTATGGAGGCCGTGAAAACGGTTGGACCAGTC
+GGTAAGCTTGTCTACGGACGGGAATATTTCCGGAGACAGTTCATACGCTTTCTGCATCAG
+CGCCTCCGCATAGCCTCTCAGGATAGTCGGAGAATCGTGTTCAGTGCCGAAAATAGCGCT
+GGAGGAATAGCGTGCGAATGCGGTACTGAGACAGAACAGGGTTTCCGCCTGTTTCTGTGG
+GGTGGCATCAGTCAGGTGATAAGCATTGAGGATATGCTGGTAGTGTGGCGGGCTGAGTTT
+ACCTTCAGGAAGCAGGGATTCAAAAACAGCGTTCAGACGTGACTGTGAAGGGGCATCAAC
+AAACTTCACGTCGGAATATTTCTGTTTCGTGGCGGCAATAAACTGCTGGTTAAGCTCCCT
+GTGTTCTTCAGAGCTTAGGATGGTATCAATCAGTTGCCCAAAGCGTCGCTGTTGGGCCTG
+CTGATTAAATGCGGTGTGAAACACCGGAAAGTCATGACGGAATAATTCTTCCGGAGAGAT
+TTGCGCGGTGGAGACGTTCTCTCCCCCTCTCAGCAGGTAAAAGCGGTCCCATGCAGTGTC
+AGGTTTGGGGTTTAACATCGTTGACAGTGTGTCAGCGGAGAGCATCATCGCCGTGTCAGA
+AGCTCGGGAGGAGAGCAGCAGGAAATTATCTGCAGCGCTGGTTGTCCAGTCCGGGCTGCC
+GTCATAATCGCCGAACAGCCCATTATTGATGTGTGGAGACACCAACGGGTGAGCAAGATA
+CCGCTCATAAAGTGCCGCGGCTTTCTGGCGGATGTCATCAGTGCAGTCCACGCCTGTCAT
+ACAGTGTACAATCACCTGATTAAAGAATCCGCTGTGAGTGGTCATGGCGGCGCTGTTCCT
+GTCAAACGAATCCAGCAGCACAGGCAGTATGCGCTGCTGATGATATGTGTCAGGAGCTGG
+CAGGGGAACGTCATTATAGGTCTGGCACTGATGGGCAAAAAAACTTTCCTTAACAGGCCT
+GAGCCACTCGCTGATAAGTACACTTTGCGTATAGGGGGGGTGGGCCAGCACGCTTACCAG
+CGAACTTTCAACTGGCCGGATATGTGCCTCTGATAAGCAGCCACTCCGCAATGACTTAAC
+CAGGTCTTCCATTGCCCGGACTTTTTCCTGACTGTATTTATCGGGCAGGCTGTCAATGGT
+CATCAGAATACTTTTACCATCATTGTGTTCATGATTTAAAAATCCATCCACAGCGTTCTC
+AGTCCAAAGGAGTGGCATTTGTATCCAGATATCACCTAAACGAATAAAATCTCCGCCCCC
+TGATTTTGACGGAGGTGATGAATTATCCGGTTCATTTAAAATAACGCCAGAGAGGTTTGC
+TTTGTGATGCATACACGTATTTTTTAATGTTGTATTAATAAAAGAGGGCTGTTGTTGTGT
+AAAAACTGAATACTGTAAAAACGCATTATTCATATCTGAATGACTAAATTTCGTATTGCT
+GCAGATTGCACCACGCAGTGTCGAATAAGTGAACCGGCATTCGTCAAAATGTAAATCAGA
+TATATCAGAATGAGCGAAATTTGAATTTGAAAAGTTGAACCCCTTAAGGATATCGCCGTC
+TCGCTCCATGAAGCTGGAAGGCAATATTTCACTGAATAAAATGTAACGGAAATCTGCGCC
+TGAAAAATCAAGTTCTGTGGTCGAGAGAGTTTCTCCGGCTTTCTGTCGTAAAACTGCATC
+CGTGAGTTTCTTAGCCCATTCGGCAGGTGATGACGGGGAAGACGTAGCCTGAAGTGAGAG
+GGAGGGTGATACTGGTGGTGTTCTGGCTTCAGAAACCGTTGGCCTGTTATTGGCTGATAC
+AGAGACTCCACCGGGGAGTGGGGCCGCACCTGTCACTCTGTAATTATAATCACGTGATTG
+ATTTGCAATATTCTTATGCATGAATGCTGTAGTAATTTTTGAGACATCTTCCGCTGAAAT
+ATTTTTCTTACAGGTGTTATTTGTGTCAGTAATATTTTTAACAGTAATCAATGTTTTGTT
+TAAGGTGTTTTTATCTTTCGGATGAAAGAATTTTTTTATTTTTTGTGGTAACGCGAATTC
+AATCGGTGAGTCCTTTCCTATTTTAAATTTTTCATTTAAAGATATAGGTGTGTTTTTAAC
+GCTGGTTATTTCTGAGGAGAACCGGTTTTTCGTACGCTCATGGATAGTTTTAACTAATTT
+TTTAACCTGGAAGGGAATGGTGGAAAAATTAATTCTGCTTGATGATATATTCATTAAAAT
+CCTTTATCAACATCTGTTATGGAAAAACGCTCTGGCTTTTTAACGCCTTAAAAGTAAGTT
+CCATATGTTGCTATTGCAATAGCGATCACAATTCATCATATTATCTGGCATGTTTCTTTC
+AGAAAGTGTCCATTCTGTCATTATGTTTTGAAATAACCCACCGTGTGGTGGGGGCTGACG
+TATCTGCGGAAAAATACAGGTATAAGGGAGCGGGTCGGGTACCGAAGCCCATGGATGCGC
+AAAAGTGAACCCGCTTCGATGCCCAACCGTTGCCAGGCCAATCCGCTGGCGCCTGATTGA
+CAGCTCCCCGCCCTGAAGGACGGGGATTCCCACTTCAACGAGCCGAACCTAAGCCGCTTT
+GAGCGATTCAGGATTTACAGGCTCTCCGTGGGCTAACACTGCCAGCCCGGCAGCTTTGAT
+ACTACGTGCCGCGTTAACGTCCCTGTCGTGGTCAGTTCCGCACTCAGGGCACTGCCATTT
+ACGAACATCAAGAGGCATTTTTTTCATGGTGAAACCGCAACAGCTACAGCGTTTTGAGGA
+CGGGAAAAACTGGTCAATGGCGACTACTGACCGCCCGGCCCATTCGCCTTTGTACTGGAG
+CTGGCGCACAAGTTCGCCCCAGCTCGCGTCTGCTATCGCTTTGGACAGCGACGGGTTGCG
+GAGCATGTTCTTCACTTTCAGGGATTCGACGCAAACAACTTGGTTATCGTTAATCAGTTT
+GCGGGATGCCTTGTGCAGGGCATCCAGTCGGCAATCAGCAATTTTCGCGTGGAGTCGGGC
+CACCTTTAAGCGGGCTTTGGCGCGGTTCTTTGAGCCTTTGGCCTTTTTGCTTAACCGGCG
+CTGGAGTAGTGCCAGGCGAGCCGCGTATTTAGCGGTATGGCGGGGATTGCCGGACCTGAA
+TCCGGTATCGGTGACGAACAAATCTTTTAAACCAACATCAATGCCGACCATTGAAGAGGT
+GATCGGCAGTGATGCGGGTTCAAATTCGCAAAGGCACGAAACAAAGTACCGCCCTGCGGC
+ATCTTTGGAAATGGTGACGGTAGACGGCACGGACGGCAGCGGACGACTCCAGCGCACGTC
+TAAGGGGATTTTGCTCTTTGCCATGTACAGCTTGCCGTCGCGGTATTTAAACGCGCTCGC
+AGTGAACTCAGCCGCCTGCCTGTGCCGTTTGCTTTTGAATGTCGGATATGCAGCCCGTCC
+GGCGAAGAAGTTAGCAAAGGCGGTTTGTTGGTGGCGCAAAGACTGCTGGAGGGGAACGCA
+GGAAACGTCGTTAAGCCAGGCAAATTCCGGCTCCTTTTTCAGCGCCGTAAGGCGAGCGTT
+GGCCTGTAGGTAACCGATCTTTTCCTTTCGCTCGTAGTACGCATCGGTACGCCAGCGGAG
+GATGGAGTTGTAGACGAAACGCACACAACCGAACGTCTGAGCTAAAAGCTCAGCCTGCTC
+AGTCGTGGGGTAAAACCGGTATTTATATGCGCGTTTCATAGCCTCACATATTAAAGAGGA
+AAATGTGATTATGCAAAAGACAGTTAGCCGGAAAACCGCCTCCTTTCCTCCCCGGCCTGA
+AGGCCGGGGTTTCCCGGAGGCATTCTGATGACTGAAAATACTCTGCTCCGGGACGAGCTT
+TCGTGATGTTGAAAAAATACCACTCCCTCCTTTCAAAAAGCGTATCAGCTTGATAATACG
+TTTGAGAGCGAGTGCTTAGCTAACCCGGAGATTCACTATGCAGTTTTCAACGACCCCAAC
+GCTGGAAGGACAAAGCATCGTGGAGTACTGCGGTGTGGTGACGGGCGAAGCCATTTTAGG
+TGCCAATATTATTGGTGCCTGGTCTGACGCCCGGCGAGTGGCGCTTTATCCCTGCATCCA
+TATAGTCGATTGCCTTTTGGAGTTCTTCAATCAAAGTAATGGCTTTCGTCCGTGAGATAC
+ACATAAACTGGTCAAGGAACTCTTGCAACGTCAGTAGCATTCCTGAACTGACAGATTTTG
+AAGTGAGCTATTCACTTCTCACGAACGAGGTCTATCTGTCCACCTCATTTACAGACAACA
+TGGCCTGTATACCAAACTGGCCGTTGGAATCTGTACTGGTCATATGGTTATCTGATACTG
+TTTTTTTTGTACAGTTCATTATTCGGTGGTTGTGTAAGTGTAGTCAAGTGGATATGCCTG
+ACTGGAAAGAATATTGTTTGTTTGATAGGAGCTAACTTTTTGTTTTTGCTGAATGTTTGA
+AATAAAGTAGTATTCTTTCTATTTATTATAACCACATGATAATAAATAAATTTTTTCCGG
+TCTTGAAAACCGGCGACCCGAAAGGGTTCCAGAGTTCGAATCTCTGCGCTTCCGCCAGAT
+TAAACAAGGGGTTACCGAAAGGTAACCCCTTTGTTTTTGGGCTGTTAGAATACACTTAGA
+ATATTCACTTAGAATATTTTCCCTTGTTCCTTTAACGGCAGACAAAAAAATCCCGCCGAA
+GCGGGAGAATTTCAGGCCTGGATGAGACGCTTAAACAGCAACTGTTTGATGTCCTGACGG
+TGCGACAAAATCGCATGTGCTGTTACTGTCGAGCCATCCACCGAATACAAAACACGATAC
+CCGCCTGCGGTATTGCATTCCCGGTATTTTGCCACCCCGAGTTTCATCAGTTCCGGGCAA
+ATCTGACAACCGAGCGGAAACTGGCCTACCTGTTTCTCAAATTGTTCGAGAATTTCTGAA
+ACCACAGGTTTAGCTTCTACCTCATGCCGGTGGAGAAAACTTGCGATATCGTCGACGCAG
+GTTTTGACGGTGTGTGTGTATTCGATTTTGACTTTTTCCATTACTGGATCCTTATATCAA
+TTTCTCTCATATAAGCCCGTCCAGTAACTGCTCCTTTGAATATACGTTGCCATTGGTTTT
+GTCCTGCTCTGACAGGGTAAGAAGTTTCAGAAGAGCAATGGCGTTTTCCCGCTCCTGTTG
+CTGAGCATATGACTCAATAACATACGCGGGTACACCATTTTGAGTTACCAGTATTGGCTC
+TGACAATTCGAGAGAAGCAGCATTCTTCTTGACGAAGCTGATCGTTTCTACTCGCATTAG
+GCGTAACCTCGCTTTAAATAAAATCCTCAGGATTGTTGATTCGGCCTAAATATAGACCAT
+ATTTAGGCCTTTGACAACTATGCGAACTGGCTGATAGCCGGGATATCAAGGGAAGGGGTT
+ACTTTAACCTTACGATCGTAAACCAGTACCTGGCTCTCGGTTTTGTGGCCGGAGAATAGC
+TGCTTATCGCGACTCGATCCTTTATAGTCAGAAATCGCCTTTGCTTTGATGTCGTGGAAT
+GTACATCCGAACGGTGTTCCGGCTTTTTGCTCTGCGGCTTTTTTTGCTTTGTCCCACCAC
+TTATTAAGTGTCCTGCCCGTCACCTTTTCGCCGTTAGCGTTGGTGATAACATATTTTCCA
+TTTTCGCCCATAGTATTTCTCGCGAGTTGAAATGCGGAACGAAGGCGAGGAGACTGCTCC
+TTAATTTGTTTCTTCCCGGTTTTTGTTCTGCTCAATAAACAAATCAGCATCCATCACATC
+ACCCGAGACCTTCTCCAGAACGTCCCCTGGCGGGCGGCGCACAAATACGAAACTTCCATC
+GCAACGCGTAATGTAGGTGTGGTTTCTTCATAAATCGCCGCATAATGCTCATCACTGATG
+TAGACGGTACGTGGTTTCGAGATAAATTTACGTCCCCTTTTTCAGGGGTTCCCCTTCACA
+TATCCACGTGCAAATCCCCATCCGTAAACACGGCTAAGGCTCGCGAGCTGTGTCTTACTT
+TTCAGCCTTCTCTTGCCCATAAAAATTCTGATGTGTTCTGTTTTTACCGTGTCTGCACGC
+ATTTTCCCAAAAACAGCCAGCAGATTACGCTGGGGCTGGTGATACTCTTTTTGAATTCGT
+GGTGCTGGCTCGGTACTGGCATTTTATCGGGGATATTACCGGGGGGCGAAATCTGCATGA
+AAATGGAATACCAGGAAGGAGATCAGGAACTCCATCTGTGAACACGGCTCAATAATGAGC
+AGACTAAATGGAATATGTCCTAAATTTGATTGAAAGCGTTGCATTAAAGATATTAAAACC
+TTGAGGATATTTAAGGATCAGTACTGGATGGATGATAGTGAGATGATGTGAGGTATATTT
+TCAAAAGAAATTAATAGCTGCTGTATTTTTTATATTAATAATATAAAAGGAAATGAAATA
+TGCCGTTAAGTTTTTCAAGTTTAAGTTTAAATACCTTTGATGGGAGCGGGAGCATAGATA
+CATATACGTTGGATATGCTCGACAGTATACGTAATGAAGCCAGACCTGCTGATGGCGGGA
+CTGGGTCGACTGAAATTCAGGTGCAACTATCTGATGTGCTATACCAGGTATGCCATCGGC
+CCGATAAAGGCTTATTTAACGTGGTTCCGTTGTGTGAGCCGGGGCTGGATCGTTTTTCTT
+GTCAGGTAAGGGAGGGCAATGCAAAAAAGCTGGCAAAAGAATTAAACATTTCATGGAAGA
+TTGATTTATGTAATTTTCAGGTTGAATCAGGAAGTTTTGCATGTTCTGAAGAATATTTAA
+CATGTCCGATAACGATGGCTATTCCAACAAACGGTATTTTTGTTAAAGCATCATCACGGT
+CAGATGTTTGTCACTTATTTGATAAAGAGGCATTCTTCAATGTACTGTCCCTGGAGTTAA
+GACACCCTTTGAGTCAGGAGCCTATCCGTAGTGATATGATAGTTAGAAAGAGCGAATGTT
+ATTTTAATACCGAACGTGATTGTTTTACCTTAAGATAGAATCTGATTAAACATTATCAGA
+TGAACATGAACTTTGTACGGACAGGCGGAGGCGGCTGTCTTCACGGCTTACGAGTCTGAG
+GAGTAAGAGGCCCGGCAGCCAGAAATCTCCGTCACCTTCGATATGTCAGGTATCCTCAAC
+GCACCCACATTCAACCCGCTACGGCAGGTTTTTTAATGTTCGGGAAATACTGGCACGACA
+AGAGGCTGCGATGGAGGCCTGATAACGGACGAGGTTTACAACAATGGCTATTCTACGCAA
+TACGAAAATATTTTGCGTCTGGCCGGAACTGGTGATGGGGAGATATTAATCGGATGGAGT
+GGGGTAACGGTGCGCCAGCTCCCGCCTATCTCTGTGGCCATCGTGATGCCGCTGACGCTG
+AGTGGTCCGAATGGGCAATGCTCTACACCTTACTAAATCCGCCACTGGTTCGTATCCAGT
+AGGGGAGGCGATTGTATGGCTGTCTGATGCCACTCCAGCAGGTTACGCCCTGATGTACGG
+GCAGTCCTTCGATAAATCTGTTTACCCGCCACTAGCGATAGCCTATCCAGCCGGCGTTAT
+TCCGGGCATGTGCGGCTGGACAATCAAAGGTAAACCCGCAAGCAGCCGCGCAATGTTGTC
+ACAGGAAATGAGCGGTAACGAATCGCACAGTCATAGCGCCAGGACGCAGGATACCATAGG
+GAGACTGGTAGACTGTGTTGATACCTCAAGCCCCACCAGGTCGGAAATACCAACATGATG
+CGTTTTGTACGGGCTGGATTTCCGGTACACTGTTGTACTCATATTCACACTTAAAATATT
+CTTATCATTCTTATAAACAATTTATATAAATTGTTTTGCATGTTAGCATTCCATATTGGT
+TTAAATTCACAGGATTTTTTAAGAGGTATGACCACTATAGCAATTGTTACTGCTTATTTT
+GATATAGGCAGAAGCCAATGGACATCTCAAAATGGATTTGCTCCATGCATTGAACGAGAT
+ACTGATGAATATATGGCCTGGTTTTCTAATCTTGCACAACTTGAAAATGATATGGTTATT
+TTTACCTCACCTGACCTCAAACCCAGGATTGAGGAAATCCGGAGAGGAAAACCAACAACG
+ATTGTTACATTAGATTTCAATAAAGAATTTCATCATATCAGGAACCGGATTGCCTCTATA
+CAGTCAGATGTAACGTTCAGGCTTAGAACACCTGTCGAGCAGCGCGGGAATCCAGAGTTC
+CTGTCGGCTGATTACGTTTTACTCTGCAATCTGAAAACATACTTTGTAAATAAAGCTATC
+AGGCAGGGGTTGATCAAAGACGACATGGTTGCCTGGATTGATTTTGGATATTGTAGAGAT
+TCAGATACCACGAATGGAATAAAAACGTGGTCCTGGTCCTTCAATAAGGAAAAAATGCAT
+TTTTTTACGATTAGAAGGGGTCTTAAACTTGAAACACTGGAATCAGTATACAACTGTATG
+TCAGGTAACCGTGTGTATATCATCGGTGGCGTTCTGGTCGGAGCGCTGGAAAAGTGGCAA
+GAATTTTACAGATTGGTGTGGCATTGCCAAAAAAAGGTGTTGAGAGAAAATATTGTGGAT
+GATGATCAGGGGATATTTCTAATGTGTTATTATTATAGACCTGACATGATAAAGTTAAAC
+TACCTGGGTAAAAACAAGTGGTTTGATTTATTCAGATGTAAGGGAAGGCGAACGATTCGT
+ACTTTTTTTCGCAAGATGAGAATATTATGTCTATACAAATGAATGTGTTAATTTATAAAA
+AGCCAGGCATGTAGATTATGCCGGGCTTTTAAAAACTGAGAGATTTATTTTTTACCCTGT
+ATCTCTAAATGAGACTGGTTTTCATTTGCCGATTTCACTCTGTCATTATTCATTTCACTA
+TTAACAATCTTTTTATTAAGCATATAACCAATGAGACATGAAAGGATAGACTTAATCATT
+AGACCACTTAGCCATCTGTCCTTGCTTCTGAATTGTTCAGCGAATGAACAATCAAATTTG
+TCATTGGTAGATTTATATAGAAAGGTATGTACCATTGCTCCCTGCCTATCATAATCCCAT
+GACCTTTATTGATCATTTGTTGATGACACCAGATGCCAGGTCGGAAATGGCGTAAACCCA
+GCATCGCAGGAACCCGGTAGCAGACTGTAAGGGCAGATAGCACTTCCGGGCATATATCTA
+CTGAAAAATCAACATATATAGAATTGACTCCAGATCAGAATAATGTATTTCTATTCCTCC
+TCCGGTGAAAGTGGTTCCTCCTTAATCTGCACTAAGCGTAATGCCATGCCCGGTTCAAAA
+TGCTGGTAATCCGCTCCGTAGTCAAACCACAGTTCTTCCCCGGCGGAGATGTCGCGTGTG
+GTGAGGTAAAAGGTAATATTCTTTCCGACAAGGACCGCGCTGACGTTCTGTCTTGCTTCT
+GCCTCCGCGGTCCGGCGGCCAAATACCGGGTTGTTAATCAGGCTGAGGAGATTTCCCTGC
+GGCCAGGCAGAAACGATTCGCTCCTGGCTTCGTGTGGCAAAGTAATAATTACTGGCTTCC
+CTGCCGTATTCTTTTTCATATTCATACCGTACCGTTTCGCTTTCCAGCAGGCGGCCGGAG
+TAGGGCCCCAGTACGGTGAAGGCGGGAAGGTCAGTACGCGCGTAAACGGTGCGCCCCCGG
+TAGCCGTCGCTGTCATCAAGAGGAATCGACACGGTCATCATGTCATTCATGCGCGCATCA
+TGGTTACCTTCATTTTGCAGGAACCACTGGACATCCTGATTAATCCGGGCTTTTGTCTCC
+CGGGGGAGCCGGTTAAAAAGGCTCCCCCAGAGAGTGACCTGTAAGGTCTCCTTTCTGCCT
+TCTGCCTGTGCCAGAACCGATACCGTCGGGTCACGCCAGTGCTGCAGAATCGGCAGGTTA
+TTGTTTATCTGATGCGTCCGCCAGGTCACGGCGTCTTCCTCTTTCTTAATCTGTTTTGTC
+GTTGGAACCGGAATATCTTCCCCTGCCACGGGGATGGCGCGCTTATCGCCGCTGCTTGCC
+AGAGATGTATCCGCCCTGACGGTGAGTGACCCCCTTCCACCCGTGGATGTTGAAGGCTGT
+GAACTGTCCTGCGTGACAGTGGTGGTGAATAACGTGCTGCCGTGGGGCATTTTGCTGTCT
+GCCGGTGCCAGAGATTGTCCGGTACGTTCGTTGGATATCCCCTGTGCCTGCGCCCATGTT
+CTCTGGCCGCCAGCCTCGCGTGTCGCCTCCGTCGACAGGTTCCGCCATGTCTGCATCGGG
+GAATCGGTAACAGGGGCATTCCTTTTCTTTGACTGCTGCAGCCGCACTACACCGCGGGGT
+GCCAGTCCGGTGTTTGTCAGAAAGGTTCTGGCACTTCCGACGGATATTCCCTGTGCCTGC
+GCCCATGCTACCCAGCCACCAGCCTCGCGTTTCGCCTCTGGTGTCATGTCCCGCCACGCT
+CGAATCTGTTTACTGGTAATAGAGGTTCCTTTTCCCTCTGGCGGCCGCAGGCGCGCCACG
+CCGCTGGAAGTCAATCCGGTGTTTGTCAGATAGTTCGCTGCACTTATGATATTTATTCCC
+AGTGCCTGCGCCCATGCTTTCCAGCCGCCAGACTCGCGTTTTGCCTCCGGTGTCAGGTCC
+CGCCACGTCTGAATCTGGGTTTTGGTAATAGGGACGTCCCTTTTCCCGGGCGGCTGCAGC
+CGCGCCACACCGCGGTATGTCAGTCCGGTGTTTGTCAGAAAGGTTCTGGCACTTCCGACG
+GATATTCCCTGTCCCTGCGCCCATGCTACCCAGCCACCAGCCTCGCGTTTCGCCTCCGGT
+GTCATGTCCCGCCATGCTCGAATCTGTTTACTGGTAATAGAGGTCCCTCTTACTTCTGGC
+GGTCGCAGGCGTGCCACGCCGCCGGGAGACAATCCAGTGTTTGTTAAAAAGTTCGCTGCA
+CTTCCGACGGATATTCCCTGTGCCTGTGCCCATGCTCTCCAGCCACCCGCCTCGCGTTTC
+GCCTCCGGTGTCAGGTCCCGCCACGTCTGAATCTGGGCGTCGGTAATAGAGGCTCCTCTT
+CCTTCTGGCGGCTGCAGTCGCGCCACACCGCGGAGTGTCAGTCCGGTGTTTGTCAGAAAG
+CTTTTGGCACTTCCGACAGATATTCCCTGTGTGTGCGCCCATGCTCTCCAGCCGCCAGAC
+TCGCGTTTCGCCTCCGGTGTCAGGTCACGCCACGCCCGAAGTTGTTTGTCCGTAATGGAG
+GGGCGCTTCGCCTCAGCCGGCAACAACCGCTCTATGCCGCGCGGAGTCAGTCCGCTGTTT
+GTCAGATAGTTCTCAGCATTCCTGATGGCTATTCCCTGTGCCCGCGCCCATACTTTCCAG
+CTACCAGCCTCACGTTTTGCCTCCGGCGTCAGGTCACGCCACGCCTGAAGTTGTCTGCTT
+GTAATGGAGGAAAACTTCTTCCCGACCGACAATAACCGCGCTACGCCGCGGGGAGTGAGT
+CCGCTGTTTGTCAGATAGTTCCTGCTACTCTCGATGCCTATTCCCTGCGCCCGCGCCCAT
+ACTTTCCAGCTACCAGCCTCACGTTTTGCCTCCGGCGTCAGGTCATTCCACGCCTGAATC
+TGCGCGTTGGTAATGGAAGGGAGCTTTGGGCGCGCTCCAGGCTCTGTTACGGTAGCGGTC
+CTGCTGTCAGAGCTTACTGACAACGGTAGTTCTTCCTGGGAATGTGCTGCATGCCATTCC
+GGGTCGCTCAGAAGGAGTGTGACAGTAGGAAAGTTGCTGCTTTTACCGGCGGCAATTGCG
+CATTGGGTTTCACCTGTGCCGACCATTCGCTCTGCCGTAAAATTTGCCTGCCGTCCCGGG
+GACGCCAGTGCTTTTAGCCTTAAAAAGCGCTTCAACCTGTCCGGTGCCGGTGTGCCTTCC
+TCCGGCTGATAAAAAACGCGAAAGCAGTGTGCAGCCTCATCCTGAGCGGTCAAGGGGAAC
+CAGTCCCGGATATCGTTCCACGCCCGGCTTAAGTGGGTATCTGAGGTGCTGCTGGCTGCT
+GGTGCGTGAAAATGAATGACTGACCCGATACCCCGCATGGTGCCTCCTGCTGATACCCGT
+CTGGTTTAACGTAAACAGGAGAACGCTACCATCGCGCCTTATAATTTTCTTTTAAATAAT
+GTCCATCTGCATGAACGTGCTCCGGTCCTGTCGATTTAAATCGGTCAATTCCGTGAGTGG
+CCGAGTACACAACAGGGGGCGAAAAACTGTGGCTATCTGACTGGGTAAGCCGAGGCAGAA
+CGCTTTCATTGAGCGCTTTAACCGGATATACCGTACAGAAATACTTGCTTTTATCTGTTC
+AGAACACTGAATGAAGTGCGAGAAATTATAGATAATGGTTGTCAGAATATAACTGTTAAC
+GCTTGTATGTATCACTGAACAATATGAAGCCGGAGGAATATCGACAACCCCCTTATTTGG
+CCGGGAACTAAAAAAATACATGGAACTAAAATGAGTCTATTTACAACTGTTTCATAAGGG
+TTCAAAATCAACCGTTGTGCCAGGAATCTTACCTGACAACCTGTATGCCACCCTCAAATT
+GTTGCGTTGAGCCTGCTCCACCAGTGAAATAATCGTGATGAAAAATAGTCCAGGTTGTCA
+CAAAAAAACGGATATATAATAATTAGTCGGTTAAAATCGCAGCGGTCAGTTTAATTGGTG
+ATTAATTAAATAAATATAGTTACCAGTCTTATATACACGTTAATTATTAAAACAATCACT
+CTACGGTAGAGTAATGGTTTAGATTTGTTGTGCTATGAATATCATTATGAAGCGGCATAA
+TGCCTTATGAATAAATAGGCGAACAGTCATTTATCATTATGACGGTTAACTTTCAAGTAA
+CGGGTGGAGCATTATGATTTGTTGTTATCAATCGGTGAGGCAGAAGGGGAGAAAAAGAGA
+TGAAATACCAAAAGCGACTAGCGGGAATGATGGTTATTACCGTCATGATGATGACGGGAT
+GTTCAACGTATAATCCCGTACAACTCCGTCAGCATCAATTAGAAAGAAACTATACTTATT
+ATCTTCTTGATCCTCCGCTGTACGAAGGAGATGTAGTAGAATATAAATGTAAAGACGGAA
+GTCAGGATACAGTGACTATTCAGAAAGTAACGCCGCAGTCATTAATCACCAGTACTGGCC
+AGGTTATTCCACTATCTGATCTGACCTCACTTGAGAGAAAGGATATTTCCAAAGGGAAAA
+CCGCTGCTGCTGTGGGGGCTGGCGTTGGCGTGACGGCGCTGGTTATTGCTGCGATTTTTG
+CTGCCACCCTGTCTGCCGGATTAGCTGCAATGATGGTCCATGGTTAA
+>NC_015761.1|provirus_3084741_3115735
+TCAGAGCCACAATGGTCGCTGACCACCAACAGTCGGGTGCGGCGGTGCCGGGTCGATGGA
+TCCCGGAGTAACAATAAAGCGTTCTATCGTTTCCATTGTCATAAACGTACAACTGCAGTT
+GATATTCTGGCACTGGTGGTAGCGCTCTTTCGTATTTTCGGTTAGATAGCGGCTTGTTCG
+CGCATGTGCGGCATGATGGCACTTCGGACAATGAAACATAACCCACCTCTTATTCTCAAT
+TCGTGAACCAATAATAATCACTAATTCACTTTTTGTGAATACATTTTATTCATCATCCGA
+TTCTGCACTGTACTCCACATCAGAGAGTTTAACCTCAAGCTCTAAGCCCGTCGTGAAGCC
+ACTATTATTCATATTGTGAGTCACCTTACTGATTAACCACGATTGCTCGTCTATGACGCG
+CTTAAAGCCTGACACGCGCACCGGTGTCTCAGGGAATAAATCAGCCCTACCAAGCGCCAG
+CGTAATTGAAAACTCCGCAACGCCTCGCTGCAGCTTATCCCACTTAGCCTGAGCGGCGCG
+CATCGCCTGCGCCTTAGAAGCGTAGACCGTCGTCAGCGCCAGTACGTTATCGGCCTCACC
+GGCCATATACTCACCCTCGCGAGCCTCCGGCTCTTTTCTGGACTTCGTCTTTTTGCTGAC
+CGGCTTTGCTTTCGGGTGTTCCAGTGCGCGAAGGTGCTTCTCTTTTGGCTGGCGTTTCAG
+CGTCACTTTCTGTTTTTGCGGCTTCGGGTCTTTGGTGTGCAACCATTTAGCTGTTACACC
+GGTATAAGCTCCGCGGTCGGCAATGGCAAACTGATGACGGTCGCCGTCACTGCGGGTCAG
+CGTCATTTGTGGAATGGGCTTACCGCTGGCCGTCAGCGCACTACCGGCTTTCAGAAACAG
+TAGTTTTCCCGCTTTAACCGATACAGTCGCTCCGTTTCGGTCAGCCAGCCGGGTAAGAAA
+TACCGCGTCGGATTCCTGCGACTGGTCGATATGTGGTACCGGTATTTGTTTCAGCGAATC
+CGCGACGCTGGCCGTCAGTTTGTTACGCTTTGCGATGGTGCTAACCAGTTCGCCGAGGGT
+GGTGTCGTGCCATGATTCCTCGCGCCGTGAATTGAGCGTGCCGCGAAAGTCTGCACTACG
+CGCCCGGATGGTCAGGGTATCAGGCGCACCCCGGTGCTCAATCTCATCGACCGTAAAATC
+GCCTTTATTCAGAAGCGCCGAACCTTGCCAGCCAAGCCACAGCGTCAGCACCGCCCCGCG
+CATGGGTAATTCGACTTTTCCGTCGGTATCGTCGAGCTCAATGTCGAGCTGGTCAGCCTC
+AAAACCCCGGTTGTCGGTCATGGTGAGAGAAATCAGCCGGTTACTAAAATTGCTGGTAAT
+GTCCTGGCTGTTCAGCGTTAGCATAAATGCCGGTGCAAGACTGGCACCGGCGTCAATGGT
+CATGCCCGTAATCATATGGTCAGCCCTCCGAGCGCACCCTGCAGCTTATCGGTCAGATTA
+CCGGCAGAGCCGAGAAGCTCGCTCGCCTGTTTATTCAGGTCGCCAAACATTGCCGTCAGT
+GATTCATCGACCCGTTTTAGCGAAAGCGTGAAATCAATCTTTCTTGCCGCGCCATCGCTG
+AAAAACTCGGCGTGCGTGGTCGACACCTTATCGATGATATACATCCCGAGGATTTTGCCG
+GTCCCCTCAATCAGCGGCCACGCCCTGCCCTCATCGGCCATCAGTTCCACAGCCAGCAGG
+GATATATGACCGCCGGTAATGGCAGGGTAAAGCGTACCGGCAAGCTGTATTGAGGTTTCC
+CCCTCGCCGAGAAACTGATATGCAGGCGGTTTACCGACCCGGTCATTAGACGCCCAGCGG
+TAATCTTTCGAATGCTGCATTGACTGATAAGGCAGAGTACGGAGTTCAAATACAAACATG
+CCGAGAGCAAGCATCATCGTTTAATTCTCCCTTAGTCGTGGCTCATGCTGGCGCGCTGAC
+GCGCACGCTTTTCGCGCTCAATTTGTTCGAGTGTGTCGCGTAGCTGGCGGTCGAGTTGAT
+GCCCCGGAGCAACACCGCCCGGTAGCGAAATGTTGTATTCGCTTTTGCTCTGGTCGATGT
+AAGAGCGTCCCGCCGGTGCGGTAACGGGCTGATAAGCCTGATACCCGCCATAGGTGCTGG
+TCGCCGGAATGTAGGAATTCCCCTGCGTGGCGGCGTTGGTTTTGGCGGCGGTCTGGTCGA
+GGCTGTCCGATTCTTTGTTGATGATGCCGAGCTTTTCGAGAAGCCAGTCGACACCACTGC
+GTAGCTTGTTGAAAACGTTCAGCGGTGCCATCAGCGCTGAGGCCAACGCCTGACCGAAAA
+TAACGCCAGCATTTTTACAGCTATCGAGCGTCTCCTGCGTAGCTTTGACCGGTGCAATCA
+GGTCTTTAAACCATTGCCAGACTCCGCGCAGCTTCTCACCGAGTCCGTCAAAAATGGGTG
+CCAGTGGTGCAAACATTTCCCCGACCGGAGCAAAAGCACTCATGATGCCCTCAATCACCC
+CCGAGAAAAATGCGCTGATGGGCTCCCAATATTTACGGATAAGTAGCGCCCCGGCCACAA
+TCGCCGTCCCGACGGCCACAATCGGCCAGGTGATTGCACCGAGAGCTGTCACAATGGCAC
+TACCGGCAACAGTCAAGGCGGTACCCATCACGCCAGCGGCGGCAATGATGGCGTTAATCC
+CCATGACAACCGGCCACGCAACGAGACCAATGCCACCGATGATACCAATCAGAGCAAGTG
+CGCCCCCGGCAATAATGCCGATAGTTGTCGCCAGACCTTTGTTTTTCTTGATCCAGTCGT
+CGAGCTTTAACACGTATTGTGTGGCGGTTTTGGTGAGTTTACGCAGCGAGTCCTCTTGCT
+GGTCAAAAAGGTCGGTACCGACGGCCTCATAAGCCGACTGGAACTCTTTAAAGTCGCCGC
+CGAGGTTATCCTGCATAACCTTAACCAGTTCCTCGGTTTTACCGTCCGAGGCTTTAAACG
+CGGCAGTGAGCCGGTCAAGTTTTCCGCTTGAGGCTGCTTCCATCAGTACCGCCGCCGCCG
+AGCTGGCCTCCTCGCCGAAAATGGTTTTCATGTACTCGCCGCGCTGGCTTGTCCCGAGGT
+TGTTTTTCTCAAAGCTGCGCTGCATTTCTTTCAGGATGGAGAATATCGGGCGCGTGTTCC
+CCTTGCTGTCTGACGTTTTGACGCCGAGTTCCTTAATGGCCTCAAACGCTTTTCCGGTGG
+GAGCCTGCAGGCGGCTGAGAATGGCGCGGCTACCCGTACCCGCCATTGACCCGGTGATTT
+TGGCGTCGTGCAGTGCACCGACCATTGCGGCGGTTTGCTCGATGCTTACCCCAGCATTTT
+TCGCCACTGGCGCGGCATAGGTCAGCGCGTCGCTCAGTCCGTCAAAATCGGCGGCGGTTT
+TGTTCATCGTCATCGAGAGAACGTCGCCAATGTGAGCAATCTTGTCGTTTGAAAGTTGAA
+ACGCTGATTTCATCCCGGTCAGCAGCGCAGCGTTTTCCTCCATTGAGCGCCGGTTTGACA
+GCGCCATATTCAGCGTGACTGGCGTCGCCGCCTGAATGGCAGCAGCGTCACCGCCGCTTT
+TCGCAATGATGATTTGCGCGCTCGCTGCGTCATCTGCAGAGGCTGCAGTATTGTCGCCGA
+GCTGGCGAGCCTGTTTGCGTAGCGCCTGCATTTCTGGCGACTGTTTATCAACCCCGAGCA
+CAGCTTGCAGCTCGGAATTTTTCTGTGCAAAGTCATAACCGGGCATTAGTAATTTAACCC
+CGGCCATCGTTCCCGCCGTCGCAATACCGACCCCGGCAGCGCCTGCTGCGGCCATGTTAC
+CGGCAAGCTCTTTACCTGATTTATATCGTTCTTTCACCCGGCTTAATTTCGCCTGCTGCG
+CACTGACGCGCGCCAGTGCATTACGCTGTCGGTTAAGCTGCGCCGTCGTTTCGCTGATGG
+AGGTTTTGAGTCGACGTTCATCGGCAGACAGGGTGCGGGTATTGATACCGGCCTGCATCA
+GCTCGGAACGCTGGCGCTGTACCGATGTTCTCAGGCTGTTATATTTCATCTGCAGCTCAG
+AGGCGGCACGTTTTGCCGCTTCGAGCGCCTGCGCCTGCGCGCGGGTCGGACTGGTGGTGT
+TTTTAAACTGCACAGCCAGCTCACCGGCTTCGCGCTTTGCCTTGTCAAGCGCCTGACCAG
+TCACGGCCAGTTGCGCGCTTGCCTTACGAAAGCCGTCGATTTTCGACGCCTGACCGTTCA
+GGTCGCGCAGACCCTTTTGTGTGTTGCGAATATCACCCGACAGGGTTTTACTCGCGGTCT
+GGATGGATTTAAGCGGTCGGGTCGCCTGGTCGACCGCTTTCAGCAATACCTCAAGCCTCA
+GGTTATTACTCATTGTGGTTTCCGCTACGCTGCAGCGCCTTTTCGCGCCATGTGATGAGC
+TCGGTCAGGCTCAGGGAACAGAGTTCTGATGGCGGCCAGTGGAATATCACTGCGATATCC
+GCCATCAGGTCATCAGTCGACAGGTCTGGCGGGAAGTCTATTCCGCCGAAGCTGGTGACA
+AAAAACCAATCACCTTAGCGGCCAGCGACAACATATCGGGCAGGTTCATCGCGGTAAGCT
+CCTGCGCGGTGAGCGCGGGGTAGGTCATGCGGGGCAGCACCTTAATCAGGGCGTCGACTT
+CGGACTGCGCCACCGCTGCCAGACTGACGCCGCGCAGGGTACCGGCGTTCGGCTCAATCA
+GGGTGACTTTATCAATCGTCTGACCGGCGCGCTTAATCGGTTTGTCCAGGGTCACGACGT
+TCGGGTTTACGGTGTCAGTTTCATTTCCAGCCGTATCAATAAATTCAGCGGTTTTACGTG
+GTGCTTTTGCCATGATGTTTTTCTCTGTTCTGAATGGGGTTAATAACCGGCCAGCAGTGC
+TGACCGGTCAGGGAATTACAGCCCGATTGCGCGGCGGTGCTGCTCCAGACGGTCGACGCC
+GTTCACCTTCTCGACCATGTTGACGGTGTCGATTTCGATGACGTCGCTGCCATCAATCGT
+GAGGCGGTAGTAGGTGCAGACAGTCGACAGTTTGGTCGAGGTGTTTTCACCCTGCTTATT
+CTCACCGCCGTCGATTTCTTTATGACGGCCACGCATGACCACCTCGACCGCCACGATTTC
+GCCGGTGTCGTCGCGCTGGTAAGAACCAGCAAAACGCAGCGGCACAGCATCAGCGCCCGG
+GGCGGCGTACTGCGCCCACAGAGCCACATCAGGCAGGCCGCCGACAGACCATTCGACGGT
+TAATGCATCGTCGTCGAGGCCGAGATCAATCGCTGCCGCGCCATTCATACCGCCGCCGCG
+ATAGTTTTCGAGCTTGCGGGTCAGCTTCGGCAGCGTCACGGATTCAACAACGCCCATGTA
+GCTGAGGCCATCGTTGAACATATTCAGGTATTTGAGTTTACGGGGTAGTGCCATGTTGTT
+TCAGGCTCCTTAGCTGTTGACCGATTCGGCCAGATTCACCAGATATTTATCGGTGATACG
+CTGGCGCAGGGTCAGGCTTTCCAGTGGCGGAACTGGTGTATAGTCGTAGTCGATATACAG
+TTTCCCGGCCTTGAGGGTTTCCTTGTCGTTCGATTCCTCATCGAACCAGCATTTACCCTC
+CACGATGTAGCCGTTTGATTTCAGCTCGCGGAATTTGGCGTTAATGCCGTCAACAATGTC
+ACGAATGAGCGTGGCGGTAATGGGCTTGTCGACCGCCCACATGTGCGCCTCCGCCATCGT
+GTCGGCCAGTACCTGCGCGGTGCGGGTGTAGTTCTCAAACAGAAAAAGCGGGTCATCCGA
+GCAGGTGCGGTTACCCCAGAAGCGGAAACCGTCCTTGCGTACCAGCGTTGTAACCCCGGC
+CTCGTTGAGCAGGTCAGCATCGGTGCCGGATGCCTGCAAATCCCAGAACACTGAGGCGCT
+GATGCCGGTAACGCCCTGTACACCAACGTTAGACAGGGTTTTGTGCCAGCCGACAGTCTG
+GTCGATGTAAGCACGCAGGCCGAGTGCACGCGCAGTGGCGTAAGCCGTTGCGGTGGTATT
+TTTGACGGTGTCCCATGCGAGGAAATCAGGCCAGATAACCATCAGCTCGCGCTGGCTGAA
+ATTTTTACGATATTCCATCGCTTCGGAAATAGTCTTACATCCCCACGCGCTGAGGTAAGC
+AAATGCACGTAACTTAATGGCAGCCGACGCAAGCGCAACCGCGACCTCTTTAGTATCCAG
+CCCCGGCACCCCAAGAATACGTGGCTTGACGCCGGTGACGGCCTGAGCGGTCAGGAGAGC
+CTTGATACCGGTGTATTTACCGTTCTCATCCGTACCTCCGATAATGTTGGAAACAGTCTG
+TGCGAGCGCAGCTTCCTCGTCATCGCCGGTTCCATCCTCAACACGCACAACAACAGTGAC
+GGGTTTTGACTGGTCTGCGATGGCCTGCAGTGATGCAGCCAGCGTGCCTTTTTTACCGGC
+TTTCGCAATGGCACTTTGCACATTGGTAATCAGTACCGGTTCATTGAGGGGAAATAGCGT
+GGCATCTGCATCGCTGGCTGTACAAACCATGCCGACGACCGCAGTCGCTACTGTGGAAAT
+AACACGCGTACCGTCATTAACTTCGATGACCTGCGTGCCGTGGTGAAAATCACTCATCCG
+GTTAACTCCGTGGTTAAGGGGTGAGTATATTTTCAGGTCAGTACACAAGAGGGGGCTATT
+TGTACCGGCTGTCAGGTTGATGGCACAACGACAGGAAAAAGAAAAGGCGGGTAATAAACC
+CACCTGAATATTTAGCGTGGTATATCCGGCCAGTCAGGCGCAGATGTATCCACCCTGTTT
+ACCATTACGCTGTAGAGCTCCCATGCTTCCAGCCGTTTAAACTCTTCATCTGTGGCAATT
+TTTAGTTTTACTGCCCGCGCCAGCGGTGCAATGGCTGATTCAGCCTCAGCAAGGCGGCGA
+ACTTTTTCAGCCTCCGCCTTTTTACGCAGCTCTTCCGGCGAATAAACCCGTTGAACGACT
+TTACCGTCTTTAAACTGCCAGCCGCCTGAAATATCAGCGCGACGGTTTTCATCCGTATCA
+GGTAGCTCCGCCACGCTCTGGCCTGCAGGCCATAAACCGGAAATATCGCGCGTGATACAC
+GTAATAACATCGTTATCGTCGTAGGTAATTTTCAGTGTGTCTTCTGAAAATAATTGCTGG
+CATGCATACCAGTCCTGACCATCCTCTGATTGTAGATGCGCCGCACCGGCGAATAATGTG
+TCGTCTGGTTCCGGTGTATACGGAATGAAATTTTTAATATTTAAAAACTGCTTGTTCTTT
+TTATTTTTTGCCGCTGTCATAATTATTCCTTCTTATACACTTGGGGCTGTCACCCACGTA
+TCACCAACCAGATACTGAATTGGACGGTAATAAACCTTGTCATCACCACCTTCCATTTCC
+CAGCTACCGTCAGTATGGAACCCCGTCACCACCTGTCCGCCGCCAAGCTGAAAATCACGC
+CACAGACCGCCAGAAAGCGCCACGGGGCCAAGTCTGACCGCTTTTACTACATTGTTGTGA
+ATCCATGTACTTAACCAGCCATTTCCCCATAACGAACCAAAGATATCACCGTTATTCTGA
+TAAATAGCGCCACCTATATTTAACGCGTTACAGTAGACGATACCGTTAACAGTAAATGAA
+ATACTTCCGTCCGTATTTCGTTGACTGTATAAATGCCATCCCTGTTCATCGCTCAGCTCA
+ATGACTGTTGGACGTTCTCCACCTCCCCACAGACTTAAACCAGCATTCAGTGCAGAATTG
+TTACCACTCGATAACGTCAGTGTTTTTCCGTTGCCGGTGCGCACGACACCAGTAGCGCGA
+ATATCTGCCAGCATGTGCAGCCCGGAATTGTCGATATAACCGACCTGGGCACTATTGGCA
+TAAATACCCAGAACGCCGTCACTGTGCCACTTAAACCCTGTATCGTTATCGCCGAATACA
+ATCGAATTACCGCCCAGTGCATTGTCAGTACCAATACCCAGTGGGCCGTTAAGCCGCCCC
+CCGGTAATCGGCAATGCACCCACATCACTGGCTGAAGGTTTATTTACGGTGTTGTAGTCA
+ATAACCCACTGGCGGCTGGTATTCGGTTCCGTTCCCCAGTCCTGGCGCTTTGCGTTCGCG
+CCCATATGCGCGTAATAGTGCTGAAACCAGACTTCACCGATTTTCTCAACAAACAGATAT
+CCATAGCTGTACAGCTTGCTGCCATCCGGATAGGTCGGAAAATCAGCGACCGTATCAGAA
+TTCGACACCGCCACCCGCCACCATCCTGGAGTATTAGCTGATGCCATCGTGCCGTTATCG
+GTAATCTGTCCAATGGCATCGGCGGAAATAGCCTTCACATCTGACGCCCACAGGGTGATA
+TCCCCGGATAATGGATGCCCATTGACCTTACGGTCTGACGGGACGCGTCCGTTCGCATTA
+TCCATAGCCGCTTTAACCGCTTTCGGCGTTGCGGCCAGCGTCTCAGACGTGCTGTCAGTG
+GCATTGCTGAGCTGGATAATCCCTTTACGTGCTGTAGTGGCGTCCTGAGCTGTATATTTC
+GCGTTAGCAAGGTCATATGCCACCTTGACCGCTTTCGGTGTCGCGGCAAGCGTCTCAGAC
+ACACTGTTAGTGGCATTGCTGAGTTGCACAATGCCTTTACGCGTTGTGGTGGCGTCCTGA
+GCTGTATATTTCGCATTAGCAAGGTCATACGCTGTCTTGACAGCTTTCGGCGTCGCTGCG
+AGCGTTTCAGACTCGCTGTCTGTCGCGTTACTGAGCTGAGTAAACCCTTTTTCTTTAAGA
+GTGGCATCAGGATGACGACGGGATTTTTCATGTTCGGCGAGCCTGTCGTCGACATAATCC
+TGCGTCGCCATCACCATCGTTGAGTCAATGGAAAGCTCCACAGACTCGACACTGCTGACA
+ATGATGACCATGCGGCATGTCTGCGCACGCCCTGAGCCCTCGGCCAGTTCTGGCTTGTAG
+CTTTCGGCCATATTGGCGACAGCAATCAGCGTCCCTTCATCGTCATAAAGGCCAAGCTCA
+CGCATCCAGAAGCCGCCCACCTCCGGCGGAATAACCAGCTCGGCCACAATGTAATTACTG
+TACCGGTTGTCCTGGCTGATTTTATTCAGAGTGTGACGCCAGACCTCATTAACAAGCTGC
+GTCTGACCGGCATCAGGCACCGGCAGTTTTCCACCGCCGTCACCAACAGCCATAACGTTA
+AGATTTATTTTCTTACCGCCCGGCATGGTGGCCGCAGCAAGCTTAGCGGCTCCGGCAGTG
+GTGATAACGGTTTTAAATTTCGTGCTCATTATTCCTCACTTATCCCGGGTAAACCGTAAT
+AATATCGCCATCGCAGGACACGCCGCCGGTATACAAATAACCGGGAATGTCCCGGACAAT
+ATTCAGGCCAGTCAGATGACGACTGGCTGGTTTTGCATCCGCAATCAGTCGTTCCATTTC
+GAAATACATTTCCTCGGTAATGCCACTTTCAAGCACCCCGATATCAAGCCGGAATGTGCC
+GGGCGGGTCGCTGCTTTCCCACCATTCCGTTACATTGATGACATAGCCGAGAGGCTCCAC
+TACCCGACGGATTGCGCCGATAGTCCCCTTGTGGCAGTGAATGAAATATGCATCATGGAT
+AACGGCACGTTTTGTTCCCTCCGGCCAGTTCTCATCCCACCGGTCGACAGAAAATGCCCA
+CGCCAGCCACGGCAGCAAATTTTCCGGACAGGTGTCAGGGTTCCACAACGAGCGGATGTT
+GACCGGCGTTCTTTCAATCTCAGCACATGCCCTTGCGGCGGCAACCTCCAGTGGCGATGA
+GCCTACCGGCAGCAATCGTGAGTCATTCATCAGAGCCCCCGATTACAAGGCTGTAGTCAG
+TGCAAAAGGACGCCTGTGTGTTATCGAGAACAATATCCGCGACCGGTGCCGCCAGCTCCA
+CCCGCTGAACACCCTCAACATGCAGGGCGGCATAAATCGCTGATTTACGGATATCGCGCC
+CGAGGCGGTGCTGCGCGCTGATATAGGCTTTCAGCTTTGCCTCAGCCGCCGCCCTGATGG
+GTTCACTTTCCGGGCCGGGATAAAGATAAAGCGTGGCGTTAATCTGGTAGTTAACAATTT
+CGGCTGACTGTACCGTCACCCGGTCAGCGACCGGCCTGACATCTTCTGCGTTCAGGGCAT
+TGCGCACAATTGCAAGCAGTTCCTCAGATGCGACGCCGTTGTTTTCACGAGACAGCACGG
+AAATCGTCACACAGGCTGGCGACGGGCTGATAACTGAAATATCGCCGACGCGCCCGTCAG
+CACTACGGCCGTGATACTGGTACGATCCGACAGACCCCGCCACGCTCAGTCCCTCAAAAG
+CCTGCTGTATACGCAGACGATAATCGGCGTCGAGTTCCATTTCTGCCGGAGTGGGTGGAA
+TGGTGGTGTCATCAGCAGGCGTGACGACAAGGCGCTCAACACTGAAATTCGCCCCGATAT
+TATCGAGGTCACTTTCTATGGCATAAGCCAGCATCACTGCGCGTGCAGCTTCATTGACAC
+GCTGACGCCAGATAACCTCGCGGTAGGCGTTTTCCTGCAGCAATTTAACAATTGGCTCAG
+ACTCAAGTGCGAGCGTCCGGGCGACGGCTTCCTGCTGGTTTTCCGGATAGAGCGAAATCA
+GCGTTGCAATGCGCTCCGCAAGGATAGTTTCATAGTCCAGTTCCTCGACCACATCAGGAA
+CAGGTAGCAGACTCAGGTCAACAGTTGCCATAGTGGTTTAACTCAGTGAAACAGTGGTTG
+AAACTGACGCACCGGTATCGGTACGCATCCCGGTAATATCGACATACATTTCGCCAGTGT
+CGCCACGCTCAAAGCTGATTGAGGTAAGCCTGATGCGTGGTTCCCATTTCTGGATCGCGG
+AATAGCACGCCACCATGATTTGCAGCCTGAGCGCCGGGTTTTGCGGCATATCAATCAGCG
+CAGACAGGAGCGAGCCATATTCACGACGCATTACCCGCGAGCCGACCGGCGTCAGCAGAA
+TGTCGCGCATGCTCTGGCTGATATGCTCACTGTCACTGATAGCGAGGCCGGTATTGCGGT
+TCATCCCCAGATAACGCGCCGTCATCTGGTGCCCTCCGTCCAGCTCCCGCCCCGTTGCAC
+GCCGCCGTGACCGTGGTCATCGACCTGTACGCCGTTTGATTTCAACGTGCCACCGGTATG
+TTCGATGTTTCCCCGCATGGTGCCGCCTTTCTGCACCTCAAGCGTCGCCGTCGTCAGTTT
+GTTGGTGCATACCACCTCCGGGGTGTCGAGGGTGATACGTTCTGCCGCTTTTACCAGTAC
+CACCGGCACGGTGGCGGTAATGGACTCCGATGCCGTCACATCGGCAGTCTTGATGCCGCT
+GACCGTCAGTGCACCGGTTTCCGGCTCATACTCCATAACAGCGCCGTCGGGGAACACCAC
+ATGCCACGCATCCGCCGAGGCTGACGGGGCAGGGTTATCGTCGGAGAAAATCCCCGGCAG
+CACGAAAGCAGTATCAAGCTCGCCACCAATTGCCAGCAGCAGCACCTGCTCACCGACCGA
+GGGAGCCCACCATGTCCGCGAACGACCGGCGCGGGTGGTCAGCCAGTTCAGCCATGCAGT
+CTGGATCCCGCCGCTTTGTACGCGGCACAGCCCCTGCGCGGTATCGACCTCAGTCACCAC
+ACCTGAGCGGATGAGGTTGCGAATCGCGCGCGTGAGCTCCTGTATTGTGGATAACGTATT
+CATAGTGCAAGGATGCCTCTGGTCTGGAGTCGCGCCAATTCGCGCGGCTCCGGTGGTGGT
+TCACACAATATTTATTTACCGAGATGCCTGATAATGATGTCTTCAATCATCTGCTCATCG
+TCGCGGGTGAAACCGAGCAACGGGCGCGCCGCGTACTGCACATCCCGGCTGTGACGATTT
+GGCCGGTCTTTTAGACCATACTGATGCACCCGCGCCATGCGCTGTACCCTGCCGGTAAAT
+TCCACCACCGCCGCACTGTCGCTGCCTTTGGCTTTCATAAAGCGGTTAGTGCGCAGTCTG
+GCGAACATTTCGCGCCTGATACGGCCTTTCTTACTTCGTACCGGCTGGCGCTTTCGGGCG
+GCATACGGGGTGCCGTCGGGTGCCTGCTGTCGCCTGATGCGCTGCTGCTGACTGGCGCGC
+AGTTTTTTTGCAATGTCAGCCGCCATTTGCCGACGCGCCGCCGGTGACAGGCTGGCAATC
+AGACCGGTAAGGCGCTCCTGCAGCGCGGTTAACTCACTCATCCCACTTACTCACCAGCTC
+GCCGTTAACGTACAGCTCGACCGGGCGCGTCACTGGCTCAGGCAGCGGTGGCTCAGGGGC
+ATAGCTGACATGCAGTGCGCCGTCGACCTCTTTGACGAGCGTGCGCTCGGTGAGTCTCAG
+GCTGATACTGATATCGAGCGAGTCGTCGTTATTGATATCAATCACCCATGTGAATCCTTT
+CTCCCGCCCGTCGTCGGTGGTCATAATGTCCGGCTGATGCTCACGCAGCCATGCCTGTAC
+CGGCACAAATATCAAATCGAGGTCGCCGGTAAAGTCAGTCACCACCACGTTAAGCACGTA
+CACCTTTTCAAACGACAGCGAGCTCTCCAGTCGGGAATCCGTATGCCCGTTATCAGCGAA
+CAGGCGCAGCATATCGGGGTTGTTTCGGAGCTGCGGCACGGCGTTAATCAGCGCCTTGCG
+CAGGCTTTTGTGCTTCTGCATCGAGTTCATCCTGACAGTGTTTGACGGTTTTGACCTGTA
+GCGCGCAGGCGGTCAGCGCGCCCTCAAGGCGGCGGATATCAGCGCTCAGGTCACCATTAG
+TTTTCGGATCACTTCCCGGCATCGGGCAAAGGCTCACCCTCGGGCATCCGCTGACCACAA
+TCACCGGCGCTGGCGCAGGCGGCGCGGGTGTGCAGCCTGCGCACAGCATCAGGCAGAGGA
+GCGTTATACCAGCGGCGAAAGGCTTCATTTTCATCAAGTAACCTCGTTATCGTCTGCTCG
+CGGCGGTTTGCTTCTGCGCCTGCCTTTGCGAGCTGTTCGCGCAGTGCCACCTGCGCGGAT
+TCATTACGTCGGGCGAGCTGGCCGGCGACACTGAGCTGATTTTTCAGCATGCCAATCGTC
+GCCTTTTGCTCGCTCGCAACGCGGTTTGCCGTCTCAAAGGAACGGGATAAATTGCCATTC
+TCATGGCGCAACCACATCAGACCGAGCACGGCCAGCACAAACAGCGTTATCAGGACTTTC
+ATGCCACCACCCCGCCAGCCGTGCGCCAGACGGTAACCAGCTTTTCGAGACTGTGCTCGC
+GCTGGCCGTAACCGGCACCCGGCAATGACGCCCAGATATTCCGGCAACGGGAAACAGCAC
+GCTCAATACGCCCCGCCCGGATATCGTCAATAGCACCGCGCTCCCGGATTAACTGGATCG
+CGAGCTTGTCCTGCGACAGTGGGCTGAAATCAGGCAATGCGAGCTGTTTTTTATAGTGCG
+GCCAGAACATATAAAGCTGCTGGTAACGCCCCGATGCCGTGGATTTCTCGCCACGGCGAT
+TAAACACTTTCGCGGGTCGGCCATGTGCGAAAGGGTGGTCGCTGTAATCGGTGAAAATCT
+CTGGCCTGCCATCAAGGCCGGTAACAATGACGTCGTAGCCACGGTTTTTCGTCAGCGGAT
+GGTTCGCCGTTCCTTCGGAATACGCCAGCATGTCCAGAAAGGCGGCGATATTCTGGTGAG
+TATTAATGACCGGCATCGCCTTCCCCCTTCTGTGACTTAAAGCGGCGCTGAATGGCGATT
+TCCACCACCTGATAACCGGCAATACCGAGCATGGATCCAATACCGCACACAGCGGGCAGT
+GACATATCAGGAAACTGCACCAGAACAACACCGGCGACCATTGAGACAAAACCGCCGAGC
+AACATGCGCCCGATAAACAAACGCGGGGTGATGGGTTCACCGCCTGCCAGCACTTTTCCG
+ACCACAATCAGTGCCCCAATCACAAACAGTGACAGGACGCCTTTTTCCCCTTCTGTCATG
+GTTTACTCCCAAAGATTGATAGTTTCAGTTACGGGTGAAGACGGCACATCGGGCAGGTCA
+ATTGCCGTGCCATTCGGCAGAATGACGCCCAGCTCAGACAGGCCTGGATTAGCCTGCAGC
+ACCGTTTCAACCACGCCCTCAGTGCGCCCGTAATACCTGGCGCAAATCACGTCGAGGGTG
+TCGCCCTGCATCGACCTGACCTTCATCAGAGTTGGCCCACGATGCAGCGCGGTTTGTCCT
+GCAGACGCGCGACCGACCAGCGCATATCCCGCCACAGGTCATCAATGGTGGTTTCGACGC
+TGTCGGCTTTTTTGTCACCCTTGCCGGTGGCTTCAACACCGCGATAGCGCTCATACAGGG
+TGGCGGTTGCCATCGCCGTTACGGCGCTCAGATAGTGGAAAATACGCACATTCTCGCCAT
+CGATTTCCTCAGCAGGCACGTCGGCCAGATGCTTAAACCCGGCGGCAGTCTGGCGCAGCC
+GGTAGTCGTAAAGCTCCGCATTGGTTTCCGCCATGCCAGTTCTGATGGCATGGCGCAGGC
+GCGCATCGGAAACCGTCTGCTCAAGCCGCATCAGCTCGCGCACACGCTTCGGATCCACAT
+CAGGGAAAAAGAACGTGTTTTTAATTACTGCATCGCCCGTCTCCGGTACGGGAATCACCA
+CGCCCGGTACGTCCTGTGGTTCGTCGGGCTGGTTCAGAATCACTGTCGTCATGACAACCT
+CATCAGGTTGGGCGGTGGACGCCGGTCGCTGTCAGGGTCAAAACCCGCTTTGACCGGCGT
+GCCGCCCGGCTCGGGGAGCGTTCAGTTAACCGGCGGTTTTTACCGCCTTTGGTGGACGCC
+CGCGCTTTGCTGCCGGTTTGGCGACAGGTTTGCGCGTGCGCGGTTTAGTCGTTTTACGGG
+GTGGTGCCTCCGCTTTTGGCTTCAGTGCGCGTTCCAGCCGCTCAATCTCTTTGCGCACAC
+CGGCATTGCGGTCGAGCTGCATCGCACGTTGAAACTGAGCCAGTGCCTCAGCATTCTGAC
+CGATATCGCGCAGGGTCAGGCCGGTCACCTTATGCAGACGGGCGCGCACCATATCGGGAA
+CGTCAGCGCCGTCGGTCAGGCTGAGGGTGGTCAGCAGTAATGCGAGGTCGACAGGCTCAC
+CGGCATCGCGCAGGCGCAGTGCGGCAAGCGCCACCTCCTCAACCAGCATGTAAGGCGTCG
+TGCGGCGATGGTCAGTGGTGAGGCCGTATTTCAGCGCATAGGGCGCAATTTCCAGCGCGC
+CAGCGATATCACCGGCATCAAGACGCCACAGCATGACGGTCATGACAATGTCATCCTGCG
+CACCGCGACCATCAGCCAGCACACCGGCGACCCACGGCGCATAGAACGGCAGCAGCTCGC
+GCTTTTTCTCGGCTTTACGTTCGTTTGAACGGATATTTTTTAACGTGCGGCGGTCATCGG
+CCAGCTTAACCAGCATCTGCTCATAGGCGGTTGCATGGCGCAGTGGGGCTTGCTCCCGCT
+GCGCGGCTTGAGAGGCCGAGACCCGCATCATGTGACGCTGTGCGGGGCTCGTCATGGTTT
+AGACTCCGCTTTCCGGTGCTGCAGGTGCGGTGAAATCGCCCAGGGTGATGTTTTCCAGCA
+GGCACCCGGCGGCATACGCCTCGACCACATAGTCGATATTCATCGACTCGTAGTTTTCCA
+CGCGGTCACGCTTGGGGTTTTCGATGACTGAACGCCGATGACCATCATCCATGAAGTAGA
+TTGAGAGATTTTCCATCGTGGTCACCAGTACAGCATTCGCAGGGAAGTACGGCACGCGCA
+CGGCAGGCAGGTTGCCGATGCGTTTCTGGCTGATGATGGTATCCGCAGCGAGCGACTCGC
+TGTTTTCCTGCTGCTTGTTAACCAGCGGGAAATATTTATCGGCCAGCAGCTTACGGCCAA
+CGATGGCAACCAGTTTGGTTGAGTCCTGATAAACCTCATCAATCAGGGTACCTGTCGCAT
+CCATTACCAACGCGTCAAGATTCTCATAGTCGCCGTTTTTACCGACACGAATCACATCGG
+AAACGACTTGACCCTCATCGTCGGTGATTTTACTCATCACGCGCGCCGGTGCTTCGTTAC
+GGTACTTCTGCAGCCAGCCGACCGCTACATCCTGCAACATTGGATTAGTTTTGCGATTCG
+AGGTCGGCGCACGATGAGTACCGTTAAATCCGGCCATGATGAAATCCAGTGCCTGACGCT
+GGATAATCGCGTCACGGATGCGGCGCTGGAAGTCCTGAAAACGCGCCCACAGGTCGAGCG
+TCTTGTAGCGCAGGTGGAAGTCAAAGTTGACCTGGTTGCACTCGTACAAATTGGACTCAA
+GCGCGACAAAGTCAGCAGTTTCACGCTCATCGTCACCTGAGGTGTCGGTCGTGCTGGCAA
+TAGTGCCATCCACACCCACACCGATTTTTTCACCTTTCAGCTCATCAACCGGAAAAATGT
+TAATCATCTGCAGAAATGCGGATGACGCCTGCACGGTGTTCATCAGCGTTTGCGTGACGG
+ACGGCTCGACGGTGAATTTTTTGCTAACGTCATCAACGCTGATGCCGTTCAGTTTGGCGA
+GCTGGGTCAGATAGGCATTGAACTTAAAACGGGTTTCCTGACGCATAGTATTTCCTGTTT
+GAATTAATCGGTTAGTCACAGCATCGGGCGGAATTGCCGCCCGGTTCCAATCTGCGGTTT
+ATCAGCAGTCGGTCAGCAGCTCGTCGCCACCGCCGCCGCTGGCTTTCGTGCGTCGCGGCT
+GGCTGAAACTTTCGGTTTTGTCGAGGGTGGTTTTCAGGGCGGAAAATGCCTGGCTGGTTT
+CTTCAACCTTGCCGGTCAGTTCCTGTTTAAAGGTGGCTAGCGCGGTTTCCATATCGGAAA
+GACGCTTATCCTGCGCAGTGAGACTGGTCTGCACATGTTCGCTGACGGCGGTCACCGCCT
+CATGCACATCACTCATGCGCGCATCGTCGCTGACCTGCTTACGGCTGAAAATGGCTTTCA
+CCTTGTCGGCCAGGCTGTTAAGCACTGTGTCGGGAACATCTTCAAATTCCAGTTCGGCCA
+GCGTGGCGACTGAAAAGACATTTTCAGGACTGGCCTTAAAGCGCTGCAGCGGGTTGTGCT
+TCGCCTTACGGCAGAATTCGAGGTATTCAGTGCCGAGGCTCGCAGGGTCATCAGTGACCG
+CAAGGCCGACAAGATAGCATTTGCCGGTGTTACCAAAATTCGGCTGAATTTCCATAGAGG
+TATAGACCTTCTGCGCGGCTTTATTCATCGCGATAAGGTCATCGGTTGGGGTGATTCTGG
+CGAACAACGCCCATTTGCCATTCAGCGCAGAATCGTCGTCAATCTTTTCGGCTTTCAGCT
+CAACCACATCGCCATAACGTTTAAACATGCCGTCGGGCAAAAGGCCGCGAATGTGTTCAA
+GGTTAATACGGCAACCGTAGACGCGCGGGTCATAGGTTTCGGCCATTTCCTGAATATCGC
+TGGCGCTGATAATGCGCCCGTCGCAGGTATCACCCTCGACGCCGATGCGAAAGAATTTTG
+AGACTTTTTTTGCCATTGTCAGGAGTCCTGAGGTTGGGGTTACGGGTCAACGCCAGTTTC
+CAGTCTCAGGACTCGCCAGACCACCAATGACGACTGGATAACCTCCCACACAACAGCACC
+TTAGCGAATCACTGGCGGCCATTAAGTAGCCTTGCCCTGAATCCACTACGGCGAGGCATC
+AATGACCATTTCCACCGATACAACCTTATTGCATGACCCGCGACGACAGGCATCGCTGCT
+TTACTGGCAGGGCTTTTCCGTGCCACAGATTGCCGAAATGCTGCAGGTCAAGCGCCCGAC
+CGTGCAGAGTTGGAAACAGCGCGACGGCTGGGACGGCATCGCACCGATTTCCCGTGTCGA
+AAGCAGCCTTGAGGCGCGCCTGATTCAGCTCATCGCCAAGCCGCAAAAGTCAGGCGGCGA
+CTTCAAAGAGATTGACCTGCTCGGGCGGCAGATTGAGCGACTGGCGCGCGTCAACCGCTA
+CAACCAGACCGGCAACGAGGCCGACCTTAACCCCAACGTTGCCAACCGTAACAAGGGGGA
+GCGTAAGAGGCCGAAAAAGAACTTTTTCAGCGATGAGGCTGTCGCAAAGCTGGAAGAAAT
+TTTCTTCGACCAGTCTTTCGAATACCAGTTGCAGTGGTACCGGGCAGGACTGGCGCACCG
+TATTCGCGATATTCTCAAATCCCGCCAGATTGGCGCGACGTTCTACTTTTCCCGCGAGGC
+ACTGCTGCGCGCGCTCAAGACCGGCCATAACCAGATTTTTCTGTCGGCCAGTAAAACGCA
+GGCTTACGTGTTCCGGGAATACATCATCCAGTTTGCGCGACTGGTTGACGTCGACCTGAC
+CGGCGACCCGATTGTCATCGGCAACAACGGCGCAAAGCTGATTTTTCTCGGCACCAATTC
+CAACACCGCACAGAGCCATAACGGCGACCTGTATGTCGATGAAATATTCTGGATCCCGAA
+TTTTCAGAAGCTGCGCAAAGTCGCATCGGGCATGGCCTCGCAAAAGCATCTGCGCTCAAC
+TTACTTTTCGACACCTTCCACGCTGGCGCACGGCGCTTACCCCTTCTGGTCTGGCGAGCT
+GTTCAACAAGGGGCGCGCCAGTGCCGCTGACCGCATCGAAATCGACATCAGTCACAGCGC
+GCTCGCCGGTGGGCTTCTTTGCGCTGACGGACAGTGGCGGCAGATTGTCACTATTGAGGA
+CGCCCTTGCCGGTGGCTGCACCCTGTTCGACCTCGACCAGCTCAGACGCGAAAACAGTGA
+TGAGGACTTTAAAAACCTGTTTATGTGCGAGTTTGTCGACGATAAGGCATCGGTATTCCC
+GTTCGAGGAACTGCAGCGCTGCATGGTCGACGTGATGGAAACATGGGAGGACTTCGCCCC
+GTTCGCCGACCATCCATTCGGCTCGCGACCGGTCTGGATTGGCTACGACCCGTCCCACAC
+CGGCGACAGTGCCGGATGTGTCGTACTCGCGCCGCCGGTGGTTTCGGGTGGCAAGTTTCG
+CATGCTGGAGCGTCACCAGTGGAAAGGCATGGACTTTGCCGCGCAGGCAGAAGGCATCCG
+CAGGCTCACTGAGAAATACAACGTCGAATACATCGGCATTGACGCAACAGGCCTCGGTCT
+CGGCGTATTCCAGTTGGTGCGCTCATTCTACCCGGCGGCACGCGGTATCCGTTACACGCC
+AGAAATGAAAACCGCAATGGTGCTCAAGGCGAAAGACACGATTCGCCGTGGCTGTCTGGA
+GTACGACGCCGGAGCAACTGATGTCACACAGTCGTTTATGTCCATCCGCAAAACCATGAC
+CAGCAGCGGGCGCAGCGCCACCTATGAGGCCAGCCGCACCGAGGAAGCCAGTCACGCTGA
+TATCGCATGGGCCACCATGCATGCCCTGTTAAACGAACCGCTTTCTGCCGGTAGCGGCAT
+GCAGCCTAAATCTATTCTGGAGTTCAACTAATGGGTAAGCAAAAATCCCGTAAAGCCGCC
+GCGCAGAAAGCCCGCGCACCACAGCAACTGAAAGCCAGCGCACCGCAAAAAATGGAGGCA
+TTCACCTTCGGTGAGCCGGTGCCGGTGCTCGATAAGCGCGATATTCTGGATTACGTCGAG
+TGCATCAGTAACGGCAAATGGTACGAGCCGCCGGTCAGCTTCTCCGGGCTGGCAAAAAGC
+CTGCGCTCTGCAGTGCATCACAGCTCGCCGATTTACGTTAAACGCAATGTGCTCGCAAGT
+ACCTACATTCCGCATCCACTGCTGTCCCGTCAGGATTTCAGCCGCTTTGCGCTCGACTAT
+CTGGTATTCGGTAACGCCTTTCTTGAGCAGCGCCACAGCGTCACCGGCCAGTTAATCAAA
+CTGCTGACTTCACCGGCAAAATATACCCGGCGCGGGGTCGATGACTCGGTTTTCTGGTTT
+GTGGAAAACTTCACTCAACCGCATGAGTTCGCACCCGATACCGTGTTCCACCTGCTGGAG
+CCTGATATTAATCAGGAGATTTACGGCCTGCCTGAATATCTCAGCGCGCTTAATTCCGCC
+TGGCTGAATGAATCCGCGACGCTGTTCCGCCGCAAGTATTACCAGAACGGCGCGCACGCA
+GGTTACATCATGTATGTGACTGACCCGGCGCAAAGCGCGACTGACGTCGAATCGCTGCGC
+GATGCAATGCGTAACTCTAAAGGGCTCGGCAACTTTAAAAACCTGTTTTTCTACTCACCG
+AACGGGAAACCGGACGGCATAAAAATCGTGCCATTGAGCGAAGTCGCCACAAAGGATGAC
+TTTTTCAACATCAAGAAAGCCAGCGCCGCTGACCTGATGGATGCGCACCGCGTACCTTTC
+CAGCTCATGGGCGGCAAGCCTGAGAATATCGGCTCAATGGGTGATGTTGAGAAGGTGGCA
+AAGGTCTTTGTGCGTAACGAGTTATCACCCTTACAGGACAGATTCAGGGAGGTAAACGAC
+TGGCTCGGCATGGAGGTCATCAGGTTCAAAGAGTACACCCTCGACAACCCGGAATAACTT
+AGGTCAGCTTAATCTCTGCGCTCATCATTGAAGATACAATCTGCGAAAGCTATAGTGCAT
+CAGATATCAAAATAATGGATGCGGAGATTAATATTTTGGAAACTAATTTTGAAATAACCC
+TGGAAGGTTTCGCTACTGAAGAAGAAGCAAATAATATCGGTAGGTTCACGCTAGAAGCCA
+TCCGGGCTTTAAATAACAATCTCAACCTTGAAATCTCAAAATTAAAATGCATTGTTATTT
+CCTATAACTTTAGCGAAGCCCTTCAAAAGATAACATCCACTTACCAACACAAATCTCCTA
+GTTCATACACCAATAGCAAACAGGGTGCAGCCGTCGGACAATTAGTATCAAAAATTGGCA
+ATGATGGGCTATGTGAAGAATATACCCTTGTACTATCTATTGAATTTTTTGCTGAGCTTT
+TCAATGATGGAAGCTTCTTAAAATTGAACGAAGAAGGATACCGCGCAGTCATCCATCGTA
+TTCACCATGAATTAGTGCACGTACATGAAAAAAACTTACTAACATGCTTAGCCCAAAACT
+TTACGGTCAACGAGTATGGCAGCGCGCTTCTTATCTCAGCCACGCGTGCATGGTCTGAAT
+ATCTCGCTAATTACATGTCTTCAGGGTCAGCCCCTCAAGAGACTATCGATTTATTTCTAG
+AGAATCTTGATACCGTTGTAAATGAAGTATCTGACGAGATTGGAAAACTCATCTGGGACT
+ATAAACGCTATAATACGCCTCTGAGTGAAATGTATCTCGAAGTAAAAAAACGCATCAGGC
+TTATCATCAACTCTTATGCTTATGCGATGGGTTATGTCCACTCTCTAAATATCAATATTA
+AAGAATACGATCCAAAGCTATCCCTTACACTATCCAACTCAAAGATAAGATATCAATTAT
+CAGAATTAGGCATTGCTTTTCAGAATCTTTATGGCAAGTTTAATGACCAGCACATTACAG
+GTTTTGATGATTATCGGGAAATAACAATAGTCATTAGTGAAATATTCAAGCAGTTTGGGC
+TTGTTTTAGAGTGTCCCGATTGGTCTAGTGACTGTGAACTCTACATACATGTAAATTAGT
+TTAATCATTGTAAAAACATTAGCAGTTTGAATCTCGCCATTCCTGTTAAGCCGCTGTCTC
+TAGGCGGCTTTTCCATGCACACCACCGTCACGCCTCAGACGCGCCACACGCGCACAACCA
+CCCCCGACCACCAACGAACCGACAGCGACCACGAAAGCGCCATCACGACGCGCTCAGACG
+ATAATTTTTAATATTACGCACCACCGCTGGCGCGCAATGCTTTCCCCGCCACGCCTGCCC
+GCTTTATGGGTCGGTTTTAATGCAGGTGCATGACCACTCTGGAACCGCGCCAGCTCTGAC
+AGAATACGCTCAGAACTGGCACGACTGGGGCATGCAAAAAAATGCACCTAAGGCATGCAT
+CATTTACTTGCGTACTCTTTACTCATTTTTTTCGCTGTTAATTTTCGCAAAAATACCTTC
+TTGAATGAATCCAATAGATGACATCTTGTCATGCTTACCAACAAGAAAGTCTTCAAATTC
+CTGAAAGTGCCCTAGAATACACTCTTGAATTTTGTCAAATACAGGTGTGAATTCATTTGA
+GTTGATGAGAGAGGTGATTTTTGTTGCGAAACCTATGCTATCAACACCAAATGTATATGA
+GTCATCATCATTTTTTCTGAATTTGAAATCTATTTGGAAAGGCGACTGTGGGTAAGTATT
+AGAGTCTTTATAGACGGTCAATATAAATCCTAAATGCCAGAACCCATCATCCCCCAAATG
+AGTAGCTCCAGTGGGAGTATATTTCGTATTTGGTTTTTCATCTTTATCTAACGGGATTAT
+TTTATATGCTTTTTCATTATCAATCCCAAGATAATCTAAATAATTTTTAATCACGTGACC
+AGAAAAGTTATACGCATCAAATCGAGTATCAGAAAGTTTGTTCCGAAACTCGGTATATGC
+ACTGCACAGCTCTGTAAACTTTGACATAATCTATCCTCTTTCGATTGTAAGTATCTAACG
+CCTCGCAGGGCTCGTTGTTCAACCCTGCCAGTACTGAAAGCGAGTTTCAGCACCGGCAGC
+GTTCGTCACTATATTGTTTAATTGTCGAGTATCGAATCGACCTCACCCGTTCGCACGTTG
+ACGCGTGCCGCTACGGTTTGTTTGACCACACCACCATAAGCATTAGTACCGCGAAACGTT
+GTTTTTACAACGGCATGCGGGTCTTTATTCAAAATCAGATGGTAGACCGTTGAAACATGT
+TTATAAGAAGAATCATCATTCATGCTGGCTTTTATCAGCTTCTCTAACGGGCGATAAGAG
+CCATCCCAACCGCTAAAATTACCCTGAAATGCGTCAAGATTGATTTTATTATTCAGGGAT
+TGTGGATCCTTCTCGAAGTCGTTGAAACACCACCCCAACACATCACCGAGCTTTAACGCA
+TCATCTTTCGTAAAAGTGTACTCACTCATACAGGCATAAAAAGCATCAGCAGAGCTTACC
+GGTACACCTTTGAAGCCAACATAGCCTTTAACGATATCGTGCCGGGTTTCTTTTGGCTCA
+TTGCGATATTCTTTGAGAGTCTTATCTGCGTACTCAAACGTTGGCGTAGTCGGTTCCACT
+TTAACCTCCGGCACGTCAGTTTTTGCCACAGGCTGACTTTTTTCAGTCGGCCATAAGATT
+GAGCCAATAACACCCAGCGCCAGACAGCCACCGAGATAAACCGCACTGGAGCGCTTACGG
+TTCGGCATTCGAACCATCGACGGCTTGATTAACCCCACGATAAAAGCAATAAAGAGAGCC
+AGAGATAAAAATGCTATTACGGTATCCATGATTTTCCTTAGTGTGTAATCCCCATACAAA
+ACAACCCCATGCTATCAAACATGGGGTCGAGGGTTGCACATTTTTCAGGGATTAACGCCA
+GCTCTCATCTTCCCACACTTCCTGAAGGATGCTATCCAGCGCTTCGCGGTCTGAATCTTT
+ATCGAATCCCATCAGCTCGACACCGGTCATGGCTCCCTTTTTAACAGTAACGCGCGTTGA
+GGGGAAAACAGACTGTATTCGCCTGGTCAATTCGCATTGAAAAGCATCAATTACCGGCTG
+GCCGATTTTTTGGTCTTTATCCAACGTGATATTTACTTTCACCTTGCCCTCCTTTGCAAA
+GGTTGCATCAACAGGTGGCGCGGAAAAAACAACAGAAAAATTATTATTTTTCATTAGGTT
+GCCTCTTGCTATCTCCGCGATTAGATTCAATGCAATTTCACGATCTCTTTCCTTACAAGT
+ACCTTCAGCAGTCAGACGCGCAATCATTTCGACCCGCTCAATCATAACGTGCTCGTTTAG
+CTCTCTATCCACACAACCTCCATTACGAGATACTGTATATACATACAGTAACACGTAATA
+ACAAAAGGTGTGAAGAAAAAATCACAGTTAAACACACTGTATGTACATGATATGGATGAA
+TATTAACGGTTATATTTTCGTTGCGAGTTCAGCTAAAGCCGCAACACGATTGAGGATTAT
+CCTAGCCTTAGCCTGATACGATGGTGCTGAGGTAAATATTTCTCCCTTGGCCGTTCCTCT
+CAACCATTTACCGTTAAAGCAACTTTTACCACCGGCCATCAGGTGCAGGGCTTCGCCCCG
+GCTGATTGTGATGCCGGTAGTCAGATGTATCTCGTCGATAGTTTTCGCTATAGCTGCGTT
+TTGCTCATCCGTTCCGTGGATAAATTTTCGCCGTATTGCTGGCTTTTGCTTCCTGAGTCG
+GTTTGTCAGCTCTCGTTTTTCACGTCGACTTAGGGGTTTAGATAAATCGAGTTCCGGTGG
+ATCGCTTTCGCTTCCCGTACAGTTATTGACAGAACTCCGAGAGGGCGCAGGAGCGCCCTT
+AACGTCAACGGCCAAATCAACGGCACGCTTCGGCACAATTTTCCACTGCGTTAGCCGGGT
+TAAAATCGGAGTGCCAGCACCAATAGCGGAATCGTATACGCCACGAATGCAGACGGTTTC
+CTCACCATACTGATTAAACTCGGTGCGCGGTTCATACAGTGTGCGCACCTGCAAATCATC
+GCGACGGACAAACGGCCCACCCTGCGCATTAACGTAACCAGCCCAGTCACCGGCGTCAGC
+GGCATCATGGACGGCGGCAAACTCAACGCTCAGACCGTGCGCGACCTCGGTATCAGCGAG
+ACGACGCAATTCACGGTAGACCGTCACCGGCGCACCGCCGATAAACTGAAACTGACGGAT
+GTGCCAGCGCGCCGCCCATGCTGAAACGGCGGGCGCCGTCTCTTTTAGCAGCTCACCGCT
+TTCGTCATCGGTCTCGTCATCGAGAGCATAACCGTCGATGTTTTTAGAAATGTATTTCGC
+GACATAACCGGTAGCACTGCCTTTCTCCGGGTCGATAGCCTCAGCATGAAAGCGGGCTTT
+TTTAGCCTTATCACTTTTAAGTTCGTGGCGGTCTTCCTCCCATGCATAATCGCGGATGAT
+GAGGCGCACGCGCTCGACGTCTTCTGGCAACATGAACATAAGCATGTGCCAATGCGGCGT
+TCCGTCGTGATGAGGCTCGGCAACACGTATGCCGAAAATGCGAATTTCTTTCCGATGTAG
+CTTGGCACGAATGCGCGCCCAAAGGCCGGTTAGGTAGCTCTGCGTGTCCGACGGGCTGGC
+GCCGTTCCATTTGCTGTTACGGTATCCCCCTTTAGTCGTGGCATGATATTTAGACGGTGC
+GGTCAGAGTGTAAAACTCCCCGACGTATCCGAGTTCATTGCAGATATTTTCAAACCCACG
+GATGCGGGTCATCAGCTCGCAGCGGCGTATCGCAGGGTTAGCGACCGAGCCGTCAAATTT
+TTCAATCAGGCTGATACGGTTGCCGTCTTCGTCTTCGAGATCCAGACCTTTGAGAAATTC
+ACGAGTGCGGCGCTTTTGTTCACGCCAGTCAGTCACGCAGTTTTTACTCGCATAGGCATG
+CTTTTTCTTACTGACGTTACCGACAGTAATTTGCAGATGTTCGCGCCATGCAGCCGCAAT
+GCGACGAAGACGACCACGCCACCACACATCGTTAAACATGCGAGCGATGGCCGGGGCGAT
+TTCATCTTCTCCGACATATTTCTTTGTCACTCGCTCCCAATGCGGAGGGGTAACATTGAA
+TTGCAGAGAAATAAAACCGGCGCGCATGTACCAGGTGTACAGCGTTTTAAGCTCGCTAAA
+TCCGGTGTCATCAATGTCAGCCAGTTCAGCGCGAATGAAATTCGCGATATCAGCGGCCAA
+AAGGTCGATATCGGCGCGTGACATGTCCGGGAGTCGGTTATATCTGGCAACCATATTGAC
+CATGCGTGACGCCAGATATTGCATAAGTTCAGTATCAAAATGACTGCCAAAAACAGCGGC
+TGATACATTGCTGTTGATACCCGCGCACTCGTATTTTTTTGCGACCAGTTCAAGACGTGG
+CAATACCCTTTTGCAGAAACTTATTAAAAAGGCATTGGCTCGTTGACTGCCCTGATTTTT
+CTCCAGCACAGCAGCGGTGCGATAAACATCAAAACGCACGCATTCAGGCTGGAGAGAAAG
+CACCTTTCTCGCATGCAGCAAAGCCGCGAGCATACGGTCGCGGCGATATTGTTGGTCATA
+GGTAAGATATGGGCTGGCTATTGCCTGTTTTGGAAAATTCCATACAAAGGCATAATCAAT
+CTCACCCATAGCCTTTGCTGAGACAGGTGTGTCTATGACTTTATTCACTGAAGAAGATCC
+CACCCAACGCCGCTATGTTGATTCGATTACAGAGGTGACAGCTTTCGAAGCTACGAAAGA
+ACCAATGAAGATCATTTCCGCATCCGACATGCTGGGCATTTGCGATGCTTTTCTTTCTGA
+GACTCAATGCCACATAGCAGACCGGCTACCTCTTTCAATAGCTGGTCGGCATGAGCTAGG
+TCGGAAAATTGAGTGGAATTGTCCACATAGCTGGAAACCACGCGAAGAATGGTCAACACA
+TGTTCGGCACGCCTTACAAATTTTAAATCGACGTTATTTGGATACCCCAGTATCTCAACT
+GGATGACTGGCAGACCTGGGAAGAACTATCGACAGATATTCATGTGTCGGCTCGCTGTAC
+TCGGCGGACTGTTGAGTTTTATCGCTCTGGAAATCCCCAGCATTTACCGATGTCGACTGA
+GCTTTTTGCTGTTCCCGAAGTTTTTTCAAAATTTGTAGCTTCGATTCTTTCGGGTGATAT
+TCACCCTGTTTGGATGTGGCATGCTGACGCAGCCAAAACGCCGCGATGCCTCGATGGGCT
+TTATCCCAAATACGCGCCGCTTTCTTGAGCTGGCTTAGTGGTCTGGTAGTCATATCGCAC
+CCCGATAGTGTTTTAATTTAAGTTCGGCGATTTGCTGGCAGGTCACGCAAAAAGCCACGC
+CCGGAATCGCAGCGCGGCGAGCTTCCGGGATTGGTGCGTCACATTCTTCGCAAAGAAAAC
+GGGAAGGCGCAGCGATACGGCTGCGCGCGTTGCTGATGTGGCGCTCGCGGTCTTCCTGCT
+CGCGCTGTTGTGCTAAATCCATTGCGTCGGCCATTAGTGCAGCTCCTGTGATTCATTCTC
+AAAGCGGGTTGCTTCACGACGCAGCAGTTCGGCAGCTTCGGTGCCGCTCATACCCTCTTT
+GGTGATATGGATAGCCAGCGCCTCAAGGCGGATGGAAACAGCGAGCGCGCGGTCTTTACG
+CTCTTCTTTTTTTGCATCGATCAGCAATACGGCCAGCGCATCACTATCAGTGTTAAAACT
+ACGGATTTCGGTATTACGCATAATTGATTCTCCTGATTTCGGGCAATAAGAAGCCCGGCG
+GGTTTACGCCAGATAATTTCTTTTTTTTAATTAGCTATAACCAAATACGACGGCTGGTTT
+ACTTTTCAATTGGCTGATAATTTCAGCTTTCAGGCTATCTTTAAACTGCTTGCAGCACTC
+CCATTCCGGGTCAACTCGTAAAATTATCCCATCGCGGGTTTTAATTTCAAAACCGTCTTC
+CATGTTCGGAATCATGGCACCTAAAACAATCCTTAATTCATCGCGTGACATGTTTAACCC
+CTTTAATAATAAAGTGGACAATACGAATAATTAAAAAACCTGACGATTTCGGCGGCTTTG
+TTTTCAGCCCTTTTAATAATTCGGACTGTGAGTGGCTCGGGTGCCAGCGCTTGCCGTCCT
+TACCTGCGATCCAGCCGTGGCCGTAGTGCATGCCGGGGCTTTGTTTAACGAGCAGAGACG
+CGAATGACGGTTCACTTTTCAGCATACGCACCTCAAATCAGCCCGAAGGATGCGCCAATA
+CCGCTCATGGTATCGACCACGCTCGACATAGCGGGATTAGTCTGCAGACGCGCATGCAAC
+GCCAGCGCCGACAACGACAACATGCGAATGCCAGCATTAACGCTTTCAATCATGTTGTGC
+TTACGGGCAGAGGTCAGGCGCTCGTCAGAGGCTGCACCGCTCGCCAGCTCGCCGAGTTCA
+CTCATTGCACGCATGACATAAGACTGCAATTTGTCTTTAGCCAGCTCATTAACCGGCACG
+CATGGCAGGCAATGAATCTGCGCCAGAAAACCATCAACGAGGGTTGAATCTTCGGTCAGG
+TCAGTCAGCAGCCACAATTCAGGCGGCGTGAACTGGTGAGGCTGTTCCGGGTTGAGCTTG
+TTACGTAACGTCTGAACATTCATACCCGCACGCTCGGCAAGCTTCGCCATGTTGTGACGC
+TGCGCAAAAGCCCTGCACGCTTCGTCATAGTGGGGATGTTTGGAAATCTGAAAATCAAAC
+ATGTTGAGCCCTCAAAATTCACATAAAGTGAATTACGCACCAATAACGAGTTGAAAACGG
+GAATGGCCCAATGCCTTACGCATCTGTTCCTCTTTCCAGCGGGCATAGTAGATACGAACT
+TGACCGCCAGCACGTTTACAGCCCTTACGGATAACGCGAGGTTCGATAGGTAAACGCGGG
+TTATCTCCGGTTGTCCAGCGGCGCGCGGTGCGGTATGACACCCCCTCAAGTTCTGCAAAC
+TGTTGCAGGGTGACGATGGGGGCAGGCACTTTGATGATTGCGATTTCAGAAGCCATGTTG
+CATGATTCCCTATTTGCCAAAGATTGCAATTAAAGGGCCACCGTTTGCCAACATAGGGCC
+ATCAATTGCGTAGGTTTAGCCAAAATATACTTCCCAATTGAGAAGTAGTAAATAGGTTTT
+ATCGATATGAGAATAGATTCTTTAGGATGGAGCAACGTTGATGTACTGGATCGCATCTGC
+GAGGCTTACGGGTTTTCACAGAAAATTCAGCTAGCTAACCATTTCGATATTGCATCGAGC
+TCCCTCTCTAACAGATATACCCGAGGCGCTATTTCGTATGACTTTGCGGCACACTGCGCT
+CTTGAAACAGGGGCCAATCTGCAGTGGTTACTTACAGGAAAAGGGCAACCGTTCACATCT
+TCTGCGACAGCCGAGGACACAATGAGCATCGAGTTATTCACATTAAGTGAAGAAATACTC
+AAAAGTGATGGTTCTATAACAGTCGACGCTCATTTTTTCACAAAGCCGCTTACAGATGCG
+ATGGCTATACGAACGGAAGGAAAACTCCATTTCATTGATAAGCAGGCATCACTCTCTGAC
+GGCCTTTGGCTGGTCGACATAGAGGGTGGAATTAGTATTCGAGAGCTAACAAAACTCCCG
+GGTAGAAAATTGCACGTTACTGGTGGAAAGGTTCCTTTTGAGTGCGGTATTGATGACATA
+AAGACGCTGGGTAGAGTGGTAGGTGTGTACAGCGAGGTTAATTGATGACTGTCCGTAAAA
+ACCCCGCTGGAGGTTGGATTTGCGAACTTTATCCTAACGGGGCAAAAGGCAAGCGTATCA
+GAAAGAAATTCGCCACCAAAGGTGAAGCGCTGGCCTTTGAACAATACACCGTACAAAATC
+CGTGGCAGGAGGAAAAGGAAGACAGGCGAACGCTAAAAGAATTGGTCGACGCATGGTATA
+GCGCTCATGGTATTACCTTGAGAGACGGACTAAAACGCCAGCTAGCTATGCACCATGCCT
+TTGAGTGTATGGGCGAACCACTCGCACGCGATTTCGATGCACAGATGTTTTCCCGCTACC
+GGGAAAAGCGGCTAAAGGGTGAATATGCCCGTTCAAATAGGGTTAAAGAGGTTTCCCCTC
+GCACGCTTAATCTTGAACTCGCTTACTTCCGCGCGGTGTTCAATGAGTTAAATCGCCTCG
+GCGAATGGAAGGGTGAAAATCCTCTAAAAAATATGCGCCCTTTCCGCACAGAAGAAATGG
+AAATGGCCTGGTTAACTCACGACCAGATTGCGCAACTGCTCGGAGAGTGCAAACGCCATG
+ACCACCCTGATTTAGAAACAGTGGTGAGAATCTGTCTCGCCACTGGCGCTCGATGGTCAG
+AGGCTGAGAGCCTGAAAAAAAGCCAGCTCGCGAAATACAAAATCACGTACACCAACACAA
+AAGGCAGAAAAAACCGCACAGTTCCCATCAGTAAAGAGCTTTATGACTCCCTACCTGATG
+ACAAAAAAGGCCGACTGTTTAGTGATTGTTATGGGGCGTTCAGGTCTGCTCTGGAAAGGA
+CAGGCATCGAATTACCGGCCGGGCAACTTACCCACGTTTTACGGCATACCTTCGCCAGCC
+ATTTTATGATGAATGGTGGTAATATTCTGGTCTTGCAGCGCGTGCTTGGTCATACCGACA
+TAAAAATGACGATGCGATATGCGCACTTTGCCCCTGACCACTTAGAGGATGCCGTTAAAC
+TTAATCCACTGGCGATGAGTGGCGATAAAATGGCGGTAGAAATGGCTCAAACTGGCCCTT
+AGCTGGTCAAGAGTGGCCCTTTATGTCTATGATTTATAAAGCAACCTATTGATTTTCGGT
+TGTTCTGTTAGGAACTCATAATCGCTTGGTCGCTGGTTCAAGTCCAGCAGGGGCCACCAA
+ATAAAACAAGGGCTTACGCTAAAAACGTGAGTCCTTTTGTTATCTATGGAAAACCCCCAG
+CCTAGCTGGGGTTTTCCATAGACAAAAAAAGCCGGTCGTTTGACCGGCTACTTGTTGTTT
+TAGTTCTGTGACGCTTTCCCGTCAATACACTGATATTCGACGTAGACGTCCATTTGTCTG
+CATCCTATTGGGCTGGGATCCGTACATTGTGACGTCTGGCCTCCGAACGCCTCGGCGCCA
+TCATATCCCCACACCCTGCATTTTTGGGCGGCCAATGATTGGCCCTGATTCATATCTACG
+CTCGCTTTTTCAAACGCGCCGTAACTTTCGCCAACGTGATACCCCATCCTGATCGTTCCA
+TCGGCTTTACTTCCTCCGACGGGTGTCATTTGCTTATGAACAGTGCAACCAGAAAGTATT
+AAAAAACCAAAAAGACAAAATGCAATTTTTTTCAT
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_017033.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1731 @@
+>NC_017033.1|provirus_1052334_1094910
+TCAGCGCCGTCCCAAGCCCAGCCTGGCAGCCATGGAGCTGGCGGAGCGACGAGTGAATGA
+CGCCTGGGTTGAGGCATTGTCCCGGTTGCGATCCGTGGAGGTGTGGCCTGTTCCGCGGCG
+GCCCAGAGCGCAGATGGCCTGCCAGCCCGACGTGGCCACGATCCGGATCAGGGTCGAACG
+CGTATTGTATGAAAGTGTGTCCATGGTCCCGGCCTCTTGGTCTAGACGATCTCGACAATG
+CACCCTTGCGTACGGCAACGCGACAACTTGGCCGCTGTTGGCGGCTCGGTCTGATGGACT
+TCTGCTTGTGAAGCGACATCCCCGGACCGTGCGGGACAGGCTCGGGTCCCGTTTGACCAG
+GCCTGCAATCGTAGACTGCACTTGTTGATGTTAGCTGGGTGTTATGCGCAGGGGGCCAGT
+CCCGGCTTCGCATCGAAGAGACACATGGATGGCCGTCCCCATGCCAGGGCCGTCATGCCG
+ACATCGGGGGGCATCATCGGCTGGCCGGGCGCGGATCGACTGCAGCCACCCCATCCAGTC
+CGGGCATCGACGGTTTCTTGCCAGCGGGCGACACGCCATCTGGTGGCTCAACTACACAAA
+AAATCAGAAAAGACTCGACGCCCCGAACATATGCAGGCATACTACTTCGCTCCGCTGCCC
+GAGTGGTGGAATTGGTAGACGCAGAGGACTCAAAATCCTCCGCCGCAAGGCTTGTCGGTT
+CGAGTCCGACCTCGGGCACCAGCGGAAAATCAACAGGTTGCAAGTCTGGTCAAAAAGTGA
+CCATTTCCGCAATCAGGTGACTTTTCCGCAATTGCTACCGTGTGGGTGTGACTTTGTCCC
+CACGCCGGTTCCGGGTGTAGTGCTCCGTCATGGTGACCGAGCTGTGCCCCAACTGCTTCT
+GAGCTTGCCTGATATCGCCCGACGACTCTGCCTTGTCGGTGCCGGCTTTCGCTCGCAGAT
+CCCTGAATTGGAAGTTTTCGAATTTCACCCCGGCTTTGACCCTGGCGCGCTGAAAGGCAC
+CATTGAGCATCCGGTATGACATCGTGCCGCCTTTGGCTGTGGTGATCAGTTTCCGGGTAA
+TGGCCCCCATGCGCCGCTTTCGCTCCACCATTGCATTGATCAGCTCGGCGAGCTCGCCCA
+CGACTTCGATGCGCCGCTTGGCTCCGGTCTTGCCCTGGACGACTTGCAGCTGTCCATTGC
+GGATATCGTCCTCATCCATGCTCAAGGTATCGGCGACGCGCTGACCGGTGAGGTAGGCCA
+GATCCATGGCATCGCGCAGCGGCTGCTCGGCTGCCGTCCACACAGCCAGGAAGACCTCGT
+CCTCGATGTAGATGTCGCGGCCGGTTTCCCGATTGCCTCGCACGCCGGCGCATGGATTGG
+GGAGCTTGGTGTAGCCCATTTCCCGGGCCCAGTTCCAGATATGCGAAAGCAGGGCGCGTT
+CCCGATTGGCGCGGACCTTCGCCTTGCGCCACACGATGTACTGTTTGACGTGCTGCGGCT
+CGATGGCCTCAAGCGGGCAGGGCGGATCATCAAAATAGCTCATGAGCATTTTGACCTCCT
+TGAGATTGCCCCGCTGAGTTGTCGGCGACTTGGTCGGCAGCACCTCGGCGATATACCGAT
+CGGTGACATATCGCAGGGTGATGATCCCTGCCGGCCGCTCATGACCTTCGCGCTCGATTT
+CGGCCCAGCGCTTGATGGCCAGGCCATAGTCCGTACCGAGGGGCTCTTCCTTTCGTGGTT
+TGCCGCCGTGGTCGTAGTAGTAATAGGAGCGAGTCCCGCGCTTGCGGATCCGCAAGTGCG
+GGATAGCCCCGGGGTTGGATGGCCTTCGGCCCATGTCATGCCCTTGCTTTGTTGGAGGCC
+CAGCGTTTGGTAGGCTGCTGTGAGCTGGTTTCGCCCTCAATCGCGCTACGGGTAACGATC
+GGCCAGCCGCCGGCGTCCAAGTGGTGCCGGATGCCATTCGATACCAGCACACGGATCTGT
+TTCTTTCGTGTGTAGGCCCGCAGGTAAGCCGCGAGCTCGGTTTTGCTCAGAGCAATCTTT
+TCCGCCGCTCCCATCACGCTCCCTCACGATTTCGCGCCATGGCGCCGTCGATGGCAATGT
+CCATTGCCTTTCCAATGAGCATCGTTGCTCCTGATGCATCGTCATCCACTAGAAAAGGCG
+GCTCGATCATGCCGGCGGTAAATCCAGTTTCAGGGTCGGGAGACTCGATCGCTGCGAATC
+GTTCGGAATGGTCTCGAAGCCATCGGTAGCGCCGCGCATCCAGCATTGCCATTTCGAAAT
+CTGCTGTGTCGATGCCCTGCATATCAGTTCATCCTCCGAAGCATTAGTGCGGGCTCCGAT
+CCTTTTGCCTGCTCTACTCGCTTATCCATCCAGTCCGCCGTTGCCTCCTCTCCCGCGAGT
+GCTCGCATCGCCTCAATGACGCCGATCATGAGCAGATCCAGGTAGTCAGCTCTGGATTCC
+ATGTCAGGTAGCTCATCCATGAACCCAAGGGCGGCAATGACTTCTGCAGCGCTTTTGTCT
+TGATCAACCATAGTTCTGTTTCTCACATTCATTGCGTGCGGCCAGCCCTGCAGCTGCAGG
+CGGCATTGGCGTGGTGGTGTAGATGGCCCGGATCGTGCCGGCGGCGGCCGGGCGAGCATC
+GGGCGGGAGTTCCTGCAGGCCGGCCAGCATCTGGTCCAGCGATACCCCGGCGGCGCGGGC
+CTGCTCTGCGGTGGATGCGACTTGGGCGAGTGAGCTGCACCAGGTAGAAGTTGCCGGTGC
+CGGCTGCGATGCCAGCGTGGCGGCGAAGAGCAGGGCGGGGATCACTGAGTTCCCTGGATC
+TGTAAGCTAGGCCGACCGATCGGGCGAGCGGAGGTCGCATCAATGGCCGCCGGCAACTGA
+CCCACTTCGTCGGCGAGGCGGATAGCGTCGATCTCGACCTTCACTGCGTTGATGTAGGTC
+CCAGCGACCAATGCCGTGGCTTTGGCCCGCTCGATGACCTCGGGGTTCGACTCCGGATCA
+CCCAAGGATTCCAGCATTGCAACCAGGTGATCTCGCACATCGGACATCTTGTTCTTCATG
+ACTGCTGCCTTTTGTTGATCTTGCGTTGTAGGGCACCCTTGAGCTGGATGAGCTGGGCGA
+CTTCCTTGGGATATCGGGTGTGGTAGCTGTTCCGGCGCATCAGTTCGGCTCGGCTAAGCA
+GCTCGAGTCGGTCGGCCGTGATAAGTGAGGCCTCAACGGTTGCGCAGCCTGGCTTGAACA
+CCACGGCGTGACCCGGCGGAATGGGGCCATGGACTGCCTCCCAGACGAGGCGGTGTACAG
+CGACCCACCGTCTGGCCGGGTAAAGCGAGGGATCGTCGGTGACCTTGCGTTCAAGGTAGC
+CATCCCTGCAGATTCGCTCGCTACCAATTGGCCGGTAGTTGTGCTGAGCAGCGCCGGCCA
+TCTTTCCAGCCTTGAATTGAGTTTCAGCCATTCGACCCGGGGCCCAGCCTGGAGGATGCT
+TCTTGCCTTTGTTGGCAGGAGTTTGGCCAGGCTTGAATTGGGTGGCGATCATGCGCGGAT
+TTGTCCGTCCTCGAGCGATGCGGCCGGAGACATCGCTGGCCATGAAGGCCTCGCTTTTCC
+TGACGCCGAGTGTGGCGGCCCGCCCGTAGATTGCCGGCTTGGACCTGCCCATGCGGCGGG
+ATAGATCTGCGCAGGTGATGTCGGGGAAGAACTCACGAACCATGGCGTCTTCTGCCTTTG
+TCCAGGGTCGACGGCTCATGCCAATGCCCTCCGGCCAATATCAGTCAGGTCATACCTGCC
+CTTGCCGGCGTGGCGTAGCAGGCCTGTACGAGCGAGGCGGCGGAGCTTTCCGGGCGGTAG
+CGCGACGGCACCGGAGGCGAACAGCTGGATCTCGCCGCGCTCGGCCGGCAGGACCAGCTC
+GGGGTTGATCGGATCGGCCGGCGCGGCCGGGATCTCAGCAGCGGTATTGCCGGGCATGCT
+TCCGTAGCCTATTTTCGCCAGCCCCTGTTCGGCCTTGCGGACCATGTCCTGGGCCGATTC
+GCTCTCGCGCCAGTTGGGGTAATCCTCGAGCCAGTGATCGAGGAACGTTTCTGCCGGGGA
+GGCCATAACGGTGGTTCCTGTGTAGCCGCCAGCTATCGAGCGGCGATGTGGGTGGTCAGC
+ATTTCATTGAGTGCTGGAGGGATATCGGGGAAGTGCAGCCAGGGCTGCTTGAATTGCGGG
+GCCCAACTGCATTCGCCTGCTGCGTCTCCGACGCAATTCCTTCGACACCAGGCGTTAGGC
+TTGCCATTGAGGACCTTGACCCGGACGCGGTGGAGCCGTGAGTCAAACCAACCATCAAGT
+GGCTGGAACATGTCGATGGTCGGCACAGAGTTATCGATGGCCATCTGCAGGCCTCCGTTG
+GCTAGAAGGGGATATCGTCGTCATCGAAGGGCGGGGCGCCCTGATCCGGCGGAGGCTCGT
+GTTGCTGGGCATGGCCGCGCTGGTTGGCCTGCTGGCCACGACCGCGGGAATTGCCGGGCT
+GCTGCCGGTTGCCGCTGGATCCACCATCGCCACTCAGCATCTGCATATCGGTGGCGATCA
+CTTCCGTGGTGAAGCGCTTGATGCCTTCCTTGTCGGTGTATTCCTTGGTGCGCAGCGAGC
+CTTCGATGTAGACCTGCCGGCCCTTGCGGAGATACTCCTGGGCAATCTCGCCCAGCTTTC
+CGAATAGCACGACGCGGTGCCATTCGGTGCGCTCCTGCCGCTGGCCGGACTGCTTGTCGT
+TCCAGGTCTCGGCTGTGGCGACGCGGAGCTGGCAGACGGCTGTGCCGCCGCCGGTGTATC
+GCAGCTCCGGATCGCCACCGAGGTTGCCGACCAGGATGACCTTGTTGATGCCGCGGGCCA
+TCAGTGGGCAGGCGCCGGGGAGGTGGCAGTCGAGCGCATTTTTGCGGCGTGGAAGTCCAA
+AATCACCGAGAGCCACAGCCGGATAGCGTTGGGTGTAAATCCAGCCCGGATCAAGGCCTG
+ATCAGCTGCGCTTGAGGCTTGCGGATCTTCCGAAGCGCTGCACATCGCGAGGCCCCCAAC
+CATGGCCATCAACTGGCCTTTGATGGACATGACTTCAGCAACAAACTCAGCCTCACCAGA
+GGCTTCGGCGCGTTTAGCTATCGAATCGACAAGGTCCTTGAACGACTTTTTTTCGTGAAT
+CACGGCATGACTCTCCCGTGCCGGCCCAAAGAGCCAGTAGCAAAATGTGTGTTGTGGGGT
+GACCGGTGAGCGCCGGCCGCGCGGTGGGTCAGGAGGCTTGGGCTGCGTTGTCGGTGGTGC
+TGGGAAGAGTGGCGTCCTCGATTTGGATGCCGAGTCCAATCTTGCTCACAAGGTCATCCT
+GGGAGGCGAGGTCAGCGCGGATGTGCTTGCGAACCACGTAGGCAATAGCCTGGGCCTTGG
+ATGGTGCTCGGACCAGGTAGTCTCGGGCCAAGCCGGCTTCGCGGGGCGCATCGATCAGCT
+CATTCGTCACGAGGTAGATCCGTGCCTTGGCAGGCTGGCCTGTATCGGTCGGGCCGTGTC
+TCACGAGCCACCTCCGAGCATGCCGGCAAAGGCCAGGGTAAACATGGAGCCAAGGAAGAT
+GCCGGCGGCCATGTATGCGGCGCGCAGAGCTTGCCCGCGGCCGGTGGTGATGGGAGGGAT
+GTAACCCATGTTGGTGATCTCCATCCGCCCGGGGGCGGTTCTGCGTGAGATGTCTCACAG
+TTGTGGCGGTGCGGCCTAAAAATGAATGAGCGAGCGACGCAAGACTTGTATAGGATCAGC
+GGTTGCTCGGCGGTTCGAGCTGAAATCCCTGCTGATTGCAGTTGCTATGTGGATCTGAAA
+CGTAATGTGTCACCTGTAATGCCTATGCATGGATATTCGTCGCTACCCCCGCTCCTGTTC
+CTGACTGGACTCATTTGTGCGGCTGGCTTTTCAATGGTCTTGAGGGCGCTCGGTGACGAA
+AGGGCGTACAAGTACTGGGCATTGAGTCTGTGGGCAGGTGTCTTTTCAGCTGCCTTGATC
+ATCATCTTCCCCAGTCACCGTCCTTTGGCTGTGGTCGTGTTAGGCCACGCCGCACTGGCT
+GCATCACAAGTCCTTTTGATTGCTGGCTTTTTCAGGTACTGCCGCCTGAAGTGGAGCGTT
+ACAGCTCTGATTGTTCCTGCTGTTGCCTACACGGCTGCTCAGACGGCGCTGTATCTGTTC
+GGGCTAGGAAGCTTCCCTAGATTCGCTCTGTACAGCCTTGCTGTTGCAGTTTGGGATATT
+TGGTCCGTCCAGCTTCTTTTGCGATACCTCCCGGGACAGGCTTTTTACGGGAGTCGTCTT
+GCCGTGCTCGTGATCTCGGTGCATGCGGCATTGCATACCTTCAGCCTTATCCTGGCTTCG
+TCGGACCTTTTGTTTGGACTCGCGAAGAGCGCCAGTGAGTCGCTGCCGATCTACTACATT
+GCGATTTGCATGAGCTTGGCGAAGGCCTTTGCGTTGCTTGCGATGGTCATCGAAAAGCTG
+ATCAACGATCTAAAGATTGCCGCCGAAATTGATGGCATGACAGGCCTTGCAAATAGATCC
+TCGCTCATAGATCGGGGCGAAGAATTGCTCATGCGGTGCAGAGAAGAGGGCGTCAAATTC
+GCTGTCTTGTTCGTGGATATCGACCAATTCAAAGCAATCAATGACGACTTGGGGCACCAC
+GCTGGGGACATTGCCCTAAAAGCATTCGCATCGATCGTCAAAGACATCTTCGACGAAGAG
+GATGACATCTGTGGCCGCTATGGTGGTGAGGAGTTCGTCTGCCTCCTTACAGGCGATTCG
+GCCACCAACGTTGTGCGGAAGTCTGAGATGCTGCGTAGCAGGCTGGCTCACAAACCGATC
+CGGATCGGTGGGCATGCGCTAACCATGACGGTAAGTATTGGCGTCGCAACTGATGATGGT
+GAGATCTGCCTGCTTAGACTGATCAAACGAGCTGATGGCGCACTATATGAGTCCAAGAAC
+TCAGGTCGAGATCGCGTCACTCTGGCAGTCTGATCTTGAGGGCGGGCCTGACTCATCCTT
+GCTGGGTTAGAATCAGGCACCCGGTTGAATGGTGCTGGCATGGCTATTTGCGATAACCCA
+GACGTGATGGATAAGGTCTGGCAAGGCCTGGTTGATGTGGTCAGCCGATACGATCCGGCG
+ATCCGTGGGCATCTTCAGCACTGGGTGCAAGAGGAGCTGGACCGGTTACCGCCAGAGGCG
+GGGCAGGCCTATCTACGTGCCTCCTCAGGGCGTGCTGTGATCGAGGCTGAGGAGCAGGCA
+GAGCTGTCTGCGATCCTGCGGTCACTGAAGAAGACGCTTCACGAGGATGCTCGAGGCAAA
+TTGCGCGGAGTGGTCTAACAGGGCGTCTGCTTTCCAGCTGATCCGTAGTTGCGATGTTCG
+GATTGGACTGGCGACTGGGCATTTCCAGGGGATTTCGGAGTTTTCCATCGCGGTGCTGGG
+CGGCCGCCTCACGGCGTCCAGGCTGCTGTCTACAGCCGCCAGTCCAATGCCCCCGGCTAC
+TCGCAGGGGCGGCGAGGTCATGTCACCCAGCGGTGGTTTGCGTCGTCCGAGGAGCGCGCT
+TGCACCGGGCCATGGCTGCCGAGGTTTTGTTGTGCACGCCCACTCACGGCTTGGACGCTC
+CGGACTGACTCCGGCTGCAAGGCATTGGGCTGCCGCCTGGCGGCCCCGCTACGGGCCATT
+CCTTTTCCCAGCGATGAGATGGCACTCCGGGTGTTCAGCGCCCCGGCCGGCGCAATTTCC
+AGGCGGCAGGCCAATGCCTACTCATGGGGTGAGCGGTTTGTCACTGTTCACAGGTATGCG
+GCCAGAGGAGATTACGTTGTTGATGAGCCGCGGGATGAGGTCAAACAGCTCGCGGTCCAT
+GTGCTTGAAGTCAACGCAGTGGATCATTCGCAGGCGCTCATATGACTCGCATGTCTCTGG
+TGTCTGGGGGATGTTGAAGGCCCCGACAAGGTCATTCAGAGGGCAGATGTCGAAGAAGCC
+GCTGCTTGAGCCGGATCTCTTCTGCCAATCTGAGATTGACTTACGCAATACGGCGCGCTG
+CTCAAGAGTTGCCCCATCCGGATCTGGCCATACGATCATGTCGATGAATGATGGCGCTCT
+CTTTATGGTTGAAAACACCATCGCTCCAGTGTCGATGGTCACTTCCTGCTTGGCTGCGCT
+ACCGCCAAATAGGCGTGCGATGATCGCTTTCATGCTTTGCTCGTTTTGGCGTCGAATTGT
+GATGAGGTCTGTCGGGCCCGCTACGGCCCTGTCCGACGCAAGAGGCGCCGAGTGTTCAGC
+GCCTCGGCCAGCGCAATCCCAAACCCCATCACAATGGCCACTGTCTCCAATGGCCGTTGC
+TGACCTCTATCCAGGCTGGTCAGGCCTTGGCTCCCTATGCATGTCCAGCGCAGCCTTGCG
+GGTGCGTGCTCCGGAGATCCTCAGGGAACCGTCCCGTTGTGAATGAGCGGGTGATGCGTG
+CCGGGCGTTTCGCGCCGGCAATCCAAATATAGGTACGACTATATATTCATGCAAGCATGC
+CTATTAAGCAAGCTTATATTTGTTCATCATTTGTTTATGATTCTGTGCATCCTGTACTTG
+GGCATGTAGAGCAGGCGCATACGCCTGACGAGGGTTACAATGGAGCCACCATCTAGGGGA
+TAGATATGCTCAAGAGAATGTTGCTCGTTGCAGCCGGCTTGGCTATGTGTGGCCAGGCAT
+ATGCCATTACGTATGGCCAATATCAGGCCGCTGAGTCCGAGCCTGGGTCGGTTGCTGCTG
+GCGCTATGGGCATGTACCTAGTGGGGGCTAATTGCCGGAGCTCAGATGACCAATGCCTAC
+GCAAAGATTTCAGGTCATGGGGCGCTTTTTTGCCCGCCCGGTAAATTGAAGCTGGACGAT
+AGGGTTGCCGCAGTATTGATAGATCAGGAGGCCCCCAAGGGCCATGCGACTGATGACACG
+GACATCGAGTCGATTCTGATTGCGGCCATGGCTCAAGGCTTCCCCTGCAAGGAATGATCC
+AGGTTATCGGCTGGCGCTGACAGGGAGGGTTGCTGATTGGTCTGATTGATGGTCGTCTGC
+ACATGGTGGTCTTTACGCCACGCGCTGGCGCGGTGCACGTGATCAGCTTCCGCAAGGCCA
+ACGCCAGAGAGGTTAAACTGTATGAAAAAAGCACCAAACCCCAGCAAGATTGATGCTGAA
+GCTCCTGAGTGGGGCGTCGAGGCCTTCGGAAAGGCCAGGCCAGCGCATGATGTACTTCCT
+GGAATCTTTGGCGAGAGGGTGGCCAAGGAGTTGCTGCGCCCACGGGGAAGGCCGCGTGTA
+GCTGAGCCCAAGGTCGCGACCAACGTACGTTACTCTCCGGAGATCCTCGATTACTTCAAG
+GCGGATGGCCCAGGCTGGCAGACCCGCATGGAGCAGGCACTATGCGAGTACATCTCGGCG
+CATCCGAGGGCTTGAGGCACTAGACTGCTGCTGAGCATAGCTGTATGAGATCTGTCGCAG
+TGGATGAGACGCCGCTATGTCAAATTCCCAGCCATGTAATGACCCACCGCTTTCTGCTCA
+GGTCATGCGGTTAATGTAGCGGCGTAAGCCTCATCCGGGGTCATCATCTTCAGTGCCTGA
+TGCGGGCGTTGTTGGTTGTAGAAGGCGATCCAGTCGGCGATCACCCGCAGGGCATGGACC
+TGGCTCTCGAAACGATGCCGGTGCACGCACTGCCCGCAGCAGAATGGCATAGCCGAGAGC
+CTAGCCCGCACGATCAAGCGTGATTACGCGGCCTTGATGTCCAAACCTGAGCCGGCCATG
+GCCATGCGAAACCTCGCATTGGCCTTCCAACACTATAGCGAGCATGATCCCCTTAGCGCC
+CTGAAGTACCGCCTTCTAGTGAGTACCGGTGCCGATTGGCGTCGTTAAACCAAGTGTGAG
+TCGGTGTCCGAAAATATGGGGAGCACTCCAACTATCAAAGACTCATGCTGATCGCCTTAT
+AGATCGCATTGGATTGAGTGTCGTGTTATGCACATGTTATCCACAGACTGATCGATTGAG
+AGGTGCTAGACTTGCACACAAGTTTTTTCAAAACTCCCGTTTATCGAGGATTGCTATGAG
+CGAGCGACTGACGAAAGTTCCGACCCCGCAGGGCGAAGTTGAGGGTAGGGAAGTGCAGAT
+TGTTGAGTCCTTAGAACGCTGGTCTGACGTGACTCTTTCTGACGGGACGACGTTTCGTGC
+AAAAATTAATATTGTTAACGTTGTTCGCATTGATGGTCAGTATGATGCTCAAGGTAATCC
+TTCATACATGATTAATGCTCAGCCAGCTATTGCAATGGTGCACGTTCCTGACGAACTGCG
+TAAAAAAGGATAGGTCTTATGATCGAATTCCAGAGCAATATCGGCACAGTAATAAATTAT
+GGCTCTAACTCTTTGATGCCTATTTCGGTGTTAATTTCAAGAGATTCGCCCTCTGTGGAT
+TTTGACTCTAGAAATGCTGGTAAGCACTCCTGTTTTGGAGGTGCGCTCGAGCCAATGTCG
+GTGAGTGCATTTACTGGCCATGATTTTGCCATTAAATCTAAAGGCAGGCCATTTGCTTTC
+AGGTTAAACCCTTCTTTGAGATTTATTTCGGATTCTCATGATTATGGTGAAGCATCGTTT
+AGACTGTTGGCAGAGAAGTTGAAAGACGATGTGAGGATGTCTTCTTCGCTTTCGGATATG
+GAGTCCTCTAAATATTTTAGAGATATCTTATCAATGAATGGGGATGTGGTTAGATGGATT
+TTAGAAGATATTAAGAGTAATAGGAAGGATCCTTTCCCTTGGTTCAAGGCACTGCGCTTA
+CTGACAGACGAGGATCCAGCCAAAATTGCACCTAGAGGGGACTGGGTTGCAATGGCTGAT
+AAATGGATTGCCTGGGGGGAATCTGATGGGCGATTGGTTTGATCTAGCTAAAGAGAAGGG
+TTTTCCTAGACTGACAAAAAGCTCGTCTCGTATTACGAGTACTGAAACAAGTAGATACAA
+CTGTCTCGCATGGGCTGCAAATGTAGAAAACAGGTGGTGGTGGCCATATGGAGACGCTTG
+GTGGCCTGAAAATGTGCCGCGAACACTTGATATCGATTCATTGAAGGCGGCATACAGGAC
+TGTTGGATTTGTTGATTGTAATGACGGATTGCTTGAGGCGGATATAGAGAAAATCGCCCT
+TTACGCATTGAATTCAGAATTTACCCATGCTGCGCGCCAGCTCCCAAGCGGAAAGTGGGC
+TAGTAAAATGGGGCATAGTCATGATATCGAGCACGACTGTGTGACCACCGTTGAAGGCGG
+GATTTATGGTGAATGCGTTGCTTATATGTGCCGGCGCCGTGCCATAGATTGACTATTTAG
+ATCAATTGCAGGACGCCAAAGGTCGGAACTCTTTTTTGAGTGATTACCTTCTTGCCTTAT
+TTAAAATGCATATACCAGCAGGTGTGAGTGATCAGCGGTGTAGTGTGCTCGTCACCATGC
+GATCCAAGTCAACGAACAGAGCATCACGTTCGGTCTTCGAGGCAGGTGATGCCATAAGGA
+AAGCGGCCACGATTACGCTATGGCCATCAGGCCAGGTCAGGATACCGATGTCGTTGTAGC
+TGGAGGTTAGGCACGTCCAGTGTGTAGGACGTGCCGCTTTTGTCCGCAAGTCGTAAGCCT
+TGGGGCAGTCCTCGCCGCAGGCGTTCCGGCTTTGTCTGTGCCTGCATCAGTGCAAGCAGC
+GCGTGTGTCGATGTAGGTGAGAGCAGGGCGCCATGTTGCAATTTCTGGAGAAAGTCCGCA
+TCCACCCGCATGCCTGTGATGCCATGTGCGCGCAGGAAGGTCGTGACCTCCTGCGGCGGA
+ACCAGCTTGAGCAATGCATCGACGGCGGTGTTGTCGCTATCGCTGACTGCGGCGGCCAGT
+AGTTGTCGAACGGTGTATGTCATCCGCCCGCCGTGAAAATGCGCACCGATGGACGGTACG
+GCGGAGCCACAGACAACATCTGAGCGCGTCAGCGTTACTGTATGTTCCATCGACAGCTTG
+CTGCCGCTGGCCTGAGCGACACCGCTTCCGCAAGGTGAGGTCGCCGGACGCTTACGATTG
+CCTCAGTCATTGCACTCAATTGATGACACGCCCTAGTGCACCAACAACGAGGCGCACCCT
+GTTCAGGCCTGACATTTTTCATACCCTGGAGCTGGATCGGGTAATGATGCTGCACCAGGG
+GAGGCTTACACGTCGTGCTTGCGTGGACTCATGGTATCTCCAGGTCAGATGGCAGTGTCC
+CGCCTGTGGCCCGGTTACACAAAATCTAGGACACCCTCAGACCTCAAATTTTCAGCCCTT
+TCCAAACCGTCCGTAATTTCGGGGTAGAACCCCTTACGAGAAGCTTCGCCGAGTTGGGCC
+TCGTGCCGCTGCTAGCACTCCATTGTGCTGGCAGACATGGCGCGGCTTACAGTTCTTCGT
+CGCGCTTCATCTGGATCGCTCCCAGGACGCGGCCAGCAATGCAGATATCAGAGGCCTGAT
+CAGGCCGGTAGATATCCGGGTGATCCGGATCGGCCAGGCTCACAACATGGAAGCCGTCGC
+GACGGATCTCGATGCGCTTGACCAGGGCATGGCCATGGAGCAGGACGACGAAGATACCGC
+CGTCCATGGGGTCTCGATCCTCAATGTCCACGAACACGACATCGCCATGCTTTATGCGCG
+GGGTCATGGAGTGTCCGCGAACTGTGAGGAGCTTCACTCGATCGGGGCTGACGGCGCGGC
+CAACTTTCTGACGGACCTGCCACTCGGCGATATCCACTTCCTGGAGCACTTCCGGCTCTT
+CACTGTTCAGCACACCTGGCCCCGCTCCGCCTGCACCCATGACTTGGAAGCGAAGGTAGC
+CTTCTGGTGTCTCAGATCGTGAGATTCCCAGATGTTCGAGCGGGCCTCTTGGGCCTACGC
+CAGTGGCCAGCCAGCGAGGGGATACGTCAAGCACGTCTGAAAGCTCAATGAGCGTGGTGT
+CCTTGAGGCTCTTGGTTGAGCCTGACTCCCATTGATAAGCCGATGCTGCCTTGACGCCTA
+CCCGTCTGGCTAGCTCTGCCGGCTCACTGATGCCTGCAGCCTCTCTGGCTTCTTTGATTC
+GTTCTGCGAGCGTTCCAGTCATGTAAGGGAGCTTATATGGTGCATGTATAGTTGTGCTTG
+CATGATAGATGTAAGCAAGCCTATTATTGCGCCATGAAAAGCGCACCTAAGATCACGAAG
+GCAGAAGCAATTTCGCCCTTTGGCAGCGGCTACGCTCTTGCGAAAGCCCTGGGAATTGCA
+CCAGCGTCCGTATATCAGTGGCCTGATGGCATGCCTATACCTGAGCTTCAGGCAATGCGC
+CTGGCATTTTTGATCCGGCCGGATATTTTCGGCCCAGCTCAGACCAAGCGTCGTAGTGGT
+CACGGTAAGGCGGCGTGATGAATCGACTGATCCTTTCCGATAGCGCCGCCGTGATTGCCC
+TGGCCATATACCTGGGCATCCCCTTCGAGCTGATTCCCCGCGCACTGCGCAACCTGCTGC
+TGATGGCCTGGGGCGCGTTCGTGCTCCTGCAGATCGCCGGCCGGTCTGTATCTACCTTTT
+CGCTTTTCATGAAGCGCCGCCCATCGGACTGCACTCCGGAGGCCAAATGATTCCTGCCGC
+AATCGTTCTGCATGCCAATGGCATGTTTATCGAAGACGACTCTGTCGAAGTTGACTGCAT
+CGTGCTTCCGTTGACGGACTGTCTCGACATCAGCTTCCACCGGATACGAACTGGCGAAGC
+AGTGTTCCAAGCACACTCGGTGCTGGCGACAGCGTCGACCAGCCCGCGTCGATCAGCTTT
+TCGACCAGGCGTCCTATGGCATCGCCCCGTGCGTCACGAAGAACCTGTAACCAGCCTTTC
+TTGTCCTCGTCCGGAATGCTCATGCGCTGGACCTGAGCCTCAAGCAGCTGACGGAGGGTG
+TCCTCATGAAGCTTGACGGTCACCGTTCCAAGGATGGCGCTGAGCCCTCCGTCAGCACGC
+ATGAAGTCAATGCCGGCGGCCGTTATGCGCGCTCGAGCCATCCCGTATTGGGAGGGATCC
+TCAACGTATGTCTCAAGATGCGCAGCAATCATTCCGTGCTCATCGAGATAGTGCAGGTTG
+CGTGCGACTTCGCCAGTCGGGTCGTTCTTGATGGCCTGACAAAAGTCTTGTTGCTGCGGG
+TATGCCTTAAGCAGCTCTTCAAGAATCTTGCGTTGATGGTCTCGCGCAAATCTTTCCATG
+GACTCCATCTTCCGGTGAATACCAATGACTGAACTGTCGCATTCCAAGGGCGTCAGTGCC
+ATGAGTATCGTTTTTCATGCCTCCCGCAAAGACCTGGTCCGGAGCATCGCCCGCGATGCC
+TTCAACGCTGGCGATCTCAACCTGATGAACTACGCGGACCGGATCCAGGAGCTGTACTTC
+ACCTTGATCCCGCCGGCGAGCCAGGACACCAACCTGCGCCAGCCTTGTGATGATGCCACC
+GGTGAGCGGTTCGAAGCTGATCGCCGCCACAACCGGCAGATCGTTGAGCGCTGGGTGAAA
+GGGCGGGTCGCTGAGTTCCCTGACGATCTGGAAGAGCCATGGGTCATGGCATTGCCCGAC
+CAGTGGCGTGACAAGGCGCTCACGGAGCTGTCGGCCCGCTATGGCTTACTGCCTGCGCCG
+ATCCCCAGTGGCGGCCATACAGCGGCATGGACCGGCGACATCATGCAGTCCATGGCCGAC
+GTCCTGCGTGACTTCGCGCCTATTGCCGAGGACGGCGTGATCAATCATCTGGACGCCGAC
+GATCTGCCGGCCTTCATCCTTTCCAGTGCAAAGGCCATGGGCATTTTGTCGAGCATGCAG
+CGGCAGGCAAGCGAAGCCTTGCAGGAAGCCGAGCGGAGGAAAGCACGGTGAACTATTACC
+AGCGCCATATCGGCGACTACGCCCGGGATACCGGCCATCTGTCCCTGCTGGAGCATGGGG
+TCTACATGATCCTGCTCGATCACCATTATGCTTCTGAGGCGGGCATTCCCGATGGGAAGC
+AGTACCGCCTGGCACGTGCACGCACGCCCGAGGAACGGGAGGCCGTCGACAACATCCTGG
+ACGAGTTCTTTGACCTGAAGGATGGGGTTTGGATCAATCGCCGCGCACATCACGAGGTGC
+TGCGCTTCCACTCCACCATGGCCGACGATGCAGATCAGAAACGCGGTGCTGCAGAACGCC
+AGGCAAAGGCCCGCGCACGTCGCTCGGCGCTGTTCGATGAGCTGGCGACCTACGGGGTGG
+TGCCCGACTTCAACGCCTCCATGCAGCAGCTCCGCCACATGCTTGATGAGGTGAAGTCAC
+AGCGTAAGTCACAGGCTCCGTCACGTAACGTCACGCGTGACGTTACGGCTAACCAAGAGC
+CATTACCCAATACCCATTACCCAACAGCCAATACCCAAGAGCCAGTAAACCTCTCCGTAG
+GTGAAGTTGCTCAAGACTTGGGAACTGAGGTTCTAGGGGAGGTCTTTTCCGCGCGCACGG
+CAAATGCGCCGGCAGAGGATCTGGATGGCAGGGTGATTGACGCCTGCAAGGCACTGCGCC
+GTCTTGGGGTTACCAGCGCTAATCCCGCGCTACCGAACCTGCGGGCGGCTATCCAGGCCG
+GAGCGTCGACGGATCACCTCGTCGCGATCACGCAGCAGCAGATCGAGGACGGCAGGGCGC
+CCAATGCCAACTACATCGCCCGCAAGGCGATTGGCCAGATCGAGGACGCCAAGCGACCGG
+CGCCGGTCCGCGCCGGTGGCGCTGGGATCGCACAGAACAAGCAGGAAGCCATCGAGAACC
+GCAACCGCAGTGTCGCCCAGCGTTGGGCCAGCTCTGCCAACGAAGAGCCCCAGGAGGCTG
+AATATGCAATCGGGTGATATGAATGGTTTTGCCGAGATGCTCTCGGAGGTCATGGCCTAC
+TACGCCAAGGACGTGAGCGAGTTCATGCTCTCGGTGTTCTGGGACGGGCTGAAGATGCAC
+GAGTTCCAGGACGTGAGCCGTGCATTCACGCTGCACGCTCGTGACCCGGATCGCGGCCAG
+TGGGCGCCGAAGGTGGCCGATATCACCCGCTTGCTTGAAGGCTCGACCAGCAGCCAGGGC
+ATGACGGCTTGGTCGAAAGTCGACAGGGCCATTCGGTCGGTCGGCGGCAACCAGTCGGTG
+GTCTTCGATGAGCCGCTGATCCATGCCGTGATCTTCGACATGGGCGGCTGGTCGAAGCTC
+TGTCAAACGATGGTGGATGAGCTGCCTTTCGTTGCACGGGACTTCGAGCGACGCTTTGGC
+GCCTATCGCCTTCGCCGCGAGCTTCCGGATTACCCCAGCCACCTGATCGGGAACCACGAG
+GCTCAGAATCGCCTCAATGGCTTCAACCGTGTTCGCCCGGTGCTGATCGGCGACGAGCAC
+AGGGCCCTGGCCGTGATGAATGGCGGGTCCAACGGGAGCCCGCTACGGATCACGCGGATC
+AGCGACGAGGTTGCCCGCATTGGTCAGGCGGCAGCACTAGAACACGGAAAGGGGCAGGCG
+GCGTGATCATCAACCTGCCGCCCGGCACCCATGCCACCGAGCTGTCCCTGCGCTTCGCCC
+GCTTGGGTGATCCCTCCAAGCCGATGACCTGCGGGCAGTGCGCTCATTTCATTCCCAGCA
+CCAGCAAGAGCTGCGGCTATGCCGAGCGACCTGCCGGCCAGGGCGATGCAGCTGCCTGCA
+TTGAGTTCGAGGTGGCACCGTGAGGGCCTTCAAATTGATCCTTGGTAACCGGCAGAGCGT
+GTTTGATCTGGCTGGCATCGTGCGCGAGCACGTTCGTCAGTCGACCTTCGAATGGGCTCT
+GGTGATTCGTCCCAGCGGTGACGCGGCCCTGTACATCGCCACCACGCAATCGACCCAGAT
+GACGGCTCACGACCATCCGGAGCAGATCGTGGGCGTGTTCACGCGGATCCATGATGTGGC
+AACGATCCGCCGTGACATTCAGCGCTGGGTCGATGCCGACGGCTACAACCAGAAGCTGGC
+TCCGATCCGCCTGGTCGAGGGGCGCAACAAAGGCATGTGGGGCGGTCCGATGTTTCGTGA
+ACCCCGCCGGATTGCCCCGCTGATGCATGGCCGCCGCAAGCCCCGGCCGACGTGCCCGGA
+GCATGGTATCCCGTTGCCTCCGGACAGGGACTGGCGCGGCCGAGCTATCAACGGCCCGTG
+CCCGATGTGTGTCGCACGCCGCAAAGCCCGGGAGGGATTGCTGTGAAGGGCGGTCGTCAT
+GCGGCGCAGGCCACGGCCGTCCAGCGCGACCGGATCGTCATGGTGAAGGAGCTTGGATGC
+ATCTGCTGCCAGATGAACCGAGCTGCTGGTCGACCCACGGCATTCTTCGGCGTGGCTGAA
+GCGCATCACCTGCTGTCTGGCGGTCGGCGGCGCGGTCATGAGTACACCATCGGACTCTGT
+CCCTGGCACCACCGTGCCGTGCCGCCGTTCGAGTCGGCCGGTACCGCCGATATGGTGCGC
+ATGTTCGGCCCCAGCGTGGCCACCGGCAGCCGGGCATTCCACGAGCGGTACGGTACTGAC
+GACGAGCTGCTCGAGTACCAGGAGCAACTACTGGCCGGCGCGCGGGCGGTGATGCGGGAG
+GTGGCGGTATGAGAAAGGCAGTGTTCACGGCATCCTGGGTAGCGGGTGGTTCTATCGCCG
+GCGTTCTTCTGTTCTTTGGCCTGTTTTGGGTTGCCAGTCACCTTCATGGTCTATGGGCCG
+GTGCATTTTGCTGTCTACCCATGTGCGCATGGAGTGCAGGGTTCATTGCATGGATGAAAT
+ATCCAGGAGCAAAGGATGAGCAAGCGAGCACATCCGAGATGTCGAAGGCTCGCCAGCTGG
+CAAAAGGGCAGCCTTGCATGATCGGAATCGCAGGCACGTGCAATGGAGACCCCGAGACGA
+CGGTATTTGCACGTTACCCAATGGATGTCTACTTCGATATCGAAATGAGCTCAGATGACG
+AGTTGGGGGCATGGGCCTGCTCAGCTTGCAATGCTGTGCTGGTTAGACGCCCCCCTATCC
+TCGAAGAGTTTTTTTTGCAGTTGAGGCTCTTTCACGCCGAAGGCGTTCTGCGCACCCAGC
+ATGCGATAAGGGAGATGGACAGGTGAAAATGCATTGCGTGGCCACTGAGCACGCCGAGCA
+GGTCGCACTGATGCGCTGGGCTGCCGCAGCCGTGAAGCGTCACCCGGATCTGGCGCTGTT
+GTTCGCCATCCCTAACGGCGGGCAGCGCCACAAGCTGGTGGCGGCGAAGCTGCGGGCCGA
+GGGCGTTCGCCCAGGTGTGCCCGACCTGTTCCTGCCGGCGCCGCGCGGCCCGCATCACGG
+GTTGTTCGTGGAGATGAAGCGCACCGTAGGCGGCGCCGTCAGTTCGGTCCAGAAGGTCTG
+GCACCGCGAGCTGGCCGCCCGTGGTTATCACGTCGTCGTGTGTCGTGGATGGGAGCAAGC
+ACAGGCCGCGATACTCGAGTACCTCTGCATGACAGGTGTCGCGTGATTGCCTGGACGCGC
+GGCAGCCAGCCGCCGGCGCAGGGACGCTACTTGGTGATCGAGAAGGTGTACCAGCGCCCG
+ACATTCGGGTCATGGCGCCCAGATCTGGGTTGGTGCATCGGTGGGCGATGGATTGGGCGC
+AACGCGGTCGAGGCCTGGGCCGATGAGCCGGCAAGTCCGGAATGGTTGAACGATTGCCGG
+ACACAGCCGGCGGCAGCAACGAATTGACGAACGAGGATCTGAACAACATGGCACACATCG
+GCAAAATGCTTGGCCGGCTGAACCCCAAGACCCAAACCTACTCCGACTCGGCCGGCGGCG
+TTGTCGAGCTGAGTGCACAGGACATTGCCGCCGCGCTGGCGTTCGTGCCGGCCGGACTCG
+GCCGTGAGCTGCTTTGCCATGTCTGGTGGCCCGGTGGCGCCGACCGCACGCGGGCACAGC
+TGGATGCGGCTGTGATGGAGCTGCTGGCCAATGAGTGGCGCATCAGGGAGAGCGCAATGC
+TGGATGCGATGCTTATGGTGGCGACACCCGATGTCGGCCGCCGGCGTGCGCAGGATGCCT
+ATGCCCTGGCGCATGCCAATCGCTGGCCGAGCTGGGGAAAGGTGCAACAGGGATTGCTGC
+AGCCGTCACCGGTGTACGCGGCACTTCGGGACGCGGTGCTTTTCGAGCTGCGCACCGGTC
+ACCATGGCGATGCGGACTCCGGCGCATCGGGGGCGATGAGTGATCGAGAGCGGGCAGAGA
+TGATTGGACGGTCCCATGTCACCTACATGAACAACGGATGGCGCCGGGTATATGAGTGGC
+TGCTGGATCGCTGCACAAGCGAGGTGGGTGTCGCTCAGCGAAGGTTTGGACGGGCGGCCG
+CGTAAGCCGCCTCGCACTGGTAGCGTGCAGCACTACCATTTTTGAGGGTAAATTCCCTAT
+CGTGACGAAAGCCCCGCAATCTTGTGGGGCTTTTTTACGCCACCTTGCAACGGGTCAGTT
+ACTGCGTCGCAGCCTTCATTGGCGACACGGTGAATTGCATCGCCAGACCCAAGGCACTGC
+TGATCCGGGCCATCGTTTCGAATCGCGGCTTGCTGCCGGGAGTCAGTGCTTTGTAAAGGC
+TTTCCCGCCCAAGGCCTGACTTGCGGGCAATCTCGCTCATACCCTGCGCCTTGGCAACAT
+GGCTGAAGGCGCGGAGCAGTTCGTCCTGATCACCATCGACCATCACCTGGTTGAGGTATT
+CGGTAATCGCTTCTTCGCTGTCGAGCAAGCTGGAGAGATCGAAGTCAGTCAGTTTCGTGG
+TCATTTTGGATCTCCTTGGCCAACTGCTTGGCCTTGTTGATATCTGCGCTTTGGCTACTT
+TTGTCGCCACCGCAGAGCAGAATGACGATCTGAAGGTTGCGAATCGTGTAGTACACCCGG
+TAGCCAGGGCCTGTTGGGATCCGCAGCTCTGACACACCGTCGCCAACAGGCTTGTGATCA
+CCGAAGTTGCCCTGTGAAGCACGTTCGATGCGCCGAGCAACAGCGATCTTCGCCTTGAGG
+TCTTTGACCGAAGCGATCCAGCTACGGAAGCCATCGGTCTGCTTGACGATGTAGTTCATA
+GGCCAATTGTATCCAAGTGGATACAGTGATAGCAACAATATCCACGAAGTGGGACGCTCA
+TGAGCCACGTTATCGAACTCGTTACGCTGGATGGCGAGCATCGTGTCGGCAGTATGGATA
+TCGCCTCATCTCTGGGGATCCAGCACAAGAATGTGCTCGAGCTGCTACGCCGTTATCGCG
+ATGACTTTGCGCAGTTCGGAAGGGTCGCGTTTGAAACGCGACCCTTTGAAACCCCGGGTG
+GCAGCCAGTCACGTGAGGTGGCAATGCTGTCTGAAGATCAGTGCTATTTGCTGCTTACCT
+ACAGCCGCAACACCGTGCGGGTCCGGTCGCTCAAGGTAGCGCTGGTGCGGGCATTTGGCA
+GCGCGCGCCGCGAAGGCATCTCCCGGTCGCTGACCGCCTGGCAGGAGCTGCAACGCCTCG
+AGATCGAGAACGCCAGCTCGCTGACCCGGGCATCCATCGGCTCGCGCCTGATGCTCGAAC
+GCAAGCGCGCCTTGCCTCAGTTGCGGGCCCGGCGCGAGAAGCTGGAAGCGCAAGTCATCC
+TGCCGATGTTCGCCTTGCCGAACTGACGGTCCTATCCACTGAACAGGCATTCCCGCGGCT
+GCGGGTTTTTTTATGCCCGGAGAATGAGCATGAGCAAAGAAGCCGCACTCGCGGTGGCGA
+AGATCTCGCCGCCCGTAGCGTGGCTGTATGGCGAGATCACAGGTTTCTGGCAATGGATGG
+GCGGCGTCAATTGGGGCGTGGTCACCGGTGCCCTGACTGCGCTGTACACCCTCTTGATGA
+TGATCCACCTGCTGGCGCACTGGAACCAGCGGGGCGTGCGGAGTGAAGACGATGGCAATC
+TCCCGTAAGCCCGCGGCCGTCGCCGGCCTGTTCGGTTTGGCTGTGGCCATCGCAGGCTGG
+ATCATCGCGCCATCGGAAGGCAACAGCCCTGTGGGCTACGCCGATCTCGCTGGTGTGCCG
+ACGGCATGCCTTGGCCACACCGGCTCGGGCGTGGTTGTCGGCCAGCGATACAGCGAGGCG
+CAGTGCCAAGCCTGGTTCGCCAGTGATGTCGGCGCGGCCGCTCGTGGCGTGCAGGCCTGC
+ATCCATGGACCGATGACCAGCTACCAATGGGGCGCGTTCACTTCAACGGCCTTCAATATC
+GGCGTCGGACAGTTCTGCCGGTCATCGATCGCTGCCAAGGCCAATGCCGGCGACATGCCG
+GGCGCGTGCGCCGCGATCTCGCTGTACGTGTATGCCGCGGGCCAGCCGCAACCCGGATTG
+ATACGGCGTCGCGCGGCCGAGCGTGCGCTGTGCGAGGGCCATACCTGATGCGCGTCATGG
+CCGGAATCATCATTGCCCTGGTGCTGGCTGTGGCTGGTGTCAGCTGGCACGACATCCACG
+AGACGCGGGCAGCGGCGAAGGCTATCGCGGCCCGCGACGATGCCCATGCGGCCAACGTGC
+AGCTGCAGCTGACGCTGCAGACCGAGCGCAACAACACCGCTGCGGCCAACGCGGTCGCGG
+CGCAATACGAGAAGGACAAAGCCCATGCCGAACAAACGGCCACTTCGATCGCTGCTGATC
+TGCGTGCTGCTCGTATCCGGCTGCGCCCAGTCTGGCGTTGTCCGGCCGCAACTGCAGTGC
+CCGCAGCCAGCACCGGTACCGGCCAGCCTCATGCAGTTACCGACGTACAGGCAGCAGCTG
+CAGCAGCAGTTGTTCGAGTCGGCGCCGATGCCGACGCACAAGTGAAGGCGCTGCAGGCTT
+TCATCCGATCACAGCAACCGGCCGCGGCCGGCACGGCGAGTCAGCCATGAATTTCATCAC
+CACCATCCGCTGGCTGTTCCGCCGGCTTTTCGTCAAGGAGTCACCCATGACCGAACCCGT
+ACAGCCGGCTGTCGCCGGCACCGCCGCCGTGGCGCAGCCCGCACAGTCCGTGCAGCCCGC
+CGTGGTCCGCACCGATGTCGTCCAGGCCCAGCCCGTCGTGGCGGACCCGTCCGTCGAGCA
+ACTGAAGGCCGAGGTGGCTGCGCTCAAGGCCGAGCTGGCCAAGGTCGAGCCTGCGCGCCA
+GAAGTTCGTCGAGCTGCTCAAGTCCGTCGGTCATGACGTCGAGCTGGTCGCCGACGAGGC
+CTGGGCGCTGGCCAAGAAGGCCATCTGACCGCGGGGATGGCCGTGGGGTAGGTCCCCGCG
+GCCTTCCCGCATCAAATGCGATCCATTCCCATTTGCGCCCGAATGGGCATGGATGGGAGT
+CATTCGCACCTAGGGTCCTCCTGAGGCCCCCCTGGGCCTGCTACGGGTGATCAACACCGC
+GATCCTTCGCTACATACCACCTTTTTTCGGCATGTCCGTGTCCGGTTCCGGTTGAGCAAA
+AATGGCCCTGCAAAAGGACATCGCCGAGCACCTGGATTTGAGCGATCGGCAAGTGCGCCG
+ATTGCTCGCAGATGGCTTCCTGCCTAGCTCCAAGGGCACTGGCGGCTATGATCTGGACGC
+ATGCCGGCTGGCCTATATTCGCTATCTGAGAGGCCTCGGAAACGGGCAAGTAAAAGCGGA
+CACGGCCCCCCTCGAAGACCTCGATCTGGACCCGTTGGCCGAAGAGAAGCTGTTGCAGCA
+GAAGCTGCGTCTGACCGCGGCTCAGGCCGATGGTCAGGAGCTGAAAAACGATATCAGCCG
+CCGGCGCTCGGTGCCGGTGGATTTCGCCATGTTCGTGCTGAGTGGCCTGGCGGCCGAGGT
+CGCCTCGATCCTCGACACGCTGCCGCTGACCATGCGTCGGCGACATCCCGAGTTGGAGCC
+ACGGCATCAGGAAACGCTGGAGCGTGAGCTGGCCAAGGCGCGCAATCGCGCCGCCGGGCT
+GGACGAACGCCTGCCAGGACTGCTTGATGAGTATCTCGCCAGCCCAGATTGATGAGCTGG
+GCCGCGCGGTCAAAGCTGGCCTGCTGCCACTGGCGCGGCCTGAGCCGCAGACCCCGGTGG
+AATGGGCCAACGATCATTTTTACCTGAGCTCGGAATCGAGCTATCAGGAAGGGCGCTGGG
+AAACGCTGCCGTTTCAGGTCGCGATTCTCAATGCCATGGGCAATGACTCGATCCGCACCA
+TCAACGTGATCAAGTCGGCCCGCGTGGGCTATTCGAAGATGCTGCTGTGCGCAGCGGCCT
+ATCAGACCGAGCACAAGAAGCGGAACATCCTCGCGCTGCTGCCGACGGACGATGCGGCCG
+CTGGCTTTATGAAAAGCCAGATCGAGACGATGATCCGCGACGTGCCGGCCGTGCGTGCAC
+TGGCGCCCTGGTACGGCACCAAGCATCGCGACAATACGCTGACCGCCAAGCGGTTCAGCC
+ATCGCAAGCAGCTGTGGTGCTTGGGCGGCGCCGCGGCCAAGAATTACCGCGAGAAGTCGG
+TCGACACCATCATCTACGATGAGTTGGCCGCCTTTGAGCCTGATGTGGAATCGGAGGGTA
+GTCCGACTTTCCTCGGTGACAAGCGCATCGAGGGCTCGACCTTCCCGAAGTCGATCCGCG
+GCTCCACGCCCAAGATCAAGGGCACCTGCCAGATCGAAGCTGCGGCGGGTGAGTCGCCGT
+ATCTGTTTCGGCTGGCCGTGCCTTGCCCGCATTGCGGTCAGGAGCAGGTGCTGAAGTGGG
+GTGGCAAGGATTGCGCCTACGGCATCAAGTGGGACCCCGACAAGCCGACGGATGCCTGGT
+ATGTCTGCGAGCACCATGGCTGCCTGATCCGGCAGCACGAGCTGCAGCCCTTGCAGGCCG
+AGGGGCGCTGGGTCTGCGAGCACACCGGTCTGTGGACGCGCGACGGGTTGGATTTCTTCG
+ACTCTGCTTGCGAGCCGGTACCGACGCCGGAGTCGATCACCTTCCATATCTGGACGGCTT
+ACAGCCCGTTCACGACCTGGTCGCGGATCGTGCTGGATTTCCTCAAGGCCAAGAGCGACC
+CGAACAAGCTCAAGACCTTCGTCAACACCACCCTGGGCGAGACCTGGGAGGAAGAAACCG
+GCGAGAAGGTCGAGTGGGAGCAGCTCTACGGTCGCCGCGAGATCTGGCCGGGTCTGCCGG
+CGCGGGTCGGCGTGCTGGTCGGTGGCATCGATACGCAGGATGACCGTTACGAGGGTCGGG
+TCTGGGCGTTCGGTCCGGGCGAGGAAAGTTGGCTGGTCTCGCGCTGGATCCTCTACGGGG
+ACCCGGCCAGCGAGGAGCTTCGCCGCAAGGTGCGGGAAAAGATCGCGGAGATCTTCGCCC
+GCGAGGACGGTGCCCGGATGCGGGTATCGATGTGGTGCTGGGACTCGGGTGGTCATTACA
+CCGATGAGGTCTATGCCGAGAGCAAGGCCATCGGCGTGCAGTGGGTGATTCCGGTCAAAG
+GTGCCAGTCGGTACGGGCGGCCGATCGCCAATTTCCCGCGGACCAAGAACAAGGCCGGGG
+TCTATCTGACTGAGGTCGGTACCGACAACGCCAAGGAGCTGATCTACAGCCGTCTGAAGT
+TGCAGCCGACCCCGGGCGAAGCCTCGCTGGGCGTCATTCACCTACCGGCTGATGATGCGA
+TCTGCGATCAGACCGAGCTGCAGCAGCTGACCGCTGAAACCAAGGTCATGAAGATCGAGA
+AGGGCCAGCGGGTCTACCGCTGGGACGCCAAGGGGCGCCGCAACGAGGCCCTGGACTGCC
+TGGTGTATGCCGTGGCGGCCCTGCGCATCGCCCAGCAGCACTTCGGACTCAATCTGGACA
+CACCGCCGGCCGTGGCGACTACGCCGCGGGCGCGGCCTGCGCGGCGCGGCACACGGAGCA
+AGGCAAGCTAAATGGCAACGACATCCCCCGAAGTCATCCAAATCCAAGCACGGCTGACCC
+GGGTGGTGGCCGCGATCGATGCGTTGATCAGCGGCGCCCAGGTGGTGCGCTTTCGTGACC
+GCGAGGTGCGCCGTGCCGATCTCGGTGAACTGCGCAGCCTGGAACAACAACTGCGCTTGC
+AGCTGGCCGCCGCCCAGGCTCGGGCCGCGCGGATGGGCCGCAATCGCGTCAGCTATGTGG
+CGATCTGATGGGCATGTTTGGCAAAACCTCCATCCGTGACCGGATGAACAAGCTGGCCGT
+GTCCTATCTGGCGGCGGGCGGCGTCAAGGCGCAGGGTGGAGGCGGTGGCGTGGAGACACG
+CTGGCGCGGTGCCTCGCGGCTGCTGCGCTCGATGGTCAGCTGGGTACCGGGCGTGGGCAG
+CCCCCGCCGGGACCTGCAGCGCTACGAGCGGCATATGCTGGTCGCCCGCTCGCGCGATGC
+GATGCGCAACCATCTGATCGGCCGTGCGGCGGTGAACCGGGTCCGCACCAGCGTGGTCGG
+TACCGGCCTGCTGTGCCGGCCCAGCGTGAATGCCCAGGCCCTGGGCCTGAGCGAGGACCA
+GGCCGATACCTTGAATGCGCAGCTGGAGCGTGAGTTCCGGCTGTGGTCGGAAGATCCGCG
+CGAGTGCGATGCCGAGGCCAGCAGCAATTTCCACCAGCTGCAGAGCCTGGCCCTGGTCAG
+TGCGCTGACCGGCGGCGATGTGTTCGTGACGACGCCCAGCATCGAGCGCGAGGGCGCGAT
+CTTTTCGACCCGGCTGCAGCTGATCGAAACGGACCGGGTCAGCAACCCGGACGGCATGCC
+GGACACCGACAACCTGATCGAGGGCGTGGCCTTCGACAACAACGGGGCACCGACGCACGT
+CTACGTGTGCAGCGGCTACCCCTACGAGCAGAAGATCCGGACCATGCTGACCTGGCAGAA
+GATCCCGGTGTTCGGTGCCGTCACGGGCCGGCGCCGGGTGCTGCAGATCTGGTGTGATCG
+GGATCGGCCTGGCCAGAAACGCGGCGCGCCGTATCTGGCACCGGTGCTGGAGCCTTTGCA
+GAAGCTGGAGCGCTACAGCTCGGCCGAGCTGATGGCGGCGGTGGTCAGCGCGATGTTCAC
+GGTGTTCATCAAGAAGACGCCGGAAGCCGATCCCGCCAGTCTGGTCCAGAACCCGCTGGT
+GTCGATGGGCGGCCATGACGAGGCAGACATTCCGGTGCCGATCCCGGACGAGCCGGGCAC
+GGTGGAGCTGGGCGAGGGCGCGGTGGTTGATCTGGCCCCGGGCGAAGAGCCCGCGGTGGT
+CAACCCGGCCCGACCCAATGCGCAATTTGATCCGTTCTTCATGGCGATCGCCAAGGAGAT
+CGGCGCGGCGCTGGAGCAGCCGGTCGAAGAGATCCTGATGCACTACAGCTCGAGCTACAG
+CGCGGCACGTGCCGCGATGTTGCAGGCCTGGCGTTATTACGAGATGCGCCGGTGGTGGCT
+GGTCTGCGATTTCTGCCAGCCGGCCTATGAGCTGTTTATCGATGAGGCGGTCGCACGCGG
+CCGTATTCATCTGCCGGGCTATGCCGATCCGGCCCAGCGCCGGGCCTATACGCGGGCCAT
+CTGGATCGGCCCTGCACGGGGTGCGATCGATGAGCTCAAGGAAGCACGGGCGGCGCAGGC
+GCGCATCGATGCCGGCGTCAGCACGGAAACCATGGAGACCATGGCGATGAGCGGCGAGTC
+GTGGGAGGAAGTGATCCAGCAGCGGGGCCGCGAGATGGAGCGCCGTCGCCAGCTGGGCCT
+GATCCCGCCGACACCGAAACAAGCCCCGGTCCTGCAGGAGCAAGAGTGATGATCAACCTG
+GCCGACATGGCTGCGGCGCGGCCGTGGCTGATGATGCCGCAGTCGCTGGAGCGGCTTCTG
+GCGATTGCCGACCGGCAGCTGGAACCGCAGGCGCTGGAGACACGCCCCGGCGATGAGCTG
+CGCAATACCCGCACGACCAGCGTGCGTGATGGCGTGGCCATCGTGCCGGTGACCGGCCCG
+ATCTTCCGCTACGCCAATCTGATGACCCGGATCTGCGGCGCCACCAGCACCCAGGTGCTG
+GCGACCGATATCCAGGCCGCGCTGGATGACCCGAGTGTGCGAGCCATCGTGCTGGATATC
+GATTCGCCCGGCGGCGAGGCCAACGGCATCAACGAGCTGGCCGAGATGATCTTCGCGGCC
+CGCGGGCAGAAGCCGATCGTGTCCTATGTCGGCGGTACCGGCGCCAGTGCCGGTTACTGG
+ATCGCCAGCGCGGCCGACGAGATCGTGGCCGACGAGACGGCCGTCCTCGGCAGCATCGGC
+GTGGTGCTCGAGGTGATGCTGGCCGACGATGCGCCTGGCAAGCGCCGGCTGCAGATCGTC
+AGCCAGAACGCGCCGAACAAGCGGCCCGACCTCAAGACCGAGGAAGGGCAGGCCAAGGTC
+GGCGACATGATCAACAGCATGGCCAGGGTCTTCGAGGCCAAGGTCGCGCGCAACCGCGGC
+GTGGCCCTGGATCAGGTCGGGCCGATGGGTGACCACGGTGGTGTGCGCATCGGCGCCGAT
+GCTGTGGCCGCCGGCCTGGCCGATCGGCTGGGCTCGCTTGAATCTGTGGTGGCCGAGTTG
+AGCCAGCGCAGACCCTCTCCTTTCCAAAACACTCGGAGGTCCCCCATGGGGCACAAAGTC
+AGCAGCACCGAAGAGCTGCAGCAAGCCATCAGCGCGGGTGTGGATCCCGCCACCATCGAA
+CTGATTCCCGCCGCGGCGCAGGATGATCCGGCGCTGGCCCAGCAGGCGGCCGCCGCCGAG
+CGTGCACGCATCCAGGGCATCAACGCCTTGGCGCGGCCCGGTTTCGAGAAGGAGGTCGCT
+GCGGCGATCGAGAGCGGGATGCCGGTGGCCGAAGCGGCCCTGTCGATCCTGACCGCCGCC
+GGCGAGCGCGGCATCACCCTGGAAGGCATCGCCGCTGATGCCACCCATGCCCGTGGCGCT
+GCCCCGGGCGAGCAGGCCACGGCCGCACGGGAGTTCAACCCTCGTGCGATCTGGAGCAGC
+CGTAAAGGAGCGCAGTGATGACCACTCTGACCATGAATCCCCGCACCGGCGAGTTCCTGC
+TCAGCGAAGCCATGGGCACGCGCTCGCGTGACCAGGTGTCCCTGGCGGCCACCGCCGCGT
+ATATCCCGGCCGGTACCGTCATGGCCAAGGCCACCGATGGGACCTGGGCGCCGTATGCCG
+ATCCGGTGGCCGCGGCCGCCGGAACCAGCACCGGCACCACGTCGGGCACGACGGATACCA
+CGGGTACCGAGACCACCACGGCGGCCACGACGCCTTCCGAGGTCGGCGTGCTGTATCGCG
+GCGCGCAGATCAACACCGATACCCAGCCGGCGGTGATGGTGACCCGCGATGCCGAACTGG
+ATCAGGTCCTGCTGATCGGCTTGACCGACACGGCCAGCAGCCTGCTGGCCGCCCAGGGCC
+TGATCCTGCGTTAAGCGCACACCTCATCACCTCTACACACAAAGCCGCCTTCGGGCGGTT
+TTTTTATGGGACACATGCATGGCGACCCTCGATATTTTCAATGACAGCGCGTTTGGGCTG
+ACCTCCCTGACTGCGGCGATCAATCAGAACCCGGAAGGCCAGGCGTCTCCGGACATGCTC
+GATGCCCTCTTCTCTGAAGATGGCGTGACCACCACCAGCGTGTTCATCGATCGTCAAAAC
+GATTCGCTGGACCTTGTGCCTGCCGCCGAGCGCGGTGCACCGGCCAGCCCGACCCGATCG
+CCGAAGCGCGACGGTATCGACTTCCGCACCATTCACCTGCCGACTGACGGCGTGGTGCTG
+GCCGATGAAGTCCAGAACATCCGAGCCTTCGGACGTGAGAGCGAGCTGGAGCAGGTGCAA
+GGCTTTGTCGACAAGCGCCTGCTCAAGATGCGCCAGCGGCTGACCGCAACGATCCGTTAC
+CACCGCATGGGCGCGGTCGCCGGTCAGATCTACGATGCCGACGGCAAGACCTTGCTGTAC
+GACCTGTTCAAGCAGTTCGGCATCAAGCAGCAGGTCCAGGCCTTGGGGCTGGCGACTTCG
+ACCAGTGGCATTCTGCAGAAGATCGTCGCGGCTCAGCGCATGGCCGAGGATGTGATCGCC
+GGCGCTGCTCCGATCACCGGCTGGCAGGCGGTCTGCGGCCGTGGGTTCATGGATGCGATG
+ACGGCCAACGAGGACATTCGTCAGTCCTTCCAGCGCATCAACGAGGGCACCTTCCTGGTG
+AACAACTACCGCGGCGGCTTCCCCTATGCCGGCGTGATGTGGAAGGAGTACTACGGCAAG
+TTGGGCAGCACCGAGTTCATCGACACCAACTCGGCGTATCTGATCCCGACCGGGGTGCCC
+GATCTGCTGATTACCCGCTTCGCGCCGGCAAATCATATCGATGTGGTCAATACCACCGGC
+GTGCCGTATTACGCCAGTCTGGAGATGATGAAGCATGGCGCGGGTGTGGATCTGTTGGCG
+CAGTCCAATGCCCTGAACATCTGCACCCGCCCGCGGGCGATCATCAAGCTGACCGCCTGA
+TGTTCCGGGACCTGGTCAGCCAGATGGACGACCAGGTCTTTCCGGCCCTGGGCGATCCGG
+CGGTGCACAAGGGCGAGACGATCCTCGGGATGTTCGATGCGCCGTGGCTGGAGCCTGAGT
+TCGGGCGTCAGCAGACGGCGCTGCGATCACCGGTGTTTGTGGTGCGTGACGCGGTGGCGG
+CGGCCATCGCACCGGGCGATACCCTCGATCTGCAGATTGAGGGCATCGATGCCGGCCTCT
+ACACGGTGACCAAGCTGGAGCCTGATGGCACGGGCTTGATCACCCTGGTACTGAGGCGCG
+CCAAATGATCGAGCTGAAATTCTCGCTGGCTGATGCCCGCAAGCTCGAGCAGTTTCGGCA
+GGCCGCCCCGAAAGAGGCGGCCGATGCCCAGCGCCGGGCCATCAACAAGACCCTGCGCTG
+GCTGCGCACGCACATGTCACGGGCCATCAGCCGGCGTGATCGCATTGCGGTGACGGCGGT
+GCGTCAGCGCCTGTCGGCCTATGCGATCCGCCCCGGCGGCAAGCAGGGCAAGCTCTGGCT
+GGGTCTGGATCCGTTGGAGGCCTCGCGGTTGGGCAAGGTGCGCCAGACGGCGACTGGTGT
+CTCGGTCGCAGGTCGGCGCTTTCGGGGCGCCTTCTACCAGAAGGTCTATGGCGGCAAGCC
+GGACGTCTGGATCCGCACCCACAGTAAGCATTTCAGCACCTCGGCTTATCCCGGGGTGGC
+CATGGGCGGCCCTGCCATCGATGAAGGCATGTCCGGCCGCTTTCCGGTGGCCAAGGTCAA
+GGTCAGCATCGAGGACGTGCGCGAGGAGTTCGAGCAGTGGGTGGACCGTGCTGCCGAGCG
+ACTGGCGGTCGTGCTGCAGCAGGAAATGCGCTACGCGATGATGAAGGCGATACAGCGATG
+AGCAACGACGAAAGTGCCGGCGACATCCAGTCGGTCGATCTACCCGCTGTCAGCACGGCG
+ATCGCCTCGACCTTGAGCACACTGTTCCCGGCCTTCGTGTCGGTGCAGGCCATGCCGGAT
+CAGGGCGAGATCATGGATCTGCCGGTACCGGCCGTGTTTATTGACCTGGAACAGATCGAG
+CCGGCGCCCGATCCCGGCACGGGGCAGTCCGCCGTGCGCTGTAGATTCTGCGCCTATCTG
+CTGATCGGCCCGGAATGCCAAGGCCATACCCGGCTGCTGGGCAGCATGGTGACGGCAATG
+ATTGCGGCGCTGCGCGAGCAGTGCTGGGGCGTCTCGGCTGAACCGGCCGAGTTCGTGGAG
+GCGATGCCAGATGGCAGCCGGCCCGAGCTGGACAATCTTGTGGTCTGGTCGGTGCGCTGG
+GATCAGGTGATCTATCTGGGCGAAGCCAGCTGGGACTGGGCGGACAGCACCGGCTTGACC
+CTGCTGGTTGGGATCTCGCCCGAGGTCGGGCCTGAGTATATCCAGGACTATTTCGATCCA
+AAGGAGCGGCTCGATGAGCTATCCACTGGCCGAACATGACCGGATGATCGCGGCCATGCT
+GCTGCCTTGCGTGGTGGAGGCGGTCGATCCGGTCCAGCAGCGGATCAAGGTCAGCAACGG
+CGACTGGATCAGCCCCTGGGTGCGCTGGCACAGCGGTGCGGCCGGCGCGGTGCAGATCTG
+GCGCGTGCCCAGCGTGGGCGAGCCGGGTGTGCTACTCAGCCCCAGCGGCACGGTGGCGGC
+CGGGACCTTCGTGCCAGGCCTTTTGAGTGCGCAATGGCCGAACAGCGAGAGCTCGGCCGA
+TGTGACCTCCATCCAATGGCCGGACGGTACCCGTATCGCCTATGACGCCGCCAGTGGCGC
+GCTCACGGCGGCGCTGCCCAAGGGGCAGCTCAGTGCATCGGTGGGGCAGGTATCAGCCGT
+GCTGAGCGAGCAGAGCGCCGTCCTCACGGCACCCAACATCAAACTTGCGGGTACGGTCGA
+GATCGAGGGCGATCTGACCGTGTCCGGTACGGCCCAGGCCGCGAGCTTGTCCAGCCAGGG
+CGGGATTGACGCGAAGGGCAACATCCAAGCTGCCGGCACGGTGCACGGCAGCAACCTCTG
+AGAGAGAAGCCATGGCAACGACCACTGATTCGGGCGCGACCACCGCGGCCGCGGATACGG
+CCGCAACGACGGCCGCCAATACCTCGAGCACCAGCACGACTGCGTCCGCTACCGCGGCAA
+CGCCCGCAACCAGCAGCACGGCGAGCACGACCGCCACCCGCACCACCGGTACAAGCTCCG
+CCACGGCGACCACCGTGACGCCTGCGGCGCCGACCCTGCCGGTGACCTTCAAGGATTTGC
+AGTATCTGAGCCGGGTGCTGATCCTCGATGACGGGCGCACCTTGCAGGTCAGCCGTTCCA
+AGGTGACGGCCTACGATGCGGCCGCCTATGCGTTTCTGGCCTCGCGTGTGGACTTCGCCA
+AGTCATGATCGTCGGGATGAGCCGCACCACGGGCCAGCCGGTGCATGGTGTGGCCTATCT
+CGTGCAATGCATCGAAGACGTGCTGACCACGCCGCTGGGCAGCCGCCGGATGCGTCCCGA
+GTACGGCTCATCCATCCGCCAGATGGTCGATCTGCCCATGAACGAGGGCTGGAAAAGCGC
+CGTGCAGGCCGAGACCGTGCGGGCGCTGTCCCGCTGGATCCCGACCTTCAAACTTTCCTC
+CGCCCAGGTGGTGTCCGTGCTCAATGGCACGATCAGCTTCACCGTGAAGGGGCAGTACCT
+GGGTGACAACGTCACCCTGCAGGTGAGTGCATGAGCCTGATCGATCTTTCCCAGCTGCCG
+GTACCCGACGTGGTCGAGACGTTGGCCTACGAGGATATTTTCCAGGCCCTGCTGACCGAC
+CTGATGGCGGCTGCCGGTGACAGCTGGACCTCGGCGATGGAAACCGACCCGGTGATGAAG
+CTGATGGAGGTCTGCGCCTATCGCGAGCTGATGCTGCGGGCCCGGGTTAACGATGCGGTG
+AAGGGCTGTTTTCTCTCCACGGCAACTGGTTCGGATCTCGACAATCTGGCGGCGTTCTTC
+CAGGTCGAGCGGGAGACAGTCATGCCGGCCGATGCCAGCACCGGCACCGCGGCGGTGATG
+GAGAGCGACGATGCCCTGCGGGTGCGCGTCGGCCTGGCACCATCATCGTTCTCGGTAGCC
+GGGCCGGAAGAGGCCTACGAGTACTGGGCCCGCACCGCTTCGACGCACATCGTCGATGCC
+AAGGCGACCAGCCCCAATCCCGGCGAGGTGGTGGTGGCCGTGCTGGCTGACAGCGCGGAT
+GGCACGGCCTCGGACGATATCGTGGCCGCCGTGCAGGCGATCCTGTCTGATGACGATGTG
+CGGCCCATGACCGATCAGGTCACGGTGCAGTCAGCCGCGATCGTGGGCTTCGCGGTTGCG
+GCGACCTTGCCGACGTACTCAGGGCCGGATCCTTCGGTGGCGCTCAGTGCGGCTGCGGAT
+GGCCTCAACACCTACCTGGCCAGCGCCAAGAAGATCGGCGTGTCCGTCACGCGGGCGGGC
+ATCATCGCCGCCCTGAAGGTGGCGGGTATCCAGAACGTGATCCTGACCGAGCCGGCCGAA
+GATGTCGCGATCAGCGATACCCAGGCCGGCAACTGCACGGGCATCACTCTGACCCCGGGG
+ACGACCGTTGACTAGCCTGCTACCACCCAACCGCACCAGCTTCGAGGCGGCGCTGGAAGT
+GCCGCAGGAGCGGGTCGATGCCATCCCGACGCCACTGGCTTCGCTCTGGAACCCCGACAC
+GGTGCCCTCGGCGCTGCTGCCGTGGCTGGCCTGGTCGCTGTCGCTGGAGAGCTGGCAGTC
+GTACTGGTCCGATACCGTCAAGCGCAACCGAGTCCGGCAGGCGATCACCATCGCCCGTCA
+TCGCGGTACTGCCGGTGCCGTGAAGGCAGCGGTGGAAGCCTTTGGTGGCTATGTGTCCAT
+TCGGGAGTGGTGGGAAACCACCCCGAAGGGCACGCCGCACACCTTCGCCTTGCTGCTCAC
+GCTCTCCGGCGCCGATGGCAACGTGGCCACCGCCGAGTACGTCGACGATGTGATCGAGGC
+GGTCCGCCAGGCGAAGCCGCTGCGCTCGCATTTCACCTTCACGCAGGGCATCAACGCGAC
+GGGTTCAGTCGGCGTGATCGCCGCGGCCCGCCCGCTGGCCTATGCGCATCTGCAATTTGA
+TGGAGCTTCCTGATGGGTTTGACAGTCACCATCACTGACGCCGGCCGCGCGGCGCTGCGC
+AACGCCGCCGGCAACGGCACCAATGCGGTCACGATCGCTGCGGTCGGACTCAGTTCGCAA
+GCCTTCACGCCCGGCGCGGCCATTCCGGCCGAGATCAAGCGGCTGACCACGATTTCCGGC
+GGCGCCACGGCGGCTGATACCATCCACGTCACCGTGCTGGACTCCGGCGATGACGATTAC
+TCAGTGTACGGTTTCGCGCTGTACCTCAGCGATGGCACGCTGTTCGCCTCCTATGGGCAA
+TCCACGGTGATCGTGGAAAAGTCCGCCCAGGCCATGATGCAGCTGGCGCTGGATGTCCGC
+TTTGTCGATGTCGCGGCCAGCAGCATCAGCTTCGGCGATGCCAATTTCATGAACCCGGCG
+GCGACTGAGGACACGCTGGGCGTGGTCAAGCTGGCCAGTGCCGATGATGCGACGTCCGGC
+ACGGACAATCAGAAAGCGATCACGCCGCAGGTGCTTTCCGGGCTGCTGACGCCGAAGATC
+AACAATCTGCAGAGCCAGCTGAATACGGCGGTGATGACGATCCTGCCGGCGGATGACACC
+GTCAACACCCGGATCAATCTCTTCGCGGTGAACGATGCGACAGGCCTGCCGTTTGTGGCT
+GATGCCAAGGGCATCACACGCCAGCTGGCGACGGTGTCCTGGTCCTCGAACCTTGTCGGC
+CAGGAGGCCACAGCGCGGCAGAGCGCAGATCAGAACCTGCAGAATCAGGTCAATGTGAGG
+ATCCCAAGTAATCCCGGCACGGGGTTTCAGTCCATCACCAACCTGACATTGTCAGCAACG
+GGGCAGCCCATCTTTGTCGGCTCCGGCGGAGGGACGACCCAGGGCATCACCACCTTCAGC
+GATGCGCAGACCAATCAGGTTCTGCAGATCGGCTACCAGTACAAGGGGGATTACCTCTCG
+ATCAATGTCGGTGGCTCGTGGGTCTATGGCGCGACCCAGAGCTGGGTGAACAACCAGATT
+GCTGTCGAGACAAAGCGAGCATCCGGTGTCGAATCGGGTCTGCAAACCCAGCTCAACGGC
+GCTGCGATGACGCTGACGGTGGCCGATGATGGCACCAATCAGCGTGCGGCACTGGTAGCC
+ATCAACAAGGCCTGGAATCTCCCGTTCATCACCTCAGCCCAGAATGTGGGCTATCACCTG
+GTGCGGACCGAGCCGGGTGCGGGGTTTCAGGCGGTCACCAATTTCTCGCTCAATGCCGCG
+GGCCAGCCCATCTTCGTGGGCTCCGGTGGTGGCACGACCCAGGGCATCACAACCTTCAAT
+GATGCGCAGACCAACCAGGTGCTGCAGATCGGTTACCAGTACAAGGGCGACTATCTTTCC
+ATCAACGTGGGCGGATCGTGGGTCTACGGCGCGACGCAGAACTGGGTCACTGGCAACTTC
+GCCGGTCAGCAGGTCGACACGAATACCTTCGGTGTCTCCAAGATCGGGGTGAGCAAGCAG
+GTCGGCGCCGGGATCCAGATGCTGTGGACCTATGGCACGGACGGAGTAGGGCGCTGGTGC
+CCGATTTCCGCACCGGGTAATGGCTTCTATTTCGCCACCAACCTGACGATGGGGGCCGAT
+GGGTCGCTCTATGCCTTGTCCTCGAAAGATGGTGCGACCAACGGCTATGCACCAAGCTCC
+TACGGCACCATCGCCGGGGGCTACTACGTCCGCATCGGAAACATACTGATCCAGGCGTTT
+TCAGCAGGCGTGCTCAGTGCAGGCGATTCGATTGCATTTCCGATTGCCTTTTCAGCCGCG
+CCAGTGGTGTCCACGACCGTCGACAACAACCGGGACGGCGCCAATCGTCCGGTCGCCATC
+AATCCGACGGTCGGGACAGTGACTGCATCGGGTTTCAAGATCAACATCGCCGCCATCTCG
+GGGGCGAACCAGCCGGCAGGTACCGGCCAGGTGTGGGTATTTGCCATGGGGCCTGCATAA
+ATGACTGACAACACCGACGAGACGGCACCGGTGGCCACCGCAGCTGCCGTGGACATGGCG
+ACCGATGCGACATCGAATGTCGAGACGCAATGGCCTGCCCGCTACTACGCCAGCTATGAC
+ACGTCCGCCACCGGGCCCACCGAGGTCTCCGGCTGGTATGACGTGTGGGGCATGTCCAGC
+ACGGCGAATGTGCCTGCGGCTGCGGATATGCTTGCGCTTACGGTCGAGCAATGGGCTGCT
+CGGCTTCCGTATGGGCAGGGCGTGCATGAGGGGGCCATTGTGGCCTACACGCCATCCAGC
+ACCGTCACTCTGGCGGATCAGGCTGGATTCGCCTACCCGGCAGCCGTCGCGACGGTACAG
+AGTGAGTACGGCGTCCTCAACGAGCCAACACCCGATGACTGGGTGACCTATTTGAAGGCG
+CTGAAGGCCATCCGGGACGGCACCGACACCACCAGCACGGCGCTACCGGCTGCACCCGGT
+AGCTGAGCCCTAGCAGGCCACATTTCACCGATTTAGATGCCCGCTGATGCGGGCTTTTTC
+ATGCCTGGAGCTTCTATGCCTTCCACCAGTTTCTTTCATGGCGTCACGACCTCGATCGTG
+ACCAACGGCGTGCGCACCATCTCGGTGCCCAGCTCGTCGATCATCGGCCTCGTCGATACC
+TTCACCCCGGGCGCCGGCGCATCGGCCAGTGCCGATACCCCGACCCTGATCACCTCGCTG
+ACCGATGCGGCGGCGGCCTTCGGCTCGGCGTCCTCGATCTACAAAAGCCTGCAGCAGATC
+TACAACGTCGCCCAGCCGGTGATCGTGGCAGTGGGTGTCAACGCGGCCGCAGGCTCCACC
+ACGAGCACCAGCGGCACGACCACCACCGATGCCAATGCGCTGACCTCGGCGATCATCGGC
+GGCGAAACCACGGCCGGCGCGCGTACCGGCCTGCAGGCGCTGCTGGATGGCCAGTCGGTG
+CTCGGCTACCGGCCGCGCTTGGTCATCGCCCCGGGTCAGTCCGCCAATCAGGCGGTGGCC
+ACCGCGATGGATACCCTGGCCGGGCGCCTGCAGGCCATCGGCATCATCGATGGTCCCAAC
+ACCACTGATGACGATGCCACCGCCTACGCCGCGAACTTCGGCAGCAAGCGACTCTTCATG
+GCCGACCCCTATGTGCAGGTTTATGACACCACGAGCAGCAGCACGGTGGCGCTACCCAGC
+AGCCCGGTGATCGCAGGCATGTTTGCGGCGACCGATGCGCAGTATGGCTACTGGGCCTCG
+CCTTCGAACAAGGTCATTGCCGGCATCACCGGTACCGTGCGGCCGATCGAGTTCCTGGAC
+GGTGATCCGTCCTGCCGTGCGAACCTGCTCAACAACGCCAACATCACCACCATCATCCGC
+GAGAGCGGCTTCCGGGTGTGGGGTAACCGCACCCTGTCCAGCGATCCGCTGTGGCAGTTC
+GTGACCCGGGTCCGCACCGTGGACATGGTCATGGCGGCCGTGTTGGCCGGCACCCGTTGG
+GCGGTCGACCTGGGCATCACCAAGGCCTATGTCCACGAGGTCACCGAGTCGGTCAACGAC
+TTCATGCGTGACCAGAAGGCGCTGGGCGCGGTGATCGATTTCGAAGTCTATCCGGACCCG
+GATCTGAACACGGCGAGCGCGCTGGAGCAGGGCAAGATTTACTGGCGCATCCGCTTCACC
+GACGTGCCGCCGGCAGAAAACCCCAACTTCCTGATCGAGGTCACCGATCAGTGGATCACC
+GAGGTGCTGGACAGCACCACGACCTCGAGCAACTAAGGAGCCGGCATGATTCCGCAGACC
+CTCTTCAACACCAATCTCTTTGTCGCCGGCGTGTCCTTCGCCGGCGATGTGCCGACCCTG
+ACGCTGCCCCAGCTGCAGCTGGCCACCGACGATTACCGCGCCGGCGGCATGGACGGCACC
+ATCGACATGGACATGGGCCTCCAGAAGATGGAGGCCTCCTTCACCACCAATGGCGTGCGC
+GCGGAGTCGCTGAGCCTATTCGGCCTGGCCGACGGCAACGGCTTCTCGGGGACCTTCCGC
+GGCAGCTTCAAGGGGCAGGGCGGCGTGACTACCGCCGTGGTGGCCACCATCCGCGGCACC
+CTGAAAACCATCGACCCGGGTGACTGGTCGGCCGGTACCAAGGCCGAGATCAAGCATACC
+GTCGGCGTGACCTACTACAAGCTGCAGGTCGGCGGCACGGTGATCTACGAGATCGACCCG
+GTGAACGCGATCCGCATCATCAATGGAACCGACCAGCTGGCCAGCATGCGCAGTGACCTG
+GGCCTGTAAGGAGCCGACATGACCACGAAGAACGAAAAGAAGAACCCCTGGCTGGATGTG
+ACCGATTCCGGGGCCGTGATCCGCCTTCGCCGGGTGAGCGAGTGCAATGGCGTCAAGGTC
+GATCGGCTCTCGATGCGGGCCCCGACGGTGAAGGACGTGCGTACGGCACGCAAGGCTGCG
+GGCGAAGATTCGGCCGACCATGAGATGCAGTTGTTTGCCAGTCTGTGCGAGGTCAGCCTC
+AAGGATCTGGAGGGGCTGACGATGGTCGACTATGACCGTCTGCAGGCCGCCTATTTTCGC
+CTGGTGGCGGACGACGGGGCTGTCGCCGGCGACTGTGCATAAGCTCGCTGTGCAGTGTGT
+CCGACAGCTGGGCATCCAGCCGTCGGAAGTCGATCGCATGACGGTCACCGACATGCTCTG
+GTGGCTGCAGGAGTCGTAGGGAAGGACCATGGCCAGGAACATCAATATCGGCCTGGTCAT
+CGGCGGCGCGATCGCGTCGTCCATGGGCCGGGCCTTCGATGACGTGCAGTCGCGTATCGG
+GCGGCTGGAGAAGACCGGGCAGCGGGCCCGCGTGCTGCAGCGGATGATTGGGGAAACCCA
+GGAGCTGCAGCGGGACTATCAGCGTCTGGCCGCCACCGGTTCATCCATGGCGGATAGGGT
+GCAGCGCAAGCTGCACTCCAATCTCGATGCCTTGCGTGATCAGGGTGTGGCCGTGGCCAG
+CCTCGAGGCGGCCTACCGCAAATTGGGCGCGACCGCCCGGCGGGCGGAGTTTCGGGCGGT
+GGGCACCAGCAATTTACAGACGGCTCGTGATGGCCTGGGGCAGACCGTGGCCCAAGGCGT
+GCGCGTAGGCGCGACCGTGGCGGCACCGGCCTACACGGCGGCCAACTTTCAGGCCACGGT
+GCGCGATATCGCCATCAAGGCCGGGATCGCCAATACGGGGCAGGAGAGCCAGGTCGCCCG
+CGGCATCATCGCCAATGGGCAGGCCAACGGCATGGGGCGCGGCCAGATGGCTGACCTGGT
+CAATCAGCTGGTCAGTGCCGGCATGGATCTGAAGCAGGCAATGAGTTACGCGCCGGTGGC
+GGCGAAGTTCTCGGTGGGGCAAGGTGTGTCCGGCGAAGATACCGGCAAGCTGATCTCCGC
+CATCAGCCGCAATGCCAAGATCACCACGCCCGAAGGCATGGCCAAGGCTCTGAGCTCAAT
+CGCCTACCAAGGGCAGGCTGGTAACTTCGAGGCCGAAGACATGGCGCGCTGGTTCCCGGA
+TCTCTTGGCCCAGATGCAGAAGCTGGGGCTGACCGGTCAGGACTCGGTGAACCAGCTGGG
+TGCCATGCTGCAGGTTCAGCGCAACGTCGCCGGCACGTCGGACGAGGCCGGCAACAACCT
+GGTCAACTGGATCAGCAAGATCGGCGCGCAAGAGACGGTCCAGAACTACGCCAAGGCCGG
+CATCGATTATGCCGGCTCCATGCAGATGAACATGACCAAGCATGGCATGTCGGCCCTCGA
+GGCCAGTTTTGGCCTGGCTGAGAAATACATTGAGGCGGTCGATCCGAAGCGTGCGGCGGA
+CATGGCCAAGGGACTGGCCGGTATCGACAAGACCCTGGATCCCGACAAGGTGCGGGCGCA
+GGTGGAAGCGCTGAATCAGCAGATGCGCACGGGGCATATCTTCACCGATCTGCAGGTGAA
+TGCGGCGCTGACCGCCTACCTGCAGGGCCGCAAGCTTTATGGGCAGCTGAAGGCCGACTC
+AGCCAAGGCCGGCGATATCCTGGACAAGAATCTGGCCCAGCGCAGGCAGACCAGCCTGCA
+GATGTGGAAGGAGGCCGGCTATGCCTGGGACAACGCGCTCAACTCCATGGGGCAGGCGAT
+CGAACCGCTGACCGACAAGGTGGCCGGGTTCGCCAAGACGGCGGCGGCTGCGGTGGATAC
+CGTTGCGACCAAGGCGCCCGGGGTTGCAGAAGCCGTGCTTGGCGTTGTGGGCGGTCTGGT
+GGCCCTGAAGGCTGCGGCCGTGGCCTTTACCGCAGTGAAGGGGATCTACCAGATCGGACG
+CTCTGTGACGGGCAAGGGGTGGCAGCCGGAAAATCGCCCGGCAGGCTTGCCCACCGGCTC
+CGGCGGCCCGATGGATCGAGGTGGCGTGGTGCCCGTGCGGGTTATCAACTGGCCCAAGCA
+GTTTGGCCCATCAGATGAGCCGGGTGGAGCCGTGGCAGGGGCTGAAGGTAGCCCTAGTGC
+CGGTAGCCGGATCGGCAAGGCCATCGAGGCTGCCCGCGGAGCGGCGAAGTTTGGTGGCGC
+GCTGGCCCTGATCGACGGCGCCATCAATGCCGGCAGCGTCTTCGCCACTGCCAAAACGCG
+AGATGAGAAGTTCAGCGGCTATGGCGGCGCGGCCGGCGAGACGGTCGGGGCCACGGCGGG
+CGCTGCCGCCGGCGCGGCGCTGGGCTCGATCGTGCCCGTCGCCGGCACAGCCCTTGGCAC
+CATCGCCGGTAGCATCATTGGCGGCTGGGCCGGCAAAACCCTAGGCGAACTGGCCGGCAA
+GCATCTGGCCACGAGTACCGCGGAGCACGCCGATGACAAGTCCTCGGCGGATGCCGACAA
+AGGTGCGGCGAACTTGCCGCCGATCCAGGCGGGGCCGTTCTCGCCCACCATCCAGATCAA
+TATGCAGCAGCCCACCGGTGATCCGCGAGCCTGGGCCGAGCAGGTCTGGCCCATTCTTCA
+ACAGAAGCACGCTGATTACCTGGGCCGACTCCAGCGTGGCCAGCTCTTCGATGCGCCGAT
+GGTGTAACCCATGCCGTATATGCAAAACATGCAGGGGGCGCTGCAGTCCCTGGTCAGCTC
+CGGCGCGGCCGGTCAGCGCAGTCTGGACAGTATGCTGGGTCCGATGAATACCGGTACAGC
+CCAGCTGACCAGCTCGGTGTCCGAGATCAGCAGCCTGCCGTTCCTGTCCTCGGGCGATAG
+CCAGTCGATCCAGCGGGTGACGCGCCGCATCGTCCAGGCCCAGGCCATGGTCGGCAAGGT
+GATGAACACCTATACCCAGGTCAATCGGGTGGCTTCGGGTGTGGCGGCCTCCTATACGGC
+GCTGGGCGGCCAGGTCACGGCGGCCCGTAATGCGGTCAGCAAGATCATCGGCAAGGTCAA
+TCCCTCGCTGGCCAGCGCCATCTCCACATCGATCCTCAACCCCACCACCAGCCATGCCGC
+GGCGGTGAAGCCCTTTCCGCATCTGCTGATCATGCAGCCGGTCGTCTCGGGCGGCACGCC
+GTTCTATTTCAACCTGGACACGGCGGCTTTTGATTCGCTGCAGCGCCAGACCAGCTATGG
+CTGGCAGGGGCAGGAGCGTCTGGGTCGGCGGCCGGCGCAGCAGTTCGTCGGCATGGGCAC
+CGACAAGATCACCTTGTCCGGCGCGATCTATCCGCACTTCAAGGGCGGCCTGACACAGCT
+GGACAGCCTGCGCACCCTGGCCGGTACCGGCAAGCCCTACATCCTCACCACCGGTTACGG
+GCAAGTGCTGGGTACCTGGTGCCTGAGCTCGATCAGCGAACAGCAATCTGCGCTGCTGCA
+CGGCGGTATCCCCCGCAAGCAGGGCTTCACTTTGGAATTTGACCGCTATGGCGACGATCT
+ACAGAACCTGTGACGGCGACCTGCTGGACATGCTGTGCAACCAGCACTATGCCTCGCTGG
+ACGGAACCGTCGAGGCGGTACTGTCCGCCAATCCCGGTCTGGCCAGCCAGGCCCAGCCTT
+ATGCCGCCGGCATCCAGATCATGATGCCCGACATCGCCACGCCTGTTGAGACCGAGGTAC
+AGCTATGGGATTGAGCAACACACCGCTGGCTCGCGTCGAGGTGAATGGCAAGGACATCAC
+CGCCCTGATCACCGACCGGCTACTGATGATCCAGACCATCGACAAGGCCGGCATGGAGGC
+CGACCAGTTCGAGATACGGCTGGATGACCGGGACGGCAAGCTGTCGCTGCCGGCACGTGG
+CGCCGTGCTCAGCATCTACCTGGGCTATGCCGAGCAGAGCGTGGGCCTGGTCGGGCAGTA
+CACGGTCGACGAGATCGAATATGCCGGGCCGCCGGACAGCATTGTCCTGCGAGGCAAGTC
+GGCCAGTATGCTGGGTTCCGGAAAAAGCACTCGATCGGGCAGTTGGGACAATGTCCCGCT
+CGGCCAGATCGTGGCCGACGTGGCCGGCCGCAATGGCTGGACGCCGCTGTGCTCAGTGGC
+CGATGTGGTGGAGCGTGCCGACCAGGTCAAGGAGAGCGACTTCCACTTCATCACCCGCAT
+TGCTCGGCAGCATGGCTGCACCGCCAAGTTGGGGGGCGGCAAGCTGATCGTGGTGCCGCT
+AGGCATGGCCAGCAGCGGCAGCGGCAAGAGCATCTCGGCCATCACGCTGACGCGATCGGA
+CCTGACCCGCTTCCAGTTTCAGCTGGCCGACCGGTCAGCCATGGCCTCGGCCAAGGCCGG
+CTATCTCGATCCGGCCTCTGGCAAGCTTGCCATCGTCGACGTGACCAATCCCAATGTACC
+CGACGGGCTGCCCGGCGTGCATGTGGACCGACACCTGCACCCAAATCGTACAGCGGCCCA
+GCGCGCGGCCAAGGCACGCATCGATGCCTTCAACCAATCCACTGCCCTGGTGCGCCTAGA
+GATGCCGGGGCGCACCGAATTATTTGCCGAGCGCCCCATCAGCATCAACGGCCTGAAGAC
+CGGTATCGATGGCACCTATATTGCGAGCAGCGTGGAGCAGACGCTCACGCGGGCAGGTTG
+GAGCACGACGGTTGAGTGCAATGGTGGGAATGATGGGAAGGCAGCGGCATCTGGCAAGCG
+GAAGTCGGTGCTGAAGGTTATTGATGCTGGTGAGTAA
+>NC_017033.1|provirus_1557694_1600481
+TCACTCCCCCTCCTTGTATTCCGGGGCGGCGGCAAGAAATGTCCTCCAGATCGTTGACGG
+GAAGGCATTCGGGTTCTGCTCATCCAGATAGGCCGCCACGTCCATGGCCTCGGTGAGCTG
+CTCCGGCACCAACTTCCACCCCGGCGGCGCTTTGGTGAGGGCGGCCATGATGCAGGCAAA
+GTTCTCGGGCGTGTATCGGCCGCTGATCACCTCATCCTTGATCAGTCGATGAGATCCAGT
+CGATGCGCAAATATCCCGTGCCATCCTCTCCAGTACAGTCATGGCCATTACTCAACCCTC
+CCTGTTTCGGCAAATTGGGCCAGCATCCGAGATAGACGCCGCGCCTCTTCGCGGCCTACC
+TGCACACTTCTCGTCGGCCTGCAGGTGCTGCTACATACCAGCCAGCATCGGCCGCCGATC
+ATCTGCAGCTCGATCGACTCGGTGCGGTCGTTTTTGAGTCGGATCGCATCGGCCATTACT
+CAATCACCTCGCGCACGTGGATGCATTCGATACATCCGTTATCAGCCCCTTGATCAGCTG
+ACTCCTTGCTATCGCAGATATATATCTCGCCGTCAAAATACAGATTCACCCAAAACTCCC
+GCGGACTCACCTCCTCGCTGATGCGGTATTTATCACTTGCGTGAAGATGGTCATTTTTAC
+CCCACGCGCACCATGAATCAGACATCCAGCACTGAACTTTCTTCCCATTCTTCATTCCCT
+GAGCCGCGGCAATAACGCCATCCCACCCAGTCACGGGCTCGCCCCATTTGATTCGGTCAG
+TCATGCCATGTCCTCATCGGTGATGGTGTGTTCCTGGATGTTTTTGATGGCACCGAACAT
+CGCGGGCGGCAGTTCGGATAGCCAGGAACGCAGATGCTTGACCAGAGATTTGTGGTGCGG
+GTCGAGAAGTCCAGACTCGTAATCGTCTGCCAGAAAACCATGCTTCTCCTTCGCATGGTC
+GGCCATCGAAGAGATGACTTCCCATGAAAGGGTGCTTGCCGACAGGTGTTGGTATGGAGT
+GAACTGGCCAAACCTGATCACCGATCCAGCACTGAGATCGCCACCCGATGCATCTATGGC
+ATCCCCTATGGTGTCGTACAGGAATGCGTCGTCTCCGGGACGCTCCCACTTGATTTGTGG
+ATCACCCATCGTTCTGTTCCTCACATGCATTGCGCGTGGCCCACCCTACGGCTGCAGGTG
+GCATCGGCGCGATGGTGTAGATGGCCCGGATCGTGCCGGCGGCGGCCGGGCGAGCATCGG
+GCGGAAGTGTGTGCAGGCCGGCCAGCACCTGATTCAACATGATGCCGGCAGCGCGGGCCT
+GCTCGGCGGTGGATGCGACCTGGGCGAGTGAGCTGCACCAGGTTGGCGCGGCCGGCGTCG
+GTGTGGCCAGCGCGGCGGTCAGGAGTAGGACCGGGACCATCACCCCACCTCCGGCGCGTC
+AGGGATGGGCATGTAATGGCTGTAGTTGGTTGACACTATTTTGCCATTGGGTGACTTCCA
+GCATTCCTCGATGTCATCCCATCCCGCAATTGCTTTTGGATAGATGGCAGCCAGTGTTAG
+CTGACCTAGAATGACATTTCCAGCGGCCTTTTCTGACCCATCAATCGGCAGCCAGCGCGG
+GGCGTATTTGGCGTGGGCGGCTTTCCATGTCTGCCAGTTCAAATCAACCTCACGGCCCTC
+CAGAGCCATGTACCGCGCATGGTCCTCAAACTCATCTCGCAGTGCGATTACTTTCTGCTC
+AGTGCTCATGCGGCCATGGCCTCCATGTTGTGGGCCGGATCGAGGTTCGCCCGGGCGATG
+GCAGCCAGCGGTGGCGGGCTAACCGAATTTCCGCACATGCGCGTGCTGGCGCTGATGCTG
+AGGCGCCGGCCGTCAGCGGTGCGATCGATGATGTAATCCGCGGGAAACCCCTGGGCCCGG
+TAAAGCTCGGCCGGCTTGAGCATCCGCAGGCCGATATCCACGATGACGTAGGGCGTGCCC
+TTGATGGTTACAGTGACCAGGGCCAGCCGGTCGCGGGTGGTGACGGTGTCGAGCGGGTCG
+CGCAGATTTTCGCCGTGAGCCGTTCCGTAGTATTTGATCAGGAATGCCGCGACGCGCAGA
+GCTCCATCGGTCTGCTGCTGGCTGAGAGTGCATGTCACCAGTCGCTGCTGGCTTCCGCTC
+CCCACGATGGTCGGTGCCGGCTGTCGAAGGTCATTCCCGGCCCCGGTGTAGAAGCCGCCA
+TTGGCCTGCTCGAGAAAAGCAGATACGACACCGAGAGCATGTGCAGCACCTGCCGGTCGG
+GCTGCACCGGCACCGCTGGTGATCGTGGGCACCGGCTCAGTAATCGCAACCCCGGCCCGG
+ACATCGCCTCGGATCTTGATCAGGTGCGCCGATACGGCGGAGAAGTGCCCACCTTTGATG
+CCGCTGACCTGTGTCCGCAGTGGCTCATCAGCTGCAAATACTCGCTGGCTGCTGCCGTTG
+GCATGTTCGGTGAGGAATGCTGCTGCTGGGCCCGGAACAATGAACGGCTCATCTGTATCC
+AGCACGAATTTGTGGATGCCCTTGGCGATGCGCCGGCAGGTGGCATCTGCCAGAGGCCTT
+GCCCGCTCGAATATCGACGGGCAGGGTATCGACCAATCGATGCAGTCGGCGGCGGTGACG
+AGCGGCTGTAGGCCGAGACCGCGGCCATGGGTCTGTGCTGGCCAGACAATGGGCAGCCCA
+TCCCGGCGCGCGATGAGAAAAAGTCGCTCCCGGCTGGTGCCGGCACCGTAGTCGCTAGCG
+ATCAGGAGCCTGTGCTTGACCTGGTATCCCATGCCGCGCAGCTCATGAAGGAAGCGCGCC
+CAGGTCTGACCGGCTCGGCGCTTGTCGGGGACCAGGAATTGCTGGTCGACCGGGACACGC
+TCACCACGGAGGGCGACAGTGCCGTCCAGTTTCACAACGCGTCCGGTCGCCGGATCGCGC
+TTGGCAATCAGCGGACCCCAGCTGCGGATTTGTCGGACGTTCTCCAGCGAAATGATCCGC
+GGCGCACGCCCGGCACGCGCCAGGGCTCCGGCCCACTTCAGCACAACCCACGATAGCGAC
+CGGGTGGCCCGGCTTCGCGGTTGGCCGCCCTTTGCCTGGCTGAAATGGGTGCAGTCCGGG
+CTGGCATGGAACCAGCCGACCGGGCGGCCGGCGACTTCTCGCACTGGATCGGTCTGCCAG
+ACATCCTCGCGGTGATGAACGGTAAACGGGTGGTTTGCAGCATGCATGCCGATGGCGTCG
+GCATCATGGTTGATGGCGATATCCGGATCCCGCCCCAGCGCCTGCCGCAGGGCCTCACTG
+GCTCCGCCACCGCCGGCAAACAGGTCCACGATGATTTCTCCCGGGTGTAAGCGGCTGAGT
+CCGGAGGTGCGCGGGAAGTTGAAAGTAGGCTGTGCGCTCACGCCACCTCCCTCCGCTCAA
+CCCTGGCCCGAGGCTTCGGAGGAACCCGAATAAACCCCATCCAATGCTCCAGATCTGCCA
+TTGCCACGGCGAAGATGGAATGCTCTGGATGGCACTCGCCAGTGCCCGACGCATTACCCT
+GGTAGACCCCGACAAGTCGGCTGGAGTGCGTGACCAGAAACCCGTCATATCCGGCCTCGT
+GGTGCGTGACGAACGCAACGCCGCCGGTCTCGCCGATGTACACCGCGATCCGACCATGCT
+CCAGCGCGTTCTCGCTGATCTCTTTCGCTATGGCATCACTGCCACGGCTGATGTTTCCGA
+GTGATTTCATGCTTCGTCCTCAGGAGGCCATTTTCTCGGCCACTGTTTCGGGCAGATCCG
+GGAAGGTGCCCCACGGTTTGGAAAACTCAGGGGCCCATGGTGAATCGTGGCCGCAGGCCA
+TCTTTCCGCAGCGCATACGTGGCTCGCCGTCTCGGACAAGCACTCGCATACGGCCGGATC
+GCCAGTCGAACCAGCCGTCGAGCGGCTGGAACATGTCGATGGTTGGAAGGGAGTTGTCGG
+CGGCCATGGTCAGGCCGCCTTACGCTCGGTGAGGCCGAGGCCGACATCCTTGATCCGAGC
+CATCATGGCCCGCAGCATGTCGAGCACCTGGTCCTCGCGGTACAGCTTGGCTGCACGATC
+GGTGCCGGCCGGGTTGAACCCGAGCTGGGCCAGTCCGTCTGCAGTGATCGAAAGCGGTGC
+GATCAAGGCGCTGATGTCGCCCAGCTTGATGGTCTTGGCAGGGCCTGCCGGTTGGGCGAC
+TTTTTCGGCCTTGGCTGGGATCTCGTCCGTTGATGCCGCAAAGTGGCTCTGCGCCTGAGG
+TGCGGACTGGACGACTTTTGCAGATGCCGGCGGAGTCTCGTCCACCACCTTGGCCGCATC
+CTGCTCGCGGGACAGCTTCTCGGCTTCTTCCTTGCGGATCTGCTCGCGCTGCCGCTCCAG
+TCGCTCAGTCTCCTGCCGTTCGAACTCGCCGATACGAGCCGCGACCAAGTTGCGGAGATC
+TTCAGGCGACTTGGTTTGTGCCAGCATCACCCGATCGGCAAACAGTGACTGGTGCTGATG
+TTGATTTTTCAGGATGCTGACGTTGGCGCGGATGGTCTCGGCCCGCTGGCTCGCAGCGAT
+CTTGATGTCGGCCACGGCCGTACTGACTGCGTCCCGCATGCTGCTGATCGATCGCTTGCC
+TTTGATCGATGCGCCGATGCCCGCCAGGGTGGCCTGGTCCGGCCGCGGCGCAAATTCACC
+GAGGCTCACAACCAACTGCTCGTAGTGGGCCCTGGCTGCACGGATGCCGGCGTCGACGAT
+CTCCTGTCGGATGCTGATGTCGCGAGCCTTGACGCATTTTTCCAGATCAAGACGGATACG
+GCGGGCCTCTTCCTTCAGCTCATCCATCGCCCGGAAAACCGCCTCGACCGGCGCGGCATC
+GGCGAGCGCTGCAGACTTCACCGATTCCAGACGGTCTTCCACGCCCTTCGCCCAGGTGAT
+CGTCTTCCTGGCATCGGCGAAATCTTCATCAGTCTGCAGATCCCGGTTGATACCGCCGAA
+CACAGCCATGGCATGAGTCTTGAACGCATCCAGATTCGATGCGGTGACCATGCCGCTGAC
+AGCCACATGCAGGGCAGGGAGCTGATCCGGAGCCTTGCCGACCGGCGCCGGCGCCACTTC
+CTGCTCCGGCTGATAAGCGGAAATGTCCTGCTCGAGCTGGGCCCAGCCGGCAACAATGCG
+CGCACGCAGTGCGGGATCTGAGAGATACCAGCAACCACGGCTATCGGACTGGATGTCTCC
+ATCCCATGATGTCGCCATAAACAGAGCCCTGTCTGCGCCGGATACCATCATCTGCTGCTC
+TAGCTGGGCGCAGTAGATCTCCGGAAGCACGACCTCATCGCCATGAAGCGGGATATGGCC
+ATCAGCGACATGCTTGCGCGGAATCGCTGATCGCAATGCCATGTTGAGCGTTTTGTGCTC
+CCAGATGGCATCTTCCATCATCGTCAGGCCGTCGAAGCTGGCTGAAAGACGGCCCTCGGT
+GCCGACGCAGGGGAACAGATCTTCGCCAATGACTTGTTCGGCCAGAGGCCTGCACAGCGC
+CTCAATGCGATGGCCTTCATCAAAGATGCGTTGCAACTGCGGGGTAATCTCGCGCTCGAT
+ACCAGTAGCCAAGCGCTTGATCAGCTCGCTGCGCGACTCATAGGGCGACAGTCCGAGCAT
+GGCTGGTGCATCACTGGCATTGAAATGCGCAGAGCGGTGGGCATGCCATTCCGGCGTGCC
+CTGGGTGAGCTTTACGATCTTCATTCGACTACCTCCACCTCGGTGGTTTCGAGGTCACGG
+ATGGCGCCCAGCTGACCGGGCGTCAGGGTGTATTTGGTATGGACCATGGCGATGATCTCG
+TCGGCAGTTTTGCGACCACTCTGGATGCGCTCGGACCAGGTGCCAAAGTTCTTGTTGAAC
+TCGTCATCCGAGTAGGGCGGAAGCTCCTGTGCAATCCGCTCAGCCCGCTGCGTGGCGCTA
+TCGGCCTGCGATACCGTGATCCGCTCTGCCTCATCGTGGTCATAGATCCCAACGAATCCG
+AAAGCGATACGCGAGCACTGGATCATGGCCTTGTGGCGTAGCATCCGGCGCGGGTGGGAC
+TGCCAGGGGCCTGCGTTGTTTCGCTTGCACTCGGCCATCCACTCGGTGACGCGAATCGGG
+TGCGATCGATCCTTGCGGTAGATGATGCAGGTGCAGCTCTGGTCATCCTGTTCAAAGTTG
+ATGCCATCGAACTGGGCGTGACCGTTGATGATCCGCGACCATCCATCGACGCCAACCACC
+GGAACGATGCCGCCCTTGTCCGGGAAGGCATAGATCTCTTTCGTCCAGGGATTGAGGCCG
+TACTGGTTGGCAACCATGAGAAGGGCCGCCATCTGCTCGTCGGTCACGTTGCCCTTGAAC
+GCGGTGGACTTGAGCGTTTCGACCAGATCCTTGGAATCAACATTCAGCAGGCCGAGATTC
+TTGGCCAGGCCATCGACCTGGGTGGTGACGAGTGCGGACATAACAACTCCTGCCGGCCTG
+CGCCAGCACAATCAAAAGGGAAGGGGATTTGAATTAGTGGAAGCCGCGGGGCGGCTCTTG
+GTAATTTCGTTCGGCTCGTCCGTAAGCCCATGACCAAAGCAGCGCTTCGATCTCTCGCCA
+GTCCTTGGTGGCCACAGCCTTGGCCATGGCCTCACAGTCGTTGGGGCGGTCGAGTAGGGT
+GGCGAGAAACTCCTCGGCCACCTCAGGATCTGCTACGGACCGGATTGCTTCGCGCTCGAT
+GATCGATTCACGATCAGCTGCAGCATCGCCGGCGTGGTCGCATTGCCAGCCGGGAGGATC
+GGGGAGGTATAGGGTCATTCCTCCACCCCGTCATAATCGTCATCGACTTCCATCCAAGCC
+GAGTCGTCCTCGGCCTGGTTATCTGGATTTCCGGGATGGGTGCAGCTACCGCATGGCGGG
+GTCAAGTGGCACGAGCAATTGCCCCCGTCAAATTCGGAATCAAAATCGGCTCGCTCGGCT
+TCAGCCTCAGGCGTCAGTACACGCTTCATGCCGCCATCTCCTGCCTCGACCCAGCATCAT
+GCGCATCAGCCATCTCCGTCAGGCCTGCGATCAACTCGCGGATGCTACTCATCGGAATGC
+ATATGGACACAGCCATGTCGCAAGTGGTCCGATCAAACACAATCGCAGCCCGGCTAAATG
+CCGTCTCACCCCGGTAATGGATGTAGGTGGTCAAATTGCTCTCGCTGCCTATGACCTTCA
+TGCCACACCCCCGGCGATCAGTGGCCACTTCGGATGGATGGCCAGCATCAGGCCAAGGTC
+CGTCTGATTGAACCGGCCGAACCAGCGGCAGGCCGCCTTGCAGCGCTTCGTGTTGGATTT
+CATGACTTTCTCCAGGCACAAAAAAAGCCGGATGGCCGGCTGTTGGTTGATTAGATTTCG
+ACGGGCCTGCCGTCTTTCAGTGAGTACCAGACATTCGGCTTGATGCCATCCTTGCCGACA
+ACGCCTGCCCATACGTCGATGATTTCGTGGTCCTCGTTGCGCTCAACGAGGAATAGGGCA
+TTTCCGTCTGTGCCCATGACTTTCCCCTCATAACCCGAGGCCATGGCTGCTCCCCAGTCG
+CCGGTCGAGCTGGCTGCGCCCCAGTCGCCGGTCGAGCTGGCTGCGCCGTAGTCGCCGGTC
+GAGCTGGCTGCGCCGTAGTCGCCGGTCGAGCTGGCTGCGCCCCGGTTGCCGGTCGAGCTG
+GCTGCGCCCCGGTTGCCGGTCGAGCTGGCTGCGCCGTAGTCGCCGGTCGAGCTGGCTGCG
+CCGTAGTCGCCGGTCGAGCTGGCTGCGCCCTGGTAGCCGGTCGAGCTGGCTGCGCCGTAG
+TCGCCGGTCGAGCTGGCTGCGCCCCAGTCGCCGGTCGAGCTGGCTGCGCCGCGCTCATCC
+TTGGACTGATCGCCATCCGCTTTCTTTGCCCGACTGAACGTAAAATCGATGGCCGCCTTG
+ATGATGCCCGGCAATCCGATTTCAGCCTTGATTCCAATCTTCTCGCAGGCCAGCTTGTCG
+CTTTCCCGATCCACCTTCCCGGATGCCTCGATTACTGCGAAGCGTGCACCTGCGGGCGGG
+TAGTATCCAAACACATCGAGCGGATACTCGCAGCAGTGGAAGCCTTCGTTGCAGGCCTTC
+ACCTCGCCTTCGTGGACATACTCCTTGCCGACCTCATACTGAAAATCTCGGCACTTGAGA
+TCCTTGTCAAAGCCCTTGTAAGCCACGATCACTTCGTTTGCCATGAACTTTCCTCAAAAA
+AAAGCCAGCTCATGGCCGGCTTGAAAGTGGTAGATACGGCATGTGCCGCACCGATAGAGA
+ATGAGTGGCTGGGTATTGCGCCGGCCTCGCACGGCTCAACGCCATCCAGTGGCGGGGTAT
+TGCCGGCCTATCAGTGGCCGGGTCTTAAATCAAATCGACTTACCGCCAGGCAGCGCCCGA
+TTTGCAGGCAGATGATCGGCCCGCGTGGCGTTGTAGCGAATCTTCTCCATGGCCGCGCCG
+AACACGTCGAGGTGAAGGGCCCCAGCCAGATCGAGGATCCGGATCACCGCATCGGCCATC
+TCGACTTCCATACCCTTGCGCTCAGGCAGATGGTCGTCCATCAGATCCTTGCGGAACGCC
+TCCAGCGCCTCGCTGACTTCGGAATGCACAAGGGCCAGCTTGCCGGCGATGAAGTGCTTC
+CTTGCATCGGGATCGCGCCACGCCAAACTGTTCCACCAGCCGCCATCGACGGCCGCGCCG
+TGGCATAGCGACTGAAATGCCTGCAGAGACGACAGGCTCAAGCTGTGTGCTTGCATATTT
+GCGCTCCTCTGCGCGTTGAATTGTGATGGGGTCTGTCGGCCCGCTACGGCCACATTTTTC
+ACCAACAAGGAAGTCCGAGTGTTCAGCGCCTCGGTCAGCGCAACCTCAAATCCCATCACA
+ATGGCCCCTGCTACCAAGGGCCAAAGTCTCTGCCGATCCGTCACTTGGCTGAACATCCCT
+CAGATGCTTTGACCCGCCGTGACCGGCAGCTATTCGGTTGTGGAAGATCCCAGGCCGTGG
+GTCAGCGTTTCGCTGCGGCGCGGGTTGACTATACGAAACGCATACCAACGAGGCAATGCG
+AAACGCATAATTTATGGATGCGAATCGCATACTGTTCAGCGTCCATTTATCTAAATCTCA
+CCCCGTGAGACGCGCACAGGCCATCATTTCCCCACCAGGAGGAAACATGGCCAAAGAGAC
+GATTTACGTGGTGCAGACGTGGGTGGCGGGGAAACGCGGGCAGTTGATCGCCGATCCGCC
+GATACCGATGACGGCAGAGGATGCGGCTGTGCGCCGGGCCTACAGGCTGGAGGAGGATAA
+GGCCGCGGTCATGGTCTTTGCTCAGACGGCGGACTCAGAGACGGGCGACTATGATGATCC
+AAGGATCATCCTGCGGCTGGGGGAGGAGGTGGAGATGGGGTAGGGCATGAAAAACCCCGC
+CGGAGCGGGGTTAGTGATTTATCTTGGCCTGTACCGCGGGCTGCATGCCCGTTGTTGGCT
+GAGCGTATGCTGGAACTTGAATGATGATGGGGGCAGCTTGGGTCGCTGAGAGCGTCGATG
+GCGGCTTCCACAGGGTATTCATAGCAACCACCACTGCGACGAGTGTGCCAATGATTGTTA
+GCACCGTCGCAAGCATCCACCCCTTGATATCACTGCGCACACCTTCGATGTCTGCCTTGG
+TGGCCAAGGTAGGCAAGATGGTGTCTAGCCGTGTTTCAAGGGTGGTAAGGCGCTGTTCCA
+TACCTCCATCATGTGTTCCACCACCGCCATTTGCAAGTGCTGGGCCAATAGCTGCCGCTT
+GCAGCGGATCCATGGCGCCAGGAAGGTAAGTTACCTTAGGCATCGTCGGCGGCCTTCTTT
+TCTGGGTTTCTCCTTACCCACTGCGACACGACGAATAGGTCATGGCTCCTGATATATCCG
+CAATTACCACATCCAAGAGATATTATTGCCCTTCCTGCTACGCTCCCACCCAGTCGCTCT
+ACCATCCCACTATCTGGTCTTGGATTTTCTGCGAAAGGGATCATTGTGAATAGCCCAAAT
+CTATTTTCTGTTCCGATATAGAACCATGCTGACTCGCCGCAGCACGAGCAATTAGGGCTT
+AATGTTTTTTCTCCAAGAAATCTTCTGAAATCTTCCTCAGTTACAGATGTAACTGGCGGT
+GATAGTATTCTCGATTTACCATCGTTCATTCATTTGCCTTGACTGAGTTGCAATATATAA
+GTGAAATATCGATTCTTTTTTTGGATTGCACACCTCACTCCGCCAGCATCAGGCACTCGG
+ACCAGCGATTCACTTCGGTACAGCCTTTAATAGGGGCTTTAGGCTGTTTGCATTGGCCTT
+ACCCCAGGCTATCAGTGCGGCCTGCAGGCGGTCAGACATGTTGTTCATGTCTGCGATGCA
+TGACTTATCGTCTCCATGTCGACATAACGTGTTCTTCGGCTCTAGCTCGTCAAACTGGAT
+AGCCATTTCAGTTTGGATGATTCTTTCCAAGTTGATTGGTCCATGAAGGAAGGCGTCCAT
+TGCGATCTTTGCAAGTTCAGTAATCACTTCATCTTGCTGGACACAGGACCCCATCTCGAC
+GAACTCGACGCCCTTGCCGTGAACGATGCAAGCCATATCGATGCGGTCACCCGGTTTTGC
+CATCTCAAGGAACTTCGAGTCTCGGACGCTAATATATGCAGTTACCATCTGCATTTTAAT
+GATAAAATCATCATCACTAAATTTTTCAGCTCCTCCAAAGTATCCATTCACAAAAGTGTA
+CTTGTTTCGGTACTTGGCATCAGCGCCAATTGGATTCTGCATAAATTCAGTGGCGATAGT
+TAAATCGCGCGTGCTAGGAATGACTAGTTTTCGCCATAGTTCGGCATGTTCGCTTTTGCC
+ACCATGGACAAAAGTCAGAAGATCGTTAGAGAAAAAAATCCTTAAGAAGCGCTGCTGTAC
+TGCGTCTGGATGTATGGCCTCATCAATAGTCGCCGACCGTGCATTGGAAATAGTTGCAAA
+AAAGGCAAGCGCTGAAATAAATACAAGCGCGACGAGCCTCATCAGAGCTCGCCTATCACA
+CGCGCCTTGATCGTCTCGTACTCCGAGTCGCTGATCAGACCCTGGTCGAGCATCTCCTTG
+GCGTTCTTTAGTCGTGCCGCGGGATCGGGATCGGTCGCCGGTTGGCTTGATCCAAATCCA
+CCCTGAAATCCACCAGATTTCGCCCGCATCTCTTCCAGCTCACGATGCCGGCGCTTCTCG
+CGCCAGGACTGCTCCTGAGCCTGGGCCATTCGGTAAACCTCTTGGGCCTCAGCCTTCCTC
+AGCCCATCGATGCGGTATGTGACCACAACACCGCCGCTTGCCAGATCGGGCTGAGTGAGA
+TGCCGGATGATGACTGAGCTGCTGAAAATTCCGACCCGGATATTGGCATCTTTCACGTCC
+TGCCAGCGGATGTCAGTTGGCGTAAAGCCACCGAAAAGCCCGCGCGTCATACCGATAATA
+CGACCAGTGGTCGCTGCCAAAAGAGCTCTTCGATGGGTGATCGCAAATATGCGCCTCTGG
+ACAGTAGATGCCCTTACGGACTCACCCGGGACCAGCATGGATGTGATGTACGAGAAGGCC
+TTGGCCGGTACGCCCTCAAGGCCAAGGGTAGAGTCTGTGCGCATTACCTTTCCCCAATAA
+GCGGCCGGTCTAGGGCCGCATGCTCCTGATCATTGCCAGAATCGCCTGCTGCTGGGCTTC
+AGATAGGCCTCTCATTTCACGTGCTACAGATGCCGCAATTGGCTCCTCTACGAGCTCTGC
+ATTGCCTGCCATAGCATCCAAATCGGTCTCCAGCACATCCAGGAGCGCCCTCAGTTCGTC
+CACTTTCCACCTCGATCCGCGACTGCCATTGAACCATGCGGCCACCGTCTGATACGCAAC
+AGCGATACCGCGAGTGTTGAGCGCGTCCGTGATCTGCTCGATTGAAAGATTTAGGGCTTC
+CCGCCGAGCGCGGAGATTAGCAATGAACTGACTCAAATCCTGAGACTCCATATGGATGTT
+GTCAGGGTATCGCGAGCACTTGCGCGCAAAGTATGCGAATCGTATAGTTGCAACATATGC
+GAAACGAATACCTGCCCATGACCGAAAAAGAAGAGCTTTCCGCTTACGTCCGTGATGCGG
+GCGGCATCTCGTCTGCTGCGCGCAAGCTTGATATTCCATACCAGACACTCGCCGCGGTGA
+TGAATGGCAATCGAGGCATCGGACGGTCCCTGGCCAGCCGAATGGAAAAGGGTTCTGGTG
+GCGTCCTGAAGGCTTCGCGCCTTATTTGGATTGCCGCTGAGAAAAAGGAGGCTGCATGAA
+CGCCTCTCAGCGTCAGGTCTTGTCCTCAGTCCTCCGGCTCGCCGCCGGCCTCAATCCTCC
+TCAACAGGATTGTCCTTCTCCCACTGAATGCGCTCATCGAGGATCGCGGTGTACTCGCCG
+GTCATCTCGGTCACGAGATCAGAAATCCCGCGTGGAATTTGTCCGCACGAAGCAGCGATC
+GATGCAGTGGCAACAGCTTCAGACAAGCACTCATCAATCCGACGCCGGCAGTGCGGGGCG
+TCGCACGTATCCATCATCAGGGCCTTGATCACCGCGTCTTGCGCGAGTGACCGCGCATAG
+AGATCAAGAACCAACCTCTCCAGATTCAGCTTGGTATCCGACATGTACGAGAACCCTACT
+CATATCCGCGACAAAATCATCAAGGTTCGCCTGAACGCCGACGAGCGCAATCTCGTCGAC
+GCATTGGCCCGCATCAACAAGACCCAGCCCTCGGTCTTCCTGAGGGACCTGGTGATCCAG
+GGTCTTGCTGTCGTGACGAAGGATACCCCCAAGCAGAGCGCCGCCTGAAGGACCCTAAAT
+AGGCCCTCAGGAGGGCCCTCTAAATGACAGAAGACCTTCCCATCGACCTGACGCCTGCAC
+AGGCGGACAGGATCTCAGCGTTTGCGAAAGAACAGGGCCTGACCGTCGAACAGGCCGTTA
+CCAAGCTGGCCCGTGAAGCGATCAATGAGCGCTACGTGCTGCCCAAGAACCGGGGATCAG
+TTTTGCCCATAAGGGCCCTCAAAAGGGCCCCAAGAGGTCCCTCTCATGACTGATCGAGTC
+ATCCATACGCCTGCATCTCGCGCCACCGATCCTGTGTCGTCGCACGACGCAGAGATGCGC
+GTCACGCGCTCCGGCTCCAGGCACTCCAACCGCCTCGCTGTCGTCGAGGCTGTTCGCCGC
+TACAACGACGACATGACGTCTGCCGAGATTGCCCTGGCTGCGGGCCTTGATTACCACGAG
+GCTGCGCGCCGGCTGCCCGAGTGCGTGACAGCCGGCGATCTGAAGAAGGGTCCCATGCGC
+GTCTGTTCAGTGCGCGGGACTCTGGTCTGCTCGTGGGTGATGGCATGAGCATCGAGATGA
+TGAATGAGGTCAAGCCTCTAAAGATTGGCCCCACGCGAAAGGCCGTCATGATCTGGCTGG
+CCAACTGCGCCAATCATGACCGGAAATGCTGGCCCAAAATGAGCGACCTGGAGGATTGGA
+CGAACTACGGTCGGACGGCAATCATTGAGGCGATCAAGTCCCTCGAAAAAGACGGCTATT
+TGACCGTGGATCGATCGGGGCGGAACAACGTTTACACCATGAATCAGGTCCGCCAGACGG
+ACCAGTCCGTCTCCCGGACCAGTCCGTCTCCCGGACCTCAGAAGTCCGTCTCCCGGACCT
+CAGGAGTCCGCCAGGCGGACCCTAACAGTAATAAAACCAAAATAACAAACGAAGAGGAGA
+GAGTCGGGCGCATCCAGGCGACCTCGATCTCCTGTCCCGACGGCATCAGCGACGACCACT
+GGTCGATGTGGATCGCCCAGCTTCAGAGCGACGGCAAGGAATCAATCTCCCGCCTGCAGG
+CCGCCAAGCTCCAGGTCCTTCGCATCGTCCGTGATGGGGGCGACGCCGAGGCAGTCATCG
+AGGCCGCCGTGCTCCGCGGCTGGCGCGACCTGCAGGACATCCACGCCGAGATGAAAGCCA
+GGGCATCGGCCCGCAAAAACAATCACCAATCCAGCGCCGGCGATACGGCCGGTGGATCCA
+GCACCCGCACCGGAGTCAACTACCGTGGAAACCGCACATCAGGCCGCAAGCTCAGCGCTG
+TTGAACAGGTCGAGGCAGCCATTGCAGAAAACGAACGAGCACGAGCGGACGCTGCAGGCG
+CAGCATGCATCGCAGCCGAAGGCGCCGCAGACCATGGTCAATGCTTTTTGGGCGCGGATG
+GCGACGATGTTCGGGCATAGCTGGGTGAGCCAGTACGGCGCGAATCCTGCCGGGTTGGCG
+GGAGATACCTGGGGCACCGTTCTTGCTGGCCTGACTGGCGAGCAGATCGCCCAGGGCATG
+CGGGAGACGCTGGCACTGGGTTCCGATTGGCCGCCGAGCGCTCCGCGGTTCCGCGCCATG
+TGCATCGGCATCCCGTCGCTGGCCGCCACGCAGCACGCGATGCGTACCGGTGCCACCGAC
+CCGTTTACCCGGCAGGCCTGGACCTACATCGACTCGTTCCAGTTCCGCTCGGCCGATGCT
+GATCAGGCCGCTCGCATGATGCGTGACGCCCACGAGCTGACGGTGCGATTTGTGATGGAC
+GGCGGTGAGCTGCCCGCCGAGCCCGTCGCGGCGATTGCTGTAGACCCGGCGCCCGAGCAT
+GTGCCGGCCAGTCCGGATTTTGCACGGCAGAGGATCGAGGAGATCCAGCGTCAGCTGGGT
+GCGGGAGAGGTGGCATGATCGAGCGCATCTCCGACACGAACGATATGTCCAGCGCAGCTG
+AGGAAATGGCCCGGATCGCTGCAGCTCAGTTCCGTAAGCCCGAAGGTCCCGCAGCCACCG
+GCGAATGCCTCAACTGCGGCGAATCACTGCCGGATGGCCTGCGCTGGTGCGACACCGATT
+GCCGGCACGATTACGAGCGTCGGGAGGCGATGTCCGCATGAATATGGACGTTCTCATCTA
+CCGGATTCTGGCAGAAATGGGTCCGATGACGATCAGTCAGATATCGACGGAACTGTCCTG
+CAGCAACCGCAGTGTTCGCCAGCCTCTGGACCTTCTGGTTAATTCGGGGAAAGTATCGGC
+TACCCACTCGGTGAAGGGCGGATCTTACTGCGTCACCTATGAGGCCGTCGCATGACTGCC
+TTCGCCTGCGCCCATCACATCGCCCGCATCGGCCGGCTGCCCAGCGCCCAATGGCGTGCC
+GAGGTCAACCAGCTCCCCGCCGACTGCGGTCGCAACGATTGCACCACCCGGAACTGCCAG
+CGCGAAGTCCAATCGCGCCTTGAGATGCAGTGGAAGATCCGCCGAGCCAAGAGGAAAGCA
+GCATGACCCAGACATTCACCCTCAACGCCGGCGGGGTAGAGCGCGCCGATGTGATGGCCA
+GCGCTGTGCGGTTCATTGCCGGATTACCTGGATCCAAGAGCTGGAAGGTCGAGATCAAGG
+AGTCCCGCAAGGGCCGCACCCTCGACCAGAACGCAGCCCTGTGGGCCGTGGCCTATCCGC
+CGCTGCGCGAGGCCACCGGCCACAGTGTCGAGGATCTTCACGAGTATTTCTGCGGTGAGT
+ATTTCGGATGGACCGAGTACGAGGTGATGGGAAATCCCCGCAGCCGGCCGATCCGGACCA
+CGACGACCGGCGAGGATGGTAAGCGAGACCTGATCGACGCCCGGACTTTCAGTGACTTCT
+ACGCCACTGTGCAGCGCATTGCTGCCGGCATGGGAGTGATCATTCCGGATCCCGATCCGT
+TCCATGGGGACGCCGGGAGGTGGGCGGCATGAAGGTTTGTCCGATCAAGCCACGGATTGC
+CGCAATCTTTGGTCAGTGGATCTGTTTTTCTGACGACTGCGGAGGGCGAGGCTTAACGCC
+AAGGGATGCGTACATCGCGTGGTTTTTGAACTGGTCTCAAGGCGGCCAGAGGGCATTTCG
+ATGAGCGCACCCAAGATGACCAAAGCCCGCAAGCTGGCCAAGGGGCAGCCGTGCATGATC
+CGCATCCCCGGCATTTGCAATGGCAACCCTGAGACGACGGTGCTGGCTCACTACCGGCTT
+GCCGGCTATAGCGGCACCGGAATGAAGCCGCCGGACGAAATGGGGGCATGGGCCTGCTCG
+GCGTGTCATGACGTGGTGGATGGGCGGGTTCGACCAAAGTACTCATGGATTTCTGGTGGT
+GATGGCAGCCTCCTTTCCAGTGATCGATTCTCCAGTGGTGCGATCAAGCTCATGCATGCG
+GAGGGCGTCATGCGCACCCAACAGGCGATCAGGGAGATGGGCCGATGAGGGCGATCATGC
+TGCATATCGGGCTGGGCCTTGCGATGTTCGCGGCCATGCTCCCGGGCCATCCGGCGCTCA
+AGAGCATCTACCGGGCAGCGGCAGAACGGACGGAGGAGCAGATCCGGGCAGAGCAGAAGC
+GGGCCCGAAAGCTCGCACGGCCGGCGTGGAGGCAGTGATGGTCATGATGCCCATCAAGAC
+TGTATCGGTCCTCAACGGATCGCAGGGCAACTGGCGGCCGGCTGCCGCACGCCGACGCCG
+GCAGCGGTCGGATGCATTCGTGCTGTGCCCGCGGGCCAGCCTCCCATGCACCGTGACCAT
+GACGCGGCTATCGGCCGGCACGCTGGATGACGACAACCTGCGCAGTGCCCTGAAATCAGT
+CCGGGATGGCATTGCCGACCGGCTGGGAATTGATGATCGGGATCCGCGCGTGAGCTGGGC
+CTATGCCCAGGCGAAGTGCCCGCGGGGGAAATTCGGTGTTCGCGTTGAATTTGAATCAAA
+ACAGGGGATCTGACCATGGCGCATATCGGCAAACTACTGGGGCGGCTGAACCCCAAGACG
+CAGACCTTCACCGATGCCTCCGGCGGCGTTCCCGAACTCACCCCGCAGGATATCGCCGGG
+GCGCTGGCGTTCGTGCCGTCAGGCCTCGGTCGCGAGCTGCTGTGCCACGTCTGGTGGCCT
+GGAGGTGCTGAGCGCACCAGGGCGCAACTGGATGCGGCGATCATGGAGTTGCTGGCAAAA
+GAGTGGCGCCGCCGTGAGGACGCACAGCTGGACGCCATGCTGATGGTCGCAACACCCGAT
+GTTGGCCGCCGCCGGGCGCAGGATGCCTTTGCCCAGGCCCACAAGGAGCGCTGGCCGAGC
+TGGGGGAAGATGGAGCAGGGCATTCTGCAGCCGTCAGAGGTCTACGTGCGGATCAGGGAC
+GCCGTGCTTATGGAGCTGCGTGCAGGCTATTTTGGTGATGCTGACTCAGGCGCAGGCCGC
+GCATGGAGTGACCGTGATCGGGCTGAGATGATCGAGCGCTCGAATGTCACTTACAGCACC
+AACGGATGGAAGCGAGTCTACGAGTGGCTGCTTGATCACTGCGCGAATGAGGTCGGCATT
+GCTCAGAGACGATTCGGACGTGCAGCCGCTTAGACTGTTAGTGTGAAGCACTAACAGTTT
+TTGGGGTAAATTCCCTATCGTGACGAAAGCCCCGCCGGGCACTGGCGGGGCTTTGACTTC
+ATTAATCAGCTGTTGCGAAGATGGTTGAAGAGATCAAGTATTTCCCTTACTGATGATGCA
+GTGATGATGTTGTCCATGTCTAGATCATGAGGTGACGGGCCAATGACTGATTCGCCCTTG
+ATGTTCCACGAGCATCCCGTGTCGACTGCCTCGATATCTATCGACCCCGAGAATGTCTCG
+TCTTTGCTCGATGGGTTGTAGCCGTCAATGGTTCCGAACTTTCCAGATACGGTTCTGATG
+GGCATTTCAAATATCTTCACATAAGTCATTTTCACAATCTCTTTGATTTTCAAACGAAAT
+GAGCTTCGGATTCAGCCGTAGCTGTATTTATTGTAGCTAATCGGTGCTTTATGCCTCTTC
+CCCTGCCAATCGAGCCGCAGGTGGCACTGGCATCTGTCATCGACCCAGCCCTTGAACAGC
+TTCCCCGTGCCCTTGATAGCGATCAGGCCGCCGTTCTGCTGCTGGCGATTGCCATCCAAG
+AGTCGGGCCTGCGTACCCGTCAGCAATATGGCGGACCTGCACATGGCCTGTTCCAGTTCG
+AGACGGGCGGATGCAGCGCAGTACTGGGAAGCCCGCTCAGTCGGCCGCTGCTGTTGCCAG
+TCCTCACGCAGCATGGCGTGTCGGCCACTCCTCAGGCGATCTATCAGGCGCTGCTGACGG
+ACGACATCCTTGCCGCCAAGGTTGCGCGTTTGCTGCTGTGGACTGATCGCCGCGTATTGC
+CGGCCCTCGGCGACATCGAGGGCGCCTGGAAGTACTACTACCGCAACTGGCGGCCCGGCG
+GCCCACGGCCTGACCACTGGCAGGTCAATTACCGAATAGCGCTCACAGCGCTTGGGAATC
+ACACATGTCACTGAGCATCTTCGCATCCATCGGCGTGCGGGCATCTGCTGTCGTCGCTGG
+TTTTGCGGGGAGCGTGGTGCATATCGCAGTCACCGAGCAGATGACCCGGGCCCGTGCTTT
+GGCGGCCATTGTTGCCGGCACCGGCTGTGCCGCCTATCTGCCCGACTACCTGGTGCTGCA
+CTACCAGCTGCCGGCGCCCATGACCAACTCAATCGCGTTCGTCTGCGGCCTCTGCGGGCT
+ATCGGTCGCACTCCGGGTGCAGGCGATGATCACCAGCGCATTTCATGGAGGTAACTCCAA
+ATGATGCTCGCAACGATCAACATCCTGTCAGCCCTACTGGTGTTGGCCGTGTCCATCGAT
+GCGGCTCGGCGCCTGTCATTCCGCTGCCACCCGGTAGCCACTGGCGGTCATGTGTTGATG
+GCGATTGCCGAGATGGTGTGCATCTACCAGACCGCAGACCTTCGCAGCGTCCCTGCCTGG
+GTGGCAGTCATCAACCTGGTGCTGTCCTACATGGCCATGTCGTCATACCTGCACATCGAG
+CGCACAGGGAGGTTCGGCTGCAAATGAGCATCGCAACCATCATCGCAGTGCTCAATGGCA
+TCTGGACCCTTGGCAAGAACCTGATCGGCGCCTTCAAGAAGAAGCCGGCAGGGCAGGGCG
+CCGAGGATGCCGCCACTCAGGCAGTAGCTGCCACCAACACCGAATCGAGCGAGACGGCGA
+GCATCGCCCGCCAGTCGATCGCATCCGTCCAGGAGTCAGCCAATGCTGCGCGTACTGAGA
+ATGACCACCTTGCTGCTGATGCTGCTTCCGCTGGGAGCGTGCAAGACGCTGACCAAGTCG
+TCCAGCGAGCCATCGCCGCAGCAAACGCAAAACTTAATCCAGGTTCGGACCATCAAGCCG
+ACCGTCCTGTGTGATATGGGAGATCTCCAAAGTGACCCCCTCCCGAATTATCCAGCTCTG
+CCTGGAATGGTTCCGCTCGCCGCTGATAAAGCCCGCGACGTCTGGGCCATCGGCGTTGCC
+GGTCAGTACGGCCAGCTCGCCATCCGATACAACGCAATCCTTTCCTGTCTCGCCGGCTAT
+CGCCAGCGCGGCCTTATCAACTGACGAGGTTATCCCCATGTCGTTTTCCCTGTCCAAGAT
+CGGTGCCGATATCACCGAGGCCGTATCCGCCGCCGAGGCCGTGGGCGATGCGATCAAGGT
+CGTCTACAACTCCGTCGCCCCGCTGATGGACTCGGCTGAAAAGGCCTATGACGGCGTCAC
+CGATGCCGGCGGCACCAAGAAGGCTGCAGTGCTGGCGAGCGCCAAGGCCGTGGCCGAGGC
+CCTGGGGCAGGACTGGAAGAGCATCGAAGCCGGCGCATCGTCCCTGGTTGACGCCATCAA
+GGGCGCCTACAACGTGGCGAAGGACATCGTCGATCCGGCGAAGTCGACCACCGTCGCCAG
+CGCTGCGGCGTAAGGGGGTAGATCATGACTGTCAATGTCGTGACCGAAGACGGCACCATC
+GCCGAGGTTTCCACCCCGAGTGATGCCTCCGGCTCCTCCTATACCCTCCCGGCTGCCACC
+AGCTCTGCCCTGGGCGGTGTGAAGGAGGGCGCGTATGTCGCCAATGCCGGCGAGTCCACC
+GCAACGGATGTGGCTGGTGCGGTAACGTCCATCAATGCCGTCGCCACCCAACTCAATGCG
+CTGATCGCATCGCTCCAAGCATCGGGCGCATTGGCTGCGTCCAGCTGATCGAGGTAAGTC
+ATGGCCGGCAACAAATCAACGAAGCCGGCCACTGACTGGGAACGCATCGAGGCGGACTAC
+CGGGCTGGCGTGCTGTCGATCCGTGAGATCGCTGGCAATCATGGGATCACGGATACCGCC
+ATTCGTAAGCGGGCCAAGGCCCATGGCTGGGAAAGAGACCTTGCCGAGAAGATCCGGGCA
+AAGGCCGAGTCCAAGGTTCGCAGTGCAGAGGTTCGCACCCAGGTTCGCACTGAGGGCGCA
+ATCTCGGATCGCGAACTGATTGAGGCCAACGCCGAGGTCATCGCCAACGTCCGCATGGCC
+CACCGGCAGGATATTGGTCGGGCACGCAGTCTCGCCATGTCCCTGCTGGCTGAGCTGGAA
+TCGCAGACGCATCACCTCGATATGGTGGATCAGCTGCGCGACCTAGTGGTGAACAGCGAG
+GACGGCATCGACGCCAAGCTGCTGACGATGTTCCAGGCCGTGACCTCACTACCTGGTCGC
+ACCAAGACCATGAAGGAGCTGGCCGACTCGCTGCAGAAGCTCGTGACGCTGGAGCGTGAT
+GCCTATGGGCTGGCCGAGGCATCCAAGGTTGAGCTGACCGGCAAGAACGGTGAGCCGATC
+CAGCAGCAGGTATCCCATGTCGATGAGCGCACAGTCTCAGCGGTCATCGACCGACTCAAC
+GCCGAGTTCTGAGGGGCTTCCCCTCGATCTGGCGATCATCAAGCAGCTGTGCGAGCGGGA
+TCACCTGTTCTTCAGTCGCTACTTCTTCAAGCACCGGCAGGGCATCCGCTTCCTGCAGAA
+CTGGCACCACCGCCGGATCTGCTCGATTGTCGAGGATGTCATTGCTGGTCGACGTAAGAA
+CGTCGTCATCAACGTTCCGCCGGGCAGCTCCAAGACGGAGCTGGTGGCAATCAATCTCAT
+CGCCCGGGGGCTTGCCATCAATCCCCGGGCCCGGTTCCTGCATATCTCCTATTCGGATGA
+CCTCGCGCTGCTCAACAGCGAGACCGCCAAGGAGATCGTGCAGTCCGAGGAATACCAGGC
+GCTGTGGCCGCTCTCGATAGCCTCAGACGCCAAGAGCAAGAAGCGCTGGAACGTCGAGGC
+CAATGGCCAGAAGCTGGGTGGCGTCTATGCGGTTTCGCTCGGCGGCCAGATCACTGGCTT
+CCGTGCCGGCCACATGGCTCCCGGATGGCAGGGCGCGATCATCATCGATGACCCGCTCAA
+GGTCGAGGATGCGTACAGCAAGACGAACCGCGACAAGGCGAACCGTAAGCTGCTGTCCAC
+GGTGAAGAGCCGAAAGGCCAACCCGGACACGCCGATCATCATCATCATGCAGCGCCTGGC
+TGAGGAAGACCCCACCGGTTTCATCAAGTCCGGCAAGCTGCCGGGTGACTGGGAGTTCAT
+TGAGATCCCTGCGCTGATCGACGATGCATACATCGCCGCACTGCCCGAGGATCTGCAAGA
+CGCGGCGTCCCAGGGCGATGCAGATCAGGACGGCCGGCGCAGCTACTGGCCCTACAAGGA
+GCCACTGGACGATCTGCTGGCGATGGAACGGGCTGACCGGTTCGTGTTCACCGGCCAATA
+CATGCAGCGGCCCAGCCCGCTCGGCGGCGGCATCATCCAGTCGGCCAAATTTGGCCGGTA
+CAAGGTGGTCCCGGAGATGGTCAAGCGGGTCATCTTCGCCGATACGGCGCAGAAGACGGC
+CGAGCGCAACGACTACTCAGTGCTGGAATGCTGGGGTCTGGGCAAGAACGGACGCATCTA
+CCTGCTGGACCTTCTCCGCGGGAAATGGGAGGCGCCTGAGCTGAAGCGCAAAGCCATCGA
+CTTCTGGCACAAGCACCTTGCTGTGCCGGCGTGGCCGAATGGCGCCCTGGTCAAGCTGAT
+GGTCGAGGACAAGGCCTCGGGCACAGGCCTGATCCAGGACATCCGGGCATCGGGATTGAT
+CCCGGTCGAAGGTATCCAGCGCAACACCGACAAGCTGACCCGCGTCATGGACGTGGTCAG
+CTATATCGACTCTGGCTATGTGCACATCCCCGAGGATGCGCCATGGATCAGCGACTTCAC
+CGCCGAGTGTGACGCCTTCACGGCGGACAACACCCATGCACACGATGACCAGATCGACCC
+TATGGTCGATGCCATCAACAACCTGCTGGGCACCGGCAGGGTGCTGAGCGTCTGGGAGAA
+ACTGGGCCAATGAGCCGAGGCAAACGGAAAACGCCACGGCTCGGCACGTCAGCAATGGCG
+CGCGACTCGGCCAAGGCCAGGCGCAAGACCATCGACAGCTTCGAGAATTTCGAGGCTCGG
+GTCGGCATCCAGGCGGGCAACCTGTCGGGCGGTGCCGGCTACACGTTCGATTTCGTCTCG
+CGCAACCGCGTCGAGATGGAGGCCATGTACCGGTCCAGCTGGATCGTCGGCCAGGCCGTC
+GATGTGGTGGCCGAGGACATGACCAAGGCCGGTATCGAGCTTCGGTCTGAGCTGGACCCG
+AGCGACGAGGCCAAACTGCTCAAGGCCATGACCAAGATGCAGCTCTGGGATCAGCTCTGC
+GACACGCTCAAGTGGTCACGCCTCTACGGCGGCGCGGTCGGCGTGCTGATGATCGACGGC
+CAGGACATGAAGACGCCGCTGAACATCGACAGCATTGGTCGCGGCCAGTTCAAGGGCATC
+CTGCCGTTGGACCGTTGGCTGGTGCAGCCCTCGATGGAAGAGCTGATCACCGAGTACGGC
+CCCGACATCGGCAAGCCGAAGTTCTACGACGTGGTGGCCGACAGCATGGCCCTGCGCCGG
+CAGCGGATCCACTACACCCGCGTTGTGCGCTTCGATGGCGTGGATCTGCCGTACTGGCAG
+CGCATCAGCGAGAACCTGTGGGGGCAGTCTGTCGTCGAGCGCCTGTATGACCGCCTCGTG
+GCGTTCGACAGCACGACGCAGGGCGCGGCCCAGCTGGTCTACAAGGCCCACCTGCGAACC
+TACAAGGTCCCAGGCCTGCGCGAAGTGATTGCCATGGGCGGCCCTGCGCTTGAGGGCCTG
+CTCAAGCAGATCGACATGATCCGCCGGATGCAGACCAACGAGGGCATGACCCTCATGGAT
+GCTGCCGACGAGTACGAAGCCCACCAGTATTCGTTCTCCGGGATGGCTGACATCCTGCTG
+CAGTTCGGCCAGCAGCTTTCTGGCGCCCTGCAGATCCCACTGGTCCGCCTGTTCGGTCAG
+TCTCCGGCTGGACTGAACTCGACCGGCGAGTCGGACATGGAGATGTACCGCGATGGCATC
+CATCAGCGGCAGGAGCGCCGTTTGCGCACGCCGGTGGACACGATCCTGCGCATCCTCTGC
+CGGTCGGTGCTGGGCATCGACGCACCGGAAGAACTGGACTTCGACTTCGTCCATCTCAAG
+CAGATGACGGCCGAGGAAAAGGCCAATGTCTCGAAAACGACCACGGATGCCGTTATCCAG
+GCATTCGATGCCGGCCTCATCTCGCAGCGCGTGGCTCTGAAGGAGCTGCAGCAGTCGAGC
+GACGAGACCGGCATCTGGACCAACATCAGCGACGAGGATATCGAGGCGGCCGACGATGCG
+CCGCCCGATCCGGGAGAGGGCGACTTTGGCGAAGATCCATACCCGCCGGAGCCCGGTGCC
+GACCCGGAAGGCGGAGATCCAGTACGCGGCCAGTCTGAAACAGGTGGCGGCCGCGATCGG
+TCGATTGATCGCTGGCTTCGACCCTGGCGATATCGGCGCGCTGCCTGATATCCAGTCTCG
+GCTGGAGCAGTACAGCTACAACCTGGGCGACTGGGCGCATCGCACTGGCCTGAGGATGAT
+CAAGGACGTCAACGCCCGCGATCTGAAAGCATGGCGCGAGCACTCGCGGGACATGTCCCA
+CGCACTTCGCAAGGAGCTGCTGAATGCTCCGACCGGCCAGGCATTCCATCAACGGCTGAC
+GGAGCAGGTCCACCTGATCCAATCCCTGCCGCTGGACGCTGCGAGGCGCGTGCATCACCT
+GACGACCGAGGGCCTGACCAGCGGCCGGCGTGCTGAGGACATCGCCAAGGAGATTGCGAG
+ATCCGGCGAGGTGTCGGCATCGCGGGCGATCCTGATCGCTCGGACTGAGGTGTCCCGCAC
+GGCATCAGTTCTCAGTCAGGCCCGCGCCCAGCATGTCGGTTCGACGGAGTACATCTGGCG
+AACCTCGCAGGATGGCGACGTCCGGCCTGGGCATAGGGCCATGAACGGCACCGTTTGCAG
+ATGGGCAAGTCCGCCGGGCATCAATGAGGGCACGGCGAGCAAGCCGAGAATCATGCACCA
+CCACCCCGGCTGCATCTGGAATTGCAGGTGTTGGGCGGATGCGATTATTGCGGAGTGAGT
+TCATGGTCCGCATTCATCCTGACTGGAATTTGAGCCGTGATTGAGCAGACTGGACAGATT
+TAAAAAGCTGGCCAATAGACACCAGTTGATGGCATGATTCGGCGCCGCAATATTGCGGCG
+CAACATAGGCATGACATGGCTACCGAACTGAAAGAAGATCAGAAACTTAAAGCGGACATC
+ATGGCTAAGATTTTGGCAGGTGCCATCGATGGCGCGACCCTGTACGCCATCGGCCATGGG
+CGCGCAAACCTCAAGTACTCCGGGATGCTGAATGGAGCAAAGCGGATTGCCGATGACATT
+CTCAAGAAAGTCTGATCCATCGCATCAATGTAGAACGAAGGCCCGCACTGCGCGGGCCTT
+TTTTATGGGCCAAATATGCGCTTCTACACCATCCAAAAGCTCGGACCGAAGCGCGAGCTG
+ACGCCCGAGGGCTTCCTGCTGTGCCTGGACGTGCCGGTGGCGCGCACTGGCGAGATGATC
+TACGGCGAAGGCGAGGTGCCCATCGAGGGCAGCATGGACGGCCTGATCCGGATCACCCGG
+ACGCCGGACGAGGTATTCCGTGCCGAGACACTGGCCAGTTGCCAGGGCAAGCCCATCACG
+CTCGACCATCCTGACGAGTTCGTGACGCCTGAAACGTCGCGCACACTGTCCATGGGGTCG
+ATGCAGAACATCCGGCGCGGCACTGGAGCTGATGAGGACGTGATCCTCGCCGACCTGCTC
+ATTACCGACGCGGAGGCTATCAAGGCCGTGCAGGCCGATGGCATCGAAGAAGTCTCGCTC
+GGGTACGAAGCCGACTACGAGCAAACCGAACCCGGCCGCGGGGTGCAGCGGAACATCATC
+GTGAATCACTGCGCCCTGGTGCGGTACGGGCGTTGTGGCCCGCGCTGCGCGATTGGGGAC
+AAGGAGACTGTTATGGCCAAGCCCGTCAAGCCCGGGAAGAAGTTGTCGTTCAGCGACCGA
+CTGCGTCGCGCCTTCATGTCCAAGGACGCCGACGAGGCCGAGAAGCTGGCCCAGGAGGCC
+GAGGACGCAGCCGAAGAGGAAGAGCAGAAGCGGCGCGAGTCGGAAGATTCCGGCGACGAT
+GATGACGGCGACGATGGCAAGGGCCGGGACAAGGTCGGCGACACCGCCACGCTGAAGCTG
+CTGCGATCGATGGACAAGCGCCTCAAGTCGTTGGACGAGCGCATGTGCAAGATGGAGGAC
+GCCGAGGGTGATGGCGAAGAGGAGGAAGAGGCGGAGACCAACGACGCCGGCGACCTGACC
+AGTGCCGAGGCCTCCCCGAAGGTCGATCTGGATGGCGTGAAGATCTACACCGGTGACGCC
+CGCACTCAGTTCCGGCAGCGGCTGGAAATCGTATCGCCCGGCGCCAAGATGCCGACCTTC
+GATGCCAAGACCACTGATGCGGCCATTGCCGCGAAGCTCTGCGCGTGCCAGCGCCGCGCC
+CTGGGCGACGCCATGAAGACCGACGGCGGTCTGAGTGCAGTCTCCCCGTTCCTCGGCGGA
+CTCGATCCGCAGACCGCCCCGATGGCCGTAGTCAATGCCGCTTTCACCGGAGCTGCCGAG
+CTGCTGCGCCGTCGCAACAACGACCACGGCAGCATGAGTCTGCCCAACCAGCGGCAGATG
+CCCAACAGCATCGCCGACATCAACAAGCGCAGCCAGGCCTACTGGGCCGACCGCGCCGCA
+CGCTGAGGAGCTGACATGCCCGCCTATCTGTATCGCATGCCGTCGGGTATCCCCGGCGAC
+GTCACCCGCTATTCCGTTTCCACCATCGAGCCGGTCCCGACCGATTCGAGCAATCCGTTC
+GCCAGCTTCGGCATCCCCGGCAAGATCGTCAGTGGCAAGTTCGTGCCGCTGGCATCCGGC
+GACACCGATGTGAAGGTCTACGGCTTCCTGGTCCGCGCCTATCCGACCCAGAACGGCGTC
+AATCAGGCGCTGGGTGCCGATACCCCGCTGGCTGGCGTCATGGGCAATGTCCTGCGCCGC
+GGCTACATCGCCGTGAAGCTCAATGCCGGCGTGGCCGCGCTGGGCGCTCCGGTCTACGTC
+CGCGTCGGTGGCGCCACGGACTCCCAGCCCATTGGTGGTATCGAGGCCGCGGCCGACGCC
+ACGGCCGGCAACACCATCGAGCTGGCGAACTGCACCTTCATGTCCGCGGCTGATGCCTCG
+GGCAATGTCGAGATCGCCTACAACCTGTAATCCCCCACAAAGCCCTGCCAACGAAGCCCT
+GCCATCGAGCGGGGCTTTTTTGTGGGCGCGATTCGAGGAAACCCCCGATGAGTCAACTGA
+TTCTCCCGCGCTCGGTGAAGCGAGCGTATACCCGCGATGGCCTGCAGACCTTCGACAGCC
+GCACCATCGACAGCTCCGGTGCGTTCCTGGTCGGCGAGCTGGAGCGCCTGGACTACCGTC
+TGCACGAGCCGCTGGCCGCAGTGACCTGGTCGCGCGATATCCATCTGCGCGAAGATGTTT
+CGATGGCCGACGAGATGTCGAGCTTCACCAACAGTTCGTTCGCTGCCGCGGGCGGCATCT
+CCCCGACCGGCAAGGCCTGGGTCGGCAAGGACGCCAGCGCTATCACCGGTCTGGGCCTGG
+ACATCGGCAAGACCATGCATCCGCTGTCCCTGTGGGCCATGCAGATCGGCTGGACCATCC
+CGGAACTGGCCTCGGCGCAGCAGCTGGGCCGTCCGGTGGATCAGCAGAAGTTCGCCGGCA
+TGAATCTGAAACACCAGATGGACATCGACGAGCAGGTGTACATCGGCGATACCGTGCTGG
+GCCTGGAGGGCTTGGTGAACAGCTCGGCCGTCACCACCACCAACGTGGTCAACGGTGCGA
+GCGGATCGCCGCTGTGGTCGAGCAAAACCCCGAAGGAAATCCTTGCGGACTTCAATGCGA
+TTTTGAATCTTGCGTGGGAGGCATCCGCATATGCGGTGTGCCCGACCAAGGTGCTGATTG
+CTCCGGCGAAGTACTCGATCCTGACCCAGCCGGTTTCTGAGGCGGGCAATATTTCGATTC
+TCGAGTATGTTCGGACCAACTGCATATCGCACAACGTGAATGGGCGTCCGCTGGACATCC
+AGCCGGTGAAGTGGCTGGCGGGCCGCGGAACCAGCGGCACCGATCGCATGGTGGCCTACA
+CGCAGGAAATGGACCGCGTCCGCTTCCCGTATGTGCCACTGCAGCGCACCCCGCTGGAAT
+ACCGCGACCTGCGTCAGCTGGTGACCTACTTCGGTCGCCTGGGTGCTGTGGAGTTCGTGT
+ATCCCGAGACCCTGGCCTACGCCGACGGCTACTGAGGAGGTCGATATGCCGAGGATCAAC
+GTGACCAAGGCATTCACCTTCACCCATGCCACCGGGGAGCGACAGCGCTTCCCGGTGGGC
+TGTCACGAGGTCGCCGAGTCCGTGGCCGGGCACTGGTACGCGCATGAGCACAGTGAGCCT
+GTAGCTGATGCAGACGTGATCGAGACGGACACACCCGCAAAGCGGCCGCGCCGCACGAGG
+AAGGCCGATGGCTCTGACACTGACGCCTGACCAGTTCAGGGCGGACTTTCCAGCGCTGGC
+CAGCACCACGACATATCCCGATGCGCAGGTGAATTTCTGGATCGAGCTGGCAGCTATCCG
+GCTCAACGAGGCCCGCTGGGGCAAGCTCCTGCAGTACGGCGCCGAGCTGTTCGTGGCTCA
+TAACCTGGTGCTACAGGCGCGGGATATCGCGGATGTGGCGGCCGGCGGCGATCCGGGTGA
+GGTGACGGGCCCGGCGACAGCCAAGAGCGTGGACAAGGTGTCTGTGAGCTACGACGCCCA
+GTCCGTCGCACTGACCGACGGTGGCTTCTGGAACATGAGCAGCTACGGCATTCAGTTCCT
+GCAGCTCGCGCGCATGATTGGCACGGGCGGTATCCAGCTATGAGCATCAAGGTCAAGCAG
+GACAAGGTGAACGCCATCCTGCGGTCTCTGCAGGGCATGGAGCGAAAGCAGGTCATGATC
+GGCGTGCCGTCGGACACCTCGGACCGCCGAGACCCGACGCAGCCGATCACCAATGCCGAG
+ATCGCTTACATCCAAGACAACGGATCGCCGGCGAACAACATCCCGGCCCGGCCGTTCATG
+CGTCCCGGCATGGATGATGCAGCGCCCCGCGCGGCGGTGCAGATGAAGAAGGGCATCACC
+GGGGTGCTGGATGGCGATCACGCGGCTGGAGAAAGGGCTCTTGATGCTGCCGGCATCGTG
+GCATCCAGTGCGGTGAAGAACGTCATCAACTCGGGCAATTTCACGCCTCTTGCCGATTCC
+ACCCTGGCTGCCCGCGCGGCACGTGGACGCGCCGGCGCTCAGGAAGAGCTGGATCGACGC
+GATGCCGGCCATGCGCCGGGCACGGATCTGGCGAAACCCCTGGTCGATACCGGCCAGCTT
+CGCAACTCGATCACCTACGTCGTGCGATCCACGGAGGACTGATGCGCCTCAATGTTTCCC
+GTGTCCTGGCCTCGCGAGAGTTCCGGGACACTTCACTCGTCCGCATTCGCAACACGCAAA
+CCGTCGGAGACGATGGCCGTGCGGTGAATGCCCAGGACAGCACCCCATTTTCTGGCGTCG
+TGACGAACGATGCCGGGTACATCCTGCGCCGCTTCCCGGCGGCCAGCGTCGTGTCCGGAT
+CGATCCTGATCACGTCGCAAACCCCGCTCACGTCGGGCACCCCTGACCTGGATGCCGACA
+TCGTGCGGTGGCGCGGCCAGCAGTACACCGTGTCGATGGTCAATGACTATACGACCTACG
+GCCAGGGCTTCACCGAGGCCATCTGCAATCCGCTCAGCCTGCAGGGAGGTGCTGACAGTG
+GGTAATGACTCTTCCACTGGCGGATACCTGCTGCCGGCGGCGGGCGGCCCGAGCTTCGAT
+AACGCCCTGGATGACGCCATCCAGCAGGCAGTGGTCGGCATCACCGGATTACCGGGCAGC
+CTGGTCCGCCCACGTTGGCAGCCCATCGTGGCCAAGCAGCCGCCCATCGATACCGACTGG
+TGCGCCATCGGCGTCACCGATACCGAGCCCGACGACTATCCGGTGCAGGACCAAACTGCT
+ACCGGGTCGGATCTGATCGAGCACGAGACGATCACGGTGCTGGCCACCATGTACGGCCCG
+CAGGCGGCAGCCAATGCCAAGGCCCTGCGCAACGGTCTGTATGTCGCCCAGAACCGCGAG
+GGGCTGCTCGCAGCAGGCATCAACCTGACGGATACCGGCAAGCCGATAGCAGCCATGGAT
+TTCGTCAATCAGCAGTGGGTCCGGCGCTACGACCTGACCATCCGATTTCGTCGAAAGACG
+ATCCAGAACTACGACATCCTCACCATCCTCTCAGCCGAGGCGGATGTGCACACTGACACC
+CACGAGGGGTAAATCATGGCCCGAGGCCTTCCCGTATCACGCATCATCAATATGAGCGCG
+GTCATCGCATCCGTCGGCGTCGCGACCGCGGACTTCAACTCGCTGCTGATCGTCGGCGCA
+AGCTCGGTCATCAGTATCAACGAGCGCCTTCGCTCCTATGGCTCTCTGGCCGATGTTGCA
+TCGGATTTCGGCACCAGTGCGCCGGAATACCTGGCCGCTGCGCTCTATTTCGACCAGTCG
+CCCCGGCCGAGCGAGCTGTATATCGGCCGCTGGGCCAAGACGGCCAGTGCCGGCGAGCTG
+TCCGGCGGTGTCCTGAGCAGTGCCGCGCAGGCCATTGCCAACTTCACCGCCGTGTCTGCG
+GGCGGCATGGATATCACCATCGACGGCACGGCCAAATCGCTGAGTGCGATCGATCTGTCC
+GCCGTGACCAATCTCAACGGTGTCGCCTCGGCCGTCACCACGGCCCTGGCTGGCGTCGCC
+ACCGTGACCTGGAACTCGGCCACCAATCAGTTTCAGGTGGTCAGTGCTACCACCGGCGCC
+ACGTCTTCGGTGGGCTACGCCTCGGCCCCGTCCACGGGCACGGACATTTCGGCTCTGCTG
+GGCCTGACCTCGGGCGTAGCATCGGCACCATCCGACGGTATTGCTGCCGAGGAGCCGGTG
+GACGCGATCACCGCACTGGATGATGCCTCGGGCGGCTGGTACGCCTCGATGTTCGCCGAT
+ACCTCGCTGACCATCGCGCAGCACGAGGCAGTGGCCAGCTACATCCAGGGCGCGGCGCGC
+CTGCATCTGTACGGCATCACCACGCAGGACAGCCTGGTCCTAGACCCGACATCGACCACC
+GATATCGCCGCCGTGTTCGCCGGCCTAGCTCTGGATCGCACGGTCCTGCAGTATTCCAGC
+AGCTCGCCCTATGCGATTGCCTCGCTGTTCGGCCGTGCGCTGACCGTGGACTTCAACGCC
+AACAACACCGCGATCACCCTGAAGTTCAAGCAGGAGCCCGGCGTTACTGCCGAGACCCTG
+ACCACCACGCAGGCCAATGCGCTGGAGGCGAAGAACTGCAACGTGTTCGTGAACTACGCC
+AATGGTTCGGCGATTCTCGAGCAGGGCGTGATGAGCAGCGGCGCATTATTCGACGAGATC
+CAGGGTGTGGACTGGCTGCAGAACGCCATCCAGACCGCGATCTTCAATCTGCTGTACACG
+TCTACCACCAAGATCCCGCAGACCGATGCCGGTGTGGCCCAGATTTGCACCACCGTCGAG
+GACCAGTGCGAACAGGGCGTTTCCAATGGCCTGCTGGCCCAGGGTGTCTGGAATACGACC
+GGCTTCGGATCGCTGTCGGAAGGCCAGACCTTGACCAAGGGATACTACGTCTACGCCGCG
+ACCATCGCCAGCCAGTCCACGGCCGACCGCGCCGCGCGCAAGTCCCCGCCCATCCAGGTT
+GCCGCCAAGCTGGCCGGCGCCATCCATTCGGTCGATGTTTCGATCACCGTGAACCGCTGA
+GGTAGACCATGGCAACGTACAGTTTTCTCGATGTGGCTGCCACGATCACCGGTGTGGGCG
+GATCTTTCCGCCTCGGTAGTGGTGCGGGTGTGGCTGAGGAAGGCATCTCGTATGAGATGA
+CCGAAGACAAGAACAACATGACCGTGGGCGCCGATGGCCAGGTGCTGCACGCACTTCATG
+CCGGCAAGAGCGGTCACATCACCATCCGGCTTCTGAAGTCGTCGCCCCAGAATGCGAAGC
+TGCAGGCCATGTATGACGCCCAGTCGTTGTCCAGTGCCACCTGGGGCCAGAACGTCATCA
+GCATCCGCAACTCGGCCGTGGGCGACGTGATCGCCTGTACGCAGGTGGCATTCCGCCGCT
+CGCCGAGCAACACCTACGCGAAAGACCCGAACGTGATGGAGTGGCAGTTCGATGCCGGCC
+AGATCGACGCGATTCTTGGCGAATACTGAGGAATGACCGATGCAGTTTGAAATCAATGGT
+CGGCAGTACCAGTCGGCCAAGATGGACACCCGTAAGCAGTTCCACGTCGCCCGCCGGCTG
+GCCCCGGCCATGGGCTCGCTCGCCGCAGTCGCGGCCAGTGGGTCAGTCGACAATCTGTCG
+GTGCTGAGCCCGCTGGCATCGGCCATCGCCGCCATGCCGGATGCAGACTGCGATTTCGTG
+CTGGATGCCTGTCTGGCCGTGGTCAGCCTCAACCAGTCCGGATCGTGGGTACAGATCGCC
+AACCGATCCGGAGGCCTGCAGTTCGACGAGATCGAACTGGGCGAGATGCTCCAGATCGCG
+GCGAAGGTGATCCAGGAGAACCTGGGCGGTTTTTTGCCCGCAAAGGCCGCACCCCTACCG
+AAGCAGTAGGGTCGGCCGGCAGCACGGATGCATGGGCCTGCCTTCCCGACGGGGAGGACT
+GGCTCCTGCGCCCCGTCGTGCGAGGCATGTGCAAATTCGAGAGCCTGATCGATGGGACGC
+TCGACCTAGAGCACATCGCCCTGATGAATGACGCCCTCGATGTCGTCGACGAGAACCGGA
+TCAAAGCGGAGCGGAAACAGTCATGAGTTCGGAAGTCATCCGCGAATACCTGGTGTCGCT
+CGGCTACAAGATCGATGGCGACAGCGAGCGCCGATTTACTGAAAGCCTGGGTGGGGCCGC
+CAAAGATGTTGCGGCCCTGGGAGTCGCAATGGCGGCTGCAGCGACGGCATTTGTTGCTGG
+CGTGGCCAAGATTGCCGGCGGCATGGAGCAGCTGTATTTCGCTGCTCAGCGGACCCATGC
+GGCCGTGGAGAGCATTCAGGCCCTGCAGTACGCAGCCGCCCAGATGGGATCTAGCGCCGA
+GGGCGCTGCCGGCTCGCTTGAGTCGCTGGCGCGCTTCATGCGTGAGAACCCGAACGGGGA
+GAACTTTGTTCGTAGCCTGGGTGTATCTACCCGCGATGCGAATGGTCAGCTGCGCGACAC
+TACCCAGATCATGGGCGATCTCGGCAAGCGCTTGGCGGCCATGCCGTATTACCGCGCTCG
+GCAGTACGGATCGATGTTCGGGTTCGATGAGCGCACGCTCATGGCCCTGCGCTCGGGCAT
+GGGCCAGTTCACCGACCAGTATCAGCAGATGCTGCGCGTGGCCGGCCTCAATTCGACCCA
+GGCGGCAGCCGCGTCGCATGGCTTCATGGTGCAGCTGCGAGAGGTAGCGGCGTGGCTGCA
+GATCCTCTCCCAGAAGGTCTACACGGATCTGGCACAGGGTATTGGCGACGATATTGAGCG
+CTTCCGGGTCCGTTTTATTGCGGACTTCGGGAAAATCTCGCACATCATCGAGTCAGTGGT
+GAAAGGCATCCTGTGGGCAGTCGACATCGTGACCAGCTTCGGCATGGTGGTGGCCGATGC
+CATCGAGGGCGTGATTGGCTGGTTTCGTGGACTCGATGCCAATTCGAAGCATGTCGTGGA
+GGCCATTGGCGCGATTGCTGCGGCATGGGTAGCGCTTGACGCGGCCATGGATGCCAACCC
+GATCACGCTGGTGCTGATTCTGGCTGCGGCAGTCGCCTCCCTATGGAATGACTTCAAGGT
+CTGGAAGCGGGGCGGAACAAGCCTGATTGATTGGGGTAAATGGAAGCCAGAAATCGATCT
+GGCGAGCGCAGGCATTCACCTAATCACCCATGCCATCGAGGCATTGGTGCATATGTTCGA
+GCGGCTCTGGGAGCAGACGGCAAAGATTCGATCCGCTGGCCTTGGCGAGATTTCAAAGAT
+TGCCCATGGCATTTGGGATGCAACCTCAGGCGCGCGGCAATGGTCCCTTCAGGCCCAAAA
+ATCCATCTGGGATTGGGCCACCGGCGGATCCCCGCAGGTCGGGCAGGACGCGCAGGCACT
+CGCCGCTGCTGCTAACCAGATCCGCAATCAGGTCACAGGCCTGCCATACGAGCATGGCCG
+GCCGGGCCCAGATGCTCCACGAGGCATCCGCAACAACAATCCCTTGAACATCCGTCACGA
+TGGCGGATCGTTCAATGTGTATGCCACGCCGCTTGATGGATTGACAGCAATGGCTCACCA
+GTTTGCCCTGTACTACTCGGGCAGGTCCGCCACCGCGCACCATGAGGCACTGCACTCCAT
+TCGTCAGATCATTTCGACGTATGCACCGCCCAAGGATGGAAACGATACACAGGCCTACAT
+CGCCGACGTCTCCAAGCAGACCGGCATCGATCCAGATGCTGACCTGAATTTTGCTGACCC
+GGCGCGGATGCAGGCATTCATGCAGGCCGTGACGCGCCATGAGAACAGCGGACGGAACCC
+CTATGACAACAGCCTGTTCGCTCAGGCGATTGCCAATCAGGGGGCATACCCGAAGGCAGT
+GGGCGTGGATCGAGGATCAAGTTCCGCACAGCTTGCTGATGGCTTCAGAAAGCTCCACGA
+GCTTGTCAGCACCATTCACGGCAACCTGCAGGGACCACAGATTCAGGGTCTGCTTTCATC
+GCTGATGGATGCATACCCGGCGGCCCAGGCAGAGAACAATGGCGCATTGAGCGGAGCCAT
+TGCAGATGCGGTGCAGCAGATCCAGAAGCTTCAACCTGGTCAGCAGTTCGATGCTCGGGC
+ACTTACGCAGCGCCTCGACGATCTGTCGCGACCTCGGCTACTTGCAGACGCATCCACTGC
+GGCAGCGGCTGGCCAGCCTGCGGCGTCACGGTCAGGCAACACATTGAACCAGCAGACGAG
+CATTGTTGTGCATGGCGCCACCGATCCGCAGGCTACGGCCAAAGCGATTCAGGAGCGGCA
+GCAATCGGTGAATGAGCGGGTCACTCGGAACATGACGGCAGGGACGGCGACATGAGCATA
+CTCAGCACAGCCGCCGTTCTTGTCGGCGGAACCGTGGCGGATATCCTGATCACGCAGAAG
+CGGCGAATCGGGACCATTTATCCGCAGGTGACCATCTCGGAGCGCATGCACGACGAGCTG
+GCCATGACGGACAACCCCGTTGATTCGGGTGAGGTCGTCACCGATCACTCATACAAGTTA
+CCGGCCGAGCTGACCATGCGCTGCGGATGGAGTGAGAGCGGATCGCTGTTCAATGACATC
+GACAGTCTGCAGATCGCATCTACTCCCAACGAGGCCTATCAGAACCTGCTTTCCCTGCAG
+AAATCGCGCCTTCCGTTCACGGTCACGACCCCGCGTCGACAGTACAGCAACATGCTGATC
+CGATCCCTGGACGTGACCACGGATGCGGCGACGGCCAATGTACTGATGGTCGAGGTGGTC
+ATGCGCGAGGTGATCATTGTCAGTACCCAGCAAACGACCATGGCGGCAGCCGAGGATCAG
+GCCAGCCCGCAGGACACAGCGGCCACGACCAATGGCGGGGTGAAGCAGGCGACGGTGGTC
+ACCGATACATCGGTTTTGAGCAAGATCGGGACGGGTGTAGAAAGTGCATTCTCCGCGATT
+ACTGGAGGGTAAAGCATGGCAAAAACTGTCTACCAGATTCCCCTGGATGCGGCCGGCCAG
+ACCATCCAGGCGATGATCGGCTCAGTGCAGTATCAGCTCACCGTTCAGTGGCGGAAATTC
+TCCGGCTGGGTGCTAGATATTGCCTCTACGGATGGGACTGCCCTGGTGTCGGGCATTCCG
+CTTGTCACCGGCGTGGATCTTCTGGGCCAGTACGGATACCTGGGCATCGGGGGATCTCTG
+CTCATGGCTACCAATGCCGACCCCGATGCTGTGCCGACCTATGAAAACCTTGGCACGACT
+AGCAATCTGTATTTCGTGGTGACCTCATGAGCCAGTCTGCCCAGCAGTATTTGCGCCAGG
+TACAGCTGGTGATCGGCACCCCTGGCGGCCCGGCGGTCGATGTCTCTGATCTTCGCGTGA
+CCTTCAATGTGCGCTCAGCTTCGGTCGAGACCCTGAAGTCCGCGAACATCCGGATCTTCA
+ATTTGGCCAAGGCCACAGCATCGAAGGTGCTCAACGAGTTCACTTACATCGAGCTGCATG
+CCGGCTACCCGAACAACATGGGCATGATCTTCCGCGGCGAGATCTGTCAGGTGAAGTATG
+GCCGCGATCAGAACATGGTCGATACCGTCACCGAGATCCTGGCCCAGGATGCTGACACGG
+CTTACAACCAGGCGGTGATCAGCAAGACGCTGGCCAAGGGCTGGACCTACGAGGATCAGT
+TCAGTGCGCTGATGCGGCCTTTGAACAAGTACGGGGTCAATCCTGGCTTCTCGCCCAGCC
+GGACAAACAGCCCGGCACCGCGCGGAATCACCATGTACGGCATGGTCCGCGATGAGATGC
+GGATCCTCGCCGAGGATATGGATTGCGACTGGATCATGGAGGACGGGTTCCTGCACCTGA
+TTCCGTCCGATGGATATATCCCAGGCAACGTGCCGGTGATCAATGGCATGACGGGTATGG
+TGGGTATCCCAATGCAGACCATTGAGGGTATTGAGGTGCAGTGCCTGCTCAATCCCCTGG
+TAAAGGCGGGCGGGGCGGTGAAGCTCAACAATGCCGAGATCGCCAAGGCGGCCAACCGCG
+TGCCGACGAATACGACAAACGGCTTGCAGCCGGTTGCCGGCCTGGATGCGGATGGCTTCT
+ATCGCGTTGCGTGCGTGACGCATACGGGCGACACCAGGGGGCAGCAGTTTTACACCTACA
+TCATCGGCTATTCGGTCGATCCCAATCAGGCTCGGCCCATGGTTGGCCCCTCAGTTACAG
+CGGTGCCCGGATAATGCGACCCACTGAGCGATACGAGGACCACGAGCATGTCCTGCGCGA
+GATCATGCGCTCTGCGCGCACTCGGCAGTGGACATGCATGCCTGGGCATTTCGTCAGTTT
+CGATGCCGGCACATGCACCGCCGTCGTGCAGATTGGGATCGCTGGCCAGCAAACAAGTGA
+CGGCGTATCGACGGCCGTGCCGTATCCCGTGCTGGTCGATGTGCCGGTGCAGTTCCCGCG
+GGGTGGTGGTGCGGCGCTCACGTTCCCCATTGCCGAGGGAGATGAGTGCACGGTGCATAT
+CGTGGACCGTGCGATTGATGGCTGGTTTGAGTCCAGTGGCATCCAGCCGCCGAGCAGCAA
+GCGACGGCAGGCGATAAGCGATGCGTTTGCAGTCCCCGGCTCTCTGTCGAAGCCTGCTCG
+GCTGCAGAACATCAGCACGTCCACAGCGCAGCTGCGGAGTGTGGATGGCAAAACCTATGT
+TGATCTGGACCCGACTGGCCAAGTGGTGAAAATCACTGCGCCCGGCGGCCTGGTCATCGA
+TGCGCCCAGCGTCAAATGCAGTGGCACAGTCACAGCATCGGGCGAGATCACCGGCAACGG
+CATCCCACTGTCCACCCACACTCATTCAGGCGTGCAGTCAGGTTCAAGCAGTACCGGCAA
+GCCGCAGGGGTAGCCATGATTTACCGAAAACTCAACGCGGCTGGTGACTACTCGTTTGGC
+GCCGGCCCGGGCGACTTTTACCAAAACTCTCCAGAAGCGGTGGCTCAAGCTGTACTGACT
+CGACTTCGCCTACTGGTAGGCGAGTGGTTCCTTGATACAACTGCCGGCACACCCTGGGCT
+ACCCAGATACTTGGCAAGGGCACATCGTCGGTCTACGACAGCGTGATCAAGAATCGCATC
+CTCGGGACCACTGGCGTCCAATCCATCGACTGCTACAGCAGCTCGGTGTCCGACCGGAAG
+CTGTCAGTCACCGCAACCATCACCACCGCATACGGAAGCACGACCGTGGAGGCATCGCTT
+TGATCACGACCACGGCCCCGACAATCGGTGCTTCGGGCATCAGCGCGCCGACCTATGCCG
+AGATTCTCGCCTACCTACAGGCCAAGATGCAGGCTATCTATGGCGACGACATCTATATCG
+ACCCGGACAGTCAGGATGGCCAATTCATCGCCATTCAGGCGCTGGCGATCAGCGATGCGA
+ATGCTGCCGCGATACTGGCATACAACAGCCTGAGCCCATCCACTGCTCAGACCTCGGCCC
+TGTCGAACAATGTCAAAATCAATGGGCTTACCCGGAACGTGGCGAGCTATTCCACGGTCA
+CCGTCACATTGGTGGGCGTGGCCGGCACGATCATCTCTGGCGGCTCAGTGCAGGATGCAT
+CCGGCAATCTGTGGAGCCTTCCAAGCAAGGTTACGATTCCGTCATCCGGCACAGTCGACG
+TTACCGCTACCTGCCAGACCGAGGGCGCCACTGTGGCGGCCGCAGCGTCGCTCACGACTA
+TCGCCACGCCGACGCTTGGGTGGCAGTCGGTCAGTAATGCAGCGGCGGCGACATTGGGCG
+ATGCTGTCGAAACCGATGCCCAGCTCAGGGTTCGCCAGGCCAACTCGACCATGGCCCCCT
+CCCAGGGGCCGGCCGACGGCATTGTCGGCGCGATCTCCGATATCACCGGGGTGACTCGGG
+TCAAGCTCTACGACAACAACACCAGCGCCGCTGACAGTAATGGCATTCCGGCCTATACGC
+TTGCTCTGGTGGTGGAGGGTGGCGATGCCGAGGCCATTGCGAGCGCATTTGCCCTACGGA
+AAGCGCCGGGTGTGCCCACGGCTGGCACTACCACGCAGACTGTCACCACTCCGGGCGGGA
+GCAGTGTACCGATCAACTTCTATGCTCTGGGCGAGACGACCATCAGTGTTGCCATCGGTC
+TGAAGGCCGGGTCGGGATATAGCTCGGCCGTGGGCGAGCTTATTCAGGAGGCGGTAGCTG
+CTTGGATCAATGCTTTGGACATTGGCGCCCCGGTGGTCTGGAATCGCCTCTACATCCCGG
+CGAATTTGTCGGGAGATTCCAGCAGCAGCACCTACGAGATCACCAGCCTGGAGATCTGCA
+TCAGTGGGGGCGCGCTCGGCACCGCGGATCTTGCGATTCCATTCAACTCAGCGGCTTATT
+GCACCGCTGATGATGTGGTGCTGGCGGTGACCTCATGACGGCCTATGTCAGCGACTACAC
+CGGCCTGATTACCTCCGAGCACTCCGACAAGCCCAAATTCTCCGCAATGGTCCAGGCCAT
+GGCGCAGTGCTGGGTTGATTACCAGAACGCCATGCAGTCGCTCGTTGATGCGATGAATCT
+CGACACTGCGGTCGGCGATCAGCTGGATATTCTCGGCAGGTGGATCGGCATTACCCGCAA
+CATCAACGTGCCGATCGATGATCTGTATTTCGCCTACGACGATGTGGATGGCATCGGGCT
+GGATCTCGGTATCTGGAAGACCCCGAGCGACCCAACGACGGGTGTCACCCAGATGGATGA
+CACCACCTATCGCGCAATCCTGCGAGCAAAGGTAGGCGCAAATCACTGGGACGGCAGCAT
+CGAGGGACTGGAGCCCATCCTTAGCGCGATCTTCAGCCCAGGCGGAACGACGGCAAAAAT
+CGTCGACAACGGCGACATGACCTACAACGTCAATTTGACCGGGACCGAGCCGACCAAGCT
+GCTCATGACACTGGTCGATGCCGGATACATCCAGTGCGTTCCGGCCGGCATGGCCGTGAC
+CTACACCTACACCGCATAGGCCCGCGTTTGAAACGCGACCCCTGCAGGCGCCTTTGAGGC
+GCCTTTATTGTGCCCAGAGGAAACCATGGCCACACTTGAAAATGATTTCTTGCCGTTCGC
+CACCGGATCTGGCGCCAATGTCGACGACCAGGCGACTTATGCCGATGCAGCCACGACCGG
+GACGGGGTTTGTGTCTGGTATCGCAAAGTCCGCGTCTGTGAACAAGGTTCTACGTCAGGC
+CTCGACGATGGCTGCCGTGATTGCCGCCCTGATCGTGGATAAGGCCGCGGTAGCGGTTAC
+CGATGATGGGAGCGTGAGTACCATTGAGGCGAACCTGGTCACGGCCATTCAGGCTGTCGC
+GCAGGCGCTGGACTATCCAATCAGCCAGGTGACGGGTCTGCAGGCTGCGCTGAATGCGAA
+ACTGGATGCAACGGCAAATGCCGTGTCTGCGAGCAAGCTGGCCAACACCTTCAATCTCGC
+CCTGACGGGCACGGTGACTGGCGCAATCAACATTGATGGATCGCAGAACGTCTCGCTGTC
+GACATCCATTGCCGATGCAGCCCTCTCCGAAAGCATGGTGAACGGCCTGCCGGCAGCGCT
+GTCCACCATTACCAACACGCTTGCGTCGGCCAGTGATGGGACGAATCAGCGTGTAGCCCT
+GGTTGGCATCAACATCGCCTCTGACGCACCCTTCATGACGAGTGCGCAGAATGTCGCCTA
+TGACCTGATCAAGTCGGCGCCAGGAAGCGGATATTTGCATGCCCGCAACCTGACCCTGGA
+TGCCAGCGGCAACCTGATCGCTGTGGATAGCGCAGGCAATACGCGAGGTTACGGTACGAG
+CGCATGGGTTACCACGCAGATCAGCGCAGAGACCGCGCGCGCCGAGGCCGCCGAGTCCAC
+GCTGACCACCAATCTTGCCGCAGAGGTGACGCGAGCCAAGGGAGTGGAGGCCACGATCAC
+CAATACCATCGCCTCGGCTGATGACGGAACGAACTTGCGCATCGCGCTGGTCGGCATCAC
+CAAAGCGACTGGCGTTCCGTTCATGGCCAGTGCGCAGGGGGTGACGTACAGCCTGATCAA
+GTCGGCACCGGGGACCGGGTTTCTTTCGGCCCAGAATGTGACGCTGGATAGTTCCGGCAA
+TCTGATCATCGTCGATAGTGCTGGGAACACTCGCAATTATGGCACCATCAGCTGGGTTAA
+CACTCAGGTTGCGGCTGAAGCAGCCCGAGCCAAGGCGGTCGAGTCAACCCTGACTTCGAA
+CTTGGCGACAGAGACCGCGCGCGCCGAGGCCGCCGAGTCCACGCTGACCACCAATCTTGC
+CGCAGAGGTGACGCGAGCCAAGGGAGTGGAGGCCACGATCACCAATACCATCGCCTCGGC
+TGATGACGGAACGAACTTGCGCATCGCGCTGGTCGGCATCACCAAAGCGACTGGCGTTCC
+GTTCATGGCCAGTGCGCAGGGGGTGACGTACAGCCTGATCAAGTCGGCACCGGGGACCGG
+GTTTCTTTCGGCCCAGAATGTGACGCTGGATAGTTCCGGCAATCTGATCATCGTCGATAG
+TGCTGGGAACACTCGCAATTATGGGACTAGCTCCTACGGGACCATCTCCGGTGGCTACTA
+CATCCGCATCGGAAACATCCTGATCCAGGCGTTCTCTGCAGGGGTCCTGAATGCCGGTGA
+CTCAATTGCATTCCCTGTAGCTTTCTCTGCCGCGCCAGTGGTGTCCACGACCGTCGACAA
+CAACCGGGACGGCGCCAATCGTCCGGTCGCCATCAATCCGACGGTCGGGACAGTGACCGC
+GTCGGGTTTCAAGATCAACATCGCCGCCATCTCGGGGGCGAACCAGCCGGCCGGCACCGG
+CCAGGTGTGGGTATTTGCCATGGGTCCTGCATAAATGACTGACAACACCGAAGAGACGGC
+ACCGGTGGCCACCGCAGCTGCCGTGGACATGGCGACCGATGCGACATCGAATGTCGAGAC
+GCAATGGCCTGCCCGCTACTACGCCAGCTATGACACGTCCGCCACCGGTCCCACCGAGGT
+CACCGGCTGGTATGACGTGTGGGGCATGTCCAGCACGGCGAATGTGCCTGCTGCGGCCGA
+GATGCTTGCGCTTACGGCCGAGCAATGGGCTGCTCGGCTTCCGTATGGGCAGGGCGTGCA
+TGAGGGGACCATTGTGGCCTACACGCCTCCCAGCACCGTCACCCTGGCAGATCAGGCTGC
+CACAGCATACTCGGCGGCCGTCGCGACGGTGCAGAGTGAGTATGGCGTCCTCAATGAGCC
+GACGCCGGATGACTGGGTGACCTACCTGAAGGCGCTGAAAGCGATCCGGGATGGAGTCGA
+CACCACCAGCACGGCACTGCCGGCCGCGCCGGCGGCATGACGAAAAGCCCCATCCCTCGC
+GGGGTGGGGTCTTTTTTGTGCCTGAAGCTCGACCATGAAAAATCAATGACTTGCCAATTA
+TCCGCCGTAGTAGACAATCCATCGCTACGAGGTCAGATCATGAGCAGCATTGCATCCATC
+ATCCGAGAGCTTCGCATTGCGCGAAAAGAGCTGCGGCCAGCCGACTTTGTTTTTGGAGTG
+TTGATTCCAACGATGGTCTTGGCGCTAATCAGGAAGGGGTCAGTCCTTTACCATCTGATC
+ACGATAGCGGGACAGGTGGCGGCCGTCGCAGCCTGATCTTGATGGCCATGGATGGCCTAG
+TCCAGCTTCGATGCCATATCCGATGCCGACTCCCGGTAGTAGATCATCAGCGACTGCAGG
+TCTCGATGACCGATGGCCCGAGCAAGCTGGAGTACATCCAGCTTTTTGCTGAGTCGCCAG
+ATAGCTTCGGCCCGGCTGTCATGGAAGTGTAGGTCTTGAATGGTCGTTTTGTTCCGCACC
+TTGCGCCAGAGAGCATCCCGATTCGCATCCGATAGTTGGAAGCATGGGGCATCATCGCGG
+GGTAGGGCCTCCAGAATCTCAATGGCTCGAGACGATAAGGGAACGTCGCGGGCATCACCA
+TTTTTCGTTTTGGGAAGATGGGCGTAACGCTCACTGATGTGAACATGGTCCCATGTAAGG
+GCGGTGATCTCGCCGGAGCGCATCGCGGTCTCAATCGCAAAAAGGAATGCAAGCCCGATC
+CGATTTGTTGATGTCCTGCAGGCGAGTCCCGCATCCAGGCCAAAGGCCAGACTTATCTCT
+TCCACCTCTGCCTGGGTGATGCGCCTCTTTCGGCTATCTGGCTGATCGGGGAGCTGCATA
+CCCTTGATGGGGTCATGGTTCATGTAGAACCACTCTTCTCGGCAGTAGCGAAACATCGCC
+CGGAGCATGTTCAGCTCGCGAAGCATGGTCGCCGGCGTGACGCTCTGAAGGCGCTCATCG
+CGCCATGCAATGATGTCTGATCGATCGAGGTCTTGCATGCGCACCTTGGCGATGCTTTTG
+GACTTGAGTGATCGGCATTTCATCACCTCCCATCGCCCTGCGCCTCGCGTGGGGGCAACT
+TCTCGCTCGTAGCGCTCAAGCGCATCAGAAACGAGGCGGGGGATGGTTGCTCGGCCAGAT
+GAAACGGCCTCCTGTTCAATGGCCCATGCCGATGCCTGGGCCTTGGTAACGAAGACCTTA
+CTCTTGCGCTGACCCTTGATCAGAACCTGCGCTCGCCAGCGCTTTCCATGCTTGAAGATG
+CTTGCCAT
+>NC_017033.1|provirus_2089294_2107522
+CTATGCCCGAACATCGTGGCCATCCGAACCCAGAAAGCGTCGATCATCGACTGCGAGGCC
+TTGGGCAGCTGGCTGTGCTTCTGCTGAGGCTTCGGCCTGCTTGCGGATTGCGATGGCGGC
+CTCGACGCGTTCGACCGCGCTGAGCTTACTGCCGCCACTGCGGCCTGCTGGATGGTTTGC
+ATGGGCTGATCCTTGGGTGACGGGCTTGGGGCCCTCGGCATGGCGATTACGGGCGGTTGT
+GATGGCGTAGGCGAACGGCTTGGCCTTGTTGCGGAACTCCGCAGCTGTGGCTGCCAGCGT
+TTCCGGGGTGATGCCCTCGGCCAGAGCGGCGAGGAGATCCGGATGCTGAGGGTTCACGTC
+GGAGCAGCCGGCCTTGCGCATCAGCCGGCAGGCTCGAGCGGCTTCGGTGATCGTTGGGCC
+GTCGTCGCTTGAATCGCTCGCGCTCGTGCCCGCGTCTATCTCTCTCTCTTGGTTATTGGT
+TACTGGTTTATGGATACCCGTGTCTTCACATGTGACAGGTTGTGACGTCACATCGTCTGT
+CACGGGACTTGTCACACCTGTCACGCGTGACAACATCTCCCGAAGCTGTGACATGGGCGT
+ATCAAATCCCGCTGTCACACCGTGACGCTCGAGCTCAGCAAAGAGATCCGCGCGGCGCTG
+CCTGGACTTCTTCTGGCGTTCTCGCTCGTTTGCTTTCTTGCTTTGTCGATCCGGTTCGCC
+TGCGCGGTAGGACGCAATAATCGAGTCGGCACGATGCTGCCGCCAGAAGCCGTCTACCTG
+GACGAAGAACTCCTCGAGGATCGCGTCGACCGCAGCCTTCTCTTCTTCAGTGCGGGCACC
+AACAAGTCGATATGCCCTGCCCTCTGGAATGCCTTCCTCGGACGAGTAGTAGCGATCCAG
+CAGCAGCGTGTAGACGCCATGCTCGAGGATCGTCAGATGGCGGGTGTCCCGGGCGTAATC
+GCCCAGGTGGCGCTCGTAGTAGTTCATTGCCTCCGCACCTTCCGCGCGATCGCGGCGACA
+AGGCGAACCACGATGTCCTGGACAAGGTGTCCGGCGTGGCTGGTGTCCTTGGACTCGCTG
+TGTGTGATCACGCCATCGGCCAAGGACTCGCGGACGGTGCCTGCAAGCCCGCCGCTGCGC
+TCGACCAGCTCCAGCACCAGGGCGGTCACGTCATCCTCTTTCTGCTGGGCAACTTGGTCC
+AGCGGCGTCAGGGCAAAGCCATGGCTGGCAGCCAGCGCGTGCAGGATGCGCACATCGCCG
+GTGATGCCCATGAGGCGATCAGCCTCCGCCAAGGTCAGGTGGTTGCGGTCATAAGTCGGA
+TTGACCTTGTGGCGAAGGATGCCGGCTTGCAGACCCAGCCGCAGGGCAAGGGTCTCGGCG
+CCACCGGGATAGTCATGCACCGTGGCATGGGCAGCATCAACGACGTTCATACGGAAGGGT
+CTCAAAAAGATGGAGCATCGGTTTTGCTGTACTGGCAAGATGGCAACTCACCACCTTCGC
+CACTTGTGACCTGCTCATGGATTTCGCTTCGATCACCGGCCTCGCCTCCTCGACGATCTC
+GACAATCACTGGCGCCAAGGATCTGATCAGCGCTGCCGTCGACATGCGGGACGCTGCGAA
+ACAGAGCGCGGAGCTCGTCAAGGCCAATGACCTTTTGCTCAAGGCCCAGCAGAGTCTCCT
+CACGTACACCGGCCAGCTCATGGAGCTGCAGGGCAAGTACCTCGATGCCTGTGAGGAATT
+GCGAAAACTGCGAGAAGCCGAAGCGGACCGTGGTCGCTATACGCTCTTCGAGGTCAGCCC
+CGGGGCTTTCGCTTATCGCGCATATGCCACCCCACGACTCAGCACAGCTGGCGAGCCATT
+GCCGCCGGAGCCCGAGCATTACGTCTGTCAGCCGTGCTATGACCGCGGGATCAAGTCCGT
+CTTGCAACGCTTCAACCACTACGGGTCGATCTATCTTCGGTGCTCCATCTGCAAGCAGGA
+CTTGCCCACCGGCCGTACAGAGCCTTTCGGAGGTATTTGATTGCTTCACGCAGCCACCAC
+CTGCCCCGGGCTGGCGGGCCTCGGAGGTGAGATGATCGACTTCACAGACATTCCAGTCAG
+CTTCGAGACTGCCTGGACGTGCTGATACGGGACTCGGCGCCATTGAGAAACAGCCTGACT
+GCTGATCCCGCAGCAACGAGCGACTTTTGCCGGGCCGCCGGCCCGCTTGATGATGTCTTT
+GATGTCCATAAAGCTAAGGTAAGTCATGCTTACCTTTATTGGCAAGAGATACTTCCGTGC
+GCCTTGTAAATTTCCCTTACATACTCGCCCCATGAGCGATCAACTTTGGAAACGAATCAA
+GGAGGCCAGGACGGCAGCCAAGCTGACTCAGCAGGCTGTTGCTGACGCCTTTGGGATTGA
+TCGAGTCGCCGTCTCTCTCTGGGAAAGTTCAAGTGATGCCCGGCGAACGAGGCCAGATAT
+CGGCCGGCTAAGGGAGCTGGCCAAAATTACTGGCGTGAAGATGGAGTGGCTGCTAGGTGC
+GGATGGAGATCCAATCGGATCCACCCATCTCGTCTCACGAGATGAGACAGACCCGGCGTA
+TGTTCGATTCCCTCTCCTTGAGGGTTACGCAGGCATGGGGCCTGGAACATTCATCAGCGA
+CTACCCCGAAGTGGTCAAAGACCTCCGCGTCTCCCGCGAGTGGGTCTCGCAGAAGATGCC
+AGGCATCCCCCATGACGTGATCCGCGTGATCACCGGTCGCGGCGACAGCATGCGCGGGCA
+GTACAACGATGGGGATCTGATCTTTGTCGACACACGTGTGAAAAGCTTCGATCAGGACAG
+CGCGTACTGTTTCCGCTGGGCCGGCCGCGTGCAGGTGAAGCGCCTGCAGCTCATCAAGCC
+CGGGATCGTCCGCATCCTCAGCAAGAACCCCGACTATGAGTCGATCGATGCTGAGGTCGA
+GGAGATCGAGATCGGCGGGCGAGCCATTGCGGCTTGGACCTTGAGGGAATTTTGATATGG
+CAATTGAAAAGAGGCTTTATCAGCAAAGCCACTATATTGGATACAGTGCTAGTAAATAAA
+ATACACTTACTAAAAATCAACAATTCAATATCCGCACCACCAACATATAAAGCACCAATC
+CAAGGCAATAAGAAATGAATGTCAACTATTTTGGTTATTACCTTCACGACCACAAAACCA
+ACAAAGACTACCAGATTGATCTATCAGACCTATTTGACTCAATATCAAATAACAAATACC
+CAGATATAAATAGCAACCTCTACTATAATGGAGATCGAATATACCCACTCCCCTATCTTG
+GATCAACATACCTGCTAATTCAATCAAGAGACAATGAGTTAATAAAATTTATTGAAAGGG
+CAACATTGAAACATGAAGATCTATCGACCAAGCTAGGCACGGCGAATTCAGTCGGAATGG
+CAAGCTACGTTAAGTTCGAGCCTAATTGGATAGCAATAGTTAGCAAGGTTTTGTCGCCAA
+GGATTCAGGCGCTATCCCATATAATTAATCACTTTATTAGATGCCTAGGTAGTGACTTAG
+AATTTAAGCTCGCCGCATTTAATGATAAGGTGTCAAAAAAAGATATTGTCAAATTAAATC
+ATGTTAGCTCAATATCCATTGGATTGAACGCCTCCAGCTCGTTAACCAGTAAGTTGGTCG
+GCACACTTTTAGGCAACGGGTATCCAGCCACCTCTGATATCGGAGGCATAGAAATCAGAC
+TGAAGCCATCGTCGTCTAAATCAAATTTGAAGAAAGACCTTCAAAATATAGCCATTAATA
+TACCAGACTCTGATATCGATGAATTAGATGCTCGCGGCAAAATTGAGGCGACTGACAGAA
+TGAGGGATCTATATATTCATGGCTCTGGTGGACTTAAAGATTTCATCAGGCCTAGATACG
+AACATGAAATACCTTCATCTATTACTAAAGCTGCGTCACTAAACACGGCCCTACAAGCAA
+AAATAAAGGAGTTTAGTGGTGACCCGAATTACATCAAAACTAGCGATCCCCATGCTATTG
+GCCTTAACTGGTAATTCCCTAGCGCTACTTTTGTACATCCTATCCTTTACCAAAAAAGGT
+GGCGCACTACTCATCACCCTTGGAAAAAACTCCGATAATTTTGCAGCAATGTCCGCCAGT
+GCAGAATTCTCCATGCTTGGCTTTCTATCTGCAGTAATGGCCTTATTTAGCATCATAGGA
+CAATCGGAAGCACTCAGGCGTTACCGTATTAACGGCTACTTATCCAGCCTCTTGATCACA
+TTCTCCTTCGCGCTACTTGAGACTGCGATCGCCTTCACATCATCGCTAATCCTATTCTTT
+AAGCCAGTCAGTAATATATTCATCACGATTGCTTTCATTGCCCTAGTCGGATCATTCGGA
+ATGATGTGTGTCACCTTGATACCATGCATAGGCCTTCAAATAAGAGCATCGAGCGAAGAA
+TGAGGAGCCTCATACTCCTAGAAAACAATCTTAAATTCACGACTTATCAATCAAGGCCAT
+TATTCACTTATTCACAAGACCCAAGCATTGCCATGTGATTATTTCCCACAAGTAAATACC
+CAATTCCATCCAACTCCAAGAAGCCACCGCCAAGTTCTTCGATCGCTACATCGCCAAGGA
+TCTCAACCTGTCCCCAACATGGTCAGATCCAAAGAATACGGATGGGGCAAGCGGGCCAGC
+CCCGAACTATGACCGAAGTGGTTGCTATGCCCTGCTCTCCGGCGATGAAGTGATTTACAT
+CGGCCTGGGACGCTCTTGGAAAAAGGGGCGCTACAAAGAGCACGCAATTGGCGTGCGTCT
+GAGCGCTCATGTCCTGCTCGTCGACAAGGCCACAAACACCTACATCACGCGAGAAAAGTG
+GCGCGCGCTGGGTGTCGATTCCCTCATCACCATCGGCTTCCCTCACGAGATGTTTTTCCT
+TGCATCGGCGCTTGAGGACTATCTGATCAATGAGCTGAAGCCTGAAGGTAATGGGGTTGG
+GAAAGGGCGATGAAACTTCTAGCTTATTCGACCAGAGCTGTAACCACATCAAGTCGTGGG
+CGAGTGAGGGGTACACCTCAGCCAGACTGATCAATCACCCCTTAGGCGACACAGTACCTC
+ACAAAAAAGACACAAAGACGAGTTGTATTTAACAATTTGATCACCCCCCTTCAAGAGGAA
+AGCCTTACCTCACCACCCTAATTAAGATGCATCTATCACCAAACTCAGGATTAAATATCA
+TGTCGGAAAACAATAAATCCACTGCATTCAACGACAAGTACTATGAAGAACATTTCAACC
+TAGAATTCCTTCCTAAGAAATGCATGCTATGCCAATCAGGATCATTAAATAGAAAAGGCC
+ACCTCATACCAAAATTTATATCAACCCAGATAAAGAAGAAGCTTGATATACCCACACTTC
+GCTACAGTACAGTAACCGACCAAGGATTGATTAACGAGGGCAGGCATCGGCAAGACACGC
+TGGCATTACAGTTTCTGTGTGATAATTGTGAGAATAGGCTCGGACTGGCTGAAAGTGCCT
+TTTCGAACAGTCAATTTCGCCCACGTCTTGAAGGCGCCCAAATTCCGGATATGGATCGAT
+TAACTCATGACTTCATAACATCTATCGCATGGAAATATGCGACCTTCAATAGCTTCAAGA
+AAGTTGGAAGCAACTCTCTTTCAAGAATAGAGCCTGAGATCGAAAAAGCGAGAAAATATT
+TAGCAGGAGAACAAGAAAGCAATCCTTTTGATATATACTTCATAAACTTGGAGCGCGTGA
+GTGAGGTAATGGAGAATACAGACTCAAACAGATTTCTCTACAACATAACTCTCCGCGATC
+GAGAAATAAATCCAATCCAACTGATTGGAGACACTTGGTTTCCCGGCACCTCGTCAGGAA
+TTCCAATAATAACAGTTAGGCTAGGACCGCTATGCTACATTATAGCTCCAAGCGGTCACT
+TGCATCTACTCAGATGCATGCCTGAAGAAAGGCCATCGCCACACAACATAGTGGAATTGG
+AGGTGACGCAAGATATTATCAACCTGCTTATATCGCTAGAAGGAGGATTTATTGATGGCA
+TCCCATCAAGAATAAACAATCCAGCCATGGAGTATGAGATGAGATGAGATGCAAACTTCT
+CAATCTCCACAGAGGCCGCATATCACTAGCGACATAATATTCAGCACGCCTGACTTGATG
+ACATCATCAATAAAATTCCTACTCCCAAGTTTTTTTCATACACTACCCCACGTCTAGATC
+CGCCCCAAGCCTCAGGGTGGTCCTCGGCTCATCGTAGTCGCCCGTCTCTGAGTCCACAGT
+CTGGGCAAAGACCAAGACAGCGGCCTACTCTTCTTCCAGCCTGTAAGCCCTGCGCACCGC
+CGCATCCTCCGCCGTCTTCGGTATGGGGGTTCGGCGAGCAGCTGACCGCGTTGCCCTGTA
+ACCCACGTCTGCACCACATAGATCGTTTCTTTGGCCATAGCTCCTCCTGGTGAAGGAAGC
+ATGGGCCGTGCGCGCCTCTCGGTCGGCACAAACATAACCATATGCTGAACAATTGTAGGA
+TTACCTTACCCCCCACACGTAAGTTTTACTTGCCTTTAAGTGTAAGTATGGCTTACCTTT
+ATCCCGCGCCGCAGCGAACCGCTGACCAACGGCCTGGGATCTTCCACAACCTAGCGGGCA
+CCCGAGGATGGCATCGCCATGCGGAGGGCCCAGGGTCTGACCAGCCCGGATATCGGTCGC
+CGTGCGCCTTCGCAGAGGGCGCATTGGCATGGCGGTTGGCGCTTGCGCTGACCGAGGCGC
+TGAACACTCGGAACCCTCCGTGAGACATGTGGAATGGCCTGTAACGGGGCCGGCCAGCCG
+CCATCCCAATTCGTCACCCTGCCCGCTCGGGCTATCTCGCGCTTTTCCGCGCACCTTCCA
+CTGGAACCACAACATGAGCATTTCTACTCGCATCTATCGCGTCGTCGTCAACGAGGGCGG
+CGATGACGAAAGCACGCACCTGGTGCGCGCAAACACCCCTGACAACGCTGTAAAGCATGT
+GCTGACGAAGCAGATCAGCGCGAACGTCGCCACCCAGGACGAGCTGGTCGAATTGGCCAG
+CCAGGGTGTCGCCGTTGAGACGGCAATCGTCCATGATAGGCCGGGCAAGCCGGGCCGTCC
+GAAGCAGAAGGCGGCGTAAGCAACACCCTGCAGGATGCAGGCGTAAAAACCGTGCGAGGC
+CGGCGCAATACCCGGCCACTCATTCCCCACCGATGCGGCCTATCCCGCATCGATCCGCGA
+CTCAGCTGGCAGCCGTGCCGGCTTTTTTTGTGCCTGGAGAAAGTCATGCACTTCAAATCT
+GCTCAATACCGGCTGCTGGCAAGCATGCCTCAGTACCTCGACTACACCATGGGCCAGCTC
+GCCGCTCTGTGCACTGTGAACCCGAAATTCCCGCTGATTGCCGGGGGTATCCAGTGAGGT
+CGACTACCCAGTCTTTCATCCGCCGGCGCTTCAGGGGCTTCACCCTCTATATCTCGGCCA
+CGGCCATCAGCGGAACCCACGATGTGCGCTTCAACACCGGCGCCGGCGAGTTCACCCTCC
+AGATGACACCGGACGATATCGAAGGCGTGCAGTCGGTCCTCGAGCAGGCACACACCCTGA
+TCGATGCGAACCTGCCGGGCCGCTGTCGATCCTGCGCAGGAACTGGTGAATATGGTGTAG
+GAATCGGCATTCCTCGCGACTGCCCGGCCTGCTCGGGAACTGGCCTCAAATCGCGTCAGC
+AGGTGGCGGCATGACCGACAACGACAAGACGCTGCGGGATGAGTTTGAGGAGCGCGCCAA
+GCGCTTATTTCTTCCAATCGAAAGGAACAGATTCGATCAATACCGGGATACCCGCACTCA
+GCATATGTGGTGGGGGTGTCAGGCCGCCCACGCCAAATACGCCCCGCGATGGCTGCCGAT
+TGATGAGGAGGTTAAAGATGGCAATCCCCTCCTAGGCCTACGAGTACAGGACGATGCTGT
+CTGCCTCGCCTACTGGAATGATGAATCTTTTTACAACGTCTGGACTGGGGAGAAGGTCAT
+TCTTACTCACTATCTTCCAATCCCTGGTGCGTCGGAGGTGGTGGCATGACCACCTACCTT
+CAGCCGCCGGGCATGTTCTGCGATCGAGCCGGCGAGAAAAGGGCTGACGAAGAGGAGGCC
+ATCGAAAGGCAAGTTGCCTCTGACCTCTCCGATCCAGACGTCGCCGAGGAATGGCTGATG
+AGTTCGATCGACCGCTTCGACGACACCAAGGCAGCCGCCCAGGCACTGGCCCGGGGCGAC
+CTGCACTCGTTCCATAACATCTTCGCCCACTGGGTGCAGGCGCAGACCGAACTGCGCTTT
+GAGCAGAAGCTCCGCGGCTTCCACTGATTCAAATCCCCTCCCTTTTGATTGTGCTGGCTC
+AGGCCGGCAGGAGATCCCCATGTCTGAAATATCCGTGGCCAGAGCACAGAACCTGGCACA
+AATTGAGCGTGTAAATGCGCTACTTCCCACCTCGATCGGTGAGGCCATGCAACTCGCCGA
+GTTCATGGCTAAGTCGGATCTCCTGCCTCCGCACCTAAAAGGCCGACAGGGCGACTGCCT
+GCTGGTGGTAATGCAAGCTCAACGCTGGGGTATGGACGCCTTATCAGTGGCCCAATGCAC
+GTCAGTTGTTCATGGACGCCTCTGCTACGAGGGCAAGCTGGTTGCGGCAGCCCTGTACTC
+ACAGAAAGCCATCGATGGCCGCCTCCACTATGAAATCAGCGGCCATGGGCAGGACGCCTC
+CATCGTTGTAACTGGAACACCTCGTGGAACTGGTCAGACTCAATCAGTGTCAGGCTCCGT
+CCGCAAGTGGCGAACGATCACGATGAAGAAACAGGATGGCGCCCCTCCCAAGCGGGTCGA
+CAATGCCTGGGACACAATCCCGGAAGACATGCTGGTCTACCGCGGAACGCGGCAATGGGC
+GCGACGCTATGCGCCTGAGGTGATGCTCGGGGTGCAGACGCCCGATGAAGTTGACGATAC
+ACCCATGCAGACCACTGTGATCCACAGCACGGCTGCATCCTCTCCTGCCATTGAACCGTT
+GATTCCTTATCCGGAAGAAGAGTTCAGCAAGAACTTCGACACCTGGCTCGGACGCATCCA
+GTGCGGCCGGAACTCCGCCGAAGAGGTGATCGCCAAGCTGCAGACCAAATACACCCTGAC
+GCCCGGTCAGCTGGGCGCCATCCGTGACCTCGAAACCACCGAGGCGGAGGTAGTCGAATG
+AAGATCGTGAAGCTCACCCAGGGCACGCCGGAATGGCATGCCCACCGCGCCCGTCACTTC
+AACGCCAGCGAGGCCGGCGTGATGCTGGGCATTTTCCCTGGCGTGAAACGCAGCGACCTG
+ATCAAGGTCCGCGCCACCGGCATCGAAGAGGAGATCTCCACCTTCGTGCAGAAGATCTTC
+GATGACGGTCATCGCTTCGAGGCACTGTGCCGGCCGCTGGCCGAGCTGGTGATCAGCGAG
+GACCTTTTCCCCTGCGTCGGAGAGGATGGCAAGCTGTCGGCCAGCTTCGACGGCCTGACG
+ATGATGGAAGATGTGGCCTGGGAGCATAAAACGCTCAACTCGGTGCTGCGCAAGGCATTG
+CCGGAGGCGGCCCATACCGGTGGCACGATTCCGCTGCACGGCGAGGATGTCACCCTGCCG
+GCGCACTACTGCGCACAGATGGAGCAGCAGATGCTTGTCTCCGGTGCCGATCGTACGCTG
+TTCATGGCATCAGTCTGGGATGGCGACACGATGGTCGAGAGCCGGGCCTGCTGGTATCAC
+TCCGACCCCGAACTGCGCGCACGCATCGTTGCAGGCTGGGCCCAGCTCGAGCAGGACATC
+GCGGCCTTCACCTTGGAGCCGGAAGAAGCTGTCGTCGTAGGCAAGGCACCCGACCAGTTG
+CCCGGCCTGCACATCGAGGTCACCGGCATGGTGACTGCCTCGAATCTGGAAGCGTTCAAA
+TCTCAGGCGATGGCGGTGCTTGGCGGGATCAACCGGGACCTGCAGACCGATGAAGACTTC
+GCCAATGCGGAAAAAGCAGTCACCTGGGCGAAGGGCGTAGAAGATCGCATCGATGCGGCC
+AAGGCCAATGCGCTCGCCCAGACCGAAACCATCGACACCCTCTTCCGCACCCTGGACGAC
+GTGAAGGAGGAGACCCGGCGTATCCGCCTCGAGCTCGACAAGATGGTGAAGGCTCGCAAG
+GTCTCCATCCGGGACGAGATCGTCGACGCCGGCATCCGTGCAGCAAGAGCCCACTACGAT
+CAGCTGGACTCGAGCCTGGGCGAGTATGCCATCCGTCCCGATCACGCCACGTTTGCCGTG
+ATCGGTGCATCGATCAAGGGCAAGCGATCGATCAGCAGCATGCGGGACGCAGTCAGTACG
+GCCGTGGCCGACATCAAGATCGCTGCGAGCCAGTTTGCCGAAGTCATCCGCGCCAACATC
+AGCATCCTGAAAAATCAACATCAGCACCAGTCACTGTTTGCCGATCGGGTGATGCTTGCA
+CAAACCAAGTCGCCTGAAGATCTCCGCAACTTGGTCGCGGCTCGTATCGGCGAGTTCGAA
+CGGCAGGAGACTGAGCGACTGGAGCGGCAGCGCGAGCAGATCCGCAAGGAAGAAGCCGAG
+AAGCTGGCCCGCGAGCAGGAGGCGGCCAAGGTGGTGGACGAGACTCCGCCGGCATCTGCA
+AAAGTCGTCCAGTCCGCACCTCAGGCGCAGAGCCACTTTGCGGCATCAACGGACGAGATC
+CCAGCCAAGGCCGAAAAAGTCGCCCAACCGGCAGGCCCTGCCAAGACCATCAAGCTGGGC
+GACATCAACGCCTTGATCGCACCGCTTTCGATCACTGCAGACGGACTGGCGCAGCTTGGC
+TTCAACCCTGCAAGCATCGATCGCACCGCCAAGCTGTACCGAGAGGACCAGGTCCTCGAA
+ATGTTGAGGGCCATGATGGCGCGGATCAAGGATGTCGGCCTGGCAATGTCGGAACGCAAA
+GCGGCCTGACCATGGCAACCGACAACTCCCTTCCCACCATCGACATGTTCCAGCCGCTCG
+ACGGCTGGTTCGACTGGCGATCCGGCCGTATGCGAGTGCTTGTCCGAGAAGGCGAGCCAC
+GCATGCGCTGCGGAAAGATGGCCTGCGGCCACGATTCACCATGGGCCCCTGAGTTTTCCA
+AACCGTGGGGCACCTTCCCGGATCTGCCCGAAACAGTGGCCGAGAAAATGGCCGCCTGAG
+GACGAAGCATGAAATCACTCGGAAATATCAGCCGTGGCGCAGAAGCCGCGGCAAAACAAA
+TCAGCAAGAACGCCCTGGAGCATGGACGTGTCGCGATCTTCATCGATGAGACAGGCGATG
+TTGCCTTCGTCCCGCATTACGATCGCCAATATGGCGCGGCGCTGGCGACTCTTTCCAAGC
+AGCTCGTCGGAATTTATGAGGGCAACGCCTCAGGCACCGGTGTGTGCCACCCGACGCAGT
+CGGTCTATGCCATCTCCAAATCGGACCTTGAGCATTGGATGGGGTTTATCAGTATCCCGG
+CCGGTGTGTGCGCGATGACTGAACAGAGGGCTGCAGCATGAGCGCTGCTGAAAATATTGA
+TCCGGCCGAAGGCCACCTGTGGGGTTATGAGGACTGCGCCAGGTATATCGGCGTGGCCCG
+GTGGACCTTCGTCAACCGAATCAGCAAAGAGCCGGACTTCCCGCGCCCGGCCATCGAGCT
+GTCGAGAAAGATCCGGCGATGGCTCCCCGAAGACGTGAAGGACTGGGCCTATCGCTCCCG
+CCGCCGGAACCGGCGTTAACCCAGCTTGGCCGCCATATCCGTGGCGGACTCCCGGTAATA
+GATCAACAGGCTTTTGATGTCCCTGTGACCGATGACCCGGGCGAGCTGCAGCACATCCAG
+CTTCTTGCTCAGGCGCCAAATGCCTTCCGCACGCGTGTCATGGAAGTGCAGATCCTCGAC
+GGCCGCCCTATCCCGGTACTTTCGCCAAATTGCATCCCGCTGCGCATCATTCATGCCGAA
+GCATGGCTGATCGCCATCCCTTGGTAACGCCTGCAGTATCTCGGCGGCAAACGTGGACAG
+AGGAACGTCCCGTTTGTCGCCGTTTTTCGTTATGGGGATATGCACATAACGCTTATCGAG
+GTGAACGTGATTCCAGGTCAGCCCGACAATCTCGCCTGACCGCATCGCCGTCTCGATGGC
+AAACAGAAAACACAGGCCGACGCGGTTGGCCAAGCTTTCGGCTCGCAGCTCATAACCGAC
+ACCGAAGGCCTGGCGGACGCACTCAATCTCATCATCCGTAAGCCGGCGCTTGCGGCTCTC
+TGGTGACTTGGGAGCTGCAAATCCTTCGAACGGGTTATGGGTCATCCAGCCCCATTCCTC
+TCGGCACCGCCGAAACAGGCCCCGCAGCTCGTTCATCTCTCGCCGGACCGATGCCTCGGA
+GACCTCTTGCAGCCTGGCATCCCGGTAACGAATCAGGTGATCTTTGCTCACCTCGGGTAT
+CCGCACCTCGGCAATGGGATCCAGCATCAGGCGCTTCACGCGAGCGATATCCCCCCGTGA
+TTTGCCGGCATTCACATGCTCGTCGAGCAGGCGCTTGAGGGCATCTTCCACCAGCATCTT
+CTGCGCAGGTGCCTGCTTGCCCTCAGCCTCTTGGCGAAGGGACCAGCGCTGCGCTTCGGT
+CTTGGTGGAAAACGACTTGCTGACGCGCTGGCCATGAACCATGACCTGGGCTCGCCAGTT
+TGTGCCGCGCTTTGTGATGGATGCCATGTCGCCTCGCTGCTGGTGCAATCTCTGGTGCAA
+AAGTGGTGCACTAGGGTGCAACTTACGGCAATTTCTGGCAACTAAAACGAGAAAGGCCAC
+CCCTTGCGGAGTGGCCTAACTCGTCGTTTTCTAGCGTTTTTGCAATGATTTGCAATGTAT
+CGCTAGTTGGTATTGGTGCCAAGAGGGGCATCGAAAACCGCATAGAAATGCGGACTATCA
+ATGCCAAAAGAAAAATATGCCCCCCAAAAATGCCCCCAGACCGGCCGCGCTTGAATGAGA
+CAGCATGGGACAACCGGGCCATCTGGCGAGGATATCCACCCGTCGCCACTGTAGAAATTG
+ACCCGATCTGATTGGTGCCCCTTTAGGGCACTCGATCTGGTGCAGAATGTCGCAGGTTGA
+GGGGGGGGTAAAAGTGCGGAGGTTATTACTTTTTCGGTGTTCCAGGTGTTCCACCCCTCC
+TAAACCCGCATGGTTAAGCCATTTCTCAGGCAAAAAAATGGAACACCTCCAAAAACGGCA
+GGTGTTCCAGGTGTTCCACTTTTGTCGGCGAGGATCAGCGGCGATCAGCCCTCTGCGGAG
+AAAACAGCCGCGCCCTCAAGGACATAGAACCGCCCCTTGCTCAGACCCCGCACACGCACG
+GATTGCGAGGCCTTGCCATCCTTGCCCGGCTGCAGCCATCCCGCGGCGATCAGCGTCTGT
+GCCGCCGCCTTCGGGTTGAAGCCCCGCACCAGCTCCTCGAAGGCCTCCGGCATGACCAGG
+TACTGCTCGCGCCGATCCTCGGCGCCCGGCTCACCGACCTGCAACTTGCGACGAAAGCCG
+ACACGATGTGCCACCGGCCGGCGCTCGTTATCGTGGTCCTCCGGTTCGAAGCGGCTATCG
+CCATGCGCCTCGATGAAGGCCTTCACCTGAGACAGCAGCGCCGCCCGCTCGGCATCGGCA
+GGGCCGCCGCGGTCAGCCAGCCACTGGCGAAAACAGATCCGGATTGCTTGCGCTGCCTCG
+CCCTCGGGCCAGCCGGTGATGCCGTAGGCCGTCGCCAGCTCGCCGGCGGCGCCGATCAGG
+GCAAAGCGCCGGGCCACGCGCCGGACTTGCCCGCCGGCATCTTCGGGCACCAGGTCCGCC
+AGCATGTCGGTCATGCTCGCCTCAATGCGTCGACGCGATGCACGCTGGTCCGCCGTCAGC
+TGCTCGAGAAAGGACAGCAGCGGATGCCCGTAGTGTGTCGCCGCGGCCCGCTTCAACTGC
+TCGGCCACCGCGCTGGCGCTGCTGCCCACCGGCACCGACTCGAACATGCCATGCCCCATA
+CCGGCATCCGCTGCCACGTCGATCACTCGCACCTCATGGCCAGCCCGACGCCGGCCGCCC
+GACTCCACCATCAGATCGCCCATGCTGACCTCACCCGAGGACAGAAACGCCGTGCGCCAT
+GTCGCCACCGGCCGGGCTCGGCCACTGCGATCTGATCGCCCTTTGCCCTGCCCGTTGGCC
+AGCATATAGGCGACCCTGCTGGCGTCCTTCGGCTCCAACTGGCCCAGCTCATCCAGCGGC
+AGCATCAGGTCGTTGTGCAGGGTCGCCACGCCCTCGAGCGCGTTGTCGGTCTGCCGCCAT
+GTTCGCATGTAGGCCGGCGGACCATAGACGGACGATGCCACCAGCACGGCAGTCGTCTTG
+CCGGTGCTGCTCGAGCCCCGCAGATGCACGCCGCCACCGTCCATGCCGGCCAGATCCAGG
+CACGGTGCAGAGAAAGCCATGGAGACCGCCAACACCAGGCGGCTATGCCCGATGCAAACC
+TTGGCCACGCTATCGGTCCAGCCCTCGAGCGTGCCGCCGGTGGCGACTTGCGCCGCACCC
+GGTGCCGTGGTCTGGAAGATAACCGCCTCAGCTGCTGTCGGGCCAAAGGTGCGATCAGGC
+AGCGCAAACACCTCACCATGCCAGCCGGTGCGGCTCACGCTCCGCGCCTTCTGAGTGGGG
+TTGGCCTGGGCGATGTAGTCCATCAGCAGCTTGCGGGCGTGCTGGGAATTGGCGATCACC
+AGACCTTGCCCCAGCAGCTCTGCCCGCAGCTCCGCGCCATCGGTGGCCAGCATGGCGCAG
+GGCATCGCCCAGCGGTGCGCCTTGCCGTCCCGATCCGTGAAGGCCAGCAAGCGCCCCCAT
+TCTCCGCCATCGGCATTGCGTGTCTCGGCCTCGACATACAGAGGCGCGCAGATCCACGTC
+GCCGGCTTGTCGCTGTGCGGGTCGCTGAAATAGACCCCGTGGCGTCGGCCTTTGCCACGC
+TCGACCACTTCAAAGCCGGGCCCGGCCGGCGGTTCGGCATTGCTCACCACCAGGGCGAGC
+GGCGGCAGCGACTCGGCCGCTTCAATCGTGGAGCTGGACATGATTTTTGACCTCGATAGA
+TTCGGGCGTGCCGCCTTGCGCGGCCAGGGTGGTGGCGTAGTCGTTGAAGTCGCCGGGAAT
+GGGTGGCACGGCCAGCGCCGCACCGATGGCACAGGCCGCTTGTGTCGCCGCCTGCACACC
+GGGATTGCTGCCATCCGGCTTGGCATCGTTGTCCGCGCAGATCGTGATTGGCAGATCCGG
+GTAGCGATCGCGCATCACCAGCGCTACCGCCAGCAGGTTGCCGGCACTGAAAGCGACCGC
+CACCGCCTGGCCGGTGCTGGCGTGCAGACTCTTGGCCGTGGCCACGCCCTCAGCGATCAA
+CAGTCCGTCGCGGACCTTGCCCAGCAGGCAATAGGCGCCGCGGACCATGCCGCCGGGCAA
+AAACCGCTTGTCACCGTCGCCGCGGATACGCTGCAGGTTGACCAGGCGGCCCTCGGCATC
+GTGCATCGGCACCAGCAGCTTGCCGCCAGCTTCCCGCAGCCCGTCAGCCGTCACGCCTTT
+ACGTTGCAGGTAGGGATGCCGCGGACTGGCCGGGCTGGCGCGCTGCCACTCATCGAACGC
+ACTGCCGGCGGCACGCCGCTGGCGGTGACGTTGCTCGGCATCGCGTGCGGCGCGGGCCTG
+CTCGATGGCGATACGCTGGCGCTCCAGCTCGTCGGCCGTCATGGTGCGGCCGGACTGGCC
+CAGCACCACAGTATGCTGCCCGCCTTTGCGCCAGCTCCCGAACACCGCGACAGGTCGCTC
+CGTATCAACATACACCACGGCCCAGCCATTGCGCTTGTCGCGCCGGTCGCCTTCATCGTG
+GAACCTGCACAGCACGCCATCCAGGCGCAGCCGGGTCGGATCGGTCGGCGTGATGCCGTG
+CTGGCGCATCGCGGCCACCAGGTCGGCCAAGAGATTGCCGGTGTAGCGGCTCATGCCAAC
+ACCTCCCCAGCGATCACCCTGGCCATGTCGGCCACCGTGGATGGATTGAAATGGAACTCG
+CCCGGGTCGTCGTTGAGTTTGATCTGCTGCCAATCGCTCACGTCATGAGGCCAGCTGGTC
+AGCACCCGACTGGCCGAGCCCTGGGACCGATTCAAGGCGGCCATGCGCTCGGCCGCGGCG
+CGATCGGTGGCCCAGACATTGCACAGATACAGGATCGACACGCCCGGCAGCGGCGACGGC
+AGGCCCGCCAATGATCGATGATCTGCCGCGCGCACCATGTCGGCATATTCCCGGGACAGC
+CGGCCGACCTGCGATGTACGGATATCGCCCATGATCGAAACCACGAAGTAACGTTTCATC
+GCGGCACCTCCCCGCCGGCAGCTGCCGCCCGCAAGGCTTGGTTCTCTGCCATCAGCTGGC
+GAACGGTCGCCCGCAGCTCGGTGCGCTCGTCGTCGTAGTTGGCACCGGCTTCGACAAGCA
+GGCGCTGCATCTGCCCGTAGACAGTCCGCTGATCGGTCATGGTGGCCAGGGTCTGAAACT
+CGGCCCGAGCATCATCCGCAGTCAGGCTGGCACGCTTGGCCAGGATCGCAGACCGGAACG
+ATGCTTCATCCAGCACGGTCCACAACTTCACGAACACGTCGCGCAGGCCGCGATAGGTCG
+GGGTGTTCAACGGGTCAAAGCCCGGCACGGTAACGGCGCTCATCGCAGCACCTCCACCGC
+CATAAAAGCGCAGGTGGACAGCACAACGCCGGCAACGAACGCAGCGAAGATATCCAGATC
+CGTGCTGCTGACATGCAGCCAGCCAGAAGGCCGGAAGGAAAAACGAGACGTGTGGGAGAT
+GGTGCAGGTGCGTGCAGACGCACCCTGGGCATGATGTGCCATGGTGGGGTTCCTTGAGAG
+ATTGGAACCGCCGCGCACAGTCGCCAAACCATGGGCGGCGGGATGCAACGGGTTGGCGAA
+CCGGTACTCAAGGAACCCGGCAGGCCCGTAGGCCTCCCATTGCACCCCGCCATAAGCTGG
+GCATGACGCAACAAAAAAGCGCCGAGTTGGCGCGTTGCGCCTCGAGTAAGTCGGGTCGCC
+AAACCCGGCCCCGGATTGTGCCGGGACGTGCGAATGGTGCGCGCTGGCGCATGCGATGGT
+CAAGCGATTTTGCATGGCTGATTCCTGATTTCAGGCAAGCCGCCCCCGTCCGGCCCGGAA
+ACTCCATGGCCGGTGGGCACGGTATGGGCTGGGGGAGTTACGCCGCTTCGGGCGTGCTGG
+ATGCGATGCGCAGGGTGTAGATGGCCACGCGGGGATGCTTGCGGCCCTGGTCGTCGGTCA
+TGGCTTGGAGCCGTGTGTCGATCAGATGGCCGGCTTCGCGCAGCTCCTTGATCCGTGCGC
+CTGGCATCATGATGTTGAGGTGTCGGCGGGCGTACATGGTGCTGACTGGCCCGAATCGCA
+GCGCCTGCAACATCCGGTGGCGCTGGGCCGCCGTGCTGGTATCATCAATGCGCGAGATTG
+ATGCGATGGGGCTTGCCTTCGGGTGAGCCTTTTTCGTGTCCGGCGCCCGCTGGATCTCCG
+TCACCAGGCGCATGCCGCCTGTCTGGCCAGCCGTCCCCGGCAGTGCGCGATGACTGGCGG
+CCAGATCCATCAGCCGCTGCTTGCGGTCCTCGTAGGGGATGCCCTGCCCCAGCAGCATGA
+TGTTGAGCCCTTCCAGCCTCCCGACCAGATCCAGCTCGGCCATCGTCATCTGGTCGCGGT
+CGCGCCCGGCAAACTTGCCCGTCACCACCCAATTGATCAGCTTTGCCTCATTCATGTAGT
+GATGGGGCTCCGTTTCCTTGCCCTGGGCAGCGCGTACCGTCTGCAGCATGGCCGCCTGGA
+TCTTGTGGCTGCTGGCGGCGACATGGCGCTGCCGGCGCCAATCATCCGTGCGATGCGTCG
+ATGCCTCGTAGGCGTTGATGACGCGCAGGTAGAAGGCAGGACTGACCCACGTCGCATAGG
+CGATGGCCAGCTGCTTGATGACATAGGTGCCGATGCGCTGCTTGGAGGCAATAGGCGTAA
+TTCCGCCTTTTTCGATTTCAGCGACCAGATCCTGGGTCTGCTGATTCTCGAGCCAATACT
+TGGGGCGGTGCCGCTGTTCGCCGCCGGCAGCTTGATGCAGATCGTTGAGGCAGTAACGGC
+CGGCCTTGTCCATCCGGATCGATGTGCTTGCGATCGACAGGCCATCCAT
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_018068.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1081 @@
+>NC_018068.1|provirus_1361108_1399802
+TCATTCCCCTTTGTTAATCTCATCGATGTGTTTTTTATAGATGGTTGTTATTTCACGAAG
+AAGTTTATCGGATTGCTCATCCGTTATTTTACCTTTTTTTCGTAATCGTCTTAATTCTGC
+CAAAGTATCTTGAAGATATGGATGTTCTAATATTTCATGCCTAACTATAACGGGTATTTT
+TCCGTACCTTTGGAACAAATCGTTATCTTTGACGCTATAATAACTGGCAAATTCTTCAAT
+GAGTTCATCAGAAGGCATTCTGACGCCCTTTTCGATTTCAGATAAATATGAAGGGCTTAT
+ACCTAATGCCTTACCCACGACTGGCTGCGTTAAACCTTTCTGAGTACGAAGGGAATGAAG
+ATATTGGCCAGTGTCATATTGTCTTATTAGCTGCTGATGTTTCTCGTCCTCCAACATATC
+ACCCACGTTTCGCTAGTTTATTACCATAATATACAAGCTGACATGTAAATAACTGTCTGC
+TATATTAATTCATATCAGATAACTTCACAAGCTTGTTAATATAACAAAGGTAAAGAGTGG
+TTAATTTAACAAACATGAGTAGTATTGTTATCTTACAATGTTATCGTTACCAGTCTTAGA
+CGATTTATGCAAAATAGTCTCCTTGGCATCACCGAGGAGGCTATTTTTAGTTAGGAGGTG
+AACGTTTACGAAACTTGTGTATATTTGTTCGCCATGCAAAGGCGACATCGAAAGAAACAT
+TGCGAAGGCACGAGAATATTGCTTGTTCGCGATTAAACAGAACTGTTTGCCGATTGCTCC
+GCATGTTTTTTACACTTCGATTTTAGAGGACACTGTCGAGGAACAACGCAGAAATGGTAT
+GGCAATGGGCCTGGAGCTGTTGAGCATATGCCAGGAGCTGTTGAGCATATGCCAGGAGCT
+TTGGGCTTTCGGAGATAAGATTTCAGCAGGAATGATGTCCGAGATCGAAGCTGCCGAACA
+ATTGGGAATTCCAGTCGTGTTCTACAGTGATAAGTGCCAAAGGAGAATTTTGAAAGGAGG
+TGAATAAGCCATGAACTTGAGTAAGGAAAAGATAACCTATCTTATTCAACAACGGGGACT
+CACTCAGAACGAACTTGCTCGCGCCCTAAATATTCGACCGGGTTCATTATCCAATGCGCT
+ATCCGGTAAACGTGGGGTTGGGAGGAAGATTCTATCCGCTTTGCTCAGGGAATTCCCAGG
+AGAAAGTGCTATGAGTCTTACCAAAAGGCAGGTGGCAGTATGAAGATGAGCCCATTGAAA
+GGAGGTGATCCAGCTTATGCGCACAGCAAAAAGGCCCGTCGGTGCAGCAACACCCAACGG
+ACCCGATACAAAATATAACCAGTAAGAGTATACCACGGGAACATGAACGAATCCATATCG
+GTTAGAAAAGGAGAGAAAAAACCTTCATGAGCGATGATTTAAAGGTTATCGAGCAAAGAG
+ACCTTCTGGGAAATGATTTTAGGATATACGGAGACATGGAAAATCCATTGTTTCTGGCCA
+AAGATGTAGCGGAGTGGATTGACTACGATCCCAGTAAGGTCAATGAGATGGTTGCTATGG
+TTGATGACAACGAAAAGCTGACCGAGACAATTTCGTGGTCAGGTCAGGGACGCAAAATGT
+GGTTCCTCACCGAAGATGGACTCTATGAAGTTCTCCTTCAGAGTCGAAAACCCAACGCTA
+AAGAATTTAAGAGGCAAGTTAAGCAGATTCTTAAAGATATTCGGAGGCACGGTCTATATG
+TAACAGATACCGCATTAGAAAACATGCTCACCAGTCCTGATTTTGGTATAAGGCTCCTTA
+ACGAAATTAAATTAGAACGAGAGACAATTTCTAGGCTAGAACAAAAAATCGAAGAGGACA
+AGTCCAAAGTCGCTTTTGCCAAGGCGATTGAAGCAACAAACGATACCATCTATGTAGGGG
+ACTTGGCTAAACTTCTTAAGAAAAACGGTACGGATATTGGGCAAGCGCGGTTATTTGAGT
+GGCTGAGGCAGAATGGTTATCTAATGACGGGATTCAGTAAAAATACACCGATTCAGCGGT
+CTATAGAAATGGGTCTCTTTGACGTTAAAGAAGATGTGTTTACCTTTCCCAATGGGGACG
+TTCGGATCTCCAAAACTCCAATGGTTACGGTAAAAGGGCAGACGTATTTTATAAATCTGT
+TTGCGAAAAAAGAAGGAGACATCAGAAGAAGTGAACCCACGGTTGAAGTGGATATCAATA
+ACGCGCGATGATTAAACTCCTCCCACATCAGCAATCGGTTCTTGAACAAACAAAAGCCTT
+TCACCGAGTCGCCTATTATTTGGATATGGGCTTAGGCAAGAGTTTTGTTGGTTCAGAAAA
+GATGCACCAACTCAAAACGCCTTTTACTTTGGTGATCTGCCAAAAATCTAAAATTGATGA
+TTGGGCAGCTCATTTTCGAGAGCATTACGACTATAACGTTTATAGTTTCAACAAACAATT
+TATCTCGGAAATTCCGGAACACTCTGTGCTCGTTATCAATTATGATCTCGCCTGGCGGAG
+ATCGGAGTTATTAAAACTATCCAACTATACGCTGATCCTGGACGAATCCTCTTGTATCAA
+AAATGAGACACGGCGACGATCAAAGTTTATCCTCAAACTGAAAGCGGACAATGCCATCTT
+GCTTTCTGGTACTCCCACCGGGGGGAAATATGAGGAACTCTGGAGTCAATGCCAGCTGCT
+TGGCTGGGCCATTTCAAAGCGCCTTTATTGGCAGCAGTTTGTTAAAACGAAAATATTGGA
+GGTCGGAGGCTGTCCCATCAAGGTTGTTACTGGGTATAAAAATGTGGATCGTTTAAAAGC
+CAAGCTTCGTGACTATGGTGCTGTCTTCATGAAAACCGAAGAGGTTCTGGATCTTCCGAA
+AACCATGGATCAAATTGTTAATATCGCTATCACGAAGGAGTACCGTCGCTTCAAAAAGGA
+CCGGGTAATCGATATCAACGGTAAAACGCTGGTAGGAGACACACCACTGACCCAGCTCTT
+ATATCTCCGGCAGTTAGCCGGAATGTACAACGAGAACAAGATTGAGCGTTTGACAGATTT
+AATTCAATCAACAGGGGATCGCTTGATCGTGTTCTATAATTTTGACCTTGAATATGGGGT
+TATTAGGAATCTTTGTGAGAAAACGGGTAAGCAAGTCTCTGTGGTCAATGGGAAGCTTAA
+GGATTTAAAAGCCTACGAAGAACACTCCGATTCGGTAACGCTGGTTCAATATCAGGCGGG
+AGCCATGGGTTTAAACTTACAGCTAGCCAATAAAATCATCTATTTCTCACTCCCATTATC
+CAGTGAATTATGGATGCAATCTAAAAAGCGAATTCACCGGATCGGACAGACCCAAACGTG
+CTTCTATTATTATCTGCTCACAAAAGGAACCATTGAACCAAAAATCTTAGAAACCCTGCA
+ACAACGTAAAGACTTCACGGATCGGCTATTTAAGGAAGTGGACCATGACTGAAGCAGAGT
+TCCAAAAACAAGTCCAAGAATTCCTCCGCCGCCAAGGGGTTTGGTATGTGAAGTATTGGG
+GTGGAGGACGGTTTACCAAAGCAGGAGTCCCCGATCTTCTATGCTGTGTCAACGGTTGGT
+TTGTCGGCATTGAGTTAAAAACGGAAACGGGCAGAGTATCAAAACTTCAAGAATACAATC
+TCACTAAAATCCAAGAATCGGGTGGACAAGCTTTTGTTCTCCGTCCAAGCGGATTCAAAG
+CCTTTAAAGAGTTCATCGAAGGGAAGTGAACAAACTGCAATTCAGCCACAGCCGAGTCAA
+TACCTTCGAAAAATGTCCCTATCAGTTTAAACTCCGCTACCTGGACAAACTCACCACGAT
+CTCCGACTCCTTAGCCGATGATGCACTGGTTGTTGGTAACGCCCTCCATCTGGGTGCTGA
+GAAGGACGAACGAGCGATGTTGGAGTTTTACTTCTCCAACTATACCGTGATTGATGATTT
+GCACATCAACGAAACTATGAAACTGACCGCCCTTTTACGAAAGCTTAAGAACCATCTTGG
+CAGTATCTCCGGCCAATTTAGGCAGGAATATAAACTTGAACGGCCCGAGTTTAAAGGTTT
+TGTGGACTTGATCGTGACTAATCCAGATAGAACCGTTGATGTCTACGACTTTAAGTATTC
+CAATCATGTAAATAACTATCTCGATTCCAAACAGCTTCATCTCTATAAATTCTATCTCGA
+ACGGGAAGGGTTTAACGTTCAGCGAATCGGGTTCATCTTCATCCCCAAAACCTCTATCCG
+TCAAAAGAAAACGGAAGATCTTTATCAGTTCAGAAAGAGACTCATAGAAACCCTCAGCAC
+AATGGAAGTGCAAGTGGTTTACCTCGATTACGATTTCCAAAAAGTTAAAGAGTTCTGGGA
+CTCTTGCGATTTGATTGGTGAGACAATCGAGTTTCCTAAAAACCAAACGAACCTGTGTAA
+CTGGTGTGAGTTTCAGAAATATTGCCTAGAAGGGATTGACTATATGTTATTACCAAGTGC
+CGAACGTCGCCAAATTGATGCTGTGAGTAAGAAAGTCATCTGGATTTACGGTGCTCCATT
+TACCGGCAAGACTTACTTTGCTAATAAATTCCCAAGTCCTTTGATGCTCAATACTGACGG
+AAATGTCAGGTTTGTAGATGCACCGTATATCGCCATAAGAAACGAAGTAACGGTCGAGGG
+ACGGCTGACTAAAACAAGATTGGCCTGGGATATTTTCAAAGATGCCATTGCCGAATTAGA
+AAAGAAACAGAACGAGTTTGAAACCATTATTTTGGATTTACTCGAAGACACTTACGAGCA
+TTGCCGACTTTTTATGTATGACAAATTAGGCATTGAGCATGAATCGGATAACAGCTTTAA
+AGCCTGGGATATGGTCAGAACAGAGTTCTTATCCACGCTCAAACGCCTCATCAACTTGGA
+CTATAACATTGTTCTTATTTCCCATGAAGATATGTCTAAGGACGTGACTAAACGAACGGG
+AGACAAGATCACAAGGATTGCTCCGAATATTCAAGAGAAAGCTGCCAACAAAATCGCTGG
+GATGGTGGATATCGTGGCCCGAGTAATCAACGAAGACGATGAACGGTTCTTAACCTTTAA
+AACCAGTGAGGTAGAGTTTGGTGGTGGTAGACTTACACTCATTGCTAAAAAAATACCCTT
+GGAATATGAATCATTTGTCAAACTATATGAGGCTGTGCAGAACTCGGTTCCAGCCAGCGA
+GACAAAGACCCGTCGAGAACGGAAGAGTAAGGACGCAATGGAAGAAGAGGTTACCCAACA
+AGCAACTATTGAAACACCAGAGGAAACCGTATCTGATGAACCCAGCCTGAAGGTTGAGCC
+AACCCAAGGTCTAGAAACACCTTCGCTCAGTGAACCTCCGAAACGATCCCGCCGTACCAG
+AACACAACAATAAAAGGAGATGGATTATTCATGGCAACAATATGGGAAAAATTCGACAAA
+GCAATTGATACAAAGGCACTCAAGGAAGACGTGTTAGCCGCACAAGAAAACAAGCAAGAA
+TATCGGGATGTTCCGAAGGGCCATTATGAAGTGAAAATAGAAAAACTGGAACTTGTCGAA
+TCGAAAACGAGTAAGCCGATGGTGGCCTGCTGGATGAAAATTCTGAGTGGAGAGTACAAG
+GGACAATTAATATTCTACAACCAAGTTATTCATGTTGGGTTTGGCATTCACAAGGCCACT
+GAGTTTCTGCGTTCCTTAGATAGTGGTATTGAAGTTACCTTCGATAATTACAAACAGTTT
+TATGAATTGCTTCTGAATATCTTAGAGGTGATTGAGAACAAATTCGAATATGAAGTTGAT
+TATGGGGAAGACAAGAAAGGCTATGGCACCTACGTGATTAAGGAAGTCTTTGAAGTTTAA
+CAACATGATTAGGGGATTCGCAAGAGTCCCCTTTTTCTAAAGATACGAAGAGAAGAATAC
+CGCTCAGGGGTATAACAGAAATAATAGGGGGTATAGGCATCGTGAATAGTCAACAAAAGC
+TGAGTAAAACCTCTAAAAAAAATCGAGAAGAACATTTTGATCAACGAAATCACGAGGGGT
+ATTTTGATCTTACAGCATTCCTTGCTTTAGAGAGAATAATCGATCAAAACAGACGGCAAC
+CGAGGCCTGTCCCAACGAGGCAATCCAAATGATCTTCTTCGATGCCGAAGTCTTCCGCTA
+CGATTGGTTGTTTGTGTTCATGAATACAGATACCCAAGTAACGACTGTCATCGTGAACGA
+CCCGGAGAAACTCAAACAACTTTACGAACAATACAATAATAACGTCTGGGTCGGATTTAA
+CAGCCGACATTATGACCAGTATATTTTTAAAGCGATCCTCTGTGATTTTGATCCATATGA
+AGTGTCACAGTGGATTATTTCAAATAGACAAGGTGGCTGGGGGTATAGTGGAGCCTTTCG
+GAAACTACCGTTTTATACCTTTGATGTCATGACGACTCGCTATCACGGATTAAAGCAACT
+TGAGGGGTTTATGGGGAACGACATCCAGGAATCCGATGTGTCGTTTGATATCGACCGTAA
+ACTCAGTTCAGAAGAGCTGGAAAGTGTCATTCAATACTGTCGGCACGATGTTGAGCAAAC
+GATCGAAGTATTTTTGAACCGAATAGAAGAGTTCGAGTCTCAAATGGCCCTCATAAAATC
+CTTCAAACTCCCACTGAGTTATATCAGTAAAACGAAAGCCCAATTAACCGCCGCTGTTTT
+AGAAGCCGTAAAGGTCGATCGTAATGAAGAGTTTGATATTGTCCTGCCGGACACTCTGAA
+AATCCAAAAATACCGGCACATCACAAACTGGTATATGAAACCGGAAAATCGGGATTATGA
+GAAACAGCTCGAGGTAGATATAGCCGGAGTCCCCCATGTTTTTGGCTGGGGTGGGCTGCA
+TGGAGCGATACCAAACTACCAGGGCGAAGGGATCTATCTGAATGTCGATGTGGCCTCATT
+TTACCCGGCAATTATGATTGAGTACGATTTTCTTTCCCGCAATGTGGCTGACTCCACCAA
+ATATCGTCAGATTCGGGATGAACGTTTAAGGCTTAAGGCTCAGAAAAACCCCATGGCCAA
+CCCCTTGAAAATTGTCTTGAACAGTACGTTTGGGGCCTCCAAGGATAAATACAATCAGCT
+CTATGATCCTAGGCAGGCCAATAACGTCTGTGTTGGCGGACAGTTATTACTGTTGGATCT
+TATCGAGCATTTGGAAGGTTCTTGTAAGCTGATCCAATCAAACACCGATGGATTGTTTCT
+TCAGGTTCGGAGGGAGCGAGACGTTGACCGAGTTAGAGCCATTTGTGCGGAATGGGAGCA
+GCGCACGAGAATGGTCTTGGAGTTTGATGAGTTTGAGCGAATTTTCCAGAAGGACGTTAA
+CAATTATATCGTCATCCAAAACAACGGCAGTTATAAATCCAAAGGCGCTTACGTCAAAAA
+ACTCGACATTTTAGATTATGATCTTGCCATCGTCAATAAAGCCATCGTGAACTATTTCAT
+TCATAACATTCCCGTCGAGCAGACCGTAATGGCGGCGGAAAAACTCATCGATTTTCAGAA
+AATCGTTAAAGTCAGTGAGAAATACACGTATGCCACCCATGGAAATGAGCGAAGGCCGGA
+AAAAGTGCTCAGAGTTTTTGCGTCAAAAGTTAGGACGGACCCAGGAGTTTTTAAAAGGAA
+GCAAGTGAGGGATGATTTCAGGATTGAGAAGATAGCAAATACGCCTGAGCGATGTTTCAT
+CATGAATCATGATATTAACGATGTCGAGATTCCAAGAAAACTGGATCGGAGATGGTATAT
+CGATCTAGCGAAGAAACGGATTGAAGATTTTTTTGGTCATTAAATATCAGTACGGAATTT
+AAACTTAGTGGAGGTTCCTCCCAAAATAAACCCTATTTAGATTAAAAACTGGAGGAAAAA
+CCTCCAACTGAAACTTATCACCCTTCGAAATATGTAGATATTCACTTAAAAAGTGGAGGT
+TGAACCTCCAGAAAATCGCTTCTCAAATGACAAAAAATTGGAGGTTAGAATGGAGTTTTA
+CAAAGGGTATATCCCTACAAGAAATAAAAAACCACTTAAAGAGTTTAAAGACGGCAATAA
+TTTTATAGTTCTTGACTGGGCTAGGAAACTCGACGAATATGCCGGAGTGCTTGCTGAGGG
+AGTCATTCTCATCGATATAGACGACATGGAAAGTTCTGATATCGTCTTACGAATCCTCGA
+TGACCTTAGTATCCAAACCCTTGTTATTGGAACGACCCGAGGAAAACACTTCTTATTTAA
+TAACACCGATGTGACCACTAACAAGACCCACACGAATACTGCTATTGGTATAACCGTAGA
+TATCAAGCTTGGCTCAAGGAACTCTTATCACATTTTAAAGTTTGATGGAGTCAAAAGACC
+TGTTCTTCGTAAAGCTGATGAATTGGCAGAACTTCCAAAGTGGTTGCTGCCCGTTAAGAG
+TAGCATTAGTTTCTCTATCTTGGAAGAAGGGGATGGACGGAACCAAGCCTTGTTCAATTA
+CATCCTTACTCTGCAATCCGAGGGATTTAATAAAAATGAGATCATTGAAACGATCGGGAT
+CATCAATAAATATGTTCTCAAGGCACCTTTGGAGCAGCGTGAGATTGACACCATATTAAG
+AGATGAAGCCTTTAAGAAAAAATCCTTCTTTACTAAACAAGGATTTCAGCATCAAGACTT
+TGCTAAGTATCTGGTGCGAGAAGAACACATTGTCTGGATCAATAACGTGTTGCACATTTA
+TAAGGACGGAATTTACTCTGACAAGCAACGAGACCTAGAAATCGCGATGATCCGCCATAT
+CCCAGAGCTCACTCAATCTCGGCGAAGAGAAGTCTTGACCTATTTAGAACTTGTTGCAGA
+CCATGTGGAAATGTCACCGCCTAATTTTATCGCCCTAGGTAATGGCATCTACGATCTAGA
+GATGGACGAACTTCGGGAATACTGTCCCGAGATTGTGATCAAGAACCGGATTTCCGTTAA
+TTATGAACCGGAAACCTATGATGAAACCGTGGACAAGACCCTAAGTAATATCTGCTGTCA
+AGATACGGAACTTAGGATCCACTTAGAAGAAGTCATCGGGTACTTGTTACTGCGCAGAAA
+CGAGTTAGGGAAATTTTTTGTTTTAACAGGTTCAGGATCCAACGGTAAATCCACATTCAT
+TGATATGCTCAAGTATTTTCTCAAGCCGGAAAACTACTCAGCCTTAGCTCTTGGAGAACT
+TGGTCAACGGTTTAAAACGGCAGAAGTGTTCGGAAAGCTCGCGAATTTGGGAGATGATAT
+TTCCGGTAAGTATATCGAAGAAACCGATATCCTAAAGAAACTGGTCACCGGAGAAACGCT
+TAATGTGGAGAGAAAAGGAAAAGATCCCTATGAATTTGAAAGTTACGCCAAATTGATCTT
+CTCAGCCAATGATATGCCTCGGATAAACGATCTTTCAGATGGACTAAAACGTCGATTAGT
+CATTATTCCGTTCAATGCCAAGTTTAGCAGCAGTGATGCGGATTTCGATCCCTTTATTAT
+CGATAAATTGCTCTCGGAGAAGGCCATGAAATATCTGCTGCGAATCGGGATTGTTGGGCT
+CAAGCGCGTACTGGCAGCCAAGGACTTTATCAAACCGGCAGTGGTCAAAAAAGCATTAGC
+TCATTATGAACTTGAGAACAATCCGTTACTTGGGTTTTTAGAAGAACATCCGAAACTCAA
+CAATGAACTGGTCAAAGATGTTTATTTACGATACGACCTATGGTGCCGTCAGTGTAATCT
+CAAACCCTTAAGTCGGCCTATGTTCGGTCGCGAACTGGCTAAATACGGGTATAAAAGTAA
+AACCGTCACCCTCCAGGGTGAAAGCAGCCGAGTTTATGTCATGACAAATCCCCGTAATAA
+ATAAGGAACATGTGTAATCTCTGAAAAGGGCATGGTTCAACGGACTCGGAATTAAAATGA
+CAAAATGACAACGGGTTTCGCTTTCTTATTATAGGAAACTTACGAAAACAAGAGTGCTCT
+CGCGCATTAGATAGTAATTATAGTGTATAGAGATTAATATAATACATCTTTGCAAGTATC
+ATGCCACGTTCAAAGTCCGCTAAAATCAAGGGCTCTGGTGATTGGAAGAAGATGGGGATT
+AGACGTTTAGGGGCAAATCATCTGTAATTTTTCTGTAATTTATGTGTCATTTGTTGTCAT
+TGAATCAGATGCATTAAAACGTATGACCAGATATGAATTTTATTGCCGTAGCAATCGTGA
+CAGGTAACAGTATCATCCAACTGCCAAAGAAGGCTAAATCACAATCCATAATAAGCAAAC
+CCTCCTTCGTTCGATTTTGCTTATTATTACCAAGATGTAGAAATAGTTGCATACCGAGTA
+ACAAAAGTAATCGGTAGAGAAAGGGAGGGATTAGTAATGAGGATTCGAAGCAACAACGTT
+AGAGCGGCCTTCATTTTTGAAGAACTCGAACGAGCCAACCAAATTTATGGGACAAGCTTT
+CATTCTCCTCATGAAGGCTATGCCGTGATGTTAGAAGAGATGGATGAACTCTTTGAAGAA
+ATCAAGAAAAAGAATCCCGACAAAGATAAGTTGATGGAAGAAGCCGTACAGATTGGCGCT
+ATGGCCATCAAGTTTATTCAGTCTCTGGAACACTGGCCTTGGTTGGATTTAAAAATGAGT
+GCCCATGAATTGAAATGCCTGCAGTGTCGGTACGCTGTCCTCACGGCGGATAAACTTGCT
+GAATTAGAAAGTGATCCATGTTTAAGTTGCAATAAACTGTGCCAGTGGAAGCCTTAAAAT
+AACACTGCATATCCACAAAGGTAAAAAGTGGATAAGTATGTTAATAACTGTAAGTTTTTG
+TGGATAATCTTGCTTCACGAAAGGAACTATTTCGGATTCTAAGGAGGAAGCTAATGAATT
+ACATCGAGGAAGCCGAGAATTTGCTCTTATATTATAACGATCTTTATCGGAGCGTGGAGA
+ATTTGAATCGTGAAATTTCCAAATTGATCCGTTACCAAACACCGAGTCCCCTCAACGCGA
+TCCAATTGGAGGAGACGGGTGTTCGGTCCAGTAAGGTCGAAGACACGTATAACATGATGT
+TTAAACTTAAGACGATGGTAGAAAACAAGGAAAAGACCGAATTAGAATTAAAGGAGATCG
+ACCGAATACTCGAGGAATTGAGTCAGGATCCGGGATGTGAGTACTACGGGCAACTTTTAA
+AAGAGTGGTATATTTACGGAACAGCGAAGGAGAAAATAGCGGATCTTATTAAGTCATCCT
+CACGGAATGTGTATCGTATTAAGGATCAAGCTATAAAAAAATTTGCCGTCCGATACTTTG
+GACTTGATGCAATGAGAGTCGTTTAATGTGGCAAAAAGATGGCATACTTTTTTGACTTTG
+GATGTGCTAAACTAGTATCAGAAAGAGAAGACGTTCCGATGGGAGCGTCTTTTTCTTTTG
+GTTACATCACTCATTTGAGAATTATGGCTGCCATACGGCGGCCTTTTTTAGTTAGGAGTG
+GATATGAATAAATGCCAATATTTTTCACCCAACAAACTAGGATGCAGAGTTAATTGCGCT
+AACTGTAAGCGTTGGACTGGTACCGAGTGTAAGATTGAACTGCAACTCTTTAATCGTTAC
+GAGGACACCGTAGAATTTAAATTCTACAATCGCTTGATGCGGGAAAACAAAGGGGTTAAT
+GGTCCGCTATGATGATTAAAGAAGGCGTTTCCGAAAGGGTGCCTTTTTTTAATACACTCC
+TCTCTTTTTATATAAAGCGGTCTTCGGGCCGCATTTTTTAAAACATGTCGCTGATGAGCG
+ACTTTGAATAGACGGAGGTCACCGCAATGCAGAAATTTACGCCGCGGCAAAGCAGCTTTA
+TGGCTAAAACACTACGAGATCTCATTCATGCTTATGGGTTGAGTAAAGAACAATTAGCTG
+GGCTCGCTAAAGCGTTTGGTGTTCAGGAGACCTCCGTCAAAGGAATGGAAGTTGAGTTGA
+TTCGGGCGATGAATGATGGCGAGGACCTGGATTGGAGCAAGAAGAGAAGGTGATGGACTG
+ATGCCGACCAAGCCAAAGCGTCCCTGCTCTTATCCAGGTTGTCCCTGGCTAACAGCAGGA
+CGATACTGTGAGCAGCATCAAAAACAAGTGTCCAAAGAATACGATTTAAGGCGAGGTTCC
+GCAGCTAGTCGTGGTTATGATTCAAGATGGGCTACGACCCGCAAGCGTTACTTGCGCGAG
+CATTCCTTGTGTGTAGAGTGCTTAAAGACCGGCAAACTCACGCCAGCTAATGTTGTCGAT
+CATGTTATTCCTCATAAAGGAGATATGGTTAAGTTCTGGGATGAATCCAATTGGCAAAGT
+TTATGTAAACGGTGTCATGACAGAAAGACGGCAAAAGAGGATGGACGTTGGGGATAGAAA
+ACGAATGGTGATCCAAGGGGTAGGGGCGGTCATAATCTCTACAGCCTTGGCAAATATTAC
+CGGGTGCTTGGTCACACGCGAAATTTCGCGAATTCAAAAGGGGAATAAGAAATCTAAAAG
+CCACATGAGCACTGACGTGTGGCCTTTAAATAGTCAAATTTAAATCAAAGAAGGAATGAT
+ATATGGCTCGTGGAGGAGCACGCAAAAATGCCGGACGACCTAAAAAGCCATTGGATGAAA
+AATTGTTAGAAGGTAATCCCGGTAAACGCCCATTGACGGTTTTGGCCTTTCCGGAGACAG
+TGACCCAAGCAGAAGCTCTGCCACCACCACCCGAGTTTTTGGTGGATCTGGCTAAAGGGG
+TTGGCAGGTGTCCTAATGCTGAAACTATTTTCGAGAATGTCACTACGTGGTTAGAAAGAA
+CTGGTTGCGTTAATCTGATTCCGCCAGAACATGTTACAGAATATAGTTTGCTTAAAGCAC
+GATGGTTGGAATGTGAAGCCATGAACGCTAAACACGGCCTACTTGCCAAACATCCCACCT
+CCGGACAACCGATTGCCTCGCCTTATGTTCGCATGAGTATTGATTATTTGAAAGCCGCTG
+ATTCAGCATGGTCACGTATTTGGAATGTGGTCAGTCAAAATAGTCAGAAGGAATTTAGAG
+CGAATAGCCCTCATGAGGATGCCATGGAAAAATTATTAAGTGGCAGGTAAATCAATCAAA
+GTTTAAAAATATTGCACGCTGATCAAGCGTGCTTTTCATATTGGGAGGAACTATGGATAT
+TCAGAAAATACCTGCCGAAAAACTAAATCCAGCGAAATACAACCCTCGTAAAAACTTAAA
+ACCGGGTGATACGGATTATGAAAAGCTTCGCCGCTCAATCGAAGAGTTTGGTTATGTAGA
+ACCCGTCATATGGAACAAGCAAACCGGCAACATCGTAGGAGGCCATCAACGCTATAAAAT
+ATTGACAGAACAAGGTGTCAAAGACATTGACTGTGTTGTGGTTGATATGGATGAGCAGCA
+TGAAAAGGCTTTAAACATTGCACTGAATAAGGTAGCCGGTGAATGGGATATGCCGCTACT
+TACGGATTTATTGAAGGACCTAGATGAGTCCGGCTTTGAGGTTTCCTTAACCGGTTTTGA
+AGCAGAGGAACTGGATGAGTTGTTTGGAAACTCAGGCACTGAAGGATCTCAAGAGGTTGA
+AGAAGACGACTTTGACACGGATGCTGCTGTTGCCAAAATTGAAACTCCGATCAGCCAGCG
+TGGGGATATTTGGCAATTGGGTAAGCATAGACTGATGTGCGGGGATTCGACCTTAAGTGA
+AGATATGGCTAAACTGATGGACGGACAGCAGTGTGACCTTGTTCTGACAGATCCTCCCTA
+TAATGTCGACTACCAAGGGGCTACCAAGGATAAGTTGAAAATCCAAAATGACAAGATGGA
+AGACGATAAGTTCCTAGCGTTTCTAACCGATGCATTTACCCAGATGTATGAGCATTCCAA
+AAAGGGTGCTGCGATTTATGTATTTCATGCCGATAGCGAAGGTTACAATTTCAGAGCTGC
+TTTTAAGCATGCAGGTTATACTTTGCGTCAATGCCTAGTGTGGGTAAAGAACTCCATGGT
+GTTAGGTCGCCAGGACTATCAATGGAGGCACGAGCCCATTCTCTACGGCTGGAAAGACGG
+AGCAAGCCATAGTTGGTACTCAGACCGTAAGCAAACAACGGTTGTAGAATTTGATAAACC
+TCATAGAAATAGTACTCATCCAACAATTAAACCCCTAGGCTTAGTTGGATATTATATAGA
+AAACTCTAGCAAGGCTGGAGATTTAGTACTCGATCCCTTTTCAGGGAGTTTTTCAACGGG
+GATAGCATGCGAACAAACTCATAGGATTTGTTATGGTATGGAAATGGACCCCAAGTATGT
+GGATGTATGTGCTTCGAGGTATATCGAGCATAAAGGCGGGAGCGATGATGTTTATCTGAT
+TCGTAATGGTGAGAAGGTAGCCTGGAAGGATATAAAACAAGTATAACTTAGGAGCGTAAA
+ACGGATATGTCCGGCTGAACGCTCTTTTTTATTTCGTAATAAATGAAGGATGTGATCATC
+TGCGAGATTTAAGAAATCAAAAATTTGGAAATCTGACAGTAAAAGCTGAAGTTGGTCGAG
+ATAAAGGTGGTCGTGTTCTTTGGTTATGTCTATGTGACTGTGGCAGAGATCATATTGCCA
+GAGGAACTGCGTTAACATCGAAAAATACAAAGACATGTGGTAAATGTAACTCGGTAACTT
+ATAGATTATCAGAAGACGGTGACCACATGGTAATGACATTTTCGAATGGAACTGAGCTTC
+TAATTGATTCTGAGGAAGGAAAAAGAGTAAAATCGTACAACTGGTTTCTTAATGAGAAAG
+GTTATGCATGGGCTAAGATTAATGGACAGCGAATTAGACTCCATCGGTTTCTCATAAATG
+CTCCAGCCGATCTCCAGGTGGATCATATCAATAATATAAAAGTTGATAATCGAAAATCTA
+ATCTAAGGCTTGCAACTAATAAAGAAAATAGACGAAATGAAGGACTTCGGAAAAGTAACA
+GTACTGGGGCTAAAGGTGTCAATTTTGATAAGCGTCGTAAAAAATATAGGGCTTATATTA
+CAGTTGATGGTAGATATATTCATCTTGGATACTATTCCACAATAGAAAAAGCATCCATTG
+CATACGATCACTCCGCAGAGCAATATTTCGACGAATTCGCTCGCCCAAATGATCTCACAA
+CAAAGACCCCCGAGCTGGTGTCATTTTTATTTTCCGGCAAAGAAAAAGAACTTGATTTAT
+CAGCCCGGTAGAGTGATGAATGTACACAACCAAAAATGAAAGGTTGTGTACTCATGGTAA
+ACGAACTCAGAAACTACAAAGTCAGACATGTGGGTGGTCGCGAACGGATTGTTCCAGCTA
+AAAATGGAACGGAAGCCAAACGCCAGGCTTGCAGATTTTGGGGCTATAAACCGAACGATT
+ATTGGCTTGGCATTACTGCCTGCTCAGCAAACCTCATTCCTGCCGGAAAGGTGGGGTGAG
+CCATGACGAACGAAACCTTCACCTTAACATTTAAAGTCACAGGACTAGAACGTAAGCAGA
+TTGCCTGTATTATTGGTGAAGCTGTCGGGCAGGATATTAGCTACGCAGGTGCTCCAAGTT
+TTTTCTACAGGGCTGGCGATTGGACGATTGACCGGGACAGCGTTATTACTTCCCCAGAAA
+CACCACTCCATGATAAAGACAATCTTCGGAAAATACTTGCTGCTTTGAAAGCTGTTGGGG
+TAATTGCCGAAGGAGACGGAACCGTCACACTTCCACTCGATGGACATTCTGGAAACACTT
+TGAGAAACGCGATTAATCTTATTTGGTGTAAGCAGAGTCTATTAAAAAAATCCTTTGATC
+GGCAGACCGACATGGTACCAGAAAGTCTTGTAGGTGTAATCAACGCCGTGCCGATTGATA
+CCATGGAAGAGTTTGCCGAGGTCGTAAACAATGGCATTGACCAAGGAACCATCATTGGCG
+ACAGCAACTTGGATTTCGACCTGGCAGAACAAACGGTAAGTTTTAGCTTCATGAATGCCA
+CCTTGGAATTTGACGAAGTTCTTGCTTTTATAACCTTTTGCCATAAGCTCAGCGTACAAT
+CGAAACTGCAAAAGTTTAGCTCAACAAAGCAAAAAGAAGCTGTTAATGAAAAATACGCCA
+TGCGCTGCTTCCTTTTAAAATTAGGATTTATTACAGAAGAATTCAAAACCGAGCGCAAGA
+TTCTTCTTCAAAAATTAGATGGGAACGCCGCTTTTCGTACGATTGAGGCACAGCAGGCAG
+CGGAGTCAAAGCGTAAAACAAAACAGGAGGCGAGTTAATGATTAACCAACGAGAAAAAGA
+CAAAATTTTGAGTCAGGAACGATGTTCTCGTTGTGGCAGTCCATTGACGATCCGAACAAT
+GTCGAAAATGAATATAGATATCGTATGTATGGACTGCGCGGAAGCTGAAAAAAGCCATCC
+CCGCTACCAGGAAGCTGCCGATGCCGAACTCGAACAAGTCAAAGCCGGAAACTACAATTA
+CTCAGGTCTGTTTGCTGGTGAGAAATACCCGTTCTAATATTGGTCAAAAATAAAAGACAG
+CCCGGAAAGTTCTTTTAAAAATCAAAATCCAAACGCTGCCTATCGTACAATCTAGGCACA
+ACAGGCTAGAGATGTTCCTTTATTGCCGCCATAGGATATTGAAAATCACTGGGAGGATAA
+TGAGGGTTAAGAGGACAAACAAAAAAATCTGAGCGATTGGATGAGCCCAGTTAACAGTCC
+TTCCTGCTATGGGCCACATTCTGAAGGCTTCATGGATATAAGCTTTAGGGACAAACAAGT
+TTCCATCTTCTTCGTTATAGTAAATTAGGGAGTTGTTATGTGTCCTTCGAAAATCGTCAA
+CTTCCTCATCCGTCCATTTTCGTTTGGCCATATCTAACCCTCCTTTTCCAATCACTGATA
+TAAAAATATTTTACCATAATTTAGTAATGTAATAAAACAACAAAGATTGGGTCGATTTAT
+AAGGTTTTAAGTTACCCAGATTCTCGGTAAGAAATTTGTAGAATATTGTAGTATAATTAG
+CCTAAAAGACATTAGGGGAGAATGATATGCAGTTAATTAACCGAGAAGACGAAGATGAAA
+TTAAGGTTGTAATCCATGAATTCTTAATGACAAGTCAGGTTAATTCGCAGGAAAGTATCC
+CCATTGAGTTATTAAAATATCTACGTAAAGCGGACAAGAAGATTGAAGACGGTCTCTTGC
+TTAATGAACTATGTGATTTAATCGAACAGAAACTTCGCAATAGTAATTCGCGTTAAGGTT
+TAACTTTAATTAGAATATTAATTTTACCAAGGAACTTCGTAAGAGGTTCCTTTTTTGGTT
+GCCCTATTTACTATGAAAGGAGGCTGCTACCATTGGTAAGAAAACCGAGCCGTACTTGGA
+TAAGGCTAAAGCCGAACATGCCATTCAATTCATCAACCTGCTAAAACACACCAAAGGTGA
+ATGGTATGGGCAGCCCTTTAACCTGATCCCTTGGCAGGAGACCATTATCCAAGATATTTT
+TGGGACCATGAAAGCGAATGGTTACCGGCAATATAATACGGCATACATTGAAATTCCTAA
+AAAGATGGGAAAAAGTGAACTGGCGGCAGGTATTGCCTTACTTCTGACCTGTGGCGACTT
+TGAACATGGCGGTGAGATCTACGGCTGTGCAGCCGACAGACAACAAGCCTCCATTGTTTT
+TGATGTTGCCGTTGAAATGGTTGAACAGTGCCAAGCCTTGAAGAGCCGGATTAAGCCCGT
+ACTTTCTCAGAAACGTTTGGTTTATAAACCGCTTAATAGTTTTTATCAGGTGCTATCAGC
+GGAGTCGTATACAAAACATGGCTTGAATGTTCATGGCGTTGTTTTTGATGAATTGCATAT
+TCAGCCCAACCGAGATCTTTATGATGTCATGACGCACGGTTCCGGTGATGCCAGAAAGCA
+GCCGCTGTATTTTCTGATTACCACTGCGGGAACCGATCGTCATAGTATCTGCTGGGAGGT
+TCACCAAAAGGCTGAGGACATTCTACAGGGCCGTAAAGTCGATCCGTCCTTTTACCCAGT
+GATTTATGGTGCGGACGATGATGATGACTGGACGGATCCTAAAGTATGGGCCAAAGCGAA
+CCCGTCACTCGGTATCACCGTTGATATTGAGAAATTACAAATTGCTTGCGAAAATGCCAA
+GCAAAACCCTGCCGAAGAAAACTTATTTCGCCAACTTAGATTAAACCAGTGGGTCAAACA
+ATCTATTCGCTGGATGCCCATGGAGAAATGGGACCATTGCGCCTTCCCAGTTAACTTGGA
+AAGCCTAAAAGGCCGGGAGTGCTATGCAGGACTAGACCTCTCCAGCACGACGGACATTAC
+AGCGTTTGTCTTGGTTTTTCCGCCAGAATATGAAGGCGATAAATACCAAGTGGTGCCTTT
+CTTTTGGCTGCCAGAAGATAATCTGGATCTAAGAGTGCGCCGTGACCACGTTCCCTATGA
+TACTTGGGAAAAGCAAGGCTTCCTAAAGACTACAGAAGGGAACGTTGTCCACTACGGATT
+TATAGAAACCTTCATCGAAGAACTTGGCAAGAATTACAACATTAAAGAAATCGCCTTCGA
+CCGCTGGGGAGCCGTCCAGATGACGCAGAACCTTGAGGGCCTTGGCTTTACCGTGGTTCC
+TTTTGGTCAGGGCTATAAAGATATGTCTCCTTCCAGTAAAGAACTCATGAAGCTGACCTT
+GGAAGGAAAACTGGCCCACTCCGGCCACCCGGTACTTCGCTGGATGATGGATAATATCTA
+CGTTAAAACTGACCCGGCGGGTAATATCAAACCGGACAAAGAAAAGAGCACCGAGCGCAT
+TGATGGTGCCGTCGCTTTAATTATGGCCTTAGACCGTGCGCTCCGCCATGAAAACAATGA
+CTCAAGCGATGTGTACAACCAGCGAGGAATGCGCAGTCTGTAAGAGGGAGGTGAGACAGT
+ATTAAACTCTTCCAACGAGCCAAATTCTTCTTCGGCCAAGGCTTCGATGACTATATCCAG
+CGTTTCTTACTCGGGGATGATGTCAGCGACTTAGACTATCCCGGTCAAATGGATGCCAAA
+ACAGCCATGAACTATTCGGCAGTTTTTTCGTGTGTTCGGGTCCTTGCTGAAGCCTTGGCC
+GGAACTCCAATTATGCTTTACCGCAAAAAAGAAACCGGCGAACGTGAAGTCCGTAATGAC
+TTAAGTGTTTACGACATTTTGCATAACCAACCCAATGTAGAAATGTCGCCGTTTAATTTC
+AAAGAAATGTGTATGGTCTCTCTGAACCTGGGAGGTAATTCTGTCAGCCAAAAGTTGGTC
+AACAAATATGGCGATTTAGTTGGGCTTTATCCCTATGAATGGCCCAAGGTCGATATCACC
+AGAGATCCAATCACTAATAAGTTAGTCTATAAAATCCGGGATATTAACGGCGGCAAACAA
+CTGAATTTAGCACGGGATCAGGTTTTCCACATTCCGGGTTTGAGTATGGACGGAGTAGTG
+GGAGTGTCGCCCATTGAGTATCTTTCCTCAGCCATTCGCTTGGGCCTTTCTTATGAACGG
+TTCGGGGTTAATTTCTATAAAAACGGAGCGAACTCATCCGGAGTGATTGAGTACCCCGGA
+GCCTTGGCTGACACGGCTTATGAGCGTTTAAAGAAGGACTTTGCTAAAAGTTATCAGGGA
+CTGGCTAATACCGGAAAGCCCATCATCTTAGAAGGCGGGGCGAAGTTCAGTCAGCTCGCT
+ATTAAACCTGCCGATGCCCAACTCATTGAAAATAAGAAATTCCAGCTGGAAGACATCGCC
+CGTATTTACCGCGTACCCCTTCACTTGATCCAAAACTTAGATGGAGCGACATTTTCAAAT
+ATCGAACAACAAAGTCTAGAATTTGTCATGTATACGATGTTGCCTTGGTTTAAGCGCTGG
+GAGGAAAATGTTAATATGCAGCTTTTGACACCTCTGGAACGCAAAGCAGGGTTTTATTTG
+GAGTTTAATATTTCATCGCTTCTCCGGGGTGACATGCAAAGCCGGGCGATGGCTTATGCC
+CAAGGTAGACAGTGGGGCTGGTTATCCGTGAACGATATCCGAAAGCTTGAAAATATGCCG
+CCGATTCCTAACGGAGATATTTATATGATGCCGCTGAACTTTACCGAAGCTGGAAAAGCA
+CCCTCTACAACGGAGTCGGCGGTGCCGGAAGCCTTGGCAGAAGAGACTTACAAGATGATG
+ACAAGGAGGTGATGACCATAAAACCCTTTTGGAAATTTCAAGCAAAAAATGAAGCTCCCT
+TGATCGGTGAACTTTTGCTTTATGGGGATATCTCCAGTACCACTTGGTGGGGTGATGAAG
+TGACCCCTGTGGCATTTGCACAGGACCTTAAAAATCTCGGAGATATTTCACAGCTTAACA
+TTTATATCAACAGTGGCGGCGGAGATGTGTTCGCGGGTCAAGCGATCTATTCCATGCTCA
+AACGTCACCCAGCACAGAAAAATGTCTATATTGATGGTCTGGCCGCCAGCATCGCCTCTG
+TTATCGCGATGGCTGGCGATGTTGTTTTTATGCCGAAAAACGCCATGCTCATGATCCATA
+AAGCCTGGACCATGGCCATTGGCAACGCCAACGATCTTCGTAAATTGGCTGATGATATGG
+ACAAAATTGACGAAAGTATACTTACAACCTACCAAGCGAAAACGGGCTTAGATCCCGAAA
+CTATTACAGAAATGGTTAATGCTGAAACATGGCTGACAGCCGATGAAGCCGTAAAACTTG
+GTTTTGCTGATGTGATTGAAGATAGCAAGCAAGTTTCAGCATCCATTGCCGATGGTCAGC
+TTATGGTTAATGGTCAAACCATGGACTTAAGCCGGTTCCGTAAGACTCCGCAGTTCGTTA
+ACAAAGGAGATCAACCCCAGGTTCCCCAAGATCCAAGGATACCTACGTTAGAAGAACCAA
+ACGAAGAGCTGAAGGAAGAACCAAATAACCAGGCAGTGGAAAGCAAAGTAGCCGCACCAC
+TGCCTATTCGTTTGCCCGAGTTACGAAACTCCGGTCGAACAATATCCTCCACCAACGAAG
+CTCTGATCCGCCAAGCCATGGATTGTCTGGCTGAAGTCTTAGGTCAACTGGACAACTCAG
+ACGAACAACCTGACGGCGATGACATGGGCATGGATGGCGACGGAATGGGAACGGACGCCC
+CTGAAACAAATGGGGAAGAGAATCTTGGAGAGGACGATGAGGACGTTGGACTCTTTGGTG
+TTTCCCTCTGCCAAGCACAATTAAATTTAACAAGAAGGAGACTCGATTATGGATTTTAAA
+GCTCTACTCAAACAAAAACTTGATGCCCAGCAAACCCTCATTGATGCAGCGATGGTCAGT
+GGAACAGGATTTAGTGCTGAACAGCAAACCCAGTTTGATACTTTGCAAGCAGAGATTGTA
+AATCTGGAAAATACCATTAAAGCCGCTGCAGAATTGGAAGCTCGCCAGAAAGAAATGACG
+AACCCAGTCAATCAGCCGCTCTATCCTGAACCCAAAGCCAAAAAGGAGAAATTCGCATCC
+TTTGGTGAGCAACTGCGTGCTGTGATTGAAGCTGCAAGACCGGGCGGTTCTATGGACAAT
+CGGTTATCCATCAAAGCCGCTGCTGGGCTCAATGAAAACGTGGGCAGCGATGGCGGGTTC
+TTAGTGGATGATGACTTTTCGAAAGAGATCCTAAAGAGGGCTTATGACACAGGCATTTTG
+GCCAGTCGCTGTAATAAAGTGCCGCTGAGTACCAATGCCACGGGACTAAAAATAAATGCC
+ATTGATGAAAGCAGCCGAGCCAACGGTTCCCGTTGGGGTGGAATTCAAGCTTACTGGGAA
+GGTGAATCCGACCAACTTTTAGGCAGCAAACCAAAGTTCCGACAAATGGAACTGAACCTT
+CATAAACTGACGGGACTATGTTATGCAACGGATGAACTACTGACGGATGCCACTGCCTTG
+GAATCGGTGATTTCTCAGGGGTTTGCGGAAGAATTTGGTTTTAAAATGGACGATGGCATT
+ATTAATGGGACTGGAGCTGGGATGCCTTTGGGGATCATGAATAGTAAAGCTTTAGTAACA
+GTACCCAAAGAAAACAGTCAAGCTTCAGGTACCATTAACATTCAAAATATCGTTAAAATG
+TGGTCACGATGTTGGGGTCAATCTCGCCAAAACGCCGTATGGTTCATTAATCAGGATATT
+GAACCTCAGCTCTACACGATGGCTTTATCCGTTGGGACAGGCGGTATTCCTGTCTATATG
+CCAGCGGGAGGGATTTCCGGTTCACCTTACAGCACACTGTATGGTCGTCCAGTCATTCCC
+TTGGAGCAGTGCCAAACGCTGGGTACTGTCGGTGACATTGTACTGGCGGATTTGTCGCAG
+TACCTGATCATCGACAAGGGTGGTCTTAGCGCAGCCTCTTCCATCCATGTTCGTTTTTTG
+TATGATGAGAACTGTTTCCGGTTTATTTACCGCGTGGATGGACAGCCTGTGTGGAACACA
+GTTTTAACTCCGGCACGTGGATCGAACACACTATCACCGTTCGTCGCATTGCAAACACGC
+TAATCATTTTTTATTGAAGCAGGAGGTTAAAAACTTATGTGTTGTATTCCCGAAAAAGAT
+AAACCCCTTGAAGCTATCACTCCACAGGCTGGCGGTGCTATTACCGGAGTCTATGTAACC
+CTGCGGGATGCTGAAGATTGTTATGTTCTGGTCCATATTAATCAGGCAGTCGCGACAGCC
+GTGGATATAACAATTGAACAAGCCACTGACGTTGAAGGCACCGGCAGTAAAGTCATAACC
+ACTGCCGTTCCTATTTGGGCAGATCAAGATTGCGCCTCTTCTGATGCCTTGCTTCGACAA
+CCGGATGCAGTAGCCTTCACTACTTCAGCTACCCTTGCTCATAAACTGGTTGTCTTTCAG
+ATAAACCCGTCTCACTTAGATGTAACAAACGGCTTTGACTGCATCACCGTCAAAACGGCG
+GCTTCCGACCCGACCAATATTACCGCCGCCCAGTATATCCTCAGCGATCTGCGCTTTGGT
+GGTTCAACTCCACCTACAGATATCACGGACTAATTCTTGTAACTGATTAGATAGGGAGGC
+AGCCTTGCCTTCCTATTTAAATAATCAATACGGAAAGGATGGATGCTGTGAACTTAGTCC
+AAACAGTACCTCCAGCCGTTGAACCTTTGAGTCTTCAGGAAGTGAAGGATTATCTCCGAG
+TCGATGATGATACCGATACCTCAGAAGATCAATACCTAGGCGCCTTAATCACTGCCGCCC
+GGGAGTACTGTGAAAGCTTCCAAAACCGCGCCTATATTACGCAGACTTGGCAGATGAGCT
+TTGATTACTGGCCCAGTTATGCCATCAATATTCCGCGTGGAAATCTGCAGAGAATAACTT
+CTGTTTCTTATAAAAATTCATCGGGCGTTGTAACAACCCTGACAGAAACTCTCCAATATG
+TTGTCAGTACACGCGGAGTTTTAGGCCGAATATCACCGCCTTACGCTCAGCCCTGGCCGC
+CTTTTATCCCATTTCCCTTGGATGCCGTTGTGATTGAGTTTGTCTGCGGATATGGTGATA
+CGGAGGAGAGTGTGCCGGAAAAAGTGAAGCAGGCCATGAAATTGTTGGTCAATCATTGGT
+ACGAGAATAGGACTCCTCTCACAGAGTTAAAGCAAGCTCCGGCAGAGATCGCGTTTACAG
+TATCTGCTTTATTATGGCAAGACAGAATCGTGGTGGCATAAGGTTGGTGGCTAAAAATGA
+ATCCAGGCATACTGCGGCATAAGATTAATATCCTGACCACAACGGAAGGAACCAATGAAG
+CAGGAGATACCATTCTCATTCCATCGGTATATAAAACTGTGTGGGCCAGCGTCTCTCCGG
+TCTCAGGTAAAGATTATCTTGAAGCGAAAAAGCTCCAAGCTGAACTGACCTATAAATTTA
+TCCTTCGTTACACTTCAGGGGTAACGCCGGACATGCAAATTGAGTTTAAAGGGCGAATTT
+TTCTCATTCAGGATATCCTTAATCCTTTAGAAATTAATGAGACTATAGAGATTATGGCCA
+TAGAGAGGGTGATTAAGAATGGCTGATGATTTCGAAATAACCTTTCAGGGTCTTGACCCG
+TTAATGACTCGGCTGAAGGAAGTGAGAGCACGTTATCCCTACAAGGAAGAGGAAATGCTG
+CTGACATTGGGAGCCACCTTAAAGGCCAGTTCTAAGGATAAAACTCCTTTAGGAAAGCAC
+AAAAAACATCTAAGAAATCAATATAAACTTTCTAAGGTTCAGTACAACCGAGATGGTTCC
+TTTATTACTATGACCAACACAAGTTCCCATTTTCATCTGATAGAAAAAGGCCACCAGATT
+GTCGGTAAAAACGGGCAGGAACATGGCTTTGCCCAAGGGCTGCACATGGTTGAAACGTCG
+ATGATCGAACTGGAACAAACCTTACCGGATACACTTGGGGCATGGTTGGACAGTATCTTA
+GGCAGTGTGTAATGGTTACTTTATTAGCCGTCAAGCGGGCCATGAATCAAGTGCTGGCGC
+CTATTGGTCTTAAGATTTACGGAAATGAGGTCAAAGAGGGCTTCTCCAGACCTTGTTTTT
+TTGTGAACCTTGTTCCGGTAAAGAGTGAAATCCTTAAGAAAGACACCCGAGAAAACTCGT
+TGATGGTGGAGATGGTTTATTTTTCAGAGAGTAAAACCGATTTGGAAAATCTCCAAATGT
+ATGACACCCTTCAAGGACTTCTTACGCCTATTCTAGTCATAGGGACCAGAAACCTACTCG
+TCCAGAATTTTCGGGCTGAAGTCATTGATGAGCTAGACCATATTTATTCTGTGAAATTCG
+ACCTGAACTTTTATGATGAAATTGTGGATACCACACCAGAACCCGATCCTATGGAGACAT
+TAACGATTCAGTTAGGAGGTCAATAAAGAATGGGACTTCCCGATATCGAGGTCATTTTTA
+AATCCCTAGCCGTCAGTGCCATTACTAGAGGAGCGCAAGGGATTGTTGCCTTAGTCTTAA
+AAGACTCCGTTCATAATGGATCGAATATTTATACCGATCCAACCAACATCCCGAAGGACT
+ATTCGGCCTACAACCTCAACCAAATCAACTTGGCCTTTCAAGGGGGCGTGCAAACCCCAA
+CCAGTCTGATCGTTTATGTAGAACCGAGTGATGCTGCGGACTATACCGCCGCCATGAACT
+ATTTGGAAACCGTAAAGTGGGATTATGGTGCGGTTCCGGGAATCAGCTCCACGGATGCCC
+AGACGGTGGCAACATGGTTAAAAGCCCTTCGAGATACCAAAGATATTAAAGCCAAAATGG
+TTCTTCCCAACACGGCAGCCGACCATGAAGGAATTATTAACTTTGCGACCGATGGGATTG
+TCTTATCTTCGGGAACGGTGAATGCCACCGATTACTGCAGCCGGATCGCTGGAATATTGG
+CCGGAACTCCTCTTACCATGAGTGCTACATTTCAGGTGCTCCCGGAAGTGATCGATGTAC
+CGCATAACAGCAAAACACAATTTGACACCCTGATTAATGAAGGCCAGCTAGTCTTCATGA
+ACGATGGTGAAAAGGTAAAAATAGCGCGAGCCATCAACAGTTTAGTCACGCTGACACCAA
+CGAAAACGGCGGATTGGCAGAAGTGCAAGATCGTCGATATTATGGATCTTCAGCACAATG
+ACATTATACAAACCTTTAACGATAACTATGTCGGCAAAGTCCCCAACGATTATGACCATA
+AGTGCTTACTCATCACGGCCATCAATGCTTACTTGGAAGGGTTGGAAAACCAAATGCTGC
+TTGATCCCGGTAAAAATAAAGTGAGCCTGGACGTGGAGGCCCAAACCTTATATTTACAGA
+GTAAAGGCATCGACACCAGCACCATGAGTCAGTTAGACATCAAGAAAGCCAACACGGGCT
+CTTTAGTTTTTCTAACCGGTACCGATCGCCCGCTGGATGCTATGGAAGATCTAACCTTAA
+ATCTCTATTTAAACTAGGGAGGTGAAGCATGAATAACTATACTGCAGATCAGGTCCTAAA
+TGGCACTTGGGGAGAGATGTGGCTGAACGGAGATTTCATGGCTGAAACCATCGCCCTGCA
+GGCCAAAGTGACCTTGACCAAAACTGCCGTGGAGATGTGCGGAACCTTAGTGGCGGGGCA
+AAAGGTCACGGGAATGGAACTCAAAGGGACCCTTAAAATGAACAAAGTGAGTTCGGCGAT
+GATTAAAGCCAACTCCGACAATATGAAGGCGGGTAAAACGCCGGAGTTTACCATCATCTC
+CAATCTGGATGATCCGCAGGCCTTGGGCGCTGAACGAATTGTCCTTAAAGGCGTTATGTT
+TGATGAATTGACTCTTGTGGATTGGGAAGCCAAGAAGAATGGGGAAGAAAGTATCCCGTT
+TACCTTTATGGATTGGGATCTCTTAGACTTAATCTAAAAAATCTCTTCCCATTATATAGG
+GCATTAAACTATTGATTTGGAGGTCTTATTGGTGAACTTAGTAGAGCAACTCTTAAAAAT
+GGATGCTGGACTCCTTGAAACCCCTTCGAAGGTAATAACCATCCCATCGAAAAAGCTGAA
+AGAGCCCCTCGATTTTCCCTGTAAAGCCGTGGATCCGGAGAAGTATGCCGAGATCCAGGA
+AGGGGCGGTGGAGATCCGTAAAGGTGATGTTAAGAAAATCAATATGTATTCCTTAAAGAC
+GCTCATTGTGATTGAAGGCTGTCCCGAGGTATTTAAAAGCAAAGAGATTATGGAACATTT
+CGGAGCACCGACCCCTAAAGAGTTGGTCAAAACCCTCTTACTCAGCGGAGAGATCGATGA
+TCTGTATAACGGGATCAATGAGCTTTCTGGTTATGAGAAGGATGCAGAGGACGAAGAAAC
+CATAAAAAACTGATTCAGGGAGATAAAACTGTGCAAACAGCTTATCTCCTTTTTAAGTAC
+AAAAACATGAGTCCCAAAGAGTTCTACGATAAGAAACCCGGTGAGAAGAAAATTCTCCGG
+GCGTTTTTATTTTACGAGTTAGCAGAACGAAATCGGGAGAACAGCTCTTAATAAGGCGGG
+AAGGAGGTAAAAACCATAGCGCGAGTGATTGATGCTGTGATTCAGCTTCGTGACCAATTC
+AGTGGAACTCTTCGGAATGTCAACGCTAATCTCTCAGTCTTTCAACGACAGGCCAGCTAT
+GCCGGAAGAAACATGATGTCGGTCGGTAAGGACTTACAGAGTGTGGGTAAGACGTTTACC
+AAAACACTGACTGTTCCTATTGTTGCGGCGGGTGGAGCACTATTAAAGCTGGGACAGGAC
+TTCCAAGATGCCGAAAACACCATACGAGTTGGCACGGGTGCAACCGGAAAAGATCTTCAA
+AACTTAACGAGTGATTTTAAGGCGACTTACAGTCAGGTGAGTAATAGCATGGCTGACACC
+AGCAAAGTGATTGCTGATTTAAATACAAGAACCGGCTTATCCGGTAAGCCCCTGCAAGCC
+TTGTCCGTTCAAATGCTTAACCTCTCAAAGATCACGAAAGAAGACTTGAATACTTTGATT
+CCAGCGACCACGCGGATGTTTCAGGATGCCGGGCTTAAGCAGGCGGATTATTCGAAGGCA
+CTCGACTATACCTTCAAAGTCAGCCAAAATACCGGTATTTCTGTGTCAAAACTTCAGGAG
+CTGATGACTCAGTTCGGTGGTCCTTTAAGACAAATGGGCTTTAGCTGGCAAACGAGTGCT
+GTCATGCTTGGAAAGTTTGAAAAAGAAGGTGTTAACACTGAGTTGGTTGTCGGGTCCCTT
+CGGATTGCTCTCGGTAAGATGGCTAAGAAAGGGATCGCTGATCCTTCAAAGGCGTTGCAA
+GAAATGATTACCAAGATTAAGGACGCTGGCACAGCTGGAAAGGCAAACGCCATGGCCTTG
+TCGATGTTCGGAGCTAAAGCCGGGCCGGATATGGCAGCCGCTATTCGGGAAGGACACCTG
+GACTTAGACAATCTCCTGCGAACCATTAAGAACAGCCCGGAAACGATCGACCAAGCCACT
+GCCGATACCATGACCTTTGCGGATAAAATGGCGAAAGTAAAAAATCAACTCGCCGTGGCG
+TTTGAGCCGGTGGCTACCAGCCTATTAGATTCTTTAGATAAGCTACTTCCGAGTATCAAA
+AATGTGGGCGATACCATCGCGAAGTTTGCTAAAAGAATTGCGGATATGTCACCTCAGCAA
+CAGGAAATGATTCTCAAGTTTGCGCTTATGGCTGCCGCAGCAGGGCCGGTTATTTTTACG
+GTTGGTAAGCTAGTTTATGGGATGGGTGATGCGGTAAAAACATTTACAAAATTATCTCGT
+TCCATCTCTAATGCAGGCGGGATTTTAGAGTACCTTCAAACTCCAGGCGGCATGGTGATT
+GCCATTATTGGAACTTTAACAATCGCTGGACTATTACTTGTAACCCACTGGGCACAGGTA
+ACAAAGTCCTTGAATGACTTTAAGACGGTTTTGAAAAATAATGAAACAGCCATCCGAAAT
+GTAGCGATAGCCCTTGGCGTTATTTTTGGACCGGCGCTGGTGGGGTTGGGTGTTCAAGCA
+CTCATCACGGGCGGTCAAATCACCGCTGGGTTTATTGCTTCCTTAGTAACCTCAGGAATT
+GAAGCCGCTGCAACCGGAGCCGTTTTTACAGGAAAACTAATCGTTTCTCTCATATCTTTT
+GCCCTTCAAGTCTGGAAAACTGTTGCTGTTATTGGTATTCAGACAACTTTGTTCATTGCT
+CAGAGACTTGGAATTATCAGTGCCGCCGAAGCAACGAATATTATCACAGCCGCCCAATGG
+CTTTTTAATGCCGCCATGAATGCGAACCCGATTGGTGTTGTCATTTTAGCCCTTGCGGCT
+TTAGGGGTGGCTATCTATGAGGTTGTCCAGCATTGGAAAGATATCTGTACTTGGGTTGAA
+AAAGCATGGAACTGGCTGACGAAATGGAATGGAACTCAGCCTCAGGATAAGAGCCTCAAT
+GTTACCACCAACGTGGCAACGTCCGCTGCGACTACGGCCCACAATGCGCTTGGAACCAGT
+TATTTTGGAGGCGGCTCCACTTGGGTAGGGGAGAATGGGCCAGAAATACTCACACTCCCT
+AAAGGTTCTCAAGTCATGGATCATCAAACGTCAAAAAGATCAACAGGGAAGAATATTTCG
+ATCGCCAAGCTCGCCGACACCATCGTTGTCCGGGAAGAAGCCGACATTGATAAGATTGCC
+ACGGCATTGGTGCTTAAGCTTCACTCGGTCGCTATTAACACGGCTTAGGGGGTGACATCC
+ATGGAATTTTGGCTTATGCAGGATAAGGAAACCCTCCAGCTTCCGGTTCCCCCTCCAAGT
+TATACGGTCAAGAAAACTCTGAATAATACTTCTGTGATTGTTGAAAGCATCGGCGAAATT
+AGTTTTATTGGCAAGCCGAAACTCGCTGAAATCCCGCCCATAAGTTCGTTCTTTCCGAAA
+AAGGATTATAGCTTTTGTCAGTATCATACCTTTCCAACGCCCAAAGAATGTACCGACCTT
+ATCGAGAAATGGATGGCCAGCGGTAAGCCGATCCGTTACCTTGTAACTGGGACAAGTATT
+AATACACTTTGCTCCATTGAAAGTTTTGAGTATGGTGAGCAGGATGGGACGGGGGATGTT
+TATTTTACACTGACACTTAAGGAATACAAGGTGATCCCTTCGTGATCAAAATTTACAGTA
+ATTACTTTGGGGGATCGACCGACATTACGATGTTTTGCAAGACCGTGCAGTGGTCCGGCG
+ACAAGTCGCAAGTGGCCCGGAAAATTGACGTAACTTTAGCCTATGCCATTTTTGACAAGA
+CCCAGCCCAATACCCAAATTTCGCCCGGCACCATGGTATGGCTTGTCGATGATGTGGAAG
+GTGAGATTTTTCGAGGTATTGTTTTTGTTCGCTCGCTCAATTCCAACCAGGAACTACAAT
+TCACGGCTTACGACCTTTTGATCTATTTTCTGAAGTCCAAGGCCACCTATAACTTCAAAA
+ACATTACAGCAGAGGCAATAACGGCGAAAGTTTGTCAGGAAGTTGGGGTGAGTGTTGGAA
+GTTTAGAGCCAACCGGTGTGAACATCAGCCTCATAGCCTCGAACAAAACCCTATATGATA
+TCATCATGCAGGCTTACAGCTTCGCGTCGTACTCCACAGGAAAGCAATATTTTCTCCTGA
+TGAATGGAACCAGTCTGAACTGTATTGAAAAGGGTCAAAACCTCATAAATTTTACGCTCG
+ACCCTAAGGTCAATTTAATCAATGCTGTCTATGATGACTCGATCGAACAGATGATTAATA
+AGGTGAAAATTTATAACTCCAAAAAGGAGTTTACCGGGCAAATCCTAGAGAACAAAGACT
+GGGAAAGTCACTACGGAATCCTCCAGGACACGTATACAATTAATAAGTCTAAAAACACCT
+TGATTGAAGCGTCGATCCTCCTTAAAGGGATGGAGCAGGAGGTCGAAGCCACGGCACTCG
+GTAATGTAAACGTCATCACCGGCACCGCCGTGAAAACCAATATTTTTTATGTCAGTGTTC
+TCCAAAACGCCACTTGGTATGTCGATACCGACGTTCACACGTGGGAAATCGGCACGAATA
+AATACACCATGAAGCTTAATCTCAAGAGCCATAATTTAATGGACATGAAGGAAGGTAAGG
+TCGATGGGGAATAGGGAGGCAACATGAGGTCTAAAAATCCATACAGCGAAATGATTAAAA
+TCATGCAGGACCAGGGAGCGAAATACAACCCCTTTTCGGTTCAATTGGCGACGGTGATCG
+CTACATCTCCGCTTACGATTACGGCTGGAGAACTTCAATTAGCCGGGGATAATCTATTAG
+TGGCCGATTTTCTGCTAACCAGTTATTCCCGACAGATTAACCTTCCAAGCCCAACAGTCA
+GTGGTACAACTTCAGATGGCACAATAACAAGTCTCAGCATACCAAATGCCACGCTAAATT
+TCACAGATGGACTCAATGTAGGTGACACTTTAGCCGTAGTTCAGGTCGATAGTTCTACCT
+TTGTTATTTTGGCAAGGGTTGTGAGTGTATGAGCATTTTTCCGCAAAACTTCGAACAGGC
+CCTCATCACATCCAACGGTCTGGGTTCTTCTGAGTTACCTCTGGCGAAAGAGTATGGTTG
+GGACTTTACTAATAACACGTTTCTTCTAATTGACGGCAAGAGTGTGTTGGTAACCGGAAG
+AGATGCCGTTAAGATTTGGGCTTGGAAAGCATTACAGACTCCAAAGGGTGTCTATAAAGC
+CTACAGTCTAAACTTTGGAAACGAACTGGAATCGCTGATGAATCAGAGCCTATCAAACGC
+AGCCATGTCTTCAGAAGTCGAACGGTATTTAAAAGAAGCGCTCTTAGTTAATCCCTATAT
+TACCGGAATCTCTAACATTACACTGTCTATTGATGGTAGTAAAACCAGCGTAGATTTTAC
+GGCAGAGACGATCTATGGTGAGGTGACCATGAGTGTATAGCGAAACCAGTAATGTGATTT
+TAAGTCGCATGCTTTCCAATGTATCCTCAGATGTTGACAAATCCGAGGGTTCTTTTATTT
+ATGATGCAACCTCTCCGGTGGCCATTGAGATTGCTCAGCAAGAGGCCAATCTCGACCAAG
+TAGCCAAGAAGTTTGATATTACAACCTTAAGCGGCGACGAGTTGGCCATGAGAATCTACC
+AACGGACAGGCATTTCCCGAAACCCAGCAACTTATGCCACGGCAGACGTAACCATAACAG
+GTAATGGAATGATTAATACTGGTGATTTGGTTCAAACACCTGGCGGAGTTCAGTTTAAAT
+CAACTCAGCAACAAACCATCAGCGGATCGGCAAGTGTTCATGTTGAAGCCCTCATCGCTG
+GGTCAACAGGCATGGTTCCAGCCAACCAGATCACTCAGTTTCCGGTTGCCATCGCTGGTC
+TTGTGAGCGTCACAAATTCTAATCCGACGCAGGACGGCTTTGACGCAGAAAGCGACTCAG
+CCCTTTTACAAAGGTACTATGATTATATTCAAACTCCGGCAACGGGAGGAAATATTGCTC
+AGTTTATCAACCTCATGAAAGACTTCACGGGAGTCGGTGATGTAAAATTCTATCCAACTT
+GGAACGGAAACAACACTGTAAAACTGGTCATAATTGACGTGAATAAACTGCCTCCCAGCA
+GTGATTTAGTCGCAGCAGCTCAGGCTTATATGGACCCAGGTGCCCAAGGACTCGGGCTGG
+GTGCTGCTCCGTTCGGAGCTTTTACCACAGTGGAAGGTGCATTCGCTAGTACAATAACCA
+TTAATTTTACAGCGGTTAAAGATTCGGATTATACCGATGAACAACGGCTCGCCAATGTCC
+AAGCGAATTTAACAGCTTATCTCCAGGCGATTGCCTTCGTTGATAGTACTGTTAGTTATG
+CCAAGATTGGGTCGGCAATTTTATCGAGCCAAGGGATCTTGGATTATACCAACCTAACGG
+TCAATGGAGGAATTTCTAATGTTCCTCTCAGCTATACCTCGGCACTGACTGAAACGCCGG
+TTCTGGGGGTGGTGACGATTGCTTAGCGATTCTCTTCCTTATTTCATAACGAGCACTCAG
+TTATTTACTGAGTTATTCCAATCTGAAGGGCAAGAACTGGATGGCCTGGGCGCTGATCTA
+TCCGATTTAGAAGCTCAATTTAACGTTGATACGGCAACATGGGGCTTGGATTATTATGAA
+AAAGAACTAGGAATACCCACTGATAACACAAAACCTCTGTCCTATAGGGCCAGTGTTATA
+AAGTCCAAGTGGCGAGGCGGCGGGAAGCTTAACTCCACCTTGATTAAAACCGTCTGTGAT
+GCCTTTACGAATGGAAATACGGAGGTGACGTTTGATGGAACCATTAAGGTCAAGTTCAAT
+AGTATTCTGGGTATACCACCCAATCTCAATGATTTAAAAGCAGCAGTCTCTCAGATTAAG
+CCAGCCTATTTGGAGCTGGTCTATTTGTTTTCCTATCTGTTGATTAACGAAATTCATCAG
+GTAATGACCATCAACCAGTTAGACTCAACCCCACTCAACGAATTTGCCGGAGGTGTTTAG
+ATGGCTAAGACAACGCCGAACTTGGATCTTTATGAAGTTGATCCTGCCTCAGACGGATCG
+CTGACCTTCAACATTCAGACCATGCTCAATGACAACTTTGACAAGATTGACTCAGCCATC
+CCGGCTGCACAGGCAGCAGCTCAGAGCTACACAGACTCCAAGTTTCCTGTTCAAGCTTCT
+GAATTGAGCAATGGTGCTGCCACCGATGCGGTGATTGGAAATCGAACTGGGGACCCAACG
+CTGGCTTCCCCTTCGAGCACCGGAACGATGACTCAACTCTTTGGTTGGTTGATGGGGAGG
+GTCAAGGCGATATCTGGAACGACAAACTGGTATGATCCTCCAGACATAAATCTAGCGGCT
+TTGAGTGCTCATAAATCCAGGCATGCGATAGGCGGCGCTGACGTGTTATTACCTTCAGAT
+ATTGGGGCTGAAACTCCATCAGGAGCACAGGCCAAGGCTGCCACAGCCCAAACGGCAGCT
+GGGTCTTATACAGATTCTTCGGTAGCAGGGGTTAAGTCGGATTCCATCAACTATAAACGT
+ATTACATCAATGGGAGGTCTTTATTAATGGCAGTAGGCGACAGAACGCCAACGGAACTGG
+CCCAGTCAGCATTAAGTGCCACGGCAACGAACTACTTCACCAACGCAGGGTCAAGTTATC
+GAACCCAGATCTTAGAGGTTTGCTTAGTCAATACTGGTTCCTCTCAACGAGTTGTAACTC
+TTTATAAAAATGGGTTGACTGCAAACAATCAGATCGCCAACTCTATCACACTCCCGGCTA
+ACACGTCAACCATTATTGACTTGAAACTTGTAGCCACCGGGGTACAAACGTTTGGAGCCA
+ATCAAGACTCAGGAACTGATGTCACGATGACGGTCAGCGGCATTGTTGAACAGATAGCGT
+AGGTGATGAGATGGGTATTCGATTATTTGGGGCTGTTCAAGGTATAAAGGCCCAGGTTCA
+AGGGTTACTCCTTGGTTTGGGAACGGGCGGCAATGCCAACGCCTCAGAGGTTCTTAGTGG
+AAAAGAGGTTACAACCGACGTTGGACAAATAACAGGAACCATGCCAAATGAAGGCTCCGT
+GACGCTTACGCCGGGGCCTTCTGACGTTCCTATCCCGAAAGGATACCACGACGGGACTGG
+AAAAGCCTCGGCAGTTGTTGTACCTGCAGCTAATGTCCTAACCGGCACGACAATCGCAGG
+GACAGCAGGGACCATGCCTAACGAGGGAGCTGTTACTATAACACCGAGCAATGCAGCCCA
+GGCTATCCCGGTGGGGTATCATAACGGATCTGGAACCGTCCCGGCAGTTGTTGTACCGGT
+AGCTAACGTCCTAACCGGCACGACGATCGCAGGAACAGCGGGAACCATGCCGAACCGGGG
+AGCTGTGACAATCACACCAGGAAGCACCGCACAGGCAATCCCAGCGGGGTATCACAACGG
+ATCGGGAACAGTTTCGGCGGTGTCGGTCCCGGCAGGGAATGTTTTGACCGGCACAACGAT
+CGCGGGAACGGCGGGAACTATGCCGAACCAGGGAGTGCCGACATTCACGCCGTCTACTTC
+CGGCGACACTTCAATTCCTGCAGGGTATTATTCAGGCGGGATAGTAAAGAAAGCATATCC
+TGTAGGAAGCATGGTATCGAACGTCACGGTCGAGCAGATAGCGTATTCAGCCAACCCCAA
+CAGTAGTGGCTCCTCGTATGGTATCGCTGTCGATTCGCAAGGTAATATGTATCTATGCGC
+TGGAAGTATACTGTATAAATACAACGCAGCGGGATCACTTGTGTGGTCAAAGAATGACTT
+CTCCTATTTTGGCGTTTTCGTAGACCAGTACGATTATATCTACGTTAACCACAACAATTC
+TAACCTCCATAAGATGGACGGTTCAGGTAATACGGTCTGGAATAACGCGGTAGGGGTGCA
+ACAAGCATATAATATCACCATTTGTAATTCTGGGTATATTTACACCTACGACGGTGGCAC
+AAGTACCCACCCCACAAGAAAGCATGACGGTTCCGGCAATGTAATCTGGACGGATACAAC
+AATTGGTAGTAACTCTTGGTTTTCAGACACAAATTTCAGTACCGAAGTGACGGTTATTTC
+AGGATACGTGAGTGGAACTAGCATGGCAATCAGAGTGGTAGATTCAAATGATTCGTTACA
+ATGGAATTTAACTGCTTCTGCTTCAGCAATGTCTAACTGTTCCGGAGCGGTTATGGGTTC
+GGATGGTTACGTGTACGCCAGAAATGGCACTCAGGTTGTGAAACTAAACAGTAGTGGGGG
+CCAAGTATGGTCTGTGCCTATAAATGATACCTACACCTTAAAAGGAAATATAGCCATTGA
+TAACTCAACCAACATTTATATTGTTGAATACCAAACAGGCCATAGATATATGAAAATCAA
+TTCAAGCGGTACCATTCTATGGACCTACACGGCATCAAACATGACCCCATACGCGATTAA
+CGCAAATCATAGCGGCAGCTACGCATGTGCAACTATCCCATACGCAGGAGGTACTGTATT
+TTATGGTGCTACCCAATATCTAATTAACGGCTAGGGGGAAACTTTAAATGATATTTTTAG
+GTAACTTAACTATCATAAATCCCAACAAATCGTTGGTCAATTTCATTCATTATATGCCTT
+TAGACACGGACCACGGGATGAAGGATACAAACGGAAATCTAATGACCCAGGACGAATTAA
+ACGCGATCGGTATTCTTATTGATTCAATACCGCAGCCAGCCCCGCCCAATGGATATTATG
+TCTCCGCAACCTATGTAGATCCAACTACGAAGGACGTATCATTCGACTACGCACAAACCC
+CTAAAACTCCTGAACAACAACTAGCAGATTTACAGGCCCAAAACGCTCAAATGCTCTTAG
+CCCTAGTACAAGGAGGTTTGATGTAAATGGATTGGGTATCGATTTGTACAAGTTATTACC
+AAGCAGGATATTATGACAATACTTCACTAAAAGTATTTGTAGTTAAAGGTAAGATCACTG
+GGGCCGATTATAAGACAATCACAGGCATTGACTATGTAGCTTAAATTTGGGAGGGGCATA
+AAAGCTCCTCTTTTCTAATAAAAGAAGGGGGAGATGACCATTGGGCGAACAGGATGATCT
+AAATACGCGAGTTGCTGTCCTCGAAACCAAAAACCTAGCTCAGGAAGCTAGGCTCAATTC
+TCTAGAGATCGACGTGGGAAAAAAGTTCGACCGCCTTGAGGCTAAGCTGGATCAAGTTTT
+ACAGGCTTCCCGTGGACGACCAACGTGGATTGTGGCTCTGGCGATTTCAGGACTCATGAC
+GATTGTTACAGGACTAATTGTTTATTTGGTGACCCGTTAAGAAATCACCGAAGAAGGTTT
+GTCTGCATATTCTAAATTAAACGATGATCCTTGGTACAGTCGAAGGATATAGCTCTCGAT
+CGATTGTACTGAGAAGCTTAAATAAGGATGTCCTATGATGGTCCATCTGAGCTCTTCAAA
+CATCTCAGGAAAGTTGGTTGAAAAATTTCAAAGAGGAGGGGTCTTGATTGGATCTATCGT
+CGACGATACCCATAGTTGTTGCTGCAGAGGCGATCAGTGCCGTGATCTTTGGTTATTTGG
+GCTATGCGAGAGGGGTTAAGAAAGAATCCATGCTGGATGGTCAAGATAAGGGAAGTATCG
+AGTCAGACATTAAGTATATCTTGAGAAGGACTGACGATTTGTTAATGGAGCAGAAGGAGA
+CCAACAAGAACTTTCATACTTTGTCCGAACGTCTTGCACGGGTTGAGGAAGGAACTAAGT
+TAGCTCACAAGCGTATTGACCAGCTTGAAAAAGGGGAACGACGAGATGTTAGAAGTCCAT
+GTGATTAAGCGGACGCTCACGGAAATTGTCATTGATCCTTCACACGCAGAGAGGAAAGAA
+TCGGCAGAATTTCGGCGAAGTAAGGAACGATTGAAAGCCGATGGACATTATAAATGTTGG
+ATATGTGGAACCACAGAAAATCTCCAGGTCCACCATTTTGGAGCTGAGTGGAGCTTAGAA
+AACGTGACGGATTTTGAAAAGCTCAAGGTGTTTTGTGAAGAATGGGACCCCTATGGTTAT
+GGGCGGCTTCTTAGAAACCTGCCCATAACAACCGTCGATGATGTTCGAAATATGTTGGTA
+CTCTGTCAGGAACACCATACGGGTGGTTCTAAAGATGGTGCCGCCAACGGAATTCATGAA
+ATAACCTTACCAGTATGGCTGATTCAGAAATTGGCAAAGCAAGGAGAAGATCCTGTTCCA
+CAAGACGGTGAGTCTGTAGAGAACGTGATTAAGAAGATCACGGATTTATAAATCGTTAGA
+CTTCTAAAGGGAATATCATTATTTAGTCTCCCGAATTAGGGTGGCTTTTTTGTATGCTAA
+AGAAAGTAATTTGTCAGAAATATATACTGATAGCTGGCTATAGGAGGTCAAATGAGCTAT
+TCAATCAAACAAAACTTTATTGCCGGACTACCTAAAGAACCCTATGACAACGGGCATTAT
+GTCGGAGTAGTTGCACACTCGACGGCCAATAACGGCGACTCCGCCGATGGAGAGCGCAAT
+TTCGAATCGACTACTTGGCAAAACGCGTTCGTTCATTTCTTCGTGGACGACCAGAAAATC
+CTTCAAGTTGCCGATACCAACTATCTCTGCTATGGAGCTGGCCACACTGCAAACCATTTG
+GGTTATGTTCAAGTGGAGTTGTGCCAAACAACAGATCCAGTTAAGTTCAAAGCAGCTTAT
+GAGAAATACGTTTGGTTGCTTGCAAAGCTCCTATATAATAGGAAGCTTCCTGTCGTGGAT
+GGGGTTACTCTGATGTCCCATGCTCAAGTTTCAGCCAAGTGGCATGAGACGGACCATCAA
+GATCCGATCGAATATCTAACAAGCCACGGAAAAACATGGGCTGATTTGGTCGCTGATGTA
+ACGGCTCAATATAACTTGCTGGAGGAGGAAGATAGAGTGTTAAACGTTGCAGTATTACTA
+TTCACGAAGGACGATTTTTGGAGTGGGAATGATGTTGCTGCTAAAAATGGAAACTGTGCA
+CTATTTATAAGAGCAGCCAACCAGTCCGTTCCGGCTGAGGCCCAGAGTGCCAAGCAATTA
+ATTGTTGTTGGTGGGCCAAGCGCCGGGCATCCGAACGAAGTCCTGTTATCTGGCAAGGAC
+AAATATGCGACCGCTGCTGCGGTTGCTAAGTATTTGGGACAATAAAAAAGGGGGTATTTT
+AGTGTTAAACTTTATTCTGGCTTCAAAAGTTCTCGTTACCCTGGAGACAGTTCTGGGTTT
+AATATTAGCGGATTTCATTTTTGGAGTGTTGCTTTCTCTTAGAAACAGTAATTTTAGTTT
+CAGTAAACTGCCCCAATTCGTTGAAACGAGCTTGGTTCCTTATATTGGTGGTCTTCTTGT
+GTTGGCTCTCTTTTCTAATGTAAACACTGAGCTAGGGACGCTGTTTTTCACGATTGCCGC
+AACGATTTCAGCGAAATTTCTAGCGGATATTGTAACCAAAGCGGGGCAGCTGTTTAATGG
+ATTGCAAATTCAGAGTCCGTTGACTGTGGCTAAATCAGATAGCAAACAGGAAACAGTTCC
+CGTACAAAATGCAGTCCAAACGACGGATAATGGTACTGCTGGAGATGCGCAGTAA
+>NC_018068.1|provirus_2072558_2098541
+ATGGAAGATAGATTACTCACGAAGGAAGAGGTTTGTGAGTGGCTTAATATCAGCCGAGCC
+ACACTCGATAGATGGCGCAATCAGGGTTTGCCCTATTTAAAGACTGGGAAACTTGTTAGG
+TTCAACAGAGGTAAAGTTCAAGAGTGGCTTAATCAGCAGACTCACAACCAAAAATGAAAA
+GGAAGCCGCACCCCATCTCCGCAAAAAGACAGTGCAACTTCCCACATGAAACCAACCTTG
+TAAAGGCTGAACTTCTCTATAAGTATAGCAGAATGGGCCTCTTTATTACAAGTGTTGGAA
+AAAGAAAGAGGCGAGGATAGATGACCACTTTAGAAAGTCAAGAAATGATCCTATTAGGCC
+GCCAAATAAAAATAGGTCCTGAAGCAGAACGGTTTAAACGGTATGAGTATCTCGTAGGTG
+AATTATTGTGGTCCATGCGCGAGGACGGTTTTAAAGAAGGGGTAAGTCATGCAATTAAAA
+TTTTAGACGAAGATTCCAGAATTTCATAGCAGTCTTAAATTCTTGAAAATCCGTAGTATA
+TAGCTATGGATTTTCTTTTAATTTAGACCCTTGTACCCTACCACTATGGTCTCCTTCTGT
+AAAATAAAATTTCATAAATTATCAAGCATCGTCAAAAAGGCCCTTCTAAGCCTCTGAAAT
+TAATGAAATAATGAATACCCCTTGCCCCCTCCTGAAAACGGCAGGAAGGGGGCATTATGC
+ATGTCTCCGTGAAATGTAGCGGATATCCAATGACCTTCAATATCATTTGAATCATTATCA
+AAATTTATATTAAAGAAGAACTATTAAAATTGATAATATGTGAAAATACTAATTGAAATA
+TCAATTAAAATTTGATATTGTTGAGGTATAATATTTTACTAAAGAAAGGATGTAACAAAA
+CAAATGAAAAACGAAACAAAATGGGAAGATCTACCGATTATGCTCAGCCCTATACAAGCG
+GGGAAAATTCTTCGACTTAACCCTGAAATGGTCCGAACGTTGGCCAAGGCGAAGGCTATT
+CCTGCCATCCGTCCAACGTCTAAGTTTCTGATTCCACGCGACGCTTTGAAAGAATGGATC
+GAAAAAAATTCACAGGTAGTGGAGTAAAATGGAAATTTCCACGAGGAATAATATCAAATA
+ATATCTCTAAATCCTGCGTTTCAATTCATAATCAATCAAAAGAGACACGCGATTTTGAGG
+AGGTATTCACAAAGCCTATGAAGAAGAAAGGTGGTGAGATATCTATGCCGGGGTTTATGA
+CGCTTGAAGATTTATGTAAGAGCGGAAAAATTGCCTACTTAAAGCTTGGAGATGCCGTTT
+TGATTAAGATAATTGATGAGAGGGAGAATGATGACGATGACTAAGATTAAAAAAATCCTG
+TTAACTTCTTATATATTGATTACCCTTATTTTCACAGCCGTTGCCCCAGCCTTCGCGTAT
+TACGGGGCTACCGGTGTCAGTGGGGAGATTTGGCCTCCGGTACTCACGGGGTGGACAATT
+GCTACTGGCGGGGGAAATTCAACGATTAACTGGCATTTTAGCGACCCACTTTTTGGTGGT
+TCGACCGGTGGCGGTATCCCCGATCTCTCGGCTCAGTATCCAGACTGGGATAAGCCGAAC
+AACATGGATATTGTTCTTTGGGCACAGAACCATCATTATCAAATGCCGCTGAATAGTAGG
+TTTTATTGGTTCGCACTTCACCCGACCGATAAACAACCAACAAACTACACAGGCCCAGCC
+CCATGTTCTTACACACCGCAAATTCAATCTATCATCGATGCTTCGGGCTACACTCCTGCT
+GATTTTTATAATGCGGGAAAGGCTCCGCTGAGTGGTTCAGCACCTAAAGCAACTACAACT
+TCATCGCCAGTCTCAACTCCAGCTCCAGCACCTAAAACAGTATCAACCCCAGTTGCTACT
+CCCGAACCCCCTGTTGTCTCTGGTCCTCCTGCACCCGTCGTTTCAAAAACTCAAACGCCA
+GTGTCACCAGAAGTTGCAAAGCAACACTCTGACCCAGTGAGCGACCCTTCATCATTAACC
+TATGCAACTATCACCAAAATCGACAATGCAAAACAAGCTGCGGATGATAAAGCCCAAACG
+GATTCCCTAAATAGGAAGCGATATATAGTGTATGGTCTGTTAGCGTTAGCACTTGTGGTT
+TCGATTGGTTTTGTTCTTTCTATCTATATCCGTGAATGGAGGACCAAAAGGAAATGAGAA
+AGTTAATTTCTATCCTTACGGCCCTCCTAATCCTGGTCTTTCCCGCCATAGCATCGGCTC
+AATGTGGGATTACAACTTGGGATTTCGACCCACAACGGACGGCAACCAGCATATCCAGTT
+CCAGTACCGATCCATGGGTTCTCGCGCAGGGATCAGGAAAGGTCGTGTCCTATGCTGGGA
+AACCCGTGGTCGTTCATATTCCCTCGATCGACGAATCGTATGCGCCTAACCCGGTAACGG
+GAGACGTTCCTAAAACTGGCGTATTTACCTTTAACCAATTCTCATCAACGACTGCCATAA
+CAGATCCCATCGGATACACGATGTACCAGTATACCTGGGATGATGGAGGATGGGGACATG
+TATGGAAGTATACGATTAAATCCGGTGATCTCGCCGAAGGCAATGTGATTACTTTAACAG
+CAGCCGACTTAATCGCTGCATTTCCTTGTGGCTATTCAGGAGGAACAAACTTTGCGAACG
+CCCCGTCGGGTGTAACCATTTCAAACGACGGGAATTTTGTGGCCGTCGGAGCTGGCAATA
+AGCTTTATTGGTGGCCCATCGGAAATCCGGGGGCAACGCTATATAGTTTTATAAACGGCA
+ACTCTGACTTCGACATGTGCGAAGCTTCACCAATTATCACCCCCAACGGCTATATTGCCG
+TCGGATGTGATAATGGCGGATTTGTTTCCACCGACCTCTCTGGCAATACTCATAATTTCC
+TCACCTCTGACTCAGTTCTTGGCTCAGGCGATTCTTCCGAAGCAATTACCTCATCGCCAT
+CATGGAACCCAATATCAAATACCATATGGTTCGGTATCGACTCATATTCTGCACCAAGGC
+TCGTTTCCTTTGATCCATCAAACGACACAAGCACAATCGTTGGTAAAGGCACTATTTTAA
+CTCCAGTTTTTTCCCCAACGCCCGTGGATAAGGTGTCCGGAGATGTGTTTAATACGGATT
+ACGGTGGAAATGCTTATCGTTGGAGTTCATCCGGCAATCTTATTCAAAAATGGATAACTC
+CGAACGGGGTAACGCACGTATGTTCAAACATGGCGATAGCGAGAGACGAGAACGGGAATG
+ATCATGTAGCATGGAAAGATATGAACCGTCAGCTTGAAAACGCCATTACTCCATCGGGGT
+CATTCTGGGTTGAATCGGGTGGAACAAATGCTCATGATGTAATGGATCCGAGCTTCGTGA
+CCAGTTCAGTAGGCGACTATATAGGTGAGGCTTTCGTTGATCCGTCCTCAGGGGAGGTAT
+ATTATTCGCCACAACCGAATAGCGCAATATCTACAAACCCCCATTCCTACGTACCCATTA
+ATCAAAATAATTATGGCGTCATAGGCGATTACATCGACATGGTTTACGACGCTGATATCG
+GTCCTGTAATGAGTCCAGCAAAATCAACGTCCTATACCTGGTCCAACGATGCAAATGGTT
+CGCCTGGGATTTTGATTTATCTCCTGAGCCCCGTTTCTCTTGAAATGTGCGTCGCTGGTC
+CAAGTGGGGTCGTATATGCGCCGCCAAACAAGACGATCACGGGTTTACCTGGAGATACAG
+AAAATATTACAATGTTCGCACCGGGGTTAGATTTGAGTGGTGATACCAGCGATGGTTATG
+GTGTTATTCATATCACCGGTTTCCCGGATGGTAGTTCAGCAGATAAACAGGTAAATTTCG
+ACTGCAATACCACAGACCTGATAACCGGTTCAGGGAGTGCAGCGGCTTTCGATTCGACTA
+GTATTACCTTGCCGACGTCTAGCGCTAATTACACGCTGACCTTAACTGAGACGCTCTATG
+TCAAAGATCATAGTACCGGAGTAATGGAACAAAAAGATTATCCATCACCGACGATAACGA
+TTAATGTTCCTGTAGTTGGTGTTGCCAGCCCGGGCAATCTCACAATATCGTCTTATCACA
+ATGGTGACACAAACAATTCGGGCATAGACGCCGGGGGATACCCAAACTTGGTAACTGGTA
+ACCCGTTGAAATTCAATTATGGCGACACAATGTTGGCTGATCTTGTAATCCCGGTCCCAG
+CGCCACCAGCCGGATGGCAATATTATTCATCAGTTTTAAGCGGGTTCATAACATATCCAG
+TAAATACGCCAAAGCCGACCGGCACAGCGCAAATTGGGGAGCCACTGACGATTGCTTCAA
+CAAAAACAGCGACCTTTTCAAAGAGTACGAGGGCTGGAAGTCAAGAAAATGGGGCATCGG
+TGAACGACAGTATTGCCAGTTTTCCTGTAGAATGGCCTACGTGGAGGCCACCGATTGGAC
+TGCCAGGGTACGATTGGGACTCAACATTAACAGCGACATGGACGCAAACCGTTACCTATG
+TACACCATATTAATACACCTGTGGGGGGGTTCTCACAGTATAGAACTTATACTCATAGTG
+ATAGCACCCCATCACAGGAGTTACAGAGAACAGGTACGGATATTTACTATATTCCCGCAG
+CGAGGGAGCCGTGGATGAGATAAAGAAAGGGTTGATTTGCGAAATGAAAAAATCAATAAT
+GCTTCTTGTTTGTTCTGTTTTAATTTTGTTTTCGGGCGTTTCAACAGCCCAAGCATTTGA
+TGATAGTCAGCATAATCTTGTTGGCGGAGTTGATGCTGCTTATCAAGTGGTCACTCCTGG
+TCACTCTTACACATTGGGTTACAAACTTTATGGAGTTGATTTGACGAGTGCCTGCAAATT
+TAAACTAGGAGAAAATCCCGAAACAACCCTATAAAATAAAGATCACCCAACAACAAATGG
+AATTATATGGACTTCGCAACCTCCAAAAAATGCAAATTGTGGTGTCTCTACCTATGGCAG
+CTTATCTGGTAATGTTTTTGTAATGCGCCCATTATCAGAAATCCCATTAGATTGTCGAAA
+TGAGGAAGATATAACTGGTTTAATACCGTATAATTTTTCATCTGTGAAACCTTTATCTGT
+ACATGTTCCGACACGAACTACTTTAACTGGAGTTAGCGGTGGTGGGGATTTAATTCGTTT
+TAGAATCCCTGGGAATGGACACACCCCAATACCGGCAAAAGTGAACATAAAAATAATAAT
+TTTGGGGGCTATTGGCATAGCACTGGTGTTCGGTGCTGCTGTTTTTGCGATTAAGAGTAA
+ACAGAGGAGGTCACACAATGATTAAATTTATCCGTTGACCTAGAAAGCCTTATACTTTGC
+GAAAGTCCTATACTTTATAGCTTTATTCATTAATTAATTCATTAAATGTCATGAACAATC
+TCAGCCATACTCTCGCAAGGCTTTCACGGATTTACTAATGAGGTTAAAAACGCTGTTTTT
+TCATGACTGATTGACGCTTTGAATCATCATTTGAAATGATTAATAAATGTGTATTTATAC
+CTAGCCTATCATTGCACGAATGAAAGTAGTTTTGATTTGTATGGACATAACGCGAATCAA
+AACTATTTTCAACGACTAAACATTCACTGCCACAACGGTTTCAGGCGTTTTAAAGTGCGC
+GAAGTATAGCACTTCGAAATAGGTGAGAGGCTCCTGAAAATGTCTACAATCTAGACTCAT
+ATTTTATTTCGTTTAATATTTAATTACCTATATATAAGCTATTAAATATTGAATGTTTAT
+ACGATATGGATAAGCTATTAATTTTTACTAAAAACACTCTATAACAACCTATCCTCACTG
+GGGGAAAATGACATATCATTTTCGCTCAATTTCAAGGATAATGTTTGATTAAATATCAAG
+GGGAGCTGTACGATGACACAAAAAAACAGAGTTATATCAGACCGAAATATGGAAGTTGAA
+ATTATGGGAGATATACTCGAAATCAGGATTAATCTTGCACGATCAATCGGTATGACCAGG
+AGCGAAAAAAATTTTTTGCTCGCCTCGTCCAAAGGTACTCTTCAGATTGGTCGTGATCGC
+GAGGAGAAGATGGTTCTTACAGTCTATCGACCGAAGCCGGCATAGGATTAATCGGATAGC
+TATTGAGAAATGAGGGCTGATATTGCAGGCGAAAAACATTGATGCAGAAATTCAGGGAAG
+TTTTTTAACAATACGAATAGATTTAACAAAATCCTTCGGCGAAACAAAAAGCGGAAAATA
+TGTTCTAATAGCTACAACAGACGGAATTAAACCAGTGGGAGATGGGCGCACTGAAAAAAT
+GACGATAACTGTATATCGCCCTAAGCCTTGAGTCAGCTCTCAAAGAGGAGTGGTTCGCAT
+AAAAATAGTAATAGATCGTTCCTATGCTAATTTCAGCCTTTCCGAGGAAGCCTGGACCGC
+CTACGGGAAGGAAAGACCTAAAGACTTAAACAGTATTGTCTTCCGATCCGATCCCGACCT
+GATTCGTGTGGTCGAGCAACTTGGGGAAAGGGCAAACGGTCAGTCACAGTTCGGTCCGAA
+AAACAAATTAGAAATTGTAGAAGTCCCAGATGAGATTCCGGTTCGCATTGAATCTTATGA
+TGGGAATGAGTGGGTGGCTGAGGAACATAGGGTTTGGGGGAAGGACGAAAAGATATAGAG
+CACCAAAAAACTCACCTATTTAAAAGGTGAGTTTTTAATCTGATTCTTGACTGAACCTGA
+CTGACTCTTGACTGAATGCTACCGAATACTTAGCGATATTTACGGGTTTTTATTAGGTAT
+TTTGCTCAACCCCCGTTATAATTGAAACCCGCTAATCCGCTTGTAGAGTGGCTTGTATCA
+ATGCTTTCAGGGTTTTAACCCAAAAGTTTTTGGACATAAAAATGGTGCGGTCGAGAGGAC
+TTGAACCTCCATGCCCTTGCGAGCACTAGAACCTGAATCTAGCGCGTCTGCCAGTTCCTG
+TCCAAATCTCTGAACGCTTACATACATAAGGATTATAGAGTTTTTAAATAACTGAAAAAT
+CTAGTGGGGAACTAATTACCTGTAATTGTTTGCTATTTTAGCACATAACTTGTCATAAAT
+AAACTATGTATAAAAAGAATAACAAAAATAAAAATTTTATACGTTTAGAAAATCCCGCAA
+ACTTGCTTATAGCAATACTTTCACTAATTATCCCTAGTGTGCTTAATATGGATAGTATTA
+TCTCAAACAATAAATCAAAATATTGTCCTACTTGTGCTAAGGAAATTAAATTAGAAAATG
+ATAGGAAAATCCAAAAAGAAAGATATTATAGTAATAAATTCTCGCAAATAGAAAACGCTT
+AAAAGTCACATATATCAATACTTTTAAAGAATAGATGTAATTTTGTATATATGAATATAA
+TAACAAATTAAAATATTGTCCAACTTGTGCAAAAGAAATTGAGAAAAGTAACTGGGTGGA
+AAGAAAAAGGAGACAAAGAAATAAAAATGTCACGAAATAGAAACGCCCTGAAATTCAATT
+ATAGAAAGGGTTTGACGATATATAAAACAAAACGTATTAATAATGGTAAAGAAATAACAT
+AGTATTATCAATGCTTCCAGATTACATTGTACTTTGTTTCTCAATGGTCACTTAGGGAAA
+GAAATATCAAATGTTAAGAAAGCAGTGAAGTTTTAGAAGACCCTTATACACCAACCCTTT
+CAGGATTCATCAAAATCAAGAACATAGCAATATTAGTATTTGTACTTTATTTCTTAATGT
+CCTATAAGGGAAGAAATAAAATTTAATCGCGTTTTAATCAAAATTATCAAAATTAGTGTA
+AATCATAAAAATCACACCCTTCAATCCCTTATGTGGCAATGGTTTCAGAAATTAGTTAAA
+TTGCTGTATATGGGTATATAAGCATTTTTCACGTAATTAGTTAAAGCGGATTCTACAGTC
+CTACTCGCACAACGGTTTCAGGGCTGTCTATCTTCCTTGTATATGGTATATAAACAAATT
+CAAAATATTTGCTTATTATGATACTAATAGTAGCCAATCAAATAATATAATCAAATTAAA
+TAATCATTCTAATTATGAATACTAATAGTTGTCTACCAAATAATATTTACATTTAAAATT
+ACCAATGGCTGGTAAAGTGATAAGTATATTATATTAGTGTTTTTGTACATAAAAAGCGAG
+AAAATAGAAAACGTCTAAAACTGGCTTGTGACAAGGGTTTGATAATACATAAAACAAAAC
+GTATTAATAATGGTAAAGAAATGACAAATGTGAAGTTTTAGAAAAACCTCTTAACCCATA
+TCCAACAATCATTTCAAGGTTTGTTACAGCCATTCTAATATGGATATAGTTAAAAATCGT
+GGAAGGAAAACAGAAATCCTCTGTATCCCCACAGATACAAGCGATTCCAGTCACGCTCTA
+GCCGTTGTAATGTGGATAGTATTTTAATAAAAAGTAAAAAAAATAAAAATGTTCGAAAAT
+AGAAAACGCCTGTAACTACACTCCTGTAATACTTACAGAGGACACATGTATTTTCTTAAC
+TTATGATATATAGTATTATTTTTTTTATTTAACTTCTTAATTAACTTTTTAACTCGATTA
+TCCTCCACCTTCAGCAAGTGGATTATAATACATTACTAGTTGAAAAATTTAAGTCATTTT
+ATTCCGTTGCGTCTCGTTGGGTAGCTAGACCTGACTCCTCCAAAACAAAGGAAAGACGAT
+AAGCATAGTGAGTATTCTATGCAAAGGTGCGACCTAGTTGTTGCACCTTCTTCTTTATGT
+TTAAATATCAATTCTAAGTTTCAAAACACCATCAATTGATGGTAAATTTATACCTATCTT
+TCTTAGTTGGTATAATTCTATACCCATGATAAAAAAGTATAGAAAAATCAATTTAAATGA
+CCTTCTAAGGCGTTACAAAATGATACCCCTTACAATTACCCTACTTAACATTTTAAACTC
+AATACAGCCGATTTAAAATGAAATATTGATTTTTACCATACCCGCAAACCCTTGATATAA
+GCCATTTTTAAAAATGCCATTTTTTCATCATTAAGGGGATTCCACCCCTCTTTTGATGAA
+TTAAATATATCCCAAAAAACGAATGGAGGTGAAACAAATGACAAGTAAAATTGTAAGATT
+TATAACTATTAATTTTTCATTAAATCCAAAATATTACATTGTAAAATATGGTTTGGAAGA
+TATTGCTAAAACAATTGAAGATTTCAGAAACGATTTAAACAAAAGGAGATGAAACAAATG
+AGATTAATTAGATTTATGAGACATCCAATAAAAAATGCATTAATAGCAATTCAAGTAGTT
+GGTTCTATATTGCAGGAATACCCAAAACAAACCTTAATCTTTATTATAGTTTATTGCCTA
+GTATATTACTTAAACTATTAAAACGGAGGTGTGACAACAAATGCCAACAGATACACTAAA
+AACATTTTACATAAAATCAATGCGACTTGCAGGTTTCTTAATGCAAAGGGGCTTTGTCCT
+CCATAGCGTGATACCTGATAGATTTGATACTGCTATGCCCAAACGCAATGTATTTACATT
+TACTAACTGTCCAGAGTTAATTGATGCTATAGACGATTATAAACAAATGAGAGGAAGTGT
+ATAAAAATGGAACAAACATTAAAACAAATAGAAATGCAATTACTCCGTATTGAAGCACAA
+CAATTAAATTTCCACCTTCAGATGATGAATATGATCAAATTGATCAATCAAAATTTAGCC
+AAAATCAAAAAGTAATCCTTTGCTAGAGATAGCAATTTTTTTATGCCTATTTTTTATTTA
+ACTTTTTAAAATCTGAAATGAGGTGGTGAAATGGACTTAAATGCAGAGCTAATAAATCAA
+GTTTTGGGGCAAGGAATATTCGCAGTTTTATTTGTTTGGTTGCTTATGTCTGAAAGAAAA
+TCTAGTCAAGCAAGAGAAGATAAGTTGATGCTCCAACTAGAAAAATCTAATGATGTTTAT
+ACGAACGTCATTGAAGCGGTAGATGCCCTTAAAGATACTATTATGAAACAAAAATAAAGG
+AGAGATAACGAATGGAATTTACACCTGAACAACAAGCCCATATTGATGGATTACTTACTG
+AGCATAAGGAAAAATGGGAAACTGAAATCCTTGCACCTTTACAAACAGAACTAGCAGGAT
+TAAAGCCAGTTGCCAAAACAGATAAGGAAAAAGAGATTGAAGCCAAGGAACAAGAACTAT
+GGAATAAAGAAAAATCTTTACATATCAAGGAAAAAGGTCTTAGTGATTTTGCTGAATTCT
+TTAATGCTAATACCATTGAAGATTTAGATATTCAAGCGGAAAAACTTAATAAAATCCTAG
+AAGCCAAAAAACTTAATAATGCTTATGTTCCTAGCGGTCATAAAACTGCTGATGCTTATG
+CACAGGCAGAAAAATCAGGTGATACTCAAACTATGATAGGCAGTAAACTGTCTAAATTAT
+TCTCTTAATTTATAACTAATATTAAATAAAAGAAAGAAGGAATTTTATAATGATTACAAC
+TGCTAATTTTACCTCTTTGGAAAATATTAACCTTGCTAAAGAAATAAGTTTGGTAAGTCC
+GCTAGATACTCCTTTCAGCACCATGCTTTTAGGTGGAGGTAAATTCGATACCACTACTTC
+AAAGATTGATACTTGGAGAACAAAATCCCTTGATAATACTGCTGATATTTCTCAGGTTGA
+AGGTTCAGAAACTTCTGTATTCCAAGCAAGCGCAAGAGCAGAAATGTCAAATGTTTGTGA
+AATTTTTAAAAAGGCAGTTTCTGTTTCTGGAACTGCATCCGCTTCAGGTATCACAGGCGT
+TCCTAACTCATTCGCTGAGGAAATCAACGACCGCTTAATCGAAATGAAAGTTTCGATGGA
+GAAACAACTTATCAATGGAGTTAAAAATGATGGTTCTGCCACTCCTTTTATTCGCAGAAT
+GGGTGGATTATTTTCCTTTGCATTGGCTGAACAATCTATTTCTAATGCTACTGCTGGAAC
+TCTTGCAGAAGCAGACGTAAAAGACACTGTAAAAGCACTTTGGACAGCAGGAATGGCTAC
+AGGTCAATATATTGGCATGGTTAATGCTGACCTCAAAGAGCGTATTGATGCTTTATATGA
+TGGAAAATACAGCTATATTGCACAAGAAAATTTGTTTGGGCTTGTAGTTTCTAGCATTGC
+TACTAATTATGGCACAATCAAACTCTTACTTAATCGTCATATGCCAGTTGATAAAATGGT
+TGTATTTGACCCTGCATATCTTAAAATTGCTTATCTTCGTCAACCTCAATTTGAGATGTT
+AGCAAAGACAGGTGACTACACTCAAGGTCAAGTAATTGCTGAATTGACTTTGAAAGTTAT
+GAATCCTAAAGCAATCTCAGTTTTAACTTTTGCCTAAAAGGTCAGAGTTGGTCAGGAGAG
+GGTGAAATATCCCTCTCTATATTTTTATTTAACTTTTTAACAATTTGAAAAATGAAGGAT
+GTTTTTAAAATGCTGATGACAGAGGAATTAACGGAGCGACAATATTATACATTTACAAGG
+AAAATCAAAAAAATTAAACTTCGACAAATTGCTGAGGTACTTGGATGTAGTGTGCCACTT
+CTCTCAATGTGGGAGACAGGCAGGACAGACATAAACGATTATTACGTCAAAAATTACAAG
+CAATTTATTGATAACAAATAACCTATAAACAAATGAAAGGGGTTGTATTAATGTTTGTGG
+TCGATAAGGGCAACAACGATTGCCTTCTTGATTCTGTAAAAGAGAGGGAGGGTGACATTG
+TGATTTAACCATAGCATGGTTAAATTTTACGGTACATTATCAATAGACAAACAACATATT
+GAAAATGAAATCCAAAATAAAGGAGAGATTTCCGCAATGGTGTTCTGACAATGAGGACTA
+TGAGTTGATGCTAACGGATGATATAGATAGTTTGGTTAGTTGCGCTTTACTTAAAAAAAT
+TAAAGGTTATGAGACAAATTACTATTATGATTTTCAAACTATTTATGAGCTTAAAGAATC
+AGATGTTCCTGCAATTGCAGTTGATTGTGATTTGGTTAATGGAAGATGTTGGAGTAATCA
+TGTAACAATGTTGTCCGCTAAGGACAGTGTCAATAAAAAGAGTGCCAACTTAAACAATAT
+CGGAAAAATATCAAGAGATAATTACTTTCAAAAGTTTTGTGGTAGCACAGCAATTCAGAT
+ATGGAGTTTCTATGATATTCCTCTACCAGAGACAGAAGAAGGTAAGATGGCTTTACTTTG
+TTTAGATGTTGGATTTAAGGGACACTACGATTCAAGATTCATTGAGATACATTCGAAATA
+TCTCAAGGCACTTGGATTCCCTGAATTAATTGAGGTGCTAGAACGGCACACTTCAACCGA
+ATTCTATGATCTGATTAGGAAATATAATATGGCAAGCAAAATAAAACTTAATAAAAATGG
+TATGCTCACCACTGACATAGACATTGCAAATTTGCAGTGTCTTTTTAGTTTGGATTTATC
+TCGCCCTGATAAACCATTCTACATAAGAAGAGAATTTACAAGAGATTGGCCTACATGTTT
+AGTCAACTATAAGACATATACAAAGGATGATTTTCCTGAGATGTTTAGTGTGGCTCTAAT
+TAACAGAAATAAGGTTTGTTTTACAAAAATTAAATAGAGTTTTGAAAGGACTGGGTAAAA
+TACTCAGTCCTAATATTACCAAAAATGTTCGAACAATTATTCTCAAATTAATTGTAATGT
+TCGGAATTATCATTGACCTTAAAGAAAAACAAGAGTAGAATTTTGAAGCGAAGGAAATGA
+ATATTCAAACAAATGAAAGGAAATGCTAATGAGAGTTTCAGATGTGGTTACTATAAAAAA
+GGTTAAATCTTGGATGCCAGGCGATGTAATAACAATAAAAGCAGGTACAGGAGTAGGTAA
+ATCATATTTTATAAAAAACAATCTATACGCCTTAGCCAAAAAAGAGGGCAGTAAAATTCT
+TTTATTAGTAAATAGAATTAATTGTAAAGATCAATTTGTAGATGAAATTGGTAAGGCAAA
+AAAGACGGATATTATTGATATTAAAACCTATCAATATATCGAAAATAAAGAAGCCAATAA
+AAATTATTTTGATTTCAGTGAATATGATTATATTGTTTGTGATGAGTTTCATTATTTCAT
+GAGTGATGCGGCATTTAATATCAATACCGATTTATCTTTAAATGCAATTCTTGCCCAAAC
+TTTCCCAGTTAAAATATTTATGAGTGCTACGGGCGATTACATGAAAAATTATATAACTGG
+AGTTAGAAAAATAGAAACGATTGATTATGAAGTCCCTATTACATACGATTTTATTAAAAG
+TTTAACCTTCTTTAATAAAGATGAAACACTAGAAGCATTCATAGAAGAAGCAATAGCAAA
+GAATCATAAGGCCATTTTCTTCATCCAATCAGCCACAAAAGCATATGATTTGTACAAAAA
+ATACAAAAAGCATTGTTTATTCAATTGTGGTAAAAGTGATAAACATTACAAATATGTGGA
+TAAAGAAAAAATCAAAGAAATGCTAAAGAAGGAAAGATTTGAAGATCAAATTTTAATCAC
+TACTACCTGCATGGATACAGGGGTTAATATAAATGACATTGACCTGTATCATATTGTTTG
+TGATGTTAAAGATATCGGCGTTTTAGTTCAGTGTATAGGCAGAAAACGCCTAGAAAATAA
+AGATGATAAAATTTATTTGTACGTTAAAACTATTAATAATCAATCATTAGGGGGCATGGA
+AACCCAATTAAAGAGAAAAGTTAATATGGCTGATTATTTGCGAGAACATACCGTAAAAGA
+ATATCTTGAGGAATACAAAAGACAATATGATACCAGTAACATTGTCTATAATGACACGGT
+AAAAGAAGATAATAAATCAACACTAAAAGTAAATGAATTAATGTTCTTTAAGGTTAAAAC
+AGATTTGGCTGAATTAAGTTTCATGAAAACTTATGGTGATTTTGGTTATTGTAAATATCT
+TGCGAGTAAATTTGGATTCCGAGATGATAACGGATATTATAATTATCGGACTATTGAAGA
+AGATTATCAAAAAGATAAGATTGTTAATTTTATGGCAAAGGTTGTTGGCAAAAAATTAAC
+AAAAGAAGAACAAAATGAATTGATTGATATAGTTGATTTAAGAGATTCTAGGAATAGACA
+ACAAAAATCAATAGGACAATTAAACGAGTATTTTAAAGCAAATAATATAAAATATTTTAT
+TATATCTAAAAAAAGTGGTCCAAAAAGATATTGGGAAGTAAAAGAAGATAATGCGCAAAA
+CAAAATGGGACAAAATTTGGAATAACCTCTATTATAGGTTTATCCATAAATTGTCCCAAC
+TAATTATTATATCATATTGCAAATATAATTCAAGAGTATTTAATTAAAAATAAATATAAA
+AAGTATTTGGCAGTTGCCCACGGTGGGCAAATGCGAGGTAATAATTTTGATATTTGCTTG
+GGTTTTGCGACCTTGGGGCGCGAAACCATAGCAAATTCAAATTATTGCCCAATGCCATAG
+GCAAAAGTTTAATGTAAATCTTATTTCAATGAATAAGAACACAGGGCGCTTACCAGCGGG
+GTATGTCTGTCGGGTGCAGTGGCTCCCGCCAGCCATAAATATAATTTTAATTGTTTTTAT
+AATTGGTTTCAAGAAAAGGTACTTCATATTGAGGTGCCTTTTTTTGATGTCACTAAGAGT
+TACCATTACAAAATAATTATAGGAGTTGATACAAATGACTTTAGACGAGCAATTAGCACG
+TACAAATTTAAAATATAAACGATATTTTCGGTGGAAATTCAAACTATCTACAAGAGGTAG
+AGCATATAAAGAACGTCCGTTGGAAGAAATCATGAAGATTGATTTAATAAAAACAAGGGA
+AACATATTACGCTTGGGAAAAAACGGAGGAATATCAGAACTTAGTCAATTTACTTATTAT
+GTCAAATGCAGGTAATGATTTATTAGAAATTTATAATGTCATGCTTGATAAAGCAAAAAA
+AGGTGATGCAAAGGCAGTTGATACTGTCATTAAACTTCAGAAATCTATTGCATCAAGCAT
+TAAACAGAATAGTAAAGATAATAATTCTGCTCCTGTTGAAGATGAAGAAGATGATCTTGA
+ACTATGACAATGAAAAAGGAAACAAAATTAGAGAAGATTAATAAGGACTTCTTTTTGTGG
+GCTAAAAACTTTGTTCAGATTATTGATAATAATGGAGATTTAGTTAAGTTTGTTCCGAAT
+GAGCAACAGGTAGAATTCTTTAATGGCATGGATAAGTTTAATATCATCGCCAAGAGCAGA
+CAATTAGGTTTTTCAACTTTGATGATGATATATTGCTTGTGGCTTGTTTGTACCAGACCA
+AATACTAATACTATGATGGTTTCTTATAATGTTGAGAGTACACAAGCACTATTTGAGAAG
+TTGAAAATGATTTATGCAACTATTCCTGACAAATATAAGCCAGCAGAAAAGCGTTCAAAT
+AGAATGGAATTATTTTTGGAGAACGGTTCTAAGGTAATGGTAAAGACCGCAGGTAATAAA
+TCCTTGGGGCGCGGAATGAATTTACAGTATATCCACTTGTCAGAGTTTGCTTTTTATCCC
+GATGACCAACAAAAAGATTCATTAGTGTCATTAGAGCAAGCACTTGCAAAAAATATGGAT
+TCAATGATTGTTGTTGAAACTACTTCTAACGGATACAACTATTACCAAAAACTATTTACA
+AAGTCCTATAAGGATAAATCGAGCAGATATAAAGCATTTTTCTTTCCTTGGACTTCTAGT
+GCCACTGTAAGCCAATTCAAACACGAGTTAAACATTGCTGAGGATTGGTTTAAGGCCAAT
+AATCATAATCATAGATTGATACCTGAGCAATTAGAGAAGGATGAATTACCTTTATATAAT
+GCTAAAGTTAGTTTGAAGATGATAATGTGGCGTAGATGGAAACTTCAGGACATGGCATTA
+GAAGATTTTCAGCAGGAATTTCCCTTTACTCCTGAAGAAAGTTTCAGGGCCACAAGTCGA
+TCAATATTTAATGAGCAAGCAATTAATAATAGTGTTATGAATCTACTTCCTCCATTGAGG
+AAAGATGAACTAAATATATCTCTCCCTGATTCCCTTGCTAGTTATTATGGCAGGGGTTTT
+TATATGTTCAAAAATGTTAAGCCAGGAGAACGATATTATGCAGGAGTTGATACTGCTTCA
+GGTAATGGTGGAGATAATTCAACGATTAGTGTTTATAGTTCGGAGGGTGAGCAGGTCGCA
+GTGTTTATGGATAATAAAATACCTATCTATAAATTTGCTGATGTTGTTTATGACTTGGGC
+ATGATGTTTAACTATGCCTTTCTTGTAGTGGAGAAAAATAGTTTTGGTCAGTCAGTCATT
+GAGAAGTTAAGGTCTGAACGCCAATATTTAAACATGTACAAGATGAAAACTTTTGATGAT
+AGAGGTAAGAAAAAGTATATGGTTGGTTGGATTACTACAGCAGTTTCAAAACCAAGGTTA
+GTCCAAGATTTTAAAGAGCAATTTGAGAAGAATTTGATTTTGATAAATGATAGCAGCACT
+CTTGATGAAATGAAGATTTATGTTGAAGCCGATGGTAAGACATCAAATAAGCGTGGAGAT
+GATTTTCACGATGATTTAGTAATTGCTTCAGCATTGGCAGTTCAGGGGCTTAAATGTGGC
+AAATGGTATTTATAAGAAAGGGATGAAATAAATGAATCTACAAGAGTATATAAATGCTTA
+TTATGATGGAGATGAGTATTGGTTTATACAATTTACCAATTACAGTAATTCTCATGTCAA
+TGTAAGTCAGCAAAATAATGTACCTTATGTATATAGTAATCAGGAACGCATCATGAACAT
+TATAAACATTAAAGATTATTTAAGTGGCAAACATGCCATTTTAGATAAATCGGTTGAAAT
+GTGGAATGGGAAAGAATTCCATCCGAGAACTATTGTTTTGAATTATGCCAAGACGATATT
+AAACTTCTCGACAAGTTATTTGCTCAAGAATCCTGTCACTATATCAGGAGATGAAGCAAG
+TGTACCTATAGTCAAGGATGTTTATAAAAAAGGCAATTATAATAAGATTGATTGGGACAT
+TTTAGATAAGGTATGTAAATATGGGTCAGTGGCTGAGTATGTTTATATTGACAAAGACAA
+AGAGATTAGAAGTAAGTTAATACTGCCAGAGGACAGTTATCCTGTTTACAATGATGAGAA
+TGAATATATTGGATTCGTTGAATACTTTACTTCGATTATGAATGTAAGTTACTGGAATGT
+TTTTACTGAGGATAAGGTATTAAAGTATGATGACTTTGGTGGAGAGATAAGATTAGTAGG
+TGAGTTTAATAATCCTTCAGGTTTGCCGATTATTTACAAAAATAAGAATGAGTTAGATGA
+AACAGCAGGGCGAAGTGATTTGGAGGATTATGTAAATATTGTGGATGCCTTGGAGGATTT
+AATTAGTAAATATACGGATTCAATTTATAAGTTCATTAATCCTATACCTGTAGTTGTCGG
+GCAGAAGTTAGGCATCGGTAAATCAGGTGAGGGTGCTATACCTTCTACATTAGTAGGAAC
+AGGATTACAGTTAGATGATGGTGGACAGTTTAGTTTTGCTAATGGTCAATTAGATTATCA
+ATCCTTTGAATCAGTTTGGAAGATTTTATATAACTCATTACTTCAGGTTTCTAGTGTTCC
+GGCTGTATCTATGGGTGTTCAGGACGTTAGCAATTTATCAGAAGTAAGTATTAAGTTATT
+GTTCTCTCTTGCTGATTTAAGAGCAGGTATGAATGAGATGTATATGAGAGAGGGCATAGA
+ACAACGATTTAAGGCGTTTGAAACATTACTTAAAGCAAAAGGTATAGTGATAGATGCTAA
+TGCTTTAGATGTAGTATTTGAATACGCAAGGCCAATGAATCAGACAGATATAATCAATGA
+TCTAAAGACATTAAGAGATATGGGTGCTATTAGTTTACAGAGTACATTAGAACAGTGTCC
+TATGACATATGATGTGGCTATGGAGTTAGAGAGGATTAAGAAGGAAGATAAGGCAAAGGT
+TAAGAAGCAACAGGCACAACAACAAACATTTGATAATAATGGGAATGTGGTTAGTGGAAG
+TGATGCTACCAATAACAATATAAATACAGATAATGGTAATGTAAATGGTTAAGTGAGATT
+AAGTGATACTAGATATAGTGGTTAATTTGTTTTGTTAATACTAGATGTAGTGTTGCATTA
+AGTTATGGATTATATAAGCGTTTGATTATGAATGTAATTGTTCTAAAAAATCGCGCGTGT
+TATAATATCTATATACCCATATGGGGTATAATTACTATAATTTTGCTGTATTCAATATGT
+AGGTGGCACTCACTCACTGACATAATAACCAACAAAAAAGCATAGGTGCTTCAAATCAAG
+AGCATCTATGCTTAGATACATTGTAATTATCAGAATTGTTTATTGGGTCCGATAATGAAC
+ACTATGTAAAGTAAAATATGACACAATAGACATTGTGTAACATTAGGTAAAATGGCTACA
+ATCCGCTTATATCAAGGGATGTAGGGTTTGGGGTATTACTTGCCCATTTACTTGTTAAAA
+TCTAATTGATAATGACTAGGGAAATTCCACCACTCATGGACATTTATAGGGTAATTATAT
+AGCATCAAATTGAAGTTTTAATGGAAATAGGGGGCTGATTCGATACCCCTTTTCTGAAAT
+GAGTCGCCATAGTTAATCCAATTTTACACGTTCAAAGTAAATTTTGAATCCTCAGATTCA
+CTTGGAATAAATTCATACCCACAAAACTCACATTTCTCTGTTCCATAAGGAGAAAACTCC
+CCACACTTAGGACACTTTTTTTCATTCCTCGAAATTATTGCAGATATTAAAACCCCAAGG
+ATACTAAAGAAAAATCCTGCAAAAAACCATGCTATAAAAGAACGATGTTTTGCCCATGCT
+ATTGCTCCACTGATGATTCCGCAGATTATACCAAAAATAAACCATAATGACATAACATCA
+CTTGATGGAGTAATCAAGTTGAATTCCTCCTTACTACTTAAATACAATTTGATTCAAAAC
+ATCCGCTTAATAATTTCTTTATATCTTTTATCATCTATTTCTATTAAACACTTTTTACCA
+TTTTTAAACTGAACAGCTAAAGTATGGATACCTTTAGATTTAGCAGAAAGACCTGCTAAT
+AATCCAACTGGGCCTAATAAAAATCCTCCAAGCAATCCTCTGCTTATTGCACTTGAAGCA
+CTTTTTATGCTTTCCTCCGTAACGATTTCATAGTGTTCCACATTTGATTTACTAATATCT
+TCAATGTTATATCCCTTTGAATCTTCAATGTATACTAAACCAGTCGTCCACCCAATGCGG
+TAATTAAAATAATCACCAGCAATAACAATGTTTTTTGCACTCATCTTAAATCACTCCTCG
+TATAATTAATTTAGTTCCTGCCCCACGAGTCCAAAAAACTAATGGAACGTGGGGTATTTA
+AATGACCAAAGAAAACTGGAAATTCAGTTGGTTGGTCATCATCAACAAGATGCGCGCAGA
+ATAACGCATACCCCATGCAGTCGTCGTGCCTGTGGGCAGTGTGGACAAGTCAACCCCAAA
+GCACACTTCAAATTCGACTTGTCCAAAGCCTGAGGGAAAGCTCTTTTAAGATAGACCCAT
+AAGGGCTTTTCCATAGGCTGGCACTGTCCACAGGCTCAGGATAAGGAATACCTGAGTAAT
+GATTCCTTAAGTCGTTCTTTGACAACAAAAAAGTATTTAAGTTTGTTGGGGTTTCAGGCA
+AAATGATACCGTGAGGTTCGTTCTGGTAAGGCCTTTCACTCCTTGAGGCTATGACCTCTT
+ATTAAGTCTGACTGCCAGCCCACAATTTGAACTTTTAACTCGAAGGTTGCACAGCTTAAA
+GGGAACCCCTCCGATGGTAGCAGATCGGTTGGATCCGAGGTCTTTTTAAGACAAGTGCTG
+ATTCGGCGAGGTTGTTGACCTGTTGTGGTGCCTGGTCCCAACGTTAATCTTACAAATTCT
+TCGACTCGGAAAGTGAGGTGATTTTACTTGAGTTTATTTGTCGGTATAGATGTGAGTTCC
+AGTGATTTTAAAGTGCGAATCTTAGATGAGCGTGGTAATGAACCAGTTAAAAGGCTAAGG
+GTTTTGAATGATCAGCCTGGTTGTGAGCAAGTTGCCCGATATCTCTCTGAAGCCTGTAAT
+AAAGAGAATGAGGACCGGCTGGTTATTGGTTTAGAGGCCACTTCCGTGTACAGTTGGCCG
+TTACAAATGTTCTTAGCGGAAGACCATTGTTTAGCACCTTTACAGCCCCAAATTTATTCC
+TTTAACCCCAAGGTCGTTGCTAATTTCAAAAAGGCTTATGTGGACCTTCCGAAGAACGAC
+TGGATTGATGCCTGGGTCATTGCCGAACGTTTACGCTTCGGCCGGCTCCCGGAGGGCTCT
+CAGGTCGATTTCCGCTACTTACCGTTACAGCGACTCACTCGCTTTCGTTGTCATCTGATC
+GAGATGATCTCCAGAGAGAAGAATTATTTCCTCACGAACTTGTTCTTAAAGTTTAGCACT
+CTTGCCCAAGGTACGGTTTTTAGTAATACTTTCAGCGTTACTTCTGAATCCTTGACACTT
+GAGTTTTTTTCTCCAGAAGAGGTTGCGGCTCGACCGCTTGATGAACTGATTGATTTCCTC
+ATGGAGAAAGGAAGAAGTCATTTCGAGGATCCGGAAGCCAAAGCCAGAGAGTTGAAGGAA
+GCCGCTCGCAAGGCCCATCGACTACGTGGAAGCCTATTGCAACCCATTAACCTTATCCTA
+GCCACGAGCATCGAAACCATCCACACTTTAGAGAAACAGGTCAAGAAAATCGATAAGGCG
+ATCGAAGCTGAAATCAGGCATTTCCCTAATACGCTCATTACCATTCCCGGTATTGGCCCT
+GTGCTTTCAGCTGGTATTATTGCTGAGATTGGAGACATCCGCCGTTTTCCGAATGAAGGA
+GCCTTAGCAAAGTTTATTGGGCTAACCTGGCGTTCTCACCAGTCCGGTGATTTTACAGCC
+GATGACACGCCCTTAACTCGAACCGGCAACACCTACTTGCGAAGTTATATCATCCAGGCT
+GCTAACCTAGTACGCCAAAAGGAACCAGAGTACAAAGCCTTCTACCAACGTAAATTCTCG
+GAAAGTAAGACTCACCATCATCGCCGTGCTCTCGTGCTTACTGCACGCAAACTCGTCCGT
+ATGGTTGATGCTCTGCTACGCAGCAACCAAATCTATATGCCACATGGCAATAGGGGGATT
+GCAAACTAAGCATGAACTACGAGAATTGAAGTCCCATTTTTGTAACTTGTTTCCATTTCA
+TTTTGGGAATAAGAGGGTTTTTTATTGCCTTTTTTGCCAACGGATAACTAACTTACTGAA
+AAATTGACTCACTTAGGGTCTTGACATATTACCGAAGGACTTAATTTTGAACCGCGGTTA
+ATATTCCATTGTCAAAATACAAATAACCTCCGTTATCATATACCCATTGCTCATGTGTAC
+CGTTAGCAGTAACCGTTCTATTGACCTCATTTGGTCTTCCCCACGAAGAATCTAAAACCT
+GTTGTTGAGTCATTCCTATTCTGACACCTTGTGTTTTCGCTAATGCTTTAGCTTTTGCTT
+CTTCCTCGGCACGTTTTTGAGCTTCTAACTTGGCTTGAGCATCTGCTTCTGCTTTAGCTT
+TGGTTTCTGCTTCGGCATTTTGCTTTGCTAATAAATCATTGTATTGTTGTCTTCTTTGAA
+GGAGTTCTTTTTGGACATTCTCATCAAGAAACTTGGTAACGGTTAAGTTTTGAATTTCAT
+TAATTGCCTTTTGATAATCCTTTGAATTAGCGTACTGGTCAATTTTTGTCATCTCATCTT
+GAGTATACATTTTCTTACTTTCAGCTTCTTTTGATTGTGCATCTTTATAACGTTTTGTAT
+CTTGTGCTGAAACATAACTAAATGACCTATAAGCATCTAAATAATTCTTATCATCAAATT
+GTTTTAATCCTAAATTATAGTTTTGAAGCGAAAAGCTTAAATTTTTACTTAACTCCTGCT
+TATCGACAATAGCTTGATCTGTGCGATATTTTAGGGCATTACTATAAAACGTTTCAGCAT
+CGTTGAATTTTTCATTAGAGAAACTATCATTTCCCTTTCGAACATTATCATTAAAAAGTT
+TTGAGTCATAAAGTGCTTTTAGTGAGAGGGGGACTATACAAACGACAAGAATAATGACTA
+TAAGAAGAATTGTTTTTCTTTTTTCGGTATTAGATTTTATTAATATTTCTTTTATGGGAT
+TCTCCATTTTCAAATACCTCCCAAAATCTATTTATACCAAAAGTATATACCCGTCCTCGG
+ACATTTTTTTGGTGAATCATGTCTATAGGATTTGTCTTATTACGTAGTATTTGAGAAATT
+AATAGAACATTCTGAAGTTTAGCAGGAAAATATCTATCTATGTTGAAAATGGAAGCGAGA
+AAGAGGTGAATAAGGTGATTGAAATCAAGCCAACTCAAAAACAAGTATTGAAAGTTTTAT
+TGGAAAATAAGAATACTTGGCTTACTGATATTCAGATAAGAGATAAATCAGGGTTGAATT
+ATTCCCATGTAAAAACTGCCTTGAAGAAGTTTATGGACAACGATTATGTTTTCTTTGATG
+GAAATAAGAGCTTTCAAATTTCACCTGATGGGGAAAGTGCTTATTTAAGTTAATTATAAA
+AAATGGAGGGATATTTTATGACAACTACAAAAGAAGAAGTGATAAAGATTTTGTCTCAAA
+CATATGACGAATGTAAGAAACAAAATTACAGCTATTTTATGAGAGAAAAAATACCTAACT
+TAAACGAATTAATGTTTAAATTGAGATACCTTGAAGATGAAAAACTTATAAAATATTTAG
+ATGCCGATGATGGATTGCCTTATGGAATGTTTAAATTTAGGATAACTTCTAAAGGTATTG
+ATTTCTATGAAAATGAAATAAAAAAAGTAACCGAATAATTAATATTCATCTAATCCCCTA
+ATTTATGGGGATTTTTTATATCCAAAATTAAAGGAGGAAATCAACCATGACAAATTCAGA
+CCGCTTAATCATGGAAATCAAAGGCATAGACCTTACACCAGATGAATTAAATATATACCT
+TGAAGAAAATTTACTTGTTGGTACAACTGAATATATTCCAACTTCAAAAACAAATAAGCG
+CAATATCTTAAAGGCAGCATTATCAATTCTTGAATCGGTTGCCAATCAACCTGATTTGAT
+GAAAAATTATAAACAGGATGATATTTCAATTTATCAATTCCATGAGAATCTTGAAAAGAG
+AATAGATGCACTCACATATAAAATCAGACAAATACCTGATGATACTCAAACTTATGCTGA
+TGGGGCTTCATTTTTTTATATGTTTGCTGATTAAGAGAGGGGATAAATGAATGGTGAAAT
+TATTTGATCCTGATGCTTCAAGCTTTAATTATATGCTTGAGCAAATGGGTAAAGATTTAA
+CTTTGAATGATACCACGCAAATTAGAGCCATATTGTCCTCCATCCCTGTCAATGCAAATA
+ATCATGATGATAAATATATATCCACCTTATCCCCTCTAAAACAAGGCGATAAGGTGGATT
+ATTTATTGTCTAAATGGCTTGTAGTTTCTCAGGTTAATGGTCAGAGGATAGTAAAATATA
+AGGCGATTATGCGAAAATGTAACTATAATGTGAATTTTAATTTTGATGGTTACGTGAAAA
+ATTTCCCTACTTTTATTGAGGGTAAAATTTTTGATGTTCAAAGTGGTCAATATATTATGT
+TACCTGTAGGTAAAATCCTTGTCACATTGCAGGAGAATCCTGATACATTAGCCATCGTGA
+TTAATCAACGTTTTATTTCTATGAATTCCCCTTGGAAGATTACAGGCATTGATAGGACAG
+TAAAAGGTTTAATTACTTTATCCTGTGATTTAGATTTATGGGGAGCAAACGATGATAAAA
+TCAATGAAATTGCTGATGTAGTTACTTATACAGTTGCATTTACTGATGTTTCACCTGTTT
+CAGTTGATATTGGCTCAACTTATCAGACAAATATTTCAATGGCAAAAGATGGAGCGAGTG
+TAACCTTCCCTGTAACATATAGTTCTGATAATGGCAATGTATCTGTTGATGCTAATGGTT
+TACTAACCGCATATACTGAGGGTACGTCAATTATCACAGTCACAAAATCAGATAATCCTT
+ATGTAAGTGCAACTTTAGAAGTGACAGCAAAGGTAAATCATGTTCCTGTTGTTGTTGACC
+AAATATTACCTAATGTTACTTCTTTACTTCAAACTACGTCTCAGGATTACACGGTTTACC
+AATACGTTGATTCTGTCGCGAATTCCGACACCTTTACTATAACTGCTTCAGGCCCAACAA
+CCACTTATTACACTTTGACAGTTTCAGATGGAAATCATTTTACTGTGTACAATAAGCAAT
+ATATCGCAACAAAATTGGTTATTACCTGCACGAATAATAGAGATGCTTCGCAGGTTCAAA
+TATCCATAGATTTAAGGGGATTGTGGTAATGGAAAAGGGATGTACTTTAATTACATCCCT
+TAAATTTAATTACTTGTAGTTACCTTCAATATAACAAAACGCATAGTTTTGACTGTTATC
+ATCATCATAAACAAACCATTCTTCTGTCAAATCATTGAACATGAGAGGGTATTCTTTACC
+TGCTGTCAGACAGAAATTGCTTACTGACGGAATCCAAACCTTTGCATTATTGATTCTAAT
+TTCATCTTCAAGAAAATGAGGAAAATTAATTATATTAGCCATGATTTAATCACTCCTTGC
+AAATCTTTACCCTTTTCAGTATGCCAATCACAACCTAAAAAGGCAATATTTAGTTTTAGA
+ATGGAATTACATTAGGGGCATTTCAGTATTTGCATGGTCAGCAAACACCCCCTTGTAATT
+CCATTTTGTCTAAGGGGTTATATTTTTCAAATTCCTCTAATTTATCATCCGTTGACCAAT
+ATAAATACTTTTCAACTGTTTCAATCGTTCTATGTCCTAATTGTTCCCTGAGCGATGCGG
+TAGACCCACCATTTTTGAGGTAATTGATGGCATATGTGTGCCTATACGTGTGAGGTGATA
+CTCTGATTCTAGGGTCAATATTGGCTTGTACTCCATATTCCCTGAAATTTTCCTGAATGG
+TATTGTCGGCAAGTTTTCCACCATCCTGATTTTGAAACAATATATCAAAAGGTTTGGCAT
+TGGGAAGGCATAGGCGAATGAAACGTTGTAATTCAGGTTTAATTTTCTTAGCCATTCCTA
+CAATTCTTGGAGTTCTGTTTTTACTTTCTCGAATGAGAATTCTATTATTCTTAAAATCAA
+TATCAGAAATAGTTAAATTAAGACATTCACTAATTCTCATTCCAGTGGATAAAAGCATAA
+GCATCATGCAATAATCCCTATATCCTGCATGTCTGGACTTATCTGGTTGTTTTAACAGGT
+TTTTAATATCTTCATTTGAAAAAGGGATAATAGGTTTTTGGTCAATTTTGCCCTTTTTAA
+TTTTTGCCATTGGATGATCTTGAATGATTTCTTGCTCAATAAGGTAATTGAAAAAAGGGC
+GAATAGATGCAATTGCTGAATTAATAGTTGCTTGAGTATTGTTTTTAGTTTTACGCATGA
+AATTAAGGAAATCCTTTATATCCCTTTCAGTAATTTCATCAACTAATAATGAGTGTTCAT
+TTTCTTCCAGATACTTCTTTAAATACCCTAAATAAAAGCGATAACCTTCAATAGAACCTT
+GAGTTAGATTTCTTTCCTCACAATGAATTAAGTAATCATCAAATTGAATTGAGTAATCGG
+TAGGTGCTACTATTTTTCTTGATTTTCTTTTGACAGGGGAAATAACTGCTGATTTTCTAG
+CCAT
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_018515.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,888 @@
+>NC_018515.1|provirus_3418112_3436097
+CTATATGAGACATCCTCTGATGGGCCTCGCTGCTGTATACACCAGTGTTCTTTGGACAGC
+ATCAATATCCATCCCGGTAATTTCTCCGTCTTTCACGGCAACTTTATAGGTGCAAATGGA
+GGGATGACGTTTGGAAGTAAACTCCATGTCTTCCCGCCGCTCAAAGATCACCTTCACCGG
+CTTGTTGGCCTTTTTGGCTGCAACTGCGGTTTGACAAGCAAGAATGGAAGGGAAGGCTTC
+CTTACCGCCAAGGTCCCCGCCGGTGACATCCTGGATAACCTGAACGTCCTTCTTCTCATA
+ACCCAGAGCCTTAGCCACTGCACCATGGACATAATAGGGACACTGCAAATCACTCAAGCC
+TTCAACGGTGAGAATCCGTTTTCCTACGAACTTCGATACTTTCTGCACGCAAGCCTTAAG
+CGCTTTGCCATCCACTAAAACCATACATGTCCCGCAGGCCCCTTCACTGCAGCCATCTTT
+TACCGAAGCAATCCGCAAATCGTCTCTTAAAAAGAGTAATAAACGTTTGTCACTCATAGC
+AAAGACATCTTCACCATTGATATTTAAGGTAAACATAAATAACCTCCTGTCTTATAATGA
+TTCAACAGCTGGTGTTATGAATCATTATAAGTAGGAGGTTATACTACATCAAATTCTTTC
+TCAAAAGCACTTGCTTTATTTGTTTGTATTCCACTGATATCAAGGCAAATTTAGCTCTGC
+CAGCCTTCATCAGTATTCACTGGATTACTCTTACCGTAGCAAGATCAGGCTTGCTGAACG
+CTTGAGATCACCATAATAAAGTACAAAGCAAACTTAGCATAAGCACTAACTGCATCTCCC
+TTTTCAAGCTTAACAAACCCCTCACATTCATACCTGTTTCGGCTTTTGATTCTCGTCAGA
+ATTTTTTATCCCTAATAAGTAATTCTTTGCACTAGCATAAAATATTTTAGCCATATCCGA
+AAACATTGTATAAGTAATAAACAGCCGCGCAGTCCTGGGCAGTAACCGGTAACCATAATC
+AACTACAAAGGAAAACTTTTCATCCCCGTTTTTGAGCACCAGACACTCTGCTTCCTTCTC
+AGCTCGGAGCATAAGCGAGAGAATGATCTGTGCAGCCTCAGCCTTCCCTTGAGTTACCAA
+GAAGGTGATAAAGCCTATAACGAATAGGATTATCCCCCAGTAATTCTGGAGATACGCTAA
+AATAACATCCACCTCTGTTTTCCTCCCTTTCAAATACAGCTGTAGATAAACTTAAACCTT
+TTTGCCCATACCCAATCCCCGGAACTGACCAATGCCCCTTCAGATTTTCTCAGTTATTGT
+TTTGTGTCATGGTATACTCAAAAACATTAACGCTGTCAGTGTTGCGCTGTACGGCTCCTT
+TTTGAGCTTGACCTGCCTCAACTGCCTTTTTTACTTCGGCGATTGCAGCATCTTGATAAC
+TTAATGCCATGGTCTGCTTGTCATTTAGAATGACACGATACATAACGGTAGGTACTGGAT
+TTAGAGCAGTATCTTTAACCGATTCTGTATAAGGGATACCAACAGCACGGCTGAAGCCCC
+TGCAGATTGCCGAAGACACCGACTCATCAAACCGGTCTTGTTTCATGAGTGCCTCTTCAG
+CGGGATTTGAGATAAAACCGATCTCCACCAAGACCGCGGGGCAATCCGTTTCCCTGAGCA
+CGTGGAGATTATTAAACTTAATCCCCCGATTAGTGAGGCCAGTTGCAGCGACTAACTCCT
+TCTGGATCTCCTTAGCTATCTTTTCTCCCTTCCCGCCAGCTCCTAAGGCTATCGTTTCAA
+TTCCGTGGGCATTGGGATCTGTGAAGGAGTTGGCGTGGATTGATAAAAAGTAGTGTGGCT
+TATAGTCGTTCGCTTGGTTTGTCACATCCCATAGATCTCCGTCTTGAATTGCAAGGATCT
+CCCAGCCGTTCTTTTTCAACTTCGTGACGACTAATTCTCCAACTTCTTTATTTTGCATGG
+CCTCCTGATAACCTGTTGGCCCAATGGCTCCAGGATCATAACCAATGTCTTTAGGGCCGT
+GGCCGTAGTTTATGACTGCTTTCACTTAACCAGCTCCTTCGAATAAAAAGCTCATTTAAT
+AATTGCGATTACGGCAATCGCTGTACTAATAAAGGCCCCGACGACTGTGCGCCAGAGCCA
+TGTATTGTTTGCTTCGAGTTTGTCGATACGGTGAGAGTTTGATTTTGACCTAGCTTCCGT
+TTCTGTAGCCTTGTTTTCGATGCAGTCTACCTTTTCTCTCAATCCGTTTTGGGTATCTAG
+TTTTGTCTCCACTCTCACGAGGCGTTCTCTTATGTCTATTAGTACTTCTTGATCGACCAT
+ATTGCCACTGTCCTTTCTAGAGACATAAAAATAACACCCCGTATTTAGGCGTTTTCTGCG
+CATAATGGGTCAACTGCGTATTAAGCTGTTTGCCGTTGTGATGATAATAATGTAGATAAC
+TCTTGATATTCATCTGTAGTAAGTCGTTCTCCTGCGTAAAAGACATCTAGCATTTCATGC
+ATTTGTTCAAACGAGATGAATTGTTTTTTTTCAATTTTCGATTTGCAAAGTGTATAAGTT
+AATGTATGCATGTAAAACTCCTCCTTATAATCCTAGTTCCATCATAATTAATCTATAATC
+GAGGTTTAGTACATAATCCCTTAAAATTTCGTTTTCGGTTGGTTGCGGTTCGGGTTCTGG
+TGGTATATCTGTTAATTCAAGAATTATTAACTCTTCGTTCTTTATTTCGTAGTAAGCTTG
+TTTACTACCTATAGCGTCGTACGTATCTTGGGATATTTCGTATAGAATCTCGTTTTCTTT
+CACTCGAACTATAGCACCTTCTGCTACAGCTGCGCAATTAGTAACTACGCTTTCTTTTTT
+AGATACAACGGCATAGTAACGCAAGTTTAGCCCTCCCTTTATTGTAGTGCGTACACTTCG
+TTTGTTTTGTAATCAAGTGTTGCGTTGGCGTACATATACGTAGGACTTGAAGTGTTGCCG
+TTGTAGACGTCAATTCTTATTGAATAAGAAGCACCTACAGCTATATCTGTTAAGTCAATA
+TCCGCGCTCAAGTCACGACCAGACGCGTAGTAAACCTTTTGGACTCCGTTTAAATAAAAA
+CGCGTCCCATAGCCAGCCGCTTGCGCTGTATTCGAGGTAGCGTTAAATCTCAGTGACTCC
+ATATTGATAGTCAGTGTGTCGTGGCCCTTTAATCGGGTAAGGCTGACTGATTTCAAAGTA
+CCCCATGTGTTTTGCGCTACTACAGCTTCGTTCCACGCCATAACTATGTGCGAAAGAACG
+TACCTAGTGTCTGACGTAGTAGCCACCGACAAAGACGTAGCTTTAGTTATGGCGGTCTGT
+ACAGCTGCTGCTAGGTCGGTTGTTGGAATACCTAGAGCTGGCTTCGAATATTTAGAATTC
+CACAGCGTTTGCTTTTCGGCAGTAACATGTTTCGCCACATCCGCCAAATGCGCAGCAAAA
+TCCACCTGCCCAACCCTGCTCGTATCAACAGGATGAACATGATCTGCTCTGGCATATCTC
+TTCGAAGCCCCTACTCCCGCTGTCCCATTCATGGTCGGTGCAGTTGTCCCGGCCTGGCCG
+AGCACAAAAGCGGTTGTAGCAACCTGTGTCGTACTCGTATCAACCGCGGCAGTTGTTGCT
+GTAGGCGTTCCCTCAAGTGCGGGCGACACCAACGGTGCCTTGGTACCGATGAGTGTTGCC
+GTCGTGGCCGCATAATTGGGGTCACTCCCTAAGGCATTAGCTAGTTCCTTTAATGTGTCC
+AGGGCAGCAGGAGCGGAATTAACCAAACCAGCAACTTTGGTATCTGTATAAGCCTTTGCA
+TTAGCCTCCGCTGTATTCGCTTTCGCCTGTGCCCCAGCCGTAGTTTCCTTTGCCGCCACT
+GCTGTATCCAACAGATCCGCATTATCATTAAAGTCTTGGATATTGACAACATCTGTACCT
+TCGGGCTTTTTTAACCCTAAATTCGCCGTCGTTTGCATAGCTTATCTCCTTTACTCATAC
+ACTCTCAGTTCATTCCAAGTCATCAGGTTCACGCTATTCCAAGTGAGATATTTCAAAGAA
+TCCCACCAAGTATAGGAATACTTAAAACTGTAATCTAAATGGGACGGCTTAATTTGTTCC
+AGCATCTGAATAAACCCTGGCATGTTAGACGGGATACCTTTTACCCCAATAAACCGTACC
+TCAAAGCGATATTCTGCCGGATACTCGATGACATCCACCTCCCCGCCCGAAAAGGCGGAT
+GCAGTATCCAAGATCATATGCTTGGTGGTTGTGCCAGAGCCGCGAATTTTTGCTTTTATA
+GACTCTCTTCTCCGCTCGATAGGCTTATTAGCCTCTGTCGTTAAACCTAACTCGCTTTCC
+CAGCAATCCAATCTCCATGTGGCAGTATCCACAAAACATTGACTCAGCATATCGTCAATG
+GCATATAAAAAAAGACCCATCTCATCCGATGCAGTCTCTTGGAGTTTTTTCATTTCTCGA
+ATGCTCTGATAATACTCAGGCAAATATCTCATGAGGTCAGGAATCGTGTATTCAGTCAGA
+TTACCGTCACTGCCCTCTGTGCCAAAAGTGGTTGTGCCATAAAGTTGATTTCCATATCCC
+ACTAGACTTACACCCCCTTTAATTGGTCCCAGGTTACTGCGCCCTTGGGCATAGCGTTCG
+CGACGATCGCTTGGGCCACTCTTTGGGCAGTCCATAATCTGGTGGATGTCGCAACACCTG
+CTTCTGCTTCTGCTTGAGATACCGTGCTCCAAGTGCTTGTATGAGCCAGTGTTCTGGTTG
+ACCCATTGATGCGGGTAATGATTCCCGTAGTCGTTGTCCATACGTCTCCATTAACAGGGC
+TCGTTGGTGTTACACCATGGGGAAGGTTAAGGGAAGCCGTGGAGTCTGTCGAGGCAGGAA
+GATTAATCTTTCCCTCAAAAGTATCCCCAGCTTTATTTGCCGGAATATAAGCCAGGGCAT
+CTTGTTTCGAGTTCCATGTAGACTTCTCTGCATCTGTAACAAGTCTATTGCTAGAATCCT
+GAGTAATTGCAGAAGGACTATGCGTATGTGCGCTTGGCGCAAAGGTGCTTGGTTTCTCGG
+TCACACCAGACCATGGCACACTTTCTGCTGCCTCAGCCGCATCGACTTTACCGTCATTAT
+CAGTGTCATAAATACTTTTTAGCATATCTCCAACTGTTTGCGCCGCGACAAGCAACTCAT
+TGCCGCTATCCGTTCCAATATAAAGTTTTTTGGTATCCGTACAAAAACCTAACTCACCTA
+TAGCCAGCGTTCCGATACTGGCTTCAAGACCACGCCTAATTTGGATCATTACTTTCCTTG
+GCATATCATCTCCTCCCTAAAAGGTTCCTCCATCCACGACAGATACCATCAGCCTGTTTC
+CGTTGCCAGCATCATAGACAATACTGCTGGTATCAATGTTGGCTTCTATACCAGTGCTGT
+TGACGAGAATTCCTTTCCCTGCTTTAGCACTCACTGTGGTTGTTCCTACCGCGATCCCGT
+TTCCCGCCCCAACTGTTATGCTGACCGTGTCTGCCTGACCGCCTCCAGTTAGACCATTAC
+CGGCGGTGATAGTTTGCAGAGCCCCGCCAGTTCTTACCCAAGCGGTTCCGTTCCAGGAAT
+ACACTTTTTGCTCATCATCGACATAACATGTCCAACCTGTCTGGGGTGTGTAAAAAAGCC
+AAGATGCACCATTCCACTCAGCAATTTTTGTAGCCTGGCTGACCCATGCCCCAGTGGCAC
+TGGCGGGAATAATATATCGGTCTCCCGTCGTTGGCGACCCAGGGGGAGCGGTAAGATTCT
+GATCCTTGACGCTTGCTTGAGGTTCGATATTATGTTTGGCTAACTCAATTTCGTTGTTTA
+TTTTTTGAGCACTCCACAAATCAGTTATCGTCGTCCCGGCGTCATTGATCAATCTGTGTT
+TAGCAGAATCGTCAATATGAGTCTTTATTTCTACTGCAGTTTTAGTGTTCGTTCCATCGG
+ACACTTTATTAACCTGACCATTTGTGAGATCTGATTTTTTGACCTTGGCATAGGTGGTTC
+CATCAGCAATGTCATCTAAGGTTCCCGTCAGATCCGTCAGTTTTTGCGCATTGACTCGCT
+CCCAGACTGCACCATCATCCAGGTAGAGATTACCCACATTAGTTCCGCTAGTAACATAAT
+AAAACCTTCCCGATACTCCTGCATTAGGCCGAGCCGCTTCTGTGCCTGATAGTACCCGAC
+CAACAAAAATATTGGCGATTCCGTCCCCGATGTAAACTTCCTTAGTATCTGTGCATAGTC
+CCATTTCCCCCGTTAACAAGGCACCCAAAGCGATCAACTCAGTTTTTGTACCACGACGAA
+TTCTTATTGTTTGGGCCACAAATTACACCTCCTCCAAAAATGTTCCACCATCAACGATAC
+CCTTTTTCTTATAGCTCTCTAACGCTTGTTGAGTCGCTATAAGACTTTCTTGCAGTAAAT
+TGATATCTTCTGCCTCCACCATATCCCCGAGAGTCTCATAGGTCACATACACTTTACCCA
+CACTGGCAAAGATTTTAATCATCCGCTTCCAAGGGGATTCTGATGGGATTGAAACAATAA
+AGTTTGTGATCTCTTCTCCAGCAAAACGTGACTCCGTATAAACCCTGATCGTGCTGTTCG
+TGATATTGTCATGGCCTAAAAGCCCGCTATACACCCCCTCGAAAATTGGCAGTTCTTCTT
+CAACGGCATAAGCACTGCCATCTGGCTTTCTATTGAACTTTGGCGATAACTGGTCAATCT
+GCTCAGGATAGGGCATTTTTTCATACCCCCAGTCCTACGGTTCCAAGCACCGGTATTTCT
+TCATCCCGTAAAGCAACGTTTGCATTGCCGTTATTAAGCGTTAAACTGACATAGTCAATG
+ATGCCAGGTGTGCTAAGCAGTAATGTCCCAACTTTGGCATAACTGACATAGGTACCCGTA
+AAAGCCATCTCTTGCAAATAGGCTTCCATGGATGCACTAAAAGCATCTGTCACAGCTTGG
+ATAGCATAACCTGAGGCCAACACTACTCCAGCTGAAACATTAACCCCCTTAGCGGCTGCC
+GAAACAACAGTCACTGCAGCACCAATTGGCCGGACGGTTTCAAGGTATTTCATAACCTCA
+TCCACTAAGGTTAAGGAGGCTGGCTGTTTTTCGGTATCCACTATGGCAAGCTTCACTGTT
+CCAGGTCCTGCCCATAACGGAAAGACTTTGGCATCTCCTACGCCGGGTACTTCTGTGGCC
+CACTGCCGATACTGAGCAGCATTTCCCGAGGTTGCCGGCTGCCGAACTCGCTGCAGATAT
+CGCTTTCTGAGCTCGTCATCCGACTCTGTATCTACTCCAGGAATCAAAATATCGACCAGC
+TCCGCCCTTACAAGTCCACTAATAAAGTCAATGGGCAACATAGTTCCGAAGTTCTGGTTT
+CCTCTGCTTCCTGCAATCTCACACTCCAAACTATACTGACCGGTTGAAATTCTTTCCATA
+GTCTGATAGTTAACCTTCTCTATGGAAAAGCGACTGCCCACGGCCACCTCCAAAGGTAGA
+TTATCTTTTCCAAAGAACAGGGCTTTCCGTAGTGCCTTCGTAGCAGCTTTACGAGTTACT
+CCATAATCTGCTGTCCTGTATTCCAGATAGTCTCCGCTTGAAGTCTGAGCCGAGAATAGC
+CTTAGATTGATCTCTAGCCCTGCATAGGCCTGAGCCAACTCTGCTGCAGCCGGGGATAGG
+GCATCATAAATGATGCTGCCCTCTCGTTTGTCTAGGTCTACGTCAACCCTGTCCAACATT
+CTTTTCAGTATTAACTCGTAAGTTTGTGCTTCATACACTAAACCTTCACCTCCTGAGTCA
+TATCAAAGCTCCCATAGCTGCTGATCACTGTAAATTCAATCAATAGACCATCCCCTGCAG
+CTGTGATTTGAACATTTTCAATAGAAGAAATTCGATCATCTTGAGTCAGGGCTTCTCCAA
+TCATCCGGCTTATTTCCGATTGGACAAAAATCGGATTGCTACCGATTAACTTCTCGAGCT
+CAGAACCATAGTTAGCTGTGTAAATCAAATGGTGCAAGCGTGGAGTCAGCAATATCTTAT
+AGACGGACTGCTTGACTGCCTCGATTCCGTCTAACCTGCCTACAATTCGATCTTTGGCCA
+CATCCAGCTTCCAAGTGAGTGACGGCTGCTCTATTTCTTGAATCGCATCATTGGTTAAGG
+TTCTCCCTACAGGAATCATAGCGTCACCACCTTATCTAAAATTACAAATTTTTGACCACC
+CTGAACTCGAAGCAACAGAACCATATCTCCAGCCTTGAGACCTCCGCGGATTACGATCTT
+GGTTGTTAGAGCTTTGGCACTATTTCTCGATGAACCGTCGTCAGTGTATTGGTGAGTATG
+CTCGAGATCAAGTTCAAACGAAGTCATACTTTCCGGTACCATTAAAAAATCCGCCGTAAG
+CGTGAATCGTTGATCGACCATCACACTGAGCGGATTAACTGTCATGACTTCTCCAGACAT
+CACGGTTACGGGGTTAGAGGCTCCCACTGCGTCCATTCCTGCAGTCTTTATGACATCCAG
+TAAACTTGCCATTATATCACCTTCATAATTGCTTTAAGTTCTAGGCTCATTTTATGATCT
+GCTCCGTCAAAACTATGGGTACATTCATCCACCAGAAAAGGCTGATTGATTCCGTACTCT
+TGAATCTGGATTCGAACATAGCTTCCTGCCCTTACCCGAAGATCGCCGATGGCTTCAATC
+TTCAGAGTCTTTGACTCTCGGTTTTTCAATGTGGCCAGCGTATCAAGAAGCTCATTGATC
+TGAGCAGAGTTCATGTCTTCGTCCACACTTTGGTAGAGCTGTAGGACGCCCCACTTCGCC
+ATATTTACGCTGTCTTGGGCACAATAGACCTCACGCCTGCCGGTGTCTTTGTTGTCCTTA
+TAAAGCTTAATTTTGTTATAGGTGTCGGAGTCAATCGATAGTTTATGGACATAGTCCGTC
+ATGAGACTATTATCCCCGACGACAAAGTCCAGCAACAGATCCTCTACATTTCTAACGGAT
+AAAGAACCGAAGTCATCGAAGAAGACGTAGTTTTTTCCAGAGTTAATAAGGGTTAGATCC
+AACGCCTTGCAGATGACGTCTAGAAGCTTTTTATCGTTTTCGCTCATGGTGGGAATCCTG
+TAGCCGGTATCATCAATTTGGCCGAGCTTGAGATTGAAGTCGGCAGCGATCTTTTGAACC
+ACCTCAGACGCTGTAATGTTGGTAAACACATAAGTATCATTGGACATGAGGTAGCGTATT
+TGGTCATAGCAAGTTATCTTAACTGCCTCATCCCTTCCCCCATCAATGGAAAAAATATAG
+CCAAAAAAGGCCTTGGCTCCATCTTCTGCCCTTTGAACGCTGACAATATCCCCATTACTA
+TATTTAAACGTTTTGTCTTGGCCAGGGGCGTTTTTGATGAGTGTGAAGTCCAAGCTGCCT
+GCTTTACCAATCCGGCTGGTTTTCCAGCTCACATCGGCTACCAGGCTAGAAATGTCCCAC
+ACGTCGCCGTCTTTCTTATCGATTAGTATTTTCAGCATAACCAAGAACCTCCTTTTAGGG
+CAGCTTTAAAACCCTGCCGATCTGCAGTCGCTTGATCTCGGCATCAGTAATATCGTTTAT
+TCTCTGAATTTCCGGCCAACGTGCTCCGTTGCCAAGAAACTGTTTGGCAACTGCCCAAAG
+TGTATCACCAGCCACGAGTGTATAAGTTTTAGGCTGTTGTGTCTCATCCGGGCGCGCTGG
+AGCTGCTGTTGTCGCAACGCCAGCAGCGCTTGGATTTGAGCTGATCTCAACCTTCTGTGC
+GGTATAGGGTACATACATTTTCAGCTTAATGTTGTAGTCAATGTCTCCTGCCCCACCAGC
+TACTTCTTTCCAGTCGAAACTCTCAATACTGGCCAAGGTGTTGATATTGTAGCGATCAGA
+AATAAAAATAAAGCGAATAGGCTGTGCGGACTCCATCCACTTTACGATGAATCTTACGTA
+TTCAATGGGCTGCAAAAGGGTTTGTACCGTTACAAATGGATAACGCTGAGCAGGGAAAAG
+ACTGCTAAATCCATATTGGCTGAGCTTGAGATTCTTGATCACATTGATTTCTCTTAAACC
+AACAATGTCATAAGTCTTGCTGCTTATGGCTTCGCTGATTTCAAGGGACCCCGGCATAAC
+AGGTAGTTGAAAGATTTCAGCCTTGTCATTAAAGCTCAATTCTATTCCATACGGCATTAC
+GCATACACCCCCTGAGCAGATGAGGAAATTTCGCTCTCCAGCATCGTCTTAATCTTTACT
+ATAATTGAATCTACACTCTGCCCGTTGTGAATATCCCCTGTTGTCACGGCCACCGTCGGA
+GTAAGGGTCACAAAGTTTTGAATGTTCTTCATTTCAGCCAGTTCACGCATAGTCTTTAGG
+TCTTCGCTGGAGATGTCCACGGTGTTGTTTATTTTACCGACTTCGTTGACGCGGTCGATG
+GCGGGAATACTGCCTGCTCCTCCGTTCCAGCTATTCAAGATTTTTTGTTGATCCAAAGTC
+GAAGTATCCGCCTTTCCCAAATCAGCTAGACCAAATTTCTTCTTAATATCATCGAGGCTG
+ATATTTTCAATAAAATCTTGTCCGGCTTTTTTAAATTGGGAGAAGTCAGCCTGAAATTCG
+ATTTCCTGTATCTGTTTAGCATCTATGCCTAGAAGGTCACCGAAAAATCCAGCCACTTTG
+TTAATCGCATTGATAGCATTGTTGATACTTCCAAGGATAAAGTTTATTGCGCTCTGAACA
+ACATCCACAACGAACCCAAAAGCTGAGCTAAATACATTCCTAATGCCGTTTGTGACTATA
+GCGAAGGTCCCTAATGCTGTGATTAACCCTACGATTAAAGCTATAACTATTCCGATAGGA
+TTCATGCTCATCACAAAATTGAACACTCTTTGCTTTAATAAGGCAAACGATATTGCTCCC
+GCTAATTGGAGAGTTACCAGGGACCAGCCAGCTGTAAGCGCTGTGATCAATGGAATTAGT
+GTCCCCGTGATAAATATAACTGCGTTATAGATTCCCCAAGCTGCTGCTATCCCTAGAATG
+AATGGAGAGAGCCCCACAAGAATGATTCCCACATTATAAGCGACATCGCCAATCATTGAT
+AACCCTTGTAGTAGAAGAGGCCAGACTCCTTCCCCGGTACTCACGAGCCACTGAAGGCCG
+GTAACGATCAAGAATAAACCTATGCTCAGACCCTCAAAAAATGGCTGAAAGCTTCCCTCC
+TGAAAGGCATCATTCAATCTAATCATGAGAGGAGTAAGGGCTTCAGTGGCTTGTTGCCCT
+GCATCAGCAAAGCTGGATTTCATATTGTTCGTTAAAATTTCCAACTGTTTTGTTGGAGAC
+TTCATCATTTGATCAAAGGCCGCTTGTCCCATATTTTGTTTTTCGAGGAGCTGATCAAAC
+GCTTTAATGAAACCATCAATGTTTCCCGACTTGCCTAGATCCTCAATTTTAAAGGCCTCC
+ATATCGAAGTCTGATATACTGAAGCGTTTAGCCAAAGAAGCGGTGTTGCCGGACATCGCT
+TCCTTAACAGCGGATGCTGCCCCTTCAATCCCATTGCCAGCATTGTCAAAAGCGTTTAGA
+CGAAATGCAAAATCATTCAGCTTGGATAGTTGGTCTACATTCTGGGTGGACGAAAGAAAT
+GTAAGACTACTCTGCAAGGCTTTATTGACATCCTGCCCGGTGGCGAGTGCCTCCCTTTTG
+AACTTATCGAACATGGCAGTCCCAATTTCTGTATTTCCGGTCCGGGCGATAAACATATCT
+TGAGTTTTTCGCTGCTCCATTGCGCCACCAATGCTTGCTTTTCCTAACTCCGTAAACATT
+TCGACAGTTGCCTGGACGCGAGAGGATGCATTAAAAAACTTCAAGATTGAATCAACTGTT
+GCCAAATCGGAAACCTCCTTTTGCGCATAATAAAAAGCACTCTGTTTCGAGTGCTTATAT
+GCTATGATAAATTTGGTAACAGAAAAGGCTTGCAGGGCGGTCGGCTTATGATTTCATTCG
+CGACATTGGTGGTGTTAATACTTTCTTTCCATAAACGGAAATAGACCGCCCCTGCCGAAA
+GGTTTGCGGTCTATCCGTCACCCTAAGCCGTCCGCCCTTTTAAGCGGCTGTTACACAAGG
+AGTCATGTTTGCAGCATGGCTTCTTGCTGTTACGATACGTAACTTCTGTCTTTAGCATAC
+CATAATTGTTGAATTTTAACACAAGCTGAAAGATAAATCAGGCAAGTTTGAGGCTTAAGA
+CTTGCCAATATCTCCGTCGTACAATCCTCTTCCTTATAAATCCTACTGATCAATTGCCCC
+TGTCAAATAGGAAAAGAAGAAGCTTAGGAACACTAGACATTATTTCTTCTTTATCTTCGC
+CCTATCTTGTCTTTCCTTTTTAATTCGAATATCAATCATGGCAAAGATAGCGGCCTTAGC
+TTCTCGTGTTTTTTGGGCCAGCTCATCGGGGGGAATATGGAGTTCGTGGAGGGCGTAGTA
+AGCGTAATTCCACTCACCCTCGCCCTCCTCAATTAGTTTTTTACCTCATCCATCAGGTCT
+TCCAGGCTTTGATCAAAACCGTTCAGTTCTTGCACCTGCTGAACAAGGGTCGCATATTCA
+CCGGGAAACAGCATCTTGCGCAGCAGCTCTTCAGCGCCTATGACGCCGTAAGATTTTTGC
+AACTCAGCATTTTTCAGATCAGGGAAGCTGACACTTGCCACGATGATTTTGGCCAGATAG
+ATGTTCTGATCTATTTCAGACTGCTGTGAACCATTTTTTCCCTTAACTTTCCGAGTGGCT
+GCTTTTCGGTACTCTTCATTTTCAGCTTCAGTTATGCTATGGATTTTCCAGGGTATTGAC
+TTGCCGTCATTGTCCTTAAACCGCTCGGATATGACAACCTCTTTGCTGAGATCAGATCCT
+GCATTTTGCGCAAAAAATGCTTGTAAATCACTCATTTTCTCTTCCTCCAGAATTTCTGAT
+TTCTATGATAACTACCACGAGGATACGACTTATCTCACAACCGGAGCATTAAACTGGTCC
+AAAAGATCAAAATCGTCAAACGTAAAGGGTAATTCTTCCTCCAAGGGGTCATCTGACGTC
+GCATCGAAGGCTGCAGCCACCACGCTGTCCAAGTTGCAATCCTTGAGGACGGAGGTCTGT
+TTGCCAACTGTAGAGGCAGGGTCCTCATTGACAATCTGCAGATCAAAGTAAAAATCTTTG
+CCCGTCTTGATATATTCCATCATCAGCGCCCTGAACATGCTCGTAAAGTAATAAATCGTC
+AGTGTTCCGGTCCCAGACCAACCGGCTGCCTTTTTGCCGACGTTGGTTTTTCCCAATATC
+GGTACATCAGCCTTCGTTTTTTCGATAGTCGCTTCCACTGTTTTGGCATAAAACAACTCT
+TCCACGCGGCCATTAATTGTGACAAAAGCCTTACCTTGCTTTCCGGATATTGCATCTTCT
+GCTTTAAGAAATGCCATAGCTTATCTCACCTGCACTTTCACATAGATTTTCTCAATAGAA
+TCTACCGGCTGAGCATATGCCTCAATATAGACACTATCTAATTCATTACCCGTTTGGACT
+GTCAAATCTGCTTGAGAGTCAAAATTCTGGACAGCATCCATGCTCTGAAGTGTTTCCATA
+TATTTGACACACTGGGTTTTTAACAGGTTTCGTCCATCAGCATTATTGGATACCTGCCCA
+ATGTAAAACTCACTGAAAAGCTGGACAAAATCGTTATTAATTCCATCGAGAACTCTGATC
+ACGCGGTTCTTGGCAAACTGCTTACCTTTTTCTAAGCTCGATGTGGTTAGAGTATTAATG
+TCCTGCTCGACGATGGCTCGGTTGTCATTGGCTGTGAAAATAAATTCCCCAGCCCGCAAC
+GCTGCAATGATCTGTGCATTGGTATACCTCGGAGCTACATCCACTGCCCCATCATAAGCC
+TGATAGGTTAGAGATTCATTCACTTGAGCACCTGCAGTTGCACCGGCTACCCAGGCAGTA
+GCTTGAGCTGCACTGAGGGTTGTGCCGTTGGCAAGAATGACTCCGTTCTTCACACTGATC
+ACGCCTTCATAATCAGCTGTTGGATAGTTTTCCAGCACGACCTGAATCTTTTTTCCTTCG
+TTATCTCGAAGACGTTGGCAAAACGCTGCGAATGTTGCTTTAAGAGTATCGTCTGTCGAA
+GGCAAGGCTATTGTGTTAAAGTCATAGATCTCGACTGCTGCCAAGTAGTCAACATAAGTC
+TGATTGGTGATCGTGCCATCTGCTCCTCCCATCAAAGGGACGCCCGCCGTTTCTGTCAAA
+GCTCCTGTGCCCGAAAATACGACCCAATCATTTTCTACCAGATCCGCGATATAGGGAACA
+GTTTGCTGATCTACTTCAGCCCCATCCACTAATGTGGTAACATCAAATTTAGTATTATCG
+TCAATGTTTTCCTGAATGACCAGAGACACATCATTCCCTCTGATACCGCCCCATTTGGCT
+GTGACCGTAAGGTTACCAGTTGTCACGGCTGCCTTTGTCCCAACATTAAGTCTGTATAAA
+AGCAGGGTTTTGGCTTGTTTCAAAGCCTCTCTAACTAAAAGCAGTTTGGCATCCCCCATC
+GGATAGCCCAGCTTGACGAAGGTATCTTCACCCGCCTCAAGGCTGATGATTTTATTAGGC
+TCACCCCATGAGAGCAAAAGCGGAAGAGAAACAATCCCTCGCTCTCCAAGTGCACCTACT
+ACCTGGGGCTCTGATTTAAAATTAACATACACTCCCGGTCGTATTTTATTTTGAGTCGTC
+CATGTACCTGCTGCCATCTTATTTAGCCTCCCTTTTTAGAAAATCCTCAAGAATCTTTTT
+GACCTGATCGTGACTGTATTTCTGTCCTTCTTCCAAGAGCGCCTCCAGCAAATCCTTGCG
+GAAATATTGCTTGGACTTCAAAATCTGCTGTTTACTATAAATCTTAGGGAGCTGCTTATC
+TCTTTTTTCAGTTTTAACCACGTAAATATCCCTCCTGTCTCATAGACCCCATTAATGGAT
+CTGGTTCAACACTTCGCTTAACATGAAAATTGTAAGCCACAAACCAATGAAGTACTCCGT
+TGACAATTTCGTGTCGCATTCCGCTGCCTCTAACGAGGCCGCCGTCCACGCTGATCAGCT
+CCAGTTTGTCATACAATTGCTCAGCCATGTCATGTAAGGCCTCATTACTCCCTGCAAAGT
+AATGAATATCGAATAAGTGATTGCGCTGATAATGCTGACCCAGCAGCTGATTTTGTGACA
+TAGGAAACAGCTTTACATAAAAATAAGGCTCTACCAAGCCTTGATCACTCTCTTCGCTGT
+ATGTGCCAATATTGGGGAAGCTCTGATCCAGAGCGGCAATAACGCCATCTAGGACACTAT
+TGACGGTGATCATCAAATCATCTCCTTGACCTCGACCGATTACGATTTTTTAGAGCAAGC
+TGATTAGCTTTGGCTCATAAATCTCGGGCGCTGTCCAATTTTTCTAATGGACATTGTTTT
+AATGAGTTCTTTAAAGTCTTTCATGATCGCTGTTCAGATAAGAGTTCTTAATGTGTCAGA
+GTATTACCCCCCTCTCTTCAATCCTTCCAAAAGGACTTGCTTAGCCCCGATTGTTAGAAC
+TATTGTCCCCAAACCTTGACTCTTCTGAAAGAACTAGCCGGAACAGAATCTCGCTCATAC
+CATCGTTACTCCTCGGTTTCTTCGCATCATCCGGTCCCAAGCCTTAAACTGGGCGGTATC
+CTCGTAGTTCTCCTTAAACTCGCCTTTATCCCCACATAGCTTCCCCGTCCATTTTAAACA
+GTTGGCACAGGTTTCTTTAAGTTTTGGTTTTGGTTTTATTGGTGAGAATAAGGGGCAGGG
+TTTGGTTCTGGTTTTCACGGCTTGCACCTCGCTTTAATGAGATAAAAATGAACGCCCCAA
+ACATCGGAGCGTTCTAGCCAGAGGAGGATTATGTTAGAGCGGGTCTCGTTCCTAACTTCT
+TTCACAATATTATTGTATCACGCTTTTTTCCAAACAAAGTGCAAACCCTCTGCCAAAAAA
+GTGCCAAACTTTCACTCCCAACTCCCCTAATCACGTTTATATATTCCTAATAAAATAGCC
+ACCTCTGACAACAGTTCATCTCTTACACGATAATAAGTCCGAAGAGGTATTTTCATCTGT
+TTTGCTACCCACCAGTCATAATTATGTTTACTAAAGTAGCGATACTCAATTATCTTCCTT
+TCGTCTTCTCCAAATCCAGCGAGGATAATATCTATCTCCCTGATACGAAGTGTACACTCA
+TTAATCTCTCGCGCTGTCTCCCAACGTTTTGAAGCAATCCCCGCTGTTTGATCGCTAGTC
+TTTGTGGATGCTGGAGTTAGGGAGTAGCTCGCTGTCGTCTTAGGTAGTTCGTTTCCCAGC
+TGAGCATTCAAAATGCAAAGCCGCTTTTTATCCTCCGGATATTGAGAAAGTCTTCTGATC
+GTTAGCAGGTACCACTCAGGCTTTTTGCTTTTTTTCTCTGCTTGATCATCCATAATATCC
+CCTTTGAGTTTTAACATTCTTACATCCTCCTCTCATAAACGTCAACAATCTTTACCTCTT
+TCGGGTTAATTTGCAGTTGTCCTATTTCATCTTGTATTTCCGTCATTCCCTTCTCTGTTG
+ATCTAGTGGTAATTGTATTGTATATCCGTCATTTGCTCAAGGCGAAAAAACCCCTACTGA
+GTTTAATTAGATAGCTCGTACTTAAATTTGCGATTACTCACTTGTATTTCCGTCACATTT
+GAAAAATTAAATTACTTGTTGTTCCGACAATTCTGCTCTATAATATAAATGTCTGATATG
+CCGAACAAATATTCAAGGAGGGAACACCGTGGGTGTGGGCGAGCGAATTAAACAATTCAG
+AAAACAAAAAGGTCTTACTCAAGTTAAACTTGCAGAAAAGGCCGGAATTTCAAGGTCCTA
+TCTAGCTGACGTGGAATCGGATCGATATAATCCAAGCTTAACCACGTTAATAGATCTTGC
+TCAAGCTTTAAATGTTACCGCGAGTTGTTTCCTGGATGACAAAGAAATAGATTTCAGTAA
+CCTTATTCAGCTATGTAAAAAAAACGGCATGTCCCTGAGCTCTCTTGGTGCGATATTGGA
+CATCTCGCCAAAGGAATTAGATCATATACGATCCAACAAGCTCCCCGTTGAAGAGACTAT
+GTCTAAAATTGCCGATCATTTCGAATGCACTTGGGATTATCTTATTGGCAAAACTGACTC
+CCCCGATGATATCGTCTTGGGTGGAAACTCCATTTCCATCCAAGATCCAATTTCAACCCC
+CCCCCAGAAAGTTGGAAGTTCGGTTGAGCCCATAAACATTCCTTCCACCATCGCGGCTCA
+TTTTGAAAATATGAATTTTACAAAGGAAGAAACTGAAGAGATCAGCAATTTCATTAAATT
+CATAGCCTCTAAAAGAAAAAAGTAGTCTTGCGCAAGGAGATGTCACATGAATTATGAGAG
+TTTAATTTTGGAGCTTGAAAAGGAAGGCGTCGAGGTAATAGAGCACAAATTCCACAGCGA
+ATCTTTGAAAGGTTTATATTTTGACAATGTGATAACACTTAATCCTTCAAGTATTATAGA
+TGAAAAGGAAAAAGCATGTATTCTAGCCGAAGAATATGGACACTATCGCACATCCTTTGG
+AAATATTCTAGATCAGAAAAACACCTCCAATATAAAGCAAGAAAAAAGAGCCAGAAATTG
+GGCCTATGAAAAATTAGTACCCTTAGAAAAACTCATCGATGCATTTGAAGCATGTATTTG
+TAACCGTTATGATTTAGCTGATTTTTTGGGAGTGACGGAAGATTTCTTAGATCTAACACT
+TGCCCACTATAAAGAGAAATTCGGCCTGTATGTGGAGTGTAGGAACTACCTTATTTATTT
+CAGTCCTCTCGGCATACTTCGCAAATTTGATAATACCGAATTCTAA
+>NC_018515.1|provirus_4659544_4694673
+TCACATCTTCCATAAAAGCCACCTGCAGGTATTAAGTTCATATTTGATCTCGAAAATTTG
+TACTTCACCTTTGATCTCGCTCTGACATTTAAAGATGAGCATACGATTGCCAGCAAGTTT
+TTCTTCGGACACGGAAACTACTTTATCAATTTTAAGTTCTTTTTCATCAAGCTTGAATCT
+TAAGGGGTGGGGTTTGCCGTTCTCAAACCAAGCTAAGACCTCGATGGGGGCTGCTAAGAG
+TTTCACTTTTCTACCCCCACTTCGTAATTGCTAATGAGTAACTCCCCGGCCTTACTACTT
+TTGTCAGTTCTGCAGACCGAATATCTTACTTCAATCGGGTTAATGTTAAACCCGGTATAC
+AGCTCTCGGATCTCCGGATGGTCATTAATACTCAGCAAGAACTTTCCTTGAATTTTTGCA
+AGGCATTCCTTAAGCCTGATATGATCTTCTTTCGTGAATGGTTTGCTCCCTTGGCTTTTG
+TAGTCAGCTAGGCCGTAATAAGGCGGATCGCAATAGAAAAACGTTGAGCTTCGATCATAA
+CTGGAAATAATTTTTTCGACATCTCTATTTTCGATGATTGTATTTACCAGTCTGTCCCTC
+ACGGATGTAATGTTATCCCTTACCCGCTCAAGAACCATTGGCGGCTTTTTCAAAGGAGTA
+ATCATGAAGTCCTTCATCAATGCTCCAAAGCTGAAATGAAGTAGGTAATAGAATCTGACT
+GCCCTATTTACATCGGATGTACCGGCGAGGCTTAATGCTTTGTATTTCTGGAAGATCTCT
+CTTGAAATAAGCAAATAATCAAAGGCCTGAATGAATTGTTCGGGCTTTTCTTTTACGACT
+CGGAAGAAGTTGACCAGTTCAGAATTTATGTCGTTATAGACCTCCACTTCGGAAGGAGGC
+TTTTCAAAGAGTACCCAGCCAGCTCCACCAAACGGTTCACAATAGCATATATGCTCCGGG
+ATCATTTTTACGATGGTCTTTCTTAATCTATATTTGCCACCCATCCATTTGATTGGACTG
+TTCATGGTTGTTCCTCCTATACTAGAACATATGTTCTATTATAGGGTATTTCAAGGAAAA
+AGAAAAGACCCCATAAGGGGCGTTTTCGAACAGGCTGGGACTTGAATTGGACAACGTTAT
+TATAAAATTGAGTATTAAATTAAAACAACAAAGTATTTATTGCAATAGTAATAAAAAGTT
+ATATTATAAGATATATACCTATAATACAATTGTAATATATTCCCACTCTTTTGGAGGTGA
+AAAAATGTTCGAATTAGAAAAGGAGATGACACCAGTAGTAACAAATAATCTAGGGATCTT
+TTCTCAAAGAATTGCAAATCACGAGAATCTAGCTTTAACCTATGAATTACCAGTGAAATA
+TCGTCTTATTGATATGGCAATTGCCTACGCTCTTCCCGATGGGTATTTCAATAATGTAGA
+ATCATATAGCCCATTAAAATATATCAACAATATCCTTATGGAAATACTATCTATATTTTA
+CTTGTACCCTCAAGTTACAATAAAACGTCTCCAGAAAGAGCTCTTCATGAACCCGGATGA
+ATTAGAAAAACTTTTATATAAGCTTATTAAGCATAAATTAATCAAACAAGTATCACGAAT
+GTCATATCAAATTAATGATTTGGTTAAAATAGACAGTCTTGGTATGATATCTATAGAACT
+TAAGTTGTGTAATTGGAGAGAAGCTTTAGGACAAGCAGAATATAACCTTATGTTCTCTGA
+TTACTCATATGTTGCCCTCGACAAAGCTAGAATTCCTAATAATGGAGTAGATTTGATTCC
+ATTTTTTAATAGTAGAAATATTGGCTTATTATCCGTTTCAGATGATGGTAATATTGAACT
+ACTTTTTAATCCTAAGAAAAACCGGAAAATTGATAAACGTTTATACACAATGCAACGTTT
+GAAAATACTGCAAAGTATTATCTCAAGTCAAAAATGGTACTTGTATTCGAAAATAGGAGA
+ACCTAAGTAAATTACTGTAGGTTCTCCTATTTTATTTATAGGTATTCATCCACAAAATTA
+TCCAAAACTTCTCGCCAAACACTTATATGATTTCCATTTTCACTTAAGGGATTTCCTTTC
+AGCCTGCCCTTCATATATTCCATTTTTGCCTCTGCATCCTGAAGCCATGTTTGAAGATAC
+CCTATTCTATCCCCTATAGAAGGTATTTCCCGAATATGCTCTGCTTGTTGAATTAAACTA
+ATTACTCTGTGCTTACTAGCCGCACTTGTATTACTACGGCTTTCTGTCCAAGATGGTGGA
+ACCACAATTTTTTTGCCTTTTACTCCTAGTGATTGAAGTAGTGGATCACTATGAATAGTT
+ATAATATCTGACTTAAGGTACCTTAATAATTTTAAATTAACAATTTTCTTAAGATCTCTT
+TCTGAATAAAAATCCCCGATTAGACTTGTTGAATAATACTTCGGTAATGACATGCCTCCA
+TCTTTATCTACGAAGTCATTCAAACATAATCTTCGCTCTTTAGTTGAATATCCACTTCCA
+AATGCTGTTGCACCGACAGCCAAGCACAATAAACCGAATGCATCTGCAAAATTTATAATT
+ACTTTTTTATCTTCCACGTACCCTAAATTATATGAGAGTTCTAATAGCACCCTCGCAATA
+TTGGCCTCAACAATCTGGAGCGAAGAAGTACTCTGCTCTACAACAATATAGTACCCATCT
+ATTTCTGATAAAACAGACGCATTGTCTAATAATGTTTGAACCATTTGATTATCATTAATA
+TCACAATCAAGTAAAGCCTTATCGGATATTGCAATTGTTGCAAGGAATGGCTTACTGTAA
+TTACCTTTCAGCTTACTTGCTGCCTTTAGCCATTTAAGTTGTTCACTGAACTGATCTTCG
+CGATTAACAACAAGTGGTGTGGGAATAATTAGATCTGTAACTCCAACTAGTTCTTGAAGA
+GCAAAGCAGGACTTTATACATTCTTGAATTTCTAATTCGGAAGAATACGATGATAGACTA
+ACACTTAAATCCCTTGAAGAAATAATATTAATCTTTCCAGATATACTCTTGGTCGTTCTT
+ACTTTTGGCTTTGAACTCTTCGTTTTTTCATACCAAGGATAAGAACAAAGATTTGAAAAT
+GTTTTCTTACATCTATCCTTATCGATACCATGAAGGTAATATTGAGGATCAAGCAGTACA
+GTAGATAAATCATACGCTTGCCTCTTACATAGCTTGTCGCTATTAATTGAAGAGCTGGCC
+ATTATAACCCCCTGAGGGTCTACCCCATCTATTGTACCGAAATGACCTCGATTATATAAA
+AACAATGTCACTCAACTCCTAAAATATCAAATATTTCCGTCCAACCTTTTGGTCGCTTAA
+AAGCACGAAGTTCTGTTAATTTATAAATAACCTTTTCAAGAGTATTAATAATATTTACTT
+CTTGCGGAAACTTCGGTATAGGGGTATTCAACATAATATCCTGCCTGAAATTATAGGGAT
+GATACCCAGCCAAGCATTGATATGCAACAATCCCAAGTGCGTACAGATCAGCCCGAAGAG
+TAAGATTCTTTCTCCCAAGAAACTGTTCCGGAGCAAGATACCCTTTTGTCCCAAAAATAA
+TTCCGTATTCAGTTAGTGATTCAGCATCGGCATCAAGATGTTTTGCAAGCCCGAGATCAA
+TCAATATAAAGTCTCCATTAGTATCGAGAATAATATTTTCAGGTTTAATATCACAATGAA
+CCACATCTACCGCCCATAATGCCTCAATCGCTAGAGAAATACAATGAATCAATCTTATAG
+TTTCCTGTTCAGATAACTTTTTTCCCGATTCCAATAGTGCTTGGAGATTATCGCCACTAA
+TAAAGTTTGTGATTATATAATAGCAATCTAAACCCCTTATTACCTTTTTTCCACTTCCGT
+ATAAAGTTACGAGGTAAGGAGAATCAATTTCTTTCAATTTAGCAATTTCAAGTTCAGTTC
+TACGATGCTGATGATCAGGACCATAAATTTTCAACAAAATTTCGCGTTGTGAGTTATTAT
+CAATTGCTTTAAAGACAGCTCCTTCTGCCCCTGGCTTAAGACTATCAACAGATTTAAGGT
+TAGGAAATAATGATATAACTTCAGCCTCTAATAAAGGCGGCAAAAAAGGCGAAATCATTT
+TAGGCCTCCTTAAAATTTTAATAAGTTTATAATAGTTCAATAATTTACAATATACTATTA
+TGGCATAAAGTTAATGACGAATTCCCACGAAATTAGTCTTATAAATTAAAAAAAGCCCTC
+TCGCTTTGAAGAGGGCTTTTGTCATAATAATTATACAGATTGTTGTACTGGTTTTAACTC
+CAGATTAAGCACCTGCGATGGTGTTTCCGATATAGATAGCACAGGATCTGGCTTCTGCCC
+TTGTTGCTTCATCACAAAGACAGCCGCCTCAGCCGTACTACGAATAACTTGTTTTAGATC
+CGGAGTAATCTCGCGGCCAGTAAGTTTAATCATATTCATAGCATATTCGGTGGCCTGATC
+TTTTCTCAGTTCCGGAGGTAATTGCCCACTATTATAAAGTTGCTGCGCCGAATGTACCCC
+AGTTTGTGTAACCTTGAGGATCGTATCAATAACGTTATCTACCGGATCAGGAATAATTGG
+TTCTAATACTGCATGTACAGATTCAACGGTATCCACGACAGCACCTGCAACCTGCAGCTG
+CTTCCCTGTATCCCTGCCCTGTTTGACTAACGTCTGGATACCGTACATCGTCCCAAAGAA
+ACACATCAATGATAAACCAGCAATTAATAATGTAATCGTTTGAACACTCATCTTATTTCC
+TCCTTTTTAAGTAAATTGGCAAGCGCTTGGGAATATTAAGCTCCAGTAGCGCTGACTGCA
+GCTGCAGTATCTCCCCAGGTCTTTCCGGAGAGAATCGTTTCGTTTGGATGGCCAACGGAT
+CCCCCGCCAACGATAGTTAAATGCTCTGCCTTATAAATGTCTGCCGGGGGAGTTTTATCA
+TCAAACCTGAGAAACACTGCACAGTTTCCAAGCTTAATTGACTCTCTTCGCGCCGGTACC
+AGGTAATCCTCAATTCCATGAGCTAAGACCGCCTCTTTCATCTCATAGACCTCCTTTTTA
+ATAACATTCGCGCTGACACTTACGCCAAAATGATCACCAATCCCCTGAGCGATGGCCAGA
+GCAGCCTGATCTATTTTGGCTAAGATCACGCTTTCCTCAGAATTAATAAAACCGTACTCA
+ATGAGCACGGCCGGCATATCTGTCCACTTTAATACATACCAATTTGCATATTTAACTCCG
+CGGTCAACCATTCCCAGTAAAGCCATTCTCGCCCGGATAGCCTTGGCCATCTTCTCTCCT
+TCACCACCGGCTGCTAAAGCATAGACTTCGTTCCCGTAAGCTTTCACAGCTGCCGAGTTA
+TTATGGAAGGAATAGAATGCATCGCCGCCCAAGGCATTTGCCACTTTTACCCGATTCTTT
+AAGTCGAGATCATCATTGTATGGTGCTGGCTCACAGAAGTCTTTATCTGTAGCCCTAGTG
+AACTTTACTTGGAAGCGGCCGGTTGCTTCGAGGATCGCCGCCGTTTTCTTGGCCAGCATT
+AAGACGTTATCCTTTTCCTTGGTCGTTGGGCCTACTGCTCCCGGATCCGGGCCGCCGTGG
+CCCGGGTCGAAGACCAGGTCATATATTTTCAATTCAGCCAAATTACTCACCTCACTTTCC
+AAATATGCTAGCTAAAAACTCAGGGTTGACGTTCTGTCCAATGGCTGCAAGCGTGATAAT
+AATGGCTATAATTACAAAACCCTTGATGATCCATTGTCCCCCTGGGGTTTGCCAAAAACC
+TGCTTCTTTTGATGACTCTTCGTGTAATGTTTCTAAGGTTGAAATCCGCTTTTCCATCGT
+TTCTAATGTCTTAGAGGTTGTCTCTAACAGCTGAGTAAGCTGAGTGATAATGATCTTTAA
+ATCTGTTATTGTCTCACTGTGCGCGTTTAATCTGCGTTCAGCTACCTCAAGTTGCTTATC
+TAAGCCTTTATGAGTTCGTTCACAGGATTGCTCGGTGACTAAGTTTTCCCCCACCATAGC
+CCCACCCCTTCTTTGATTATTGCTACCAACAACAAGCTCCCAATACCGTTAACTTGGCCT
+TGGGAACTTATTGTGCGCTTTATGATTTATTGGTGTCCTTAAACTTAGCCAAAATGTTGC
+ATGCAGTATCACAAGTTCCAACTGCACAGATTCCAATTAGTAACCCTTTCGCAAAACACT
+CTAATATTGAGGCACACTGCAGCAGGCCAAAGCTGCTGAGGATACCTAAAGGAATTGCGA
+GCAAGTGTGCGATTCTTCTACTTAAGCCTAACTTCTCGAGAGACTCTACAATTGCGTAGA
+CAAATCCGATCAATATTATCAGTTCAGCTGCCATAGATTACCACTCCTTCACAAACCAAT
+AAGGCTTGTTCTCCTTCTATGGCATAGTATGTTGATGATTCGGAATCCGTGAAAACACTC
+TAATTAAGCCCTTCTTCGAGATATAAAGCAGCATTAGTATCTTCTAGGCAATAAAAATAA
+CGCCCCAAGGCATTTAACTTCTCTGGAATCTTCACTATGCATTAGCCCAGTATGGCTATC
+TCCCTCGTAGCTACTTCCATCTCTACCTCGGTTCTCAATGTTGTGTTTGTTCCGTTTAAA
+AGTTCCCATTCGGTATTGGGTACGTCTTCGATGGTCATTCTCTTACCCATTACTAACGTC
+GCATAGGCGTTTACGAGTCTTTTTTGAACTGCTGTCATATTAATCCTACCTCCATCAAAA
+TATTTATAATCAATATCTCTGTCTCAGCTTTTGCAATTTCATCTCTGGACGGGATAAGGC
+TATCCAGTAATTCTTGCTCCTCATGTATTGCCTCCACCTGTGCCGAAGCCTCCTTCATTT
+CAGCCTGTGAAGGCAATTGGAGGTCATGGTTAAGCATAGTCACAGTTGTGATGTCGTTGG
+TGGTAATTACGATGAAGTCAACATTATGCTTAGCCTGGGGGTAAATATGGGATACAGCCT
+CTACGTAGTTCATAGCATCGCCTCCAAAGAGCTTAGCTGGTATTCAATGAGGATTCCCAT
+TCCCCCATTAGTTGCTGACACAGCCGGAACGGTGCTAACGTTGCAGGTACCATTTACGCC
+CTTAACCCCACCATCTAGGACAATCTGTGACGGTAGGATATCGGAGTCGGTAATGGTTAT
+TAGGAGTCCTCCCCCACCGCCTCCACCGCCTCCACCCGAAGCACCCCAGGTATTCTGGTT
+CAAATTAGCCCCATTGGAACCAGCTGTCCCGTTGCCTCCGCTAACATCAAGGGTGATGGT
+ATTGACGATGGAGGGGGATATGACAGTCAGGAATCCTCCCGCTCCACCTCCGCCACTTCC
+CCCAGCGCCCTCGTAAGTGAGGGATCCATTTCCACTACTATTATATCCCCATCCACCTTT
+ACCGCCTGCACCTCCGAAGGATCCTCCTGCCCCCCCGGGTCCACCCTGACCCCCAGAGTT
+ACTAGAGCTGGTAGTCCCCCCGGCGGATCCACCCCCACCGCCATCCGAGATGGGTACCTC
+GGGAAACTGAGTGGTTATTAGGGCTGGAATGAACAGGTAGTTTAAATATTGCCATAGCCA
+CCCCTCGGGAGCTATACCGAGAAAAGAATTACTGCCTATGCTACTATATGAGGCTCCTCC
+GGCATTATTGGGGGCTGATTTCAGCCCCAGGGCTGATATCGAGCACCCGGAACTGGGATT
+GCCCGCCTGGGGATTAGAGTTGTCATTGGTGTTAGAATAGGATCCAGGACTACCATTACC
+TCCAACTGATCCTTTGGCGGTTATAATACCAGTACCAACTATGCTATTGGCAATAATTAT
+TAATGATCCTCCAGCAGCACCACCAGCTCCCCCCTGTCCAGCGTATGAGAAGCCGTTTTT
+TGCTAAACCTCCGAGGGGTCCTGGGGCCACGGTGAGAGTTCCGTTTACGCTTAGGGTCCC
+CTTCACAAAAACCACAGACCTGTGGGGAAAGGTTAGAGTAACTCCAGCGTTGATGGTTAA
+ATTATCGTAATGATAGACTGAGTCCGTTAGGGTCTTATGCGTTGAGATCGTTACATCCCC
+GAGTATTCCACTTCCGTAATACAATTTTATTCACTCCCCTATAATTTAATAATCTCAAGG
+GTACTATTGGCTCCCCCATGTTTGTAGCCTGCGTTGGTGGCCGGAGAATTGACAGCGGTA
+TTTACCTTATCTTCGCTTTTCAAATAGACTACCCGGTGCATTTTAAACATAAATTTATTG
+CCACTAGCTGTTGGGGGGTCAGAGATCCAGATGGTATCCACAATGCTTTCCATGAGTCCA
+TTAATAAATAACCCGTAATTAAACTCATACCTATCGGTAGTGGTATCGAATATAAAATCA
+AGGTTGGATAATATCAAGTAATATCCATTCTCGGGGGCAGTATAAAATTGCCCGTTTGTT
+AAAAGTGACTCCTCGTCGCTAATGGTGTTGCCGAAGGTTACGGTATTCCATCCAACATAC
+GATGTAAAGGTAGTAGTACCTTTGGCCTTTAAATAGTGTCTTGGGGCTAGCTCTAATTTT
+AATATTCTCCGAAGTAATCCCATCTGATTAGCAAAAAACATCTTCATCGAGGGGGCTTTT
+CTTAGGAACTCCCGAGGAACTTGTACATCAGCTCCGAGAGGAGTAATGCCACCTGCTAGT
+CCCTTTCTGTGGGGAGTTGAAGTCACCATGTGAGCGTTGATGACATCCGAAGTATCATCG
+AGGTCTTCGGTAAGTGAGTCAATTTGGAGCTGGAGGTTTCCAGCGGCATCAACGCTTAAT
+TGATCCTTCATGCTGTTAAACCAAATGATAAAATCATCCTGAAACTGGGCTTCCACAGCA
+TCCTGATCAGCCTCGATGGCTAATACCCAGGCGTCATAAGCATCTTTTTTGTCGGTAGTC
+CACGTGCTAAAATCCCCATCGTATTCTGTTTGCTTAGCTGCGTACCAATCCATGTACTGG
+TTAAAGATTGCCGTGGTATCTACTTGAATTAGGCTGTTGACCCATCCGCATTTGGTGGTA
+TCCATTCGCAGATCAGTAATATTAGCTTGTGTAACTTCTATTGCACCGGCACCGATATAA
+ATCTCAGCCAGGGCCAATTCATAGATATCAGCATCCCTTTGAATCGCCGGGGCCACCGGC
+AAGCTGGCAAACACGCCTTTTTTTATAACCGATGTGATCTTTCGTAGAACGGTATCCAGC
+CTGACCACTAATAAATCTTTCCGCTTTAAAGCACCGTCAGCGACATCTATTGGGATTACT
+AGATCGGAATCGTTAAGGTAATAATACCCGTTTATCCATGCCTTGCCCGCTTTTAAGAGA
+ACAGACATCCCCCCGTTGGCCATAGCTTGAAGGCTTGTCGTTGGGTTGGGGAATACGCCG
+GTCGTAATAAAGCTGTTAAAATACGCCGCGTAGTCAGATGCTTGGTATTTTCGATCGCCA
+CTGACTGAATTAAAAAAACTTGATTTCTCCGCCAATTCTTATCACCTCATTTTCTGTTTG
+ATTTTATCGAGTAATGTTGGGATGCTGTTTCCAAAGGTGACATTAATCCTTACTCCAGCT
+TCCTCGTAGACCTCTTGAATTTCAGTGATTCGTGCATTTATAGTAACGCCCCATTTTTTA
+CGAACACAAGTCACTATATCCCCAAGATCAAAGTCAGTTTTGTAAACCAGGTTAGCATTT
+AGATTTATGACACTGTCAAAGGTTCGGTTCTCTACTCCTTCAGAGAGCTTAGAATTACCT
+CGCTCCGTTAAAGTTTTCAAATAATCTGCATCCGACAAAGTTACGCCATTAACAACGTTC
+GTAAGATCCTTGGCGTCCACAAAGTCCTCGAATCGGTTTAACCCTGTGGAGGATCCAACG
+GTTACGAGCTTTCTAGCTGTACCTTCACCCATACCCCCTACAAGGGCTGTATCCCGATAG
+TTATTGATGCTCTCGGTATACTGTTGCGTGAGAATGTTCTCAAACTCTTTACTGAAGACC
+GCCCGCGGATTAACGCTTTGATTTATGGAACGATCTAATCCCGCGTACACATCGAACACT
+AACTTTTTATTGGATGTATCAAAGCTAACCCTATATCCCAAATCAGAGAGTGAGCATAGG
+TTCTCAATTTCATCCAAGAGGTTTTTATAACTCACTTGATAGTTAACTGTTTGAGAATAG
+CCTTTTAAGGTGCCTAAACTAAGGTTTGGTATGATTCTTTTATTATCCGTTGGAGTAATG
+CTGTGCTTGTTTACAAGGGTTCTCATGGCATTTTCTGCTGTGCTCTGAAGTATCTCCTGG
+CCCCATACAATGCGTCTGTTCAGATAGGCCGAGAGAAATTTTCCCTTAACGACGAGAATT
+TCTTTACCTTCCACGTCTTGATCCATTTGCCTGAATTCAATGTACCCTGCTTCATCATCG
+TTATTCTTCCAAACGACATTCCCCCTTTGGAGCATATCAAGTGTGTAAGCATCTAAAGAA
+CAATGCAGCTCGAAATCGCCGCATTTAGAATAACGGCGATTCCACTGCAAGGACGTGAAA
+TTATCCATAACCCCCAAAAGGTTAAGGTCTGAATTGTAGATATACAAATCCATCATTACA
+CCCCCAGATACTGAGGCATGTAGTAAATGGTTACCTCAAGGTTGTCTAGATTTGTGTCTG
+AGTTATACCTAAAAAGATTATCCCCTACATCCAACTGTAAAAAGGTACTGCCAACGTCGA
+TGTAGTTAAAAGCGTTCGTTGTGACACCATTCAAATCACTCCTAACCTTTTTGTTGCCAA
+AGTATGTGGAGACCGTAATTGTTTCGCCAGCAATCATTTCTTTATTAATTTTGATGAATT
+CCTGAGTGTTCACATTGAGGATAGATGGATTCGTAAGGGTTGCAAGCGCCTTAAACTCTA
+CTCGCATTCCACACTCAACATCGCCGCCATTAAATACATTCACGATCAAAGACGGTTCTC
+TATGTCCCATCTCAATGCCGTCTTCAGTTAACTCTAGCTCAAAGCTAAAATCACCCACCC
+AAAGAGCGATCTCTTCCTTTGATTCATCGATATCAGTCCAGAAAGGATTACTGGCAGTCA
+TGGAGATTAAGCAGTCATCGTATGAAGTGTCCGTTATCTTGAAAAATGGCATCTTGTTAA
+TGAGGCATTTTACTTTTCTCTCCTTAACATTATCCTTGTAAATTAGATACCCCTCTCCGT
+ATTTCGGGTTAAATATGGCGTTGATTTCGTCTCTATAGGCCGTCAGTTCGTCCTTAGATT
+TAGCCAATAACATAACAGTAAGGGTTATGTCCCTCTCGTTTAAGGTATTGCCTAGGTATG
+TCCTCCCATCCTGGTTAACCCCTTTAGAGTTATAAATGGTTACATTGTTAGTCGTCTCAA
+TTTTCTGCAGCAAAAAAGGAGCAGTATTTGATAGTTCAATACTTACCCCTTTTGCATTGA
+CATAGGTCACCTTCCGCACAATACCCCCCCTAGAATGCTAACGCTAACTCTTGCAGGGCT
+CTTTTGTTTTGCCTTGCTGTCTCGGCAGGGCTTACAGCTGCAGGGCTGTAGATGTTCACC
+GTTTGATTGATAGCCTTCGAATTATCGGCATTTCCTGCAGAGGCTGAACTTTTAACGCGA
+CCTTCAATCATTTTTTTACTAAGAACAAATTCACCCCTTTGGGCGATAATCGGAACCTCA
+TCGGGTCGAAGGTCTAGTCCAACCCACCCACCCTCGTGGAACTTCGCATAGTTTTCTTCA
+TACTCTTCTTTTGAACCGTTTCGGTATAAAGTTTGACCAGTTTTATAATTAGTAATCGAA
+TATTGACCCGTCTTTTCATTATACGAACCAGATTTAGTGTTAATGGTTACTTGACCATTC
+GTTTCAACAACATTACCTACACCTTTGACATTAGTAATACTAGTACCACTTGAGCCTCCA
+CTGCTTCCTCCTCCTGATCCAGAAGAATAAGTTGGTTCTTTGATACTAGATTGCAATGCC
+TCGGAAAACTGTTGGCCAATGGTTGTTCCGGCAGTAACAAAGGCCGACGCTTTACTTGTG
+ACCGTGCCCACTATGTTATCCATAGCGGCACCCACGGCAGAGGCTTTATTTCCAATGCCC
+AGAATTAAGCCATCAATGGTGTACTGACCAACTTCTTGAAGTACCGTTGAAGGCGAGTGG
+ATACCCAGTATTTTCTTAATCCAGTTAGGCAGGGATGAAGCCATTTCCTCTACGGTGCCT
+TTTAGTGATGCAAGTTTATTGCTGATTCCATTAATTAAGCCCCGAATGATGTCTTGACCG
+ATCTGCATTAGGTCAATATCTTGAAGAAATTGTTGCGATTGATTCCATTTTTCAACGATG
+GTTGTTCTGACAGCTTCCATTTTGTTGTAGATAGCTGTTTTGATCGCTTCCCAGGCATTT
+GAAATATCTGTCTTTATTTCGAGCACCTTCGCCGAAATGTATGCCTTAATAGCCTCCCAA
+GTGGTACTGAGCCAAGTCGATATACCCCCGAAGATCTCAATAGTTTTGGTCTTGACCGTT
+TCCCAATTCGCAATAATCAGCACTGCAAGTGCCATTACTGCTGCCGTGACCCATGCCACT
+GGCCCCATAGCCATTACCCAAGCCGACGCCATCTTTGCGGCGTGTAATAAACTCTGTACG
+CCCATCCATGCCCATTTTGCCACCACGATGGCTGACTGCACTACTAATATAGTTACCGCT
+GCCACTGCTCCCACTCCTGTTGCAGCCCATGATGCTACAACCACTAAAGCGTGCGCAGTA
+CTCTTTAGGCCCATTAAAAGCCAATCTGCAACTACCTTGGCAGATGCTATTCCATTGACA
+ATTGCTGTTTTTGCTGCTTCAATCCCCATGACTATCCAGGCATTAATCACGACCGCAGCG
+ACCGCTCCAACAATAGGTACTATAATAGCCTGGTATTGGACAAACCAATCAATAATCCCA
+CTAATAGTTTTTGCTGCTTCGTCAATGGCTCTCCCTGCCACGGTAAACGCATATTCGATC
+TCATTTTTGATCAGCGGCATATTGGTAATAATCAAGTTCGTAAATTCATTAACTTTTGGC
+ATTACTTTTTCACCAAGGGGGATGAGGATAGACGTTTCCATGTTTCGTTTTATGCCTTGA
+ATTGCGAGACCAAAGGTATCATACTTGACTTCGTTGATTTTTCCGAGTGCATCCGTTGTC
+TTACTTATTCCCCCCTGAGTATTCGTTAGGGCCTCCATGCCTTTTGCTCCAATATCTTCC
+CACATGGTTCCAAAGAGAGCGACCCCTGCTGCTTCCTTTGCAAGTGGATCCTCAAGTGCA
+AATATTGCCTGAGCCGTCTTGTCAAATGCCTCTTTTGCACTATCTCCACCTTGAGCAAAG
+GCCAGTGACATTTTGCCAGCATCTAAACCTAACGCTTGAAACGCTTCGGTAGATGCTTTG
+CTTCCATCCTTGGAACGTATACCAAACTCTTTCATGGCATCGCCTAGTTTGTCGATATCA
+AAAACACCGGTAGCTGCCCCGTTCGCCATCATGTTGAACATTTCTTCGCTATTAAATCCA
+AGCTGTTCGAAATGAACACTGTACTCATTAATAGAGTCCAAGAGGTTCCCGTTTTTGTCG
+AGACCCTGTTGTGCACCTTGGGCTATAAGGTTAAATGCTTCATCGCTAGTAATCCCAAAT
+CGCTTCATCATCATGTCTGCAGTTCTTGTGCTTTCCGCGACCTCAAATTCAAAGGTATCT
+CGCAGCATTAAAGCATCTTTGGTCATGTCTTCAAGCTCTTCGCCTGTTGCACCAGTTTGC
+TTTCCGACTTCTGCCATTGCCTTAGCGATGTCCTCAAAGTTCTCGCCAAGATTAGCATTG
+TAAATTTCAAGCAACGTATCTTTCATGCCGATCATGGCTTCATCGGTTACCCCGGTTTCG
+GCTTGAATTCCATTAAGTGCCTTTTTTAAATCATCACTAAAGCTAACTGCAAGTCCACCA
+ACCGCCAGAGCCGCCGTACCCATGGCCAGGACTATTCCGGCGCCCACCTTCGCAGCGCTG
+GACACCATTTCGCCGAATGTTTTTGCTGTGCCCTGAGCGCGTCTGTCGGTGTCGTCTATA
+CGAGCATTCGCGGCATCATTGTCGATTAAGATTGATCCAAACAGTCTAAATATCTCTATT
+TTTACCACCTCCCATTCAATGGCATAAGAAAAACAACCCTTGTTAAAAGGTTGTTTGTTT
+TGTGTCATTGCTTTTTGGCTTCATGCGCTACAATAATCGGTAGCAGCTCATCAATAATCT
+CCTCGGCCGTTATTTCTGTGTGCTTCAGTTGTGGTTTGAATAATTCGTTCTTATAATCCT
+CAAAGCTTTGAGGGTGGATATACCCCAGTACCATATAAGGATAGAGACTGTTCCACATAT
+CCCAAGCCCATTCCTCTTGCTCTTTGGTAACAGCTTTTGCAAGTAAGCGCACCAGGTGTT
+TGAGCTGTATTTTGCTGGCTGAATTAACACCATAATGGCTATACAGTAGGTTGATTGTTT
+TTGGATAACCTACCGTATAGCATCCTTGAAAAAACCAACGGCTTCTTTATCTGAGAAGAT
+TTCTTTGAAAGAATTCATGGTCGTAATAAAGTTCTGTGCCTTAATTTCCTCGACTGCCTT
+GTCCTCGAAAACAGCGACAATCTCAAAGACTTCGTTTTTAACTTTGCCTGAGTTCTTAAG
+GACAAACTTAAACAGGTTAATCCCTGCACTCATTTGGTCAAGGCTCTTGCCTTTGTTTTC
+TTCCGCAACCTTTTTGCGGTATCCGTCGAGGTCTAGTTTATCGTATAGATCCACCACATT
+GGGGAGCATGTCAAAGGCTTTTTCCGTTGTTAACATATTTAATTCCTCCAAAATTAGGCG
+GGGGGTCCCCGCCTTTTGTTATCCTGCTACAAAAGGATCTACAATCGCTGCAACATCTTC
+GATTTTGTACAGGTCTGCGGCATCATCAAACGCATCCCAATGCGCCATGATCTCAAGCCC
+AATCTCAGCTTCGCCCTTTGGCTTTGCAGCCAACTCGAAGGAGGATTCGCTCATCGCGTT
+ATACAGAGTGATTTTTTTGTACTCGTTATTCATGAGCTTCGCGAACATAGTCACATTGTC
+CAAGTATGCGGTGTCTTGTATCCCGCCAATATTTGCGCTCTTGGCTGTGATTGTTTTCGC
+CGTGCCGTCGTAGGTCGCCCAGGGCATTGCGATAGCTAGGGTTTCCATGCTTGTGTCTAG
+GACCGTAACGCTCAGGCTTGCCGTTACACTCTCTAGGACTTGCATGCCCTTGCTTTTGCC
+ATTGCCTCCGTCATATTCGATGTCCCTGATTGTTGCATCGACCTTAAAGCCCCCGCCCCC
+TCTAGTGGGTCCTAATCTGCGCTGTGTCGCTAGGCCGTAGTCCGCAAAGACGATTCCGTA
+GTCGACTTGGACGTTTTCGAGTTGAGTTTGTGTAAGTGCCATATTTATCACCCTTTCCTA
+AATAGTTTTCCTGAGAAGTTGTACTGGCGACGCTTGATAGTTTTGTCATCATCGATCAGC
+GGGAGCATATTTTCGAGGTAAAAAATTATTGCCATTTCAGGGTTTGTGACCGTTGTTTTG
+TCCAGGGTTTTAACGCTGGTCATAAGATTCTCTAGTTCGGTAGTGTCAGGGTTTTTGCTC
+CATCCATCCACACTTAGAGTACATAACTCGAACCCTTCGCCATCAGGATAGAGCTGGAAG
+TCGAACACTAGGTAAGGAAAAACCGCTGTCGATGGTGCCTCTTGGAAGTAGGCACGAGGG
+TGGATTGTTTTGAGGAAAGCCGTTAAGGATTTCCTTAGTGCGATCATGAATCCGCCTCCT
+CATCCGCTACCTCTGGTAAGCCGTTTTCTCTTAGGCTCTCGATTTGCCTGATAGAGTCAG
+CTTGCAGTTCGCGAATTTTGGCAAGGTTACTGAGAACAGGAGCACGAAGGTAATCGGTTC
+CCTTCATCCTTACCGTACCGAATTGCACTAGGTGGGCATGGAAAGCATATTTATAACCCT
+TTTTCTTAGCTCTCGCCCTGCTGTAGACTCCGATTTGAAGAACGGGGGTTTCATTCGCCC
+TTCCTTTTACCCATGAGCCAACATTCTTTTTAAGCACACCTTCATGAATAGGAACTGTCC
+TCTTGATTTCCTTTCTCAAAAACTTTGCGGTTTCCCTAAGTGCTTGTTTTTCCAACTTCG
+CTATGGCCCCTTTTACGGCTCGGGCATTTGACTCAAACTGCACACCCATTTACACCACCC
+CATTCACAAGACCCTGACAGGTAAGCTCTGTGTCCTCGCTGTTAGGCTCAAACGTGCGAA
+TAATGTTGTACTCCTTGCCGTCGAATTCGAGCTTTCCTTCTCCTGCATATTCACGAGTCC
+ACACAACAAAGCTTAGTTCTGGTCGAAGGCCGGTTGCTTTCGCCTGGTAAAATTCAGACT
+GGCGTATTGACTTTTTTTCGGCAAACACTAGGCGCTTTGTTTTGGCTTCGATAAAATCGC
+CCATATCATTTTCGCTGATAGTAGTACTAATCAGGTAGATTGCTTGATCCGGTCTATTCA
+TGGCATACTCACCGCTTTAAGTTGAGTCATAAGAATATCAAATGCTAAGCTGAATTTTAC
+TTCTCCGCTTTTTAGATACCAAATATCATTTACGCCAACGGTAAGCGTTGCAATCCCTAA
+CTCGTTCTCGACGTTCTCAATCGTTACTCCAGCATTCATCATGTACTGTTTTACTGCGAT
+TGCTTTGATTGAGAGAGTCGAATCTGTATACTCGCCAGTAATCCCTAAACCGGTTTTTAC
+TTTCTCCAGTAATTCTTCGTTCGTCATTTACTCACCCTCTGCGGGATCTAAGGAAAACGG
+GACTAAGACAATAGTTAGCCCCGTTTTTTCCATCTCATATCGAAGCTTTTGAGATAGTTC
+CTCATGCTCCCGGACCGTGAGTGGCCTTGTTGCTTTCAAATAAAGAACGCCCTCAGTCTG
+CTTTACTTCAACAGCTTCAGGCGTCTTGCTTTTAGTTCTAGCCATTTATGCCACCGTCCT
+TAAACAAATTAGGTTCCGGAGTAGCTGTAATAGGCAAAGGTGTTCTTAGCAAACAATGGT
+TTACCTCCGGAGTACAGCTTGCCTCGCCACACGGTTTTATCCTCGGAGAACTTCTCAGAA
+GCATTGGCTTCGATGACAAAAGCCTCTGATTCATTGACAATATAGGTTGAAAGATCACCG
+TACAGCACAGAGTCCGTATCCGGCATTTGGGAAGTAAACACCACCGGCTGCCCGGCAATT
+AAGTAATTGGATTGACCAGGACCGCCTTGCACTGGAAGGACGGATACTAAAGGCTTCCCG
+GCGGCATCGGTGATTGCGAAAAACCGCTTAAAGAAGGTACTGCGCTTCATGACCCAGGTA
+GCATTATCTCCATAGGGACTCTCCACCTCTGAACAGATCAAAGCAATCTGCTGCCAATCC
+ATCAAGGAATAGGTTTTGGCGGCTGAGGGTGCAACTTTAAGGGCTGCAATAATTCCTTGG
+AAGGTCGAGGTATCCACCGCGCCGTTTAACACGTAGTTTTCAAGTAAGATCCCAATGTAC
+TTACCAATTTCCATGGCAAGGAACTTTTCAAAGGCCGGAATGCTGTTTCTGAGCAGCAGA
+TTCTTAACAACAATCGTTGCCACAACGGCCTGCTGTGAAATTTTCACTTCGGTAAAGGTG
+AAGTTGAGGGTTACTGTGCCGTCGGGATTCTCCGTCGGTGCCTCCGTGGTACCAATTGGC
+AGGGACACGTCCCCTGTAAAGCCAAACTTTGTGATAGCCGTGTACAGTCGACCGTATTGT
+TTGATGACGGAATAGACATTATCGAGAGTGGTTTGGGGAACCAGGTATTCAGCACCGCTG
+GCCACACTTTCGCCGTTCATATCCGTTACAGAGCGCTTACCAAAGGCCATAATGTCGGCG
+TCTGCTTCACTGATTTTCCCATTGAGATAACTTCGATAGAAAGCATCCCTGTACTTTGCG
+CTTGAGCGATAGTTCTCTTCCGTTAGATCGCTATGGTTTTGCTTACCGAACATAAATCCT
+CCTCGTTTCTCGGTCTCCGGTGCTTCCTGGAGCCTTTCATTGATCTCGTCCAAGCGTTCA
+GACATACTTCTAAGGTTGTCGGCGACTTCGTTCATGTCTTCGGTGGACATATCCCGATGA
+TTTTTAACCTTGCTCTTCAGCTCCAACCGCTTTTGTTCCAACTCTGACTTTTCTCTGCGG
+AGTTCCGCCGCCTCTTTTTGGGTTAGTTTCATGGATTCGTTCCTCCTCTTTCTTCGTTAT
+CTTGTAGGGTTTATAACTGACTGATCAGATTCATTAAGGCCAATTTAAGAGCAGTATCGT
+CAGCCGGTGCAGGTGTCTCAGGCGTCTGCTCTTCGGTAATAATGACCGTTTCTTCATACG
+CCGGGAAAACGACGATACTTACCTCATAGACATCATTAATCTTGAGGATGACGTCAATTT
+TGTTTTCCCAGTCCGTGGCGATCATGGCATTGTTATCGAACCAAAAGGACATACCATCCA
+CAATTTCATTTTGAACTCGGTCAAAGACGTAATCGTCCAACCAGGTATTTCCTAAGGTTA
+CCTCAATGAACAGGCCGACTTCGTCTACAACCGTCCTCATATTCTTCCCTGCTCTACCGA
+GCACCCAGGACGTGGCATGATCCCACAATAAAACAAGCTTTGAAAGATCAACCCCTTCCA
+AAGCTTTCTTATCAACCTTCTCGATCCACTTACTCCCGCGATAGGGGCGTCCCGGTGTGT
+CGAAGAGAATTGGGTACCCCCGCAATCTCCTGACGTTTTGGCCATCTACCTCTTCGCTGA
+TCGCTCGAAATTTTGACCGATCATCATCAAAGAGCATGCGCTTTTTAGACTGCTGACTCA
+GGGGTGACTTTTTCTCCGCTTCCTTGCTCATCGCTCTCTCCTCCTTTCTGCTCTACCACA
+TAGCTCCCGGGACTTAGGACTTGAAAGTTTTTGTTTTCCAAGAACTTGTCTAATTCCGGC
+GGCCCTTTGGTGATGCCGAGCCGTTTTCTGATCTCATTGCGGTTCATGATGGTTCCATAG
+ACCATTTCTTTGTAAAAGGCGGTCTTAGCCGCCAGGGTACTGATTTCCAAGTCCACCAAT
+TCTGCCTGAACGCAATTTCCGTGAAAGATTTCTGTTTCACTGAATAAGGCATAGGTGGAG
+GTTTCTTCGATTTGCCACACCCAGGGTTTGATGGTGTTGTCCACAAACTGTTCAAACTGA
+AGTTCTGAGGCGGTTCCGTTAATGATTTCGTAACTGACTCCAAAGTAGTTATAGAGTTTT
+CGGGTGATGTCATCCAGCAGCTTGGTATCCAAAGGGTTGAGCTTCATGTCAAGATTGTGG
+ACTTCATACTCAGCGCCGATCATTCCGAAACCGGTTGTGTTTTCAGCCGTGAGAAACAGC
+TCTTTAAACTCATCCAGCTTTTTCTTCATGTCTGAGCTCTTCAGTTGAGATTTAACTTGC
+AGCAGAGCAGCAATTCTCTGGCTGTTTTCGCTGTCCTTGACTGCTTGATTTTGCATGGTG
+TTGACAATTTGAACATAGTTTCCGGAGGCCTGTTTACTAGATCCTTGTTTACCGTCCGGG
+AAGCGCTGCAGGTGAATTAAGTCGTCATAATAAAAGGGATAGCTTCCGCCTAACGTGACG
+ATAATTCTCCCCTGGGCATCTTGGTTGAACTCACCAAGCGTAAAGGGTAGTGGCCAAAGC
+CAGCGCAATTTGCCGCTATGTTCATCCCATTCAGGCATAATAAAACAGTTATTAGTCAAC
+AGCACTTTCGTCATGCAATGAGTCCAGAAAACCTGGGGACACTGATAAGGATTGGTTCTT
+ACCTTCAGGACAAACCCCAGGCGGTCATTGACTTGATTCATGTTACCTTCCGTGTCTGCC
+CGGATATGGTAGAAGGGAATGCTGGCCACTTTTTCGGCGATAAAGTTAATGGCTGTCCGG
+ATTTCCGGGATGTTGTAAATATTCCCCCCGAAGAGCTGCGTCAGAGAATATCCCCGGTTC
+AGCAAATCAATGACCTTGGCAGCGGTTACTTTTTCTTTCTGAAAGTAACCGGCCACATAT
+CTTAAAAAACCCAAATGATCACCTCTTTTCTACGGCTGAACTCTAACTTATCCCTTGCTA
+ATCGTTGGCCAACCATGAGCCGTTATGCATAGGCGCTCTATGGTGTTTGCGACAGAGCAG
+GCTGCTTCTGCATTCAGGGGTTACTTTGCTTTCAAGATACTATCTTGTACTTTCTCCAAG
+GCTTCAATCTGCTTTTCGATGATGGCTTTATATTCCATAAACCTTCCTCTCTTTCTACGA
+CTGATATTCTTCGAATAAATCCTGTACTTTTTTATAAGCAATATAGGCCATTAAATAGCT
+CATATACCCGTCAATTCTCGCCTTACTCTTTGCCTTATCCGGCTGAATGTTTGCGTTGGT
+GTCGATCTTAGCTGCCGTATTCGTGGTACACCACCGGAAAAGGCCATTGTGTCTGCTGAA
+CTGTACCACTTTGTCCTCAAAGAGCGATCTCGTTTCCTTCATGGGTTGGGAAAGACTTTT
+TGCTCCCATGGCCACGGAAAAAACCACACCGCGACCTTCCTTGTTCTCTCGCGGAAAGCC
+TGCTATCTCCATGTCGCTGGCGAAGTCCTCATAGTGCCAGCGGTCTGCACCGATCTTCCA
+GAAGGTTACCCCATAGGTTTCGGCCAGATCAACGTACCATTGGACAACATCCTTCCTGCT
+TACCATGCTTCCCTCGCAGATATGCAAGAGCTCATGGTTAAGTCCATCGCTTGCCCCAGT
+GCTGGTAAAGCTTTCGTAGGCCATTTTATCGGCCTTGCTGTTTTGCTCAATCCTTGACCG
+GGCAATGAAATATTTTTGAAAGAGATACAGCTTACCTTGGATCGGTACCAGGGCCGAGGA
+TGCACAAAGGTCTGTGGTCTCGGAAATATCGCTGGCACCAACAGCATAGCGATCCTGTAT
+CATATCCTCGATCATATCGATGGCGCATTGATCAACAATGGGGAGATCAAAATAGATCAT
+GCTTAAGGAGCTGGCCCGGTTAAGATGCTTAGCCAAGAACGATGGCATTTGCGCTGGATC
+TTCCAGGGCTTTTAGATATTCCCCTTCGAGGTAGCTCATAGTGGGTCTGGCTTCCCCTAA
+TCCTGGGTTAGCCTTGATCCAGCACTTACGATCCTCCGGCTTGTCGTCATCGTCGATCCG
+GAAGATCATCGGGAAGACACGTTCTTTACTTTTTCCGTTTAAGACCTTTTTGCAGCGCTC
+GAAGATGCTGTCAAAGATTCCTTCGCGGACAAAGCCAAAGGTTGAGATGATAACATTTAG
+TGGTTGAGCTCGAGCTCCTTGGGCCGATGAGAAGACATCGTAAGTGTTACGGTTTTTGAT
+GGCATGAAGCTCATCGATGACAACTCCATGAGGATTTAAACCGTCCTGTCCTTCGCTATT
+TTTACTGCCGGCTTTCATGTATGAGTTGGTGGCAGGAAACAGGATCATCTCAGTGTTGTC
+TTTATCCCTCTTAGTCCGCCAATGTTTTTTGGGATTATCCTTGGGGGTCAGAACATCGCT
+AGTCTGCAAAAACGATTTCGCCGCTTCATAGACGATGGCTGCTTGAGTCTTCATGGTGGC
+CAGACACCAGACCTGAGCAGCCGGTTCTCCATCGGCCATTAAGAGAAAGTCTGCAATGGC
+TGAAATGAAGGTGGACTTGCCCCATTTTCTGGCCACGAATAGGATCATTTCCTTGAAGTA
+TCGAACCGTCATCTGCAGTTCGGTGTCGTAGATCTTAAAACCAAAGATGCAGGCGGAGAT
+ATACTTTTGCTCAATGGACAATTCAAAGGGCTGCCCGGCCCACCGGCCTTCCTTGTGCTT
+AACCAGCTTGCAGAAATCAATAAAGGCCTCTACGTCGGTATCGTCGTAGAAGACCTTTGG
+GTTTTTAAGTAAGGATTCAATGAGTTTCTTTAACTTTTTGATGTCTTTACAATGCTTTTT
+GGGCTCTCGATCAACATAATCATGCCAGCTTTTTATATATTCCGGAGCAATAACCTTAGG
+CTTAGCCACCTTTCCCCCGCCTTAGGATAATCTTTTCGAAGGCATCCGGCTCCGAGGCTT
+TGGGTGGAGGACCCTGCGGCGTTAAGTCTGTCAGCTGCTTGATTATGCTCATGTGGTTCT
+TCACCATCGTGTTGTAGATCTCAACCTCAGGCGATTTCTTTGTTCCGTGTTGGTTTTCTC
+CGTTCTGATATTCAGAGACTGTGCCTTCTCGGTTGATGGTTTCCTGCAGATCCTCAAGGG
+TTATCGTCATGAAGGCGGCGTTGGTGATCAGCGATAAAACTCGGTTCATGGTATCTTTGG
+GCATATTCTTGAAAAGACGCTTAAGTCTTTGGATCTCTTTCTTAATTCGCTCTTCTTTCG
+ATAAGTCTTGAAGTTCCTTTTTCATGGTTTTATCACCTCCCCACCACACCCCCCTATACA
+GATCTGACTCGCGTAATAAATAACCTTCCCTCCCCGGTCCCTGGAATTTATTATTTGTTT
+TCAGAACCCGGGGGGGATGATTTCTTAGGCAACATACTTAAAGGAACTACTGTTCCCGAA
+CATTTATTACATCTTAATCCATCTATTATCCATGGCTTATTATGGCTGATTGTATATCCG
+CAATCAATGCATTTATGCGTGGGCTTTAGCTTCTTGACCTTGATTGGATATCCTTCTGGA
+TAGTCCCTTTGTAATACACGCATACCTAGTATCTGTTGGCATTGATGTATCCCATTTGTA
+AAATCAGTCATATCTGAAGTGTGAGTTATCTCTAGTTTTGCAAACTCATTCCATGCTGCT
+TGAAGCGCATCCATAACTCTGCCCTCATGCTCCGTTAATCCGTCTTTTCTCATTAATATA
+TCAACTCCCTTCTTGGCTAATTGGCGGTATTAAAAAGTCTTGCAATCCTGTACTTCTTCC
+GCTTTTATGGTTATGACAATCAGTGCAAAGGTATTGCAAGTTTTCCGGATTATATGCTAT
+GTTCCAGTCATGCTTGTTTGCATCGGTTAACTCAATAATGTGATCTACTTCCTTGCCTGG
+CTTAATGATGCCTTTGGCATGGCATTCTTCGCAAAGACCGTTAGCTCGGATTATGACAAA
+CTGCCTCGCTGGTTCCCATTGTTTATTCTTGTAGACTTCTGGATGCCTTGCCATTTACAT
+TGGCCCAGATATACCTTTGTTCGACCTCATCAACCGATCAAGCGCTTTAAATCCCTTTGT
+ATCCTCGAACTTAATCTTTGGATGAGGTTTAATTGGCTTTTTCTTTAGAGCCTCATTAGC
+CATGTTGCCCTCCTTTTAGGCATAAGAAAAAAAAGAGCCTCTCGGCTCTTGATCCCTTTG
+GTATTAGTGAACACATCAAAGACATATTTCAAAAATCTTCACAGCTATACATTAACATAT
+AATCGAGGTCTTTTAGTGCCATGGCACTGCCACCTTTATGCCATCTTACTGCCAATCGAT
+GAACAATTAAAATTTAGCTAAAAGTATTGTCATTTATCAAAGGAATTGGAAAGTTATTGT
+AGAAAATATTTTAGATGGTTATCTAGAAAAACTGAACTATTATGCTATTGGTATCTACTA
+TTTCATGTGCTGATAATGGGAGCATCCCGACACATGTCTTGTATTCATAGAGTGATCTTC
+CGACACCTGTGAGAGAAAAGCAGTTAACAAATTTTCGATATTCAATTCAGAGGAAGATGA
+GGATTTTCATGAGTATTAACAAATAACTATTTTTGTCAGTTCGTGGGACAGGGAACTTCA
+CATAAACAGTGAATTTGCAAAACTTGAGAGGATATGAATGTAATAGCCAAACTTCGCAAA
+TTCACAGAACGTCAGGCACCATTAATAAAACCTACTATAAGAAAGGAGACTTTATTTGTT
+TGGGACAATAATTCTAGATGCGTTTACTAAATCTGAAACTATGGAAATTATCGAGGCTTT
+GGATGAATTGGTCAATCCATTAGATAACTATGGTTGGGCTTCAGCAGGTATATATAGTTT
+TTGGAACTATTACACCAAAGAATTGCTTTACATTGGATTAGCTGTAGACCTAACGGAAAG
+ATTTAAGCAGCATAATGGTATAATCCCTATGGATCCAAACGGATGCAAAAAGGATAAGAT
+AGAGGAATATTTTGGGTCATGCGATAAACTTGGCTATACAATATTTGTACAATCCTCAAT
+GTCTCAACCTGCTACTCATAGAAATAAACAACTATGGAATGGACTTGATATTAAGATGTT
+TGATGTTCAAGATTACCGTGATGACCTGGTTAGGGATGACATTCGAAGAGTTGAAGGTAT
+ACTTATTGAATCATACCGAATAAAACATGGGGATTTGCCACCATGGAATAGAGTTGGGGG
+ATCAATACTCGGTCAGCAATCTGTTAATCCAGGGAACTATAATGAAATTGTTGCAAGTTT
+TAGTTCTATGGATCCTAATTTATTAACGGCTAGGTATTCTCTAAGGGAAATATCTAATAA
+CCCAACATTTGAGAGATACGAGAACACTATGCATGCAATTAGAATGCATATGTTATTATG
+GGGGATGTCTTTTGGTGAGGCACGAAACCTTATTAAGAGATCTGATAGTACTGGTTTTTT
+CGAAAAAACAATACAGGAAATGAACCGTGCAGGATATTTTAAGCGACTTCTAGCGATATA
+AGAGATTTATCTGAGCTCACATTAAATTATAGACAAATATTTTAGTAGGGACTATATAAA
+CGAAATAATCTATTACAAAGTTAAATGATGGAGACTAACACGGGATTCCCGACACTTAGA
+GGAAGATACATCCCGGTTGGGATGCGTTGGGAATCCTTGGACATTGCGCGTTAATGCTTT
+AGGGTTTTAGTTTAAATTGAAGGAGAACGATTATGGATTTTTTGGGAACATGGGAATCTG
+TGTTAAGCATTGGAGGAATTATTCTAGCTATATTTGGTATATTAGCAACTAAGTATTATT
+ATGATAAAAGTGAAAAAAAGTTCATTAAAGCATTAGAAACTGAAAGAGCTCGGATAAAAG
+AAGAGTACAGTAATTTTCTTGCGAAGAACTTAGTAAAAATGAAACTTGAAGAAGAAGAAA
+TCATTCTATCAAGAGAAACAGTAAAATTAAGTATTCTGGGTAAGTTTAATAGAACAAATA
+TACTATCAGAACCAAACGATAAAGAAATTGATGAAATAATTACAAGAACTTATTCCATCA
+TAGAAGAACAGGAATTTGTTAGTACCTCGGTTAAAAGATATATTCTAGAATCTCTTTCAA
+AGACTATACAACAACAACATACTTTAAAATCTGAAACTATCGAAAATAGGTCAGAAATAA
+GTAATTATCAACATCTAATAGATATTTCAAGCACGCAATTGTTATATATATTATCTGGTT
+TCAGTTGTCTCTTACTAATAATATATTATGGGATAAGTCATTATGGTATTAAATCCGAGT
+TTTTGATGAGTGTTTTAATAATGGTTTTTATCGCTATCCCTTTTATGTTTATGGCTAATA
+TGCCTTTTAATTTTTTTAATCCGAGTTTATCGTTTTACTTCAAGTTACATTCATATTTTA
+ATATTGGTTTAGTTACAGTTCTTATGTTAATAGGGAAAACATTAAATAAAAATGATCCTT
+TATACAATGTATTCAGTAATATTATAATGTGGAGTTTGGCTACTCTGCCAATAAGCTATT
+TCTTGTTTATTACCATTAAGAAATTTAAGAAAAAAGATTAGTTGTCTTGTAACATGACAA
+ACATTACCCCGTATAGTTGTTTTACTACATCCGAATTACATTTAGGGTAGTAAAATTATA
+ATAGCTGTTTTAACCAAATTTTTTACCATCTCTCATATCCAACAATATTAGGGCTAGTAA
+TTTTCCAGCCAACTTATAATTATTCAAATTTAGATGAAGAAAATTTCTTTAACTTAAGTG
+AATGCAATTTAAAGACTCGCACAAACAGGCGGAAAGGCGTCTATGAAAGAGTAAATTCAT
+TCCATCCCCACTCTTCGAAACTAATCTGCTCCCTACTAACATATCCAAACATCTGAGCAG
+CCATCACTATCAACTCCTCTTTCATCCTGTAATACGACCTTACAGCCATCCCAATTTCCC
+CGGCTATCCAGAAATCCTTATTAAACCGCTGCATATACTTAAGCTCTATCAGCTTTCTCT
+CCGTTTTCCCCAAGGAGCCAAGAATTATATCAACCTCATGGATCTTGTGCCTCAGCTCCC
+TAATCTCGGTTTCAAGCTCCACTCTCCTATCTACATAGCTGCCCGTCTGATCGCCTGTCT
+TTCCAACGGAACGTCCAGGGCTTAGGCTAATCTGAGCCGTATTACTAGGAAATTCGTTCT
+CAAGTTGTGCATTAAGTATCTGTAGACGAAGTTTGTCCTGCGTGTAGGTCGTAAACCGAC
+GGATTGTTTGTCGGTACCACAACGGCTTTACACGCTTTTTCTTTTCCTCAGTTGCGGCTT
+CAGTTGTCTCCAAGCCCCTTACCTCCTTATTCTCATTTAACTAACATCCTGTCCTTAGAG
+TTATTCACTTGACCCACAAGCAAAGCAATGCATACTAGCGCCAACCTTGACAGTCTTACC
+CCCACACTCTTTGCAGCCAGCACCTTCCCTGTGGTAATAACAATTTTTCATCTTCGGATT
+CTTAGCAAGGCTTTTTGCCCTGCACTCCTGGACATCATTTTCAGTCTTCCTATCCGGATT
+GCAGCAGAATTTATGTCCACACTTAAGCACCTTTCTTGCCTCCGATCCGCACCCACCGGC
+AATCGTCCGTATACACATATTTGCATTTATCCTTTTCCACACAATCTTTGCACTGACAAG
+CGCCAGCTTTACATTTGCGGCATTGACACATTCTTTTCCCTCCTTGCCAAATCCTGACCA
+GCTTCCCACTCTCGATAAATCGCGAACCAATCCTCAGCATCCATGCAGACTTTCCAACGT
+TCCCGGTCTCGTCTAAATGCCACAATGGGCATTTCACCCTCTTTGGCATCCCTTCGACTT
+TGAATCATGGCTTTTTCGATATTGAGGGCTTCGACTCTTTTACATTCGATGTGGATCCCC
+GGGAGGCCAACGACATCGTCTCCTTCGAGCCCACTAAATTGCTGGCCACGTCTGCAATCA
+TATCCTTGATCCCTACAGAGCCGAGCAAACTCGCGCTCACCGGCTGCACCCTTTTCTCGA
+CTGTTTGTCATTGCGCTCTTTTCAACTCCTGTTCGTGCTCAGCATCGTAGATCGTCATTT
+GATACTCGGCTTCTCTAACGGCCTCAGCAAACTTCTCAATCCCGTGTTCCCAAAGCCCGT
+GCCGGTGGATGACGTCGGAAAACTCTTCTACGTCATGTTCGCGAAGATACCAATTGTCCG
+GATCATCTTTCTTGGCCCATTCTTTTCTGATGATCTTACCGGTTGAAGGATTGATGACTT
+CCATGCCTGTTTTTCTTTGAATATGGCAGAGCTCATGGTCGAGCAGGGCTTTAAGCTTTT
+CTATTTGCCACGCCTCAAATGCTAGCTCAATAATAAAAATGTGGAACATCTTGCCTGTTA
+GGAATCGCTCAAAGCTTGTACACTTCTTGCATTTGCCTGTCCAGTCAACACCGCTGTCAT
+CCCGAACGTAATACTCTATAAGTTCCTTGGCATCCTTGAGATGTGGGTGATGATCATCAA
+TTAATGCCTCAGCTATTTCTCGAACTCGAGGTGATTTTTCGTAACCCATCTCTTTCCCTC
+CAATTCTTATTTTTACAGGTAAAATGCATCGTATTTCCCCGGCTTTGGCGGCTCAGGAGT
+CTTGTCCCCTGGGTCTCTATTGCGTTTGTAGTCTTTTTGGCGATTACGCTCAGCCTCTCG
+AGCATGAACCTGATCAACGGTCAAGATTCCAGATTCACGCCAGTCTTTGAGTACGCCCCT
+CAGATAGTGCATATTTCGTGCATTAGCATCAAGGCAACACTTAAGGGCTTCGATTACAAC
+CGCGTCCGGATCCGGACTTCCCCGAGTGAAAAACTCATCACAATAGGCCATAATCATGTC
+AGTCTCACCTTTGGGGATTAAACGCCCCCAGTTCTTTTCTGCCCAATTGACTGCCCGGGT
+ACCAATGGCCAAGGATACGATTTCGCTCAAATTGTTCACGTTTTTAGGGGTTTCAGACAC
+AGTTTCCTCGGGTTCGTTCACGCTCTGCCTAATTTCCTTACTTCCGTTGTTGTCGTCATT
+CTCGGCTTCGTTATGAGGGAAACAACAATCAACATTCAATATAGGGGATTCAACATTCAA
+TAAGAGGGATTCCGCCGGGCTCGTCATAACTTTTTCACGGCTAGTAAATACCTTTAAATT
+TTTAGGTTCGTCCTTGCCGTTTATTTTCACGGCTCGTTCATACCTATTTACGGCTTGGCC
+ATTTTCGGGCATATTTGGCAAATCAGACTCACCCTCTTTAGGGTGTGGTTTCTGATGTTT
+CGAAAAATTAACAATCTGAATGCATGAAATCCCATCAACTGTATAGCGAACTATAAACTC
+CGGATCTAATAGGTTAAGGAGTTCATCAACGTTGCAATCGTCATAGGGCAAAACTTCAGC
+TTTAATCCGCTTAGGCCGATCTTCGAGCTTACCCTTACGGTCAGCTAGTCCCCATAGTCC
+GATAAATAGGAGGCGGGCCAGAGGCGGCAGCTCCCCTAATTGGTCGTTTGCAAAAAAGCT
+TGGTTTAATGTTTCGTGCCCTGGCCACTCTTAATCTCCTCCTTAAACCTCAACCAAAAGC
+ATGCTCCCGCAATCCGGGCAATGCTCTTCTTTCCAGCAATCAGCAAGGCCAATTCTTAAA
+TGAATTTTCACCGGCCTGTAGGTCGTGTGGCGACAGTCCATGCAGATCTTGCGCTTACGG
+GCAAATAGGCCCCAAAGTAGATGTCTCATCAGTTTCATAAGCCTCCTCTAAAACGGACAC
+ATTTCCAACTCAATAACCTTCCCTGGCTCCGCGACCTCAACGTCCTTGCCCGTTAATTCC
+CGAATCCCTCGAACCATCCTAAATGCATCTGAATTGCCATCAGAAAGGTGAATCAAAACG
+ATTTTCCGAACCTTTGTTAGGTCATTTGCTTGCAAGAAATCCTTTACATTGTCTAGGCTA
+AAGTGGCTCTCGATCAGCCGGTTCTTTAATGATTCCGGGATCCGCCCGGCCTCAATATTT
+TCCTCAAGGATATCTCGGCAATAGTTGCACTCAACAAGAATGTAATTTAGGTCCCTGAAT
+CTGTTCCGGATGTAATAGGTGTCTGTGGCAAAAAGCAGCTTTTCACCGGTCGGCCAATAT
+TGTATGAGATATCCTAACGGTTCAGCACAATCATGTTCAGTTCGGAATGGCAGGACTGTA
+AAGTCCCTTGTTATAGGGAATTGCTCCCCTGCCCTTACTACTCCAAGACGATGACTTTCA
+ATTCCCAACTTATCGGCTGTCCCCTTACTTAAAAAGGTGTTTACTCCGAACTTAGTAAGC
+TCCTTGACTGACTTTGCGTGATCCATATGTTCATGAGTAATTAAAGCTCCGCGCACATTG
+AACAGATTAAAATTAAGTCCCTTTTGTATCTCTTTGAAGGGGACGCCTGCATCCAAGAGC
+AGGCTCCCCGTTGGTGTTTCTAAAATGTAACAGTTCCCTTTGCTTGATGAGCCGATTATT
+TTAAGTTTCATATTAGAAGTCCGGCCCTGTAGATTGGTGCTCTACCTTGTCATTTTGAGA
+CTCTGGAGCGGGAGGAACCTCAGGCCCCGCTGCTGGTTCGGCATCAATATCAACAACCTC
+TTGATTCGCCTCTTGGGCTATTTCGTTAGCAGCACGACTTTCTGCATCCTCATCTTTGTC
+AGAGGTCAAAGCTGTAGCCATTTCAGTGGACAAAAATCCATAGTGGGACAAGAGCTTTCG
+CATAGCTGTCTTGATGGCCATCTCATCAAAATTCGATTTCCAGGCCGATGAATCATAGCT
+GAAGCTTTTGCTGTAGCGTTTCGCATGCGCAAGTACTTCATCTGCTGTCATGTACACTGT
+TTTGGTAAAGCCATTAGTGAGCTGCATATAGGCAAAGTATCCCTGGGCCTTTGTGCTGGT
+CGGCTCACCAGTAAATTCAACTTCTCCCGTGAGAATGTTCTGCTTAATTTTTACGCCTTC
+TAATAAAACACCAGCATTCAAGAACTTATATTGGCCAGTCCTCATGGCGAGCTGGATGTA
+TCCTTTGTATCCAAGTTGGAACTGAGGGATGTAAACACCCTTTGATTTATAGGGAACAAC
+ATAAGCAAAGCCAAGCTGTTTGTTGATAGGAAGCTTAAGTGTTGCTGCCTTTAGGCACTC
+CATAATAACGGTCTGAGGATCGCATTTTTGCAAGTAGGTATCACTACCATATAGATCAAT
+GATTGAGGCCAGGAAAGCCCCGGAATTCTCATTGAGTGCGTTTTTAAACTGTTCCTTGAC
+GCTATCGACGTTTAAGACAGCCTTAAGTTTGTCCATTGGTTTAACTGTAATGTTGGCCAT
+GTTTATTTAACCTCCTTATTGCTTTTCAGATTTGCAATTTGTTCTGTTATTTGTGCCTTG
+ACAAGGTCCCATGCCTCCTTGTAGGCATCTTCTACAGAATTACCAAGGCACAATTTCAGC
+GGTGACTCCCGCCTCGGCAGTAAACGATTGATGGTTTCCTAGGTTTTTAACATACTTTGA
+AGAAACGCGAATCTCTTTACCGTTCATTCAGCAACCTCCACTCTAAGAACCTTATCCAGT
+TCACTCTTGAAGAGGTTGATAACTTGGCTCTCGGTTTCAATAATTCGGGACACCGACTCG
+CGGAAGTCGATAAAAATTGGGGCTGTAGAACCGTATTGGGATGCGAGTACGTTGATACAA
+TCCAGACCGGCATTAACCTTCCCTGCGTGGTTCACATCTGACCACGTTACCCCATCCACC
+ATAGCCTCGCACATTTCCTTTACGCCGCCATTAATTTGGTCATCAAAGAGCTTCCACTTG
+ACCATCTTGAACCGACTATTGAGGTTGCCTTCCAGTAAATTAACTTTGGCCTTGATAAAT
+CGCTCGAATAAGAATTTCTGCCTCTCAAGCTCACTCAGATGGGCTGCAAGGGTTCGCTCT
+TCGTCCTTGAGCTCTTCGATCCGTTCTTGAGTCTTAATCTGTACATCTCGGTTATTCAGA
+ATCTTATTGAGCGAATTAATCTGTTCTGCGACCTCATTCTTTTGCTTGAGGAGTTCGGCG
+GTCGTGTCTTCGACCGGCTTGTCCAGCTCGTCTTTAATTACTTGCTGCCGAGACAAAAGA
+CTTGTATATTCGGTATCGGCATGATAATTAACTGTGCCAGTAAGGCCCTCCATGTCTTTG
+AGTTCTTTATCAATCTCGGCCAAGCGTTCAGCTATTTCCTGAAGCTTTGCTTCTTTTTGC
+AAAAGCTCTTCGCCGAACTTCGCAGTATCTGCCTCAAGCTTTTCTTTTCGGGCCTTAAGG
+GTCTTCCCTTCTGTATTAATCTTAGTAAATTCATTTTGCTTAGTAGTATTAAAGGCCTCG
+CGCATCTCATAGATCTGTTGCCCAATGTCATCCTCTGGCAGCTCCCTCCTGCATGTAGGA
+CAAATAAAGTTGCTGGGGTCAGGCTCTTCAAAGCCTTTCGAGCTTACCTCATTCCATTTC
+GTCCGGAGGTCAGCCATATTTTTAGATACCCTTTCTATTTCACTTGAAGAACTTTCGATC
+AATTCCTTAAGGGAATAACTTGTGGTCTCAAGCCGGTACTTTTCATTCTCAAGCTGCATC
+TTCTCGTCAGTGAGCCGTTTAGATCCGGCCAAGGCTTCTGTGTCTAATTCTTTTTTTCTT
+GCCCAAATGGCCGTATCAAGCTTGAATAATTCCTGCTGCTTCTGGCGGTATTCATCCGCT
+GCCTGACTGGCATCTAACATGCTTTTCTCGATCTTCCTGAGGACTGCTTTATGTTCGAGC
+AACCTTTCTTCGACTGCTAAATAATTAACATCTTCACTTAGCAGCGTCCGTGAAAGTTCG
+TTTATCTTAATTGGTATTGACTCAATATCTTTGTTAAGCTTCTTAACACCTTCGGCAATA
+ATCTTCTTTTGAGAATCTATCGATTTTCCGTCTAAGATGTCCTGCAATGGTGCTAGGTCA
+TCACTTGAGTCAATTACATCCTGATCCGTGACGTTCCCGCAGATCTCCATAAGTGTTTTA
+CGCCGATCCTCCCACTTGAGCTGGGTGCAAAAGTAAAACGGATTCGTCAGGAGCTTGAAG
+ACATTTTCGTCGATGATAGCGTTGATTTGATCGGTATACTCCTTCTTTTTAACAGGTACA
+GTGTCAATCCAATAAGAGGTTTGATGCCCTGTAAATTCCTTCGTGGATTCACCGCGTTTT
+TTTGTCCAAACCTCTTCGAGCATCTTCCTGAGAATTTTAGGCTTGCCGTTAATGAATAGA
+TGCAGCACAACTTCTGTCTCAAGATAATTAATATCGTTACCGTTCTTATCTTGGGGCTTT
+ACTGAGAAGTCAGCACGGTTAGCAGAATCCTTATTAAATAGCGCCCACAAAAAGGCATCA
+TACAAAGTCGTCTTTCCTGCCCCGTTCTCACCAAAAACAGTGGCATTTTGCCCGTTTATA
+TCGAGGGTAAACTCTTTTATACCCTTGAAGTTCCGGAGCTCCATCTTAGAGAGCGTTATC
+TTGTTCATTTCATTCCACTTCCCAACGATTCAAATTCTTGAAGTTCTGTGCTACAATCAA
+AGTGGTTAACTTCTTTTTGAGCTTCCGCGCCAACGGGAGCTTTTTTCATGCAAAGATTTA
+TGAGTGTTTCACCGTTATAGTCAATAAAATGGAATTCACTCGGTTCTCCACCAACAATCT
+CAACGCCGACATTGCCTCGGTATTCCATGCCTGGGAACATATCCTCTAGGACTCCATTAA
+GATCCTCCTGGTCGGCATCTAACGTTGAGATGATCGTAACTCGCATAAGTCCATTCCCGT
+GGAAATCTATACTTGCCTGGGACACTAAATGGTTATGGTTTTTGGCCAGGCCCTGAATAT
+CTAAAAGTTGACCTGCTGTGAGTTGTTTCATTTCATCCCTCCACCTTTAATTTTCAATCC
+AAACTTCCAATTCCCATATTCCGAACTCTATAGCATCACTCCGTTTCTCCATGTAAAGGT
+CTAGCCTATTCCCTCGTATTGCGCCGCCCCGATCCGTGACCGTGTAGGTATGTTCAAGCT
+TTGGGATATAGATCTTGGTTCCGAAGGGTAAGCTCGGATCGGCAGCTATCGTCCAACCCT
+CTTTGACCGGTTCACCGCTGGCTGTGATTCCTTTGCCGTCCCTTCCTCTGTCATTGGCCG
+TGTAGGCCGTGACGATCATAATTCGTCGTTCATGTTTTGTAGTTGTTCCTCGGCTAATTG
+GCTTTACGGAGACCAATACCGGCGGAGACTGTTTGATTGATTGCGGCAGCTCTGGACAAA
+TAGCGTTCGATGGTGTTAAACATAAGATCGCTGCCATTAATGCGATAACAAAAATCCTTC
+GAACTTTTGATCACTCCTTTTCTAAAGAGTTTTTCGACGTAGGCGCATACTATTGCAAAT
+TGGCATTTTGTCTTATCACGCTGCCCTGTGCATCCCCCGCATGTTTCTAGATGTTTGAAA
+AAGCGTTCACAGGTCATTATTGAGCCTTCTTCCCTTTGTATTGTCCCTCCATCGCATATA
+CTTTTGATAGTGATTTAACTTTCGCTTGGGCTGCTCAGTGATAATTGGGGTAAATGTAAT
+TGTGAATAGTCCTGTTGCCCAGTATCCTTCTGGCCCACGCTCCCACCTCATCCCACATCC
+ATCAATTGGACACCTAGCTCCTGTTTTACCTACCGGAAACATCATGGCTTGTCCACACTT
+ACAGAGTGGAGTTAACCCAATTGCTTCACTCAAAGTACCTCCCTCCTTTATGCAACATCG
+ACTTCTTCCTTCGCCTCTTCCTCGGAATCAAAACTTCCAGCAAACTTTCCGTCTATCCAG
+AGCTCTACATATCCCCGCTTCTGGATGATCGTATACGACATGGCATCACCTCCTTAATAA
+ATTGTTTTCCCTACTTTCCCCGGATGACCTATTCAAATAGATGGCATTATGAATTAATCA
+CATATTGCCCTTATTTTCCCCTCTCTCGGCATCCTCTTTAAGCAGTTGTTTAAGAACCAA
+TCCGGCTAACAAATTGATTCCTCTTTCTGGGTTAGGGTGTGGGATATAACTGACCGTAAG
+ATTAACTGTGATTACCTGGGGCTTACGTGGCATTCTCCCTTCCTCCTCTCGTGGAATTCA
+TTTTCGTCGGATTCGTAACGCTTCGCTTTGTTGCTATTTTCCTCAAAAAAAAGAGTCCAT
+TTAAAGTTCAACACTTCTCCAATTCTTTGAGCAACTTTTACGCTAGGCGTTCTTTCACCG
+TTCTCAATCATGCTATAATATTGCCTTTTTACTCCAACCATTTTTGCGACCTCTTCATGC
+GTCATATCAGCATTTATGCGTATGTTCGCTAGCCAGAATCGAGTCATCATCACCACATCC
+GTCTGTAAATTCCTAGCAACACTAAGTTGCTGTGCCTTCATTATATAGCAACATAACGTT
+GCTGTAAATATTTATGGCAACAATTTGTTGCTAAGTCTTTACGCAACATAAAGTTGCCAT
+TATAATGAATTAAAAGCAATAATATTACAGGAGGCCTAGAAGATGTTTCCTGACAGACTT
+TGTACGCTAAGAACTTCAAAGGGTTTAACACATCAAGATATGGCTGATATGTTAGGAATT
+ACGCGGCAAGCGTATAGTAACTACGAGGCAGGGAAAAGAGAACCAGATCACAGCACTTTA
+AGAAAACTGGCTGAGTTTTTCATAGTCTCAACGGATTATTTACTTGGGCAAGACAATGGT
+AAGATCGTTCCCTCATGGGCAACAGCTAAAGATAAACGAGATTTTAAGAAAATGCTCGAA
+GATGATGATGATTTAATGTTTGATGGAGTTCCTATTGAGGGTGAGGATCGACAACGGATT
+AAAGATGTTCTTACCGGCCTTTTCTGGGAAGCTAAACAAATGAACAAACGAAAAAAGAAA
+TCTGACAGCACGAACGACACCAAGAAATAA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_019936.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,550 @@
+>NC_019936.1|provirus_2347508_2361929
+TCAGACTTCCAGCTCTAACGTCAGATCGCCCGACGCGCTGACCTTCGCGCATGGCGTCGC
+CTTCTCCAGGATGAAATGCGCCAATTCGCTGTCTTTGATTGGCATGCGTCCCTGCCTGAC
+CAATAACTTATTGATTTCTATGCACTTTTGTCTAAGCGCTTCTTGCTCTGTATTCGACAG
+ACGCAGGGTGGCAGGCATCGTCAGTTGACCCATATCAAATTCACCTCGTGAAGTGTACGT
+GCATGCATGTGATTTGTATTGACGCATGCAAGTTCACCGGTATACATTCCGCCGCAATGT
+GATTTGCATGCATGCATGCATAGGCGAATGGACTTCACAAATGCTCGACAAAATCCACCT
+CTTCGTACCGTTTCGGGTCGATGCCATCGCTACCAGCACCGGTAAGCGCGGCAACGAGCT
+GTTGGTGGTCGATCTGGAAGCCCTGGGCGTTCCGCTCCGTGCTACCAGCGTCCTTTCGGA
+CGGGAAGGGTGGTTATCAGGTCGAGGACATAAGCCACGCTTGGGAATCTCTCTCCACTGG
+CTTTACGCCGTTGGCGTTCAAGGTCTTTCACCAGTCGCTCGGCAAGCGCATTCAGCCCGG
+CGTCGAGCTGAAAGCCAGCCCTGCGAAGCTGCTCCAGGGGCACAACGTCTTCGGGCCTAC
+CTCGATCCGCAAGGGCGGGGAGGTCATGTTGAAGTGGCTTGCCGGCTCATATCCGAAGCT
+GTGGGCCTTGCTGGACTGGCAGGCTGCTGAGGTTTACGGGATCGACTGCACCTATTCCGC
+TCGCCTGCCCGATCAGCGCACCGCGCTACAGCTCGTCCAGGCACTTCGCGGCGTTAGCAA
+CGGCCAGACTCGCAACCGTGGTGACGACTACGAAACCACGGCTTATTGGGGCTCCAAGGA
+AACCCGCCTGCGCAAGCTCAAGGCGTACCTCAAGGGCCCTGAGTTTCGCCGCCAGCTCGA
+TGATGCCATCAAGGCCGCCAGAGCCTATGGCGGTGCCAATTTCGTTCCCTCCCAAGCGTT
+CGCAGCCCACCGGCTGCTCTCGGTTCTCCAGAATCCCGCGCTCCAGGAGTGGGCCGAAAA
+CCTCCTTCGTCTCGAAGCCACTGTCATGCACCGCTGGCTCGAACGCAGAAACATCCCGAC
+GAATCTATGGGCCCTTTGCGACTACCAGGAACGGCTGGAAGAGCAGGGGAGTTGTTTTAT
+TCAGTGGTGTTGGGAACAAGTAACTAAAGAACTGTTTGCGGCCTTTGAAGGTATCTCCAT
+GCGAGTAATTAATGACGAAAAAGTGCTGGCCGCACTTAAAGCCCGTTGGACGAAGTTCGG
+AAAGAACGGGAAAGCCAATGAGACAGTTGCTCTCAACCTGTTTCGCACATATCGCAGTAT
+CAAGGATTACGGTTGGCAGGAAACCATGGACTCTATGTCTCGTGCGACTTTCTACCGCCA
+CGTTGATCAGATTTGCGAATGCGGACTTTCAAAAGCTGCACTTCAGAAGTTGAAGATGGA
+CGATCAGAAGAACAACGTTGTTCCGATCCTGCGCTTCCTGCAAGTTGACTTCAGCGCTCA
+GCGTCCTGGTTGGTACGTTGAGCCGTCCGTGGAGGCTGCATGATGCGTTCTTGGGCCTAT
+CTCCGCGGCTTTCGTGATTACCGGCCACGCCGCATTTATTGCAATCCGTACCTGCTTTGC
+AGTTACGACTACAACGAATATGAGCGTGGTTGGTTTCAGGCTCATAAGCGCACCGGGCTT
+TTTTCATGATCGCCGCGACTATCAACGCCCTGGTCGTCACTATGTGCGGACTGTTGGTAA
+TTCACTTTCTCGGGCGCTGGGCCCGTTCATAACCGAGGTAATCACCATGCTTGTACAACT
+GGGCCTGTGCAAAGGCGTCACTTCCAAAGAAAAGCAAAACGGCATCATCGAACATTACTT
+GGTCCTTACCGCTCCAGGTAAAGACCAATTCGGTCAAGAAACCGAACAGTCGGTCGGCCT
+GAAAGTCTCCAAGCGTCAACTCGATTCAGGCATCGAGAATGCCTATAAGAAATACATCGG
+CCAGCAAGTTGCTGTTCCGGTATACGCCAAAGCCTGGAAGTCCAAAACTGGCACCGCTTT
+CGGCATGGACCTGTGGCTCTCCGATGACGGCCTGCCTGTTCCAGTTCAGCGCGTACAACC
+GCGTCCTGCTGCTGTATCTGGCGGCAACTGATGACAACCGGCGCTCTCATCTGTGAAGGC
+CAAGTAACCATCGCAAATGATGGCGCTCCCCTGTGTTCTGGTATGTGGCAATTAATGGCA
+CTACCACAACCTTTCGACCCATCCCAGTTACAACCTGCCGAACTGGGCGCATTGTTTGGG
+TACGGCTTCGGCTTAGTTGCTGGCTGCTGCATCCTGGGCATTGTGGGTCGATTGTTTCTT
+AACGCTATATACAACCCAAGCAAGGAGTAACACCATGGAAGCAATGATCACTGCAATTAC
+CGGTGCTGTTGACTGGGCTGCTGTTATCACTGGCGCTGGCACCATCTTTGGTGCGCTCGC
+CCTGGTCTATGTCGCCTTCAAAGGTGGCCAGATGCTCGTCAACGTCCTGCGCCGCGGTTA
+ATCCAGCGTGCGTTGAACTGGGGGCCTCGGCCCCCTTTTCTTTTTCGGCGGGGGATATTC
+AATGGCCGATTTATATCAGTGGACGTTCTTTGTTCTCGGTTGCGTTTGTGGTTACGCCAT
+CTTCGGGAGGCTCTAATGTTCCGCCTTCTATTAGCTTTTTCTCTCTTGGTCATATCCATC
+ACTGCAAAGGCTGAATCCTACTATTGGATCATTTCCTTTCCTGCTGACAATGCTAGGTAC
+GTCACTGCTGTTGCGGCTTGTAATGCAAACCATACCTATTACCAGCAACTTAACCCCGGT
+TACGACAGATATGATCAAAGGGTTGTAGTTGGTGAAACTTCATTTTATTGCGAAACCACT
+GGTTTGCGGCGTAATGCTCAGGGTGTATACGAGCCGTATGGTAGATGGGGAAACACTGCT
+AACCGTCGTGGAGATTCTTGCCAGCCGGGTGAAAACTACGACCCTAATGTTGGTGGTTGT
+GAGGTTCCCCCAGGTGAAATGGGCGAAGCGTGTGAAGGTCCTGATCCTGGCTTAACTAAG
+TTCGGCTATGTCTACAACTCCCAAGGCCAGTGTGTTGACTACACCCGAGCCGATACAGCA
+TCACAATGCAAACTACTCGCTGGAACGTCAGCACCAACTAAGATTGCGGTTGTATTTAAC
+GATGATGGATCGCCTCAGATCCCGCCGCCAATGAATGTCGGTGGCTGCGCGGGCATCGTT
+GCCTCTGTGGAGCATTGCGAAATGGCACCAGTTCGCTGTGGTGGTGCGTCTGGTAATTCC
+TGCATGCAGTCTAGTGTCAATACCTGCAAAGTCCTTGTTTCGTTCTCTGGCGCTGTCTCT
+GGTGACGGTAAGCCGCTTGTCATTAAGGGGCATGAAGGCTCCGAAGAGGGCGTTTGCCAG
+CCGGGAGATGCGTGTGATCCTGCACCTACGCCAATTCAAAATGAGGAAAAACCCTGTGTT
+TATGTCGAGGACGGGGAAGGTAGGCGTGTTTGTGATTCCAATAAATGGACGGGGCAACCC
+GGTGAAAAAAGCTGCGGTACTGTCAATGGTCAGCTTACTTGTATAGGCAAATCGCCGACA
+TCGAACGGCATCAGCATTGGTACTGTCGTTGAGGAAAAAGCCAACGTCGACGGCACCAAG
+ACAGTTACTAAGACCGACGTTCATAACGAAACCAAGTGCATTGGTGCGGGTAGTTGCAAG
+ACCGAAACCACGACCAACAAAACCGTCATCGTTAAAGACTCTGCGGGTAACACTATCGGG
+CAGTCTGGAAGCTGCACCGGTCCTAAGTGTGCAACTGATGGCAAGGGCGACAAGAATGGT
+GATGGTCTTGATGATTGTAAGTCGGGCGAGGATTGCACCGATGAAGAGGAGTTCGAAGGC
+CCAACTAACGGCGACGCTGGAAGTTTTGGCGATAGCCTTGGCAACTTCACCTCACGTGTT
+AAAGGCGCTCCGATCATTGCGTCCGCATCAAGTTTGACGTTCGCGTCTGGCGGCTCGTGC
+TCGATGCCTTCTTTCTCTGTGCCAGTTCTCGGCACGCTTTCGTTTCAGCCTATGTGCCAA
+TGGGCAGCTGATTGGTTCGCACCAATTAAAATGATCATGCTCGCGCTTTGGGCGCTTGTT
+GCTGTTCGCACCTTCTTGGAGGCCTAATTATGCTTGCCGACTTCGCGCAGTGGCTCAAAG
+ACTTCTTCCTTTGGTTGCCGCTCAAGATATGGGAAATGATGCTCGATGCTCTCGCGAGCG
+TCATTGAGGCTCTTCCTGTCCCCGACTTCATGTCGAACGCTCAAGGTTATATGTCCAGCG
+TCGGAGGTAATGTTCTTTGGGTGCTTGATCTGTTTGCCGTTCCCCAGGGCATGGGCATGG
+TTATGGCGGCTTTAGTGCTCCGCTTCATTGTTCGCCGCATTCCGATCATTGGGTGATATA
+TGGCTATCGACGCTTATGTTGGCCTTCCTGGTAGTGGCAAAACTTATTCGGTCGTTAAGT
+TTGCGATCCTGCCCAGCCTCAAACAGGGCCGTTTAGTTATCACGAACATCCCCCTCACTG
+ATCTTGCCCATCAGGATTACCCCGACCAGATACGCCAGCTCCCGCATAACTGGTATCAGG
+ATGAGAAACTGTTTGAGACTGTCCCTAATGGCGCTGTTGTTGTCCTCGACGAACTTTGGC
+GTCGATGGCCGAAGGGCATGCCCGCTGCCAAGGTTCCGTTTCGCGATAAAGAGTTTCTCG
+CCGAGCATCGGCACTTGGTAGACGAGGAGGGCAACAGCACCCGAATCGTCCTCGTTACTC
+AAGACCTGGACCAGATTGCCGCTTTTGCCACCATGCTTGTCGATACCACTTATCAGAGCG
+TCAAGCTGTCCGCCCTCGGAGCTAACAAGAAGTTTCGTGTTGATATCTACCAGGGCGCAG
+CAAAGGGTCAGAGGCCTCCTAAATCTCGGCTTCTTCGCTCGACTTATGACCGCTACGAAA
+AGTCGATTCACCAGTACTACCAGAGTGCTACCAAGAGCCTTACGGGCGTTGTTGGTGACG
+AATCCAGGGCGGACAAGCGTGCAACCATCTGGCGATCGCCGCTCATGATCTTCACCTTGA
+TATCTCCGTTTCTGATTGGCTTCCTGGTCTGGCAGATCGTGCAGTTTTTCGGCAACGGCA
+TGAGCTTCTCGAAGCGGGAACCAGAACCCGACCCAGTTGAGGCTCTAGCCGATATGCCCC
+TGGTCAACCCTATGCCTGCCGATCTGGCTCCTGCTGTTATCCAACAGCCGCAACAGACTC
+AACCGGCGCAGCGTGGTTATTCTGCCGTCTGGCGTGTCTCTGGCCACATCAAGCGCAAAG
+ACCCTGACACGAACAAGATGCGTGACGTGGTCATGCTTTCGTCACTCAGTGGCATTCGAT
+ATGAGCCTATGGAGAACTGCGAGCCCATCAGCATGGGTTTCGAATTCCAATGCGAGGTTG
+ACGGTGATTTGGTCACGCCCTGGTCTGGTCCGATCAACCAGAACATGACGGGCTATGTTC
+TTGGAGGGGCAACCCAATCCGTTGACGCTGGCAAGCAAGCGGTAGGACTTGGCGGCGAGC
+GTAGCGCTGCCGTCGAAGGACGCACCGCGCAGCCATCCGTTAATCCGATCTGATGCATAC
+GACTCTTCATCGCACACGTTCTGATTGGGCGCTTCGCATAATGGATGGCCTTATGTTGAG
+CGGTGTCCGGACAATGCCTCTGGCTCCGGGCGCCGGTTAACATAGGGCCGATTATGCGCT
+GCGCTATCGATCTCGAATCCCGCCTCATCAAAACCGCCGAGCTGTATGCGCCGGGCCGCA
+AGGGTTCCGACGCCGTGACTTGGATTCTCGACGACTACCCACGACTTGTTGCCGAGATCC
+GTGATCTGAGAAAGCGAGTCGCCCAGCTCGATGACGAAGGTGCCCAGCTCGATGCAGTCC
+TTCAGGAGCTGCGTCAGATCGCTGAGCGAATCAATCATCTCTGACCTGTCCCCCTGGCCT
+CGACCTCGCCGCTCGCGGCGATTAGTCGCCTGCACTGCTTCCTGTCGTGCTGCATAGCGC
+CTGCGACGATACCCCCGAAGGGGCCGCAACCATCGACCCACAAAAAAGCCCCCAGCGGCC
+TGTATGGCCCTCTGGAGGCTTCTCGCGATCTTCGTCCCACCGTCCCCCCACCAGCTCAAC
+CCGCGCCCCGATCTGCCCAAATGGAACAGCTCCAGGGCTTCTCTCTGCCGCTCTCCCAGG
+ATCATCAGCACCGCTGACGGTTAGGTCACGAAGTTGCAGTGGTTCCGCCGCGCTTTGGCT
+TCACCGGCGCAGCCGGGTCCACCATCTCTAATGGTGGACTCTTGTCTCATGGTGAGACTT
+TTGGGGTGGTTTTCAGACTTCCAGCTCTAACGTCAGATCGCCCGACGCGCTGACCTTCGC
+GCATGGCGTCGCCTTCTCCAGGATGAAATGCGCCAATTCGCTGTCTTTGATTGGCATGCG
+TCCCTGCCTGACCAATAACTTATTGATTTCTATGCACTTTTGTCTAAGCGCTTCTTGCTC
+TGTATTCGACAGACGCAGGGTGGCAGGCATCGTCAGTTGACCCATATCAAATTCACCTCG
+TGAAGTGTACGTGCATGCATGTGATTTGTATTGACGCATGCAAGTTCACCGGTATACATT
+CCGCCGCAATGTGATTTGCATGCATGCATGCATAGGCGAATGGACTTCACAAATGCTCGA
+CAAAATCCACCTCTTCGTACCGTTTCGGGTCGATGCCATCGCTACCAGCACCGGTAAGCG
+CGGCAACGAGCTGTTGGTGGTCGATCTGGAAGCCCTGGGCGTTCCGCTCCGTGCTACCAG
+CGTCCTTTCGGACGGGAAGGGTGGTTATCAGGTCGAGGACATAAGCCACGCTTGGGAATC
+TCTCTCCACTGGCTTTACGCCGTTGGCGTTCAAGGTCTTTCACCAGTCGCTCGGCAAGCG
+CATTCAGCCCGGCGTCGAGCTGAAAGCCAGCCCTGCGAAGCTGCTCCAGGGGCACAACGT
+CTTCGGGCCTACCTCGATCCGCAAGGGCGGGGAGGTCATGTTGAAGTGGCTTGCCGGCTC
+ATATCCGAAGCTGTGGGCCTTGCTGGACTGGCAGGCTGCTGAGGTTTACGGGATCGACTG
+CACCTATTCCGCTCGCCTGCCCGATCAGCGCACCGCGCTACAGCTCGTCCAGGCACTTCG
+CGGCGTTAGCAACGGCCAGACTCGCAACCGTGGTGACGACTACGAAACCACGGCTTATTG
+GGGCTCCAAGGAAACCCGCCTGCGCAAGCTCAAGGCGTACCTCAAGGGCCCTGAGTTTCG
+CCGCCAGCTCGATGATGCCATCAAGGCCGCCAGAGCCTATGGCGGTGCCAATTTCGTTCC
+CTCCCAAGCGTTCGCAGCCCACCGGCTGCTCTCGGTTCTCCAGAATCCCGCGCTCCAGGA
+GTGGGCCGAAAACCTCCTTCGTCTCGAAGCCACTGTCATGCACCGCTGGCTCGAACGCAG
+AAACATCCCGACGAATCTATGGGCCCTTTGCGACTACCAGGAACGGCTGGAAGAGCAGGG
+GAGTTGTTTTATTCAGTGGTGTTGGGAACAAGTAACTAAAGAACTGTTTGCGGCCTTTGA
+AGGTATCTCCATGCGAGTAATTAATGACGAAAAAGTGCTGGCCGCACTTAAAGCCCGTTG
+GACGAAGTTCGGAAAGAACGGGAAAGCCAATGAGACAGTTGCTCTCAACCTGTTTCGCAC
+ATATCGCAGTATCAAGGATTACGGTTGGCAGGAAACCATGGACTCTATGTCTCGTGCGAC
+TTTCTACCGCCACGTTGATCAGATTTGCGAATGCGGACTTTCAAAAGCTGCACTTCAGAA
+GTTGAAGATGGACGATCAGAAGAACAACGTTGTTCCGATCCTGCGCTTCCTGCAAGTTGA
+CTTCAGCGCTCAGCGTCCTGGTTGGTACGTTGAGCCGTCCGTGGAGGCTGCATGATGCGT
+TCTTGGGCCTATCTCCGCGGCTTTCGTGATTACCGGCCACGCCGCATTTATTGCAATCCG
+TACCTGCTTTGCAGTTACGACTACAACGAATATGAGCGTGGTTGGTTTCAGGCTCATAAG
+CGCACCGGGCTTTTTTCATGATCGCCGCGACTATCAACGCCCTGGTCGTCACTATGTGCG
+GACTGTTGGTAATTCACTTTCTCGGGCGCTGGGCCCGTTCATAACCGAGGTAATCACCAT
+GCTTGTACAACTGGGCCTGTGCAAAGGCGTCACTTCCAAAGAAAAGCAAAACGGCATCAT
+CGAACATTACTTGGTCCTTACCGCTCCAGGTAAAGACCAATTCGGTCAAGAAACCGAACA
+GTCGGTCGGCCTGAAAGTCTCCAAGCGTCAACTCGATTCAGGCATCGAGAATGCCTATAA
+GAAATACATCGGCCAGCAAGTTGCTGTTCCGGTATACGCCAAAGCCTGGAAGTCCAAAAC
+TGGCACCGCTTTCGGCATGGACCTGTGGCTCTCCGATGACGGCCTGCCTGTTCCAGTTCA
+GCGCGTACAACCGCGTCCTGCTGCTGTATCTGGCGGCAACTGATGACAACCGGCGCTCTC
+ATCTGTGAAGGCCAAGTAACCATCGCAAATGATGGCGCTCCCCTGTGTTCTGGTATGTGG
+CAATTAATGGCACTACCACAACCTTTCGACCCATCCCAGTTACAACCTGCCGAACTGGGC
+GCATTGTTTGGGTACGGCTTCGGCTTAGTTGCTGGCTGCTGCATCCTGGGCATTGTGGGT
+CGATTGTTTCTTAACGCTATATACAACCCAAGCAAGGAGTAACACCATGGAAGCAATGAT
+CACTGCAATTACCGGTGCTGTTGACTGGGCTGCTGTTATCACTGGCGCTGGCACCATCTT
+TGGTGCGCTCGCCCTGGTCTATGTCGCCTTCAAAGGTGGCCAGATGCTCGTCAACGTCCT
+GCGCCGCGGTTAATCCAGCGTGCGTTGAACTGGGGGCCTCGGCCCCCTTTTCTTTTTCGG
+CGGGGGATATTCAATGGCCGATTTATATCAGTGGACGTTCTTTGTTCTCGGTTGCGTTTG
+TGGTTACGCCATCTTCGGGAGGCTCTAATGTTCCGCCTTCTATTAGCTTTTTCTCTCTTG
+GTCATATCCATCACTGCAAAGGCTGAATCCTACTATTGGATCATTTCCTTTCCTGCTGAC
+AATGCTAGGTACGTCACTGCTGTTGCGGCTTGTAATGCAAACCATACCTATTACCAGCAA
+CTTAACCCCGGTTACGACAGATATGATCAAAGGGTTGTAGTTGGTGAAACTTCATTTTAT
+TGCGAAACCACTGGTTTGCGGCGTAATGCTCAGGGTGTATACGAGCCGTATGGTAGATGG
+GGAAACACTGCTAACCGTCGTGGAGATTCTTGCCAGCCGGGTGAAAACTACGACCCTAAT
+GTTGGTGGTTGTGAGGTTCCCCCAGGTGAAATGGGCGAAGCGTGTGAAGGTCCTGATCCT
+GGCTTAACTAAGTTCGGCTATGTCTACAACTCCCAAGGCCAGTGTGTTGACTACACCCGA
+GCCGATACAGCATCACAATGCAAACTACTCGCTGGAACGTCAGCACCAACTAAGATTGCG
+GTTGTATTTAACGATGATGGATCGCCTCAGATCCCGCCGCCAATGAATGTCGGTGGCTGC
+GCGGGCATCGTTGCCTCTGTGGAGCATTGCGAAATGGCACCAGTTCGCTGTGGTGGTGCG
+TCTGGTAATTCCTGCATGCAGTCTAGTGTCAATACCTGCAAAGTCCTTGTTTCGTTCTCT
+GGCGCTGTCTCTGGTGACGGTAAGCCGCTTGTCATTAAGGGGCATGAAGGCTCCGAAGAG
+GGCGTTTGCCAGCCGGGAGATGCGTGTGATCCTGCACCTACGCCAATTCAAAATGAGGAA
+AAACCCTGTGTTTATGTCGAGGACGGGGAAGGTAGGCGTGTTTGTGATTCCAATAAATGG
+ACGGGGCAACCCGGTGAAAAAAGCTGCGGTACTGTCAATGGTCAGCTTACTTGTATAGGC
+AAATCGCCGACATCGAACGGCATCAGCATTGGTACTGTCGTTGAGGAAAAAGCCAACGTC
+GACGGCACCAAGACAGTTACTAAGACCGACGTTCATAACGAAACCAAGTGCATTGGTGCG
+GGTAGTTGCAAGACCGAAACCACGACCAACAAAACCGTCATCGTTAAAGACTCTGCGGGT
+AACACTATCGGGCAGTCTGGAAGCTGCACCGGTCCTAAGTGTGCAACTGATGGCAAGGGC
+GACAAGAATGGTGATGGTCTTGATGATTGTAAGTCGGGCGAGGATTGCACCGATGAAGAG
+GAGTTCGAAGGCCCAACTAACGGCGACGCTGGAAGTTTTGGCGATAGCCTTGGCAACTTC
+ACCTCACGTGTTAAAGGCGCTCCGATCATTGCGTCCGCATCAAGTTTGACGTTCGCGTCT
+GGCGGCTCGTGCTCGATGCCTTCTTTCTCTGTGCCAGTTCTCGGCACGCTTTCGTTTCAG
+CCTATGTGCCAATGGGCAGCTGATTGGTTCGCACCAATTAAAATGATCATGCTCGCGCTT
+TGGGCGCTTGTTGCTGTTCGCACCTTCTTGGAGGCCTAATTATGCTTGCCGACTTCGCGC
+AGTGGCTCAAAGACTTCTTCCTTTGGTTGCCGCTCAAGATATGGGAAATGATGCTCGATG
+CTCTCGCGAGCGTCATTGAGGCTCTTCCTGTCCCCGACTTCATGTCGAACGCTCAAGGTT
+ATATGTCCAGCGTCGGAGGTAATGTTCTTTGGGTGCTTGATCTGTTTGCCGTTCCCCAGG
+GCATGGGCATGGTTATGGCGGCTTTAGTGCTCCGCTTCATTGTTCGCCGCATTCCGATCA
+TTGGGTGATATATGGCTATCGACGCTTATGTTGGCCTTCCTGGTAGTGGCAAAACTTATT
+CGGTCGTTAAGTTTGCGATCCTGCCCAGCCTCAAACAGGGCCGTTTAGTTATCACGAACA
+TCCCCCTCACTGATCTTGCCCATCAGGATTACCCCGACCAGATACGCCAGCTCCCGCATA
+ACTGGTATCAGGATGAGAAACTGTTTGAGACTGTCCCTAATGGCGCTGTTGTTGTCCTCG
+ACGAACTTTGGCGTCGATGGCCGAAGGGCATGCCCGCTGCCAAGGTTCCGTTTCGCGATA
+AAGAGTTTCTCGCCGAGCATCGGCACTTGGTAGACGAGGAGGGCAACAGCACCCGAATCG
+TCCTCGTTACTCAAGACCTGGACCAGATTGCCGCTTTTGCCACCATGCTTGTCGATACCA
+CTTATCAGAGCGTCAAGCTGTCCGCCCTCGGAGCTAACAAGAAGTTTCGTGTTGATATCT
+ACCAGGGCGCAGCAAAGGGTCAGAGGCCTCCTAAATCTCGGCTTCTTCGCTCGACTTATG
+ACCGCTACGAAAAGTCGATTCACCAGTACTACCAGAGTGCTACCAAGAGCCTTACGGGCG
+TTGTTGGTGACGAATCCAGGGCGGACAAGCGTGCAACCATCTGGCGATCGCCGCTCATGA
+TCTTCACCTTGATATCTCCGTTTCTGATTGGCTTCCTGGTCTGGCAGATCGTGCAGTTTT
+TCGGCAACGGCATGAGCTTCTCGAAGCGGGAACCAGAACCCGACCCAGTTGAGGCTCTAG
+CCGATATGCCCCTGGTCAACCCTATGCCTGCCGATCTGGCTCCTGCTGTTATCCAACAGC
+CGCAACAGACTCAACCGGCGCAGCGTGGTTATTCTGCCGTCTGGCGTGTCTCTGGCCACA
+TCAAGCGCAAAGACCCTGACACGAACAAGATGCGTGACGTGGTCATGCTTTCGTCACTCA
+GTGGCATTCGATATGAGCCTATGGAGAACTGCGAGCCCATCAGCATGGGTTTCGAATTCC
+AATGCGAGGTTGACGGTGATTTGGTCACGCCCTGGTCTGGTCCGATCAACCAGAACATGA
+CGGGCTATGTTCTTGGAGGGGCAACCCAATCCGTTGACGCTGGCAAGCAAGCGGTAGGAC
+TTGGCGGCGAGCGTAGCGCTGCCGTCGAAGGACGCACCGCGCAGCCATCCGTTAATCCGA
+TCTGATGCATACGACTCTTCATCGCACACGTTCTGATTGGGCGCTTCGCATAATGGATGG
+CCTTATGTTGAGCGGTGTCCGGACAATGCCTCTGGCTCCGGGCGCCGGTTAACATAGGGC
+CGATTATGCGCTGCGCTATCGATCTCGAATCCCGCCTCATCAAAACCGCCGAGCTGTATG
+CGCCGGGCCGCAAGGGTTCCGACGCCGTGACTTGGATTCTCGACGACTACCCACGACTTG
+TTGCCGAGATCCGTGATCTGAGAAAGCGAGTCGCCCAGCTCGATGACGAAGGTGCCCAGC
+TCGATGCAGTCCTTCAGGAGCTGCGTCAGATCGCTGAGCGAATCAATCATCTCTGACCTG
+TCCCCCTGGCCTCGACCTCGCCGCTCGCGGCGATTAGTCGCCTGCACTGCTTCCTGTCGT
+GCTGCATAGCGCCTGCGACGATACCCCCGAAGGGGCCGCAACCATCGACCCACAAAAAAG
+CCCCCAGCGGCCTGTATGGCCCTCTGGAGGCTTCTCGCGATCTTCGTCCCACCGTCCCCC
+CACCAGCTCAACCCGCGCCCCGATCTGCCCAAATGGAACAGCTCCAGGGCTTCTCTCTGC
+CGCTCTCCCAGGATCATCAGCACCGCTGACGGTTAGGTCACGAAGTTGCAGTGGTTCCGC
+CGCGCTTTGGCTTCACCGGCGCAGCCGGGTCCACCATCTCTAATGGTGGACTCTTGTCTC
+ATGGCGAGACTTTCCTTTGTGGCTTTTCTCGCTTCAAACCCTTGCGCAGCAAGGGCTTGA
+AGGTTTTTTCCTTTAAATCCTCGCGCAATCCATTGTGTACGTACAAATGTTTATGTAAAT
+TTGCGCCTAACTCAGCTTGGTGATGCGTATGACTGCCGATGACCGTGGCAACTCTTTCCT
+TCGTGATCTTCGCGCTCAGCTTGGTCGTGATCCAGAAACCGGCCTTACTGCCGATGAATC
+TACGCGCGAGCGGGTAAATCAGATTCTTGCGAACTTGGCCGACAACGAAGACGCTCGCGT
+GAATTTCCGCATCAATTCTGCCGTGAAAGAAGAGTTTGAGCGTCTTTGCCAGCAGCGAAG
+CTCAACCCTTAGCCGCGAGCTTCGACGCTTCATGATTCAAGCGATCAGCCGTCAGCGCTT
+CTGGCAGCAATAGGAGGAGGGCGCACCCCACCCTGAGGGCATGCCTTAAGAAGCCCTCCA
+GCGTCAAATTAGAGGCCTTGTGCCTTAAGAATCGAGCCCGAGCGGGCTAGATGCTGCCCT
+AGGGAGCGCCAACTCCCCAGGGTAGCTACCAATAACGATCTAATAAGGAGATCGATATGG
+CTGCTTCGAATGTTACTCAAGTACAGCGCAATGCTTGCGTTCACGCTTTTGGTTCCTTTG
+GCCAAAATCAGGTCCAAGCTGAAAAAATATCATGTTGGAAAGATGGTTCTTTCTCCGCTG
+ACCCGTTCGTTTTCCTAGGGCGTCGTATTCGAGTCGGCGAACAGCTTCAGGCATGCTATG
+ACGATGAGCGCGGCTTGGTTGAAGAGTCGTATGTGTACGAGGCGAAGGTTGTCGCGGTCC
+ACATAGGCTCGGCTGCTGACGGCATCGAGAGTTCGCTGCTTTTGCGCCCGAACGACGTAA
+ATCACGAAAACTACGTTGATATCTCCAGGCTCACAGTTCTGGAGGTGCTTGAGTGAAACC
+CTTAATGCTCGGAACCTTGTCCAGAGTACCAGCAGCACGTCTGCTGCAACTGGGCGAGTG
+CCCGCAGCCCATCAGCATGGGTTTCGAATTCCAATGCGAGGTTGACGGTGATTTGGTCAC
+GCCCTGGTCTGGTCCGATCAACCAGAACATGACGGGCTATGTTCTTGGAGGGGCAACCCA
+ATCCGTTGACGCTGGCAAGCAAGCGGTAGGACTTGGCGGCGAGCGTAGCGCTGCCGTCGA
+AGGACGCACCGCGCAGCCATCCGTTAATCCGATCTGATGCATACGACTCTTCATCGCACA
+CGTTCTGATTGGGCGCTTCGCATAATGGATGGCCTTATGTTGAGCGGTGTCCGGACAATG
+CCTCTGGCTCCGGGCGCCGGTTAACATAGGGCCGATTATGCGCTGCGCTATCGATCTCGA
+ATCCCGCCTCATCAAAACCGCCGAGCTGTATGCGCCGGGCCGCAAGGGTTCCGACGCCGT
+GACTTGGATTCTCGACGACTACCCACGACTTGTTGCCGAGATCCGTGATCTGAGAAAGCG
+AGTCGCCCAGCTCGATGACGAAGGTGCCCAGCTCGATGCAGTCCTTCAGGAGCTGCGTCA
+GATCGCTGAGCGAATCAATCAT
+>NC_019936.1|provirus_3233292_3242961
+TTACTGCAACCCACCCAAGGGGCTCAGCCTAATGGCGTCGCTCAAATGCTCAGGCGCAAG
+GTGTGCATAGCGCATTGTCATGTTCAGCGACGCATGGCCCAGGATCTCCTTCAGCGTCAC
+GATATGGCCACCGCCCATGATGAAGTGAGCCGCGAAGGTGTGGCGCAGGATGTGGCTTGC
+CTGTCCGCGTGGTGGCTTGATCGAGGTCGAGAGCAGGACCAGCCGAAACACGCCAATGCA
+GTTGGTGAACGGCCCGTAGGTTTGCCAGTGCTTCTTGATCGCCGCCGCCAGCTCGGGCGT
+AACCGGGACCATCCGCACCCGTTTCGACTTCGTATTGGCGAACACCAAGGCGTTGCCTCT
+GATCCGCTCCAGTCGCAGCGCTTGAGCCTCACCCCACCTCGCCCCGGTCGCCAAGCAGAT
+ACGCGCCACCATCGCCGGGTGCGGAGACGTGGTCCGCGCCTGGAGTGCATCGAGCAGCTC
+GGAGATCTGCGGCTTGGTCAGGTAGGCCAAGGGGCGCTCCTGCAACCGAACCGGACGAAT
+ACGGGTGAAAGGACAGGGATAGTCGATCACGTCGAGTTTATGCAGCTCGTTGTAAACGGC
+TTTCAGGTAGCCAAGGCGATTGTTCGCCGTCTTGCCGGTGACGCCAGCTAACATCCAACG
+CGCGCGTGTGGCGGCGATCTTCGCGCCATCCACCATACGAGCTATCGGATCGCCCATCGC
+CTTTGCACACGCTCGCAGGATCGCCACACGACGAACGCCATCGGAGAGCGAGACGCCGTG
+AAGGTCGAACCATAGCTCGACCAGCTCTGACAGCCTGCGCTTGTCCTTTGGCCGCGGTGC
+CCAATCGTTCGATTCGCTGCACTTGGCGCGACAGGTCGCCTCGAAGCGCATTGCCTCGGC
+CTTGGTCTTCAGCGTCTTGCGGAAGCGCTTGCCTTTGACCGGCTCAACATCGACCCGCCA
+GCGACCATCTGAGAGCTGCTGAATCGCCATCAGACCGCTCTGCCCCATCGAACGTGGCGT
+TCTTGAAGCAACGTCTTGATGTGCTTGTACAGATCACGCTCGCTCATGTCCTTGGCGGCG
+TAGTGGTCACGAATGACCGGCCAGCATTCCCACTCCTTCAGTCGATCAAATGCGGTTTTA
+GCGCCCACTCGCTCCCGTGCCAGCAGGCTTACGAAGTTTCCCAGGAATAGCTCCACGTTC
+TTGCCCGAGAAGCCCCGTGAGGTCTTGTAGTAGCGCTTGTATTCCGTTTCATCGACCAGG
+GAATCGACCGCCACGTCGACCCGCACGTCATCACGCATCAGCGTCCAGATCGGTTCGTAT
+TGCCCTGGGCGATGCAGCAACTTGAACTGGCACAGCCCGTAGCGCCACAGGCCGTCCAAA
+TGGGCGGAGAACGCCGCAAACGAATCCGTTTCAATGGCCTCGCCGGTCTTGGCACTGATC
+GACCCGCTGGCGAACTGCTGGATGACCGAATGGTGATAGCGCAGCTCGACCCGCCACACG
+TCCGCCTCGGGATCGTAGTTATCAGGATCGGCCGTATCGAACGAATCCCGGCGACGCCAG
+ACGCTTTCCCAGAAGTCGAGCTTATCGGTTGCGCGGGCCTGTTCGGTTTTGTTGTAGATG
+CAGAGCTGAACGCCACCGGCTGAGCCGAACATGGACGTTTCGCCACGACCGTAGACGCTG
+GACTTGGTCGCCCAGTTGATCTCGTTGATCCCCGAGATATCCCGGTGCGTCCGCGCACGA
+CAGTGCAGGCGTGCCACCAGATCCACCGGAGGCTTCCAGCCCTGGAGATCCAACGCCAGA
+TGGACAGCGCACTGGTTTCGTTCGCGGTGCGTCATCACGGCTGCGGCGTAGTAGTCCATG
+CGCTCTTGCAGGCGCTCAGGCGACAGAGCGTCGATGGCGTGCGGCGACACCTCGATTTTC
+AGGTGCGGCCCGATGTTCTCCAGCTTGGCGTTGAAGTTCTTGATCAGCAGAATGAAGCCA
+AGGTCGGCGTTCTGCAGCTTGTACTGGTAACCCGAGTCCCGCCCTACCCGTCCCGCGTGC
+CAGAACTCTCCAGCGAATTCGACCATGACGCCCGGTTTCTCGAACAGCGCCATGATCTCC
+GGACGGATCAGCCCGCGATACAGCTGGCGGACCGTATCGACGCCGCAACGCAGCAAGCGA
+ACGCCCGACAGGTCAGTCAGCTTGGCCGAATGGCTATCGAAGAACAGTCGCCCGGCTGGG
+GTTTCCTGAAAGTTCTGATCAACACGAATTTGGTCTTTAACGCTCATCTTCTTCTGCTCC
+AAATTGCAACGAATTGACACTGTTCAGTTGGGTTTATCTGACGTGTTACAGGGACGTCAG
+CGCGCGCGTTTGCACGCCGGCTCGTGCCTCGCCGCGCGTGCAAAGAGCGCGGAGCGCACG
+CGCGCTGACGGTCATCACCACAGGAATTGCCCCTTCTGGTACGGCACGACGGTCATGTTC
+GCGCCACCAGCGGGTTGCGCTGCTCCAGGGCGCGGCTCATGCATTGCCGGAGACTGGTTG
+TTCTGGACTTGCTGGGTTCGCTCGCCGGTGGAGCGATCAGGAAGGGTCGGATCGAAGAAG
+CCGTTTTCGACCACGCGCATGCAGAAGGCGAAGTCGGTTTCGACCCGCGTGCTCTGCTGC
+GTGTAGCACTGGCAGACGGTGGGTGTGCCGTTGACTACGGCATGCGCCATTCGCCCGAAC
+TCGCGGGCATAGGTCGCAGGGTCGGTGCTGGACATGCAGTAGAGCCTGGGAAACGACACG
+GGCCGCGTCAGCTCGTCGTAGATCGGCGCCGACGATGGGACCTGTGGTATTCGAGGCACG
+CGCCGTCCGATGTAGCTGGCGACGCTTTCAGGCGCATCGGTCTTCGCTTCGCCCACCGGC
+TTGATGAACGCCCCGACCGTATCGCGTACCTGATCGACCATGCTGCCGGCCGGCGCGCTG
+GTAGCCGTCGCGGCTTGAGCTTTTTCGGCTGCATAGCGTTCATAGGCGCGATAAACGAGG
+ATGCCGGCACCGACCAGCACGCAGATGGCCAAGACGAACTTGGTCGGCACCTTGGCCTGA
+AAGTGGTGCTTGGCGTTGCTGCTGGTGTAGGCACCGAAGTAGCGCTTATCCAGCCGCAGC
+GACTTCTTGTCGGCATCCTTGAAACTGGTTTTCAGCTCAACCTTCTCTACGACGACTTCA
+GATTCGAAGCGCAGTAGCTGGGCGGACTTGAAGACGCGCCAGTAGTGGATGTGCGTGTTG
+CACAGCCGACGAAGGTGCACATCGAGATAGCGCGGGTCCTGAGTGACGAGGTGCACCTCA
+TGGCCCTGGTGGCGCATGGTCTCGAAGCGGGTGATGTGCTCCGGTGGCCGCGCCCTGGGA
+TCGCGTGAGCCGAACCAGCCCTGCGCTTCGTCGACGACGATGATCGAGTCATTGGGCAGC
+TCAAACCATTTTTCAGGATCTTCGAACTCGAACCACTGCGCTTGCAGCTGATCGGGCTTG
+AGACCGTTGATGTTGTGGAAGTAGACGACGCGGCCTTCGGCGTGGGCCTTCTGGTCGACC
+TCGCGGATGGTGTTCAGGGTCTTGCCATGGCCGGGCTTGCCGGTGCGGATAACGAGCATG
+ACGGCGCCTCCTTATGCGTCGATAGAGGTGCCGCCCGGCTTATGCCAGACCTGATTACGT
+TTGCGGTCGGTGGCCTTGTCGATGCCGGCGAGGATGAAGCGCGTGGAGATCGCGGCGAAA
+TACAGGTTCACCACCACATCGAACTTCGCCAGTCCGAGAATCCCTTGGATGACCGGCCCG
+ACATCGCCCATCAGCCCGAACAGGTAGTCCTGCGCCTGGCCAATGATGAGGTTGAAGCCC
+ATGTAGGAGACGAAGCCGAAACCGATCATCTTCAGCACCATCTTCACCAGCGGCCCGACG
+ATGATCACGAGCATCTGGACGATGAATAGAAACTGCATCATTGACCTCCTACGGCGCGGC
+CCACATACAGGGCGGCAAGAACGGTGGCCACGGCCACGAAGAGGCCGCTCAGGTCACTGG
+CGGCGCGGCATAGCGGTTCGTAGCTGAGCTGGAAAGTGCGACCGCCTGCTGTGGTCAGGC
+TGAAGCTCTCGGCGGCGGGACAGGCAGACGGCAGAAAGCGGGTGCCCTGGTTGATGAACG
+AAGGCACGTCGATGACGCCGTTACCTTCATCCAGCTGGAATCGGTCACCGGTAACAGCCG
+CCTCGATGGCGGACTGCTGTTTGGGGAAATCGGCCATTTCCTCAGCGAGGCACAGCTGTT
+CCTTCTGCTGCCGCAGGACTTCGCAATCAATCGGGTCACCACTGCACGAGAACGCCGCAT
+CGCAGGAGCCGGCCGAGGCCAAACGCTCCGGGCCTTCTTCGCCTTCGCCTTCACCTTCCT
+GGCTTTCCTTACAACCAGACCCTTTGCATTCCTTGCTCTCATCGCCCGGGGTGCCATCAG
+GGTTGGTGCCAGAGGTGGCTTTTTCTTCGGCCGTGGTGGAGGTACAGGGCTTGGTGCCAA
+CGCAGACGGTCTTGTCGGTGGTGGTGTTGGTTTCCGTCTTGGTGGAGCCGTCCGGGTTGG
+TGGTCTTGGTGGTTTCTTCGGTTTTCGTGGTGTCCTCAAGCCGTGGCGCAGGCTTGCCAG
+TGGTGCAGTGCAGGTAATCCCCGGCGTTGTCGCAATTGAGCTGGCCGGGTTCTTTCAGCT
+TTTCGCTACTGGTGCAGTTGCGCGATTGGGAGCCGTCCGGATTGGTGACCCAGTCACCGC
+ATTGGCTTTCGCTGGTGAACTGCGGTGTGCTGTCGGCCGGGGGCTTGGACGGTGGCTGAT
+CAAAGACACTGCCGGGAGGTGGGTTGTTTGAAGTGCATTGCGAGCCGGCGCCCTGGTAAA
+AAACCTTGCAATAAACGGAGTTCAGGTCCTTGCCGGTGGTGTCTTCCAGAAAGCGATTGC
+AGCCTTTGACCGTGGCGGTGCGGCTGTAGAGGCAGCCGCTTTCGCAGATCGAGGACGGCG
+GCAGAGAAGGCGGCACGGACGGGTCCAGGGAGCCGGCGTTGTACTCGTGGACGAACTCGC
+CGGTTGCGGTGGCGCACTGGTCGGGTTCAGGGGCGACACACTCGCCAGTCGAAGGGTCGT
+AAGTGGAATCAGGAGCGCAAGAATCGCCGCGTCTAGCTGCTGCGTTGTACCAAGAACCGT
+AACGCTCAAGCTTCCCGGAATAGGGATTGATATTTAATCCATATGTACGACAGGTAAAAG
+ACGCTGTACCTTTTTCAATCTCCTGCTCAAACGAAACATATTGCCCGGAGTTTAATTGCT
+TGTAGTAGGCATGGTTTGCATTACAGGCGGCGACACCGCTGGAATATCTTATTAGCGGGT
+CCGGAAATTGAATGGTCCAATAATAATCTTCGGCGCTAGCGGGCAAGTGCCAGAGCAGCA
+AAGCCAAAAAAGCCCCAAAAATCCTTTTCATAATCACACCCGCCCAAAAAACACGAGATA
+AAACGCCAGGGTGGTGAGGATCAGGACGTACAGTTCGTAGCTCATGGCGTTTCCCTGGAA
+GAGAAAACCCCGCCGGAGCGGGGTTTGTTTGCTTCGGCACATGCAGTGCGCAATACCTTG
+GTTACAGGGCGCGGCGCATGTACTTGAACGCCATCGCGGCGATGATCACCGCGAACACCG
+CCCAGCCGATGGTTCCAACGTCAGTGCCGGCGGTATCCAGCGCCGCGGTAGCTTCAGCCG
+GGACGGCGGCGTAGACGGAGCCGGCCAGGGTGGACAGCGCGACAGCAGCGCCAACGCCGA
+TTTTCTTGATGAATTGCTTGTTCAGTTGCATGGGTGATACCTCACTGTTTCAGGGCTTTT
+TTGAGGACCAGGAAGCCGAACACGGTGGCGAACAGAACAATCGCTTCGCCTTGCAGCTCG
+GAGACTTGGTCCCAGGTCAGTGCAGAGCCGTAGAGGCTTTGCATTTCCTCGACCGTGAGG
+GCGACCAGCGAGCCGGAGCAGATGGGCGAGCCGTCGGCGCCTTGCAGCCAGTCACCGTCA
+CAGGCGAGGAAATTCATTCGCCGGCCTGCTCGAGGTCGGCGGGTTGTTCGGAGGGTTCGC
+AGTCGGGGCAGACGGCGAAATGGGGCGGCAGGCTGAGGTCGGGCAGCAGGTCGCTTTGCG
+GCGCGGGCAGCGCCATGAGCTTGCCCATGTCGTTTCCGCAGCAGTCGCAGTACACCCGGT
+CATCAATCAGCATGGCCGCCCCTCCCGGTTAGTTGGCTTTGGCCGGGTCGCCGGCTTTGG
+CCTGGGGTTGAGCTGGGGTGCGCGGGGTATCGGCTGCGGCGCGGGTCTGGACGGCTTCGA
+GCTGGAGCGCCAGATTCTTGCCCTTGTTCTGGCCACCCCGGGCAATCTCGAAGTGAATGC
+GCACCAGTTGCAGCGGCTCGAACTTAGCGCCGGCTGCGAATATCTCGTCGGCTACTTCGT
+CTGCTGCTGCCATGCCGATGATCGACAGGCCGTGTTCGGTCTTGCCGTCCGGCTCGTCGC
+CGTAGAAGACTTTGATGTACTTCTGGCCCGCTTCACCGTCGAAGCGTTGAGTGCCGAGAA
+ATGCAACTTCCATAGTCGAACGTGCCATTTGTGTTTCCTCTTTCTAGTTGCGCTTAATTG
+CGCTGCTTTGCTTTCTGCAGGCCGAGCGATCCCGAGCGAGTGAAAAAGTAATTTCACTGC
+GACCGGCTTGTTACTTGGCTTGCGGGTTATCTATAGCTGTATTTGAACGCTCTTGGAACA
+ACTATTTAGCAAGTATTAAAACAATCAATACTTCATTTTTTAATGAGACGAATAGTGCTG
+AATTGACACTTTCCATCTGAGCAAACATTAATTTAATTAATCATCCGCAACGCTGTTTAA
+CACCAAGGGCTCTGCCCTTGTCATCCCGCTCTTGCCGCCGAGGGCTCGGGAGCGCGGGAG
+GGAAAAGCGCTCCCGCACTCACGAGCGGAGGCTGTTTCAGTTCGTGCAGGGTCAAGGGTG
+CGCTCCGCCCGTGCTTCCGTTCGCCGGATCGGTGAAGCGTGATCCGACGAGCCGGGAGCG
+CGGCCCCTGACCTGTTCGGCCACGCGCTCAGCCTGATAACGCTCAGCGACATAGCGACGC
+AGCTCGACGAGAGACCGGTGTTTCGTTGGCTCGCTACCGTCCAACGGAATGAACAGAGGA
+ACGTCGCGGCGATAGGTAACGTGCCCATACAGCTCCCCGCCTACGGTCAGCTCCCGCCCG
+ATCTCATGCCAGTTAGGCGACGCGATACGAACCTGCATCCGCTTACGCCCTACCCCACCA
+GCTCGAACGGTTCGTGAATCGGCACGTAGGGCGTTGGCTTGCCCGAGTCGTAGATAATGC
+TCCACCACTTCGCGGGGCGCTCGGGTGGCGTGTGCTTCTCGCAGATATAGGCCGGTTCCA
+CTGTCCAGTCCGAGAGCAGAGGCTTCCAGATTCCACCAACGCACCCCATTTGCAGTGTGC
+GAATCGGCCGCGCATAGGCGGGGCGGCATTGGGCGCATGGTGTGGACCGGGAGGGATCGG
+ATTTCGCCATTTCGCGTCTGGACCAGCAGACAGAGCAGTCGCAGTCCTGGGCGTGCGGAA
+GGCGTTGATAGCTGGCCGGCTTCTGCATAGGCCATCCCCTCCCCTGGCTTTCCGTAGACG
+GCGCGGATCATGCGGAGCGCTCCTGTTCATTGGTGCTGGGCGAAGGACGCTTCCAGGCGG
+ATGACGATTTCGGCGTTCAGGGAGCGGCGTGCAGCCCAAGCGGACCGTTCGACCTGGGCG
+CGGAGTGCCGCAGGCATGCGCAGCTTGAATTGCGGGTCTGTGCGGCTCATTGGTTCACCC
+CCCCGGAAAACGCACCAAACGGGTTTTGCCCAGCTTCACGCTCTCGACAGCGCCAGTCCT
+GACCCAGCCAGCGACCATATCCACGGGCACACCGGCCAGAGCGGCGAATGCGGCTTGCGT
+ATAGAAAGGAGGATTCATGCGGTCCACTCCTGTTCCAGCAGCCAGCTACGCAGCAGCGCG
+CTGTTAATCATGCGGCGCTTGCCGAGCTTTACGGTGGGGAGTACGCCCCGGTAGACCCAG
+GCGCGGGCCATGGAACACGTCAGACCGTTACGTTCCGCCCAGGCTTCGACGGTTTCCACG
+TCCTGCTGTGGGGCGATCAGCTTTGAAGGTTCTAGCTCTTCCAGTTCCATGCTCGTTCCG
+TCACTATTCGTGGCAATGCCAGTTATTCAGCACTGCGTTATCCATAACGGATAACCTCGA
+AACGGATAATGCCATTGCTAATCCAAATTGGATACATCACATATAGATCAAGTAGCTATG
+ATTAAAGAGCGCGTTATAACTATTCTGAAAAGCTCAGGTATTCGGCTGCCCGAGCTGGAA
+GAGCGCACTGGCATCAGTCGATATACCTGGAACAACCTGAAGAACACAGCGCGAAAGCGC
+GAGATTAAGGCTGAGGAGATCGAAGCTATCGTTAAGCTCTTTCCTCAATATGCCTTATGG
+GTCGTCAGCGGAGAGATAGCGCCAGAAGCGGGGCAGATTAGCCCTGATTACGCTATTGCC
+GATTCAAACTTGCCGAGTCAAAGCGCGGGATAGCGATCACAACGGAAGTGACTAGGCGCT
+GGTATGCCCGCTTAAGACGTTAGAACAGCTTTTTGGAGCAGTATTAAGAATGGGAATCTT
+CGCAGAAAATTTAAATGATATTGAATCCTACTGCGCCAAGCTAGAAATGCTTTTATCGAA
+GCAAGAACTTATAGATCAGCGTGTCTCTTTATGCGTGCCCATGCTGAAGAAAATTTCAGA
+TGAACCTGACGCTTATGATAAATCAGCAAGATTAAATGCTCAGTGGATCGGCGGAGAGTT
+ACTTAGCATTATTGCCAACCGAAGAACCGACGATAGCTCACTGCAAGAATTAACACGTTA
+CCTGGCTCGAATAGCAAGAGAAACCACACTTCGAACCCCTTACATACCAAAAACACCTGA
+AAAAGAGCTTCTTGATTTTTTCGACTATTCAAAAAATCATGAAACAACCGAAGACAAGGA
+AACTTCAGATCTTATTTGGGCCTCCATTCCAAAATACATAGTAAGGGAGCATCTAGATGA
+AGTTTCTAAAAAAGAGGATGATGTAACCAACCAGGTTAAAAGCTGGGAAGACCAACTCAA
+AACATATAAAGTAACCATAGACTCATATATCAGCGAACTTAAAGAGCAACAAGGAAAATT
+CAACTTCGTTCGACTATCAAAAGCCTTTCACGAAATGCACAAGAATAAGCAAAAGGAGCT
+TAAATCAAACTTTATCGCTTTGATTTCTCTAGGCGCTTTAGTGCTTTCCCCACTAATTTT
+TCAATTTGCAGTAAAGACACTCACGAACACAGACACCACACTCAACACCCTGAGCACGAC
+GGAAGCATGGAAGCTAATATCTTTAGTTGGCTTAGAAGTGGCTCTACTTTATTTCTTTAG
+AATTGCACTGAAAAGCTACTACTCAACCAAAGCTCAACTTCTGCAAATTGAACTCAGGCT
+TTCATTATGCGCATTTATAGAAAGTTATGCGGACTTTGCAAAATCAAGAAAAACGAAAGA
+CGCTGACCCCTTACTTAAGTTTGAATCAATAATTTTTTCCGGCATTACACCTGACGATAA
+CAATGTTCCCAGCACCTTTGACGGCATAGATCAGATTTTCCGATTAGCAAAAGAACTTAA
+AGGAAAGTGA
+>NC_019936.1|provirus_4295725_4304306
+CTATCCCGCGTCTTGACCGGTCAAGTTTCGGTTGGCCTCGTCGTAATCGGGACTCGTCTG
+CCCGCACTCCGGAGCGATCTCACCGCTTGCGACCCATAAGGCGTACTGCGGATAGAGCTT
+CACCAGGACCTCGACCTCCTCTGTACTCAACCGCGCCTTCTTGTGGCGTAGGTTTTTCCA
+TCGGCTGTAGTTGATCTCCGACTTGCGGACCAGATCGTCTAGGCCAGCCTTATAGATCAG
+AGCAATAGCTCTATCCTGCATCGATTCCATAAAGGTCTAAGAATCTCTGAGTTCACTATT
+TGAACTCTAGGAATACACTGTTATTCTTTGCCTGTCAGTTCACTATTTACACTCTAAAGC
+TGCACTGACGTAGCCCTATAAAGACCAACATAGTGCAACAAAGGCCAAGGACATGGAAGG
+AAACCTACCGCCGATAGACCTGCTCAACGCGCCCCCTGTCATGCCGTGGCGCCAGTTCGC
+GGACTGGATTCGCATGAATGATGAACACGACGTGGTGTGGGGCTGGATTCGCAACGGCTA
+CATCCCGTCGCACAAGGTTGGCAAGTACGTGATGGTCAACGTGGCGCTGCTGGTTAAGCA
+GCTCATGGAAAAGGAGTGGGACTCATGATCCGCGCCGCCTACGGAAAGCCAGGGGAAGGG
+ATGACCTATGTCGAAGCTGACCAGCTATCAACGCCTTCCGCACGCCCAGGACTGCGACTG
+CTCTGTCTGCTGGTCCAGACGCGAAATGGCGAAACACGCTCCCTCCCCGTCCACACGCTG
+CGCCCAATGCCGCCCCGCCTCTGCGCGGCCGATTCGCACGCTGCAAATGGGCCGCGTCGG
+TGGTGCCTGGAAGCCTCTGGTCTCGGAGTGGACAGTGGAACCGGCCTTTATCTGCGAGAA
+GCACACGCCGCCCGACCGCCCCACGAAGTGGTGGAGCGTTATCTACGACTCGGGCAAGCC
+CACGCCCTACGTACCGATTCACGAACCGTTCGAACTGGTGGGCTAAAGCCAACCGCCCCC
+GCCGAAGCCGAACAGGTCCAGGGCCGCGCTCCCGGCTCGTCGGATCACGCTTCACCGATC
+CGGCGAACGGAAGCACGGGCGCAGCGCACCCTTGACCCGGCACAAACCGAAACAGCCTCC
+GCTCGTGAGTGTGGGGCAGCTTCACCGCCCCGCGCTCCCGAGCCCTCGGCGGCAAGAGTG
+GGATGACAAGGGCAAAGCCCTTGGTGTTAACCAACTAGAGAACACGCACAACGCGACGTT
+TTAACCGGTAGGCCAAGTAACAGATCACCTCGGCGAACTTGCGAGTTCACCGGTTCGGGA
+TCGCTCGGCCTGCAGAAAGCAAAGCAGCGCAATAAAGCGCAACTAGAGAGAGGAAACACA
+AATGGCACGTTCGATCATGGAAGTTGCATTTCTCAGCGCCGAGAAAGTCGAGTTCGACAA
+CGTGAAGCTGGTGAAGCTGTTTGTTGGTGACGAGCCAGACGGCAAGCGTGACCTCGGCAT
+TTCCATCCTGTCGATGAATGTCTCCGAAGAAGCCCTGGACGAAGTGTGGTCCGCCTGCGA
+AAGCCTCGATGTGCTTGAGCCGATCCGCGTCACCACCGAGATCGAGCGAGGCTCCAAGAA
+CGCCGGCAAGTTCATCGTCCTGCACGTTGAGCCTGTGAAAGCCGCCGCTGCTCAAGCCAC
+CAAGCCGACCCAGCAACCGACCCCAACCGCCAAGCCAGCCGGCACCCAGCCGGAACCGGC
+GAAGGCCAACTAACCGGGAGGGGCGGCCATGCTGATTGATGACCGGGTGTACTGCGACTG
+CTGCGGAAACGACATGGGCAAGCTCATGGCGCTGCCCGCGCCGCAAAGCGACCTGCTGCC
+CGACCTCAGCCTGCCGCCCCATTTCGCCGTCTGCCCTGACTGCGAACCCTCCGAACAAAC
+CACCGACCTCGAGCAGGCCGGCGAATGAATTTCCTCGCCTGTGACGGTGACTGGCTACAA
+GGCGCCGATGGCTCGCCCATCTGCTCCGGCTCGCTGGTCGCCCTCACGGTCGAGGAAATG
+CAAAGCCTCTACGGCTCTGCACTGACCTGGGACCAAGTCTCCGAGCTGCAAGGCGAAGCG
+ATTGTTCTGTTCGCCACCGTGTTCGGCTTCCTGGTCCTGAAAAAAGCCCTGAAACAGTGA
+GGTATCACCCATGCAACTGAACAAGCACTTCATCAAGAAAATCGGCGTTGGCGCTGCTGT
+CGCGCTCTCCACCCTGGCCGGCTCCGTCTACGCGGCAGTCCCGGCCGAAGCCACCGCGGC
+GCTGGATACCGCCGGCACCGACGTCGGCACCATCGGCTGGGCGGTGTTCGCCGTGATCAT
+CGCCGCGATGGCGTTCAAGTACATGCGCCGCGCCCTGTAACCGGGGTTTTGCGCACTGCA
+TGTGCCGAAGCAAACAAACCCCGCTCCGGCGGGGTTTTCTCTTCCAGGGAAACGCCAATG
+AGCTACGAACTGTACGTCCTGATCCTCACCACCCTGGCGTTTTATCTCGTGTTTTTTGGG
+CGGGTGTGATTATGAAAAGGATTTTTGCGGTTTTTTTGCCTTTGCTGCTCTGGCACTTGT
+CCGCTAGCGCCGAAGATTATTATTGGACCATTCAATTTCCGGACCCGCTAATAAGATATT
+CCAGCGGTGTCGCCGCCTGTAATGCAAACCATGCCTACTACAAGCAACTAAACTCCGGGC
+AATATGTTTCGTTTGAGCAGGAGATTGAAAAAGGTACGGCGTCTTTTACCTGTCGTACAT
+ATGGATTAAATATCAATCCCTATTCCGGGAAGCTTGAGCGTTACGGTTCTTGGTACAACG
+CAGCAGCTAGACGCGGCGATTCTTGCGCCCCTGATTCCACTTACGACCCTTCGACTGGCG
+AGTGTGTCGCCCCTGAACCCGACCAGTGCGCCACCGCAACCGGCGAGTTCGTCCACGAGT
+ACAACGCCGGCTCGCTGGATCCGTCCGTTCCGCCTTCCCTGCCGCCGTCCTCCATCTGCG
+AAAGCGGCTGCCTCTACAACCGCACCGCCACGGTCAAAGGCTGCAACCGCTTTCTGGAAG
+ACACCACCGGCAAGGACCTGAACTCCGTTTATTGCAAGGTGGTTTACCAAGGCGCCGGAT
+CTCAATGCACCTCAAACAGCCCACCTCCCGGCAGTGTCTTTGATCAGCCACCGTCCAAGC
+CCCCGGCCGACAGCACACCGCAATTCACCAGCGAAAGCCAATGCGGTGACTGGGTGACCA
+ACGCGGACGGCTCGCAATCGCGCAACTGCACCAGTAGCGAAAAGCTGAAAGAGCCCGGCC
+AGCTCAATTGCGACAACGCCGGGGATTACCTGCACTGCACCACCGGCAAGCCCGCGCCAC
+GGCTTGAAGACACTACAAAAACCGAGGAAACCACCAAGACCACCAATCCGGACGGCTCCA
+CGAAGACGGAAACCAACACCACCACCGACAAGACCGTCTGCGTTGGCACCAAGCCCTGTA
+CCTCCACCACGGCTGAAGAAAAGTCCACCTCTGGCACCAACCCTGATGGCACTCCAGGCG
+ATGAGAGCAAGGAATGCAAAGGGTCTGGCTGTAAGGAAAGCCAGGAGGGTGAAGAAGACG
+GCGAAGAAGGCCCGGAGCGTTTGGCTTCTGCCGGCTCCTGCGATGCGGCGTTCTCGTGCA
+GTGGTGACCCTATTGATTGCGAAGTGCTCCGGCAGCAGAAGGAACAGCTTTGCCTTGCTG
+AGGAAATGGCCGATTTCCCCAAACAGCAGTCCGCCATCGAGGCGGCTGTTACCGGTGACC
+GATTCCAGCTGGATGAAGGTAACGGCGTCATCGACGTGCCTTCGTTCATCAACCAGGGCA
+CCCGCTTTCTGCCGTCCGCCTGTCCCGCCGCCGAGAGCTTCAGCCTGACCACAGCAGGCG
+GTCGCACTTTCCAGCTCAGCTACGAACCGCTTTGCCGCGCCGCCAGTGACCTGAGCGGCC
+TCTTCGTGGCCGTGGCCACCGTTCTTGCCGCCCTGTATGTGGGCCGCGCCGTAGGAGGTC
+AGTGATGCAGTTTCTATTCATCGTCCAGATGCTCGTGATCATCGTCGGGCCGCTGGTGAA
+GATGGTGCTGAAGATGATCGGTTTCGGTTTTGTCTCCTACATGGGCTTCAACCTCATCAT
+TGGCCAGGCGCAGGACTACCTGTTCGGGCTGATGGGCGATGTCGGGCCGGTCATCCAAGG
+GATTCTCGGACTGGCGAAGTTCGATGTGGTGGTGAACCTGTATTTCGCCGCGATCTCCAC
+GCGCTTCATCCTCGCCGGCATCGACAAGGCCACCGACCGCAAACGTAATCAGGTCTGGCA
+TAAGCCGGGCGGCACCTCTATCGACGCATAAGGAGGCGCCGTCATGCTCGTTATCCGCAC
+CGGCAAGCCCGGCCATGGCAAGACCCTGAACACCATCCGCGAGGTCGACCAGAAGGCTCA
+CGCCGAAGGCCGGGTCGTCTACTTCCATAACATCAACGGTCTCAAGCCCGATCAGCTGCA
+AGCGCAGTGGTTCGAGTTCGAAGATCCCGAGAAGTGGTTCGAGCTGCCCAACGATTCGAT
+CATCGTGGTCGACGAAGCGCAGGGCTGGTTTGGCTCGCGCGATCCCAGGGCGCGGCCACC
+GGAGCACATCACCCGCTTCGAGACCATGCGCCACCAGGGCCACGAAGTGCACCTCGTCAC
+ACAGGACCCGCGCTATCTCGATGTGCATCTGCGCCGGCTGTGTAACACCCACATTCACTA
+CTGGCGCGTCTTCAAGTCCGCCCAGCTGCTGCGCTTCGAGTCGGAAGTCGTCGTAGAAAA
+GGTCGAGCTGAAAACCAGCTTCAAGGATGCTGACAAGAAGTCACTGCGCCTGGATAAGCG
+CTACTTCGGTGCCTACACCAGCAGCAACGCCAAGCACCACTTTCAGGCCAAGGTGCCGAC
+CAAGTTCATCTTGGCCATCTGCGTGCTGGTCGGTGCCGGCATCCTCGTTTATCGCGCCTA
+TGAACGCTATGCAGCCGAAAAAGCTCAAGCCGCGACGGCTACCAGCGCGCCGGCCGGGAG
+CATGGTCGATCAAGTGAGGGATACGGTCGGCGCATTCATCAAGCCGGTAGGCGAGGCGAA
+AACCGATGCGCCGGAAAGCGCCGCCAGCTACATCGGGCGGCGCGTGCCTCGGATACCGCA
+AGTCCCATCGTCGGCGCCGATCTACGACGAGCTTACGCGGCCCGTGTCGTTTCCCCGACT
+CTACTGCATGTCCAGCACGGACCCTGCGACCTATGCCCGCGAGTTCGGGCGAATGGCGCA
+TGCGGTAGTCAACGGCACGCCCACCGTCTGCCAGTGCTACACGCAGCAGAGCACGCGGGT
+CGAAACCGACTTCGCATTCTGCATGCGCGTGGTCGAAAACGGCTTCTTCGATCCGACCCT
+TCCTGATCGCTCCGCTGGCGAGCGAACGCAGCAAGTCCAGAACAGCCAGCCTCCGGCAAT
+GCAGGGGCCACGCCCTGGACCAGCACAGCCAGCCAGTGGCACGAACATGACTGTCGTGCC
+GTACCAGAAGGGGCAATTCCTGTGGTGATGACCGTCAGCGCGCGTGCGCTCCGCGCTCTT
+TGCACGCACGGCGAGGCACGAGCCGGCGTGCAAACGCGCGCGCTGACGTCCCTGTAACAC
+GTCAGATAGATCGAGTTGAAACCGTCCGTTATTGGACATTGTTGGAGATTCAAGAATGAG
+CGTTAAAGACCAAGCAAGACTGGACCACATCACGGGCAATCCGACCAAGCGTGGACGGTT
+GTTCGTTGACCCTGGTACTGCGGCAATCACCGATCTGTCGAAGGTCCGTCTGCTGCGTTG
+CGGCGTCGATACGGTTCGCCAGTTGTATCGCGGGCTGATCCGTCCAGAGATCATGGCGCT
+GTTCGAGAAAACGGGCGCGATGGTGGAGTTTGCTGGCGAAGTCTGGCACTCGGGACGGGT
+TGGCCGGGACTCTGGCTACCAATACAAGCTCCAGAACGCTGACCTTGGGTTCATCCTGCT
+CATCAAGAATTTCAACGCCAAGCTGGAGAACATCGGGCCGCACCTGAAAATCGAGGTGTC
+GCCGCACGCCATCGACGCGCTGTCGCCTGAGCGTCTGCAAGAGCGGATGGATTACTACGC
+GGCGGCAGTCATGACCAACCGCGAACGTAACCAGTGCGCCGTCCATTTGGCGTTGGACCT
+CCAGGGCTGGAAGCCTCCAGTCGATCTGGTAGCCCGCCTGCACTGCCGCGCGCGAACGCA
+TCGCGATATTTCCGGAATCAAGGAAATTCAGTGGGCCACCAAGTCCAGTGTTTACGGTCG
+GGGCGAAACGTCCATGTTCGGCTCGGCCAGCGGCGTGCAGCTCTGCATCTACAACAAGAC
+CGAGCAGGCCCGCGCAACCGACAAGCTCGACTACTGGGAAAGCGTGTGGCGTCGCCGTGA
+CTCCTTCGACCCGACCGACCCTGACAACTACGATCCAGGCGCTGACGTGTGGCGCGTTGA
+GTTGCGCTATCACCACTCGGTCATCCAGCAGTTCGCCAGCGGCTCGATCAGTGCGAAGAC
+CGGTGAGGCCATCGATACGGATTCGTTTTCGGCCTTCTCGGCTCATCTGGACGGCCTGTG
+GCGCTATGGCCTGAGCCAATTCAAGCTGATCGCCCGCCCCGGCTATTACGAGCCGATCTG
+GACGCTAATGCGTGATGACGCGAGGGTCGATCTACCGGTCGATTCCCTGGTCGAGGAAAC
+GGAGTACAAGCGCTATTACAAGACCTCAAGGGGCTTCTCGGGCAAGAACGTCGAGCTGTT
+CCTGGGAAACTTCGTAAGCCTGCTGGCACGGGAGCGAGTGGGCGCTAAGACCGCATTTGA
+TCGATTGAAGCAATGGGAATGCTGGCCAGTGATCCGCGACCACTACGCCGCCAAGGACAT
+GAGCGAGCGCGACCTCTACAAGCACATCAAGAACCTGTTACAGGAACGACACGTGCGATG
+GGGGCGTGCCGTCTGATGGCGATACTGGCACTGCCTGACGGTCGCTGGCGGGTCGATGTT
+GAACCGATCAAGGGCAAGCGATTCCGCAAGACCTTCAAGACCAAGGGCGAAGCCCAGCGG
+TTCGAGGCTACCTGTCGATCCAAGCTGATCGAAAGCCCGCAATGGTCACCAAAACCGAAG
+GATCGTCGTCGCCTGTCTCAACTGGTGGACTGCTGGGGGCGTCTGCACGGTCAGTCGCTG
+TCCGACTATGAGGGTCGGCGCGTCATCATGGATCGCATGGTCGAACGCCTGAAAGACCCT
+GTCGCCATAGCCTTCACTGCTACCGATTTCGCGGAGTACCGCGCCAAGCGCCTCTCGTCC
+GGCATCAGCCCGAAAACGCTGAACAATGAGCTGTCTTACCTGCGGGCCATGTTCAATGAG
+CTACGGCGACTTGGTGAGATCGAGTTCGAGAATCCGCTTTCGATGCTCAGGGCGATTCGT
+GTGCAGGAAAGGGAACTGTCCTGCCTCGACAGCCATCAGATCGAACGGCTGTTCCAGGTA
+CTGCGCAGCATGGTTCACCCACACGTGGAGCTGATCGCCACGATCTGTCTGGTGACCGGT
+TGCCGATGGGGTGAAGCGCAAGGGCTCACGATCAGTCGGGTGGGCGATGGCATGCTCCAG
+TTTGTGAACACGAAGTCGAAGCGTCGCCGTGTGGTGCCGATCGATCAGAAGCTAGCGGAG
+CGGATACGCCAGCACCTTCGGCAACACGGTGCGTTCACCAACTGCCGGGATCGGTTCGAT
+GAAGCTGTGGTGCGTGCGGGGCTGGGTCTACCTGCGGGACAAAAGTCGCATGTGTTGCGG
+CATACCTTCGCCTCACACTTCATCGCGAACGGTGGCAATATCCTGACCTTGCAGAAGATA
+CTCGGGCACTCGTCCCTGGCGATGACAATGCGGTACGCGCACCTTGCGCCCGATCATCTG
+CAAGACGTGTTAGCGTTTGGGCCTGCTAGGGATTTTCGACACTTCTTCGACACTCCCGCC
+TCTGAGCGACAGTCGGGGCAGGAAATTCCTTTGTAAATCAATAAGGAAGGCAATCGCACC
+CGGTGGTGCGGCCGGGCTTCAAACCCGGTTGGGGACGGCAGCCGTTCCCGGGTGAGTTCG
+ACTCTCACTGCCTTCCGCCATTTCGACTCACACGCCCGACTCCCAAACCCTCGACACCTA
+CCCCGCGACAGCCCGTCCCACCTCGCAATATCAAAAAGCCATCGCACTTCAACGCGAAGC
+GCGTCACAATCGCGGCTTTTCTTTCCAGGGATAGGAGAGACGTCGTGGGTAACTCGCCAG
+ACGAGCGCCGTGCGTTGCACGCGCTGCGTGACCATATCGATTGCCTACTGGCCGAAGGAG
+CGTCCGTTGTCGGTCGCGACCCGGTGCAGCTGAGTTTTCAGGGCCGGACGTTGACGGTGC
+AGCACGGGATACTGCTCAACGAGAACGGCCATCAGGACCTGATCGAGACGCTTGCCGAGC
+TGGAGTGGACGAACAAGCGCACTCGCGATCTAGCCATCGATATCTGCATCCGCCAGCTAG
+ACCATGCGATCAAGGCGAGCTGCTTCGACGCGCTGGAAAGCTCAAAGCCCGACAAGCCCT
+GA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_fasta/NC_021184.fasta.fasta	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2005 @@
+>NC_021184.1|provirus_19778_35564
+ATGCTGGATTTGAAATTTGTGCGGAATAACCCGGAAATTGTTAAAGAGGCACTACAGAAA
+AGAGGAGCTAGCATTTCACTCGACCCGTTTTTGGAACTCGATGAGCGCCGCAGGGAAAAG
+CTGGTTGAGGTGGAGAAGCTTAAAAATAAACGTAATGTGGTATCCGAGGAGATTGGCCGG
+TTGAAAAAGGCCGGACAGTTGGCTGAGGATATGGTACTGGAAATGCGGCAGGTTTCCAAT
+GCTATCAAGGATTTAGATGAAGAAATTCGTATTTTGGATCAGCAGCTGCAACAAACATTG
+CTAAATATCCCCAATATTCCTGAAGAGAGTGTACCCGTGGGGTTGGATGAAAATGACAAT
+GTTGAATTGCGGCGCTGGGGTGAGCCCAGACAGTTTGGTTTTGAGCCCAAACCCCACTGG
+GATATCGGTGAGGCGCTGGATATATTGGATTTTGAACGGGGCGGCAAGGTTACAGGTGCC
+AGGTTTCTTTTTTACAAAGGAGCCGGTGCGGCTCTGGAGCGTGCTGTATTTAATTTTATG
+CTGGATGTGCATACGAGGGAGCACGGCTATGTAGAGGTAATGCCACCATTTATGGTTAAC
+AGCAACAGTATGATCGGCACAGGCCAACTGCCCAAGTTTGCCGAGGATATGTTTAAAGTT
+GAAAATACTGATTACTATCTAATACCCACTGCCGAAGTGCCGGTAACCAATCTTTATAAT
+AATGAAATATTGGATGGCGATAGATTGCCCATTTACCATTGTGCCTACAGCGCTTGCTTT
+AGAGCCGAGGCAGGAGCGGCGGGACGTGATACACGGGGCCTTATTAGGCTGCACCAGTTT
+AACAAGGTAGAACTGGTAAAGTTCGTTCGTCCGGAGGAGTCCTTTACTGAACTGGAGAAA
+TTGACTCAAAATGCCGAGAAAATACTGCAATTGTTGGAGCTGCCTTACCGGGTGGTTGTT
+TTAAGTACCGGTGACCTGGGTTTTAGCTCTGCCAAAACCTATGATTTAGAGGTGTGGCTA
+CCCAGTTATAACAGTTATAAAGAGATTTCTTCTTGCAGTAATTTTGTGGATTTCCAGGCC
+CGGCGGGCCAATATCAGGTACCGGGAGGGTAAAGCAAAACCTCGTTTTGTACACACTTTA
+AACGGTTCAGGTTTGGCCGTGGGCCGGACGGTAGCCGCTATATTGGAAAATTGTCAGACT
+GATACCGGTGCGGTGAAAATACCGGCGGTGTTACAGCCGTATATGGGTGGCATTAAAGAG
+ATAAATTGACACTACTGAAGGGGAACGGTGTTATTGACACCTAACCTATACTGTGTTATA
+CTTCTTATTGTCTCTGGTTGATTGAAATTGACTGGAGGGGTGTCCGAGCGGTTTAAGGAG
+GCGGTCTTGAAAACCGTTGAACCTTCACGGGTTCCGTGGGTTCGAATCCCACCTCCTCCG
+CCATTTTAATTACCTGACAGCACGGAGAGATGGCCGAGTAGGTCGAAGGCGGTCGCCTGC
+TAAGCGATTATACGGGCTAAAACTCGTATCGAGGGTTCGAATCCCTCTCTCTCCGCCAGT
+AAAGAAAACCACGGATTAAAGATCCGTGGTTTTCTGATGGGTTTACTCTCACCATATCAT
+GGTTATCACTCATTTTTACCAGTTGACTTTTACGAGTGCTTTTGTTACAATTATATTTGC
+GGTGCTGGTGAAGCAACGCAAAGAAAAAACAATATGTGCCTGTGGCTCAATTGGATAGAG
+CATCTGACTACGGATCAGAAGGTTGGGGGTTCGAGTCCCTCCAGGCACGCCACAATTTTA
+CGGCGACACAAAAGTATATATACTAATTGTGTCGCTGCATTTTATTATTAATATACCACC
+ATTGGAAATACATTAGGCGCCTGTAGCTCAGAGGATAGAGCAGCGGTTTCCTAAACCGCG
+TGCCGGGGGTTCGAGTCCCTCCAGGCGCACCACTGAAAATCAAGGCCCGCAAGGATTTGC
+GGGTTTTCGCTTTTCTAGCGAAATTCGCTGAAAGGCTATTTTGGGAGCATTTTGGGAGCA
+AAGATAACAAACCGGGAGCAAACGAGACAGGAAAAGACAGGTTTTACGCCTGTCTTTTTT
+TTGTGTCATTATGAATAATATTCTGGTACACATTTTCTAGCTTGTCCGATATTGCCTTAT
+CGGCACTCTGTAAGTAGTGACTATAAATAGCCCCAGTGGTGGCCGGGTTAGCATGTCCAA
+GCCGACCGGATATATTTTTAAGTGGCACGTTCTGATTAATCAACATTGTGGCCGCGGTAT
+GCCGGAGGCCATGAAAGGGTAGGTGCGGCAATTTGTGTTTTTTAATAAACTTGGAGAACC
+ATTGCGATGGCCATTCCGGGTGCCCGGGCCTGCCGTCCCATGTGGTAAATAATCTGTCTG
+ACCCCTGCCATAAGTCAGCGACCTTTAGGCGGTCCTTAGTCCATTCTGTTTTATACTGTT
+TAATCAGCGTCATAACGAAACCGGGAATAGATATAACCCGCTTTGACGTTTCGTTCTTTG
+GTTCTTTCGTGATGGTGCCTATACCGGGTAGGTACTGACTGGACCGCCTTACGTTAAGTA
+AGGAGTTATCAAAGTCCACATCCTGCCATTCAATGCCCATGATTTCACCACGGCGTAACC
+CGGTGAATAGTGCTATGTAAACAAGCACCTGGTGCTTTAATTCTTCTGCTTCCAGGGCTT
+GCAGTAGGGTGGCAATGTCGTTTTCATCATAACAGGCGGCCGGCTTCCTGGGGACCTTGG
+GAGCTTCCACCCGGGCGGCCGGGTTGGTTAAAATTATTTGCCATTTGACGGCAGCGTTAA
+ATATAGTGACTAATAACCTGTGATGGTGAAGTATGGTTGCGGGCGACAGTGTACCTTCCC
+TGCCGTCCTCACGGATGCCGTATTCCCGCAAGTTGTCATAGAACTGCATTATGTGAAAAG
+GCTTTATGTCCTCTAATTTCATGTGGCCCATAGCCGGTAAAATGCGGGAGTCAAGCATTT
+TTTTATACCGGTGCTTGGTTTTGGGTGCCAAGTCTATTTTGGATTTAAGCCACTGTTGGC
+TAAATTCCGTGAAGGTGAGCCCGGAGGGTTCAATATACTGGCCCTTTTGCACCTCAGCAG
+AAAAAATGTCTAGCTGTTTTTTGGCTTCACGCTCGCTGGTGGCTTCAATCGTCCGGCGGT
+AAACTTTGCGATTACCGCCCGGGCCCGTCCCACCTGGTACGTTAAGCCGCCATTTGTTGG
+TCCCCCTGTTTTCTACCCAGCCAGCCATTATTCTGATTCTCCTTCTTCTGAGAACATTAT
+TTTTAGCATAGCGAGTACGCGTTTCCGTTCATACTCAGTAAGAAGTCTGCCATTATAATA
+TGCTTCCTTTTGATGTTTAAGAAGAAAAGCTATGTCATATAAATCTTGTCCAGACATTAA
+CTTAACTGTTGTTACGCTATCAACTCCCTTTGTTGCTATCTCACCAGGCACAACAAAATT
+CACTTTTGGGAAAATAGAACCGCTAGGAATCTGGTCAATGTACATCCTGTTGGTAAGAAT
+AATATCGTAAATATCTACGTCAAGTATTTTTGCAATTTCTTCTATTACAGAAATAGGCGG
+TACAATTTCACCGCTTTCATATTTTTGTATCACGCGTTCAGACTTGTTTATTTTTTTAGC
+TAATTCCTTTTGGGTTAGTTTTTTACTTTTTCTCAATTCTCTTATCTTGGTGCCAATATC
+CAATGTATTCACCTCCATACCAATATACTACCATAACACGAATTAAAAGTACAGATAATC
+AAATAAAAACTATTTACAACGAACTATAAATACGCTATTATATAATTAGTACGAATTTAA
+AATTCGTTAAGGGGGTTTAAATAATGCATAAAACACTAGATCAGCTTAAAGACGATGCCC
+AACATGTATTACGTGAAACAATAACTGCTAGAGAAGTAGCGGAAATGCTGGGTATTAGTG
+AGTGGGCAGCATATGACTGGGCACGGAGAAAAATAATACCGCACATCAGGGCAGGTAAAC
+GCGTGCTGTTTAGGCGGAGTAGCATTCTCCAGTGGCTGGAGGCACAGGAGCAGGCTAGCG
+TTACGGTAGAGCCGGAAACTGCAGGAAAAATACGGCGGCTGAAATAATCGACATAAAAGC
+AAAAGCCCGCGCGGGGCGGCACGGGCAGGCGGTAAGGTAGGTGTGATACAGTTGCATGCT
+CCAAATAGTTTATCACGAAAAAGTAATATCTTTCAATTGGTTAAGCAAATTAATACAGTG
+GACATTATTCATAAATACAACATTGCTAATATGCACCGGCATGGTCGCTATTGGGTGGGT
+TTATGTCCAGTTCACCAAGATAAAAAACCCAGTTTCTATACTTTTCAGGATAATAAATGC
+AAATGCTGGGGATGTGGATTCTACGGTGACGCTATTGACCTAGTGGCAAAGGTGTATGGA
+CTCAGACCCATTGAGGCGGCCCGGATGATAGCGCGGGACTTTGGTATTGAGGTGGACAAT
+AGGCCGGTATCATTGGAGGCCAGGCGTAAGGCCAAGCAGTTGGCCATTGAGGCAGCCCAA
+AAGCGTGAGATTGAGAAAATCTTTAAACAAAAACGGGATCGGGCGTTAGAAATACTTTCT
+TTGTTCGTGAGAACTACCAACCATGTTTTAGCTGCTGGGGGTTATCAAGCGCATTATGAT
+TTAGCTGAATTGTTACATAAAACCGACTACCAAGAGTATTTGACCGAATGCTTGTTGAGT
+AAGGATCCCGACTTACAGCTTATGGCATTGACCGCCCCGGAGGTGCAACAATGGCTCGAA
+TAACAGCAGACGAACTCCATGAAAAAGCAAGAGATGACCCAGAGGTGGCTAAAGTGTTGG
+GGTTATCATCCTTCTGGGAAAAACTCCTAAGTAAAGATAAAAACGGTAGGATTTATTCCA
+CAATTAATAACGCTCTTTTGATATTGCGGAATGATGAAGCGTTAAAAAGTAAAGTGGCTT
+TAAATGAGTTTGCAAACCAGCTTGACATTAGGGGTGCTTTACCCTGGGGGAAGGCCAAAG
+GTACTTGGTCTGACAGTGACGATGCCGAATTAAGATATTATTTTGAGACTAGCTACAACT
+TTACTGGTAAAAGCAAAATTGATGATGCCTTTGCCATTGCCACAAGCCGGTTGAAATTTC
+ACCCGGTGCGGGAATATTTGTCAGGGCTGCAGTGGGATGGGCAGCAACGGCTTGATGCCT
+TGCTGATTGATTACTTCGGGTCTGAAGATAACGAGTATACCAGGATGGTGACGCGAAAAT
+CATTCACGGCTGCTGTGGCCCGTGTATACAAGCCTGGCATTAAGTTCGACACCATGCTGG
+TGCTGGTGGGTAACCAGGGCATAGGCAAGAGTACCTTTTTTCGTTTACTGGCCGGGGATG
+AGTGGTTTACTGATGACCTGCGGATGGAGGATATGAAAAATAAAACCGGTGCAGAAAAAA
+TGCCGGGAAAATGGATCATCGAAGTTGCGGAACTGGCCGGGTTGAGAAAAACTGAAGTTG
+AGGAAGTTAAATCATTCCTAAGCCGCAACTTTGACCGGTACCGGGAACCGTATGGCCGCC
+GATCAAAGGACCAGCTAAGACAGTGTATCCTTGTGGGGACTACAAACGCCGTGGATGGCT
+TCCTAAGGGATCAAACCGGGAACCGGCGCTTTTGGCCCGTGAGGGTGAGCCGCGGGAAAT
+TGAAACCTTGGGAAATCGATAAGGTAAGGAATCAGATATGGGCTGAAGCCAAAAAGTATT
+ATGAGACTGGGGAAGCGCTTTACCTTACGCATGAGGTTGAACAGTTAGCCACGGCGGTGC
+AAGAAGAATACACGGAAATAAGCCCATGGTACGGGTTGATTGATAAGTATCTTAGTGAAA
+AATCTATGGGAGTTGTCTGTGGAATTGAAATTTGGATACATGCCCTTAGTGGAGACAAAA
+ACAAATATGGCCATAGGGAGCAGCAAGAAATAAGCAATGTCATGAAAAAAATACCCGGAT
+GGGAACCAGGAGGGCGCGAAAGAATACCGGAATATGGACGGCAGCGCGTTTATAGGCGAA
+TATCCTAAAACCTGTCCACCTGTCCCATACCTGTCCCACACCTGTCCCCTTACGGACATA
+AGGCTTTCCCCCTCTTTGGGACAAGTGGACAAAGAAAAAGATAATAAGTATTTATATGAT
+TATAAATAAAGAAAAAATATATATATGGTTTTTTCTGTCCCCTGTCCCAAAAAAACTCGG
+AAACCTTGCAGGAGTAAGGGGACAAGATGGGACAGGAACTATCTCAACCCTGTCCCATAA
+AAGAGCCTGTCCCATATTGGAGTTGGTTACAGTAGGGGGTGATTGTGGTAAATGAGTAGG
+ATAAAAAAGGCCACTGAACAAGAATGGCGGACAATTGCAAATGAAGCAAGGGAACTTAGG
+GACCGTATAGGTAAGTTAAGCATTCAAGCCTGTCCATATCTGCCAGTTAAACTTACGGAT
+GACTTAATGAGGGCACAGCAGGTAATTGATTTATTCCGTGCAAGGGCAGAAGATGAAATG
+TTTAAACGTGGGGGTATTAAAGATACAGATATCTGGTATCCCGGAAAATGATAATAAAGG
+TGATGGCGATCTATGAAATACATACGCATTCAGATGCCCAAGCACATACTGGTACTCACC
+GACCAAGAGCTTGAACGCCTGTTGGCCCGGGACCCCAAGTTATGGAAGCTGGCCATCGGT
+AGGGGAAAAGGCTTGCGGCGTTATCAGGCGGCCAAGGCGAGAGCAAATAAAGATAGGGGT
+TGAGAACATGGAAGTTTCAATTATTCCACAAAAGAAGTTTGAATGTGTAGCGGGACGCGA
+TTACTTAAAGGCCCGAATTACATTGATTGTTTCAGCTAAGACAAAAGAAGAGAAAAGGGA
+GCTGCGGGCACGGTGGGAGCAGCTAGAGGAGAATGGATCGCTTAATGAACTGTTGGAGCT
+TGTCAGGGAGATGGAAGCGGGCAGTTACGATTAAGCATTTAGGATGCATACCCGCCCCCC
+GGGGCGTCTATCTTGTGGCCAGTTCACCTGACCGGAGGGGGAAGGCTATTTGCACACATA
+GAGCAATTACGAGATTTTAGCCAAAAATTACCCCCCTCCGCCCAAAGTAGCAAATATTAA
+CAGAAAGGGGGCAAATTATGAGCCGTCCGAGGAAACCACCAAAAACTAAAATTAAAGTCA
+GAGATATTCTTAAATACATTGAACAATTGCCCCCGGATAATCCGCTTAAACAAGAATTGA
+CACCGGACAAGCTAATCCGGATTAAGCGATATATCGAGGAATTGCAATATCTGGATTACA
+TCATCGTGGGGTTGAAATCAGACATAGAGGCAAACGGAGAAATTGAGCTATATGAAAATG
+GTAATCAGAAAACCCGGCGTACCAATCCGGCGTTGACAACTTACATTGACACAATCAAGG
+CATACAATGCCCTATTGCGGCAAGTCTCAGAAATTTTGAGGGGGATAGAAATTGAAATTG
+CCAAAACGTGGTAGTGAAATACTACAGGTGATTGATGCCTGGCATACTCTTATACACCAG
+GCAAAGGCGGGCAACCTACAGGCAATTAAAATTTTTCTAAGTTTGAAAGCTAACAATCAA
+TCCGGTGCTGGAACGGCGCCAGGCAAGGTTGTTGACATAGATAAATACCCGCTGGAATAG
+CGGGATTGAAAGGGGGAAGCCCTCATGAAACTCTACGGCTTTTCAAATGAGCTGAGGGCG
+GCTGGTGAAGAAAATAATATGCTGCTGGAAGGGCGGGCAATTGTTTTCGACCAACCGACC
+GTACTTTATGAATTTGACGGTATCGAGTACAAGGAAATCATTGCTTCAACGGCCTTGGAT
+AAGGCTGATATGAGCGATGTTGTACTTCGATATAACCATAATGGTGAATACATCGTCTTG
+GCGCGAACTCGGAATAAGTCCCTAACGCTGGAAAAGCGGCCAGACGGGCTCTATATGCGG
+GCAACTTTACAGTCAGATATAACAAGCCACCGGGACCTATATAATGCGGTAAAATCCGGT
+TTAATTGACAAGATGAGTTTCGGTTTTGCGGTGGCTGATGATGGTGATAGTTATGACTCA
+GCCACGCATACCCGGACAATCATGAATATACGCAAACTTTTTGAGACCTCTTTAGTTGAC
+CAACCGGCGTATGACCAAACCTATGTTGAAGCCAGAAGCAGGCTTGAACAGTTAGCGGAT
+GTTGAAGAATATCGGAAAGCATTGCTCATTAGAGCAAAATTAATCAGGAGGTACTAGCAT
+GAATAAATTCAAATATATGACCGAAAGTGAAATTGAAGAATATCGTTCCCAGTTGGAAGC
+CGAACTTTTAACCAGTTCCCCGGAGCGTTTAAAGGAAATTGACAAAGAACTGACGGACAT
+CGCGGCAGCCCTGGCCAAAGACGAATATCGGCGCACCGTGGGCGCTGGCCCGAGGCAACA
+GCGCACTGCCGGCCCTATTGGTCAAATGCAAATCCTGGGCACCTACGGCATTGGTACCGG
+TATTACGAACAATACCAACACCAGGGGCAATGAACCCGTAAACGGCAATGTTTACGGCTC
+CTCGGAATACCGGCAGGCTTTCATGGGCTTCGTGTTAACCGGCGCCCGGTCAGAGATTTT
+GGAATACCGGGCCAACGCTACCACTCTAACCAGCGACATTGGAACCGTGATCCCAACAAC
+GATCGTACAGAAAGTCTACGAGAAAATGTCCGCTTACTCCATGATCTGGGACCGCATTAC
+CAAAACAAACGTCAAGGGTGGCGTGTCTGTCCCGACATCCAGCTTAAAACCAACCGCAAC
+ATGGGTTGCTGAGGGTAGCGTTTCAGATAAACAGAAAAAGCCTACCGGCAGTATCACTTT
+TAACTACTACAAGCTGCAATGCCGTGTAGCTATCTCCCTGGAAGCTTCCACGGTAAGCCT
+GGAGATGTTTGAATCAACTGTTGTAGAGAACATTTACGAGGCAATGATTATTGCAGTTGA
+ACAATCGGTTGTAACCGGCACAGGCGTGGGCCAGCCCCTGGGTATCGTAAACGACAACAC
+TATTCCTGCTGGCCAGATTATAGATGTAACTGCCGCTGAAATAAGCACCTATGGCAAATG
+GGCTGCCATTATCGGGACTATACCACTGGCTTACGAGGCAAAAGTCAATTTAACTCTTAC
+AAAAAAAGATTGGGACAAGTATATTGCCGGTATGGTTGATGCCAACGGGCAACCCATAGC
+CCGGATTAACCTGGGCCTGGCTGAAAGACCGGAGCGGCGCGTCCTGGGTTACAATGTGGT
+GCTTGTGGACGATTACCTACCCAGCTTTGACGCGGCGAATGTCGGCGACATTTTTGGGTA
+TTTTGTGGATTATAAAGATTACATCTTCAACAGTAATCTGCAGATGCTCTACAAGAAATA
+TTTCGACGAGGACACCGACGAATTTGTGCATAAGTCGACCCAACTGGGTGACGGCAAACT
+TGCAGCTCCGCACAGCGTAATTCTACTCAGAAAAGCCGTCTAAGTTCCTCCGGCTCCTTT
+TTATACTGCCCATCTTTAACGGTGGGCAGTAGAAAGGGAGCAAGGGGAGTTCCCTTTAAC
+TGCAGCGCGGTCGATCGTTGCAGGCGTACAAACCCCATAGCCATTTTTTCATAAACCTAT
+CCTTTTATTTTAAGGCGGCCACCAGGGGGCTCACTGGTACGGTGAGCCTGGCCGCCTACT
+TTCTTTTTTAAAAATAACTTTCGGGAGTTGATAATATGGCAGGTTCTACCATAAAGGGCA
+TTTCTATTGAATTCGGAGCCAACACCCAAGCCCTTACGGCAGCATTAGCAGACGTAAACC
+AGAAGAGCCGAAATCTCCAGGGGGAGCTTTCACAGGTGCAGCGTCTTTTACGCATGGACC
+CCGGTAATACAACTTTGATAGCACAGCAGCAGCAACTTTTAGGGCAGGCTGTAAACAATA
+GCCGGGAAAAGCTTGATCGCCTAAAGGCTGCCCAAGAACAGGTAAATGAGCAGTTTCGGC
+GCGGTGACATAAACGAAGCCCAGTGGCGGTCGTTTCAGCGAGAAGTGGCCGCGAGTGAGC
+AGCAATTGCAACGATTTGAGGAACAACTGCAGCAGGTTAACCAAACATCTGACAACCTTA
+CTCTGGGCGATAAATTCAAAACCAGCGTGTCCGGCGTTGCTGATAATGTTAAAAACATTA
+TCAGCCCTGCAACACTGGCGGCGGGGGCCGTGGCCGGTATCGGAATTGCAGCCGTTGGAG
+TGGTGGCACAAGGCGTAAATATGGCTTCTAGCTGGGACCAGGCCAGCAGGCAAATGGCAG
+CAGCGACTGGGTTACCAATGGAAGCAATGGGCGAATTTGAAGCACAAGCAGAAATCATGT
+TCGGTAATGCCCGGGGCAGTGTTGATGAAATCTATGCAGCCATGACACAAGTACAACAGG
+TATTCCATGGATCGGCCGAGGAAACAGGCGCTTTGGCTGACAAAGCGCTGGTGTTGCAAC
+AGGTTTTTGGCTTTGAAGTGTCTGAAAGTATAAAATCAGTCGATAGCCTAGTCAAAAACT
+TTGGCATTGATGGCAATACAGCCTTTGATATTATTACCAAAACATCACAAATGGCCGGCG
+ACAAAGCCGGGGATCTGTTGGATACTTTCAATGAGTATTCCCCACAATTCGCGGCAATGG
+GTTTCTCTGCTGAAGAATTTGCCGGGATTCTTGTCAAAGGGGCTCAAGAAGGCGCGTTTA
+ACCTGGACAAGGTCGGTGATGCCGTCAAAGAATTCAATATTCGTGCCCAGGACGGTAGTA
+AAACCACGGCAGAAGGGTTTGCCGCTATTGGCCTAAACGCTGACGAGATGGGCGCAGCTA
+TCGCTGCTGGTGGCGATAAGGCACAAGCGGCTTTTGAAGCAACCATAGCGGGACTAGCTG
+CAATAGATGATCCAATGAAACAAAACCAAGCAGGGGCGGCCCTTTTCGGTGAACAATGGA
+ACGATGTCAGATCAAAAGTTATAACTGCAATGGCTGACGGTAAAACCGCTCTGGGCGACT
+TCGCGGGGGCAACTGATGACGCAGCTGGTAAGGTTGACGGTGGTTTTGGCCAGGCGATGG
+AAAGGCTGAAAAATAAATTTGGCCTCGTCACAAAAGAGATCGGTGAAAAACTGGCCCCTG
+TTTTGAATGAAATGGCCACCTGGATAGAAGACCATATGCCTGAGATCCAAGCAACTGTTG
+AGACTGCTTTTAATGTTATGGGTAAGGTGATAGAAGGTTTAACATTGCCGATTCGGAACA
+TCATTGCCTTACTGCAAGGTGACTTTGACCAGGTGATGGAAAACACGCTTCATTTGTGGG
+GTATCTCGTGGGACGGAGTAAAATCCAAAGGACTTGAGGTTTGGAACTCTATAACAACGG
+GCGTTAAAAACTGGTGGAGCGGCATAACAAGCTGGTTGTCCTCTCTAAACCCCTGGGGGG
+CCGTTTCGGGGGCATGGAATACCTTTAAAACCAACACAATCCAGGTTTGGTCTAATCTTG
+TTACCGATGCAAAATCATGGGGTAAAAACATCGTTCAGGGCCTCTGGCAAGGCATCTCCA
+GCATGGGCACAACCCTAAGAGCCAACGTCACAGAGTTTATTAACCAGAACATACCGGAAG
+TCATTAGAAAGCTTTTAGGAATACATTCCCCGTCAACAGTGGCGTATGAAATCGGAGCAA
+AGATTGAGGATGCAGACGAAAAGGCACAATTGGCATTAATTGAAATTAGAAAGTTTATGG
+AAAGGTGGGCGGTAGCATGACTCTTGTAATATCGGCAAATAACCGCGATGAATACGCTCT
+TGTGACCGGTGATTTTCTTGGTCGCAAGCATAAAGACATGGACTATAATAACCCGGTAAA
+CCATAATGATAGTGACGTTGAGCTGGTTAATAATGTTTACAAGACACTTAAAGTTAGTGA
+CTATGTATTACTTGGCGCTGCCGGTTGCCATGACCTTGGCGAGTGGCTTAGAAAGGAAAT
+ACAAGACCGGGCAGCGCCTGACTTTGATTTAATCCAGTGCAGGCAATTGGCCGAAGAAAT
+CGTCGAGGAAATGAGGGATAAACGCACCCTTAGAATAACTTTTGACATGGAGCCCCTATA
+CTTAAACCATTTATATCAGGAAAATGGCTTTGCCTTTGTGTTGACCGGCTTTTATAAAGA
+AGGCGGAACCGGTTATGTCTCTTTTGAAAGCAACCCTGACGGCGGGACATTCACAGAAAA
+GAATTGCAGTAATAACAGAGGTTACCAGTTATTTACTCCGGCAAACAACTACAGGGAGTT
+GATGGATCAATATTTTGAGCTTCGTGACGGCATAACCCCTGTTATTACAACCGCAATGGC
+ACAGGCACTATGCTTGCACCATATCATTGTTGATCATATGCCGGAGCATGTCTCCCGTGA
+AATGGAAATATTGATTTTACAAAAACAGCCTGGGCAGAATAAGCCGTGCTTTGGTCGGAT
+AAAATTAACCGATCAGAGCCGGGATAGCGCCATAAAAACAGCGGGCCAGAGGTATGCTGA
+CATATTTTTAAAACCAATGTTACAAACCATTGTAAAAACCAAACCCCAAAAACCTTCTGG
+TTATGTTAACGTTATTAAAGACATAGCCGGTCTGGGCAAAACCATGGTCGTATTAGGTCA
+AGCCATGAAGAAAAACGACATGAAGCGCATAAATATCTGCATAGATTTATACGTTGCAGA
+AGTGGCCAAGGTTAACAATTCCTTTGCCGGACTTACCCCGCCTAAGGAATTAAAGAACTA
+CCACGGGTACTATAAAAAGCTGATGAGTCATCATACCAAAGCCGTTAAATGGCTAAAGCA
+GTTTCAAAAAACAGGGGACATTGTCTTTATAGATAGGTTAAATATTGAAATGGATAACAT
+TGAAAAAATAATAGATAAGCTAAAGCGCCCGGTTTAAACCGGGCGTTATTCAGTCTTTTT
+TAGGGATGTCACTGAAATATTTCCAAGCCCCTTGTTCATCCTGAACTAGATGCATGGACG
+CTTTGTAGGGTTGTTTATTACCAACGAGATTGACTGTTATTTCGAATGGTATTTCGGCTA
+CGTTTTTGTAAGTTTTACCGGTACCTTTTGAATCAGTCCAGCTATTAAGTAAAACTGGCT
+CTTTCACTTGGTAGCTTTCAATTGCAAGTACCGGGCCATCCTCTTTCATTTTAATAAATT
+CATCTTCAGTAATTAATGCCCGGGTATCCGGGTGAAGGTATTTGTATAATTGCTGCCACT
+GTTGATATGACATATACTCTAAAATGCTTTGGGCAACCTTTTCTGGTGGCTCAGCCTTTG
+GTTCTGGACTTTCCTTTGGCATATTGTTCTCACCACAGCCAATCAGTAAAGTTAAGACTA
+ATACTAATATGGTAAGCAAGCTTTTGGGTTTCATACTATCGCCCTCCTTTTTAATTATTT
+GGTTTATTGTATTACGTTACCAAGGCAATAACATGTCACTTAAAGTCGAATATAACTTAA
+AAATTTAAAATTATCCTAACATATCAATTAATTTTTAAGGATAATAATTTCATGTAAAAT
+AAGTGGGATTACTTCCGCTTTTTGTATTTTCGTTTGGCTGCGGTATTTTCCGCTGCGAGA
+GGAAATAAAACTGGCCATGATGGACTAGGTGATCGGCTTAAAATTACATTTAACCCCAAG
+CGAGAAGGTTGAGCTGGCCCGTAGGATCGAGGAAGCATTGGGAGGACGGCAGGGCAGCAA
+TCAATATCAACGGAAAGAGGACCCGCAAAATTTTGCGGAAGCTCAAAAAGGAGAATCCCG
+AGACATAGCTGCCAAAGCCGTGGGTATGAACCGGGAAACCTACCGTCAAGCAAAAGCAGT
+AAACATGAAATCGAGGAGGAACGGGCGCTAAAAAGAAAACAAGCTACACAATTGATAGGT
+AAGGATAAGAATGGTTTGCCAACACAAAGAACTTCGGTTGGGGAACTGAGTTCCACCACC
+GAAAAGGGCAAAACCCGCGATAAGATAGCGGAGCAGATAGACTTCCCTTTGTCGGGCAGA
+ACGCTTAGTAAAGGCATGAAAATTTATGAAGCTGCCAAAGACAGCAATAAAGACGCTCAA
+GAGTCGTTAAAGAAAATAGACAACAAAGAATCAAGTATTACCGCTGAATACAAAAAGCTT
+TTCAAAAAAGATGAAATCCCAAAATGGGCAATTAAATATAGTGACTACCATATGCCCACT
+ACATAGTTCGGGTACTGGCCCTTCATAGGTAGGGTGGCCATCCTTTCCATTCCGGCGAAT
+TTGCCGGATTGCTCTGGTACTGGCCCTTCATAGGTAGGGTGGCCATCAGTACCGGACAAT
+CTGTCGGTTACTGAAAATGTGTACTTAACCCCGGTCAAACTATCCCAAGTTGAAGGGTGC
+TGGCACGCCATAGGTAGGGTGAAAACGCACCTTGTGGAACTCAGTTCCCCAAGGTCAGGA
+TTAGGTGCTGGCACGCCATAGGTAGGGTGAAAACCCCTCAGTTGTACCCAACTTGACGAC
+AACTGAAAATAACCCGGCAATGGCCGGGTTTATCTACTGCCTGTTATTTTTTCTTGGTTA
+ATTAGCCGGTTGTCCAATCTTAGTATATCCCCCCAAACTCCCTTAAGCTGCAGTTTGACT
+TCTGATACATCCTTCTGTATTTTGCGCTGGCCCTTCTCTAAAGTATCCAGACGTTTAACA
+ATGGATGCCTGGCCTTGCTCCAAGGTGCCCATGCGTTGATCCATGTCGTCAAGGCGTTCA
+TTGATAGGCTGCAGCTTCTCGGTTAGTGCCTCATCCAGTACCCGGCGGAGCATTTTTTCA
+AGCTCACTCATTGGCGGTGGCACCCCCTTCTTTGTCGGGTATGTGTTCTAGTAGATCACC
+AGGCTGGCAGTTTAAGGCGGCACAGAGCTTATTTAAAGTGGAAAAATCCATCCTTTCAGT
+TTTTTCATGGTAAAGCAAAAAAACCGTATTTCTTGATAATCCCGTTTGCTGTGCTATTTC
+TGTCATATTAATTCTTTTAGCCCCAAGTATTTTAGATAAATGCACTTTTATCATAGGCAT
+ACCCCCTGTCTTTATAATACAGTAAATAGTTAACAATGTACAGCTAATAATAAATAATTT
+ACTGATAATAGTAAATAAAGTATTGACAATGGTACGGGTAGTGGTTAAAATTGTACTAGA
+AGCAATACAGTCCACGCTACCAGGGAGGCGATCCCTGGGGAAAATTAAAAGAGGGATTTT
+AAGATGCTTAAACTTGAGAACGGCGATTATTTGGTTTATTCGGACGGCAAATTTTATCTT
+ATTGCGGACGGTGGCAGGGAGTCAGAATAAGGAGGCTTAAATCATGGCTAGTAAAAGAAA
+AGTTATCATTGTTCCTGATTTGCTACAGGACTACATCGTACTGGGAGATGTTGTATTGGT
+TAGTTTAAGGTACGTAAAGGAGCTCATAGGAGAGAAACGAGAGGATGAAGCCCATGTCAG
+CTAGAAGAGGGGTAGTAATTGTACCAGATTTGCCGGTTGATTATATTGAACTGGAGCACG
+TCGTGCTTGTTAATGCGGAATATTACATTGGTTTATTGGAGAATTAACCTGTAGCTTTAA
+AAGGGGGTATTCGTTAATGAAAACGGTAGTTTTTTGTAACTTCAAAGGTATGGAAGGCCC
+TGCCAGTCAATTTACATGTATTGCAACTGATGATTTTATTATGATTGAAGAAAGCCTTTC
+ACAAGAGGAAAAGGAACTAATTACATTTGTGCATGGCGGCAGTTTACCTTTAGCGAAGGA
+GGCGTAA
+>NC_021184.1|provirus_4466413_4519129
+GTGAAAGTTCAGAACCCACACGATAAATTCTTCAAAAAGACCTTTGGCGATGTAGCCGTG
+GCCAAGGATTTTTTAAATAATTATTTGCCTCAAAGCATCACGGATATAGTAGACGTGGAC
+ACATTGGAGCCGCAGAAAGACAGCTTTATTAACAAAGAGCTACAGGAAAGTTTTTCGGAT
+CTCCTTTTTAAGGCCAATATCAATAAACGGGAAGGCTACCTTTATTTTCTCTTTGAACAT
+AAAAGCTATCCCAGCCGGGATGTTGCTTTTCAGCTCCTAAAATACATGGTAGAAATTTGG
+AACGCCAAGATTGAAAATACCAATCAACTGCCGGTAATTATTCCGCTGGTAATATACCAC
+GGCAAGGACGGCTGGAACATAAAACATACTTTAGGGGAAATGCTTTCGGGCTATGAGGAA
+CTGCCAAGGGATGTCCAGGCACACATTCCAAATTACAAATATCTGCTTTATGATTTTTCT
+AGGTTTACTGATAGGGAAATAAAAGGTGAAGTAAGAAACAAAATAACAGTGACGATAATG
+CGGGATATGCCGAGAGAGGATATTGGCGAAATCCTAAAGTATGTTTTTAGAGCGGCTGTC
+TATTTGCTGGAGCTTGAAGATAAACAGACAGGGATAGAATATCTTGAGACCCTAGTCAGA
+TATCTGCTCAGCGCTAGGGCTGATTTAACCAAGGATGACTTCAATGAATTGGTTAAGAAA
+ATCGAAACCATCTATCCGGAAGGGAGTGAAAGGATAATGACTTTAGCTGAACTGTTTAGG
+GAAGAAGGCATGGAGCGGGGAATAGAAGTAGGTGAAGCAAAAGCCCTTGCAAGGACTGCA
+ATAAAGTTTTTAGTTAAGAAATTTGGTTTTGTGCCAGAGGATTTAAAGCAGGGTATAACG
+AAATTAGATGTACCAACACTGGAAGTTATAATTGACGGTGTATCGGAATATAAAGACCTC
+GATGAGGTAAAAAAATATATCCAGTAACAAAAACCTAAGAAAACCTTTATGAATAATAAG
+CTTATATTTCCTAACCCTATGGATAGTGCTGCTAATCATATCTACCAGAACTACAATGAA
+AAGGTAAGAAGCCCCCAAGCCCTTGTCCCATGCGGGTTTGCGGGGTTTTTAATATACACG
+AAACCAGGGGCTTTAGTGCTATTAACGCTAACAAAATTAAAGTAACATTCAACAAGGCTG
+TTGAAGATACTACAAAAGCAACCTTCGCAGTAAAACGTGGTACGGTTACTGAAGAAGTAG
+CAGTAACTTGGAACGAAGCAAAAACAGAAGCAACCTTAACAAAAACAGGAAATTTTACTC
+CAGCTGAGTACACTGTGACTGTTGGTGGGGTTGTAGAAGCTACCAATACTGTCACAATTG
+CAGCAGAAGAAGTTAAGAGCGTAGTTATCAATACTACTCAGTTACAAAAATCAGCTACTG
+CTCCAGTGTCAATTGATTTCATCAACCAATATGGTGAGAAAGCAACTGTCGCTGCAAATG
+ATACCAAATTGACTCTAACTGCTTACAACAAAACTGCTGGCGTTGCATTAGCTCAAGTCC
+CTGCTAAATTCCAATTTAATGCGGCTGCAGCTACTCTTAAAGATGAAGTTGTAATTACGG
+TAATGTACAAAGGTATTACCCAAACAGCTACAGCCATTGTTGTGAATGCTGCTACTGTTG
+GAAATGTAACATTGGGAGAAGCCGTGTTACCAACTGGTAAGACAATGTTCACACCGACAG
+GAACTAAAGATGTTGAATTAGCTTATACAGCTACTAATACACTTGGTGAGGCTTATAAAC
+TAACAGCCGCTGACAAAACAAGTGGAGCTGTACAATTCTTAAGTTCAGACAACACGATCT
+TAAACCCAGCGGATATCTCAATCGATACTAACAATAAAATTAAAATCGCTAAATTTGGTA
+AAGCTGGTACTGTTACATTGACAGCACTTACACCAGCTACCGGTGCATCAACTACAACTA
+CTGTCGTAGTAAATGAAGATGCTGGCGCAGCATACGGATTAACTTTAGAAAAAGCTGCAG
+CAGACTTCCCAGCTGGTTCCATAACGCCATTCTATGTAACACAAACTGTGGTTGATAAGT
+ATGGTACTGCTATTGCACAGAAAGACTTAAAAACAGCAGATTATACCGTCTCAACAAATA
+ACAGTTCAGTTGCTACTGCAGCATTTGAAATTACACCAGGTACTGACTATGGTAAAATCA
+AAATCACTCCAGCCGCTGCAGCTGTCAAAGGTAACTCAGCAACGATTACTGTAACTGTCA
+ATGCTACTGGTAATCAGGCAACATTATTAGTGACTGCTAGTGATGCAGCTGTACCATCAA
+GTGTTGACACCAAAAAGAATACAACCGTTTCAACTAACATGTTAACTGGTGCAACACAAA
+CATTGAGTTTTGATGTAAAAGACCAATACTCCACAACCTACACAGCAGGCGTAGCAGGAT
+ATACTGTTGAGTACACAACCAGTGATTCTAGTGTTATTGCAATCACTTCTAACGAAACTG
+CAAAAGATGCTATAAATACAGCTGCAGTTGATGTGAAAGCACTGAAAGCTGGTTCTGCTA
+CCATTAAGGCTACATTGAAAAAAGATAGCGTAGCAGTTGCTGAAAAGGCTTACACGATCA
+CAGCTATAGCAAATAGCTCTGCCGGACTTACTTACAGTGTAGAAGCGCCAACTCCTGCAT
+ATAAAGGATTACTTTCTAAGGATATCGTTGGCGAAACACTTGGTGATGCTGGTGCCGCAA
+CCTTAACAACAAACGCTGATAAAGAGCGTGCTATTAAATCTGGTTATGCAGCAGAAGTTG
+CTCTGTATGCAACAGATGCAAATGGCGTAAAAACCTTAGTTCCATCTAGCGCCTTAGTCG
+GAGGAGCCCCAACTATTACTCAAGCACAAAAAGCGGATGGAACAGGTGCTGCGACTGTTC
+AGGTAGCTGTATTTGAATATAATAATAAATACTACGTATATACCTCAACAGCAGCCGCTG
+CAACTGACTTTGAAGTTACTGTAAATGGTACTAAAGTTACACAAGATGTAAAAGCAAAAC
+TAGAGTTTACAATCAACGCAGATGATACTATCAAAACTATTTCACAAGATGTCACAATTT
+CAAAAGATGCTTTAAAAGCACAATCCATCGAATTTAAATCAGCTGCACCTGGAACAACCA
+CTGCAACTGATGTAACAGCAATCACTGTAGCTGACTACGCTGCATATACGACTGCGCTAA
+CTACAAAGGCTTATGTATGGGTAAAAGACCAATTTGGTGGCTACTCATTATCTGATACAG
+GTACTGAAGCTTCTGCCTTCTTATCTGTCGTAGACTTAACAGATGTAACAGGCGCAAGTA
+ACGACACAGTAGTTATTGGTGGGGCAGCTGCTGCACAAGATGGTGTAATTACTATTACTG
+ATACCGGTAGTAATACTGTAATCAATAAAAATGGCGGTGTAGTACGTATTATTGCTAAGA
+CTGGAGCTTTAACAGACTTTATCAACTTAACAATTGGGAAAGAGAACGTAAAACCAACAC
+TTGACTCAGTAGTATTAGCAAACGGTAGTGGAACTGCAGCAACATTGGACGTTAATGACA
+CTATTACATTAACATTCAGTGAAGCAATGACAACTACTGGAAATGCAACTTTTGCTATGA
+CAAACGGTGTTGTAACCTTACTTGATACCACTACATTAACATTTGGTACAGTAGGTGTTA
+ATGCTGGAACTGGAACGGTTGCATGGAGCGCAGATGGTAAAGTCGCTACATTGACTTTCA
+CTGCTGTAACAGATGCAACAACCGCTCCATCAGGTGCTGTTACTCCTGGAGCAGTTGTGT
+TAAAGGATGCTAATGGCAACCTAACTGCAACAACAGCTAGTGCTGCCGCAACAGGCACAT
+TCTAGGCTCAAGGAAATTCAATGCTCTAGAAAACACAATCTGATGGTTCTTTTGTTGAAA
+ACCGTCCAGTGCACTAACTAAACCAGAACAAAAAAAGCCCGGGTGGTCCCAAAGCGGATC
+GCCCGGTCTTTTGTTTATTGGGTTCGCTTGGCATAAGGCAAAGGGGCTGGCGTGGCCCAA
+GTGGAATATTAGTGGGCTTGGCTAGTGAATAAAGCTAGCCCGGCGGGTTGGCCTGATAGG
+GGTTATCTGGGTACCTGGTTGGCCGGGAACATAGAATGGCCGCGAGTTTTGCCCAGTTTG
+TGCAGGAATATAAATAATACTGATTACACGGCAAACCAGGGGGACGGTTCCTGCGGTTTG
+CGAGAACACAAGTGCTCGGGACAAACCAGAGGGACGGTTCTGGAAAAACACAAGGGGACG
+GTTCTGTTGTGCAGTAGATAACCGTCCGGCGCACTAACTAACCAAACAACCAAACAGCCC
+GGGAGGTCCTACACGGATCGCCCGGCTGTTTTTTATTGGGCGGGGTGCGCAGGAACGCTG
+GGTATAAAGGAAAGAGGCCAGCGTGGGGTTGAGGAGGGCGAGATTGGTAGGCAGCCCGGC
+AGGTAGGCCTGATTGGGGTTATCTGGCTACCTGGTTGGCTAGTAAATGCGGGGGATAGTT
+GAGCATGAAAAAACACCTTACAGGTAGAAATACTTGTAGGGTGTTTTTTTTTATTTCTCC
+AGGCTAGTTTTATCGGCAGCTCCGCCGGAACGTATCCACTCATCCACTTCGGAAATCTTA
+AATTTCCAAAGCCGTCCAACCTTGTGCGCTGGCATGTTACGGTGGTTAATCCACTGAAGT
+ATAGTTTCCCGGCTCACATCAAGATAGTCAGTTATAGTGGCCATTGATGACCATTTTTCT
+ATGTTGTCCATTGTTAAATCCTCCAGATTATCAGCGCACACCATGTAAGAATCCATAGCG
+GCCATGTTCTGTGTCCTTTGTAAAAGTGATTAGGTTGGCACCGGTATAATCCAAATCCGG
+GGGTTCGTTTTCAACAATAATAACTTGACCTTTATGCTGGTTATCAAGCAGATATTGGAA
+TAGGCCTGCTTTCATACTATCCGGTGCGCTCTCATCCCCTCGTTCCTTTAATGAGAGGAT
+AGGTGAATCCACAACCAATAGTCCCGGCGCATATTTCCCCTGCTCCACCAAATATTCCAT
+GAGTGTGACTGCAAGTACAGTATTTAAGAACGCCCGATACCCTTTACCAAAACTTTCCTT
+TGGTTTTCCGTTTACAACCACATCAAATTCCCTAGGGTCAAAAAATGCAGATCCAAATCC
+CTCGTACATACACAAATCCAAAATATCGTTTAGGCGTTCATCTAGCGTGCCTAAAATATT
+GCTGCTGAACTGGTTCTTTATTTTAAATTCTAACTGTGATTCATCCTCCATTTGTACGTT
+GAATAGCTCAGTCTTTATGTTAGTTTCAAATTTGTCAATAACAGTTGTTTCATTTTGGAT
+TTCGATGGCCCGGCGATATTCAGCCAATGTTTTCTTAAGTGCTGCCACCTTGGGCTTTAG
+TTCACTGTTGAGTAAATCTTCGATCCCCCATCTTTCATGATTCAAATCTGCAAGCCTTGC
+CTCAAGAGCAGAGCGCTCTTTGACGATGTCTTCATTGGCCTCCTTAAGATCGGAAAGTTG
+CAGCTGTATTCTATGCAGTTCCGCATGTGATGCCTCGATGTAACCCTTCTCAATCTCCAC
+GGGAACATTGCTTTCGCAGAACGGGCATTTTGACACTTCCTTGACATTCCCCCTGTTTAA
+CTCCCCTTCAACAATAAAGGCTAAACGTTTTACATCTGCGGCATACTGGCTCCCCAGGGC
+CTGGTACCGGTTGTAAAGGGTATTGCACTCCGCCAATTGTGCATTTACCGAAAATATTTC
+TTTCAACAACTGTTTATTGTGCTCAATGGCCCTGGCGATGGCTTTTTCGGTTTCAGCAAT
+ATCATCAAGTACTGTTTCAACCTTGGCTTGAAGATCCAAAGCACCGTAAGGAATATTTCC
+CAGCTCTTCTTTTCGGTCGGCAAAGGTTATTAGCTGTTTATGCATATAATCAACCAATGC
+TTTTCTTCGGGCCTCCGATATTTCCTTTTTCTCAAGGGGTTCTTCCTCGGCAAAATCTAT
+TCCTGTGATCAGAAAGAATAATGCACTGAGTGCTGCTGTTGCGGAGGTATTCTGTCTCGG
+AAGAATAATGGACCGCTCCTGTAAAACACTTGTTTCCTTGATAAGGAACATGTGTGAAAA
+TGTTCTCCAGGTAAGCCTTTGTTTCTCAAATCTTGAGTTTTTTATAATATCGTGTTCTTC
+CTCTATTCCAATTAGTTGGAGCCACAAATCACTGATATTATTCTTTTTACCGCTGGTTTT
+ATAGGTACCAGACATAATATCATAGGCGTCACTATGCACTTCAATTCTATTGGTATCTAG
+TTGGCGGCTTAATGTAACTTTACGACCTTCAGTTGCGATAATAAGTTTTATCCGGTCATA
+CCCGGCGGTTCTATCAAAACGAATTCTATCGCTGCCAAACAAATAGTCCAGGCATTCTAA
+GACATAACTTTTACCGGTATCAGATGGCCCGCAAATAATATTAAGACCCCGCTCAAACTC
+CAGGATGGAAGGTTCCTTGCCGCTGCCCATCACGATTAATTTTTCAATATGGAACTTAGA
+CATCATTCACACCCCTTTGCAGCCAGGTAAATGCGTTACGGTTAATCATTTCAAAAATTT
+GCCGCTCCGATTTTTGTGCTATGTAGCCCTGTGTTCGTTTAGCAAGATAGCGGTATGTTT
+CAGCATAATGATTTGTAAACCGTGAACAATAATCCTTTCCTTTTTGATTTATCGAATATA
+AAAAACCCCTTTGTGAAGACGCTACATCAATTAGGCCGGTTAGGACAAGTTGTTTAACAG
+CTTTTTTAACTAGTTCACGGCGGAGCGGGAATTCACTGTATTTGAAGGCACTGTCCCCAT
+GAAGATCGTTATCTGATATTTCAAAATCCTTACCATAGACCGTTATAAAATCAGCTGCGG
+CTATCATATCAGCTGTCTGGATTAAGCCGGTTTCTAACATTAATAAAACACGCAGTGAGA
+TCTCAAATGGGGTGTTAAATATATTATTCATTCCTTAACACCCACCCTTCAATCTCGCCA
+TCGTTTACCAGAATGTGGCAGACCCCTTTTTTCTCACTGGCTCCGACCCATTTTAGCGGC
+TCACATAGCCAGCATTTGTTAACCTGGATAACAGCTGCATGAGCCATTACACCATTCATC
+CGGGCAAAACCGTGTTTAAAATCATTATAGTAAATATCAATAATGCCATTGTATGTCTCT
+TCTTTTAAGGTTTCAAATTGATCTGGTTCCGTCATACCAAAAATATCCCTTGCATCTCTC
+CTTACGGTTTCAGCGGCATAGTAATCTTTTCTTCGCCGTTCAAAATCTTTTTTATATCTG
+GGATATCGGTCAAGTAATTCTTTTGACAAATCAGTTAATTTCTCGGCTTCTGCATAGGCT
+GCCAACAATTTTGTGACATAGGTCAACTCATGTTTTTGAATTTCTTCCGGTGGTGTTAGG
+GGAGGAGGGCGTAAACCATGGGATTTACTCAATATGGCCTTTAGTGCCTTTACTTCATCC
+ACAATGGTTGGAATTCCGCCATTTGTTTGCTTGTCCCCCGTTAGTTTATTAGGCTTCTTT
+ATTGCATACAGAAAAACCTCGGAAAGAAATCTAGCTAATTTTTCTCCCTCCGCAAGGGCC
+AAGAAATCTTTCTTTTTATTTTGTGGAATCTTAGTGTCCTGGGAGATAAGTTTAGTAAGT
+TCATGCACCAGATCAGAGGTTAAATCAGGTGTAATGGCAGGTATGACCACGTCTTCAAAG
+TAATCGTGGGCGGCGTCAATGATTAATTTGGAGCTAGCCGCTTTTTTAATTTTATTATGT
+ACTTGAGCATTAAGCCCTAATAACTGATTGGCGATTTTAGCCGTAACCACATATGGTTCA
+CCTATTTGATTTGTGATAACAACATTATCAAGAATTAGGCCCAGCAGGAGCTCCGTTACC
+TCCACTTGGCTGTCAGAACCTTTGATTACCTTTTGAACAGCTCTAGCGTATGTACCAAAA
+CACAGCCCGACCACTAGGATTCCCCCTTCCCGCAGAATTCAAGGGTCAAAAAAGGGTCAA
+AAACAGGTCAAACTGAGGGTAAATATTTTTAGGTCACAACCTGTTATCATTTTATTAATA
+AGTGTTGTTGAAAGAGGATGTTTCTACTTGGTTGATTGTTGTATGTGGGCATGGATGAAG
+GTGCCTCAAAAAAAAACTCCGAAAACAACCAGTTGATTCTGCCAGATATTAAAAATATTA
+TATCACCCTATTTTGGGTGTTACAACATTATTAACCATAATTCGAAACAATCTTATCCAG
+TGCAACTTAAACAATCACAAATACACTTAAATACTTGATGGATGAAATTATAGAAAGGAA
+GGTGTTTATGAATAAAAAACTGATTAACATTGAATGCCCCACATGCGGCAATCCAATTGT
+ATCAAAGTATGCCAATGGGGAAGTAACCGGCCTACTGTTGCATAAATGCAGCCGATGCAA
+GCGCTACTGGGATTTAAATTACACAACTGGAACAATTTCCTGGGTAGATGGGAAACCGGA
+CAAAACCCCAGCCAAAAATTTTATAGTGGATTTATCAACGGGGAAAACCCGTCCAATGTA
+TGATAAAGCTTTACTGAGACGAAAAGGAGCCTAACATAGAGCTACCTTAAGGACCAGATA
+GCTAATAATTAATTTTATTAGTTATCTGGCCTTTTTTTTGTCCATTACAAACTTAATAAT
+GCTTTGCCAATTATAGCGAGTTAGGAATCAAAGAATTACCTCAGACCGCATAATTACTGA
+TTTTTCGGTAATTATGCGGTTTTTTTATGCCCGTTTTTCGGACCCGCCCCATTGGGCCTT
+AAAAAAGGAGGAAATAAACATGATAAAAAAATTTCAAACCCAAGATGCTGAGATCACCAT
+TGAAATCACTGAGCAAGGAAAAGCGATTTATGCAGTAGGTAAAAAAAAGACCACATTTGA
+TTTAAGCAAATGTGAATCCTTTACTTACTGGTCAGTTATGGAAAGGGAAAAGTTTGTCGT
+CACGGAGGACATGCTCACCGGTGCAGATGAGATTGAGCCCTGGGTGTGGCTTGTAATTAG
+CCGGGGAGAAGATCGGCTGGAATATAACAACGACCAGGCGGAAACCCGTAGCCATCAAAG
+TTATTCCAGCCAAAACGATAAAGCTAAAGATTTAGTTTCTGATGAGGATGCCCTCGAAGA
+AGTGCTGGCCAATTTGGGCAGGGAAGCCGTAAGAAAAGCTATTAGGTCGCTTGAACCCAA
+GCAGCAAGAGTTAATCTTTGACATATATTACCGGGGCCTTTCCAAGGCGGATGTAGCCAA
+ACGTGATGGCGTTTCTAAAATGGCGATCACCAACCGAATGAACAAGATCATTAATCGGTT
+GAAAAAATATTTAATAAATCTATAAATTCGGGGGGGGTTTACTTTTTGCTCTACCATGAC
+TTGTATATAGAGGCCGTTAACAAAATTTATATTGCAAATCAAAACCGGCCTCTAATCATG
+GTAAAGGTAGGTGAAAAAAGTTGAGTAAAAACGCTTATATTGGCTCCACTACCCGGCACC
+ACATGGAAATTGGCATCAAGAAACCAAATTCCAGCCAAGTGTTGGCGGCAAGGAAGGTCA
+AACTTCGTGACCGGTTCTTAAATGCAATCTTTGGTAAAGGGCACAGCATGGTTGTGCTAG
+TGCCTGGGGAAAGCATTGGCACCATTTCCATTACAGAAATGGAGGTACATGAACTGGAAG
+AAGCGGAAAAGGAATGCGAAAAAATGAAGTCGATACAACGGGAAAAAGGCAGGTGATCTA
+AATCAATGTAATTTTATTCCCGCACCAACAAAGAGCATTAAACCAAACCATGCACCGCAA
+CCTGGTAGCTTACTACCTAGATATGGGACTTGGAAAAACATTTTTAGGTTCAGAGAAATT
+AAAGCAACTAAATGCACCCTTTAACCTCATAGTTTGCCAGAAGTCTAAAATCACGGACTG
+GGCTGAGCACTTTAAGACCTACTATGACTACGAAGTTATTATTTTCAAAAACCAGCCCAT
+CGAAGCAATTCCACCACACAGCATCATCATAATTAATTACGATCTGGTGTGGCGGCGCAA
+GCAGTTAGAGGAATTAAGGGATTTTTCGATGTTACTAGATGAGAGCCAATATATCAAAAA
+CGAAAATTCCAACCGGGCCAAGTTTATTCTTAACTTAAAACCAGACAATGTAATTTTATT
+ATCCGGCACCCCCACCGGTGGAAAGTATGAGGAACTGTGGTCGCAGCTAAGGTTGTTGGG
+GTGGGGTATAAGCAAAAAGTTATTTTACAAACAGTACACCATCACTGAAAAACTTGATGT
+TGGCGGATTCTACATTACCGTGGTCACTGGCTACAAAAACGTTGACCGGCTAAAGGACAA
+ACTTTACCAGCATGGGGCGATATTCATGAAAACTGATGAAGTGGTGGAACTACCGCAGCA
+GGTGGAGCAAATCATTAAAATCCCCAACACCCCCCAGTACAGGAAATTTAACCAAGACAG
+AGTGATTACCATTGATGACGAAATGCTGGTCGGCGATACCGCTCTTGCAAAATTGTTATA
+TCTGCGGCAATTAGCATCGATTTACAACCAACATAAACAACAAGCTTTAAAGGATTTACT
+GTCTTCCACCCATGACCGGGTAATTGTATTTTACAACTTCAAGAAGGAATACCAGCTCAT
+TAAAAGACTAGCTGAAGAACTGGAAAAACCGGCGTCCCATATTAACGGTGACGGTACAGA
+TTTAGATAACTACGATACAAAGGACAACAGCGTCACTCTAGTCCAGTATCAGGCTGGATC
+GACCGGGGTCAATCTACAAAAGGCAAACCGGGTTATTTACTACAGCCTGCCGCTGTCAGC
+AGAGCTATGGATGCAATCAAAAAAACGCATTCACCGCATCGGCCAGCCTCGCAGTTGTTT
+CTACTACTACCTGATCACAGAGAAGTCTGTGGAAGAAAAAATACTGGAAGCCCTAAAGCA
+AAGGAGGGATTTTACCTTGGAGTTATTTGAAAAGGGGGTGAAGTAGCACCAGTGACTGAG
+AAACAGCTTCAAAAGAAAGTCATTAAATATTTAAATTCCCTGCCCAATACCTGGTTTTTT
+AAGGTGTGGGGTGGCGGGTTCCAGCGAAGCGGCATACCGGATTTAATTTGCTGTATTAAC
+GGGTTGTTTGTGGCCCTTGAACTAAAGGGAACGGGCGGTAAATCTACCAAGCTCCAAGAG
+CTAAATATCAATAACATTAACGCTGCTGGTGGCATTGGCCTCATTTTATACCCCGCCGAT
+TTTAAGGAATTTAAGACCCTTGTAAAGGAGGTGAGTAACGGATGCGGTTTAGCCACAGCA
+GAGTTGAATGCTTTGAAAAATGCCGGTACCAATTCATGCTCCGATACATCCGAAACTTAA
+CTACGATTTTCCCCCCGGCAGCGGATAATCCCTTAATAGTCGGTAGCGCTCTCCACTTGG
+GATTGGAAAAAGGACCAACTGCTATGGAGGAATATTACTACAGCCAATACCCGGTGATTA
+ATGACTTTCACATCAACGAAATGATAAAACTGACCACCTTGGTGGAGAAAGCCAATGAAG
+TGCTGCAGGAGTTAACTCGGGGGAAAGTCAGCATATTCGAGTATGAGATAAACTTCCCGG
+AATTTATAGGTTATGTAGATTTAATAGTCCATAACGGTGATGGCAGTGCAGATGTTTATG
+ATTTTAAGTACAGCAACAACATTGACCATTACCTAGAATCCAAGCAGTTACATTTGTACA
+AGTATTACCTGGAGAAACAAGGGTTTGACGTGTTCAAGCTGGGGTATGTTTTTATTCCTA
+AAACCCAAATCCGGCAAAAGAAAACCGAGGATTTATACCAGTTCAGGAAACGGCTAACGG
+AAACCCTGGCGGCCATGCAAGTAAAAGTGGTGGAAGTGAACTACGACCACTCCAAGGTGG
+ATGGATTTTTCCAACGCTGCCATGAGATTCAAAACGAAAGCATTTATGAAAGAACACCGT
+CAAGGCTATGTGCCTGGTGCGAGTTTCAAAAATATTGCGAGGAGGAAATCGATTTTATGT
+TATTACCGAAAAATGAAAAGCGGGAAAGGAAGATGGATCTAAATCCGGATAAGTGGGTTT
+ACGGCGATTCCTATGTAGGAAAGTCCACTTTCATCGAGCGCTATGAAGACCTGCTGATGG
+TAAACACGGACGGCAATATTGACAACCTAACCTCCCCGGTGGTCAGGATTACGGACGAGG
+TGACTTATGAGGGCAGGCTCCGAAAAGAAAAATTAGCCTGGGAAGTCTTTTTAGCAGTCA
+TCGATGAACTGGAAAAGAAGGATAACACCTTCAAACGAGTGGCTATTGATTTGGTGGAGG
+ATTTGTACGAACACAGCCGGTTGTACATTTATAAAAAACTAGGCATTGACCATGAACAGG
+ACGCCGGGTTCGGCAAGGGTTGGGACATGGTGCGGACTGAATTTCTATCGGCTATGAAGC
+GCCTGAAGAACTTAGGCTACCAGGTAATCTTTATCTCCAAGGAACTGACCTCGGAGATTA
+CCCTGAAAAACGGTAACAAAATCACCACCATCAAGCCAAACATCAACGACAAGGTGGCCA
+ATGTACTAGCGGGAATCGTGGATTTGACAGTTCGGGCGTTTATGGATGGCGATGAAAGAT
+ATTTACAGCTGGAGAAAAAGGAAAATGTCTTTGGCGGTGGCCGGTTTAATTTCAAAGTGC
+CAGTTGTGAAATTGGATAAGGATGAATTTATTAAGGCATTAAGGGGCGCTCAGGAAGGCA
+TCAAGACTTATTCCAGGGCGGAAAGCGCCAAGGAAGCAGCAGCAGGAGAAACAACCGGGA
+ATGAAACCAAGGAAGATGGGGCTACGGCAACTGCTAAGGGAGATACCAACGGGGATGAAA
+CTAGCGAGGAAGAAACGGCGGCTACCACTACGGAGGAAACCACTGCGGCGACCGATAAAC
+CCGAAAAACCGGCTAAAAGGAGCAGGCGCTCTCGCAAGTCCGGTAACCAATTAACTAATT
+AAATTACAAGGAGGACAAATTTAATGAGTAGTGTATTTGCAAGGTTCGACAAAGAGTTTG
+ACCTGAAAGGTCTTAAAGAAGACCTGAAAAATGTGGGTACAGGCGATGGCCATTACCGGG
+AAGTTCCCTATGGCACCTATGAAGTGAAAATTGAAAAACTAGAATTGGTGGAATCCAAAA
+CTGGCAAGCCTATGGTCACCAGTTGGATGCGCATTATTGCCGGAGAGTACCAAAATTCTA
+TTTTATTCATGAATCAAGTCGTCCACACTGCCTTCGGAATTCATATGGCTAATGAATTTT
+TACGCTCCTTAGATTCTGGCATCGATGTTACTTTCGAGAATTTTACCCAGTATCACAACC
+TCATTTTGGACATCCATGAGGCCATTGACGGGAATTACGAGTATGCAGTGGAGTATGGGG
+AAACCAACAAAGGATTCAAAACCTTTAAAATTACTGAAGTTTTTGAGGCGGAGTAGGGTG
+CTGTTATTCTATGACGCAGAAGTCTATCCCCACGATTGGCTCTTTGTCATAATCGAACCT
+GCCAGCCAGCAAAAACATGTGTTCATAAACGATGCCAGGGCACTGGCGTCGTTTTATGAA
+CAGCATACTGATCATATTTGGGTTGGCTACAACAACCGGCACTATGACCAGTACATTTTA
+AAGGGTATCCTTTGTGGTTTTGATCCCCATGAAATCTCCAAGTTCATTATAGCAGAAAAG
+AAACCAGGCTGGCAGTTTAGTTCCCTCTTAAACAGGATTAAGCTGAACCAATTTGATGTC
+ATGACCACCTTACACAGCCTAAAGGAACTGGAAGGCTTTATGGGGCATGATATCCGGGAA
+ACAACAGTTAGTTTTGATACCAACCGGAAACTTACAACACGGGAAATTGATGAGTTGGTT
+AGTTACTGCACCCATGATGTGCAAGAAACCATGGAAATATTCCTTCACCGGAAGGAAGAA
+TTTGATAGTCACGTAGCTTTATTAAAGACCTTTAACCTGCCGCTGAATTATCTGAGTAAA
+ACCAAGGCGCAACTGGCGGCTGTGATTTTAAGGGCCAATAGAATAAACCGAAACGATGAG
+TTTGATTTAGTTTTACCCGACACTTTAAGGATTAAAAAATACCGCCATGTGGTGGATTGG
+TACAAGGATGCCCATAACCACAACTATGATAATTTTCTACAGACTACTGTTAGTGGTGTA
+CCCCATATTTTTGCCTGGGGAGGGTTACACGGGGCTAGGGATCAGTACCAGGATGAAGGG
+ATTTTGGTCAATGTGGATGTGGCCTCTTTCTACCCTTCACTTATGCTGGAGTATGGTTTT
+TTATCCCGGAATGTGGAAGACCCCAAACTCTACCAAGAGATTTATCAAGAGCGGTTAAAA
+CTGAAAGCGGAGAAAAACCCCATGCAGCTGCCATATAAGATTGTCTTAAATGCCACCTAC
+GGGGCCATGAAATATCAGTACAACAACCTTTATGACCCCAGGCAGGCCAATAACGTCTGC
+GTAGGCGGGCAGCTGCTGCTCTTAGATTTAATCGAAAAGCTAGAGCCGAAGTGGACGCTG
+ATTCAATCGAACACGGATGGATTAATCGGAAAAATTAAACGCCTGCGGGACTTGGACACT
+ATTAAAGATATTTGCCGGGAGTGGGAAACCCGTACCCGGATGCAGCTGGAATTTGAACTG
+TTCCGGAAAATCTACCAAAAGGATGTCAATAATTACATCATCATCCGGGTAGACGGCAGC
+TATGAATCAAAGGGAGCATATGTCAAGAAATTAAACGAAATTGACAATGACCTGCCTATA
+GTAAACTCGGCCCTTAAAGAGTATTTCATTAACGGTGTACCGGTGGAAAAAACCATCAAC
+GATTGCCGGGAACTGATGATGTTCCAGAAGGTAGTGAAGGTCACCAATAAATTCTCCCAT
+GCTCTTTATGGCAGCCAAAGGTTATCGGAAAAATGCCTCAGGGTGTTTGCTTCCAAAAAC
+GATGATCCCGGTGTTTTTAAGGTCAAGATAAATGGACGACCCCATAAAATAGCCGGTACC
+CCGGAGCACTGTTTTATCATCAACAGTGATGTGCGGGGTAAAAGGATACCTAGAAGGCTG
+GATAAAGATTGGTATGTTCAGGTGGCTAAAAAGCGGTTAGCGGATTTTTTGGGAAAGGAT
+GATCTGAAATGATGACAGTGTTTAAAAATAAAGATTTCGGTGAAGTAAGAAGTATTTTAA
+TTAATCAAGAACCTTGGTTTGTTGGTAAAGATGTGGCGGAGATTTTGGCGTATAAGGAAC
+CCCATAAAGCCATTGCCCGACATGTGGATGAGGATGACGGGATGAAACATCCCATCAGCG
+ATAACTTAGGCAGGGTACAAGAAACACTGCTGATCAATGAAAGCGGCCTGTATGCTTTAA
+TAATATCTTCAAGGCTCCCCAGGGCGAAAGCATTTAAAAGATGGATCACCTCCGAGGTGT
+TGCCAACCCTTAGAAGAACCGGCGGTTATTCTATGCGCCCCAAAGGGCCAAGCCTAAGTG
+AGATTATACGATTTCTAAAGCTGATAAGAGACGTGATGGTTGCCCAAGGATGTAATGAAA
+GAGATATTGCTGTAACGGTAAACAACATCTGCCAGCAATTTCAGATCCAGCTTCCCACAG
+AATTCATCCGGCTATCAGATCTGGAAGTGAAGTTTATGCAGTTTCTTTACAGGGATGAGC
+TTGCCAGGCAAATGAGTAGCGGTGATGCCATAGCGGTGTTTTTAGGTAGGGAAATCAGCG
+ATATTAGCGAGGAAAGGTATCAACAGCTCAAAACCATTTACTGCGACATAGAAAAAAACT
+AACCCAGGAAGCGGGCGGACCTACCAAACTAAAATCATTTTATCGACTAGTGACATTAAA
+AACCGGTGCCAGTTTGGTAGGTTGCCTCCCAAATGAACATTAAAAACAATAAAACAGCCG
+GGGGAAATTATCCATACTGACTGTATGTTGGGACATTAACCATCGTTTAAGCAGAAAATA
+TGTCGGGAAACACTGCCAAAATGAACTGTAGGTCTTCCGGCTACCCCATGCTTTTGGGAT
+ATAAACATCCCATAAATATCAGGTTTTTTATGAAAGAGGTGATGACCATTTGGACATGGT
+TAAGGGTTATATCAAAACCAAAGGTAAAAAACCCATAGAACCTTACCGCAATAAAAAATC
+ATTTTACACCTATGACTATATCCGCAAAACGGGCGGCGACTTTGCTGGTATCCTGGCCGA
+TGGCATGGTGCAAATAGATCTTGATGATGAAAAAGAAGGGAAACTTGTCAAACAGATTGT
+CACAGAAACCGGCCTTAGAAGCGCAATTCTTAAAACCGATCGGGGCATCCACTTTTACTT
+TAGGAACACCGAGGTCAAGAAAAAACAAGTGAAGCTGATGACTCCCATCGGCGTCACCGT
+AGATGTGGCCGTGGGCGAGCAAAATGCACCGATACCGATAAAAGTAAACGGAAAAACCCG
+GCGCTGGCTCAATAAAATCGATGCCATAGAAGATATCGATTTCCTCCCAGATTGGTTGCA
+GCCGCTGAAGAAAAAACACAATTTACCGGACTTTAGTTCCTTAGCCGATGGCGATGGCCG
+AAACCAGGCACTTTTTAACTATATCCTTACCCTCCAGGCCGAGGGTTTTGGCAAGGAAGC
+CATCAAAGGCATTATTCAGATTATAAACCAGCATGTGCTAAAAACCCCTCTGGGGGATAA
+GGAAGTGGAGACTATTTTAAGGGATGAAGCCTTTTTAAAGCAGACCTTTTATATAAAATC
+AAAATTCCTCCACGACCGGTTCGCCAAGTATCTAAAAACCGAGGAGCGGATTATTAAAAT
+CAATAACCAGCTCCACATTTATCGAGACGGGGTTTACAAAAACGATGCCTTGGAAATAGA
+AACGGCCATGATTAAACACCTGCCGGAGCTGAATCGGGCTAAACGCTCGGAAACACTAAC
+TTATTTAGACCTTATAGCGGAAGACAAGGAACCGGCTTCAGCAAATTATATTGGGTTTAA
+CAACGGGATTTTAGATATTGACAGCATGACCATGCATGACTTTTCAGCGGACATCGTGCT
+GCAAAATAAAATTGAATATGATTACATTCCCGGTGTTTACGATCAAATAGTAGATAAAAC
+CTTGGATAAAATTTGCTGCCAGGACAATAACTTGAGGAAGCTGTTGGAGGAACTAGTTGG
+CTATCTGTTCTTTAGAAGAAACGAACTGGGCAAATGTTTTATTCTTACCGGGGGCGGCAG
+CAATGGCAAATCCACATTCCTGGATATGATTAAAAACCTACTGGGAAATAACAATTATTC
+ATCCCTGGGTATAGATGAACTTGGAGTGCGCTTTAAAACGGCGGAGTTGTTCCACAAACT
+TGCCAATGTTGGAGATGACATCAGCAAAAAGTATATGGACGATAGTGCTATTTTCAAGAA
+GTTGGTCACCGGCGAAACAGTTAACGCTGAGCGCAAAGGTAAAGACCCTTTTGAATTCAA
+CAATTATGCCAAGCTGCTTTTTAGTACAAATAAATTGCCTAGGATCAACGATACTTCCGT
+AGGACTTATGCGCAGGCTGGTGATTATCCCCTTTAATGCGGTATTTAGCGACAAGGACAC
+CGATTTTGATCCTTTTATCAAAGACAAGCTGCTAACAAAACCAGCCATGGAATATTTGCT
+GAAACTAGGGATAGAGGGTTTAACCCGTGTGTTGGCCAGTGGGTTTACCGAGGCTCAGGC
+GGCAAAAAGGGAGAAACGGGATTACGAAGTGGTGAATAACCCTGTTCTGGCTTTTGTTAA
+TGAAGGATTAAAAATCGAAAATGAGGCAATAAAGGACGTTTATCGAAAATATGGGACTTG
+GTGTTATGAAAACGGCCTAAAACCTCTTAGCCACATAGAGTTTGGACGGGAGCTAAGTAA
+AAATGGCTACCAATCAGAGGTAAAAAGAATTGGCGGGGAGACCGTTCGGATTTATGTGAA
+GGCCGCTACAGATGTAACAAATGGGCAAAATGATTTGTAACGGTTAAAAGTCAGTTAATC
+CAACAGTTAGGAAGGATGATACAGATGTTACAGATATTCGTTTATCTTTTATAAATAAGG
+GATAAGAAAGATTATAAATTATTTATATAAAAGAAGTATATATATATTTATTTATAATAT
+CTGTAACGCTGTAAAAATATCACATTTAACGACATTGTAATTTAAGTGAGGTGTTAAGTC
+TTGAAAAATATAGTTTTTATCTGCAGTCCCTTTGCCGGGGATGTGGCAGGAAACATAGAT
+AGGGCCAGGCGCTACGGGCGGTTTGCGGTAACGAAAAAAGTGATACCTATTATCCCCCAC
+CTGATGTATCCACAGTTCCTTGATGAGGATGACCCGGCGGAAAGACAACTGGGGATTGAA
+ATGGGACTGGCACTATTGTCACATTGCCGGGAAGTGTGGGTGTTTGGGAGCCGGGTGTCA
+TCGGGGATGGCGGCGGAGATAGATCAGGCCAAGGTGCTAGGGATTCCGGTTAAGTATTTT
+ACGGTGGATTGTAAACCAGTGGGAGGGTTGACCTATGGGATTTGATGCTGTAGACTGTTT
+TGCCCATAAACGAAATAGCTGCACAGCTTTAAAGGTTAAACAGTGTGAAGGCTGCAGTTT
+TTATAAAACCAAGGAGCAGTATGAACTGGGTCAGCAGAAGGCGTTGGAGAGGATTTACAC
+CTTGGATATAGCCAAACAGAAACATATTTCAGAAACCTATTATGGCGGCAAACTGGAGGT
+GATAGCTGATGAAGGCTAAAGAATATTTATCCCAAGCCATCAGGCTTGACCACAGAATAA
+GCAGCAAGCTGGAGCAATTGGAGAACTTAAAGGCCCTGGCCATGCGGGTAACCTCAAACC
+TGACCCAGGAAAAGGTATCCGGTGGTAGAAATATCAGAGGTCCTTTTGAAAACACCATGG
+CTAAGATTATTGATTTGGAAAAAGAAATTAACCAGGAGGTTGACCAGTTTATAGAACTCA
+AACAGGAAATCATGGGCACCATTTGCCGGGTGGAAGATGTGAATTGCCAGTTGGTGCTGG
+AGAAAAGATATATCAGCGGCAAGTCCTGGGGGGATATCTCTTTGGAGCTTGGGTATAGCA
+GGAGCGGGGGTTTTTAGAATCCACGGTGAAGGATTAAAAGAAATTAACGAAATACTAAAA
+AAGTGGACTAAAATGGACTAAAGTGGACTTAGCAAGTGTGGTATAGTGTAAGGTGTAAAG
+ATATAAAAACATATTCAAGAAAAGCCCCAGGATACTGTGGGCTTTAATTTTTTAGGAGAT
+GAAACCAAATGAGAACATGCGCCTATGAAGGTTGTCGGCATGAAATAAAACCCGGCAGCC
+CTTATTGTAAATATCATGCCAGGCTGATTGAAATAGAAAATAACAGTCCGAAGTGGCTCA
+ATGACATGATCCAGGAAATGCGGGACAAAATGAACAGCGAAAAATGCGTAAAGGCAAGCA
+TGGCACCAGGCGATCATCCAGTTAAAAGTGACTAAACAACCATATGCCACGGCTACTAAC
+GAAAATAATCTAAGCTCTGACAGCAACTTGCTCTCAGGGCTTTTTCTATGGAGGTGCCAT
+TATGAAATGCATATCCTGTCGCTTTGCCAGCACCGATAAATCCGCTAGCGATAAACACTG
+GACGGCTTATGAGTGTGGTAACCCAAAGAGCGAATACCATAAATCTTTAATTAACATATC
+CGAAGACGGCAATAAACATAAACGTATCTCCTGGTCCGGCTGCCAGCACGGTGAGAGGAA
+GGTGAAACCCAATGCCACGGAAACCACCAGCGCCATGCCGCCATCCCGGTTGCCCGGAGC
+TAACGGAAGCCAGGTTCTGTCCCAAACACATGCAGGAATACAACCGGCAGTACAACCGGA
+AGGAAAGACCCAAGTATTCCAAACAGCTTTACAACAGTGCCCGGTGGCAGCGGTTAAGAA
+AGAAAGTTCTACTGGAGCATCCCCTCTGTGTAGAGTGTGAACGCCAGGGCAGGATTACTC
+CGGCAACAATAGTTGATCACGTAAAACCCCACAAAGGTAATCTGAATCTGTTTTGGGATG
+AGAACAATTTACAAGCTCTTTGTAAAAATTGTCATGACAGCAAGACCACAAAGGAAGGCC
+GCTGGGGTGATAAGAATAGGGTTTACAGTTATTAGGCAGTCTGGCAGCAGTAGAAAAAAA
+AAGCGACTTTATCCTGCTTAGAATAAATCGCTGTGGGTTCCCGTCCTGGTTAAAGATAGG
+GTCAGGATATCCTTTTCAATTTTGTATATAAGCAGCCAGTCAGGAGTAATGTGGCATTCA
+CGGTGACCACCGTAATTACCGGAAAGCGGGTGGTCAAGATATTTTTGAGGAAGTGGTTTC
+TCCTGGACAAGAATATTTAACACTTCCTCCAGCAGTTTTACATCATAGCCCCGTTTAACA
+ATAGCTTTGTAGTCCTTTTTAAAGCGGCTGGAGTATCTAATTTTCAGCATTTAGATCCTC
+CATCAAGGCATCTACGCTGTCAAAGGTTTTGCTCATATTGCGGTTGTTATTAACATCATC
+AATTGCGGCCCGTGTTTCCTCATTGGGTGTGTCAAGGCGAAGGTCAAAAGGAATGCCGCC
+GTAACGAACGGAGTAACGCAAAAACATATTCATAGCAGTGGACATGTTGAGGCCAAGCTC
+GTTAAAGATAGCCTCAGCTTTACGCTTTAATTCCTTATCGACACGAACATTTATATTGGT
+TGTACCGGCCATAATATCAACTCCTTTCTATACTTATATTGTAAAACATTGTACGCAATT
+TATCAATAAATAATACCATAATGTTTTACTTTGTAATGGAAGGTCATTCTCATGGAGGGG
+GTAGTAAATCGCTGAAAACGGGAGCAAAACGGAGCGGGCGCGGGCCTTCGCGTGGGAATT
+CGCAAAATTCCAGATGGGGGTTGTCAAGGTCTAATGCTTGACATGGCACGAAATACAGCG
+ATTTTAAGCAGGTTAAGAAGGAGGTGGCCCTTTTGGAGATTAAACGCATTCCACTGAAAC
+AGATTAACCCGGCCAAATACAATCCTCGTAAGGATTTAAAGCCTGGAGATCCGGAATACG
+AGAAATTAAAGAAATCTATTGACGAATTTGACCTGGTGGAACCTTTGGTGATGAACAAGC
+GGGGCAACATGCTCATCTCTGGCCACCAACGACTAAAAATTTTACTGGAGCGGGGAGATA
+CCGAAACGGAAGTGTCCGTGGTTGATTTGCCACCTGACCGTGAAAGGGCCTTAAACATTA
+CCCTTAATAAAATCGCCGGTCAATGGGATCTGCCCAAACTGAGCGAGCTGCTCAAGAACT
+TGGATGATGACTTAAAAGATATTACCGGCTTTGATGCCGAGGAAATAGATGAATTGCTGG
+GCTTTAAAGAAGAAGTCCAGGAGGATAACTTTGACGAGGAAGCACCGGAGCGGCCCATCA
+CTAAACCAGGGGACATCTGGCTTTTGGGCAATCACCGGCTGCTTTGTGGGGACAGCACCA
+ACCCAGCTGATGTAGAAAGACTAATGCACGGTGCCAAAGCCAACTGCGTTATTACCTCCC
+CGCCCTACGCCATGCAGCGCAAGGACGACTACGGCGGGATACCGGCAGAGGAATATCCGG
+GCTGGTTTTTTCATGTGGCCAGTAACGTTTACCGGATACTTGACGACAGCGGCTCCTTCT
+TCGTCAACATCAAGGAGCACGTTGAGGGCGGCCAGCGTTCCCTTTACGTGATGAAAACCA
+TCATTGCTTTGGTGGAAGGTGGCTGGCGGTATGTGGATCAGCTAATCTGGACGAAGCCAG
+GGCTGCCCGGTGGCTGGTCTAATCGCCTGAGAAACGACTTTGAGCCGGTGCACTTCTTCA
+CCAAGAAGGAACAGATCGACTGGATGGTGCAGCTGGTAGAGGTTGATGAGGACAGATTGG
+CAACATTACCGGCGGACCTGGTGGAAATGTACGAGGACATTTTCCACTTCACCAAAGCTA
+AGAAAATTAAATTCAAACCCAGGGCGGTAGGCAGTGAATCAGATGCCATCCGGGTCTACA
+GCAAAACCAATAAAACCAAAGGCGACTCCGGTAATATCAGCGTCAGCGGCAAATTCAAAA
+AGGGCATCGCTAGGCCAGGGAATGTGCTATCATTACCCGGCAACCAAAGTTCCGTAAAAC
+ACTCAGCCGCATTTCCAGTGAAGCTCCCGGCCTTTTTCATCAAGCTCGCTACTGATGTGG
+GGGATAACGTTTACGAACCCTTCAGCGGCTCTGGCACCACCATCATGGCCGCTGAGCAGC
+TGGGACGGAATTGCTATGCCATGGAATTGTCCCCAGGGTATTGTGATTTGGCCGTGAAAC
+GCTGGGAGCAGCTTACCAGGGAGAAGGCAGTAAGGCAGGAGGTGTAAAGATTGGAGATAC
+AAAGACTACCGCTGGAGAAATTAAATCCGGCTAAATATAACCCACGGAAAGACTTAAAGC
+CCGGAGATCCGGAATACGAAAAACTGAAAAAATCCATAGAGACCTTTGGCTATGTGGAGC
+CCATCGTGTGGAATAAACGCACTGGTCAGATCGTAGGGGGCCACCAGAGATTTAAAGTTT
+TACAGCACCAAGGGGAAACCGAGATTGAGTGTGTAGTAGTGGATCTGGATGAGCAACGGG
+AAAAGGCCCTGAACATAACGCTTAATAAAGTCACTGGTGAATGGGACCTGCCTAAACTGG
+CCGACTTAATCAGCGAACTGGATAACGGAATATTTGATATTTCCCTAACCGGCTTTGATG
+CCGCTGAGATAGAGGATTTATTTTCCAAAGTCCACGACAAGGATGTTAAAGAAGACGACT
+TCGATGTGGACGGAGCTTTGAAGGAACCGGTTATCAGTAAACCCGGTGACTTGTGGCTGC
+TGGGAAGGCACCGGCTCCTTTGTGGAGATAGCACTAAAGCGCAAACGTATGAAAAACTAA
+TGGACGGCAAAAAGGCCAATCTCATAGTCAGTGACTTGCCTTATAACGTGGACTACGAAG
+GAACGGCAGGGAAAATTAAAAACGATAATATGGGAGACAGGGAATTTTACGAATTTCTCC
+TAAAGGCCGCCACAAATATGTATGAAAATGTTGTAGACGGTGGCGTTGTCTATATTTTTC
+ATGCAGACAGGGAAACCGTTAATTTTAGAACCGCCTTTAGGGACGCTGGCTTCTTTTGTC
+ACCAAACCTGCATTTGGGTGAAAAACGCACCGGTGCTTAGTAGATGCGACTATTTATACG
+CTCATGAACCCATTTTATATCTATGGAAGCCCACAGCAGGCCATAAGTTTTACGGTGATA
+GAAAACATAGGACGGTATGGAATTTTGACCGGCCAGCCAAATCAAAACTCCATCCAACTA
+CGAAGCCAGTGGCTCTGTGTGCTTACCCTATCCAAAACAGCAGTGCTCCCAATGGCATCG
+TGCTCGACCCCTTCTCCGGCAGCTTTTCTACCGGCATTGCTTGCGAACAGCTGGATCGTA
+TTTGCTATGCTACCGAGTTGGAGGAACGCTTCGTAGATGTAGGAGTGAAAAGATACATTG
+AGCATATCGGCTCCGATAGTGATGTCTACTTAATCCGGGATGGACAGAAAATTAGATACG
+CTGACCTGCTATAAATCCCTTGCTATTCCTGTGGTTTTAAGTGATGTATAGACATACCAA
+AAACCACAGGAGGGGACCCAAGATGACCAGAAAAGAGCTTGTACACAAGCTGGCTGAGCA
+TTTAGGAATACGACCTGTCTATTTAGCTGCCCCCAGCTTTGCTTATCAAGTTGGCGAATA
+TACCGTTAACCGACAAGGCAATATCCTTGACAGCGAGGGTCAGGTGCTGGAACTGGAGGC
+GCTGCTGGCAGGCGGGAAGGAGGAACCGGAGTTGGAGATCATAACTGAGCAAAAGGAAAC
+TGCGGAAGCGAACACTTCTGTCGAAACAAAACCCACTGCTTTGGAAGTAGGGATACCTTT
+GGAAGGCTACGATGGCCGGAGTTTGCGGAACCTGCTCCACATGATTTACAGTAAGCAGCC
+GTTAATTAAAAAAGCATTAAACCTTGATGCAGATTTGGTGAGCGAGGAAGTAATAACTGC
+TTTAAACCAGCAGCCCATGACAACTCTGGAGCATTTCCAAAATGCACTGGAAGGTAAAAG
+CTGCCCCGGCATCGACTTTGATTTCAACAAGGGAACCATCACCTTCAAGCTAGGGCAAGG
+TGGAGACGACCCGGAGAAGGTAGAAGCGGCCACTCAATTGTTAGCCTTGGTGAACCTTAG
+CGCCAGGCGCTCCAAGCTAAACATTTCTGCCAAGGTCAAAGCCACCGATAATGAAAAATA
+CACATTTAGAACTTGGCTCCTGCGCTTAGGGATGATAGGCGATGACTACAGGCTAGCCCG
+CCGGGTTCTTTTGCAAAACCTCCCCGGTAACAGCGCTTTTAGAAAACAAGTCCAGGAGGG
+AGCGTAAATGACCAAACCAAGATGCAAATTGGTCGGTGAAAACGGCAACATCTTTAACCT
+AATGGGCATCGCCAGCCGCACTCTTAAAGATGCCGGGCTGGAGGAACAAGCGGCAGAAAT
+GCGAGAGAGGATTTTTAAGTCCGAAAGCTACGACAGAGCACTGCAGATAATCATGGAATA
+TGTGGATGCGGAATAAGGCTGGGGCATAAGCACCGGTCTTTTCTCTAGCTAAACAACCGC
+CTAAATATTAACTTTTAAGGAAAATAACCCTTGCTATTATGTGTGTTTAGAGTGATATAT
+AGACTACCAAAAACACACAGGGGGTTTTCCGAACATGAAAAACTTAACCTTTGGGATAGA
+AATTGAACTCACCGGGATTAGCAGGGAAGCAGCTGCCAAAGCAGTGGCGGGATACTTCGG
+CACCAGCGCCCACTACCTTGGCGGCGGCTACGACAAATGGGAAGCGCCGGACAACCAAGG
+CCGCAGCTGGTTTATTATGAACGACAGCAGCATCAGGCCGGAAACCAAGCGGCAAGGCAA
+AAGAATCGCAGCGGGATTGGACCACCGGTTGGAGCTGGTTTCCCCCATCTGCACCTACAG
+CGACATCGAAACGGTGCAGGAGATTATCAGAGCCTTAAGAAAAGCCGGAGCCTTCTGCAA
+CCGCAGTTGTGGGCTGCACGTCCATGTTGGCAAAGAAAGATTCACCGCCAAAACTTTACG
+GAATCTGGTCAACATTGTGGCCAGCAAAGAGGACTTGATTTACCAAGCTCTGCAGGTGGA
+CGAGCAGCGGAAACGCCGGTACTGCCAAAAGGTAAAGGAGAGCTTTTTGGAAGAACTGAA
+CCGGCGAAAGCCAACGGAGCTGGAGCAGCTGGCCGACCTTTGGTACCAGGGTTACAGCGG
+CAGCCGCAGCCAACATTACCACAGCAGCCGCTACCACGGGTTAAACTTACATGCTACTTT
+CAACGGCCCCACGGTGGAGTTTAGGCTTTTCAACGGAACCACCCACGCCGGGAAAGTCAA
+AGCCTACATACAGTTTTGCTTGGCGGTAAGTTACCAGGCTTTAAGCCAAAAGAACGCCAG
+CGCCAAGAAGACTGAGACCTCAAACCCCAAGTACACTTTTAGAACCTGGCTTTTGAGACT
+AGGCCTTATTGGCAAAGAATTTGAAACCGCCAGGCTTCACCTTTTAAAGAACCTGGAAGG
+CGACAGCGCCTTTAGAAACGGCAGACAGGTGGCTGGGCTTTAAAGCCCGGCTTCCCTTTC
+TGACAAATAGATGTTAATATGTGGGAAAAAGGGTGGTGAAGGCATGTATCTACGGGTAAT
+GACTTTGGATGGCAAACGGGTCAGTGTGGCCAAAGATGAACTGGGAGTGTTTGAGGAACT
+AAAGAGCTTTGCTTTTGTCCCCCACACCATGACTGTGGAAGAGTATATTAATTCCATGGT
+GCATAGCGCCTGGACCTTTTACGGCAAAGGTGTGCATGTCACCGGAGATACCCTGGCAGA
+GAAGGCTAAAAGTGCCTACCGTCAATTCGTGGACTATGGCTTTCTGATTGAAATCACCAA
+GGAAGAAGCCCTGGAGCATTTTGGCCTCACCCAAGCTGATGCAGACAAGATGAACATTCC
+GGGCCTTAGAAGTAACGAATAACGCCCGGTTTAAATAAAAAATACTTGCAAAACCCCTGT
+TTTTGAGTGATAGATAGGTTTACACCATTTAGCCCAAAAAGGGGGTTTTTTGTATGTACT
+ACTTTGCCTACGGCAGCAACCTGAACAAGGAACAGATGATGAGCCGCTGCCCGGATGCAA
+TACCGGTGGCCAGGGTAAAACTGCATGGCTACCAACTGACTTTTAACCGGGTGGCGGATA
+TCGTGGAAGAAGAACAGGCAATTACCTGGGGTGCCATTTACACCGTTTCGTCGGAAGATA
+TTAAAAAACTTGACCGCTATGAAGGCTATCCCCGCCTTTATAACAAAATGCCGGTAACGA
+TAGAGGACGACCGGGGAAACATTTACCAGGCCTTTGCTTATGTGCTGACCATCAAGGGTT
+TAAACGAACCCAGCGATGGCTACTATCACATCATTGAACAAGGCTACCGGGACTGGGGGC
+TGCCCCAAAAACCGCTGCGGGAGGCTTTAAAACGAAGCCTTTTGAGCGCCCCTGTGGGCC
+TTTAGCGTTGGGTTATAGCGGCTACATGGTTGGGGAGCAGTGACTAAGGCCAAAACAGGG
+GGCGATTCGATTGGATAAATTCTTTTCCCAAAGGCACTGCGATCGGTGCGGCGGGGATTT
+AAAGGGTGGCCGGACAATGTCCGCCTTTAATTTGGATTGCATCTGCATGGATTGCAAGGC
+CAAAGAAAAACAGGATAAGGATTACGACAAGGCGGTAAAGGCCGATATTGATGAGATAAA
+GAAGGGGAATTACAACTTTCCGGGTATTAGGAAATAAAAAACAAAAGGGCCAAGTGAGGC
+TCCTTTTTCAATTGGAGGTGAAAAGCTATGGCGACACGGGGAAGAAAACCAAAACCAACA
+GCTCTTAAAGTCCTGGAAGGAAACCCCGGCAAAAGGCCATTAAATGAAAACGAACCCAAG
+CCTGAAAACAAGGCACCCCGCTGCCCGTCATGGCTGGAGCAAGAGGCCAAAAATGAATGG
+AGGCGGATGAGTAAAACCTTAGAAGCTATGGGGCTTTTAACTCTGGTGGATAAAGCTGCC
+TTTGCCGGGTACTGTCAGGCCTACGCCCGGTGGAAAGAAGCCGAGGAGTTTTTAAGCAAA
+CACGGCACCATCTTTAAAACCCCATCCGGGTACATTCAGCAGGTGCCGCAAGTCTCCATC
+GCCCAAACTTACCTGAAGGTGATGAAAGATTTCTGCTCTGAGTTTGGGCTAACACCGGCG
+GCCAGGACGAGGATTAGTGTTGACACTGAAGCAGTAAACACGGACGATCCCATGGAAAAG
+CTGTTAAAAGTAACGAAGTAGGAGGTTTTTTTAATCGGAGGTGATGCCCTTGCTCTACAG
+CGAAGAAAAGGTAAATCACGTTGTCGATTTTATCCGGCAACTAAAACACACCAAAGGTAA
+ATGGGCAGGACAGCCTTTTGAATTAATTCCATGGGAACTTGATTTAATAAAACAAACCTT
+TGGCACCTTAAGGGAAGACGGCACCCGGCAGTACAGAACCGTGTATACAGAAATTGGAAA
+GAAAAATGGGAAATCCTCGATCGCCGCTGCCATTGCCCTGTATATGCTCTTAGCCGATGG
+GGAGCCAAACGCCGAGGTCTATGTAGCCGCTTGCGACCGGCAACAGGCCAGTATAATTTT
+CAATACCAGTGTTAATTTCGTGGAGGGTAATCAGACCCTTTCGAGGGTGACTAAAACCAT
+CATGTCCACCAAAAGAATTGTCTACCCTAGAACCGGTAGTTTTTATCAGGTGTTAAGTTC
+AGATGTAAAATCCAAGTCAGGACTTAACCCATCTTGCGTTATCCTCGATGAAATCTGGAC
+TTATCCAAACCCTGACCTGGCCAAGATGTTGACCACTGGTTCCGGTGATGCCAGGGAGCA
+GCCCCTGTTTATCTATTTAACCACGGCGGGTAACAAGCTGCAGGGCTACGGCTGGGAGAT
+GCATTGCAAGGCCAAGGATATTTTAGCCGGAAGAAGAATTGACCCCACTTTCCTGCCTAT
+CATTTATGGTCTGGAGGAAGATGACGATTGGGAAGATGAAGCCAACTGGTATAAAGCCAA
+CCCAAGCCTGGGCCATACCATTCAAATAGAGCGGGTCAGAGAACATTTCTTGCAAGCCAA
+ACAAGACCCGGCGGAGGAAGCACTTTTTAAACAGCTGCGACTAAATATGTGGCTGAAACA
+ACAGATCAAGTGGATGCCCATGGATACCTGGGCTAAATGCGCTCACCCGGTAGACCCGGA
+TATGCTCAAAGGTAGGGTTTGTTTCGGCGGGCTAGACTTATCCAGTTCCACTGACATCAC
+CGCCTTTGTGCTGGTGTTTTCACCGGTGGCTGGGGACGACAAGTATTACGTTCTCCCCTA
+CTTTTGGCTGCCGGAGGAAACCTTAGATTTACGGGTGCGCAGGGATCATGTGCCCTACGA
+CATCTGGCAGCGGCAAGGATACCTGTTAACCACCGAAGGCAATGTCATCCACTACGGTTT
+TATTGAAAAATTTATCGAAGAGCTGGGCCAGGATTACAACATCCAGGAGATTGCCTTTGA
+CCGCTGGGGTGCTGTGCAGATGGTGCAGAACCTGGAGGGTGCCGGATTTACCGTGGTTCC
+CTTCGGCCAGGGCTTTAAAGATATGTCCCCACCCACCAAAGAACTGATGAAACTGACCCT
+GGAGAGAAGAATTGCCCACGGTGGCCACCCGGTGCTGGCCTGGATGATGGATAACATCCA
+TATCCGTACCGACCCTGCCGGTAATATCAAGCCGGACAAGGCCAAATCAACAGAGAAAAT
+TGACGGTGCAGTGGCTATGATTATGGCGCTAGACCGATGCATTCGGAATGAAGGAGTGAG
+CAAAGACAAATCGGTGTATGATGAACGGGGTTTAGTGGTGTTTTAAGTCTGCGAATATAT
+TGCATATCGCAATACAAAATGGTAAAATATAAATACCAAGAAGGAGGCGATATGTGTGTC
+GAAAACTACAAGTATTTTTGCTCGTGTTGAGCCGGAAATAAAAGAACAAGCAGAAATGGT
+GTTAAATAAACTTGGCATACCTATGTCAAATGCTATTAATATTTTTTTAAGACAGGTTGT
+TTTGCAAAACGGGCTACCATTTGAAGTTAAAATTACACACAATAAACCTCTTGCAGTTAA
+GGATTTAACACCTGAAGATTTTAACAATGAAATTGAAAAAGGGTTTAATGATTTAAGGGC
+AGGCAGAGTTGTGCCTGCAGATAAGGTAGCCGAGCGAATCAATAGGGAATATGGGCATGA
+GTTATAGAATTATTTATACCGAAGAAGCGGAGCAGGATCTTATAAATGTTTACAGGTATA
+TTGCAATGGATTTATTAGTGCCAGAAATTGCGAAAAAGCAAATCGATAGAATCATGAATG
+CAATTAAAGGCCTGGATGAAATGCCCCTCAGGCATAAACTCTACCAAGACGAACCATGGC
+ACAGTAAGGGTTTGAGAGTTCTTCCAGTAGACAACTACCTCGTATTTTATATAGTAATTG
+AAGAAGAGATAGTTGCAATAGTAAGAATAATGTATGGTGGACGTAATATAGAATTGCAAT
+TGTCAAACACAAAAATTGGTGATTAAATATTAAAATCCACAATGGCATCTCAATTGAGGT
+GCTTTTTTCATGCCCAATATTAAGGAGGTGTGGCCTCTAACATGAAAATACCCATCTTAT
+CCAAGCTGTTTAAACCCAGGGCCAGTCCCAAGAACACCTTCTGGCAAAACGCCTACACCT
+TTTTCTTCGGCCCTACGCCCAGCGGCAAAACCGTCAACGAGCGCACGGCCATGACCACCT
+CAGCTGTATATGCCTGTGTGCGGGTATTGTCAGAAACCATCGCTTCACTGCCTCTGCACA
+CATACAGGCGCACCGAGCGGGGCAAGGGAAAAGCCATGGACCATAACCTCTACTACCTAC
+TCCATGACGAACCTAACCCGGAGATGACCTCATTTGTGTTCAGGGAAACACTTATGGGTC
+ATCTTTTACTTTGGGGCAACGCCTATGCCCAGATTATTCGGGACGGCAGGAGCAGGGTGA
+TTGGTCTTTATCCTTTATTGCCCGATCGCATGGAGGTAAGCCGCACAGAAAAAGGCGAGC
+TCTACTACCGCTATCAAAAGGAAGGCCGAGAATATTTGTTGCGCCGTGAAGAAGTGCTGC
+ACATTCCGGGTCTTAGCTTTGACGGCTTGGTGGGCTACTCCCCCATCGCCATGGCCAAAA
+ACGCCATCGGTATGGCCCTGGCCACCGAAGAATACGGTTCCAAGCTTTTTGCCAACGATG
+CCCGGCCCAGTGTGGTCTTAGAACACCCGGGTGTACTGAAAGACCCGGCTAAAATCAGAG
+AGAGCTGGAACCAAATCTACCGGGGCAGCGAAAACGCCCATAAGGTAGCGGTACTGGAAG
+AAGGAATGCAGGTAAAAACCTTAAGCATTCCCCCGGAACAGGCCCAGTTTTTAGAAACCC
+GCAAGTTCCAGATTGAGGAAATCTGCCGCATTTTCCGGGTACCACCCCATTTGGTGGCCA
+GCCTGGACCGGGCTACTTTCAGCAATATAGAAAGCCAAAGTATTAGTTTTATTGACAACA
+CCATTGTTCCTTGGGTTTCTCGCTTTGAACAAGCCATGCAAAAGGCTCTGTTTTCAGTTA
+GAGAAAAACAGCAATATTTAATCAAATTTAATTTGAACGGTAGGTTGCGTGGAGACGCCC
+AATCCCGTGCTGCTTATTATCAAACCATGCGGCAAAACGGCATTATGTCAGCGAATGACA
+TCCGAGAGCTAGAAGAGATGAACTTAATTCCGGATAAATTAGGCGGAAATAAATATTTAG
+TCAACGGAAATTTTGTAGATATGGCTGATGCCGGGGCTTGGAGTGAAAAATATGGAAAGG
+AGGCTACCGATGCATAGGTTTTGGAACTTCGAAGAAACAGATACCGACCGAATCCTCTAC
+CTGGACGGCTACATTGCCCCGGAGAGCTGGTTCGAGGATGAAATAAGCCCCAAAGAATTT
+AAAAATGAGTTAGAAGCAGGAATCGGTAACATCACCGTCTGGGTTAATTCTCCAGGGGGT
+GATTTTTTTGCCGCCAGTCAAATTTACACCATGCTCAAAGAATACAGCGGCCAGGTGCTG
+GTCAAGATTGATGGCATTGCCGCCAGTGCCGCAGCGGTGATTGCCATGGCCGGAGACAGG
+GTACTCATGTCCCCCACAGCCATGCTCATGATCCATAATCCGTCCACTTTTGTTTGGGGC
+GAAGAATCTGATATGCAAAAGGGCATTGAGATGCTCTCCGAAGTTAAGGAAGCCATCATT
+AACGCCTTTGAAGCCAAGACGGGATTGCCAAGAAAACAGATCGCTCAAATGATGGATGCC
+GAAACCTGGTTCAGTGCTAATAAAGCGGTGGATCTTGGTTTTGCTGATGAAATACTCTAT
+AGCGAACCGCCACCTCAGGTCACTGACTTCATGTTTGACCGGGTAACGGTAGTCAATGCA
+CTGATGCGGAAACTACCGGCGGTTAAAGCTCAATCTAAACCGGTAATCAATGAACCTTTG
+AACAGCAGTGGGGTTTCATACGAACAGCTAATCAAACGGCTGGAATTAATAAAAGGGAGG
+TAATATACCATGAGTAAAATTATTGAACTGCGGGAAAAGCGGGCTAAAGTGTGGGAGCAG
+GCCAAGGCCTTCCTGGATGAAAAGCGGGGAGAGAACGGCTTACTATCGGCTGAGGATACC
+GCCACTTATGAGAAGATGGAAGCGGAAGTGGTCAATTTAGGCAAGGAAGTTGAGCGCCTT
+GAGCGCCAGGCCACTATTGATCTTGAACTATCCAAGGCTACTAGCACAGCATTAAAAACT
+ATTCCTGGTGATGGTCCTAAAGGCCGGGCTTCCAATGAATACGATAAGGCCTTCTGGCAG
+TATATGCGCAACCGCAATAGCTATGAGGCCAGAAACGCTTTAACCATTGGCGGTGACGGC
+ACCGAAGGCGGGTATTTAGTTCCGGATGAGTTTGAACGTACCTTGATTGAAGCCCTGGAA
+GAAGAAAACATCATGCGCACCCTGGCTAAAGTAATTACCACCTCTACGGGAGATAGGAAA
+ATCCCAGTGGTAGCTTCCAAGGGTGTGGCTACCTGGGTAGATGAAGAAGGGCCGTACCAG
+GATAAAGATGATGCTTTTGACCAGGTATCCATTGGGGCCTACAAGGTGGCCACCATGATT
+AAGGTTTCCGAAGAACTATTAAACGACAGCGTCTTTAACCTGGAAAGCTACATTGCTAAA
+GAATTCGCTCGCCGCATTGGGGCCAAGGAAGAAGAAGCCTTTTTAATCGGGGATGGTGAG
+GGGAAACCCACCGGCATCTTTGACAATGACAGTGGCGGGGAGATTGGAGCAACCACTGCC
+GGGGCTACTCTTAAAGCGGATGAGGTTTTCGACCTCTTTTATTCCCTAAAAGCCCCCTAC
+CGCAAGAAGACTGTCTTTATCATGAACGATGCCACGGTGAAGGAAATCAGGAAACTAAAA
+GACGGTAACGGTGTGTACCTGTGGCAGCGTGCGACACGTTCGTAATTGAAAAGATTACGC
+ACTGCAACCAGTAGGTTGCGGGAGAACTGACAGTTCGATAGGTAAAATGATGGAGTAACG
+CCCTGAAGTACCTACCCTAATACTCCGAATGGCGTCGAGGTTATTAAGAACGGAACGGCG
+TCATGAGCTCGGTGAAGACGGCTGAGAGCACACCCTAACAGGTCAAGCTGAGGAAAACCG
+AACAATAAAAACGTCGAGTGTGTGATAGGCCGGGGGTCTACAAAACACCTATGGTCAGAA
+TATCCATCCCTAAACCGATGGATGACGAATTCTCGAAGGTAAGGGTCTAGAACAGGATTT
+AGTCGAAAGGCTAGAAATTGCCTACAGTGCAAGGTTTGTGAGGACGAGTAAGAATGTTGC
+CTATGAAAATCCTTATGCCATTACAGGTGGCATCCAGCAAACAGGCCCAGAGAGAAGACC
+TAAGGGTGTATGAATAGATAGAACTATCGGAACGTGGAAAGTGTGCAACGTGGAGGGCTT
+AATCCCTAGGAAGCGTTAGTGAGGAAACCCCACGGGATAACTTACTTTCATGCACATGAG
+AGCAGTGGCACAGTACCTAGGAAACCGTGATAATAAACGGTGGAGGGATAGCCACAAGTC
+AGTACTATCACCACAAATCTCACTTATTACAGCATAAGGTTCGAGTATGACTAAGAGAGG
+CGAAATTCCCAAGAGGGGATGATAAGCCGACTTATGACGACCAAGAGACTTAAGAAGAGG
+CAAAAACTTAGAAACAACGAGTACTACGACATCCAAGAGAAGTTTGATGACCTTTATCGA
+CGCTCGAAGCAAGGTTCGACATTCAACAATCTCGTTGAACTAATAGCCAGTGACCAAAAT
+ATCTTACTCGCATATAGGAACATCAAGAAGAACAAGGGTAGCAAAACCAGAGGTTCCAAC
+CGCACCACAATTATCGACATAGGCAAAACGAATCCTGACAGACTGCTACAGTATGTCAAG
+AACAGGCTTCAGAATTACTCGCCACAGCCGATAAGGCGGAAGGAGATAGAAAAAGAAGAT
+GGTAGGATGCGACCGCTTGGTATTCCAACTATAGAAGACCGCCTAATACAGCAGTGTATC
+AAGCAGGTATTAGAACCCATTTGTGAGGCAAAATTCTATGAGCACAGCTACGGCTTCAGA
+CCCAACAGGGGGACACACCACGCAATAGCGAGAGTGAACTTCCTAGCATATAAGTCTAAG
+CTACAATACGTAGTCGATATAGATATCAAAGGATTTTTTGACAACGTAGACCATGCCAAG
+CTCATGAAGCAGATGTGGAGTATAGGAATTCAAGACAAGAATTTGCTTTGCATTATTTCT
+AAGATGCTCAAAGCAGAAATTAAGGGAATTGGAATTCCAACCAGAGGAACACCCCAGGGG
+GGGATTCTTAGTCCACTGCTTTCGAATATTGTCCTAAACGAATTGGATTGGTGGATAGCT
+AGCCAATGGGAAACTATGCCGACGAAGCACCAATATGCGAGCAAGAGCAAGAGGGTTCGT
+GCCCTCAAGACAGCAGGATTAAAGGAAGTCTACATCGTGAGGTATGCGGATGACTTCAAA
+CTGCTATGCAGGACTAGGAAAGAAGCTGAAAAGTTGTTCTGCGCAGTTAAAAAATGGCTA
+AACGAGAGATTAAAGTTGGAGATAAGCCCGGAGAAATCAAAGATAGTGAATCTAAAGAGA
+CACTATTCTGATTTTCTTGGGGTGAGGATTAAGCTTCAGGAGAAAGGGCAACAACAAGTC
+ACAACCTCCCGAATGACAGAGAGATCGGTTCGGAAGAGTAAGGACAAGTTGAAGAACTGT
+GTTGACACTCTGCAGAGGCAGCCCACCGTAGACAACATGCAGAAACTTAATGCCTGTATA
+TTAGGCCTGCATAATTACTACTGTGTGGCAACAAACGTAAGCAGAGATTTCGACAAAATC
+GCCTTTCATGTCGACGCGAACCTTAGAAATACGAGGTCTATGACAACTCGACGAGGACAA
+CTAACCAAAGCTTTTACCCAGTTTTATGGGCATTATACTGGGCGCCCGAAGTTTATAATG
+GGCATACCCCTATTCCCCATACACTTGGTAAAGTTCAAGCCACCTCCATATTTTAACCAG
+GACAAGTGCAATTACACGCTAGAAGGGCGGAATATGATACACAAACCTCTTCAAGCCATT
+GACACATCGGTATTGCGCTATCTCATGGAGCACCCTGTGGAACAGGAAAGCACAGAGTAC
+AACGATAATAGAATATCCTTGTACGTGAGCCAACGGGGTAAATGTTTCATCACTGGCTTA
+GAGCTTACGACATTCACCGCAGAGGCTCACCGCAAAACCCCAAAAGGGAACGGCGGAACC
+GACGAATATGGAAACTTGGTTATTGTAGTCCCGGAAGTGCATAGGCTGATACATGCCTTG
+GACGAGGAGACTGTTCAGAAATGTCTGTTAGCACTGACGAACAGCAATATAAATTATAAA
+CGCCTCAATCAACTAAGGAAAATGGTTGGAAATAGTGAAATTTGTGTGGGGTAGTTATTG
+ATGGAGCGCCGTATGAGGGGAAACTCTCACGTACGGTGCGGAACGGGGGAAAAGGCAGAG
+ATGATTTCAAAGCCTTACCTATCGTTATCCTCCCTCACTGCAGGCGACCCGAACACTTTG
+TTAAACCGTCCCGTCAAGACCTCGGCTTATGTGCCCACCATTGCCGCCGGGAAAAAAGTG
+ATCGCCTTCGGTGATATGGGCTACTACTGGATTGCTGACCGTCAGGGAAGGATTTTCCAA
+AGGCTGAACGAACTCTATGCCGCCACCGGTCAAGTAGGGTTTAGGGCAGCGCAGCGGGTG
+GATGGCAAGCTGATCCTTAAAGAAGCCATTAAAATTCTCAAGGTGAAAGCGTAGGTGATG
+GTAGATGAGTAATGTTAAAAACTATCACGAACAAGGCGGGCAGAAATGGGTGGTGGGTGG
+CCAGCTGGAGATTACAGCTGGTGGTAAGCTCACCTTCAAGGGAACCGAACTAAAACCAGC
+ACTAGGCCAAACTAACAGTGAAGCCAGCACTGTTGCCGCTCTAAAAGAGGATTTCAACTC
+CCTCTTGGGGCGGCTTTTTGCTGCCGGTCTGATGGTGGTGGATAAATCAGCACTTGAAGC
+GGCCATCACCGCAGCTTTGGAACTTTTAGATAGTGCAGTGGTTGGCGAGGATGTTGGGGA
+ATATCCGCAAGCTGCCTACGATACTTTTGAGAGCGCCATTGAAGCTGCCCTAGGTGTGGT
+GGATGATACAGGTGCTACCCAAAACGAAGTTAGTACTGCGCTTGCAGCATTAACAACTGC
+GGTATCCACCTTTGAAGCAGCAGTAATCACTGTAGATAAATCTGTTCTTCGAGCGGCTAT
+TGCTGCCGCTCAAGATATACTGGATGGTGCTCAGGTGGGCTCCGAGCCTGGCCAATATCC
+GCAAGAGGCTGTTACTGCTTTTGAAACTGCCATTGGTGCAGCACAGGCAGTAGTGGAAAA
+CGCTGATGCCACCCAAACCAATGTAGACGATGCTGTGACTGCTTTAGCTACGGCGGTATC
+CACCTTTGAAGCAGCGGTCATCACGGAATAAACAGCGGGAGGTGGTGAGTGTATGGTGGT
+AACCCTGGAAGAAGTAAAACTGTATTTAAGGATAGACGGTGATGAGGAAGATACACTCAT
+CACTAATTTTATTTCTACCGCCGTGGAAATTTGCGAGGATATCTTAAGATACTCATTGTC
+GGAGTTTGAAGAAATACCGGCGGTAGTCAGGCAAGCGGTTTTGTACTGTGTGGCCAATCT
+GTATGAAAAAAGGGAAGGAACCCACTATTATCTGAAAAACGAAGGCGGCGGCATGGCTGA
+AACCGTAAATGTGATGAAACTGATACTGGCAAACCTTCGCCGGGAAAGCTGGTGATGCAG
+GTGGAGATTGGGGATTTAAGACACCGGATAACTTTCCAGAAACTTACCACTAGCGTCAAT
+GAGAACGGCTTTGAGGTAGAAACCTGGGAGGATTTCAAGACCGTATGGGCGGCAGTGAGC
+AACCTGCATGGCCGGGAGTACTTTGCTGCCGCCGCTGTCCAGGCAGAGAATACGGTGAAG
+TTTACCATTAGGTATTTAACGGGTCTGGATACCACCATGCGGATTGTTTTTCAAGGCAAA
+CAGTACAACATCACCGCTATTTACAACATCAAATATCAAAACCGGTATCTGGAAATCAAA
+GCACTGGAGGTGGTAAGCAGTGGCTAGGGTAGAGTTAGAGGGCTTGGAAGCCCTCATCAA
+TGCCGTTCAAAGGCTGGGCAGCGAAGGCAAGAAAATAGAAAACAAAGCCTTAAAAGAAGC
+CGGTGCTGTAATGCAAGAGGCCATCCAAAACGAAACTCCAGTGCGGACTGGCAAGCTAAA
+AGAAAGCATTACCGTTTCCGGTGTGAGAACCCAGGATGGGGTTAAGTATGTAGCAGTGGG
+GCCGAGTAAGGAAGCCTATTATGGCAAATTTCTGGAACTGGGAACTGTCAAAATGAGAGC
+TAAACCCTTCATGGCACCGGGCTATGAAAACGGTAAAGACCGGGCCACAGCAACCATCAA
+GGAAGAACTGCGAAGGGGGCTGGGCCTATGAGCATGAACCAAAATATAATAACGGCTTTA
+AAGGATATAGGAGTACCGGTACAATTCCAAAACTACACAGGCAAAGCCGATAGCTACATC
+ACCTTTTTCACCTACCTGGATAAACCGGAGCAGCATGCCGATGATGCGGAGTTAATTACT
+GGCCATTATGTGCAAGTTGATGTGTGGAGCAAAACCGATTACACAGATTTAGTCAAATCA
+ATCCATCAAAAGATGCTGACTGCCGGTTTTACCAAACAGAACTTTTATGACCTGTACGAA
+CAGGATTTAGGAATTTATCACAAAGCCATGCGATTTTTTAAGGAGGTGCTGTAGATGGCA
+CAAGTAGGATTAAATGATTTACACTTTGCGATTCTTACCGCTGATACCAAGGATGAGTTA
+ACCTATGAACCCACCGAAGCCTTGGTGGGAGCCATTAACGCCACTATCAACCCGGCGGTG
+AATACTCAGGAGCTTTACGCTGATGACCAGCTGTGGGAATCGGTATCGGCTTTAGGCAAA
+GTGGATGTGGAAATAGAGACGGCGGAACTACCCTTAACTATTCGAGCCAAAATCCTGGGT
+AATGAACTTAAAGACGGGGTACTGATTGAAAAAGCTACCGATGTACCGCCCCATCTTGCC
+TTAGGCTTTAAAAGCTTAAAATCCAACGGCAAGTACCGCTACATCTGGCTCTTAAAGGGT
+GTGGCCCAGCCCATGGCCGAGGACTTCTCCACCAAAAAGGATAACGTGGAACACAAAACA
+CCCAAGGTGAAATTCACCTTTATGGCCAGAGTCCATGATGGCGAGTGGAAAAGAACAGCG
+GATGAGGATAGTGCCGATTTTCTGGGAGCAGCCACCTGGTTTGAGCAAGTACCCGGCGAT
+ACAACGGTAGTGGGAGGTTAAAGCTATGGAGATTACTCTGAAAGTAGCAGATCAAAATAA
+AACCTACACCACAAACTTTATCAGCGCCCGCATGGTCAGAAGAACCATTGAAATATCCAA
+AGACATCAACTTTGAAAACATCTCCCCGGAGGAACTGGATAAATTGATGGACTACATTAC
+CGAGCTCTTTGGCGGCCAGTTTAGCCGGGATGATTTATATGATGGCTTACCATCCCAAGA
+GCTACTCCCCGCCATTACTGGCTGCATCAACGAAGTGGTGGGGCGAATGGCTGAAGTGAC
+CAAAGGTGATGAAAAAAACGCCTAGAGGGGAACGCCATGGCTCCCCAAGACTTTATGGAC
+AGTCTATACCTGGCATTACTAGAAAAGGGCTGGACATTGAATGAAATTGACAGTATGGAT
+ATCATCTACTATTTGAAACTACTGAACAAAAAGCTGGGAGAAGAAAAAGTGTATATCGAT
+GGGGTTTTATAGGAGTTTCTTGGAGTATAATCTAATTGTTAGCGTAGCATAATAATGCTA
+TAATTAAGGCATAATGTAACCAAAGGAGTTGATATTATGCCTGAAATTAGACCGATAAGA
+GATTTAAGAAACACAACTGAGATTTCTGAACTGTGTCATAAAAATGAAGAACCAATTTTC
+ATTACGAAAAATGGCTATGGCGATTTAGTAATCATGAGTATGGAAACTTATGAAAAAAAG
+CTAGCCCAAGCAGACCTCTATAAGAAATTAGCTGAAGCAGAAAGTCAAGTTGAAAACGGT
+GAGCCACTTTTAGATGCTGAAGATGTATTTGAAAAATTAAGGAAGAAATATGTCAAAGAA
+TAGTTATAGCTTAAAACTTACTCCAAAAGCTAGTAAGGATTTAGATAAAATATATAGATA
+CATTACCGAAGAACTTTATGCTGAACAAGCAGCTGTTAATCTTTTGGAGAAAATAGAAAC
+AAGTGTAATGAGATTAAAGGACTTTCCGTTTTCAGGTAATTATTTCGCTGATGAATATCT
+AAAGAAGAAGGGTTATCGAAAATTAATAATTGATAACTACATTGACTTTTATGTAGTCGA
+TGAAGAAGAAAAACAAGTAGTTGTTATGCGTTTTTTATACGGCAGACAAAAATATGAAGG
+TTTACTCTAATAGCATCTGATAAGCAGGTGCTTTTTTTATGCCCAAAGGTGGTGAGCTAA
+ATGTCAGATGTCGGGGATCTAAATGTACGGATCAACCTTGATGCCCTGGGCTTTCAAAAC
+GGGATCAGTAAAATCAATACGGAAATGAAAAAACTGCAATCGGAGTTTAAGCTGGCCGGT
+GCCCAATTGGGTAAACACGGCAGTGAGCTGGACAAATTACGGCTTAAATCCGATAACCTG
+ACCAAAGGAACGGAGCTGCAAAGGCAAAAGGTGCAAGCCTTAGAAGAAGCCCACCGGAAG
+TCTGTGGAGGCCAAAGGCAGTGATGCCAAGGCTACCCAGGAGCTGGAAATTAAGCTAAAT
+CAAGCTCGCGCCAGGCTAGTGACCATGGAGCAGAACTTGGAAGAAGTTAATAACGAGATA
+ACCCTCCAGTCATCCAGCTGGTACAAGCTGGGCAAAGAGCTGGAAGCCGCCGGACAAAAG
+ATGCAGGCTGTGGGCCAAAAGATGGAGCAGGCCGGAAAAGAACTCAGCATGAAGGTTACC
+ATGCCCCTGGTGGGTTTAGGAGCTGCTGCGGCAAAAATCGGCTCGGACTTTGAAGCCGGG
+ATGAGCGAAGTGCAGGCCATCAGCGGAGCCACCGGCACTCAATTAGAAATGCTGGAAGAA
+AAGGCCAAGGAAATGGGTGCCACCACCAAATTCAGCGCCGCCCAGTCGGCAGAAGCATTA
+AAGTACATGGCCATGGCTGGTTGGGATACTGGTCAGATGCTAGATGGTTTAGATGGCGTC
+ATGATGCTGGCTGCTGCCAGTGGCGAGAACTTGGGTACCGTTTCCGATATTGTCACCGAT
+GCCCTGACCGCCTTTGGCATGCAGGCAGGCCAGGCAGGTGAGTTTGCCGACCTTCTGGCC
+AGCACTTCTAGTAGCGCCAACACCAATGTTTCTATGTTAGGGGAGTCCTTTAAATATGTG
+GCTCCCCTTTTTGGTTCACTGGGTTATTCGGCAGAAGATGCAGCCCTGGCTCTAGGCTTA
+ATGGCTAATGCGGGTATCAAAGGGAGCGAATCAGGTACTGCACTAAGGGGTGCTATTGCT
+AACTTAGCTAATCCCACAGCCGGTATGGCCAAAGCCATAAATGAACTGGGCCTCACTATT
+ACTGATGCCAGCGGGGAAATGCTACCCTTTAAAGATGTGATGGACCAGCTAAGAACTGCC
+TTTGCCGGGCTTACCGAAGAGCAAAAAGCCCAATATGCTGCCACCATCTTTGGTAAGGAA
+GCCATGAGCGGCATGCTGGCCATTATCAACTCCAGTGAAGAAGACTACGCCAAACTGACC
+CAGGCTACCAGGGAATACAACGGTGTGGCCAAAGAAATGGCCGAAACTATGGAAGCAAAC
+CTGCAAGGGCAGCTGACAAAATTAAGATCAGCTCTGGAAGGTGTAGGCATACAAATTTTT
+GAGATCCTGCTTCCCCATCTAAATAAGCTGGTGGAGATGCTGCAATCCTTGACCGATAAA
+TTTGCCAGTCTTAGCCCCGCTACCCAGGAAACCATCGTAAAAATTGCCGTTCTTGTCGCA
+GCCATCGGGCCGCTTTTACTTATCGGCGGTAAACTTATCGGTGTTATCGGTGCTGTTGTG
+GGTGCGCTGTCCACAGTATCCGGGGCTATTGCTGTGGCCAGCACTGGAGCAGTTGCAGCA
+ACACCTGCCATTGGAGCCTTAGCCACAGCATTTACAGTTTTAACAGGGCCGGTGGGAATT
+GCGGTTGCTGCTATTGCCGGAGTTACCGCAGCAGGCGTAGCTTTATACAAACACCTAAGC
+CAGGAAGGCATCCCGGCCATTGAACTCTTTGACGATGAAGTATCGGAATCCACCCAAAAA
+GCTGTGGGTGGTTTTTTAGCGCTTAACGACCAGGCTACTTTAGCTTTAAACCAATTATCC
+TGGAGTGGTCAGGAAGTTACCAAGGAGATGGTGGACAACATTGCCGGGAACTTCTCACAG
+ATGGCTTCACAAGTACAAGCCGGACTGGATAAACACCATCAAGAATCCCTGGCGAAAATC
+CAAAACTTTGTCACCAGCAGCACAGCTTTATCTCAAGCTGAGCAGGACGAAATATTAAAC
+AACATGCAGCAGGGCTATGAAACCAGGAAACAAACCATTGCTGAAGGCGAAGCCAGGATA
+AAGGAAATCCTGGATATGGCCAGTACAGAGAAAAGAGCCCTGACCAAAGCCGAGCAGGAA
+GAAATCAATGCCATCCAAAGGCAGATGGTGGACACCGGCATCCAGGTCCTTTCCGAAAAC
+GAAATCGAAGCCAAAGCCATTATGGAACGCATGAAAGCCCAGGCCATAGAGTTAACGGCT
+TTGCAGGCGGCAGAAGTGGTTAAAAACAGCATTGAGCAAAGGGACGGGGCCATTCAAGCG
+GCCAATGAGCAGTATGATCAGGTGATCAAGGAAATCATCCGGCAGCGCGATGAAGCAGGC
+ACCATCTCTAAAGAACAGGCCGATAAATTGATTATCGAGGCCACCAGGCAAAAGGACGAG
+TCTATAGCCAAAGCCGAAGAAATGCACCTGCGGGTTGTTGCCGAAGCCCAGGCCCAAGCC
+CAGGAACACGTCAATCAAGTTGATTGGGAAACAGGAGAAATCAAGACCAAATGGCAGGTT
+ATGCGTGACGATATATTCGCCAAGGCCGGAGCAATTAAAGAAAACGTCTTTACCACCTGG
+GAGGAAATTAAGACCAACACCTCCCAGCAGTGGGAAAGTATCCGTACGACCATGAGCGAC
+AGGTGGAATGACATTAAAACCAATACCTCCGAAACGGTAGCCGCTATTAAAACCAATGTC
+AGCATCACCTGGGATGAGGTTAAGACCAAAACCTTTGAAACCTGGGACAACATCAAAACC
+AAAACTGCTGAAACTTGGCAGGCCATACAAAATAAAATCGATGAACACGGCGGCGGTATT
+AAGGGCCTTATTGGAGCCTACACCGAGGGATATAAATCCGTTTGGGACAGTGCCTTGACC
+ACCATGGAGGAAATCACCGGCATCAAATTTAGCGACATGGCCGATAAGGTAGCTGATGCT
+TTAGAGCGGGTTAAAAAGGCTATTAGCAGTGCTATCGACCGGATAAAAGAGTGGAACGAT
+ACCAAAGTCAAGGAAAAAGTATTTAGTATCACTGAAACCATTACCAGGATCATTAGAACC
+ATTACCACCGGTGGAGGTGGCGGCGGCGGTGGTGATACTTCTGCTTCCAAAGGCGGTGCG
+GCAGCTTCAAACTTTAGCGGCACCAGCTTCTTCCCTGGTGGTTTAACCATGGTAGGGGAA
+CTGGGACCAGAACTGGTGGCCTTGCCCAGGGGAAGTAGGATTTATAACGACCATGAAACA
+AAGAAAATATTGGATGGAAGTAAAGGCATTGTCCAACACATTACCCTCCTTTCCCCTACT
+CCCCTATCCCCTGCGGAAACGGCAAGAAGAATTAAAAATGCCTCTAGAGAGCTGGCTCTA
+GAATGGTAGGAGGTGTAGTATGGACAGAATAGTTATCACTAACCAAAAGGGAGAAAGCAT
+CACGTTAGGCAACCAGGCCCCATATTTCCTTGAAACCATTGACGGTGTCGGGGAAGTGCC
+GGTAGCTATTGAAAGCCAAAAAGCACCCAAACAGGATGGCTCGACTTATCTCGACAATAT
+GTTGGATAACCGGGCCATTTCTATTGAAGGCACGATTATCACGAAGATTGACCCTGCTTT
+TGTACTGGAAGCCAGAAGGAAAATGCAAAGGGTACTAAACCCAAAATTGGGGGAAGTAAC
+TATCACCTACCATCAGAGAGACCAGGTCCGGGAGATTAAAGGTCTGGCCGAAACCACTCC
+GGTATTCCCCGGTGGGCAAGGGAGTAAAGGTTTGTATTACCAAAAATTCTTACTTCACCT
+GCTCTGCCACCAACCCTTCTGGCTGGATACCTTCTATGAAAGCCGGGAGATGTCTTATCT
+CATGGGCGGGATTAAGTTTAAACTAATCCTTCCCACTGTATTCTCCTACCGGGGTTTTAA
+GAGGCGGGCGGTAAACGAAGGCGATGTGGCTACGCCGGTGGAGATAGAGTTTAAGGGACC
+GGCAACTAATCCTACAGTTAATAATCTAACCACTGGGGAATTTATCAAAGTTAACCGGGA
+ACTTGGGGAGGAAGATGTGCTCACCATCAATACCGCCTTCGGGCAGAAATATGTGAGGAT
+TAACGGGCAGAATGCTTTCCACTATATTGACTTGGACAGCGTATTTTGGCAGCTAGTACC
+GGGAGAAAACACCTTAAGCTACCGGAGCAACAACGACAGCATCAAAACCAGGGTTACCGT
+CAAGTGGAAAAACCGCTATGTTGGCCTATAGAAAGGAGTGATTTTGTGGCAGAGCTTTAC
+AGATTTTTTGATTCCGTTGATGGCGAGGACGAACGTTTTTATACCGCAGATGAGTTCGCT
+GAATACTTCCGCCAGTTTATCAGAAACGGCATCTTCAACGGCTCCGGGGACAACTTGCAG
+GTAGGAGCCGAAGGCCAGGACATGCGAACTTTTATTAAACCCGGCTATGCCTGGATTGAA
+GGCTACCTTTACAAAATCGACATTGAACCTTTGGAACTTTACCACCCGATGGCCCATGCC
+AACTACGACCGCATCGACCGGGTGGTGATTAGATTAGATAAGACTTTAGAAAACCGCTAC
+GTGAAAGCCTTTGTGTTAACTGGTACCCCAGCGGAAACGCCACAGGTACCGGAGCTGACT
+AGGGATGAGAATGTTTATGAGCTGGCTTTAGCCCAGGTGAAGATCTTGGCCGGGAAAAGC
+TTTATCGAAGCGTACCAAATTACTGATGAAAGATTAAATCCGGAAGTCTGCGGCGTGGTC
+ACCCATTTATTTGAACAGGTGGACACCACCGAGCTGTTTAACGAATGGCAGTTATACCTC
+AATGCCAGGAGAGCACACGGAGATACAGAGTTTGCCGCCTGGCTTGAATATTTGACAGAT
+AAAAAGCAAGATGCTGGTATTGAGCATGCTGCCTTTTTGGCCATGCTGCAATCAAAGTTC
+ACCGCTTTTCAAAACACCTGGACTAACTGGGTAAACGATAAGCTAACCATTCCGGATGGA
+GCCTTCTACATCCAGTGGAAAACCTGGTTCGATAGAATCCAGCAGGACTGGGATATTTGG
+TTTGACCATGAAGCCCAGCGGGTTTGGCAAGCCTGGGTAAACGAGAAGTTAACGGCACCT
+GATGGCGAATTTTACACCCAGTGGCAGGACTGGTTTGAAGAAATCCAAGACGTAACCAAC
+CTGGTGCCCAGGAGCCAATTCAAGGCCCACAAAGATCGGACTGTCAGGGAAGGTGCCCAC
+GGTCTACGCTTTGCTGCTAATCACTTGGAAGTAGAAATTAATGACGGCAAATGGCGCAGG
+CTGCAAGCACCAATCAGCACATGGGGAGGGATGTAATATGGGCAGCGCTATAAGATTGAG
+CAAGGGTGAATTGACCACTACTTTCGAGCCTTTATACCAGGTGCCCAATGATCGGGTGGT
+GATTCTAAAATCCATCATCTTAACGAACTTAACAGATACAGCGCAAACCATCAGCCTAAA
+ACTGGCCGGGGCTTATGTGATGCGGGATAAAACACTATCCGCCGGTGAATCTTACCAAGC
+ATCGGTATTTGACCAGGTTATTGTATCGGGGGAAGTTATCGAGGGCAAAGCCGGTCAACC
+GGAAGCAGTGGATTACTACATCAGCGGCAAACTGCTCCTGCCCCAGGACATCGCCAGTGA
+AACCCAGTGGATGCAAGAGCAGTGGGACGCCTGGTGGGCAGCGCACCCGGAAGTATTCGA
+AGTGGTTTGGGATGCCTGGCTGCAAAGTAAAACCCGTGAACCAGATGGGGCCTTTTATGC
+TGAGTGGAAAGAGTGGTTTGACTATATTCAAGGACTTAGCTTTGATGCCACCGACCTGGT
+GCCCTGGACTGCTTTTAGGGACCACGAGGCTGATTTTTCCGCCCATGGGGATCTGGCCAA
+TACCTACCGTTTTGGGAAAGACCACAAGGGGATTTTCACCACCATTGAATGGCACCGGCA
+AGATGGAACCCTGGCTAAACGGTCTGTGTTAAGCGGCGGCAACTCACCACGCTACGAAAA
+CCGGACGGTTACTTATTATGAGGCAGATGGAGAAACAATTAAGACTGCTGTTGTATACAA
+CCAAATATATGACGAGGCAGGAAACTGGATAGAGGAGGTAATGGCAAGTGAGTGATTTAT
+GGCTGCACGGCTTGGGGCAAACATCAATGGGAGATCCGGGGGTTATTCCCATTGAAGGGT
+TAACGCCAATTATAGCATCAGATGAGATTAAAGGGCTGGGATTGCCTTTTGCCTACCGCT
+CATTGGGAACCTTGTCCAACCGTAAAGGTGTTAACCACTACCACAATGGGAAGGTCTATG
+TACTTCACGGCCTGGGGGTGACTATTTATGATGCGACTACCGGAGAAGTGATAGCCGATA
+ATACCCACACAACTTCTTCAGCGCATATGACCCCTGACCTTGCGGCTACGGATGGTAGTT
+ATTATCTTGCGCAGGGCACAACCCTATATAAATATGCCTCTGATGGTGCTTTAATTTGGA
+AAGCAGAGAATGTTGGTTCTTCATACTGTATCGCAGTAGAAACATCTGGTGTTTATGTTG
+GAGTTAGTGCATCCTCGGCTTATTATATTAAAAAATGTAACCGAACCAATGGTCAAGTTA
+CGTGGACATCAACTAGCCTAAGTAGTAACATAGCGGCATTAGCGGTTAACAGTAATACAG
+TTATTGCGGCTGACCAAAGTTATAAGATCTATAGGTTAAATCCAAGTAACGGGAGCACGG
+TATATACTTACACCATACCTAATAACCGCTATGCCTATGCCCTAGCCATTGAGCCGGGTA
+CTAACCATTTTTACTCAATAGATAGTTACCATGTCATACGAAAACATAGCTACCAAACAG
+GCGAGCCAATTTTTGAGAAAACCAGCGCCAACACAACTACCGTATACAATCTATTCATCG
+ACAGCGAAAACAACATTTATACCGTCTCCAATCGGGAAATCACCAAGCTGGACAATCAAC
+TGGCCGGTTTTATCTGGCGAGAGGATCACAACATTAGCGGTAACCCCATTTATGGTTTCG
+GCCTTGATAAAGAGCAGGGAAAAATCTATGTGCTGCGCCAGCATTCAGCCCGCATTTTAT
+CTACCGATAAAGAGTGGTCGGATTTTATCCCGCATCAATTTGAAGGCGTAGTAAATTCCA
+TTGATGTGGATGTCAACGGCAACTTCTACGGAGCCAGTGATGACTGGACGGCAAGGAAGT
+TCAATGCGCTGGGTGAGCAGCAGTGGGTATACCGTCATAACCTTGCTTTGAACTTTGTCA
+AAGCCGATAAGAACGGTAATGTTTATATTGCCGATACCAACCGAACCTTGAAAAAACTTA
+ATCCGTACGGGGTGGAACAGTGGTCCTGCAGCATTTCCGGTACAACAGGTGCGGTAACAG
+ATTTAGTGGTAAACAGCGAAGGAGTAATCATTGTTAGCATTGCTTATTTTCATACTTCCG
+GCTCCAAGGACTATTTAGTCAAAATATCCCCGGAAGGAACTTTGTTAAAGACCATGGAGA
+TTGGTACCAGCGGTGTGTTTCGTAAACTGCATCTGTGGGATGACCGCACTGTAATGGCTT
+TTAACAAGTTGTACGACATCGACACCCTTCGGACTATACGATATTTCAGTGCGGCAAGGG
+CGATATTTGGTAGGCATGGAGATTTTCTCTTTGGTGTTTATGATGATGAAATCAGGGTAT
+TCAATAAATATTCTGGTGGGCAGATACACTCTTTTGAAGTAAGCGATATTAACATTACCA
+ACTTCTATTTGCGGGCTGTCCAAGGTTTGGACGGAGCTGTTTACGCCTGGGATAATGATA
+AGACCTTGATTAAATTCAATGAAAAAGGGGAGAAATTCTGGCGCTACAAGGCAGTGGAGA
+AGATTGCGGATATCAAGGTGGATGACGAGCACAATATTTATCTGGCCACCGGCTACTATA
+TTGAAAAACTAACCCAAACCTTTGGAATCAAGGGTTACGATAAAAATTAGAGGAGGGCTT
+TAATATGATTTATGTATTTGAAAGCGGCAGTATCGTTTACGATGAGAGTGTTTTGGCAGA
+GGCGGATAAGGCCAGGGCTGTGGCGGTGGAGCAGCTGCCGGAGCAGGAAACGCCAGTAGG
+AAAGATCGCCATTATCAAGGCGGACAAGGCAACGGAGACCGTTTGGTGGGAATATGTAGA
+TTCCCCTGCGGCTGTTGAATTTCGAGAGCTTGAAGTTCAAATCCAGGGGCTTCAGATGGC
+CTTAGCAGAACTGACAATATTGTTAGCGGGAGGTGAAGCATAATGACCTTTGATAAAAAC
+TCGGCATTGGTTAAAAACGTATGGGTTCCGCTCATACTGGCCGGAGTGTACACACATGAA
+CAGGTGCCAGCCTTGGGAAATCTAAGAGCAGTGGTGCAGCAAGTATTAGCGGAGATGGAG
+TAACACCTGGAAGGGGTGTTTTTTTAATGTTTTTTCTTTCCCCTTTATTGTGGTAAAATA
+TGGCAGGAGGTGGAAAATGGAAAGAATAACTTGTAGCGGACCAATACTAATAAAATTTGC
+ACCTTTGAAGTTGGCGAAGAGTTTTCGCAGCGGTACAATTTATATGAATTCGCTGGACTA
+CTTTAGAGGTCTAGAAGATGACAATAAAGTAAGAGGAGATCTTTTGGAAGGTACACATAG
+TCTGATTGCAAAAGATGATTTTAGCCAGGTGTTGCCTCAATTTGGTATGGATTTTCCTGA
+AGCGATTAAGAAAAAAATAATTGGGGGCATACATCTGTTAGACGAAGAGTTAAAATATTA
+TAAGGTTTTTTGTATGTATCAGTTAAATTGTGATTTTAAGAGCAGGTACATTGAGCCTAT
+CGATACCAGGGTAAATAATTTTGGAGATACTTTTGTTTTAATATTTAATCTTAAAGAATT
+TAGAAGAAGGATTGTTGCTGAATTAGAAAAAGGAACATACAATGCCCTGGGATTTGCCGG
+ACAAGGTGTGGAGTATTATCAATATGATACTTCTACTCAAAAATTAGGCCCATTAAAAAA
+GTTGGATTTATATAAGTGGCAAAATGAGTATAGGTTAATTGCTGAACCACTTGAACATAC
+ATTAGATCCGTTAATTCTTAACATTGGTGATATCTCTGATATTTCGATAATTGGCTCAAC
+AAGTAGGTTAATTGAAGAGATTCATTTTGAAGGTAAGGAGCTTTTTGTACCAGGTTATAA
+CTTATAACCACAAGAAATTGATAGAGGTGAGCCATGAAACCAATACGCATAATAACCCCG
+GCCCTGGAGCTTAAGGGAGAGGTAGACAACTATCTCTCCCTTTCCTTTTGCCGCAGCTAC
+CACTCGCCTGGCGAGTTCCAGCTGGTGACAAACCGCAAGGTGCAAAACGCCAATCAGCTC
+GAAATCAACAATCTAATCATGCTGGGGGCTGACCCGTGCAAGACCGGCATCATCCGCCAC
+AAGGAAATTAAAAGCAATGACAAAGGAGAAGAAATGCTCACCATCAAGGGTTACGCATTG
+GGGACTATCCTTCGTCAGCGCATCACCATCCCACCTGTCGGACAAGCCTACGACATCCAG
+GAAGCCAATGCGGAAACGGTCATGAAACACTATGTCCGGCGAAACTGTCTACAGATATCG
+GAGATGGAATTTCCGTTTCTTGTGATTGGTGATGACCAGCAAAGGGGAGAAAACGTTAAA
+TGGCAAACACGATACAAGAACCTGGCTGATGAGCTGGAACAGATAAGCATACTTACTAGC
+CTTGGTTGGCATATCTACCCGGACTTCAATTCAAAGAAGTGGATATTTGACATATATAAT
+AGAAGGAATTTTTCAGCCGGTCAACAAATAAACCCGCCGGTTATCTTCTCACCGGAGTTT
+GATAACATCAGAAGTCAGGAATTTATTGATAGCTTGGTGGGCTTTGGTAACTATGCAATC
+GTAGCTGGTCGAGACGAGGGAGCCAATAGAGAGATCATGATGCTGGGCAGCGATGCTACT
+GGTCTGGATCGCCACGTTATCTTTGTTGATGCCAGGGATGTTAAAGATACTGCTGACCTG
+CCAGCAAAAGGTGAAGCAAAACTGGTTGAGCATCAAAGGGTTTTATCCTTTCAAGCCGAG
+GTTTTAACCGCTGGGCCTTTTAAATATCGGGATGATTGGGATGTTGGGGATATCGTCACG
+GTGCAAAACAAAGCTTGGGACCTGACCATGGACACTCGGATTACAGAGGTGCAGGAAATC
+CATGAGGCTAGTGGCTTCAAACTGAACGTCACATTCGGCAACAACCTCCCCACCCTATCC
+CAGAAGTTAAAAACGGCCCTGGGGGAGTTCAAAACAGAAAGCACACGATAAGGACGCCTT
+TGACAGGTGTCTATTTTTTATGAAAGAAGGACGATTGCATGAAAGATATCATTCATACCC
+TGCAGCTTGCCTTTACGGCAATCGGCGGCTATATCGGCTGGTTTTTAGGTGGCTATGACG
+GTTTAGTCTTAGCTCTGGTGGCCTTTGTGGTCATTGATTATATTACTGGACTGATGGCAG
+CAGTTATTGAAAAGAAGCTTTCCAGTAGTATCGGCTTTCGGGGGATTTTCAAAAAAGTGC
+TCATATTTTCCTTGGTGGGTATAGGCCACATTATCGATTACTATCTGATTGAAAAGGGCA
+GTGCAGTCCGTACCGCTGTGATTTTCTTTTATTTGTCCAACGAAGGATTGAGCATCATCG
+AAAATGCATCCAAGGTGGGCCTGCCCATACCGGAGAAGCTGAGGGTGGTATTCACGGAAC
+TTAGAAGGGAGGATAGAAAGAATGGCTAGAATTTGTATCGACGCCGGACACGGTGGAAAT
+GATCCAGGGGCTGTATATACGGGAAGAAAGGAATCCGATGATAATTTAGCACTGGGAAAA
+GCAGTAGCGGCAGAACTAAGGCGGCACGGGGTAATTGTTGATGAAACCAGAACTGCTGAT
+GTCACTGTCAGCCTCAATGAAAGGAGCAACTTTGAAAACCGGCAGTCTTACGATTGTTTC
+ATCTCCTTCCATCGCAATGCCTTCAAGCCAGAGCAGGCCACGGGTGTGGAAACATACACC
+TATTTGAACCCAGGAGCCAAGGCCAAAGGGCTAGCAGAAAAAATCCAAACTGCATTGGTG
+GGTGTTGGCTTTACCAACCGGGGTGTTAAGGCGGCTAACTTCCATGTCCTTCGGGAAACA
+AAAGCACCGGCGGTATTGGTGGAGGTGGGTTTTATTGATAACACCGGTGACAACCAACTG
+TTTGATGTTAAAAGGGATGAGATCGTAGCGGCTATAACTAAAGCAATTCTGGAACAGGTG
+GGTATCAAATATCTGCCATCTACTCCCCCATCACCCAAGCAGCAAACCGGCCAAACATTA
+TACAGAGTAATGGCAGGCTCCTATGCTGTTAGGGAAAACGCTGAAAGGCAGGTGGAAAGG
+TTAAAGGCCGCCGGGTTTGACGCCACCATTATGATATTTACGCCTTAGGCTAAAACGCTT
+AGGGCTTCTTTTTTTCAACGCCCAAATCCTTAACTTTTCTAAGTTGAATTATAAGTAATT
+ATAACTTGATGTTATCCCAATGTAACGGTAACATGCTACCTACCAAAGGAGGGAGAGAAA
+TGCTCTTAAACCAAGCAATCGAGGGTTTTACAAAGTACATGCACCTTATTGATAGATCGC
+AGGAAACCATTCGGGGCTATGCCATAGAATTGAAAGGGTTTAACAACTTCTTGACTGTCA
+AGCATAACTGCCCGGTGTATTTGGAAGACATTGTGCTTCAGGATTTGGAGGACTACCTGT
+TCTACGAAAAGGAAAGAGGGGCAGCCTCATCTAGTAGAAGCCGCTCATTATATATTCTAA
+GAAGCTTTTACAACTACTGCTGCAGGAAGGACTTATGCGTCAAGAACATTGCCAGCTTAC
+TGGAGCCAGTGAAAATCAAACAAAAGGAACGAGAGTTTATCACCGAGGATGAGCTCGGGG
+AACTGGTAGCTGCCATTGAGCAACCAGTCATTAAAACCGTAGTCCAAGCCATGTTTTACA
+CCGGTGGCCGGATTTCAGAGATGATCCACCTGACACTTGAGGATGTGGATCTGGATGGCC
+GGGTGTTACACATCATTGACGGCAAGGGCGGCAAAGACCGGGATGTGCCCATCAATGATA
+AGCTACACCGGATTTTGACCCACTACCTAGAGCACATCCGGGACGCACATTCAAATCGCT
+TCTTTGCTTTAACCAGAACCGGCAAAGTATCGGCCAGCTATATCAACTACTGGATTCATA
+CCGCAGTAGAGGAATTGGGCTGGGACAAGAACATCAGCGCCCACGTGCTTCGGCACTCCT
+TTGGCTCCAACCTGCTGGAGAAAGGGGCCTCGGTGGTGAGCATTCAAAAGCTGCTGGGCC
+ACTCAAGCCTTAGGGTAACGTCAAGATATCTGCACCAGGACACGGATAAGCTGACTGAAG
+CGGTTAATCTTTTATAGGGAGGGATAAAACCATGGAACCTATTTACGATGAAAAGGTCAA
+ACGGATTATTGAAATGCTAAAATTTAAAACCAGGGATGAAGTGGCGGCAGAGTTGAAGTA
+CAAGAGTTACAAAAGCCTTGATATGTACATGCGCCGGAAGAACTTTGCTTTCGACAGCCA
+GCAAGGTCAGTATTTCCCCCGGAAGAACAGAATTGAAAAACCAGACCCCAAAAGCTACGC
+ACCCACCAAGGTAGCCAGCATCATCACAGCTTTTGAGATTGAGGGCATTGACCCAAGGAT
+GGTGGCCAGACAAGAGGGATTTGCTGACCACCGGGAAATGGCTGAGTACATGAAAACCAA
+GGGCTACGAGTGGAACGTCCATAAAAACAACTATGTCAAGACCGTGGGTAGGATTGATGT
+GCCGGAGCCGGTTGGTGATCCAATGCCGGAATCAATCAACCTACCAGGGCCAATTGTTCA
+ATCGGCATTATCGCCAACCGTTCAACCAACCAGCGGGGAATTACCGGAGGGGCTTGGGGA
+ATATCTGCCCTTCCTTCGCTTCCTCTATGAAAACCGGGATGAACTCTATCAGTTACTCAC
+CGGTACCAGGGACGATGGCATAATTCCAAGGTATGCTGTGCCAGGGGAAGTCAGGACTAA
+AGCCATTTACATGAGTGATGTTATTGCCAAGCTGGCCGGGGAATTTAGCAAGGAGAAGAA
+GGTTGCCTTAAGGGAAGTCATGGAAGGGGCGCTAGTGGAATACCTGATGAGGTATGGGTT
+CAAGCGGGAAGTGGAAACGCTCCTAAGAAACCAGTAA
+>NC_021184.1|provirus_4563831_4615358
+TCACTTCTTTAACCCACCCTTCCTTCGGCTAGTGATAAGGTGTATTTGGCCATCCTTTTG
+TTTTATGAAATGCTGCTTCATCTCATCTGTTAAACGCACTTTTCTATCCTCCGTGATAAA
+GGCAAACCTTATTATGTTAATATCCGTAAAATCTATGGCTTCCAATTTGTTTTTAAGATA
+TATTTTCCACCTAAGATTGAGGTCAGTGTTGTCCTGCCAATTAGCATAGAAGGTGTTATC
+AGTGTATAATTTAGTGTCTAGGCTAAGATATAATTCCGCAATAATATCAAGTAATAGTAA
+AACCCTGGTATTATTGTCACGTAAGACGTCCGGCTCCTCCATATACTCAAGGAAGTGCAA
+AGCCCTATTTCTATTAAATTCCCGCTTCACGCCTTTTTTAGAACCGGCAAAATTCTGGTA
+AAACACTTCTTTGATCATATACTCCAGATATTTAATTTGGTTGCGAATCCAGTTTTGGAA
+ATCAGGATTAGATCGCCTTTCATCATTCCTCTCCCCCAAATATTTTACTAAATACTTCCC
+AAAAACAAGTATGCTAAACTCACCTTTTGTGTTTGCAGATTTTATTTCCGGGTGCTCGAT
+AGCCCACTCTCTTAATGCAACTTCTACGGCTGGCACCAGGGTCAAATATGAGCATATATA
+ATTGCCGATCATTAGATCATAGGTAGCGCTTTCAATCACTTTCGTTAAACGGCTCAATAT
+CTTCGAGGGTTTAAACCTATATTCAATCTGATATGCTCTTTGCCATGGATTAATTACCAT
+CCTTAACACTTCTCCCTCCAGCCCTCCCCAAGCCGGATCCGGATTTTCTAAACAGCCTAA
+TAATTCCTCAACCTTTTTCCCGGAGACACAAGGGTAAGGAGGAATAGTAAGCAACTTGTC
+CTTTAGATGGTCATCAATTTTGTCGAAGGCCTCCCATAAATTCATGTTATCCCCCCTTTA
+GGTAAATATACTATTTAAAACACGCTTCACCTCTTATTACCTTGAGAACCTTAACGATTA
+AATGACCTCTGATACGTTCCGACGGGGCAGTTGTTAAAAATAAAATAACCAGCCAACTAG
+GTAAGCCGATATACCCTATCAGGCCTACCTGTTTGGATGGTTGTCCTGGTATAATGAGAT
+AGAATCCATGATAGCAAAAATATGTGTATTGGCAACAATTCTTCATGTTCTGCGCAGCTA
+TATTACTACATTGTAACTATCTCGCTTAATTTTTTTATGTTTTCTTCATCTTGAATATCA
+GTCCAGCATGAACTGATATTTTTACTTTTACTCATCTCGGCTTTTTCTTCTCCAAATGCA
+CTTTTTGTTTTTTCGTAATTTTTATCGCTGACCGTTTTTCCTATTGGATTCCTTTTCCAA
+CCACAAAAATATATCTTGCTAGCCTCCTCAATGTTCCTCCTTTTTGAAGCAGCCCTTATG
+ACATCCGTATAGTTTGGTTTCCGCTGAAACTCCTTTGGTATTTTTCGATTTAAAGCCTTA
+AAAAAATCGATTGGAGCAAATTTATGGTTGGGGTCATATTCTAATTCAAGATATGCAACT
+AATTTTTTGTAATCTTCCATGTAACACTTAACTCTATACCCTTTTTTTATTTCCAGTTCA
+AATACTTCAGGATTGATGCCAAGTGTTGTCAAATATAGCCGATAAGGTAATATGTCCGTC
+AAAAAGATACAGCTAAAATTTTTTCCATTATAATCAAAGGGGAATATTGCCCTCTTTTCT
+TTTTTTTGCTTCATATTCTTATGAAGTATTCTCAACCCACTAAATTCAAATATCCTCATA
+CTACTACCTTCTTTTTGAACCGTATTTGCTCTCTTTCTCCGATTCTCACTTTGGCCTTCC
+GCCACGCTACCCCGACTATATGTAAGCACTCAATCCGAAAGTACATGGTTACGCCTCTTG
+AAACATGCGACAATACCTCCATAAGACTTAAAACTAAAGAACGGAGGTAAAAGGGGCAAA
+AAGGAGAACGACAAACCCTTGTTAAGGAATACAATGCTAGTGGATTTTATGACAGAAAAC
+AATCATGATAATGCTTAACACAGAAGAATGAATAAAATTATCCACTTATTCCCGCAGTTG
+CACATTAATGTTAACCGTCCCCTTGTTTGATATATAAGACTATCCTTTATGTTGACTGCT
+ACGCCTTTCGTTACTGGCCGTTCTTGCCATTTCGATGCCCCTTGACTATATGGTAACATG
+CGTGGGTAGAAACAACAACACAAAAGAGCCATCCCGTTGTGTTGTGTTGCCAGCCCCCCA
+GGTAAGCCAGATAACTCCTATCCGGCCAACCTGCTTGGCTGGCTATATTCCCACCCACCC
+GGCTGGCTCACAATTCCTATATCCCCACCCACACGGCAGCCAAAAAACAGGCCAGGCGAT
+CCACGTGGGACCGCACTGGCCTTGGTTAGCTGATTGGGACTAATTGGATGACACAAAAGA
+ACTGTCCCCTTGTGCTCTTCGGGACTGACCCCTTTTGGGAGGAACTGGATGGGGCTTTTC
+GAGCCCCGTCCAGATTCCGACCCGTGCACTTCATTTTTCAGGACAGGATTCCTGTCTTGT
+AACAATTGTTCACAATTTTGAAATATATGTTCATCCCTCAGAAAAGAATGCTTAATATTC
+TTTCGTTATAATGTAGTTGTTAAATCCTAAGCACTTAAAGCAAAATGCTATTATTTAACC
+GGTCAGTTAAATTCATTCCTGTCCTTTGACAATTGAATACCACCGGGGGCACAACAATTC
+ATGCTGGCTATCTGCTGGACCGATTCCAGGGCTGAAAGGGAAAAAACGAGCATAAGGGAG
+AACAAAAAAAGAAAACAGCTGGGCGATCCGCGTAGGACCTCCCGGCTGTTAAATTCTTTA
+TCTCGCTAAACTGTTAACGCAGTGGGGGACTGTCCCCTTTTGGGAGGTTTTGGGAGCCAG
+TTAGGATTCCCGAAACCGACCCGAGCATCGACACCACTTGCCAATATTTACCTCGTTTTT
+TATACCCACAAAATCTCACCTGTGCAACGTATATTTCTATGGAAGAAACAAAAAGGTCGG
+TTAAACCTTATATACAAATGGAAAAACCGATTTATAAAATGCTTGTATGGCACTTATTAC
+CTGTTGTATTTTTCGACATATTATACTATACTTAGCTATACATATTAAATTTTAGAAATC
+TAGGTTTTTTTTGACTTAAGTTACAAATTATTGTATTCAAATTTTTCTAAACCTAGTGTT
+AAGACTTTAGCCGGGTTTAGCTGGTTGGGTAGGTTAATTTTTTTCGCTCTTTGACATTTG
+AATATTGTTCGGTGAGCACAGTGAGGACAATTACAGTGCTGGAAGGCTAGAAAAGAAGGT
+AGCCTTGGTGTTGTAGACTTCACAAAATGGTTCCGACGTCTTTGGTGCTGGTTCTGACAG
+CCAACTCAGGGGGGGGCATGACACAAAAAGAAGACAACCGGGCGATCCGCTTGGGACCTC
+CCGGCTGAAAAGCTCTTTAATGTGTTAAATTGTTAACGCAGCGAGGGACTGTCCCCTTTT
+GGGAGGAACTGGATGGGGCCGCCAGGCCTCGGCCAGATCCGACCCGTGCATTTCTTACAA
+AGAGGTGCCCCCAGAGGATTTAACCCCCGGGGGCACAGACCATTGGCACGCGTTTACAAC
+TAATAAGTTAAATGCCTGGTACGTTCTTTGTTAAATCATTTACGGCAAATCAACTACTTT
+CTGAGCATTGTTTACATTACCGGCAACGTCTGTAAGATTTGCTGTTACATCAGCAGCAAA
+AGCAGTATCATTTGCGCCATCGGTGTTTGCTACTGTTAATTCAGTATTTGCAGCGTTCCA
+GGTAAAGGTCAATGTTCCTGACACTTTTGCCGCATCTATCGCAGTCTCAACAGCAGTCTT
+GCCAGCAGCAGATAATGCTTCAGAGAATGTAACCTTAGCAGAATCACCATGCGCAATCTG
+TGCTGTTATAGCAGTTGCGACAGTCGGCAGAACACCATCAGTTACAGTAACGGTAATGTA
+GTCAGAATATGCACCTGAAGAAGCGATCACGCGGAATTTCGCACTGTCCTTGGTGAATGT
+GGTATCGCCACCAACTTCAGTTACACTAACTGCTCCACCAGCAACCGCAACAGTATCGGT
+TGCCATACCGGTCACACCGTCCATAGGAGCGAGTAAAGTTGTTTCAGTACCACTTAAGGA
+ATATCCACCGAACTGGTCAGTGACCCATACAAAAACGTCCTGAGCTCCGCTTTGGTCGGC
+ATTGTTATATCCAGCAGCATTTGCTACGGTGTACTCTTCAACATCCTTGGTTGTCGTGGC
+TTTAGCATTAGTAACGCTCGGTGTAACATTCTTGAATGTAACAGAAACTGCCTGAGAAGC
+ATCCTTGGAAATCGTTACATCTTTAGACAGAGTTTTCACGGTGTCGGCAGCATTGACAAT
+CACTGTCAACTTAGCAGTGACATCTTTGTCAGCAACAACTACGTTATTAGTATCAATGTA
+GTATTTGCCATTTACCAGCCCAGTTACAACTTGAGCATTATCAGTAGCTACGCTAACTAT
+ACTCGATACAGGAACTGTATAAGTATTGCCACTGGCATCAGTAGCCGTTACTTTGATCTC
+CTTAGCGTATCCGGCGTCAACAGCGGCTGCATCAACAGCAGCAGCTCCTGCATTATGGTA
+CAGTGTCGGGATATCACCTATGCTGTAAGTTACAGTCCCACTGTCGTTCTTAGCAACTGT
+AAAGGTGTAGGCTTTTTCTGCCACAGCCACACCGTCTTTCATCAGCTGAGCTTTAACAGT
+AGCAGTACCTTCCTTCAGCGCAGTAGCTACAACGCTTACAGTAGTAATATCCGCATCATC
+AGTTTTATTCAAGGAAACTACAGTGTTGTCAGTGGTAACGTAATGAACACTCCAGGAAGC
+GCTGTCTACTGCCGCATTACCATACTGATCTTTGCAATCGAATTGCAATGTCTGAGTTGC
+ACCGACTAACATATTGTTACTTACAGTAGTATCTTTCTTAGTGTCGATAGTTGTTGGAGT
+TGCTGCATCATTAGCTGTTACTGTCACTTGTGCTTTCTGGCCAGAAGCATTTACAGTAAT
+AGTAACGACTGAAGATGCACCCATAACCGCTGAGGCGGCAGGAGTGATTTTTACGCAATC
+TTCGTATCCAGCATCAGCAGTAAAAATAACGGTGGCACCGACAACCTGGCTGTTATCTGC
+AGTTACAGTGTAATCAGCAGCATTCAGATCCTTGGTCGCAATAGCTGTGCCATACTTGTC
+AGCAACAGTTGCCTTAATGTATATGGGAGTTATAGCTCCGGCAGCAAACGATGCTGAATT
+TTTTTCCAGAGTTATTGAGTATGGTGCACTAGTATCTTCGTTAATTGTGATGTCAATGTT
+ACTGCTTTCTCCAGAAGCCGGGCAAAGTGCTGTCAGCTTAACCGTGCCAGCTTTCAGGAA
+CGCACTGATGATAATTTTGTTGTTGGCATCAACCGAGACATTAGCAGCAGGCAGAATGGT
+TTCGTCTGAAGACTTGAAAATCACACCATTGCCTACATCACCAGTAACAAGTTTGCAATC
+TTCATTTAAGGTGTTTTTCGCGGTATAAGTTACTTCAACATTCTTAGTGCCAGTAGGGGT
+GAACATGGTTTTGCCTGTAGGCAGCTGTGCTGCACCTAATGTTACACTAGAAACGGTTGC
+TGTATTGACTACTTCTAAAGTCTTGGTAGCCTTAACACTACCGTACATAACTGTGACAAC
+AACCTGGTCTTTAAGAGTAGCACCTGCTGCATTTAATTGGAATTTGCCAACTACTTGGTT
+GATTGTAGCATTTGCGGTTGTGTCAAAAGCAGTGATAGTTAATTTTGCGTCAGAAGCGGA
+AATGGTTGATTCTGTACCATACTGATTTGTGAACTTAATTGTGAGTGGTGCAGTTGCTGA
+TTTCTGAAGAGCGTTGTTCGCAATCTCAATGGATTGAACTGTTTCAGCAGCAACGGTAGT
+GGTTGCGGTATCTTTACCAGCTTCCAAATCCAACCCAGAAACTGTTACAGTATAATCTCC
+AGCAATGAAATTGCCAGATGTTTTTTCTAAAGTTGCTACGGTTTTGTCATCATTCCATGT
+AGCAGCTTTTACATCCTCAGCAACAGTACCCCTTTTAACCGAGAAAACGGCTTTACTGGT
+ATCGGTTACGGGAGCACTGAATGTTACCGCTAACTTATTAGCGTTAATAGCACTAAAGCT
+TCTGGTTTCCTGTATATTAAAAACCCCGAAAACCCGCATGGGACAAGGGCTTGAGGGGTT
+TGTTAACTTTTCATTGTGGTCTTAATGGATATAATTATTAGCAGGTTCCATAAGGTTAGG
+AGAAATTAGATAATTATTCATAATAGATTTTCTTATAAATCACTGATATGCTACACTTTT
+TTCGTAAAGAACCTCGGGATCAATATCTGCTTGATTGCTCCACTCTATGCTATCAAAACT
+CACCCGAACCGATCTAAATAAATTCTTGTCTTTTAATTCCCTAAAAATTCCTTTGTTCAG
+ATAAGGCGTCATATCAAATAACCTTTTTTCTCCGTTTTCAAAGGTTAAAAGCAGTCTATA
+GCTCTCCAAAGGTTCAACTCCTACTACAGACACATACATAATTCATCACCTCTATTTCAA
+AGGTTCAATTTTAAACGGCAATTCGCTATTCATTGCCAACACCCAGTTTGCCAATAAATC
+TTCCTGTCTTAATTCTGCCCAAGCAAGGACAAGTTTAAGCTGTTTTTTAGGGAGACTCCC
+ATTAGTTAGTTCACAAGTATTTATATCAATTATCGCCTTATGCTTCCCATAATATGCATG
+AAAGTGAGGCGGGTTATGCTCACCAGGGGCGCAATACATTCTTATAATTATCCCATAAAA
+CATACAAATGGTCGGCATTATATCACCTTTTTCCCTACAATACTCCACATCTATTATACC
+ATAAAAACACACTCGTGGAATAAATATTTTTACTGGTTTCTTAAGAGCGTTTCCACTTCC
+CGCTTAAACCCATACTTCATCAGGTATTCCACTAACGCCCCTTCCATTACTCCCCTTAAA
+GCGACCTTCTTTTCTTTGCTAAATTCCACAGCCAGCTTGGCGACAACCTCGCTCATATAA
+ATGGCCTTAGTCCTTACCTCCCCTGGAACAGCGTAACGTGGAATGATGCCATCCTCCCTG
+GTGCCGGTGATTAGCTGATATAGTTCATCCCGGTTTTCATAGAGGAAGCGGAGGAAGGGC
+AAATATTCCCCAAGCCCTTCCGGTATTTCCCCGTTATTTAGTTGAGCAGTTGGTCCCGGT
+ATTGGCTCTGGCATTGATTGACTGACCGGCTCCGGCACATCAATCCTGCCCACCGTCTTA
+ACGTAGTTGTTTTTATGGACGTTCCACTCGTAGCCCTTGGTTTTCATATACTCAGCCATT
+TCCTTGTGGTCTTGAAAGCCCTCCTGCTTGGCCACCAGCCTGGGGTCTGCTCCTTCCATC
+TCAAAGGCGGTAATGATGCTGGCTACCTTGGTGGGTGCGTAGCTTTTGGGGTCCGGTTTT
+TCCAGTCTGTTCCGCATAGGAAAATACTGACCCTGCTGGCTGTCAAAGGCAAAATTCTTC
+CGGCGCATGTACATATCAAGGCTCTTCCAACTCTTGTACTTCAGCTCTGCCGCCACTTCA
+TCCCTGGTTTTAAACTTTAACATTTCAATAATCTGCTTAACCTTCTCATCATAAATTGGC
+TTTTTCATGGTGTTTCTCCTTCCCTACAAAAGATTAACCGCTTCAGTAAGCTTGCCCGTG
+TCCTGGTGCAGGTATCTGGATGTTACCCGAAGGCTTGAATGGCCCAGGAGTTTTTGGATA
+CTGACCACCGAGGCCCCCTTCTCCAGTAGGTTCGAGCCAAAGGAGTGCCTAAGCACATGA
+GCGCTGATGGTTTTACTCCAGCCCAACTGTTCTACCGCATCATGGATGCAGCGATTGATA
+TAACTGTCGGAAACCTTGCCGGTTCTAGCCAATGCAAAGAAGCGGTCGGAATCCGCCTTC
+CGGATGTGCTTTAGGTAATGGGTGAGAATCTGGTGGAGTTTATCATTGATGGGCACATCC
+CGATCCTTGCCGCCCTTGCCGTCAATGATGTGCAGCACTTTGCCTTCTAAATCCACGTCA
+TTCAGTTTCAAATTTATCATTTCCGAAATCCGACCGCCGGTATAAAACATGGCTTGGACT
+ACAGTTTTAATGACTGGTTGCTCAATGGCGGCTACCAATTCTCTCAGTTCATCCTCGGTG
+ATAAACTCCCGCTCCTTTTGCTTGATTTTCACCGGCTCCAAAAGGCTGGCGATGTTCTTG
+GTGCAGAGGTCTTTCTTGCAGCAGTAATTGTAAAAGCTGCGTAAAATATATAACGACCGG
+CTCCTGCTGGCTGATGCTGAGCCTCTTTCCTTTTCATAGAGCAAATAGTCCTCCAAATCC
+TGCAGCACAATATCTTCTAAATACACCGGGCAGTTGTGCTTGACAGTCAAGAAGTTATTA
+AACCCTTTCAATTCTATGGCATAGCCCCGGATGGTTTCCTGCGATCTATCAATAAGGTGC
+ATGTACTTTGCAAAACCCTCGATTGCTTGGTTTAAGAGCATTTCTCTCCCTCCTTTGGTA
+GGTAGCATATTACCGTTACATTGGGATAACATCAAGTTATAATTACCTAAAGATTTAACA
+AGAAAAGTTAAGTATTCGGGCGTTAAAAAAAAAGAAGCCCCGGACTGGTTTTCGTCCAAG
+GCTTTTATCTTCAAGGCGGCGGGTGTTTTTCCAATAATAATGCCGCCATCCTCTCAATTA
+AGGCAGCGGCATAGGCTCCGTTTACGGTTTTTCCTTCCCTGGCGTTTTGTTGCCAGTATT
+CAGGTGTATTAATTATTCCTTTGGCCACTAGAATCTTTAAGGCTTCTGCCAATTCATCCC
+TGGGCTGTTCGGTCAATGACTTCTTGAAAGTATGCCACCTGGCCCAGTTGTTTTCCCGCA
+TGGTACCGGGGCAGATTTTCCGGCTGGCGTCATAGTGCCTGACCACCCTTTCCGGTGGAA
+TGAAGTATTTGCCCATCAGGTGTTTGACCAGCTCCACCGTGTTGGCCACTGCCTTTTCGT
+AATCCCCGTCAGCGTTAATGCAAATTTCTACTCCGATGGAATTGCTGTTGGTAATGCCAT
+ATTTCCCGCCACCGTCACCGCAGTGCCAGGAAGCTTGGGAATCCTCCACCAGCTGCAGTA
+TGCTCTTATCATCCACAAAGTAGTGGGCTGAGGCTTGCCGATCTCCACCGTTAAAATATT
+TATAGTGAGCCTCCGCATCAGCTCCTGCCCGTGGATTGCCGGTATCGTGAACGACAATGT
+ACTTGATAGACTGGCCGTTCCTGCTAGAGTGGTTATATTTTATAAGCTTCTTATTTATGT
+GCAGCATGTTGTCCCTCCTTGTCTTCTTTCAGGTTCAGCAATACCGATTTCAATTTTTCC
+GGTATAGGCAACCCAACCCTGGCGGCGTTTTCCATAATGCTCAAGCCTTCATTGGACAGG
+TAGAAAAATATCACAGCGGTACGAACGGCACTGCCCTTTTCAATCAGATAGTAATCGATA
+ATGTGACCTATGCCCACCAAGGAAAATATGAGTACCTTTTTGAAAATCCCCCGAAAGCCG
+ATCTCACTGGAAAGTTTCTTTTCGATAACTGCCACCATCAGGCCGGTAATGTAGTCAATG
+GCCACAAAAGCCACTAAGGCTAATACTAAACCGTCATAGCCACCCAAGAACCAACCGATA
+TAGCCGCCAATAGCGGTAAAAGCCAGCTGCAGGGTATGAATGATATCTTTCATGCAATCG
+TCCTTCTTTCATAAAAAATAGACACCTGTCAAAGATGTCCTTATCGTGTGCTTTCTGTTT
+TGAAGTCCCCCAGGGCCGCTTTTAACTTCTGGGGGAGGGTAGGAAGGTTGTTGCCGAATG
+TGACGTTCAGTTTGAAGCCACTGGCCTCATGGATTTCCTGCACTTCAGTAATCCTGGTAT
+CCATGGTCACGTTCCAGTCCTTGTTTTGAACGGTCACAACATCCCCAACATCCCAATCCT
+GCTGATATTTAAATGGCCCAGCAGTTAAAACCTCGGCTTGAAAGGAAATGACCCGTTGAT
+GCTCAGCCAACTTTGCTTCACCTTTTGCTGGCAGGTCAGCAGTATCTTTAACATCCCTGG
+CATCAACAAAGATAACGTGGCGATCCAGACCAGTAGCATCGCTGCCCAGCATCATGATTT
+CTCTATTGGCTCCCTCGTCTCGACCAGCTACGATTGCATAGTTACCAAAGCCCACCAAGC
+TATCAATAAATTCCTGACTTCTGATATTATCAAACTCTGGTGAGAAGATAACCAGCGGGT
+TTATTTGCTGGCTGGCGGAAAAATCCCTTCCATTGTATATGTCAAATACCCACTTCCTTG
+CATTGAAGTCCGGATAGATATGCCAACCAAGGCCGGTGAGTGTGCTTATCTGTTCCAGTT
+CATCAGCCAGGTTCTTGTATCGTGTTTGCCATTTAATGATTTCTCCCCTTTGCTGGTCAT
+CACCAATCACAAGAAACGGAAATTCCATCTCCGATATCTGTAGACAGTTCCGCCGCACAT
+AGTGTTTCATGACCGTTTCCGCATTGGCTTCCAGGATGTCGTAGGCTTGCCCGACAGGTG
+GGATGGTGATGCGCTGACTAAGGATAGTCCCCAATGCGTAACCCTTGATGGTGAGCATTT
+CTTCTCCCCGTTCACCTGCCTTGATTTCTTTGTGGCGGATGATGCCTACTTTCCCGGTAT
+CTGCACCCAGCATAATCAGGTTGTTGATTTCAAGCTGCTCCGTATTTCGTACCTTCCGAT
+TCGTGACCAGCTGGAATTCGCCAGGCGAGTGGTAGCTGCGGCAAAAGGTAAAGGAGAGAT
+AGTTGTCTACCTCTCCCAATAAATCTAATCCCGGCGATAATATTCTAATCGGTTGCATAA
+AAAAACACCCCTCTCAAGGTGTTACTCCATTTCCGCTAATACCTGCTGCACTGCCGCTTT
+CAGGTTCCCCAGTGCCGGTACCTGCTCCACCGTGTAAACCCCGGCCAGTATGAGCGGCAC
+CCATACGTTTTTAACTAGTGCCGAATTTCTATCAAAAGTCATTATGCTTCACCTCCTGCT
+AACAATATTGTCAGTTCCGCCATAGCCATCTGCAGCCCTTGGATTTGAACTTCAAGCTCT
+CGAAATTCAACAGCCGCAGGGGAATCTACATATTCCCACCAAACAGTCTCCGTTGCCTTG
+TCCGCCTTGATAATGGCGATCTTTCCTACTGGCTTCTCCTGCTCCGACAGCTTTTCCACC
+GCCACAGCTCTGGCCTTATCCGCCTCTGTCAAAACACTCTCATCGTAAACGATACTGCCG
+CTTTCAAATACATAAATCATATTAAAGCCCTCCCTTAATTTTTATCGTAACCTTCGATTC
+CAAAGGTCTGGGTTAGTTTTTCAATGTAGTAGCCGGTGGCCAGGTAGATATTGTGCTCGT
+CATCCACCTTGACATCTGCAATCTTCTCCACTGCCTTATAACGCCAGAATTCCTCCCCTT
+TTTCATTGAATTTAACCAAGGTCTTATCATTATCCCAGGCGTAAACAGCTCCGTCCAAAC
+CTTGGACAGCCCGCAAATAGAAGTTGGTAATGTTAATATCGCTTACTTCAAAAGAGTGTA
+TCTGCCCACCAGAATATTTATTGAATACCCTAATGTCATCGTCATAAACACCAAAGAGAA
+AATCTCCATGCCTACCAAATATCGCCCTTGCCGTACTGAAATATCGTATAGTCCGAAGGG
+TGTCGATATCGTACAACTTGTTGAAAGCCAATACAGTGCGGTCATCCCACAGATGCAGTT
+TACGAAAAACACCACTAGTACCAATTTCTCTTTTCTCTAAAAGAGTACCCTCCGGGGATA
+TTTTGGCTAAATAGTCCTTGGAGCCGGAAGTGTAAAAATAAGTAATGCTAACAACAATTA
+CCCCTTCGCTGTTTACCACTAAATCTGTTACCGCACCTGTTGTACCAGTTATGCTGCAGG
+ACCACTGTTCCACCCCGTACGGGTTAAGTTTTTTCAAGGTTCGGTTGGTATCGGCAATAT
+AAACATTCCCATTCTTATCGGCTTTGACAAAGTTCAAGGCAAGGTTATGACGATATACCC
+ACTGCTGCTCACCCAGCGCATTGAACTTCCTTGCCGTCCAGTCATCACTGGCACCATAAA
+AGTTACCGGTTATATCCACATCAATGGAATTTACTACACCTTCAAATTGATGGGGGATAA
+AATCCGACCACTCTTTATCGGTAGATAAAATGCGGGCTGAATGCTGGCGCAGCACATAGA
+TTTTTCCCTGCTCTTTATCAAGGCCAAAACCATTAATGGGGTTACCGCTAATGTTGTGAT
+CCTCACGCCAGATAAAACCGGCCAGTTGATTATCCAGCTTGGTGATTTCCCGATTGGAGA
+CGGTATAAATGTTGTTTTCGCTGTCGATGAATATATTGTATACGGTAGTTGTGTTGGCAC
+TAGATCGTTCAAAAATTGGCTCGCCTGTTTGGTAGCTGTGTTTGCGCAGGGTATAGTAAT
+TATCTATTGAGTAAAAATGGTTAGTGCCCGGCTCAATAGCTAAAGCATAGGCATTTCTGG
+AATTAGGTATGGTGTAAGAATATACCGTGCTCCCGTTACTTGGATTTAGTCTATAAATCT
+TATAACTTTGATCAGCCACAATAACTGTATTGCTGTTCACCGCTAAAGCGTATATATAGG
+AATTTAGGCTACTTGAAGTCCACATAACATTGCCATTGTTTCGGTTGAACTTCTTCACGT
+AATAAGTTGAGGATTCAGTAACTCCAATATGAACACCAGATGTTTCTACTGCGATACAGT
+AAGGAGAACCAATATTTGGAGTTTCCCAAATTAAGGTGCCGCCTAAAGCGTATTTATATA
+GGCTCGATCCCTGAGCAAGGAAATAGCTACCATCCGTAGCTGCCAAGTCTGGGATCATAA
+GAGCACTGGAGGTTGTGTGGACATTATCGGCAATTACCTCGCCGGACTCAGCATCATAAA
+TGTTCACACCTGAGCTGTGCAGCACATAGACTTTCCCGTCATGATAATGATTGACACCCT
+TGCGGTTGGACGAGGTTCTCAGGGAGTGGTGGGCAAAAGGCAGTCCAATCCCTTTAATCT
+CATCTGATGCTATGATTGGCGTTAACCCTTCAATGGGGATAACTCCCGTATCTCCCATTG
+ATATTTGCCCCAAGCCGTGCAGCCATAAATCACTCATCTGTCATTACCTCCTTTATCCAA
+TTTCCTGCCTCGTCATATATTTGGTTGTATACAACTACAGCCCGTACTGTTTCACCGTCT
+GTCTCATAATAAGTAACTGTACGGTTTTCGTAGCGTGGTGAGTTACCGCCGCTTAGTACG
+GACCGTTTAGCCAGGGTTCCATCTTGCCGGTGCCATTCAATGGTGGTGAAAATCCCCTTG
+TGGTCTTTCCCAAAACGGTAGGTATTGGCCAGATCCCCATGGGCGGAAAAGTCAGCCTCG
+TGGTCTCTAAAAGCAGTCCAGGGCACCAGGTCAGTGGCATCAAAGCTAAGTCCTTGAATA
+TAGTCAAACCACTCTTTCCACTCGGCGTAAAACTCACCGTCTGGTTCCCTAATCTTGCTT
+TGCAGCCAGGCATCCCAGACAACTTCAAAGACTTCGGGGTGATTTGCCCACCAAGCGTCC
+CACTGCTCTTGCATCCACTGGGTTTCACTAGCTATGTCCTGGGGCAATAGCAGTTTGCCG
+CTGATATAGTAATCCACCGCTTCCGGGTGGCTGGCTTTACCCTCGATAACTTCCCACGAT
+ACAATAACCTGATCGAATACCGATGCTTGGTAGGACTCACCGGCTGATAGAATTTTATCT
+CGCATCACATAAGCCCCGGCCAGCTTTAGGCTGACGGTCTGCGCTGTATCGGTTAAATTG
+GTTAAAATGATTGATTTCAGCACTACCACCCGATCATTGGGTACCTGGTATAAAGGCTCA
+AATTCTGTGGGTAGTTCCCCTTTGGCAAGTCTGATGGCACTGCCCATATTACATCCCTCC
+CCAGGTGTTGATTACCGGTTGCGCTTCCAACCTGCGCCATTTGCCATCATTGATTTCAAC
+TTCCAGATTACCGCCCCTTAAGCGTAGGCCATGGGTTTCCTCTCTTACGGTGCGGTCCCG
+GTGGGCTTTAAACTGGCTCCATGGTACTAGATTAGTGATGTCTTGTATTTCTTCAAACCA
+ATCTTTCCACTGGGTGTAAAACTCACCGTCCGGTGCCGTTAATTTTTCGTTTACCCAGTC
+CTGCCAGACCCTCTGCGCTTCATGGTCAAACCAAATATCCCAGTCTTGCTGGATTCTATC
+GAACCAGGTTTTCCACTGGATGTAGAAGGCACCATCCGGAATGGTTAGCTTATCGTTTAC
+CCAGTTAGTCCAGTTGTTTTGGAAAGCGGTGAACTTTGATTGCAGCATAGCTAAAAAAGC
+AGCATGCTCAACACTGGCATTCTGCTTTTTATCTGTCAAATATTCAAGCCAGGCGGCAAA
+CTCTGTATCCCCGTGTGCTCTCCTGGCATTGAGGTATAACTGCCATTCGTTAAACAGCTC
+GGTGGTGTCCACCTGTTCAAATAAATGGGTGACCACGCCGCAGACGGCAGGGTTTAATCT
+TTCATCGGTTATCTGGTATGCCTCAATAAAACTTTTCCCGGCCAGTACCACTACCTGTGC
+CAGGGCCAATTCATAGATGTTTTCATTACGGGTTAGTTCCGGTACTTGGGGCGTTTCTGC
+AGCAGTACCAGTTAACACAAAGGCTTTCACATAGCGGTTTTCTAAAGTCTTATCTAATCT
+GATCACCACCCGGTCGATACGGTCGTAGTTGGCATGGGCCATGGGGTGGTAAAGTTCCAA
+AGGCTCGATGTCAATTTTGTAGAGATAACCCTCAATCCAGGCATAGCCAGGTTTAATAAA
+TGTTCTCATGTCCTGGCCTTGTGCTCCTACCTGCAAGTTGTCCCCGGAGCCGTTGAAGAT
+GCCGTTTCTGATAAACTGGCGGAAGTATTCAGCGAACTCATCGGCGGTATAATAGCGTTC
+ATCTTCGCCGTCAACTGAGTCGAAAAATCTGTAGTGTTCAGCCACAAAAACCCTCCTTTC
+TAAAGGCCCACATAGCGGTTTTTCCACTTAACGAGAACCCTGGTCTTGATACTGTCGTTG
+TTGCTGGTGTAGCTTAGTGCATTTTCTCCTGGTACCAGTTGCCAAAACACACTGTTAAGA
+TCAATGTAATGGAAGGCATTTTGCCCGTTAATCTTCACGTATTTATGCCCGAAGGCGGTA
+TTGACGGTGAGCACATCTTCCTCCTCAAGCTCACGATTAACTTTGATAAATTCCCCGGTG
+GTTAGGTTAGACACGGTGGGATTCACCGCTGGCCCTTTGAATTCAATCTCCACTGGGGTT
+GCCACATCACCGCCATTGATGGCTCTACGCTTGAATCCCCGGTAGGAAAACATGGTGGGG
+AGCATTAGCCTGAATTGAATTCCACCCATGAGATAAGACATCTCCCTGCTTTCAAAATAG
+GGGTCTAACCAAAATGGCTCATGGCAAATTAAATGTAGCAGGAACTTTTGATAATACAAA
+CCTTTGCTGCCTTGGCCGCTGGGAAAGATGGGTGTAGACTCCGCTATGCCTGTAATTTCT
+TTCACCTGATTTCCCTGGTGGTAGGTGATCGTCACTTCCCCCAGTTTTGGGTTTAGTACC
+TTCTGCATTTTCCTTCTTGCCATCAACACCGCAGCAGGATCGCCTTTGGTGATAATTGTG
+CCTTCAATGCTAACGGCCCGGTTATCCAATGTGTTATCAATAAAGGTGGAGCCATCCTGT
+TTCGGTGCCTTCTGGCTTTCAAGGGCTACCGGTACTTCGCCAACACCATCAATACTTTCT
+AGGAAATAAGGGGCTTGATTGCCTAATTTTATGCTTTCGCCGTTTTTGTTCGTGATGATA
+ACACTGTCCACAATCTCACCTCCTACCACTCAAGAGCCAGCTGCCGGGATGCATTTTTTA
+TCCGCCTAGCGGTTTCTGCCGGGGTAAGCGGTGTGGGGGAGTTAATCACGATATTTTGGG
+TAATGCCTTTATCCCCACCAAGGATCTCCTTTGTTTCGTGGTCGCTATAAATCCTACTTC
+CCCTGGGCAAGGCCACTAGCTCCGGCCCTAATTCACCCACCATAGTTAAACCACCGGGAA
+AGAAGCTGGTGCCGCTGTAGTTATCATCAGCCCCACCACCGGAAGTAACTGTGCTGATTA
+CCCGTGTGATGCGCTCCACAATGCTAAATACCTTCTCCTTAACACTGGTGGCGTTCCATT
+CCTTAATCCGGTCAATGGCACTACTGATGGCACTTTTAACCCGATCCAATGATTCGTTCA
+CTTTATCAGCCATAGCGGAAAACTTCTCGCTGGTGACTTCTTTCATGGTGGTTAATGCGC
+TGTCCCAAACGGATTTATAACCCTCGGTGTAGCTATTAATTAAACCTTTAATACCACCGC
+CATGCTCATCAATTTTATTTTGTATGGCCTGCCAAGTTTCAGCGGTTTTGGTTTTGATGT
+TGTCCCAGGTTTCATAGGTTTTAGTTTTAACCTCATCCCAGGTGGTGCTGACATTGGTTT
+TAATAGCAGCCACGGTTTCGGAGGTATTGGTTTTAATGTCATTCCACCTATCACTCATGG
+TAGAGCGGATGTTTTCCCATTGCTGGGATGTGGTAGTTTTAATTTCTTCCCAGGTGGAAA
+TCACATTTTCTTTAATGGCCTGGGCTTTGGCGAAGATGTCGTCTTTCATGGCCTGCCACT
+TGGTTTTTATCTGGCCGGTTTCCCAATCCACCTGATTAACGTGCTCTTGAGCTTGAGCCT
+TAGCTTCCTCCACTACCCGCTGGTGCATAATTTCAGCCTGTTTAACCGTGTCATCCTTTT
+GCCGGGTGGCTTCTTTGATTAAGCGATCCGCCTGATCTTTGGTGATGGTGCCTGCTTCAT
+CCCGCTGCCGGATAATTTCCTTAATTACCCGGTCGTACTGTTCATTAGCCGCTTTGATGG
+TTTTATCCTTTTGCTCAATGCTGTTTTTGACCACTTCGGCGGCTTGCTTGACACTAATCT
+CCCCGGCCTGGGCTTTCATCCGTTCCATAATGGCTTTGGCTTCGATTTCATTCTCGGAGA
+GGACTTGAATGCCGGTGTCCACCATCTGCCTTTGGATGGCATTAATTTCTTCCTGTTCAG
+ACTTGGTAAGCGCCCTTTTCTCTGCCGTAGCGGTATCCAGTATGGTTTTTATCCTGGCTT
+CCCCGTCAGCTATGGTTTGTTTTCTGTTTTCATAGCCCTGCTGCATATTGTTTAATATTT
+CATCCTGCTCCTGCTGGGATAGGGAAGTGCTACCGGCAACAAAACCCTTAATTTTAGCCA
+GGGACTCTTCATGATGTTTAGCCAACCCCGCCTGCACTTGAGAAGCCATCTGTGAGAAGT
+TACCGGCAATGTTGTCGGCCATTTCTTTGGTAACTTCTTGGCCACTCCAAGACAGCTGGT
+TTAAAGCAACGGTGGCTTCATCATTCAGTTCTAAAAACCCGCCTACCGCTTCTTTGGTTG
+CTTCAGATACTTCCTTACCAAACAGTTTAATAGCAGGGATGCTCTCCTGACTTAAGTGTT
+TATATAAAGCCACCCCTGCCACCGTTAATCCAGCAATAGCAGCTACCGCAATCCCCACCG
+GCCCGGTTAAAACTGTAAATACTGTGGCTAAGGCACCAATGGCAGGTGTTGCTGCAACTG
+CTCCGGTGGTGGCCACAGCAATAGCCCCGGATACTGTAGATAGTACTCCTGCTACAGAGC
+CGATAACTCCGATAAGCTTGCCACCAATAAGTAATAGCGGGCCAATGGCTGCAGCCAAAC
+CCGCTACTACAAGAATAGTCGTCTTAGCCCCATCGCTTAGTTCGCTGAATCTTTGGACGA
+GGGGAGTAATCCCTTCCAGTGCTTTGGAGATCACCGGCAGCAAGGCATCTCCAAAAGCAC
+TGGCTGTTAATTGTAGTTGGTTTTTGAATAATTGTATCTTGGAAGCTGTGGTGCCAAAGC
+GCAGTTCCGCTTCTTTGTTAAGGGCATTGTTTTCTACCCAAGCCTCACTACCCAGTTCCA
+AGCTTTCCCTGAACAGGTCACCTGCACCGGATGCCCGCAGTAATGCGTCACGAACCCGGA
+TTTCCGATAGGCCCAGATCCTCTAAGACTGCAAATACATTGCCGCCGCTTTTTGCTGTTT
+TATCTAAACCCTCAATAAATGAGATGATCGCCCCGGCTGCATCTTTTTCAAAAGCTTGTT
+GGAATTGACTAGCTGACATACCCGACACTTGGGCGAATTGTTCTAACTTTTGACCTCCGG
+AAGCTACGGCATTAGCCATGTCTACCATGACTCGGGAGATAGCGGAACCGCCGGATTCAG
+CCTCAATACCAACTGAACTTAAAGCACCGGCAAAGGAAAGAATCTGGGCTTCGGTTAAGC
+CGACCTGACTCCCGGCACCGGCGATACGCAGCCCCATCTCCACGATTTCGGCCTCGGTGG
+TGGCCAGGTTATTGCCTAAGGCCACAATGGTGGCACCCAAACGGTCAAACTCGGTTTGCG
+GCATTTGGGTAATGTTGGCGAGCCTGGCCAGCGCAGTTGCCGCCTGGTCGCTACTCATGT
+TTGTGGTTACGCCCAGCTTGGCCATTACATCGGAAAATCTTAAAATGTTTTCTTTTTTAA
+TGCCTAGTTGTCCGGCGGCTTCACCGATGCCGTAGAGTTCTGTAGTAGCAATCGGCACAG
+TTTTAGCCATGGTTTCAAAGCCCTGTTTAAGTTCTTGCAGTTCCTGTTCGGTGGCATCTA
+CCGTCTTGATAACCCCGGTAAAAGCTGTTTCTAAATCAATGGAGGCCTTGGTCGCTAATG
+CTCCAAGACCCACCAGGGGTGCCGTAACCTTGGTGCTCAGTTCCTTACCCGCTGCTTCCA
+TCTTTTTACCGACAGCCTGCAGTTTCTCCCCGGCAGCCTCCAGTTCCTTGCCCAGTTTGC
+CCCAGCTAGAGGATTGCAGGGTTAATTGGTTATTGACATCTTTTAGATTCTGTTCCATGG
+TCACCAGCCTGGCACGGGCTTGGTTTAATCTGATTTCTAATTCCTGCGTGACCCTGGCAT
+CAGCACCTTTGGTTTCAACCGCCTTCCGGTGGGCTTCCTCCAAGGTTTGCACCCTTTGCC
+TTTGCAGCTCTGTTTCCTTGGTCATGTGTTCGGATTTAAGGCGTAGTTTATCTAATTCAC
+TGCCGTGTTGACCAAGTTGGGCACTGGCTAGTTTAAACTCCGATTGCAGTTTTCGCATTT
+CAGTGCCTAATTTACTGATTCCTTCTTGGAAGCCTTGGGAATCTAGGAATATCCGGACAC
+TAAGATCACCAACACTTGCCATCTGTCTCACCACCTAAAAATAACGCCGTCAATAGGCGC
+TACAATATACTGTCGATATATACTTTTTCAGTTCCTCGTTTTCGGTTAAGCAACTTCAAG
+TAATAAATGATGTCCGTGGAATCAATCTCACCCATAGTCCAGCCCTGTTCTAAAAGAGCC
+AAATACAGCCGGTCAATAAACTCTTGGGGCTCCATGGCGTTTCCCGCTATTCGTTTTTTC
+CTGCTGTGGCCTCTCCCATCGCTCCCACCACTTCATTGATACAACGGGTAATGGTGGGGA
+TTAAATCCTTGGAAGCCAGGCCGTCATAAAGTTCATCACGGGTAAATTGACTGCCGAATA
+GATCCACGATGTAATCCATTAATTTGTCCAGTTCCTCGGGGGCAATATTGTCGAAATTTA
+TCTCTTGTGATACGGCAATGGTTGTTCTCACCATCCGGGCGCTAATAAAGCCAGCGGTGT
+AGGTTTTGTCCTTGCCATTAGTTTTAAGTACAATCTCCAAGGTTTAACCCTCCTCCGTAA
+TTATCGCCGCTTCAAAGGCAGATACCGCTACGGCTAAAGTGGCCAGTGCCGCATCGACCT
+GGGCTTGGGTAGCGTTTTCATCATCCACCACGGCTTGAGCGGCATCGATAGCGTCGCTGA
+AGGTGTCGTAGGCTTCCTGGGGGTATTCTCCGATGCCAGTACCTACAGTTGCACCAGCTA
+ATAAATCTTCGGCTTCACCAATAGTGGCAATGAGGGCAGACTTATCAACCACTACTGGAC
+TGGTATCACCCGGTACCCTACTGAACCAACTTTCAAATCCAGTGAAACCCTGCCCGTCTT
+CGTCTGCTGTGTGCTTCCACTCACCGTCATGCACTCTGGCCATAAAGGTAAACTTCACTT
+TAGGGGTTTTGTGTTCTACGTTGTCCTTTTTAGTGGAGAAGTCCTCGGCCATGGGCTGGG
+CTACTCCTTTTAAGAGCCAGACATAGCGGTACTTGCCGTTGGACTTAAGACTCTTGAAAC
+CTAAAGCAATATGAGGCGGAACGTCGGTAGCCTTTTCAATGAGCACCCCGTTTTTCAACT
+CATTGCCTAAAAGTTTGGCCCGGATAGTTAAGGGTAGTTCCGCCGTTTCTATTTCCACAT
+CCACCTTGCCTAAAGCCGATACCGATTCCCACAGCTGGTCATCAGCGTAAAGCTCCTGAG
+TATTCACCGCCGGGTTGATAGTGGCGTTAATGGCTCCCACCAAGGCTTCGGTGGGTTCAT
+AGGTTAACTCATCTTTAGTATCTGCGGTAAGAATAGCAAAGTGTAAATCATTTAATCCTA
+CTTGTGCCATCTACAGCACCTCCTTAAAAAATCGCATGGCTTTGTGATAAATTCCTAAAT
+CCTGTTCGTACAGGTCATAAAAGTTCTGTTTGGTAAAACCGGCAGTCAGCATCTTTTGAT
+GGATTGATTTGACTAAATCTGTGTAATCGGTTTTGCTCCACACATCAACTTGCACATAAT
+GGCCAGTAATTAACTCCGCATCATCGGCATGCTGCTCCGGTTTATCCAGGTAGGTGAAAA
+AGGTGATGTAGCTATCGGCTTTGCCTGTGTAGTTTTGGAATTGTACCGGTACTCCTATAT
+CCTTTAAAGCCGTTATTATATTTTGGTTCATGCTCATAGGCCCAGCCCCCTTCGCAGTTC
+TTCCTTGATGGTTGCTGTGGCCCGGTCTTTACCGTTTTCATAGCCCGGTGCCATGAAGGG
+TTTAGCTCTCATTTTGACAGTTCCCAGTTCCAGAAATTTGCCATAATAGGCTTCCTTACT
+CGGCCCCACTGCTACATACTTAACCCCATCCTGGGTTCTCACACCGGAAACGGTAATGCT
+TTCTTTTAGCTTGCCAGTCCGCACTGGAGTTTCGTTTTGGATGGCCTCTTGCATTACAGC
+ACCGGCTTCTTTTAAGGCTTTGTTTTCTATTTTCTTGCCCTCGCTGCCCAGCCTTTGAAC
+GGCATTGATGAGGGCTTCCAAGCCCTCTAACTCTACCCTAGCCACTGCTTACCACCTCCA
+GTGCTTTGATTTCCAGATACCGGTTTTGATATTTGATGTTGTCAATAGCGGTGATGTTGT
+ACTGTTTGCCTTGAAAAACAATCCGCATGGTGGTATCCAGACCCGTTAAATACCTAATGG
+TAAACTTCACCGTATTCTCTGCCTGGACAGCGGCGGCAGCAAAGTACTCCCGGCCATGCA
+GGTTGCTCACTGCCGCCCATACGGTCTTGAAATCCTCCCAGGTTTCTACCTCAAAGCCGT
+TCTCATTGACGCTAGTGGTAAGTTTCTGGAAAGTTATCCGGTGTCTTAAATCCCCAATCT
+CCACCTGCATCACCAGCTTTCCCGGCGAAGGTTTGCCAGTATCAGTTTCATCACATTTAC
+GGTTTCAGCCATGCCGCCGCCTTCGTTTTTAAGATAATAGTGGGTTCCTTCCCTTTTTTC
+ATACAGATTGGCCACACAGTACAAAACCGCTTGCCTGACTACCGCCGGTATTTCTTCAAA
+CTCCGACAAGGGGTATCTTAAGATATCCTCGCAAATTTCCACGGCGGTAGAAATAAAATT
+AGTGATGAGTGTATCTTCCTCATCACCGTCTATCCTTAAATACAGTTTTACTTCTTCCAG
+GGTTACCACCATACACTCACCACCTCCCGCTGTTTATTCCGTGATGACCGCTGCTTCAAA
+GGTGGATACCGCCGTAGCTAAAGCAGTCACAGCATCGTCTACATTGGTTTGGGTGGCATC
+AGCGTTTTCCACTACTGCCTGTGCTGCACCAATGGCAGTTTCAAAAGCAGTAACAGCCTC
+TTGCGGATATTGGCCAGGCTCGGAGCCCACCTGAGCACCATCCAGTATATCTTGAGCGGC
+AGCAATAGCCGCTCGAAGAACAGATTTATCTACAGTGATTACTGCTGCTTCAAAGGTGGA
+TACCGCAGTTGTTAATGCTGCAAGCGCAGTACTAACTTCGTTTTGGGTAGCACCTGTATC
+ATCCACCACACCTAGGGCAGCTTCAATGGCGCTCTCAAAAGTATCGTAGGCAGCTTGCGG
+ATATTCCCCAACATCCTCGCCAACCACTGCACTATCTAAAAGTTCCAAAGCTGCGGTGAT
+GGCCGCTTCAAGTGCTGATTTATCCACCACCATCAGACCGGCAGCAAAAAGCCGCCCCAA
+GAGGGAGTTGAAATCCTCTTTTAGAGCGGCAACAGTGCTGGCTTCACTGTTAGTTTGGCC
+TAGTGCTGGTTTTAGTTCGGTTCCCTTGAAGGTGAGCTTACCACCAGCTGTAATCTCCAG
+CTGGCCACCCACCACCCATTTCTGCCCGCCTTGTTCGTGATAGTTTTTAACATTACTCAT
+CTACCATCACCTACGCTTTCACCTTGAGAATTTTAATGGCTTCTTTAAGGATCAGCTTGC
+CATCCACCCGCTGCGCTGCCCTAAACCCTACTTGACCGGTGGCGGCATAGAGTTCGTTCA
+GCCTTTGAAAAATCCTTCCCTGACGGTCAGCAATCCAGTAGTAGCCCATATCACCGAAGG
+CGATCACTTTTTCCCCAGCGGCAATGGTGGGCACATAAGCCGAGGTCTTGACGGGACGGT
+TTAACAAAGTGTCCGGGTCGCCTGCAGTGAGGGAGGGCTGCCACAGGTACACACCGTTAC
+CGTCTTTTAGTTTCCTGATTTCCTTCACCGTGGCATCGTTCATGATAAAGACAGCCTTCT
+TGCGGTAGGGGGCTTTTAGGGAATAAAAGAGGTCGAAAACCTCATCCGCTTTAAGAGTAG
+CCCCGGCAGTGGTTGCTCCAATCTCCCCGCCACTGTCATTGTCAAAGATGCCGGTGGGTT
+TCCCCTCACCATCCCCGATTAAAAAGGCTTCTTCTTCCTTGGCCCCAATGCGGCGAGCGA
+ATTCTTTAGCAATGTAGCTTTCCAGGTTAAAGACGCTGTCGTTTAATAGTTCTTCGGAAA
+CCTTAATCATGGTGGCCACCTTGTAGGCCCCAATGGATACCTGGTCAAAAGCATCATCTT
+TATCCTGATACGGCCCTTCTTCATCTACCCAGGTGGCCACCCCCTTGGAAGCTACCACCG
+GGATTTTCCGGTCACCGGTAGAGGTGGTAATTACTTTAGCCAGTGTACGCATGATGTTTT
+CTTCTTCCAAGGCTTCAATCAAGGTGCGTTCGAACTCATCAGGCACCAAATATCCACCCT
+CAGTGCCGTCACCGCCAATGGTTAAAGCGTTTCTGGCCTCATAGCTATTGCGGTTGCGCA
+TATACTGCCAGAAAGCCTTATCGTATTCATTGGAAGCCCGGCCTTTAGGCTCATCACCAG
+GAATAGTTTTTAATGCTGTGCTGGTGGCCTTGGAAAGCTCAAGGTCAATGGCGGTTTGAC
+GTTCCAGGCGTTCAATCTCTTTACCTAAATTGACAACTTCGGTTTCCATTTTCTCATAAG
+TGGCGGTATCCTCAGCAGAGAGAAGACCGTTTTCACCACGCTTTTCATCCAGGAAGGCCT
+TGGCTTGTTCCCACACTTTAGTCCGCTTTTCCCGCAGTTCGATAATTTTACTCATGGTAT
+ATTACCTCCCTTTTATTAGTTCCAGCCGTTTAATTAGCTGTTCGTATGGAATGCCATCGT
+TGTTTACTGGTTTAGGTTGAGCCTTGACCGGTGGTAGTTTCCGCATCAGTGCATTGACCA
+CTGTTACCCGGTCAAACATGAAGTCAGTGACTTGGGCTGGCGGCTCACTGTAAAGGATCT
+CGTCAGCAAAACCAAGCTCCACCGCTTTATTGGCGCTCATCCAGGTTTCAGCGTCCATCA
+TCTTAGCGATCTGCTTCCTGGGTAGTCTGGCCTTGGCTTCAAAGGCATTAATGATGGCTT
+CCTTCACCTCGGACAGCATCTCGATTCCCTTTTGCATGTCAGATTCTTCGCCCCAAACAA
+AAGTGGCTGGATTGTGGATCATAAGCATAGAAGTGGGGGACATACAAACCATATCGCCCG
+CCATGGCAATTACCGCTGCAGCGCTGGCGGCAATACCGTCAATTTTAATCAGCACTTGGC
+CGCTGTATTCTTTGAGCATGGTGTAGATTTGGCTGGCTGCAAAAAAGTCCCCGCCTGGTG
+AGTTGATATAAACTGTGATGTCACCGGTTGCTGCTTCCAGCTCTTTTTTAAATTCCTTGG
+GGCTTACTTCATCTTCAAACCAACTCTCCGGGGCAATATAGCCATCCAGGTAGAGGGTTC
+TCTCGCCTTCGTTTTTAATCCAGTTCCAGAATTTATTCATCTGTGTCCTCCTTTCTGTAT
+TTTTCAGTCCAAGCCCCGGCATCAGCCATGTCCACGAAATTTCCGTTGACTAAATATTTA
+TTTCCGCCTAGCTCATCCGGGATTAGGTTCATGGATTCTAGCTCTCGAATGTCGTTCGCT
+GACATGATGCCATTTTGCCGCATGGTCTGGTAAAAGGCGGCCCGTGATTGAGCATCTCCC
+CTGAGCCTGCCGTTAAGGTTGAACTTGACCAGATATTGCTGTTTTTCTCCACCAAGGAAC
+AAGGCCTTTTGCATGGCCTGTTCAAAGCGGGCCACCCAAGGAACAATGGTGTTGTCGATA
+AAACTGATGCTTTGGCTTTCAATGTTGCTAAAGGTTGCCCGCTCTAAATTAGCCACTAGG
+TGAGGGGGTACCCTGAATATCCGACATATTTCCTCAATCTGAAACTTCCTGGTCTCCAAA
+AACTGTGCTTGCTCCGGTGGCATACTCAGGGTCTTGACGCTCATACCTTCTTCCAGCACC
+GCTACCTTGTGAGCATTTTCGCTGCCCCTGTAAATCTGGTTCCAGCTGTCACGGATTTTA
+GCCGGGTCTTTTAATATGCCGGGATGTTCTAATACCACACTTGGCCGGGCATCGTTGGCA
+AAAAGTTTGGAGCCGTATTCTTCTGTGGCCAGTGCCATTCCGATGGCATTCTTGGCCATG
+GCAATCGGGGAATAGCCCACCAAGCCATCAAAGCTAAGGCCCGGAATGTGCAGCACTTCT
+TCCCGGCGCAGTAAATACTCCCGGCCTTCTTTTTGGTAACGGTAGTACAGCTCTCCTTGT
+TCTGTGCGGCCAACATCCATGCGATCCGGCAGCAGGGGATATAAACCGATGACCCTACCC
+CGGCCATCCCTGATAATCTGAGCGTAAGCATTGCCCCAAAGTAAAAGATGACCCATCAGT
+GTTTCTCTGAACACAAATGAAGTCATCTCGGGGTTGGGCTCATCATGGAGCAGGTAATAT
+AAATTGTGATCCATGGCTTTTTCCTTCCCTTGGCCTGTGCGCCGGTAAACGTGGAGGGGT
+AGGGAGGCTATGGTTTCCGAGAGTACCCGCACACAGGCATAAACTGCTGATGTGGCCATA
+GCTGTGCGCTCGTTGACGGTTTTACCGCTAGGTGTGGGGCCAAAGAAAAAAGCCTGGGTA
+TTTTGCCAGAAGCTGTTCCTAGGACTGGCTCTGGACTTAAACAGGTTTGATAGAATAGGT
+ATTTTCAGAATCTCACCCCCCTTAAAATGAGCATGAAAAAAGCACCTCGGTTGAGATGCC
+CTCATGAACCTTAATATTTAAATTTTTGTGCTTGACAGTTGCAGTTCTATATTACGCCCA
+CCATACATTATCCTCACTACTGCAACCAGTTTTTCTTCTTCAACTACCACATAAAACACC
+AGGTAATTATCTACCGGAAGGACCCTCAAACCCCTACTGTGCCAAGGTTCTTTTTGGTAA
+AGTTTATGCCTGAGGGGCATTTCATCCAGGCCATTAATCGCATCCATGATTCTGTCTGTT
+TGATTTTTTGCGGTTTCCGGCACAGATAAATTTATGGCAATGTATCTGTAGATATTTATA
+AGATCCTGTTCGGATTCTTCTGTATAGATGATCCTATAGCCCATGGCCATATTCCTTACC
+CATACGTTCGGCTACCTTATCCGCAGATACAACCCTGCCTGCTTTCAAATCACCTAGTCC
+CTTTTCAATTTCATGGTTAAATTCTTCAGGCGTTAAATCCCCAAATGCAAGGGGTCTGTT
+ATGTGTAATCTTAACTTCAAAGGGCAGCCCGTTTTGTAAAACAACCTGCCTTAAAAAAAT
+ATTGATGGCGTTTGACATGGGTATGCCAAGTTTATTCAACACCATTTCCGCCTGTTCTTT
+TATTTCCGGCTCAACCCGAGCAAAAATACTTGTGGTTTTGGACATGCATACCGCCTCCTT
+TATGATATTTATATTTTACCATTTTGTATTGCGATATGCAATATATCTGCAAGCCTAGAA
+CACCACCAGCCCTCTCTCATCATAGACCGATTTATCCTTTTCCACCCCTTCATTCCGGAT
+ACACCGGTCTAGCGCCATAATCATAGCCACCGCACCGTCAATCTTCTCTGTTGATTTGGC
+TTTGTCCGGCTTGATATTACCGGCAGGGTCGGTGCGAATGTGAATGTTATCCATCATCCA
+AGATAAAACCGGGTGGCCGCCATGAGCGATTCTTTTCTCCAGGGTCAGTTTCATCAGTTC
+TTTGGTGGGTGGGGACATATCTTTAAAGCCCTGGCCGAAGGGAACCACGATAAATCCGGC
+ACCCTCTAAGTTCTGCACCATCTGCACAGCACCCCAGCGGTCAAAGGCAATCTCCTGGAT
+GTTGTAATCCTGGCCCAGCTCTTCGATAAATTTTTCAATAAAGCCGTAGTGGATGACATT
+ACCCTCGGTGGTTAAAAGGTATCCCTGGTTTTGCCAAATATCGTAGGGTACATGATCCCG
+GCGCACTCTAAGGTCTAAGGTTTCCTCCGGCAGCCAAAAGTAGGGGAGAATGTAATACTT
+GTCGTCCCCATCCACCGGTGGAAACACCAGCACAAAGGCGGTGATGTCAGTGGAACTGGA
+TAAGTCTAGCCCGCCGAAACAAACCCTGCCTTTAAGCTTTTCTGGGTCTACCGGGAAAGC
+GCATTTTTCCCAGGTGTCCATGGGCATCCACTTTATCTGCTGTTTCAGCCACATATTAAG
+CCGCAGCTGTTTGAATAATGCTTCCTCCGCTGGTTCTTGTTTGGCTTGCAAGAAATGTTC
+TCTGACCCGCTCTATTTGAATGGTATGGCCCAGGCTTGGGTTGGCTTTATACCAGTTGGC
+TTCATCTTCCCAATCGTCATCTTCCTCCAGACCATAAATGATAGGCAGGAAAGTGGGGTC
+AATTCTTCTTCCGGCTAAAATATCCTTGGCCTTGCAATGCATCTCCCAGCCGTAGCCCTG
+CAGCTTGTTACCCGCCGTGGTTAAATAGATAAACAGGGGCTGCTCCCTGGCATCACCGGA
+ACCAGTGGTCAACATCTTGGCCAGGTCAGGGTTTGGATAAGTCCAGATTTCATCGAGGAT
+AACGCAAGATGGGTTAAGTCCTGACTTGGATTTTACATCTGAACTTAACACCTGATAAAA
+ACTACCGGTTCTAGGGTAGACAATTCTTTTGGTGGACATGATGGTTTTAGTCACCCTCGA
+AAGGGTCTGATTACCCTCCACGAAATTAACACTGGTATTGAAAATTATACTGGCCTGTTG
+CCGGTCGCAAGCGGCTACATAGACCTCAGCGTTTGGCTCTCCGTCCGCTAGAAGCATATA
+TAGGGCAATGGCAGCGGCGATCGAGGATTTCCCATTTTTCTTTCCAATTTCTGTATACAC
+GGTTCTATACTGCCGGGTGCCGTCTTCCCTTAAGGTGCCAAAGGTTTGTTTTATTAAATC
+AAGTTCCCATGGAATTAGCTCAAAAGGCTGTCCTGCCCATTTACCTTTGGTGTGTTTTAG
+TTGCCGGATAAAATCGACAACGTGCTTTACCTTTTCTTCGCTGTAGAGCAAGGGCATCAC
+CTCCGATTAAAAAAACCTCCTACTTCGTTACTGTTAACAGCTTTTCCATGGGGTCGTCCG
+TGTTTACCGCTTCAGTGTCAACACTAATCCTCGTCCTAGCCGCCGGTGTTAAACCAAACT
+CGCTGCAGAAATCCTTCATCACTTTCAGGTAAGTTTGGGCGATGGAGACTTGCGGCACCT
+GCTGAATGTACCCGGATGGGGTTTTAAAGATGGTGCCGTGTTTGCTTAAAAACTCCTCGG
+CTTCTTTCCACCGGGCGTAGGCCTGACAGTACCCGGCAAAGGCAGCTTTATCCACCAGAG
+TTAAAAGCCCCATAGCTTCTAAGGTTTTACTCATCCGCCTCCATTCATTTTTGGCCTCTT
+GCTCCAGCCATGACGGGCAGCGGGGTGCCTTGTTTTCAGGCTTGGGTTCGTTTTCATTTA
+ATGGCCTTTTGCCGGGGTTTCCTTCCAGGACTTTAAGTGCGGTGGGTTTGGGTTTTCTTC
+CCCGTGTCGCCATAGCTTTTCACCTCCAATTGAAAAAGGAGCCTCACTTGGCCCCTTTGT
+TTTCTATTTATTTTCTAATCCCCGGAAAATTGTAATTCCCCTTCTTTATCTCATCAATAT
+CGGCCTGTACCGCCTTCTCGTAATCCCTGTCCTGCTTTTCTTTGGCCTTGCAATCCAAGC
+AGATGCAGTCCTGGTTGAACATGGACATTGTCCGGCCACCCTTTAAATCCCCGCCGCACC
+GATCGCAGTGCCTTTGGGAAAAGAATTTATCCAATCGAATCGCCCCCTGTTTTGGCCTTA
+TTTACCGCTGTCCGACCTGCCCCCTCTACAGCCGCCATAACCCTTCGCTGTGGCCCACGG
+GAACTCTCAGGCGACTTCGTTTTAATGCCTCCCGCAGTGGTTTTTGGGGCAGTCCCCAGT
+CCCGGTAGCCTTGTTCAATGATGTGATAGTAGCCATCGCTGGGTTCGTTTAAACCCTTGA
+TGGTCAGCACATAAGCAAAGGCCTGGTAAATGTTTCCCAGGTTGTCCTCTACCGTTACCG
+GCATTTTGTTATAAAGGCGGGGATAGCCTTCATAGCGGTCAAGTTTTTTAATATCTTCCG
+ACGAAACGGTGTAAATGGCACCCCAGGTAATTGCCTGTTCTTCTTCCACGATATCCGCCA
+CCCGGTTAAAAGTCAGTTGGTAGCCATGCAGTTTTACCCTGGCCACCGGTATTGCATCCG
+GGCAGCGGCTCATCATCTGTTCCTTGTTCAGGTTGCTGCCGTAGGCAAAGTAGTACATAC
+AAAAAACCCCCTTTTTTGGCTAAATGGTGTAAACCTATCTATCACTCAAAAACAGGGGTT
+TTGCAAGTATTTTTTATTTAAACCGGGCGTTATTCATCACTTCTAAGGCCCGGAATGTTC
+ATCTTGTCTGCATCAGCTTGGGTGAGGCCAAAATGCTCCAAGGCTTCTTCCTTGGTGATT
+TCAATCAGAAAGCCATAGTCCACGAATTGGCGAAAGGCACTTTTGGCCTTTTCCGCCAGG
+GTATCTCCGGTGACATGCACACCTTTGCCGTAGAAAGTCCAGGCACTATTAGCCATTTCT
+TGAATATATTCTCCCACAGTCATGGTGTGGGGGACAAAAGCAAAGCTCTTTAGTTCCTCA
+AACACTCCCAGTTCATCTTTGGCCACACTGACCCGTTTGCCATCCAAAGTCATTACCCGT
+AGATACATGCCTTCACCACCCTTTTTCCCACATATTAACATCTATTTATCAGAAAGGGAA
+GCCGGGCTTTAAAGCCCAGCCACCTGTCTGCCGTTTCTAAAGGCGCTGTCGCCTTCCAGG
+TTCTTTAAAAGGTGAAGCCTGGCGGTTTCAAATTCTTTGCCGATAAGGCCTAGTCTCAAA
+AGCCAGGTTCTAAAAGTGTACTTGGGGTTTGAGGTCTCAGTCTTCTTGGCGCTGGCGTTC
+TTTTGGCTTAAAGCCTGGTAACTTACCGCCAAGCAAAACTGTATGTAGGCTTTGACTTTC
+CCGGCGTGGGTGGTTCCGTTGAAAAGCCTAAACTCTACCGTGGGGCCGTTGAAAGTAGCA
+TGTAAGTTTAACCCGTGGTAGCGGCTGCTGTGGTAATGTTGGCTGCGGCTGCCGCTGTAA
+CCCTGGTACCAAAGGTCGGCCAGCTGCTCCAGCTCCGTTGGCTTTCGCCGGTTCAGTTCT
+GCCAAAAAGCTTTCCTTTACCTTTTGGCAGTACCGGCGTTTCCGCTGCTCGTCCACCTGC
+AGAGCTTGGTAAATCAAGTCCTCTTTGCTGGCCACAATGTTGACCAGATTCCGTAAAGTT
+TTGGCGGTGAATCTTTCTTTGCCAATGTGCAGGTGTATCCCGCAGCTCTTATTAGCGAAG
+GCCCCGACCTTTCTTAAGGTTCTGATGATCTCCTGCACCGTTTCGATGTCGCCGTAGGTG
+CAGATGGGGGAGACTAGCTCCACTCGGTGGTCTAATCCCGCTGCGATTCTTTTGCCTTGC
+CGCTTGGTTTCCGGCCTGATGCTGCTGTCGTTCATAATAAACCAGCTGCGGCCTTGGTTG
+TCCGGCGCTTCCCATTTGTCGTAGCCGCCGCCAAGGTAGTGGGCGCTGGTGCCGAAGTAT
+CCCGCCACTGCTTTGGCCGCCGCTTCCCTGGAAATCCCCGTTAGCTCAATTTCTATCCCG
+AAGGTTAAGTTTTTCATGTTTGGAAAACCCCCTGTGTGTTTTTGGTAGTCTATATATCAC
+TCTAAACACACATAATAGCAAGGGTTATTTTCCTTAAAAGTTAATATTTAGGCGGTTGTT
+TAGCCAGAGAAAAGACCGGTGCTTATGCCCCAGCCTTATTCCGCATCCACATATTCCATG
+ATTATCTGCAGTGCTCTGTCGTAGCTTTCGGACTTAAAAATCCGCTCTCGCATTTCTGCC
+GCTTGTTCCTCCAGCCCGGCATCTTTAAGTGTGCGGCTGGCGATGCCCATTAGGTTAAAG
+ATGTTGCCGTTTTCACCGACCAATTTGCATCTTGGTTTGGTCATTTACGCTCCCTCCTGG
+ACTTGTTTTCTAAAAGCGCTGTTACCGGGGAGGTTTTGCAAAAGAACCCGGCGGGCTAGC
+CTGTAGTCATCGCCTATCATCCCTAAGCGCAGGAGCCAAGTACGGAAAGTATACTTCTCA
+TTGTCGGTGGCCTTGACCTTGGCCGCTACATTCCGCTGCAGCCGCCTGACATTGATGTTT
+ATCAATTCTAAAAGCTGGGTGGCGGCTTCTACCTTCTCCGAGTCATCTCCATCCCGCCCC
+AGCTTGAAAGTAATGGCTCCCTTGTTGAAATCAAAGTCAATACCGGGGCAGCTTTTGCCT
+GCCAGTGCATTTTGGAAATGCTCCAGAGTTGTCATGGGCTGCTGGTTTAAAGCGTTAATA
+ACTTCCTTGCTCACCAAATCGGTATCAAGGTTTAACGCCTTTTTAATTAACGGCTGCTTA
+CTGTAAATCATGTGGAGCAGGTTCCGCAAACTCCGGCCATCGTAGCCTTCCAAAGGTATC
+CCTACTTCCAAAGCAGTGGGTTTTGTTTCGACAGAAGTGTTCGCTTCCGCAGTTTCCTTT
+TGCTCAGTTACGATCTCCAACTCCGGTTCCTCCTTCCCGCCTGCCAGCAGCGCCTCCAGT
+TCCAGCACCTGACCCTCGCTGTCAAGGATATTGCCTTGTCGGTTAACGGTATATTCGCCA
+ACTTGATAAGCAAAGCTGGGGGCAGCTAAATAGACAGGTCGTATTCCTAAATGCTCAGCC
+AGCTTGTGTACAAGCTCTTTTCTGGTCATCTTGGGTCCCCTCCTGTGATTTTTGGTATGT
+CTATACATCACTTAAAACCACAGGAATAGCAAGGGATTTATAGCAGGTCAGCGTATCTAA
+TTTTCTGGCCATCCCGGATTAAATAGACATCATTATCGGAGCCAGTGTGCTCAATGTATC
+TTTTCACTCCTACATCTACGAAGCGTTCCTCCAACTCGGTAGCATAGCAAATACGATCCA
+GCTGTTCGCAAGCAATCCCTGTTGAAAAGCTGCCGGAGAAGGGGTCGAGCACGATGCCAT
+TGGGAGCACTGCTGTTTTGGATGGGGTAAGCGCACAGAGCCACTGGCTTCGTAGTTGGAT
+GGAGTTTTGATTTGGCTGGCCGGTCAAAATTCCATACCGTCCTATGTTTTCTATCACCGT
+AAAACTTATGGCCTGCTGTGGGCTTCCATAGATATAAAATGGGTTCATGAGCGTATAAAT
+AGTCGCATCTACTAAGCACCGGTGCGTTTTTCACCCAAATGCAGGTTTGGTGACAAAAGA
+AGCCAGCGTCCCTAAAGGCGGTTCTAAAATTAACGGTTTCCCTGTCTGCATGAAAAATAT
+AGGCAACGCCACCGTCTATAACATTTTCATACATATTTGTGGCGGCCTTTAGGAGAAATT
+CGTAAAATTCCCTGTCTCCCATATTATCGTTTTTAATTTTCCCTGCCGTTCCTTCGTAGT
+CCACGTTATAAGGCAAGTCACTGACTATGAGATTGGCCTTCTTCCCATCCAACAATTTCT
+CGTAAGTTTCAACTTTGGTACTGTCCCCGCAGAACAGCCGGTGCCTTCCCAGCAGCCACA
+AGTCACCGGGTTTACTGATGACCGGTTCCTTCAAAGCTCCGTCCACATCGAAGTCATCTT
+CTTTGACATCCTTATCGTGTACCTTGGAAAATAAATCCTCTATCTCAGCGGCATCAAAGC
+CGGTAATGCTCACATCAAATATTCCGTTATCCAGTTCGCTGATTAAGTCGGCCAGTTTAG
+GCAGGTCCCATTCACCAGTGACTTTATTAAGCGTTATGTTCAGGGCCTTTTCCCGCTGCT
+CATCCAGATCCACTACTACACACTCAATCTCGGTTTCCCCTTGGTGCTGTAAAACTTTAA
+ATCTCTGGTGGCCCCCTACGATCTGACCAGTGCGTTTATTCCACACGATGGGCTCCACAT
+AGCCAAAGGTCTCCATGGATTTTTTAAGCTTCTCGTATTCCGGATCTCCGGGCTTTAAGT
+CTTTCCGTGGGTTATATTTGGCCGGGTTTAATTTCTCCAGCGGTAGTTTTTGTATCTCCA
+ATCCTTACACCTCCTGCCTTACTGCCTTCTCCCCGGTGAACTGCTCCCAGCGTTTAACGG
+CCAAATCACAATACCCTGGGGACAATTCCATGGCATAACAGTTTCTACCCAGCTGCTCAG
+CGGCCATGATGGTGGTGCCAGAGCCGCTGAAGGGTTCGTAAACGTTATCCCCCACATTGG
+TAGTGAGCTTGATGAAAAAGGCCGGTAGCTTCACTGGAAATGCGGCTGAGTGTTTTACGG
+AACTTTGATTGCCGGGTATCTGCAGCACATTGCCTGGCCTGGCAATGCCTTTTTTGAATT
+TACCGCTGACGCTGATGTTGCCGGAGTCGCCTTTGGATTTATTGTTTTTGCTATAGACCC
+GGATTAAATCAGACTGTTTCCCTACCGCCCTGGGTTTGAATTTAATTTTCTTAGCTTTGG
+TGAAGTGGAAAATGTCCTCGTACATTTCCACCAGGTCCGCCGGTAATGTTGCCAATCTAC
+CCTCATCAACATCTACCAGCTGCACCATCCAGTCGATCTGTTCCTTCTTGGCGAAAAAGT
+GTACCGGTTCAAAGTCATTTCTCAAGCGGTTAGACCAGCCACCGGGCAGCCCTGGCTTCG
+TCCAGATTAGCTGATCCACATACCGCCAGCCACCTTCCACCAAAGCAATGATGGTTTTCA
+TCACGTAAAGGGAACGCTGGCCGCCCTCAACGTGTTCCTTGATATTGACGAAGAAGGAGC
+CGCTGTCGTCAAGTATCCGGTAAACATTACTGGCCACATGAAAAAACCAGACCGGATATT
+CCTCTGCCGGTATCCCGCCGTAGTCGTCCTTGCGCTGCATGGCGTAGGGCGGGGAGGTAA
+TAACGCAGTTGGCTTTTTCTCCGTTCATCAGTTTTTCAACATCGGCAATATTTGTGCTAT
+CACCACAAAGTAACCGGTGATTGCCTAAGAGCCAGATGTCCCCTGGTTTAGTGATGGGCT
+GCTCCGGTGCTTCCTCGTCAAAGTTATCCTCCTGGACTTCTTCTTTAAAGCCCAGCAATT
+CATCTATTTCCTCGGCATCAAAGCCGGTAATATCTTTTAAGTCATCATCCAAGTTCTTGA
+GCAGCTCGCTCAGTTTGGGCAGATCCCATTGACCGGCGATTTTATTAAGGGTAATGTTTA
+AGGCCCTTTCACGGTCAGGTGGCAAATCAACCACGGATACTTCCGTTTCGGTATCTCCCC
+GCTCCAGTAAAATTTTTAGTCGTTGGTGGCCAGAGATGAGCACGTTGCCCCGCTTGTTCA
+TCACCAAAGGTTCCACCAGGTCAAATTCGTCAATAGATTTCTTTAATTTCTCGTATTCAG
+CATCCCCCGGCTTTAAGTCCTTACGAGGATTGTATTTGGCCGGGTTAATCTGGTCTAACG
+GGATGCGCTGAATCTCCAAAAGGGCCACCTCCTTCTTAACCTGCTTAAAATCGCTGTATT
+TCGTGCCATGTCAAGCATTAGACCTTGACAACCCCCATCTGGAATTTTGCGAATTCCCAC
+GCGAAGGCCCGCGCCCGCTCTGGAGCCGCTTAGCTGCAGGGTTTGAGGACCCCCTACCCT
+AATTTATCCACAGCGTTATCTACAGGTCAGGCTGGTAATTATACTAATAACTGTAAATCT
+TGTTTTTATCTCCCCAGCGGCCTTCTTTGGTGGTCTTGCTGTCATGACAATTTTTACAAA
+GAGCTTGTAAATTGTTCTCATCCCAAAACAGATTCAGATTGCCTTTGTGGGGTTTTACGT
+GATCAACTATTGTTGCCGGAGTAATCCTGCCCTGACGTTCACACTCTACACAGAGGGGAT
+GCGCCAGCAAAACTTTCTTCCTTAACCGCTGCCAGCGGGCACTGTTGTAAAGCTGTTTAG
+AATACTTGGGTCGCTCTTTCCGGTTGTACCGCCAGTTGTATTCCTGCATGTGTTTGGGGC
+AGAACCGAGCATCGGTCAGCTCCGGGCAACCGGGATGGCGGCAGGGTGCTAGTGGCTTCC
+TTGGCAATGGACTTCACCTTCCTCTCACCGTGCTGACACCCGGACCAGGAGATCCGTTTA
+TGTTTGTCACCGTTTACGGAAATGTTAATTAAGGATTTATGGTACTCGCTCTTTGGATTG
+CCACACTCGTAAGCCGTCCAATGTTTATCACTGGCGGATTCATCAATGGTGGCAAAGCGG
+CAGGATATACATTTCATAATGGCACCTCCATAGAAAAAGCCCTGAGAGCAAGTGTGCTGT
+CAGAGCCTGGTTATTTCCGTTAATAGTCGTGGTGGTATTCTACGGTGAGTTTAGTCACCT
+TTCATTATTATTCAGTCCTGTTTTTTGGGCATAGAAAAACCACAAGCTTTGTTGCCTGTG
+GTTTTAATTTTATTTATTTTTGCCTACGTTCATAGTTTTCCAAATTGCCATTGGGTGCTG
+TTTTATATTCTCCAGCGTCTTCCCAGAAAACAATAGCTCCGGCTGGTAGCTTCCCCTGGA
+GAACTGCTGTAAATATTCTTTATGCCTTGATGTTAAAACAATACTGTTTACTAGAAATTC
+CTTGACTTCTGATTTGGTTTTGTCCAATTCAAACCGTTCACTTTTAACCAGCATGGGATA
+TAAATCCTGATGGACTGTTCTCATTTTTAGCTGGTCCATCCGGTTAGGAGAAAAACTTAA
+TTTTGCCGCTTCTCCTGAAATGGAACCATAAAAAACTACAGCTTTACAATAGCTGACATA
+GTCCTTTTCAGAAAGAATACCATACTTTTTCACATTGTATAAATCGTAAAAATCCCTTGC
+CGCCAGACGGTTAAACAGAGCCGCTGTTTTGGAAGCCAAAAGTTCAATGCCATCTAAAGT
+TTTCACTTCTCCTCTGGCCCCAAATAAATCTGTATTTATTCTTCTCATTACGGGCGGCCA
+AATATGATGTCTTAAAGAATAGTTTATCTCAATTTTTATATTATCAAAATTACCTGCGTT
+GTTTTGAAAACGAGCTACAATTGATTCCAGAGCAAAATAGTCTTTTGATTTTTTGGATAT
+ATCATAACCTTGTCTCTCTAAATGTGCATATAACAATTCTTTTACTTTAATCCGTTCTTC
+AAGTACCTTCTCCCGGCTATCATAGGAGTGAAAATCTAGATCTATATCTACAGATAATCT
+GGGCAAAGCAAAGATAGTAAGGTTTAAGGCAGTCCCACCTTTTAGGACTAATCGGTCTTT
+TAAAAATGCATTGCTATTTATAAATTCTAGTATAACAATTAACCGGTGAACCTTCTCTAT
+TACGTCTTTGTGAAACCCTGTTTTTTCAGAAAGTTTCAGGTAGTATTTCCGATCTGGACT
+AAACAAATATATCATCCCTAACTTCAAGAGTTTTTGGCACTATCAGGGCCCATCTTTTTA
+TAAGCACACCGCTACCATTTTGTGCTTCTTCACTTAAATACTTTTTTGTATTTCCGGTCT
+TTTTTTCTATCAGACTTAATAAACCATCTGTTATTCCTAAAGATTGCTGGTGGCGCTCCA
+GGAAGTAGCCTGCCTTTTTATAAAGTATCTGTTTATTATACATTTCTAAATAATTTGCCA
+GCTTTGTTTCATCCAGAACCGTACATATTTTTAATATCTCATCTAATTCATGGACCCCGC
+CACAGTAATCCGGCCTGTCTAGAGAGTCAACAACTGTTCTTTCTAGATCTGTCAGTTTAA
+CCTTGTCATTTAAACGATAATGAGTAACACCCTCTTTAATGCCTTTACCCACATATTTGT
+ATAAAACTCCTTCAAATTCAAAATCGGATATCTTTTGTTCTGAGGACACATAAACTACAA
+AACTTACCTGGTGGGATAATCCATGGACCTCAAAGGCAGAGTGGTATGTCAAATAAGCAC
+TGTCATTTATTTTACTACCCACCAAATATCGATTAGCCGGCGCATCTCTGTTTTCTAAAT
+TTACAGCACAATACAAATCTCGGCGTACTCGCTTGACAAGGCCATTTTTTACATATGAAT
+TTAATAACACCTTGGCGTTTTCTATGCTCCCTACAACTTTTTGGGCATCCTTAAGGTTAA
+ATACTTCCATCTTTAAGAAATCTTCATAATACTTCATGTTAATTGAATCACCCAGTTCCT
+TGTTTTGCCTTTAAGTTAATATTAGTATTAACCTTCTAGGTAAATTTGATACCATTATAC
+TTTAAGTTCTTTATTTTTTCAATAGGTTAATATATATATTAACTTTCTAGGCAAAAAAGA
+AACTAAAATGTTTACAGTTCGACTAGTTTCAGGCATAGAAAAAGCCCCGAGGGTTTAATC
+CCACTAGGGCTTGCTATCAAGAATGCTGCGTTTCCCCGGAGTCGTTGGGCGATCTATCCT
+AAGGGCCTATTCAAACAGCATCTGGTGCTCTTGATATTTTTCCATGCCTTTACAGGTATA
+ATATAACACATGTCGGGGGTGGATTCTACTGGATTTTACTCCATTTTACTGTATTTTACT
+ACCCTCTTTTTTTATTCTGTTGACTTCTTTCAGGGCTCTACTATGGATCTTAAAGATTGA
+GCTGTCCCGGTAATTCAGGCTACTGGAAATCTCATCCCAGCCTTTGCCGTTGATATACCG
+CATCTCCAGTATTATTTGACCGATAGGGTCATCCACCTGGCTGATGGTGTTCATAATTTC
+AGCTTTGATGGCAATTGACCGGGCAAGGTCCTCTTTGATTTCTTTCTCTAAATCCACAAT
+TTTAACCACCGTATTTTCCATCTGGCCTTTTTTATTATTGCCACCGGCCACCTTTTCCAC
+TGTCAGGTTAGCCGACACCTTCATGGACAGTTCCCGCAGTGTTTGCAGCTGCTCTAGCTT
+GGTGTTAACCCGCTGGTCAAGCCATAGGGCTTGCGATAAATATTCCTTGGCATTCATGCT
+CTTTCACCCCCGTAATATTTTTCAAAAATATGTTTCTGCCTCTCCGCATCCAAACCACGA
+ATCCGCTCCAATGCCTTTTTTTGACCCAACTCAAACTGCTCCTTGGTTTTATAGAAACTG
+CAGCCTTCACACTTTTTTACTTTTAAGGCCGTGCAGCTGTTTCGTTTGTAAGCAAAACAA
+CCGGTACGCATGATTACTCCACCTCCTGATAAATCCTGGCCTTCACTGCTTCGATTAGTG
+CATTTTGGGTTTTATCTTTTCTTTTCAAAGCGTTCATAACATCTTCATCAATGGTGCCTT
+CAGTGATGATGTGGTGAATAACAACCGTATCCTGCTGGCCTTGCCGCCACAGCCGGGCAT
+TGGTTTGCTGGTAAAGTTCCAGGCTCCAAGTTAAACCAAACCAGATTAAAGTGCTGCCGC
+CTGCTTGCAGGTTTAGCCCATGGCCAGCGGAGGCGGGGTGGATAACAGCCACCGGGATTT
+CACCTTCATTCCACCGTTTTATGGAAGTGGTGTCATCCAGCTTTGTAGCCTTAAACCGCT
+TTAGTATCCGCTGTAGGTCATGCTTGAACCAGTAAGCAATTAATACCGGTTTGCCGTTAG
+CCGCTTCGATTAAATCCTCCAGTGCATCCAGCTTACGGTCGTGTATCTGCACCACGGCAC
+CGTCTTCATCGTATACAGCCCCGTTGGCCATCTGAAGAAGTTTACCGGACAGGGCTGCAG
+CGTTAACGGCATCAATCTCTTTGCCTTTTAGCGGCAGCACTAGTTCCTGCTGCAAGGTAC
+GGTAGTAATCCGCCTCTTTGTCCGATAGCTTGACGGTTACTTCGTTCATCACCAATTCCG
+GTAACTTCAGGTAGTCGGTATTCTTCATGGATATCGTGATGTCGGAGATGCGCCGGTAGA
+TGGCATATTCAGCACCGGGCTTTGGTTTATAGCTGAATACAATCTGCTGATTCCTTTTAT
+CCGGTACAAAGTAGTCCTCTCTATATCTTCCAATAAAGCGGCCCAGCCTGTGGCCCATAT
+CCAGAAGCCGGAATTCCGCCCATAAATCCATTAAGCCGTTAGCCGATGGTGTGCCGGTAA
+GGCCCACAATTCTTTTTACTTTTGGCCGCACTTTCATCAGGCTTTTAAACCGTTTGGCCT
+GGTGGGATTTAAAGGAACTTAGCTCATCTACCACCACCATGTCGTAATCGAAAGGCAGCC
+CGCTTTTATTAACTAACCAGTCCACATTTTCCCGGTTGATGATATAGATATCGGCTGCTT
+GCAGTAATGCCGTTTTGCGCTGTGCCTCTGTGCCAATGGCCACTGCAAACCGCAGCATAT
+TTAGATGCTGCCATTTAATTATTTCCTCCACCCACACAGCCCCCACCCGTAGAGGGCAAA
+TTACAAGCACTTTTCTGATTTCAAAGTAATCAAACAGCAGGTAGAATAAGGCCGTTAGGG
+TGATTACCGTCTTGCCTAAACCGCAATCAAGGAATATAGCGGCCTGGGGATGGTTTAATA
+TAAAATGGGTAGTATACTTCTGATAATCATGTGGTCTGTATTTCATTTAAAATCACCCCA
+ATCTGCCGCTGCTCGTCCAATACGTATACCTTAAATCCTAGCCGCCTCAGCTTTTCGTGT
+CTTTTTACCTGCAGGGGCCGTGGTTTTATGCCATAGCCCTTGATCTCAACGAAGGCTATT
+TTGCCTTCTGGTAATAACACCAAGCGGTCAGGCATACCGGCAAGACCTGGACTGATAAAC
+TTTGGCGCTATACCTCCCGCCGCTTTAACTGCTTTGACTAGCTTTTGTTCAATATGTTTT
+TCACTCATATTCCCCCTCCTTAGCGTCAGGGATTAGTGGGGGTGTGAAGGTCGTGATGGT
+CAATTACATAACTTTATATATATAGTTTTATTTATTTTTTTTTTGCTATAGGAAACTCTA
+TGACAAGACCTACATCGACCTTCACACCTAGGAAAATAGCCTATTCTAGAAGAAAATCAG
+ACCTTAACCTTAATCCCTTGACAATAACTCCTGCTCTTGTCCTTTGCCTTTCAAAATCTT
+CCATTTCAAGCGCCGCGTAGAAATCGGTGGTGCTCCTGGTATACTCACCTGTCCTCATGC
+AAAAGGCCCGGTACTCGCTGTATAGTTCACCTGATTTTTCAGTGAAGGTTCTATCCAGCT
+CACAGCATTCCTCAAGGAAGTGGGCTAGCCAATCGTTGTTTTCCTTGTAGGCGGAAATGG
+CATCCTTCACTTTTTCCGGTAGCTCGATCTGGTAATCATCCATAATCACTTTTTTGGCAC
+CTTCGATTATCCAGCTAAGTATGGCCCCGCCCGCTTGCTCGAACAGGTAATCGCCGTAGT
+TTTTAATATCGGCGCTGCCTTCAATCTTGGCAGTAAAGGGGATAACGATTAGCCGCCTCC
+AGGTACCGGTGTCCAGGGCTCCCACCCTTGGCAAGTGGTTGGTGTATAACACCAAGGTGT
+GGCTGGGAATATAGCTGAATGGGTCTTTGTATTTCTTTTCCGCATAGATTTCATCAGTGG
+AGCAAAGCTGTTTGACGTTGGAGGTATTTAGCCGCATGCCTTCTTCCATCTCCGCTGCAA
+TTAAGAGCCTTTTTCCCTTGGCCTCAGCCAGTTCTGGCTTTACATTTCTCCGGCAGCCAA
+CGGTCAATATATCGGCGGAAATATTGCCACTATAGGTGCCCAGCACTCTGGAGATTGCGT
+TCCAGAAGGTAGATTTACCATTGCGGCCTTCCCCGTGGGCGATAATTAAGGCCTCCACGT
+AGACCTTGCCAATGGCGGCCAGTCCCACTACCTTTTGCACGTAGTCAATTAGTGACTTAT
+CATTTAGGAAAAAGGTATTTAAAGCATCCTTCCATTTATCCATACCTGCAGTACCCGGTT
+CCACCGCAGTTTCTTTGGTAATAAAGTGACCAGGATCATGTTTCATTCTGGCCCCGGTTC
+TTAAGTCATAGGTGGCCTTGGGTGTGTTTAGTAAAAATTCATTGGTATCAAGAGCACTTT
+GGTTAATCTCCAGCATGGGCTGAGCTTCTTTTAATGATGCCGCTATATACTTTGAATTCC
+GGCGCTTGATGGCATATTTCCTATACGCATCGGCGGCTTCAAACTTTTCATAGGCATGGG
+ACTGTACATCATTAAAATCAGCTATTGCCTTTTTGGGACCCTTGTCGGCTAATATGTCAA
+GTGCACCGTTTTTCTCCATCTCATCCATGGCTTTTTTCATTTCAGCCCTGGCTTCTTTCA
+GTTGCCTGGTGGTAAGTTCCTGGGCTATGGCCTGGGCTTTGGGCTTTGATTCCTCCCAAA
+AGCTGCCGTTGTAGACAATGAAATCTGTAGCCGGGGAGTACCTGAGTTTGTCCTCATATT
+CCCTGGCTAAAACAACTGCTTGGCCTACATCCGAAAAATCTGATGGCTTTAAAACACTGT
+CTGAATTGTAGACCTCCGGTGGGATATACCCGGCCTGGGCAGCTACCTTTTCCCCGAAGC
+TGACAGCACTGTTCCAAATAATTTGCAGTTCCTTTTCCTCAAGCGGTGGATTGCATTTTT
+CCGCCAGGGCTAGAAACTTGGAGTGGGCTTCTTCGGTGTTGCCAAAACGCTTGATGATTC
+TCCCGGCATAACGGGACATGGTGTTGTTGCGCTGCCCTTGGGGTATTTCATCCTGGCTCT
+CGTCCCAGTCGGTAAAACTGCTGTCCTCCAGGAATTCTTTGATGTTGATGTCCCCTTCGA
+AAAGCTCCACATTACCGTTATCCGAGCCGAAGATAAACCTGGCACTGTCAAGGGCGTTGC
+TATCGAAAAAGGGAAACCTTGATGCCACGGCAAGCTTTAAGGCGGCGTATTCTTTCGGAT
+CAGTAATTACCGGAATAGCAAAATACACGTGGAACCTGGGCCGGGGTAATTTATCGCCTT
+TTTGCTTCATGTGGTTTCGGCTATAAGATACGACAAAGGGAACCCCTGGGAAGGCCGTGG
+CAACATCATCGGGGGTAACCCAATCCTTGGGATCATCCGAGTGGTCGTTATCGCAATCGA
+ATACGTTATTATCAGCCTTGATGAAATTGGCGTTGCTGCGGTAGTTGCCCTTATACTTCG
+CACTTACGTGGTCAAACTTGATGGCTTCGATGAAGGAGGCCTTGTCTTTGATTACCACCT
+TGTTTGGGTACAGGCAGTTGGCCAGGTTCCCCGTGCAATTTGCTGTGTAAAGGGTAAATT
+CAATCATTCTAAGACCTCCTTCCCGCCCCATTTGTTAGACAACACATTGAGTCACCTCCA
+GGAAATCTTCCCAAGCAGTGATGGGATAACTGTTAACGGTGCCAAACCTTTCATCATTCG
+TTTCGCACGTCCTTATTTCAATAGCACGGGAGCGGCAGTATGCAGATAAGCGTTTGCCGA
+TCCTTTGGCACTGTTTTAAATTCCAGCCCATATTAAAAGTCCTGTTATATTTGGCCACGG
+TATAAAACTTAAGCGATGAATTAAGGGCGATTTCAAGGGTTTCATTTTCCTCAACCAAGG
+CAAATATCTTTCTTTCAGCTTCAATGGCTTTTTGCTGGGCGATCTGCAGTGCCCGCTCCA
+TAATTTTTTCAGGGGAGTTCCAGGCTTCCTCGATGGCGATGAAGTGTTCCCTAAACTTTT
+TCCCTATTTCATTTCTTTGGATCATGCAGATTTCTTTTGCCATGGATATTGTTAGGGAAT
+GATCAGTTTTTGGTTTACCGGGAAGTCCATCCGATCTAACCGTCAAAAATGACGAATAGT
+CTTTTCCTTCTTTAAAACCGTATTCTGTCATTCGGCTAAACCATTTGGCATACTCGGTTC
+CTATTTCCAAAGCCTTGTGAAGTTCACGTCCATTAACCGTAGGGGTATCATTTTTATAAT
+CAATTGCAATTAAATCGTGCATCTCCCAACCTCCTCACCTTTACTGTCAAAGTACCTAAT
+AGGCATACCCCGCCGTTCCGCTTTAGCGATTTCAGCAGCCATGCCGCTACTGATGTGGCT
+ACCAAATACCCAAAGTTCGTCACATTTTCCAAGCAGGATTAGAGCAAACCAAAGGCCCAG
+TTCCCGCTGCTGCCTGTCCCCATCGTCCATAAACTGCGGGTAGTGCAGGTGCGGGGCCAG
+GGGAATGCACCCCAGGCTGACCGCCAATCTGCAATAGCCTCTGGCTCGTTCGATGTTCCT
+TTCCATATCCCCGGCAAAAGGTGATGCTATATACACCAGTGGCCGATAAATCTTGACTGC
+TTTCAAGGCTTCATATGGTGTCGGGTCGGAGTAACCCTCACTGTTGCGCCAGTCCATCTA
+TCTCCCTCCAATCTGACCCGGCTGCACTCCGAGCAAAATACTTCAGTGCCATACAGGTCG
+CTATCACCGGTGCCCAATATCTCAGCGAGGTCAACTTCTACTTCACGCCCACAACCGGGG
+CAGATGCAAAACACATTGTCATCATGGATTTCCACAGCAATTTCCACTTCATCACTAAGC
+TGCGCTTTTACATAAAACATAGGTTTTCTGCCTCCTTTACTTTTCACAGGACAGTAAGCA
+GTGGTTTGGCAACTGACCTTCTAATATACACAGGACATTTTTGATGGTTTTGAGTACCCA
+TAAGCGGAGAAATAATTCGAACCCCCGCCTGTTACCTGATGTTGCTGGCAACATGATTTT
+GTTGTATCGTTAATAAAAATTAATTTATACTGTTGCCAACAACATGAGGCTCCTTACTAT
+CTAAAGGACAGGTACCAGCCAAAATCCGTAGTTAATCTTTCTGGTAAAAATCACATTCGA
+AGCCCTCCGCCCGAAGTAACAGCCCCTTGGCCCAAGGCGGAATTTGGCTCATTTGTTCGC
+ACACCGTCCGAACTGACATTTGCTGTTCAGCTTCGATGACGATTTCGTCATGGATGTGCA
+TCACGATAGGCAAATGCCGCAGGTTCTGCATGGCATAACACAGAAGGTCACGGCTGATTG
+CCTGAATAATGTTTTCAACAATTTTCGCACCGTATGTTTCCAGCCGCTCCCACTTCTTAG
+CCGCACCAATACCTTCATAAGTCACACTGTCGGAGCCAAAGTGGTTAGTACCAATGCGAG
+GTTTCACATAGGCCAGCCGTCTGCCAGAAGGCAAGGTGATAAACAGCATTCCGCTTTGAT
+AAGCAAAACGGATACCGTGAGTTTCTGTGGTGGTGCGTTCCCGAACTGCGGTTAATGCCG
+CCCGGTCAACGTCCCACCAAAAGCGGACAATGTTGGGGTTGGCTGCTCTCCAGGCATCAA
+CCAGTGGTTTTAGTTCTTCCTCTGTAAGTCCCATTTCCAAAGCACCCATGGCCTTTATTG
+CACCCACCGAGCCGCCGTAGCCGCAGTTATGAACCAAACACAGCCGCCGTCCGTTCCATA
+CTGCAAACCGGTGCCGCCTGCCGCAGTTCACCAGGTCATATACCCGTTTTACCCCGGCGG
+GGGTAGGGGATAATGCCTGGACAGCACTATTTGGACGATAAACCCCGGCCCAATGAAGGC
+CGCCACTTTTACCGCTTTCCACCCAGCCCTGATTAGTTAAAACCAGGTGGTCTGGGGTGC
+ATATCACACCATCAACGTTTACGGTCTCCCGCTGGCCTTTGTGAACTAAACCTCCATGGG
+TTACCCACCCTTGGCCATCCCAAACTTTATGTTCTGTGGTAACTTCCTCTATGGGTACAA
+GTCCTGTATCCGTCAACACCAGTTGCCCTTTCGCTATACAGGCCAAATCCGCAATTTTAC
+CTTTTTGCCTGAGTGGGTCTTTTTTATCTGTAATAGGCACACCAAACATCTGACTAGCGG
+TAGCGATGTATAAATCCTTTTTAGCAGCGTAGGCATCTAGCACCCACCGCTCCCCGGCAA
+GCCAGGCCAACACTACCCGCTCGATTGATGAGAAATCCGCCACGATGAATTTATAACCGA
+GTTTGGGAATGAAGGCGGTTCTAATTAATTCCGACAGCACTTCCGGCACCGAATCATAGA
+GCATCTCCAAAGCGGTAAAATTACCGGAGCGCACAAGGCTCCTGGCTTGTGCCAAACCAG
+GCATGTCGTTCCTCGGTAAATTTTGTGGCTGTAAAAGCCTGCCTGACCATCGCCCGGTTC
+GATTGGCACCATAGAATTGAAATATTCCACGAGTGCGATTATCTAGACAGGCCACGTTTT
+CCATGGCCTGATACTTTTTCACTGATGATTTAGCCAGCTGCTGGCGAAGTTGCAGCACTT
+CATCCAGGGGTTTAGGTGCTGTTTCCAATAGCTCCGCCACAGCTTTTTTGCCCAGGGTAT
+CTGTCTCAAGCCCATGGTCAGCTAACCATTCTTTTAGCTGTTGTACGGAATTGGGATTAT
+CAAGGTCTGTCAGCTCGCCCATTCTCCCTAATAGTTCAGAGCGGGTACGCTCATCGGCTT
+TAATGGCTTGCTGGACAAGGGTCATATCCAAAGCCACACCCCGGTCGTTTATCTCCTGAT
+CCAGGTGGAATTCGTCCCAAATGTTCTCCGGCACGGGAAACTTGGCTAACCTTTCCTGAA
+TGGCTATTTCCACCTCCACATCCCGGCGGTTATAGGCTTTGAACTGTTCCCACTTAGCCG
+GGTCATGGATGGGCAGATTCCTTGTCCGCTTACCGTTAGCAATAGTTGGTTTACACGGGG
+TGCAGAAGTAGCGGATTAAATCTTTCCCTTCCGTTAATTTTTGTTTTTCCAATCCCAGCA
+CCGCACCCACTCCTTCTAAAGAAAGGGGCAGTCCCATATAGGCCGACCAAACCATGGTGC
+AGCGCCAGGGCCTTGGATCGAGATATTGAAGTCCCAACCAGCGGGATAAACAGATGCGTT
+CAAACTGACTGTTAAAGGCCCACTTGGTAACACCAGGGTCAGTTAATGCATGTATTATTT
+CATCCGGCAACTTCTCACCGGCGGTAAAATCCACTACCTGAACCTCACCGCCATCCACGC
+TGTAGCCAAACAGGAGTATTTCAAAATCGTGTGATTCGGCGTATTTATAAACACCGGTCT
+TTTTAAGGTCTGCACTGGAAAATGTCTCAATATCGATTCCGAGCGTTTTCATTGGATTCT
+CCTTTACAGGTGTGGGGCAGCGAGGCAAAACCCCGCCACCCCTGCAGTCACTAGGAAAGG
+AAATCATCATCGTCAGCAGTGGCGAAGTCGTCCTCTGCCCTGGACTTGCCGCCGAGCGGT
+TCGCCGTCACGGATTTTCTGCAGATTATTGAGCCCACATGCGATCCCGCGATTTCCCGAA
+CTATTGTAGGCATAAAAATTGATACTGGCCCGGCCATAAACACCGCTGTAAACCTCGGAG
+CGCTCCAGGATGGGCTGACGGTCGGCATCCACAATGCCCGGTGCAGTGGTGGAATTGGCA
+TTGACGAAATAGGCATTGGCGTATGCCGGATCATCGGGTCTTTCGGTATCGCCGTCCCTA
+AGCGGTGTCTTAATAGCGGAAAGAGGTGGTACCGTTTTACCGTTACCCTTCAGCTTTGCT
+TCCCCCTCACGGTAGGCAGCTTCGATGGCAGCTTTAATCTTGGCCACCGTTTTGGTGTCG
+CTCTTTGGGACAATCAAAGATACCGAGAACTTTGGGGTGCCGCCGTTAATTGACTTGGCC
+TCCCACACATTTGCGTAGGACCAACGAGTATTAGGTCCGGTAATAACTTTCATAGGGTTT
+TTAAACATATGATTTTCCTCCTTAATTTTCACTAAAGTCCTGTTGTGCTGTATTGATAGC
+CGGGCGTTTATCATCCACCGGCACTAAAGTCGGTTTTCCAGGTGGTTTTTCAACCAATCC
+ACCTAGCAGTTCAGTAAATCTGGCTTTGCCGAGGGTTTTTTCCATGACAGTGATGCCCTT
+CAATTTTTGTTCATATGGGTCATAACCCGCTGCCTGTACCGCCTGGGCTACCGCATCTTC
+ACTAATGTACTTGCGAACACTTCTACCTGCGACCAGTTTCCAGCCGTTCCACTCCTTACC
+GCCCAGGGCCGCTTGCAAAGCGTAAGTCTTGATGTCACCCGCCCAGGATATGAGTTCATC
+GATTCTGCCCAGGATGGCTTCCACTTCATCGTCTTCCAATAGTGGTGGCAGCTTGAAGTC
+AAAACGAGCAAATTCCATGTTGTGTTCAGCCCTGGCCCGGCACTCGTGCTTGGCCTTACA
+GAACTGACACCACTCGCCACACAGGAACTCCCCGCCACCGGCGTAGGCCAGTTCAGCGAT
+TGGCTTTAGCTCTTCCTCTGCCCAGCGGTAGAGGTCTTCCTTGGTCATGATGTAGGTGCT
+GATGTTGTCCCTGCGGGGCTGGTAGATGGTCATGGATACCGTTTCGATATCAAACAGACA
+ATCAAATATCTCCAGTGCCCCCAGCCCGTACAGCATCATTTGCGGGTTTCTTTCGGCTTC
+CACCAGCACCCCTTGACCATGCTTGTAATCAATGATGTGGAGCACCTTATCGGCGATAAC
+CAGGGCATCCCCGGTGCCAAAGCCGCCCTCTGCATATCTGGAGTAGTCCAGCCGCTGTTC
+AATGAGGACAACTGGATCGGTGCAGGTATACTTGGCCGCTTCCACCAACTCCATGATGTA
+GGCTGCGTAACCATCCGCACATTCCTCCATCTCTTGGCTGTAGTAACTTAAGTCAGCAGT
+TGGGTCTTTTGCCTCCATGCCCAAGGCCTTTTTCAACTTGTATTCACACAGGATATGAGC
+GGCTGTACCCTCGGCGGCGTAATCGCTGCCCCTGTCCTCGTAGTTCTGGCACAGCCGGGC
+TGACGGCGGACATTTTAACCACCTGGGGGAAGCTGAAGCCGAAAGCAGTGCGTGTTTACC
+CATCGCCCAGCACCTCAGCTTCCGCTAAGAGGGTCTTATAATTTGCCGGGTCAACCTCCG
+AAAGCCTGGCTGCCCCGTGCTTTTCAATGAGCATTTTAACTTCTCTTGTAAAACCGCTTC
+TGGATTTCTCCGCCAGAACTGCCCGGACAGTTTCCAGGGTGATAGGTTTTTCCTCCGGTG
+CTGATTCTGGTTGGGGTGCTACTTCGCCGCCAAATAAGTCATTAAGTGAATCTGCTACAC
+TAATTAGCGATTGGGCTGCATTCCTTAGCTCCGTTACTGCTTGCGAAAAATCACTCATCC
+TGTTCACCCACATCCCTTCCTTCCTCTTTAATGGCGTCCTGGTGCTGAAGCGTTAACAGC
+TTCCTTGCTAAACGCCGGGATACGATACTGATGGCGCTTAGGATGCCAGCCAGTTCTTCA
+TCTAGCTCCGGGTCCCTAAGATTCGTTTGCATATTGCCACCTCCATTTCTAAGGGCCTTT
+TTATCCCCTCACCATACACAGGACATTTTTGATGGTTTTGAGTACTAAAAACTGCCCTTC
+AATATCCACAGGACATTTGGGGGCAGTTTGAGTACCTTTTTATCTATAATTTTTTAGGCG
+CTGGTGAAGCTGACCGAAAATCTTGGCCTTGCGCTTGTTTACCGTCCTTTGGGAAAGTCC
+AACCTTATCGGCAATCTGCCGCTCCGACATTCCGTCACCATACAATTCAGCAATTCTTTT
+ATTTTGCGGATCTAGTTCATCAAGGGCTGCCGCTAGTTCCTCAAATAAAAGCTTTTCCGC
+TACCAATTCGGCAACATCAAAGGAACCGGGTATCTCGTAACCATCCTCTGAGAATTTTTC
+TAGTGACAAAACGCTACCGATGCGCTGTTTATCACACTGACTGCAATCCTCCATACAACG
+CTTTGTTTTACCCTTGCCATCACTAATCAAGCATCTTTTTTCCCGTTCCTGACGTTTCAG
+CTCTGCCCACACTGGTCGCCTATCGGTCCTATAAACACCCTCCGTCACCGTAATTTTCTT
+GCCATCAATTGTCAGGTAATACTCCTTGTTTGACTTCTGGTTGTCACCTTTTGGCATAAA
+AAAGCCCCTTTCCCGGTGAGAAAAGGGCATAGGAATTAGCCAAAAAACTCACCGTTTTTT
+TAAACGGGAGCCGTTTGGCTGCACCAAATTTATTGTGGAATTGCTTCCTTCACCTCTACT
+ATCGTCCATAAACAGGGTGCTGTGGCGGACACTTCATGCCCGCTTTTTTAGGGGCAAAAC
+AGGTTTTTTGGGCAAAAAAAAAAGAGCCATACACAAATCCTTGTTTGGATTCATATATGG
+CTCTTAGGAATTTAGGAATAAAAAAACCGGACACCACGTGTCCGCTTTGCTAAAAAATAT
+TTTTATAATGGCGCATCGTTTTCTTGTAAAAAGGCTCTGATATCATCCATTTTCTTGGCG
+TATAGGTGGTTTAGCGCAAATTTATAATAAACATGGCTTTCGTTAGTGTAGTTTAATGAA
+TATGGAGATCTTTCGATGATATGACTACTGATTTCCGGCGGGAGATGCAAGCTGAGGCAA
+ATTGAAACTAATGAATTAATAGAACCCTGCCCCTCACCATTGACGATCCGCCGGATGGTG
+CGTTCATCAATTAGCGTCCTTTCCTCAAGTTCTTTATATGTCACGCCCCTCCATTTCTTT
+ACCATTTTGAGGCAGGCGGTATAGCTATTTGGCAATTCACTATACATACGAGCATTTTCC
+GCTAACACATCGGCTAACAATGCTTTCCTTTTTTCCGGTTTAGCATGCTGGTAGCCTTTC
+CCGTAAACGATATCAAAACTTATGACAGCGGCTTCATCCCTATTTAGAAAACATTCCCGG
+TGGTATCTTTCCCGAACACCAGCTCTAACTGATAGGTCAAATACTAAACAACATTCTTCC
+ATATGTGTCCTGGCATAATCCGTTAGTTCGGTCTCCCCGAATAAATTCTGTGCTACATAT
+TTGGGATGGTTTAATACAAAATGGGCATCTACATACAGGTAGCTGCCGTCTTTCACCAGG
+GGGATTAATTCCGGATTGGTTATACTCTGAATTGCCGCATCTTCAGCACCGATGGAGAAG
+GTCTGATTCTTTAGAAGTGCACCCTTTTTAAAGCTGTGGGGTTTAACGTAGCGCCCGTCT
+ATGTAGGTGAAAGTACCAATGGCTTCTTCATACCCGGCGTTAATCATGCGGATTTTGGCA
+GCCTGGCGAGAGACGCAGAAGAAGATGCCCAGTGCTTCGATGACCGGTTCCATCACATCT
+ATTAGTTCAGTAGTTCCCAGTTCCCTTTGAAATTGCTTGATAAGTTCAAAGGCCTTGGTT
+TTAAACGTTCCCAGGGGCATTTGAATTCTAGGGGCTAAGGAGTTAGCCTGCCACTCCATC
+CAGTCGGTGGCATCCTTTTCACCGTCCTTGATGCCGCCAACTGTTTCACACCTAATTCTA
+CTGGCGCTGGCGTTATATAGGCGTTCTAGTTCAAAGGCTTTCCTGTGCTTGTCCCAGTGG
+ACACATTCATGGACGATAGTATTATTGACGGCACCCAAATTGCGCATGAAATATGCCTTG
+GGGTCAACGAATATCGTCTTGGCCCTGACTGATGTTTTTATTAACTGGTCTACTTCCGAA
+TCATAAAATTCCGCCTCAGCATCGTGAAAATATATCTGGCCGAAGATGGATAAATCCTCG
+GTGATGTCCCGTACTTCTACCCTGAGCCCCATTCGCTCAGCCAATTTTGATGGGTCAAGC
+GGCATGGGGGTTTTTAAGGCCTCCGGATAATATTTGCTCAGGAAGTCAACAGCTACCTTG
+TCCAAGTCCTCTTTATAAATGTATGGAACCAAAGCATCGGAAAGGGGTTTGGGCATCTTT
+CCCTTTTGATATGGGATAATGCTTCTGATCTGAAAATCATCCAGGTTACAGGCTAGATCC
+CCGGTGCATCGGATGGAAAGCCATTGATTGCAGATATCGTAATCATCATAATGGTAGTCG
+CCCTCTGTAACTTCAATTTCAGCATCCACCACGACATCAAATTCTATTTTCAGATCCGGG
+AGGTCGTAAACCGTCACGAATTTAATTACCATATCCGACATGGCAACCCCGCCAACTTCA
+TGAACATTACGCAGATATAAATCTAAACTCTCCCAATTTTGCTCGACATATTCTTCTGCT
+GCAGGATAAAGGTCATCAAGAAACCGGCTTTTTACATAATCGGTAAAAGAGCGATCGCCC
+GCCACGTCATAGCCCCCCTTCCCCCATAGGTAAATTATAGCACATATTGTCGCATGCTCA
+ACCTGATATTTGCATTTGTAAATTTTAATTGCGCTATAACTCTTTTTGTGTTAGTCTTTA
+TAGGCAGCTAAGTGAGGTGGCAACATGAGGACAAGTTATAAGAAACTATGGAAGCTCTTG
+ATAGATAGGGATATGTTAAAGAAGGATTTGCGGGAGACTGCCGGAATCAGTACAGCATCC
+ATGGCCAAGCTGGGCAAAGGTGAAAATGTGACCACTGACGTCTTGGTTAAAATATGTAAG
+GCTCTGGACTGTGATATTTCTGATATCGTGGAGATTGTGGAGGAATAA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_000913.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,144 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_000913.3|provirus_563848_584430_520	563848	564480	633	-1	0.368	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_521	564815	565978	1164	-1	0.467	11	GGAG/GAGG	GENOMAD.133037.VP	1.252e-16	85	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_522	566098	566361	264	-1	0.496	11	GGA/GAG/AGG	GENOMAD.095346.VP	5.936e-50	171	0	0	1	2561	Caudoviricetes	NA	NA	PF09588;K01143;COG5377;TIGR03033	Phage-related protein, predicted endonuclease
+NC_000913.3|provirus_563848_584430_523	566684	566779	96	1	0.521	11	AGGAG	GENOMAD.086130.VV	3.579e-13	62	0	0	0	2561	Caudoviricetes	NA	NA	PF08222;TIGR00373;COG4519	CodY helix-turn-helix domain
+NC_000913.3|provirus_563848_584430_524	566842	567141	300	1	0.500	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_525	567138	568004	867	1	0.551	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_526	568315	568647	333	1	0.411	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_527	568902	570428	1527	1	0.356	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_528	570893	571444	552	1	0.424	11	GGAG/GAGG	GENOMAD.189584.CP	1.606e-07	53	0	0	0	1	NA	NA	NA	PF01161;COG1881;TIGR00481	Phosphatidylethanolamine-binding protein
+NC_000913.3|provirus_563848_584430_529	571454	572251	798	1	0.362	11	AGxAGG/AGGxGG	GENOMAD.166602.PC	1.614e-10	64	0	0	0	1	NA	NA	NA	PF06719;PF12833;TIGR02297;K18991;COG2207	4-hydroxyphenylacetate catabolism regulatory protein HpaA
+NC_000913.3|provirus_563848_584430_530	572466	572921	456	1	0.504	11	GGAGG	GENOMAD.022699.VV	2.722e-81	265	0	0	0	2561	Caudoviricetes	NA	NA	PF05772	NinB protein
+NC_000913.3|provirus_563848_584430_531	572921	573091	171	1	0.485	11	AGGAGG	GENOMAD.177576.VP	2.504e-28	107	0	0	0	2561	Caudoviricetes	NA	NA	PF05322	NINE Protein
+NC_000913.3|provirus_563848_584430_532	573084	573374	291	1	0.533	11	AGGAGG	GENOMAD.038211.VV	1.658e-20	87	0	0	0	2561	Caudoviricetes	NA	NA	PF07102	Putative nuclease YbcO
+NC_000913.3|provirus_563848_584430_533	573371	573733	363	1	0.532	11	AGxAGG/AGGxGG	GENOMAD.154527.VP	2.554e-18	82	0	0	0	2561	Caudoviricetes	NA	NA	PF05866;K01160;COG4570	Holliday junction resolvase RusA (prophage-encoded endonuclease)
+NC_000913.3|provirus_563848_584430_534	573733	573870	138	1	0.478	11	GGA/GAG/AGG	GENOMAD.073918.VV	4.945e-10	54	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_535	573956	574339	384	1	0.430	11	GGAG/GAGG	GENOMAD.054312.VV	3.04e-60	203	0	0	0	2561	Caudoviricetes	NA	NA	PF06576	Phage antitermination protein Q
+NC_000913.3|provirus_563848_584430_536	574481	574699	219	1	0.447	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_537	574737	575717	981	-1	0.550	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_538	575758	576825	1068	-1	0.444	11	GGA/GAG/AGG	GENOMAD.042052.CC	7.284e-09	60	0	0	0	1	NA	NA	NA	PF00267;K10940;COG3203	Outer membrane protein (porin)
+NC_000913.3|provirus_563848_584430_539	577398	577613	216	1	0.477	11	GGAG/GAGG	GENOMAD.208385.VP	5.344e-28	107	0	0	1	2561	Caudoviricetes	NA	NA	PF04971	Bacteriophage P21 holin S
+NC_000913.3|provirus_563848_584430_540	577613	578110	498	1	0.476	11	GGAG/GAGG	GENOMAD.171676.VP	2.772e-28	113	0	0	1	2561	Caudoviricetes	NA	NA	PF00959;COG3772	Phage-related lysozyme (muramidase), GH24 family
+NC_000913.3|provirus_563848_584430_541	578107	578568	462	1	0.513	11	GGxGG	GENOMAD.219285.VP	5.677e-41	149	0	0	0	2561	Caudoviricetes	NA	NA	PF03245	Bacteriophage Rz lysis protein
+NC_000913.3|provirus_563848_584430_542	578600	578893	294	-1	0.422	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_543	579184	579594	411	-1	0.314	11	GGA/GAG/AGG	GENOMAD.227189.VP	1.298e-32	124	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_544	579880	580086	207	1	0.396	11	GGAG/GAGG	GENOMAD.227340.VP	5.416e-34	124	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_545	580834	581379	546	1	0.526	11	GGA/GAG/AGG	GENOMAD.161251.VP	7.238e-77	254	0	0	1	2561	Caudoviricetes	NA	NA	PF07471;K22014;COG4220	Phage DNA packaging protein, Nu1 subunit of terminase
+NC_000913.3|provirus_563848_584430_546	581354	582097	744	1	0.508	11	None	GENOMAD.167268.VP	1.572e-44	164	0	0	1	2561	Caudoviricetes	NA	NA	PF02413	Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_563848_584430_547	582152	582583	432	-1	0.412	11	3Base/5BMM	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_563848_584430_548	582875	583060	186	1	0.495	11	GGA/GAG/AGG	GENOMAD.178075.VP	3.901e-19	81	0	0	1	2561	Caudoviricetes	NA	NA	PF02413	Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_563848_584430_549	583681	584430	750	1	0.317	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1105	1196867	1197532	666	-1	0.350	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1106	1197533	1198228	696	-1	0.310	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1107	1198695	1199588	894	1	0.368	11	GGAG/GAGG	GENOMAD.088167.PP	1.632e-150	473	0	0	0	1	NA	NA	NA	PF10463;COG2856	Peptidase U49
+NC_000913.3|provirus_1196867_1213107_1108	1199679	1200806	1128	-1	0.447	11	GGA/GAG/AGG	GENOMAD.195357.VP	1.34e-89	301	0	0	0	2561	Caudoviricetes	NA	NA	PF09003;K21039	Bacteriophage lambda integrase, Arm DNA-binding domain
+NC_000913.3|provirus_1196867_1213107_1109	1200787	1201032	246	-1	0.435	11	GGA/GAG/AGG	GENOMAD.095038.VV	1.817e-43	152	0	0	0	2561	Caudoviricetes	NA	NA	PF07825	Excisionase-like protein
+NC_000913.3|provirus_1196867_1213107_1110	1201497	1201838	342	1	0.386	11	AGGA	GENOMAD.226053.VP	1.147e-47	166	0	0	0	2561	Caudoviricetes	NA	NA	PF11080;K18840	Endoribonuclease GhoS
+NC_000913.3|provirus_1196867_1213107_1111	1201776	1202084	309	-1	0.469	11	GGAG/GAGG	GENOMAD.226995.VP	1.008e-59	200	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1112	1202259	1202933	675	-1	0.441	11	3Base/5BMM	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1113	1203024	1203224	201	1	0.428	11	GGAGG	GENOMAD.218084.VP	6.055e-32	118	0	0	0	2561	Caudoviricetes	NA	NA	PF15943;COG4197	NA
+NC_000913.3|provirus_1196867_1213107_1114	1203268	1203825	558	1	0.496	11	GGAG/GAGG	GENOMAD.058510.VV	7.507e-87	283	0	0	1	2561	Caudoviricetes	NA	NA	PF06892	Phage regulatory protein CII (CP76)
+NC_000913.3|provirus_1196867_1213107_1115	1203822	1204160	339	1	0.499	11	GGAG/GAGG	GENOMAD.102216.VV	1.096e-55	189	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1116	1204170	1205537	1368	1	0.543	11	GGAG/GAGG	GENOMAD.159591.VP	5.958e-37	149	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1117	1205549	1205731	183	1	0.601	11	GGAG/GAGG	GENOMAD.088953.VV	9.423e-11	57	0	0	0	2561	Caudoviricetes	NA	NA	PF10003	NA
+NC_000913.3|provirus_1196867_1213107_1118	1205731	1206204	474	1	0.563	11	GGAGG	GENOMAD.031947.VV	1.897e-07	52	0	0	1	2561	Caudoviricetes	NA	NA	PF04860;TIGR01537	phage portal protein, HK97 family
+NC_000913.3|provirus_1196867_1213107_1119	1206173	1206922	750	1	0.576	11	None	GENOMAD.110264.VV	3.24e-56	198	0	0	1	2561	Caudoviricetes	NA	NA	PF04865;COG3948	Phage-related baseplate assembly protein
+NC_000913.3|provirus_1196867_1213107_1120	1206913	1207497	585	1	0.573	11	GGA/GAG/AGG	GENOMAD.113504.VP	5.104e-87	284	0	0	1	2561	Caudoviricetes	NA	NA	PF10076;COG3778	Uncharacterized protein YmfQ in lambdoid prophage, DUF2313 family
+NC_000913.3|provirus_1196867_1213107_1121	1207501	1208130	630	1	0.503	11	GGAG/GAGG	GENOMAD.044962.VV	2.458e-85	280	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1122	1208171	1208545	375	1	0.437	11	None	GENOMAD.045203.VV	3.842e-40	145	0	0	1	2561	Caudoviricetes	NA	NA	PF02413	Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_1196867_1213107_1123	1208517	1209119	603	-1	0.476	11	GGAG/GAGG	GENOMAD.140378.VP	8.011e-41	151	0	0	1	2561	Caudoviricetes	NA	NA	PF02413	NA
+NC_000913.3|provirus_1196867_1213107_1124	1209119	1209655	537	-1	0.453	11	AGxAGG/AGGxGG	GENOMAD.191048.VP	2.151e-63	215	0	0	0	2561	Caudoviricetes	NA	NA	COG4675	Microcystin-dependent protein  (function unknown)
+NC_000913.3|provirus_1196867_1213107_1125	1209685	1210239	555	1	0.488	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1126	1210346	1211179	834	1	0.384	11	None	GENOMAD.030786.VV	1.161e-05	49	0	0	0	2561	Caudoviricetes	NA	NA	PF13395	HNH endonuclease
+NC_000913.3|provirus_1196867_1213107_1127	1211413	1211577	165	1	0.467	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1196867_1213107_1128	1212703	1213107	405	-1	0.368	11	AGGA/GGAG/GAGG	GENOMAD.227190.VP	2.116e-26	106	0	0	0	2561	Caudoviricetes	NA	NA	PF07166;COG5562	Prophage-encoded protein YbcV, DUF1398 family
+NC_000913.3|provirus_1412000_1434224_1320	1412000	1413235	1236	-1	0.428	11	None	GENOMAD.159447.VP	2.063e-29	125	0	0	1	2561	Caudoviricetes	NA	NA	PF12167;K14059;TIGR01634;COG4385	phage tail protein, P2 protein I family
+NC_000913.3|provirus_1412000_1434224_1321	1413237	1413452	216	-1	0.454	11	GGAG/GAGG	GENOMAD.114098.VV	1.562e-32	120	0	0	0	2561	Caudoviricetes	NA	NA	PF06806	Putative excisionase (DUF1233)
+NC_000913.3|provirus_1412000_1434224_1322	1413531	1413740	210	-1	0.352	11	GGAGG	GENOMAD.223267.VP	1.749e-30	114	0	0	0	1	NA	NA	NA	PF06688;K19780	NA
+NC_000913.3|provirus_1412000_1434224_1323	1413984	1414793	810	-1	0.472	11	AGGA	GENOMAD.127355.VP	2.712e-58	205	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;TIGR00616;COG3723	recombinase, phage RecT family
+NC_000913.3|provirus_1412000_1434224_1324	1414786	1417386	2601	-1	0.494	11	GGAG/GAGG	GENOMAD.084315.VV	4.036e-74	272	0	0	0	2561	Caudoviricetes	NA	NA	PF06630;K10906	Enterobacterial exodeoxyribonuclease VIII
+NC_000913.3|provirus_1412000_1434224_1325	1417488	1417763	276	-1	0.391	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1326	1417838	1418008	171	-1	0.374	11	GGAG/GAGG	GENOMAD.110847.VV	1.628e-32	119	0	0	0	1	NA	NA	NA	PF04181	NA
+NC_000913.3|provirus_1412000_1434224_1327	1418008	1418229	222	-1	0.410	11	GGAG/GAGG	GENOMAD.074955.VV	1.258e-35	129	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1328	1418548	1419159	612	1	0.395	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1329	1419156	1419311	156	-1	0.481	11	GGA/GAG/AGG	GENOMAD.222124.VP	1.495e-23	93	0	0	0	2561	Caudoviricetes	NA	NA	PF07151	NA
+NC_000913.3|provirus_1412000_1434224_1330	1419322	1419456	135	-1	0.474	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1331	1419765	1420241	477	-1	0.419	11	AGGAG/GGAGG	GENOMAD.115833.VV	4.047e-72	239	0	0	0	2561	Caudoviricetes	NA	NA	PF00376;COG5606;TIGR00673;K10123	MerR family regulatory protein
+NC_000913.3|provirus_1412000_1434224_1332	1420365	1420661	297	1	0.434	11	GGAG/GAGG	GENOMAD.054651.VV	1.154e-09	56	0	0	0	2561	Caudoviricetes	NA	NA	PF15943;COG4197	DNA-binding transcriptional regulator YdaS, prophage-encoded, Cro superfamily
+NC_000913.3|provirus_1412000_1434224_1333	1420684	1421106	423	1	0.508	11	GGAG/GAGG	GENOMAD.072359.VV	8.614e-72	237	0	0	0	2561	Caudoviricetes	NA	NA	PF06254	Putative bacterial toxin ydaT
+NC_000913.3|provirus_1412000_1434224_1334	1421119	1421976	858	1	0.479	11	None	GENOMAD.195765.VP	5.5e-122	390	0	0	0	2561	Caudoviricetes	NA	NA	PF07120;COG3756	Uncharacterized conserved protein YdaU, DUF1376 family
+NC_000913.3|provirus_1412000_1434224_1335	1421983	1422729	747	1	0.527	11	AGxAGG/AGGxGG	GENOMAD.047125.VV	5.612e-10	62	0	0	1	2561	Caudoviricetes	NA	NA	PF16463;COG5437;TIGR02126	Phage tail tube protein family
+NC_000913.3|provirus_1412000_1434224_1336	1422752	1423312	561	1	0.488	11	GGAG/GAGG	GENOMAD.144793.VV	5.225e-30	119	0	0	0	1	NA	NA	NA	PF07789	NA
+NC_000913.3|provirus_1412000_1434224_1337	1423345	1423644	300	1	0.533	11	GGA/GAG/AGG	GENOMAD.219285.VP	4.845e-42	149	0	0	0	2561	Caudoviricetes	NA	NA	PF03245	Bacteriophage Rz lysis protein
+NC_000913.3|provirus_1412000_1434224_1338	1423815	1425239	1425	1	0.382	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1339	1425377	1425640	264	1	0.481	11	GGA/GAG/AGG	GENOMAD.159709.VV	5.097e-06	45	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1340	1425621	1425980	360	1	0.472	11	None	GENOMAD.109865.VV	7.702e-05	43	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1341	1426454	1427482	1029	1	0.468	11	AGGAG	GENOMAD.120741.VP	1.03e-151	479	0	0	1	2561	Caudoviricetes	NA	NA	COG5281	Phage-related minor tail protein
+NC_000913.3|provirus_1412000_1434224_1342	1427482	1427613	132	1	0.553	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1343	1427746	1428726	981	-1	0.555	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1344	1429049	1432411	3363	1	0.533	11	None	GENOMAD.020617.VV	5.058e-116	406	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1345	1432411	1432986	576	1	0.481	11	GGAG/GAGG	GENOMAD.167268.VP	3.58e-55	192	0	0	1	2561	Caudoviricetes	NA	NA	PF02413	Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_1412000_1434224_1346	1433084	1433674	591	-1	0.448	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1412000_1434224_1347	1433991	1434224	234	-1	0.359	11	AGGA	GENOMAD.221767.PV	3.984e-26	102	0	0	0	1	NA	NA	NA	PF10965	Biofilm development protein YmgB/AriR
+NC_000913.3|provirus_1627517_1653915_1513	1627517	1628263	747	1	0.506	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1514	1628352	1629038	687	1	0.501	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1515	1629215	1629418	204	1	0.520	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1516	1629453	1630913	1461	-1	0.494	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1517	1631002	1632285	1284	-1	0.469	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1518	1633072	1633305	234	1	0.355	11	AGGA	GENOMAD.221767.PV	3.984e-26	102	0	0	0	1	NA	NA	NA	PF10965	Biofilm development protein YmgB/AriR
+NC_000913.3|provirus_1627517_1653915_1519	1633622	1634212	591	1	0.448	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1520	1634310	1634885	576	-1	0.479	11	GGAG/GAGG	GENOMAD.167268.VP	3.58e-55	192	0	0	1	2561	Caudoviricetes	NA	NA	PF02413	Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_1627517_1653915_1521	1634885	1635847	963	-1	0.526	11	None	GENOMAD.211480.VP	3.667e-69	239	0	0	0	2561	Caudoviricetes	NA	NA	COG5301	Phage-related tail fibre protein
+NC_000913.3|provirus_1627517_1653915_1522	1635798	1636367	570	-1	0.537	11	GGA/GAG/AGG	GENOMAD.161251.VP	1.255e-74	248	0	0	1	2561	Caudoviricetes	NA	NA	PF07471;K22014;COG4220	Phage DNA packaging protein, Nu1 subunit of terminase
+NC_000913.3|provirus_1627517_1653915_1523	1637047	1637457	411	1	0.316	11	GGA/GAG/AGG	GENOMAD.227189.VP	1.298e-32	124	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1524	1637609	1637782	174	-1	0.299	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1525	1638455	1638667	213	-1	0.404	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1526	1639030	1639527	498	-1	0.458	11	GGA/GAG/AGG	GENOMAD.062288.VV	1.369e-70	235	0	0	0	2561	Caudoviricetes	NA	NA	PF10721	NA
+NC_000913.3|provirus_1627517_1653915_1527	1639524	1640057	534	-1	0.506	11	None	GENOMAD.171676.VP	8.945e-29	115	0	0	1	2561	Caudoviricetes	NA	NA	PF00959;COG3772	Phage-related lysozyme (muramidase), GH24 family
+NC_000913.3|provirus_1627517_1653915_1528	1640054	1640365	312	-1	0.439	11	AGGAG	GENOMAD.225519.VP	1.173e-50	174	0	0	0	1	NA	NA	NA	PF07041	NA
+NC_000913.3|provirus_1627517_1653915_1529	1640370	1640576	207	-1	0.473	11	AGGA	GENOMAD.208385.VP	5.126e-27	104	0	0	1	2561	Caudoviricetes	NA	NA	PF04971	Bacteriophage P21 holin S
+NC_000913.3|provirus_1627517_1653915_1530	1640618	1640737	120	1	0.342	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1531	1641339	1641554	216	-1	0.356	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1532	1641855	1642067	213	1	0.484	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1533	1642489	1643241	753	-1	0.481	11	GGAG/GAGG	GENOMAD.136613.VP	1.109e-26	112	0	0	0	2561	Caudoviricetes	NA	NA	PF03589;TIGR02642	Antitermination protein
+NC_000913.3|provirus_1627517_1653915_1534	1643255	1644304	1050	-1	0.521	11	GGAGG	GENOMAD.196019.VP	1.481e-50	186	0	0	0	2561	Caudoviricetes	NA	NA	PF06147	dATP/dGTP pyrophosphohydrolase
+NC_000913.3|provirus_1627517_1653915_1535	1644651	1644902	252	-1	0.409	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1536	1645119	1645274	156	-1	0.519	11	AGGAG	GENOMAD.136858.PV	7.473e-23	91	0	0	0	2561	Caudoviricetes	NA	NA	PF01848;K18919	Hok/gef family
+NC_000913.3|provirus_1627517_1653915_1537	1645346	1645633	288	-1	0.469	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1538	1645633	1645872	240	-1	0.471	11	GGAG/GAGG	GENOMAD.151401.PV	4.39e-26	102	0	0	0	1	NA	NA	NA	PF04221;TIGR02384;COG3077;K07473	addiction module antitoxin, RelB/DinJ family
+NC_000913.3|provirus_1627517_1653915_1539	1646405	1646737	333	1	0.429	11	AGGAG	GENOMAD.078672.PP	6.68e-60	201	0	0	0	1	NA	NA	NA	PF14282	FlxA-like protein
+NC_000913.3|provirus_1627517_1653915_1540	1647122	1647349	228	-1	0.421	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1541	1647346	1647636	291	-1	0.505	11	GGxGG	GENOMAD.150946.VV	3.745e-51	175	0	0	0	1	NA	NA	NA	PF06254	Putative bacterial toxin ydaT
+NC_000913.3|provirus_1627517_1653915_1542	1647620	1647850	231	-1	0.459	11	GGA/GAG/AGG	GENOMAD.108381.VV	1.622e-34	126	0	0	0	2561	Caudoviricetes	NA	NA	K22302	NA
+NC_000913.3|provirus_1627517_1653915_1543	1647934	1648341	408	1	0.436	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1544	1648508	1648663	156	1	0.481	11	GGAG/GAGG	GENOMAD.222124.VP	6.689e-24	94	0	0	0	2561	Caudoviricetes	NA	NA	PF07151	NA
+NC_000913.3|provirus_1627517_1653915_1545	1648665	1648793	129	1	0.465	11	GGA/GAG/AGG	GENOMAD.136713.VV	1.3e-20	84	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1546	1648823	1649041	219	1	0.479	11	GGAG/GAGG	GENOMAD.180239.VV	1.159e-43	152	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1547	1649045	1649209	165	-1	0.509	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1548	1649609	1649797	189	1	0.360	11	GGAG/GAGG	GENOMAD.189052.VV	3.595e-35	127	0	0	0	2561	Caudoviricetes	NA	NA	PF05358;K22304	DicB protein
+NC_000913.3|provirus_1627517_1653915_1549	1649794	1649985	192	1	0.432	11	AGGA	GENOMAD.094923.VV	7.175e-29	109	0	0	0	2561	Caudoviricetes	NA	NA	PF07358	NA
+NC_000913.3|provirus_1627517_1653915_1550	1650078	1650998	921	1	0.497	11	GGAG/GAGG	GENOMAD.075680.VV	3.9e-07	54	0	0	0	2561	Caudoviricetes	NA	NA	K10906	NA
+NC_000913.3|provirus_1627517_1653915_1551	1650995	1651537	543	1	0.541	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1552	1651512	1652708	1197	1	0.422	11	None	GENOMAD.099267.VV	1.899e-19	94	0	0	0	2561	Caudoviricetes	NA	NA	PF00589;TIGR02224;COG4973;K03733	tyrosine recombinase XerC
+NC_000913.3|provirus_1627517_1653915_1553	1652728	1652838	111	-1	0.414	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_1627517_1653915_1554	1652896	1653915	1020	-1	0.449	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2313	2461306	2462646	1341	1	0.498	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2314	2463012	2464070	1059	1	0.355	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2315	2464252	2465007	756	-1	0.519	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2316	2465301	2466233	933	1	0.486	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2317	2466545	2467702	1158	1	0.478	11	GGA/GAG/AGG	GENOMAD.064492.VV	0.0007762	44	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2318	2468214	2469134	921	1	0.395	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2319	2469131	2470462	1332	1	0.276	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2320	2470803	2471105	303	1	0.545	11	GGA/GAG/AGG	GENOMAD.167268.VP	2.711e-17	78	0	0	1	2561	Caudoviricetes	NA	NA	PF02413	Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_2461306_2476510_2321	2471077	2471517	441	-1	0.454	11	GGAG/GAGG	GENOMAD.045203.VV	2.366e-80	262	0	0	1	2561	Caudoviricetes	NA	NA	PF02413	Caudovirales tail fibre assembly protein, lambda gpK
+NC_000913.3|provirus_2461306_2476510_2322	2471544	2472146	603	-1	0.509	11	GGAG/GAGG	GENOMAD.044962.VV	4.611e-91	296	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2323	2472112	2472387	276	-1	0.518	11	GGxGG	GENOMAD.178309.VP	1.935e-09	55	0	0	0	2561	Caudoviricetes	NA	NA	PF05869;TIGR01712	phage N-6-adenine-methyltransferase
+NC_000913.3|provirus_2461306_2476510_2324	2472387	2472881	495	-1	0.545	11	AGGA	GENOMAD.225234.VP	1.741e-67	226	0	0	0	2561	Caudoviricetes	NA	NA	PF06069	PerC transcriptional activator
+NC_000913.3|provirus_2461306_2476510_2325	2472878	2473246	369	-1	0.556	11	GGA/GAG/AGG	GENOMAD.086968.VV	4.891e-69	228	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2326	2473604	2473966	363	1	0.501	11	AGGAG	GENOMAD.056235.VV	4.359e-53	182	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2327	2474032	2474856	825	1	0.457	11	GGAG/GAGG	GENOMAD.052651.VV	8.505e-66	227	0	0	0	2561	Caudoviricetes	NA	NA	PF10065;COG5532	Uncharacterized conserved protein YfdQ, DUF2303 family
+NC_000913.3|provirus_2461306_2476510_2328	2474984	2475520	537	1	0.462	11	GGAG/GAGG	GENOMAD.172054.VC	5.137e-36	136	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2329	2475511	2475873	363	1	0.471	11	GGAG/GAGG	GENOMAD.067358.VV	4.901e-68	225	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2330	2475873	2476178	306	1	0.428	11	GGAGG	GENOMAD.222350.VP	2.161e-43	153	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_000913.3|provirus_2461306_2476510_2331	2476310	2476510	201	1	0.438	11	GGAG/GAGG	GENOMAD.195460.VP	1.864e-28	108	0	0	0	2561	Caudoviricetes	NA	NA	COG2452	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_002737.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,172 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_002737.2|provirus_529627_569283_517	529627	531042	1416	-1	0.322	11	GGAG/GAGG	GENOMAD.022372.VV	6.087e-23	106	0	0	1	2561	Caudoviricetes	NA	NA	PF04708;COG1961;K14060	Site-specific DNA recombinase related to the DNA invertase Pin
+NC_002737.2|provirus_529627_569283_518	531163	531528	366	-1	0.333	11	GGAG/GAGG	GENOMAD.142683.VV	5.916e-18	81	0	0	0	2561	Caudoviricetes	NA	NA	PF11446;TIGR04165;COG4888	Cys-rich peptide, TIGR04165 family
+NC_002737.2|provirus_529627_569283_519	531555	532316	762	-1	0.329	11	AGGA	GENOMAD.108504.VP	7.914e-35	136	0	0	0	2561	Caudoviricetes	NA	NA	PF05866;PF00717;COG4570;TIGR02754	Endodeoxyribonuclease RusA; Peptidase S24-like
+NC_002737.2|provirus_529627_569283_520	532500	532730	231	1	0.372	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_521	532799	532936	138	1	0.326	11	GGAG/GAGG	GENOMAD.061610.VV	0.0002144	38	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_522	532938	533063	126	1	0.302	11	AGGAG	GENOMAD.129654.VV	6.909e-19	79	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_523	533060	533287	228	1	0.320	11	GGA/GAG/AGG	GENOMAD.108243.VV	1.543e-34	126	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_524	533287	534606	1320	1	0.385	11	GGAG/GAGG	GENOMAD.010825.VV	1.953e-201	628	0	0	0	2561	Caudoviricetes	NA	NA	PF13175;TIGR00634;COG4717;K03546	DNA repair protein RecN
+NC_002737.2|provirus_529627_569283_525	534621	535712	1092	1	0.444	11	GGAG/GAGG	GENOMAD.141036.VV	6.091e-73	252	0	0	1	2561	Caudoviricetes	NA	NA	PF13479;TIGR01618;K04484;COG0468	phage nucleotide-binding protein
+NC_002737.2|provirus_529627_569283_526	535752	536174	423	1	0.383	11	AGGA/GGAG/GAGG	GENOMAD.092954.VV	1.157e-35	133	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_527	536176	536910	735	1	0.351	11	AGGA	GENOMAD.014438.VV	4.323e-50	180	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_528	536932	537567	636	1	0.410	11	AGGAG	GENOMAD.005320.VV	5.429e-31	123	0	0	0	2561	Caudoviricetes	NA	NA	PF05037	NA
+NC_002737.2|provirus_529627_569283_529	537567	539150	1584	1	0.411	11	GGAGG	GENOMAD.030980.VV	1.795e-05	50	0	0	0	2561	Caudoviricetes	NA	NA	PF04851;PF17338;K17677;TIGR00614;COG1061	Type III restriction enzyme, res subunit; Gene product 88
+NC_002737.2|provirus_529627_569283_530	539160	539789	630	1	0.314	11	AGGAG	GENOMAD.116271.VP	3.678e-24	103	0	0	0	2561	Caudoviricetes	NA	NA	PF07768	PVL ORF-50-like family
+NC_002737.2|provirus_529627_569283_531	539779	542052	2274	1	0.395	11	GGA/GAG/AGG	GENOMAD.168744.VP	3.155e-85	303	0	0	0	2561	Caudoviricetes	NA	NA	K07505	NA
+NC_002737.2|provirus_529627_569283_532	542330	542548	219	1	0.292	11	GGAG/GAGG	GENOMAD.004447.VV	1.326e-12	63	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_533	542541	542936	396	1	0.419	11	GGA/GAG/AGG	GENOMAD.028440.VV	8.304e-68	225	0	0	0	2561	Caudoviricetes	NA	NA	PF05866;COG4570;K01160	Holliday junction resolvase RusA (prophage-encoded endonuclease)
+NC_002737.2|provirus_529627_569283_534	542933	543154	222	1	0.365	11	AGxAGG/AGGxGG	GENOMAD.053518.VV	3.344e-41	145	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_535	543157	543429	273	1	0.418	11	GGAGG	GENOMAD.072347.VV	1.269e-43	153	0	0	0	2561	Caudoviricetes	NA	NA	TIGR02209	NA
+NC_002737.2|provirus_529627_569283_536	543431	544066	636	1	0.358	11	GGAGG	GENOMAD.138295.VP	1.141e-77	258	0	0	0	2561	Caudoviricetes	NA	NA	TIGR02987;COG0827	NA
+NC_002737.2|provirus_529627_569283_537	544339	544773	435	1	0.418	11	GGAGG	GENOMAD.111673.VV	1.324e-85	277	0	0	0	2561	Caudoviricetes	NA	NA	PF05263;TIGR01637	phage transcriptional regulator, ArpU family
+NC_002737.2|provirus_529627_569283_538	545083	546249	1167	1	0.373	11	AGGA	GENOMAD.038338.VV	1.175e-46	176	0	0	0	2561	Caudoviricetes	NA	NA	COG3392	NA
+NC_002737.2|provirus_529627_569283_539	546592	547068	477	1	0.449	11	AGGA	GENOMAD.003239.VV	1.762e-30	119	0	0	1	2561	Caudoviricetes	NA	NA	PF05133;TIGR01538	phage portal protein, SPP1 family
+NC_002737.2|provirus_529627_569283_540	547151	548362	1212	1	0.412	11	GGA/GAG/AGG	GENOMAD.064889.VV	5.208e-172	541	0	0	1	2561	Caudoviricetes	NA	NA	PF04466;PF17288;TIGR01547;COG1783;K06909	phage terminase, large subunit, PBSX family
+NC_002737.2|provirus_529627_569283_541	548376	549878	1503	1	0.409	11	AGGAG	GENOMAD.003916.VV	9.779e-91	310	0	0	1	2561	Caudoviricetes	NA	NA	PF05133;TIGR01542	phage portal protein, putative, A118 family
+NC_002737.2|provirus_529627_569283_542	549883	551376	1494	1	0.396	11	GGAG/GAGG	GENOMAD.063181.VV	1.974e-184	582	0	0	1	2561	Caudoviricetes	NA	NA	PF06152;TIGR01641	Phage minor capsid protein 2
+NC_002737.2|provirus_529627_569283_543	551376	551603	228	1	0.303	11	GGAGG	GENOMAD.148778.VV	3.696e-41	145	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_544	551690	551956	267	1	0.363	11	AGGAG	GENOMAD.076597.VV	2.091e-45	158	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_545	552088	552696	609	1	0.399	11	AGGAG	GENOMAD.041104.VV	8.665e-41	151	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_546	552700	553518	819	1	0.435	11	AGGA	GENOMAD.013974.VV	8.477e-55	195	0	0	1	2561	Caudoviricetes	NA	NA	PF20036;TIGR04387	major capsid protein, N4-gp56 family
+NC_002737.2|provirus_529627_569283_547	553572	553988	417	1	0.396	11	GGA/GAG/AGG	GENOMAD.034545.VV	3.007e-49	172	0	0	0	2561	Caudoviricetes	NA	NA	PF11436	NA
+NC_002737.2|provirus_529627_569283_548	553978	554310	333	1	0.393	11	None	GENOMAD.114565.VV	2.724e-37	136	0	0	1	2561	Caudoviricetes	NA	NA	PF10665	Minor capsid protein
+NC_002737.2|provirus_529627_569283_549	554310	554666	357	1	0.440	11	GGAGG	GENOMAD.008261.VV	1.315e-48	169	0	0	1	2561	Caudoviricetes	NA	NA	PF11114	Minor capsid protein
+NC_002737.2|provirus_529627_569283_550	554663	555061	399	1	0.363	11	GGA/GAG/AGG	GENOMAD.034546.VV	2.354e-24	100	0	0	1	2561	Caudoviricetes	NA	NA	PF12691	Bacteriophage minor capsid protein
+NC_002737.2|provirus_529627_569283_551	555061	555531	471	1	0.425	11	AGxAGG/AGGxGG	GENOMAD.028171.VV	1.557e-56	194	0	0	1	2561	Caudoviricetes	NA	NA	PF16461;COG5437	Lambda phage tail tube protein, TTP
+NC_002737.2|provirus_529627_569283_552	555584	556018	435	1	0.393	11	AGGAG	GENOMAD.064813.VV	7.473e-34	128	0	0	1	2561	Caudoviricetes	NA	NA	PF10666	Phage tail assembly chaperone protein Gp14 ()A118
+NC_002737.2|provirus_529627_569283_553	556022	556603	582	1	0.376	11	AGGAG	GENOMAD.013935.VV	5.591e-51	180	0	0	0	2561	Caudoviricetes	NA	NA	PF06854	Bacteriophage Gp15 protein
+NC_002737.2|provirus_529627_569283_554	556593	559853	3261	1	0.431	11	AGGAG	GENOMAD.002456.VV	1.364e-297	940	0	0	1	2561	Caudoviricetes	NA	NA	COG3941	NA
+NC_002737.2|provirus_529627_569283_555	559850	560566	717	1	0.389	11	GGA/GAG/AGG	GENOMAD.006390.VV	2.824e-80	267	0	0	0	2561	Caudoviricetes	NA	NA	PF20195;COG4722;TIGR01633	Phage-related protein
+NC_002737.2|provirus_529627_569283_556	560563	562707	2145	1	0.422	11	None	GENOMAD.049306.VV	0.0	1000	0	0	0	2561	Caudoviricetes	NA	NA	COG4926	Phage-related protein
+NC_002737.2|provirus_529627_569283_557	562704	563717	1014	1	0.438	11	GGAGG	GENOMAD.093524.VV	3.153e-136	434	0	0	0	2561	Caudoviricetes	NA	NA	PF07212	Hyaluronidase protein (HylP)
+NC_002737.2|provirus_529627_569283_558	563732	565618	1887	1	0.449	11	AGGAG	GENOMAD.033709.VV	0.0	1088	0	0	0	2561	Caudoviricetes	NA	NA	PF07902	gp58-like protein
+NC_002737.2|provirus_529627_569283_559	565630	566061	432	1	0.354	11	AGGAG	GENOMAD.073534.VV	4.564e-80	261	0	0	0	2561	Caudoviricetes	NA	NA	PF07761	NA
+NC_002737.2|provirus_529627_569283_560	566064	566681	618	1	0.430	11	AGGAG	GENOMAD.024672.VV	8.84e-112	356	0	0	0	2561	Caudoviricetes	NA	NA	PF07104	NA
+NC_002737.2|provirus_529627_569283_561	566691	566966	276	1	0.348	11	GGAG/GAGG	GENOMAD.039653.VV	9.653e-09	53	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_562	566963	567190	228	1	0.390	11	AGGAG	GENOMAD.126098.VV	2.718e-14	68	0	0	0	2561	Caudoviricetes	NA	NA	COG5546	NA
+NC_002737.2|provirus_529627_569283_563	567199	567309	111	1	0.387	11	AGGAG	GENOMAD.102275.VV	5.331e-12	59	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_564	567306	568508	1203	1	0.446	11	AGGAG	GENOMAD.133734.VP	7.911e-45	171	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_529627_569283_565	568576	569283	708	-1	0.284	11	AGGAG	GENOMAD.223462.VP	3.741e-24	104	0	0	0	2561	Caudoviricetes	NA	NA	PF02876;PF01123;K11040	Staphylococcal/Streptococcal toxin, beta-grasp domain; Staphylococcal/Streptococcal toxin, OB-fold domain
+NC_002737.2|provirus_777501_820593_756	777501	778541	1041	1	0.404	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_757	778635	779774	1140	-1	0.389	11	GGAG/GAGG	GENOMAD.111131.VV	7.217e-08	57	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_758	780028	780837	810	-1	0.344	11	AGGAG	GENOMAD.221704.VP	7.412e-31	125	0	0	0	2561	Caudoviricetes	NA	NA	PF02452;COG3692;K18841	Uncharacterized protein YifN, PemK superfamily
+NC_002737.2|provirus_777501_820593_759	780850	781596	747	-1	0.395	11	AGGAG	GENOMAD.179094.VV	4.977e-08	56	0	0	0	2561	Caudoviricetes	NA	NA	PF08667;COG1974;K18830;TIGR02612	SOS-response transcriptional repressor LexA (RecA-mediated autopeptidase)
+NC_002737.2|provirus_777501_820593_760	781786	781944	159	1	0.358	11	AGGAG	GENOMAD.097925.VV	1.016e-27	105	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_761	781978	782145	168	1	0.256	11	AGGAG	GENOMAD.116752.VV	1.286e-19	82	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_762	782123	782962	840	-1	0.295	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_763	783080	783307	228	-1	0.346	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_764	783381	783587	207	1	0.382	11	AGGAG	GENOMAD.223061.VP	0.0006542	38	0	0	0	2561	Caudoviricetes	NA	NA	PF06892;COG5606;TIGR00673;K07727	Predicted DNA-binding protein, XRE-type HTH domain
+NC_002737.2|provirus_777501_820593_765	783627	784355	729	1	0.401	11	GGA/GAG/AGG	GENOMAD.133073.VP	1.055e-36	141	0	0	0	2561	Caudoviricetes	NA	NA	PF03374;COG3645	Phage antirepressor protein YoqD, KilAC domain
+NC_002737.2|provirus_777501_820593_766	784387	784653	267	1	0.356	11	GGAG/GAGG	GENOMAD.133830.VV	1.414e-41	147	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_767	784588	785394	807	-1	0.369	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_768	785536	785772	237	-1	0.350	11	None	GENOMAD.153962.VV	1.274e-45	158	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_769	785983	786222	240	1	0.363	11	None	GENOMAD.050216.VV	1.824e-42	149	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_770	786224	786409	186	1	0.371	11	AGGAG	GENOMAD.105558.VV	2.903e-29	110	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_771	786509	786748	240	1	0.342	11	GGA/GAG/AGG	GENOMAD.136142.VP	7.591e-36	130	0	0	0	2561	Caudoviricetes	NA	NA	PF13730;TIGR00373;COG4738;K07721	transcription factor E
+NC_002737.2|provirus_777501_820593_772	786892	787278	387	1	0.367	11	AGGAG	GENOMAD.198321.CP	4.29e-06	47	0	0	0	2561	Caudoviricetes	NA	NA	PF07261;COG3611;TIGR04548;K02086	Replication initiation and membrane attachment protein DnaB
+NC_002737.2|provirus_777501_820593_773	787259	787492	234	1	0.355	11	None	GENOMAD.100896.VV	1.121e-38	138	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_774	787489	787629	141	1	0.404	11	AGGAG	GENOMAD.079484.VV	1.722e-06	44	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_775	787638	787844	207	1	0.435	11	AGGAG	GENOMAD.114751.VV	3.555e-38	136	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_776	787900	788229	330	1	0.333	11	GGAG/GAGG	GENOMAD.040347.VV	1.569e-42	151	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_777	788232	789023	792	1	0.398	11	GGAGG	GENOMAD.177891.VP	2.824e-31	126	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;TIGR01913;COG3723	phage recombination protein Bet
+NC_002737.2|provirus_777501_820593_778	789033	789698	666	1	0.399	11	AGGAG	GENOMAD.012371.VV	4.137e-128	404	0	0	0	2561	Caudoviricetes	NA	NA	PF07083	NA
+NC_002737.2|provirus_777501_820593_779	789702	790061	360	1	0.408	11	None	GENOMAD.012371.VV	7.592e-55	187	0	0	0	2561	Caudoviricetes	NA	NA	PF07083	NA
+NC_002737.2|provirus_777501_820593_780	790257	790595	339	1	0.354	11	GGA/GAG/AGG	GENOMAD.060064.VV	3.644e-11	61	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_781	790592	791104	513	1	0.382	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_782	791091	791285	195	1	0.385	11	GGA/GAG/AGG	GENOMAD.100776.VV	1.514e-29	111	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_783	791282	791527	246	1	0.374	11	GGAG/GAGG	GENOMAD.105486.VP	3.33e-22	91	0	0	0	2561	Caudoviricetes	NA	NA	PF09643;TIGR01671	phage uncharacterized protein TIGR01671
+NC_002737.2|provirus_777501_820593_784	791579	792040	462	1	0.383	11	AGGAG	GENOMAD.003865.VV	3.718e-37	138	0	0	1	2561	Caudoviricetes	NA	NA	PF11753;PF07852	Protein of unknwon function (DUF3310)
+NC_002737.2|provirus_777501_820593_785	792037	792207	171	1	0.333	11	GGAG/GAGG	GENOMAD.094280.VV	2.018e-30	113	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_786	792490	792930	441	1	0.399	11	None	GENOMAD.111673.VV	9.888e-90	289	0	0	0	2561	Caudoviricetes	NA	NA	PF05263;TIGR01637	phage transcriptional regulator, ArpU family
+NC_002737.2|provirus_777501_820593_787	793076	793279	204	1	0.338	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_788	793245	794159	915	1	0.286	11	GGAG/GAGG	GENOMAD.141545.VV	2.021e-203	626	0	0	0	1	NA	NA	NA	PF20505	Intracellular sensor of Lambda phage, Abi component
+NC_002737.2|provirus_777501_820593_789	794178	794639	462	1	0.266	11	GGAG/GAGG	GENOMAD.146805.VV	3.296e-80	262	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_790	794667	795149	483	1	0.393	11	None	GENOMAD.168355.VP	1.714e-11	64	0	0	1	2561	Caudoviricetes	NA	NA	PF03592;COG3728;K07474	Phage terminase, small subunit
+NC_002737.2|provirus_777501_820593_791	795127	796416	1290	1	0.384	11	None	GENOMAD.100877.VP	2.658e-56	206	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_792	796428	796790	363	1	0.413	11	AGGA	GENOMAD.033166.VV	2.201e-68	226	0	0	1	2561	Caudoviricetes	NA	NA	PF05133;TIGR01538	phage portal protein, SPP1 family
+NC_002737.2|provirus_777501_820593_793	796902	797930	1029	1	0.421	11	None	GENOMAD.100877.VP	9.441e-55	198	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_794	797911	799536	1626	1	0.381	11	GGAG/GAGG	GENOMAD.004769.VV	9.122e-66	238	0	0	1	2561	Caudoviricetes	NA	NA	PF04233;COG5585;TIGR01641	NAD+--asparagine ADP-ribosyltransferase
+NC_002737.2|provirus_777501_820593_795	799527	799706	180	1	0.344	11	AGGAG	GENOMAD.137178.VV	6.881e-35	126	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_796	799766	800035	270	1	0.363	11	AGGAG	GENOMAD.076597.VV	2.432e-44	155	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_797	800125	800295	171	1	0.357	11	None	GENOMAD.179672.VV	0.0001663	39	0	0	0	2561	Caudoviricetes	NA	NA	PF16777;COG4453;TIGR04563	Transcriptional regulator, RHH-like, CopG
+NC_002737.2|provirus_777501_820593_798	800424	800672	249	1	0.349	11	AGGAG	GENOMAD.106940.VV	2.117e-42	149	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_799	800674	801420	747	1	0.386	11	GGA/GAG/AGG	GENOMAD.024598.VV	2.917e-13	72	0	0	0	2561	Caudoviricetes	NA	NA	COG3617	Prophage antirepressor
+NC_002737.2|provirus_777501_820593_800	801532	802065	534	1	0.419	11	AGGAG	GENOMAD.010937.VV	1.418e-32	126	0	0	0	2561	Caudoviricetes	NA	NA	PF14265	NA
+NC_002737.2|provirus_777501_820593_801	802075	802455	381	1	0.365	11	AGGAG	GENOMAD.010435.VV	1.932e-15	74	0	0	0	2561	Caudoviricetes	NA	NA	PF02924	NA
+NC_002737.2|provirus_777501_820593_802	802458	803507	1050	1	0.416	11	AGGAG	GENOMAD.004151.VV	1.227e-66	233	0	0	1	2561	Caudoviricetes	NA	NA	PF03864	Phage major capsid protein E
+NC_002737.2|provirus_777501_820593_803	803519	803785	267	1	0.378	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_804	803797	804150	354	1	0.379	11	GGAGG	GENOMAD.020971.VV	2.807e-56	191	0	0	0	2561	Caudoviricetes	NA	NA	PF11436;TIGR01560	NA
+NC_002737.2|provirus_777501_820593_805	804147	804455	309	1	0.392	11	AGxAGG/AGGxGG	GENOMAD.042575.VV	1.017e-43	154	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_806	804436	804801	366	1	0.385	11	GGA/GAG/AGG	GENOMAD.011013.VV	8.24e-39	141	0	0	1	2561	Caudoviricetes	NA	NA	PF11114;TIGR01725;COG5005	phage protein, HK97 gp10 family
+NC_002737.2|provirus_777501_820593_807	804798	805187	390	1	0.369	11	GGAGG	GENOMAD.023411.VV	1.013e-64	216	0	0	1	2561	Caudoviricetes	NA	NA	PF16807	NA
+NC_002737.2|provirus_777501_820593_808	805197	805850	654	1	0.381	11	AGGAG	GENOMAD.018762.VV	2.107e-36	139	0	0	1	2561	Caudoviricetes	NA	NA	TIGR02126;COG5437	phage major tail protein, TP901-1 family
+NC_002737.2|provirus_777501_820593_809	805910	806263	354	1	0.381	11	AGGAG	GENOMAD.019874.VV	2.516e-25	102	0	0	1	2561	Caudoviricetes	NA	NA	PF12363	Phage tail assembly chaperone protein, TAC
+NC_002737.2|provirus_777501_820593_810	806305	806634	330	1	0.345	11	None	GENOMAD.025799.VV	5.349e-22	92	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_811	806649	810284	3636	1	0.436	11	AGGAG	GENOMAD.013432.VV	0.0	1205	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_812	810317	811096	780	1	0.354	11	AGGA	GENOMAD.016670.VV	7.839e-14	74	0	0	0	2561	Caudoviricetes	NA	NA	PF20195;TIGR01633;COG4722	putative phage tail component, N-terminal domain
+NC_002737.2|provirus_777501_820593_813	811093	813141	2049	1	0.421	11	GGAG/GAGG	GENOMAD.130674.VP	5.583e-216	683	0	0	0	2561	Caudoviricetes	NA	NA	COG4926	Phage-related protein
+NC_002737.2|provirus_777501_820593_814	813141	814259	1119	1	0.417	11	GGAGG	GENOMAD.093524.VV	4.112e-132	424	0	0	0	2561	Caudoviricetes	NA	NA	PF07212	Hyaluronidase protein (HylP)
+NC_002737.2|provirus_777501_820593_815	814272	816182	1911	1	0.428	11	AGGAG	GENOMAD.033709.VV	1.037e-307	946	0	0	0	2561	Caudoviricetes	NA	NA	PF07902	gp58-like protein
+NC_002737.2|provirus_777501_820593_816	816196	816357	162	1	0.321	11	AGGAG	GENOMAD.181912.VC	1.836e-15	70	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_817	816360	816971	612	1	0.420	11	AGxAGG/AGGxGG	GENOMAD.024672.VV	4.154e-119	377	0	0	0	2561	Caudoviricetes	NA	NA	PF07104	NA
+NC_002737.2|provirus_777501_820593_818	816982	817278	297	1	0.377	11	GGAG/GAGG	GENOMAD.084276.VV	2.759e-55	187	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_819	817275	817460	186	1	0.376	11	AGGAG	GENOMAD.004934.VV	1.248e-22	91	0	0	1	2561	Caudoviricetes	NA	NA	PF16945	Putative lactococcus lactis phage r1t holin
+NC_002737.2|provirus_777501_820593_820	817464	817571	108	1	0.352	11	GGAG/GAGG	GENOMAD.102275.VV	1.131e-11	58	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_777501_820593_821	817572	818906	1335	1	0.383	11	AGGAG	GENOMAD.006162.VV	6.011e-104	346	0	0	0	2561	Caudoviricetes	NA	NA	K07273;COG3757	Lyzozyme M1 (1,4-beta-N-acetylmuramidase), GH25 family
+NC_002737.2|provirus_777501_820593_822	819180	819857	678	1	0.296	11	None	GENOMAD.223611.VP	2.952e-108	347	0	0	0	2561	Caudoviricetes	NA	NA	PF02876;PF01123;K11040	Staphylococcal/Streptococcal toxin, beta-grasp domain; Staphylococcal/Streptococcal toxin, OB-fold domain
+NC_002737.2|provirus_777501_820593_823	819883	820593	711	1	0.301	11	AGGAG	GENOMAD.224010.VP	3.442e-49	177	0	0	0	1	NA	NA	NA	PF02876	Staphylococcal/Streptococcal toxin, beta-grasp domain
+NC_002737.2|provirus_1186916_1222544_1181	1186916	1188778	1863	-1	0.405	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1182	1189309	1189491	183	-1	0.415	11	AGGAG	GENOMAD.222241.VP	3.425e-27	104	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1183	1189729	1190529	801	1	0.367	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1184	1190749	1191234	486	1	0.270	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1185	1191304	1192509	1206	-1	0.440	11	AGGAG	GENOMAD.133734.VP	8.732e-41	159	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1186	1192506	1192616	111	-1	0.387	11	AGGAG	GENOMAD.102275.VV	5.331e-12	59	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1187	1192625	1192852	228	-1	0.395	11	AGGAG	GENOMAD.126098.VV	2.718e-14	68	0	0	0	2561	Caudoviricetes	NA	NA	COG5546	NA
+NC_002737.2|provirus_1186916_1222544_1188	1192849	1193124	276	-1	0.351	11	GGAG/GAGG	GENOMAD.039653.VV	9.653e-09	53	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1189	1193134	1193751	618	-1	0.429	11	AGGAG	GENOMAD.024672.VV	3.618e-113	360	0	0	0	2561	Caudoviricetes	NA	NA	PF07104	NA
+NC_002737.2|provirus_1186916_1222544_1190	1193754	1194185	432	-1	0.370	11	AGGAG	GENOMAD.073534.VV	1.119e-78	257	0	0	0	2561	Caudoviricetes	NA	NA	PF07761	NA
+NC_002737.2|provirus_1186916_1222544_1191	1194197	1195981	1785	-1	0.406	11	AGGAG	GENOMAD.033709.VV	3.341e-135	444	0	0	0	2561	Caudoviricetes	NA	NA	PF07902	gp58-like protein
+NC_002737.2|provirus_1186916_1222544_1192	1195996	1197108	1113	-1	0.399	11	GGAGG	GENOMAD.093524.VV	3.001e-116	378	0	0	0	2561	Caudoviricetes	NA	NA	PF07212	Hyaluronidase protein (HylP)
+NC_002737.2|provirus_1186916_1222544_1193	1197108	1199066	1959	-1	0.393	11	GGAGG	GENOMAD.010194.VV	2.301e-123	412	0	0	1	2561	Caudoviricetes	NA	NA	PF06605;COG4926	Phage-related protein
+NC_002737.2|provirus_1186916_1222544_1194	1199063	1199758	696	-1	0.375	11	GGAG/GAGG	GENOMAD.004911.VV	4.418e-12	68	0	0	0	2561	Caudoviricetes	NA	NA	PF20195;COG4722;TIGR01633	Phage-related protein
+NC_002737.2|provirus_1186916_1222544_1195	1199755	1202112	2358	-1	0.416	11	AGGAG	GENOMAD.003531.VV	1.119e-145	483	0	0	0	2561	Caudoviricetes	NA	NA	COG5412	Phage-related protein
+NC_002737.2|provirus_1186916_1222544_1196	1202112	1202483	372	-1	0.368	11	None	GENOMAD.024158.VV	1.493e-41	149	0	0	0	2561	Caudoviricetes	NA	NA	PF17318	NA
+NC_002737.2|provirus_1186916_1222544_1197	1202498	1202761	264	-1	0.322	11	GGA/GAG/AGG	GENOMAD.021224.VV	2.203e-21	89	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1198	1202772	1203365	594	-1	0.375	11	AGGAG	GENOMAD.073691.VV	9.405e-47	168	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1199	1203377	1203712	336	-1	0.354	11	AGxAGG/AGGxGG	GENOMAD.019860.VV	4.248e-41	147	0	0	1	2561	Caudoviricetes	NA	NA	PF16807	NA
+NC_002737.2|provirus_1186916_1222544_1200	1203713	1203949	237	-1	0.392	11	GGA/GAG/AGG	GENOMAD.017784.VV	2.629e-38	137	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1201	1203942	1204280	339	-1	0.375	11	AGGAG/GGAGG	GENOMAD.018809.VV	1.338e-53	183	0	0	1	2561	Caudoviricetes	NA	NA	PF10665	Minor capsid protein
+NC_002737.2|provirus_1186916_1222544_1202	1204240	1204662	423	-1	0.404	11	AGGAG	GENOMAD.076853.VV	1.373e-58	199	0	0	1	2561	Caudoviricetes	NA	NA	PF09355	Phage protein Gp19/Gp15/Gp42
+NC_002737.2|provirus_1186916_1222544_1203	1204672	1204872	201	-1	0.403	11	AGGAG	GENOMAD.069443.VV	8.097e-08	49	0	0	1	2561	Caudoviricetes	NA	NA	PF09124	T4 recombination endonuclease VII, dimerisation
+NC_002737.2|provirus_1186916_1222544_1204	1204872	1205783	912	-1	0.402	11	AGGAG	GENOMAD.013457.VV	1.303e-93	309	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;TIGR01554;COG4653	Phage capsid family
+NC_002737.2|provirus_1186916_1222544_1205	1205808	1206269	462	-1	0.398	11	AGGA	GENOMAD.083647.VV	5.39e-33	126	0	0	0	2561	Caudoviricetes	NA	NA	PF14265	NA
+NC_002737.2|provirus_1186916_1222544_1206	1206350	1207765	1416	-1	0.397	11	AGGA	GENOMAD.003419.VV	3.618e-228	707	0	0	1	2561	Caudoviricetes	NA	NA	PF20441;PF03354;COG4626;TIGR01547;K17677	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_002737.2|provirus_1186916_1222544_1207	1207875	1208141	267	-1	0.363	11	AGGAG	GENOMAD.076597.VV	5.163e-44	154	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1208	1208134	1208313	180	-1	0.317	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1209	1208363	1208587	225	-1	0.387	11	None	GENOMAD.193246.VV	2.324e-45	157	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1210	1208593	1210086	1494	-1	0.364	11	GGAGG	GENOMAD.003531.VV	5.059e-87	299	0	0	0	2561	Caudoviricetes	NA	NA	COG5412	Phage-related protein
+NC_002737.2|provirus_1186916_1222544_1211	1210079	1211347	1269	-1	0.414	11	AGGAG	GENOMAD.076853.VV	1.22e-50	189	0	0	1	2561	Caudoviricetes	NA	NA	PF09355	Phage protein Gp19/Gp15/Gp42
+NC_002737.2|provirus_1186916_1222544_1212	1211344	1211700	357	-1	0.314	11	GGAGG	GENOMAD.072475.VV	3.993e-61	205	0	0	0	2561	Caudoviricetes	NA	NA	PF12855;COG4338	ECL1/2/3 zinc binding proteins
+NC_002737.2|provirus_1186916_1222544_1213	1211849	1212193	345	-1	0.432	11	GGA/GAG/AGG	GENOMAD.108097.VV	8.959e-27	106	0	0	0	2561	Caudoviricetes	NA	NA	PF13395	HNH endonuclease
+NC_002737.2|provirus_1186916_1222544_1214	1212302	1212721	420	-1	0.362	11	AGGAG	GENOMAD.024790.VV	1.124e-76	251	0	0	0	2561	Caudoviricetes	NA	NA	PF07374;TIGR01636;COG2739	phage transcriptional activator, RinA family
+NC_002737.2|provirus_1186916_1222544_1215	1212989	1213624	636	-1	0.360	11	GGAGG	GENOMAD.138295.VP	1.141e-77	258	0	0	0	2561	Caudoviricetes	NA	NA	TIGR02987;COG0827	NA
+NC_002737.2|provirus_1186916_1222544_1216	1213626	1213895	270	-1	0.393	11	GGA/GAG/AGG	GENOMAD.072347.VV	2.986e-42	149	0	0	0	2561	Caudoviricetes	NA	NA	TIGR02209	NA
+NC_002737.2|provirus_1186916_1222544_1217	1213979	1214491	513	-1	0.378	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1218	1214488	1214880	393	-1	0.361	11	None	GENOMAD.060064.VV	5.451e-14	70	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1219	1215006	1215803	798	-1	0.397	11	GGAG/GAGG	GENOMAD.161534.VP	1.003e-148	466	0	0	0	2561	Caudoviricetes	NA	NA	PF12684;TIGR01896	PDDEXK-like domain of unknown function (DUF3799)
+NC_002737.2|provirus_1186916_1222544_1220	1215796	1215996	201	-1	0.318	11	GGAG/GAGG	GENOMAD.148606.VV	1.297e-39	140	0	0	0	1	NA	NA	NA	PF06289	NA
+NC_002737.2|provirus_1186916_1222544_1221	1215993	1216982	990	-1	0.399	11	GGAG/GAGG	GENOMAD.091877.VP	1.608e-51	188	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;COG3723;K07455;TIGR00616	Recombinational DNA repair protein RecT
+NC_002737.2|provirus_1186916_1222544_1222	1216982	1217314	333	-1	0.315	11	GGAG/GAGG	GENOMAD.040347.VV	3.314e-43	153	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1223	1217370	1217576	207	-1	0.406	11	AGGAG	GENOMAD.114751.VV	1.769e-37	134	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1224	1217585	1217725	141	-1	0.404	11	AGGAG	GENOMAD.079484.VV	1.722e-06	44	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1225	1217722	1217955	234	-1	0.359	11	None	GENOMAD.100896.VV	1.121e-38	138	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1226	1217936	1218322	387	-1	0.370	11	AGGAG	GENOMAD.198321.CP	4.29e-06	47	0	0	0	2561	Caudoviricetes	NA	NA	PF07261;COG3611;TIGR04548;K02086	Replication initiation and membrane attachment protein DnaB
+NC_002737.2|provirus_1186916_1222544_1227	1218448	1218702	255	-1	0.396	11	4Base/6BMM	GENOMAD.136142.VP	2.402e-34	126	0	0	0	2561	Caudoviricetes	NA	NA	PF13730;TIGR00373;COG4738;K07721	transcription factor E
+NC_002737.2|provirus_1186916_1222544_1228	1218811	1218996	186	-1	0.382	11	AGGAG	GENOMAD.105558.VV	1.448e-28	108	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1229	1218998	1219309	312	-1	0.353	11	GGAG/GAGG	GENOMAD.050216.VV	2.881e-57	193	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1230	1219407	1219538	132	-1	0.341	11	AGGA	GENOMAD.114759.VV	3.069e-20	83	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_002737.2|provirus_1186916_1222544_1231	1219579	1219791	213	-1	0.347	11	AGGAG	GENOMAD.225776.VP	0.0003177	39	0	0	0	1	NA	NA	NA	PF05339;TIGR00673;COG3620;K22299	cyanase
+NC_002737.2|provirus_1186916_1222544_1232	1219993	1220748	756	1	0.368	11	AGGAG	GENOMAD.091877.VP	8.865e-44	162	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;COG3723;K07455;TIGR00616	Recombinational DNA repair protein RecT
+NC_002737.2|provirus_1186916_1222544_1233	1220760	1221278	519	1	0.326	11	AGGAG	GENOMAD.064488.VV	1.26e-91	296	0	0	0	2561	Caudoviricetes	NA	NA	PF08797	HIRAN domain
+NC_002737.2|provirus_1186916_1222544_1234	1221402	1222544	1143	1	0.354	11	GGAG/GAGG	GENOMAD.111131.VV	8.486e-09	60	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_003450.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_008261.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,113 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_008261.1|provirus_1070550_1127691_877	1070550	1072190	1641	1	0.238	11	GGA/GAG/AGG	GENOMAD.082048.VV	1.889e-05	50	0	0	0	12031	Mimiviridae	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_878	1072272	1072892	621	1	0.337	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_879	1073139	1074983	1845	1	0.246	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_880	1075096	1076289	1194	1	0.258	11	AGGAG	GENOMAD.076874.VV	1.378e-16	85	0	0	0	2561	Caudoviricetes	NA	NA	PF01041;K07806;TIGR03588;COG0399	UDP-4-amino-4,6-dideoxy-N-acetyl-beta-L-altrosamine transaminase
+NC_008261.1|provirus_1070550_1127691_881	1076295	1076897	603	1	0.227	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_882	1076920	1077945	1026	1	0.217	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_883	1077932	1079059	1128	1	0.243	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_884	1079063	1080139	1077	1	0.194	11	GGA/GAG/AGG	GENOMAD.216304.PC	1.438e-24	109	0	0	0	1	NA	NA	NA	PF14897;K19419;COG4745;TIGR03663	EpsG family
+NC_008261.1|provirus_1070550_1127691_885	1080176	1081549	1374	1	0.191	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_886	1081573	1082385	813	1	0.232	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_887	1082401	1083114	714	1	0.230	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_888	1083114	1083731	618	1	0.235	11	AGGAG/GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_889	1083893	1084318	426	1	0.312	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_890	1084498	1084986	489	1	0.266	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_891	1085277	1087037	1761	1	0.293	11	AGGA	GENOMAD.152449.VC	1.254e-06	54	0	0	0	1	NA	NA	NA	PF13597;PF01638;K21636;TIGR02487;COG1328	anaerobic ribonucleoside-triphosphate reductase
+NC_008261.1|provirus_1070550_1127691_892	1087034	1087492	459	1	0.307	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_893	1087687	1088409	723	1	0.245	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_894	1088615	1088833	219	-1	0.187	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_895	1089077	1090141	1065	-1	0.241	11	GGAG/GAGG	GENOMAD.225071.VP	1.1e-06	53	0	0	0	1	NA	NA	NA	PF00589;PF13102;TIGR02225;COG4973;K14059	tyrosine recombinase XerD
+NC_008261.1|provirus_1070550_1127691_896	1090234	1090698	465	-1	0.282	11	AGxAGG/AGGxGG	GENOMAD.123021.VV	2.145e-26	107	0	0	0	2561	Caudoviricetes	NA	NA	PF06114;COG2856	IrrE N-terminal-like domain
+NC_008261.1|provirus_1070550_1127691_897	1090714	1091217	504	-1	0.270	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_898	1091369	1091605	237	1	0.241	11	GGAGG	GENOMAD.069056.VV	3.217e-21	88	0	0	1	2561	Caudoviricetes	NA	NA	PF06892;TIGR00673;COG1974;K07727	cyanase
+NC_008261.1|provirus_1070550_1127691_899	1091617	1092348	732	1	0.294	11	AGGAGG	GENOMAD.119058.VP	1.071e-22	100	0	0	0	2561	Caudoviricetes	NA	NA	PF10552	ORF6C domain
+NC_008261.1|provirus_1070550_1127691_900	1092374	1092628	255	1	0.239	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_901	1092597	1093268	672	-1	0.226	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_902	1093445	1093747	303	1	0.323	11	AGGAGG	GENOMAD.061044.VV	4.551e-51	175	0	0	1	2561	Caudoviricetes	NA	NA	PF13411;COG4220;TIGR02054	Phage DNA packaging protein, Nu1 subunit of terminase
+NC_008261.1|provirus_1070550_1127691_903	1093749	1093928	180	1	0.233	11	AGGAGG	GENOMAD.164182.VV	2.491e-15	70	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_904	1093939	1094121	183	1	0.268	11	GGA/GAG/AGG	GENOMAD.117872.VV	7.847e-06	43	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_905	1094118	1094225	108	1	0.269	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_906	1094418	1094603	186	1	0.339	11	AGGAGG	GENOMAD.172161.VC	4.982e-10	55	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_907	1094603	1095514	912	1	0.305	11	AGGAGG	GENOMAD.142278.VP	1.844e-07	55	0	0	1	2561	Caudoviricetes	NA	NA	PF09588;COG5377;TIGR03033	Phage-related protein, predicted endonuclease
+NC_008261.1|provirus_1070550_1127691_908	1095516	1096385	870	1	0.313	11	AGGAGG	GENOMAD.098980.VP	5.121e-35	138	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;COG3723;K07455;TIGR00616	Recombinational DNA repair protein RecT
+NC_008261.1|provirus_1070550_1127691_909	1096403	1097116	714	1	0.312	11	AGGAGG	GENOMAD.178290.VP	7.894e-26	109	0	0	1	2561	Caudoviricetes	NA	NA	PF04492;TIGR01714;COG2188	Bacteriophage replication protein O
+NC_008261.1|provirus_1070550_1127691_910	1097117	1097290	174	1	0.299	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_911	1097284	1097670	387	1	0.333	11	GGAGG	GENOMAD.194141.VP	1.905e-16	77	0	0	0	2561	Caudoviricetes	NA	NA	PF05866;COG4570	Endodeoxyribonuclease RusA
+NC_008261.1|provirus_1070550_1127691_912	1097820	1098467	648	1	0.267	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_913	1099026	1099499	474	1	0.274	11	AGGAGG	GENOMAD.062141.VV	1.203e-15	76	0	0	0	2561	Caudoviricetes	NA	NA	PF05263;TIGR01636	phage transcriptional activator, RinA family
+NC_008261.1|provirus_1070550_1127691_914	1099982	1101157	1176	1	0.225	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_915	1101226	1101693	468	1	0.333	11	AGxAGG/AGGxGG	GENOMAD.026460.VV	4.147e-28	112	0	0	1	2561	Caudoviricetes	NA	NA	PF03592;COG3728;K07474	Phage terminase, small subunit
+NC_008261.1|provirus_1070550_1127691_916	1101686	1103050	1365	1	0.304	11	AGGA	GENOMAD.017640.VV	7.419e-95	320	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_917	1103106	1103873	768	1	0.217	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_918	1103919	1105439	1521	1	0.300	11	AGGAGG	GENOMAD.016130.VV	7.684e-228	708	0	0	1	2561	Caudoviricetes	NA	NA	PF05133;TIGR01542	phage portal protein, putative, A118 family
+NC_008261.1|provirus_1070550_1127691_919	1105423	1107060	1638	1	0.299	11	GGAG/GAGG	GENOMAD.015690.VV	1.626e-76	270	0	0	1	2561	Caudoviricetes	NA	NA	PF06152;TIGR01641	Phage minor capsid protein 2
+NC_008261.1|provirus_1070550_1127691_920	1107073	1107297	225	1	0.262	11	GGAG/GAGG	GENOMAD.093339.VV	2.906e-13	65	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_921	1107325	1107942	618	1	0.235	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_922	1108036	1108641	606	1	0.345	11	GGAGG	GENOMAD.041104.VV	1.371e-23	101	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_923	1108666	1109571	906	1	0.305	11	AGGAG	GENOMAD.075076.VV	1.757e-79	268	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_924	1109586	1109855	270	1	0.263	11	AGGAG	GENOMAD.050526.VV	1.494e-18	81	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_925	1109891	1110253	363	1	0.267	11	AGGA	GENOMAD.020431.VV	1.927e-29	114	0	0	0	2561	Caudoviricetes	NA	NA	PF11436	Putative DnaT-like ssDNA binding protein
+NC_008261.1|provirus_1070550_1127691_926	1110257	1110583	327	1	0.315	11	AGGAGG	GENOMAD.024076.VV	1.104e-53	183	0	0	1	2561	Caudoviricetes	NA	NA	PF10665	Minor capsid protein
+NC_008261.1|provirus_1070550_1127691_927	1110583	1110966	384	1	0.271	11	GGAG/GAGG	GENOMAD.019595.VV	1.238e-61	207	0	0	1	2561	Caudoviricetes	NA	NA	PF11114	Minor capsid protein
+NC_008261.1|provirus_1070550_1127691_928	1110966	1111352	387	1	0.300	11	AGGA/GGAG/GAGG	GENOMAD.028696.VV	6.269e-45	159	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_929	1111362	1111820	459	1	0.353	11	GGA/GAG/AGG	GENOMAD.019307.VV	5.136e-50	175	0	0	1	2561	Caudoviricetes	NA	NA	PF16461;COG5437	Predicted secreted protein
+NC_008261.1|provirus_1070550_1127691_930	1111833	1112201	369	1	0.263	11	AGGAGG	GENOMAD.052890.VV	8.683e-47	164	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_931	1112161	1112523	363	1	0.314	11	3Base/5BMM	GENOMAD.015650.VV	9.786e-61	204	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_932	1112564	1115776	3213	1	0.311	11	AGxAGG/AGGxGG	GENOMAD.171590.VP	0.0	1638	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_933	1115780	1116133	354	1	0.319	11	None	GENOMAD.012935.VV	2.528e-49	171	0	0	0	2561	Caudoviricetes	NA	NA	PF20458	NA
+NC_008261.1|provirus_1070550_1127691_934	1116156	1116422	267	1	0.292	11	AGxAGG/AGGxGG	GENOMAD.163907.VV	7.646e-48	165	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_935	1116489	1116869	381	1	0.226	11	GGAG/GAGG	GENOMAD.016019.VV	6.313e-44	156	0	0	0	2561	Caudoviricetes	NA	NA	PF07761	NA
+NC_008261.1|provirus_1070550_1127691_936	1116905	1122013	5109	1	0.296	11	AGxAGG/AGGxGG	GENOMAD.141397.VP	0.0	2111	0	0	1	2561	Caudoviricetes	NA	NA	PF06605;PF00149;TIGR01665;K01517;COG4926	phage minor structural protein, N-terminal region
+NC_008261.1|provirus_1070550_1127691_937	1122032	1122280	249	1	0.217	11	AGGAGG	GENOMAD.113645.VV	4.861e-34	125	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_938	1122294	1122710	417	1	0.276	11	AGGA	GENOMAD.112625.VV	0.0002838	42	0	0	1	1	NA	NA	NA	PF05105;TIGR01593;COG4824	toxin secretion/phage lysis holin
+NC_008261.1|provirus_1070550_1127691_939	1122751	1123167	417	1	0.281	11	AGxAGG/AGGxGG	GENOMAD.224084.VP	7.697e-31	119	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_940	1123253	1124281	1029	1	0.290	11	AGxAGG/AGGxGG	GENOMAD.169358.VC	0.0003137	45	0	0	0	2561	Caudoviricetes	NA	NA	PF06725;PF18348;COG3584;K11060;TIGR04211	3D (Asp-Asp-Asp) domain
+NC_008261.1|provirus_1070550_1127691_941	1124699	1125361	663	1	0.186	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_942	1125585	1126673	1089	1	0.234	11	GGAG/GAGG	GENOMAD.129207.VV	1.696e-28	121	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_943	1126618	1126959	342	1	0.266	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1070550_1127691_944	1126966	1127691	726	1	0.247	11	AGxAGG/AGGxGG	GENOMAD.129093.VV	5.379e-18	86	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1520	1784095	1784580	486	-1	0.302	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1521	1784747	1785049	303	-1	0.261	11	AGGAGG	GENOMAD.099786.VV	1.61e-22	93	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1522	1785241	1786269	1029	-1	0.287	11	AGxAGG/AGGxGG	GENOMAD.169358.VC	1.801e-05	49	0	0	0	2561	Caudoviricetes	NA	NA	PF06725;PF18348;COG3584;K11060;TIGR04211	3D (Asp-Asp-Asp) domain
+NC_008261.1|provirus_1784095_1821197_1523	1786323	1786805	483	-1	0.271	11	AGxAGG/AGGxGG	GENOMAD.222318.VP	5.723e-61	207	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1524	1786826	1787059	234	-1	0.226	11	GGA/GAG/AGG	GENOMAD.080405.VV	7.991e-27	104	0	0	0	2561	Caudoviricetes	NA	NA	PF10779	Haemolysin XhlA
+NC_008261.1|provirus_1784095_1821197_1525	1787141	1787326	186	-1	0.290	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1526	1787345	1789843	2499	-1	0.279	11	AGGAG	GENOMAD.033703.VV	5.052e-243	769	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1527	1789859	1791739	1881	-1	0.297	11	AGGAG	GENOMAD.082024.VV	7.094e-68	247	0	0	0	2561	Caudoviricetes	NA	NA	PF10651;PF15425	BppU N-terminal domain
+NC_008261.1|provirus_1784095_1821197_1528	1791790	1794849	3060	-1	0.307	11	None	GENOMAD.004842.VV	2.175e-102	362	0	0	1	2561	Caudoviricetes	NA	NA	PF06605;PF18994;COG4926;TIGR01665	Phage-related protein
+NC_008261.1|provirus_1784095_1821197_1529	1794854	1795564	711	-1	0.249	11	GGAGG	GENOMAD.055476.VV	7.973e-38	144	0	0	0	2561	Caudoviricetes	NA	NA	PF20195;COG4722;TIGR01633	Phage-related protein
+NC_008261.1|provirus_1784095_1821197_1530	1795557	1798811	3255	-1	0.299	11	AGGAGG	GENOMAD.104282.VP	3.823e-53	208	0	0	0	2561	Caudoviricetes	NA	NA	COG5412	Phage-related protein
+NC_008261.1|provirus_1784095_1821197_1531	1798847	1799200	354	-1	0.218	11	None	GENOMAD.080513.VV	1.378e-06	48	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1532	1799362	1799679	318	-1	0.270	11	GGA/GAG/AGG	GENOMAD.080540.VV	1.741e-55	188	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1533	1799682	1800284	603	-1	0.315	11	AGxAGG/AGGxGG	GENOMAD.013991.VV	4.274e-39	146	0	0	1	2561	Caudoviricetes	NA	NA	PF04630;TIGR01603	phage major tail protein, phi13 family
+NC_008261.1|provirus_1784095_1821197_1534	1800301	1800648	348	-1	0.261	11	AGxAGG/AGGxGG	GENOMAD.056191.VV	7.661e-29	112	0	0	0	2561	Caudoviricetes	NA	NA	PF05657	NA
+NC_008261.1|provirus_1784095_1821197_1535	1800657	1801094	438	-1	0.304	11	GGAG/GAGG	GENOMAD.072939.VV	1.155e-20	90	0	0	1	2561	Caudoviricetes	NA	NA	TIGR01725;COG5005	phage protein, HK97 gp10 family
+NC_008261.1|provirus_1784095_1821197_1536	1801094	1801423	330	-1	0.276	11	None	GENOMAD.078312.VV	2.185e-15	73	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;TIGR01563;COG5614	phage head-tail adaptor, putative, SPP1 family
+NC_008261.1|provirus_1784095_1821197_1537	1801416	1801694	279	-1	0.262	11	GGA/GAG/AGG	GENOMAD.034954.VV	1.311e-13	67	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR01560	Phage gp6-like head-tail connector protein
+NC_008261.1|provirus_1784095_1821197_1538	1801706	1802890	1185	-1	0.295	11	AGGAGG	GENOMAD.014413.VV	7.217e-42	162	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;TIGR01554;COG4653	phage major capsid protein, HK97 family
+NC_008261.1|provirus_1784095_1821197_1539	1802931	1803536	606	-1	0.289	11	AGxAGG/AGGxGG	GENOMAD.126260.VV	7.801e-51	180	0	0	1	2561	Caudoviricetes	NA	NA	PF04586;COG3740;K06904;TIGR01543	Phage head maturation protease
+NC_008261.1|provirus_1784095_1821197_1540	1803526	1804773	1248	-1	0.272	11	GGAG/GAGG	GENOMAD.126260.VV	8.756e-55	201	0	0	1	2561	Caudoviricetes	NA	NA	PF04586;COG3740;K06904;TIGR01543	Phage head maturation protease
+NC_008261.1|provirus_1784095_1821197_1541	1804774	1806513	1740	-1	0.303	11	AGGA	GENOMAD.166487.VP	8.866e-49	188	0	0	1	2561	Caudoviricetes	NA	NA	PF20441;COG4626	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_008261.1|provirus_1784095_1821197_1542	1806506	1807018	513	-1	0.271	11	GGA/GAG/AGG	GENOMAD.136127.VP	7.834e-17	80	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_008261.1|provirus_1784095_1821197_1543	1807521	1808342	822	-1	0.246	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1544	1808517	1809065	549	-1	0.270	11	GGAG/GAGG	GENOMAD.027124.VV	1.276e-14	74	0	0	0	2561	Caudoviricetes	NA	NA	PF07104	NA
+NC_008261.1|provirus_1784095_1821197_1545	1809160	1809513	354	-1	0.263	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1546	1809572	1809778	207	-1	0.304	11	GGAG/GAGG	GENOMAD.117627.VV	5.796e-41	144	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1547	1809920	1810381	462	-1	0.264	11	GGAG/GAGG	GENOMAD.062141.VV	1.839e-18	84	0	0	0	2561	Caudoviricetes	NA	NA	PF05263;TIGR01636	phage transcriptional activator, RinA family
+NC_008261.1|provirus_1784095_1821197_1548	1810917	1811306	390	-1	0.295	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1549	1811321	1811467	147	-1	0.272	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1550	1811479	1812762	1284	-1	0.296	11	GGA/GAG/AGG	GENOMAD.068048.VV	6.568e-15	80	0	0	1	2561	Caudoviricetes	NA	NA	PF20307;TIGR03600;K02314;COG0305	phage replicative helicase, DnaB family, HK022 subfamily
+NC_008261.1|provirus_1784095_1821197_1551	1812773	1813513	741	-1	0.266	11	GGAG/GAGG	GENOMAD.096239.VV	9.382e-28	115	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1552	1813541	1813699	159	-1	0.270	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1553	1813702	1813881	180	-1	0.267	11	AGGAGG	GENOMAD.148814.VV	1.3e-07	48	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1554	1813907	1814137	231	-1	0.277	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1555	1814143	1814640	498	-1	0.295	11	AGGAG	GENOMAD.142555.VV	5.332e-20	89	0	0	1	2561	Caudoviricetes	NA	NA	PF06892;TIGR02612;K22299;COG3620	Phage regulatory protein CII (CP76)
+NC_008261.1|provirus_1784095_1821197_1556	1814690	1814878	189	-1	0.243	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1557	1815028	1815372	345	1	0.278	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1558	1815423	1817012	1590	1	0.228	11	GGAGG	GENOMAD.219971.CV	7.902e-13	74	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1559	1817080	1817934	855	1	0.237	11	AGGAG	GENOMAD.170359.VC	3.605e-08	57	0	0	0	1	NA	NA	NA	PF02086;TIGR00571;COG0338;K06223	DNA adenine methylase (dam)
+NC_008261.1|provirus_1784095_1821197_1560	1818046	1818543	498	1	0.267	11	GGxGG	GENOMAD.123021.VV	2.082e-10	61	0	0	0	2561	Caudoviricetes	NA	NA	PF06114;COG2856	IrrE N-terminal-like domain
+NC_008261.1|provirus_1784095_1821197_1561	1818556	1820064	1509	1	0.250	11	GGAGG	GENOMAD.169508.VP	2.109e-24	111	0	0	1	2561	Caudoviricetes	NA	NA	PF04708;PF13262;COG1961;K14060	Site-specific DNA recombinase related to the DNA invertase Pin
+NC_008261.1|provirus_1784095_1821197_1562	1820078	1820416	339	-1	0.301	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_008261.1|provirus_1784095_1821197_1563	1820820	1821197	378	-1	0.257	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_009012.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,223 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_009012.1|provirus_1938476_1983993_1694	1938476	1938967	492	-1	0.404	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1695	1938931	1940499	1569	-1	0.392	11	AGGAGG	GENOMAD.097162.VV	2.214e-10	66	0	0	1	2561	Caudoviricetes	NA	NA	PF20307;TIGR03600;COG0305;K18947	phage replicative helicase, DnaB family, HK022 subfamily
+NC_009012.1|provirus_1938476_1983993_1696	1940561	1940779	219	-1	0.416	11	AGGAGG	GENOMAD.180442.VC	1.734e-24	97	0	0	0	2561	Caudoviricetes	NA	NA	PF20612	SHOCT domain
+NC_009012.1|provirus_1938476_1983993_1697	1940837	1941841	1005	-1	0.450	11	AGGAGG	GENOMAD.215835.VV	1.253e-44	168	0	0	0	2561	Caudoviricetes	NA	NA	PF01510;COG5632;K11066	N-acetylmuramoyl-L-alanine amidase CwlA
+NC_009012.1|provirus_1938476_1983993_1698	1941838	1942257	420	-1	0.464	11	GGAGG	GENOMAD.083633.VV	5.263e-08	53	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1699	1942344	1944812	2469	-1	0.465	11	AGxAGG/AGGxGG	GENOMAD.116546.VV	0.0	1051	0	0	1	2561	Caudoviricetes	NA	NA	PF06605;TIGR01665;COG4926	phage minor structural protein, N-terminal region
+NC_009012.1|provirus_1938476_1983993_1700	1944809	1945384	576	-1	0.472	11	GGA/GAG/AGG	GENOMAD.066153.VV	1.508e-90	294	0	0	1	2561	Caudoviricetes	NA	NA	PF06605;TIGR01665;COG4926	phage minor structural protein, N-terminal region
+NC_009012.1|provirus_1938476_1983993_1701	1945394	1945588	195	-1	0.446	11	GGAG/GAGG	GENOMAD.089015.VV	2.452e-32	119	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1702	1945599	1948121	2523	-1	0.450	11	GGAGG	GENOMAD.116546.VV	0.0	1208	0	0	1	2561	Caudoviricetes	NA	NA	PF06605;TIGR01665;COG4926	phage minor structural protein, N-terminal region
+NC_009012.1|provirus_1938476_1983993_1703	1948126	1948899	774	-1	0.433	11	GGAGG	GENOMAD.116614.VV	3.551e-139	438	0	0	0	2561	Caudoviricetes	NA	NA	PF20195;COG4722;TIGR01633	Phage-related protein
+NC_009012.1|provirus_1938476_1983993_1704	1948913	1951201	2289	-1	0.504	11	AGGAGG	GENOMAD.036973.VV	4.796e-161	527	0	0	0	2561	Caudoviricetes	NA	NA	K02334;COG4722	Phage-related protein
+NC_009012.1|provirus_1938476_1983993_1705	1951335	1951607	273	1	0.502	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1706	1951604	1952008	405	1	0.504	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1707	1952057	1952248	192	-1	0.453	11	None	GENOMAD.223693.VP	2.475e-24	96	0	0	1	2561	Caudoviricetes	NA	NA	PF09550;TIGR02216	Phage tail assembly chaperone protein, TAC
+NC_009012.1|provirus_1938476_1983993_1708	1952245	1952628	384	-1	0.448	11	AGGAGG	GENOMAD.166825.VP	3.751e-66	220	0	0	1	2561	Caudoviricetes	NA	NA	PF11836	Phage tail tube protein, GTA-gp10
+NC_009012.1|provirus_1938476_1983993_1709	1952631	1953227	597	-1	0.513	11	AGGAGG	GENOMAD.005050.VV	1.417e-111	355	0	0	1	2561	Caudoviricetes	NA	NA	PF04630;TIGR01603	phage major tail protein, phi13 family
+NC_009012.1|provirus_1938476_1983993_1710	1953233	1953577	345	-1	0.429	11	AGGAG/GGAGG	GENOMAD.077616.VV	1.204e-39	143	0	0	0	2561	Caudoviricetes	NA	NA	PF05657	NA
+NC_009012.1|provirus_1938476_1983993_1711	1953574	1954005	432	-1	0.465	11	AGGAGG	GENOMAD.032585.VV	5.7e-53	183	0	0	1	2561	Caudoviricetes	NA	NA	PF11114;COG5005;TIGR01725	Mu-like prophage protein gpG
+NC_009012.1|provirus_1938476_1983993_1712	1954022	1954357	336	-1	0.440	11	GGA/GAG/AGG	GENOMAD.040271.VV	1.154e-54	186	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;COG5614;TIGR01563	Bacteriophage head-tail adaptor
+NC_009012.1|provirus_1938476_1983993_1713	1954360	1954668	309	-1	0.472	11	GGAGG	GENOMAD.028909.VV	6.135e-49	169	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR01560	Phage gp6-like head-tail connector protein
+NC_009012.1|provirus_1938476_1983993_1714	1954690	1955892	1203	-1	0.482	11	AGGAGG	GENOMAD.168658.VV	4.012e-34	139	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;PF04586;PF12518;COG4653;TIGR01554;K06904	Predicted phage phi-C31 gp36 major capsid-like protein
+NC_009012.1|provirus_1938476_1983993_1715	1955943	1956671	729	-1	0.439	11	GGAGG	GENOMAD.028909.VV	1.82e-27	114	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR01560	Phage gp6-like head-tail connector protein
+NC_009012.1|provirus_1938476_1983993_1716	1956610	1957932	1323	-1	0.485	11	AGGAG	GENOMAD.179073.VP	1.831e-53	198	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1717	1958009	1959793	1785	-1	0.324	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1718	1959867	1961096	1230	-1	0.462	11	None	GENOMAD.181434.VP	5.613e-61	219	0	0	1	2561	Caudoviricetes	NA	NA	PF20441	Terminase large subunit, endonuclease domain
+NC_009012.1|provirus_1938476_1983993_1719	1961099	1961434	336	-1	0.458	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1720	1961573	1961767	195	-1	0.385	11	GGAG/GAGG	GENOMAD.140940.VV	2.57e-10	56	0	0	0	2561	Caudoviricetes	NA	NA	PF16468	NA
+NC_009012.1|provirus_1938476_1983993_1721	1961771	1962238	468	-1	0.464	11	AGGAGG	GENOMAD.191984.VP	6.704e-12	65	0	0	0	2561	Caudoviricetes	NA	NA	PF07128	NA
+NC_009012.1|provirus_1938476_1983993_1722	1962300	1963199	900	-1	0.504	11	AGGAG	GENOMAD.105515.VV	0.0005042	44	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1723	1963341	1963571	231	-1	0.463	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1724	1963597	1964289	693	-1	0.440	11	GGAGG	GENOMAD.105515.VV	6.371e-26	109	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1725	1964406	1965659	1254	-1	0.440	11	GGAGG	GENOMAD.208446.VP	2.08e-27	119	0	0	0	2561	Caudoviricetes	NA	NA	PF01555;COG4725;K13581	N6-adenosine-specific RNA methylase IME4
+NC_009012.1|provirus_1938476_1983993_1726	1965665	1966963	1299	-1	0.464	11	AGGAG	GENOMAD.005053.VV	4.044e-23	106	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1727	1966938	1967120	183	-1	0.350	11	AGGAGG	GENOMAD.195270.VP	2e-32	119	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1728	1967120	1967671	552	-1	0.502	11	GGAG/GAGG	GENOMAD.098194.VV	4.683e-91	295	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_009012.1|provirus_1938476_1983993_1729	1967792	1968151	360	-1	0.478	11	AGGAGG	GENOMAD.127444.VV	9.611e-12	63	0	0	0	2561	Caudoviricetes	NA	NA	PF13395	HNH endonuclease
+NC_009012.1|provirus_1938476_1983993_1730	1968273	1968515	243	-1	0.399	11	AGGAG	GENOMAD.212426.VP	6.855e-15	70	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1731	1968659	1969657	999	-1	0.379	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1732	1969697	1970107	411	-1	0.309	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1733	1970346	1970801	456	-1	0.436	11	GGAGG	GENOMAD.056402.VV	3.108e-38	141	0	0	0	2561	Caudoviricetes	NA	NA	PF05263;TIGR01636	phage transcriptional activator, RinA family
+NC_009012.1|provirus_1938476_1983993_1734	1970893	1971195	303	-1	0.452	11	GGAGG	GENOMAD.138066.VP	1.61e-22	93	0	0	0	2561	Caudoviricetes	NA	NA	PF03838;COG3331;TIGR00648	Penicillin-binding protein-related factor A, putative recombinase
+NC_009012.1|provirus_1938476_1983993_1735	1971496	1974051	2556	-1	0.449	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1736	1974048	1974473	426	-1	0.465	11	AGxAGG/AGGxGG	GENOMAD.179451.VC	2.953e-05	45	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1737	1974489	1975286	798	-1	0.396	11	GGAGG	GENOMAD.153366.VP	4.288e-20	93	0	0	0	2561	Caudoviricetes	NA	NA	PF03374;COG3645	Phage antirepressor protein YoqD, KilAC domain
+NC_009012.1|provirus_1938476_1983993_1738	1975291	1977213	1923	-1	0.440	11	AGGAG	GENOMAD.140318.VC	1.003e-23	110	0	0	0	2561	Caudoviricetes	NA	NA	PF00476;COG0749;TIGR00593	DNA polymerase I - 3'-5' exonuclease and polymerase domains
+NC_009012.1|provirus_1938476_1983993_1739	1977271	1978023	753	-1	0.467	11	GGAGG	GENOMAD.211539.VV	6.84e-47	171	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1740	1978145	1978585	441	-1	0.469	11	AGGAG	GENOMAD.026103.VV	4.552e-65	218	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1741	1978551	1979909	1359	-1	0.444	11	None	GENOMAD.003266.VV	2.422e-23	107	0	0	0	2561	Caudoviricetes	NA	NA	PF00176;K14440;COG1061;TIGR04095	Superfamily II DNA or RNA helicase
+NC_009012.1|provirus_1938476_1983993_1742	1979876	1980058	183	-1	0.454	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1743	1980282	1982201	1920	-1	0.369	11	GGAGG	GENOMAD.213960.VV	1.039e-08	61	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1744	1982360	1982566	207	1	0.343	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_1938476_1983993_1745	1983046	1983993	948	-1	0.397	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1786	2022140	2023468	1329	-1	0.340	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1787	2023413	2024702	1290	-1	0.350	11	AGxAGG/AGGxGG	GENOMAD.022372.VV	2.322e-18	91	0	0	1	2561	Caudoviricetes	NA	NA	PF04708;COG1961;K14060	Site-specific DNA recombinase related to the DNA invertase Pin
+NC_009012.1|provirus_2022140_2067593_1788	2024803	2025474	672	-1	0.368	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1789	2025494	2025979	486	-1	0.340	11	AGGAGG	GENOMAD.170412.VP	4.718e-05	45	0	0	1	2561	Caudoviricetes	NA	NA	PF03354;COG4626	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_009012.1|provirus_2022140_2067593_1790	2025972	2026382	411	-1	0.353	11	GGAGG	GENOMAD.083633.VV	5.663e-05	44	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1791	2026399	2028087	1689	-1	0.325	11	GGAG/GAGG	GENOMAD.068767.VV	1.613e-200	632	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1792	2028099	2029256	1158	-1	0.335	11	AGxAGG/AGGxGG	GENOMAD.222380.VP	5.366e-06	51	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1793	2029269	2031173	1905	-1	0.332	11	GGxGG	GENOMAD.004340.VV	1.903e-153	499	0	0	1	2561	Caudoviricetes	NA	NA	PF06605;PF18994;COG4926;TIGR01665	Phage-related protein
+NC_009012.1|provirus_2022140_2067593_1794	2031173	2031877	705	-1	0.296	11	GGxGG	GENOMAD.004006.VV	7.585e-128	404	0	0	0	2561	Caudoviricetes	NA	NA	PF20195;COG4722;TIGR01633	Phage-related protein
+NC_009012.1|provirus_2022140_2067593_1795	2031877	2034156	2280	-1	0.357	11	GGAGG	GENOMAD.089120.VP	5.755e-58	220	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1796	2034172	2034297	126	-1	0.333	11	4Base/6BMM	GENOMAD.202970.VV	1.546e-18	78	0	0	1	1	NA	NA	NA	PF09550;TIGR02216	NA
+NC_009012.1|provirus_2022140_2067593_1797	2034366	2034689	324	-1	0.306	11	AGGAG	GENOMAD.136836.VV	3.52e-41	147	0	0	0	2561	Caudoviricetes	NA	NA	PF16478	Phage tail tube protein, GTA-gp10
+NC_009012.1|provirus_2022140_2067593_1798	2034818	2035258	441	-1	0.306	11	GGA/GAG/AGG	GENOMAD.053493.CC	5.322e-30	117	0	0	0	1	NA	NA	NA	PF14101	NA
+NC_009012.1|provirus_2022140_2067593_1799	2035656	2036699	1044	-1	0.345	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1800	2036776	2036883	108	-1	0.204	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1801	2037023	2037595	573	-1	0.356	11	GGA/GAG/AGG	GENOMAD.013991.VV	6.347e-57	197	0	0	1	2561	Caudoviricetes	NA	NA	PF04630;TIGR01603	phage major tail protein, phi13 family
+NC_009012.1|provirus_2022140_2067593_1802	2037598	2037927	330	-1	0.294	11	GGA/GAG/AGG	GENOMAD.018077.VV	2.114e-47	165	0	0	0	2561	Caudoviricetes	NA	NA	PF05657	NA
+NC_009012.1|provirus_2022140_2067593_1803	2037924	2038316	393	-1	0.356	11	GGAGG	GENOMAD.066487.VV	1.944e-66	221	0	0	1	2561	Caudoviricetes	NA	NA	TIGR01725;COG5005	phage protein, HK97 gp10 family
+NC_009012.1|provirus_2022140_2067593_1804	2038309	2038635	327	-1	0.318	11	GGA/GAG/AGG	GENOMAD.124210.VP	2.543e-21	90	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;COG5614;TIGR01563	Bacteriophage head-tail adaptor
+NC_009012.1|provirus_2022140_2067593_1805	2038632	2039231	600	-1	0.330	11	AGGAG	GENOMAD.158311.VV	2.792e-34	132	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR02215	phage conserved hypothetical protein, phiE125 gp8 family
+NC_009012.1|provirus_2022140_2067593_1806	2039246	2039686	441	-1	0.329	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1807	2039699	2040988	1290	-1	0.367	11	AGGA	GENOMAD.093418.VV	2.924e-30	128	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;TIGR01554;COG4653	phage major capsid protein, HK97 family
+NC_009012.1|provirus_2022140_2067593_1808	2041016	2041759	744	-1	0.344	11	AGGA	GENOMAD.158277.VP	2.322e-25	108	0	0	0	2561	Caudoviricetes	NA	NA	PF00574;PF19602;K01358;TIGR00493;COG3904	ATP-dependent Clp endopeptidase, proteolytic subunit ClpP
+NC_009012.1|provirus_2022140_2067593_1809	2041764	2043023	1260	-1	0.352	11	AGGAGG	GENOMAD.179073.VP	1.345e-39	156	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1810	2043035	2045584	2550	-1	0.349	11	AGGAGG	GENOMAD.181434.VP	3.417e-57	219	0	0	1	2561	Caudoviricetes	NA	NA	PF20441	Terminase large subunit, endonuclease domain
+NC_009012.1|provirus_2022140_2067593_1811	2045577	2046059	483	-1	0.400	11	AGGAGG	GENOMAD.168120.VP	3.555e-12	66	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_009012.1|provirus_2022140_2067593_1812	2046118	2046333	216	-1	0.329	11	4Base/6BMM	GENOMAD.225559.VP	4.489e-15	70	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1813	2046326	2047078	753	-1	0.325	11	GGAGG	GENOMAD.105515.VV	2.253e-07	54	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1814	2047192	2047503	312	-1	0.356	11	GGAGG	GENOMAD.224340.VP	3.569e-39	141	0	0	0	1	NA	NA	NA	PF19854	NA
+NC_009012.1|provirus_2022140_2067593_1815	2047574	2048053	480	-1	0.327	11	GGxGG	GENOMAD.191984.VP	1.926e-08	55	0	0	0	2561	Caudoviricetes	NA	NA	PF07128	NA
+NC_009012.1|provirus_2022140_2067593_1816	2048198	2049121	924	-1	0.379	11	GGA/GAG/AGG	GENOMAD.105515.VV	2.991e-05	48	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1817	2049221	2050672	1452	-1	0.390	11	GGA/GAG/AGG	GENOMAD.136632.VV	1.346e-08	60	0	0	0	2561	Caudoviricetes	NA	NA	PF00145;TIGR00675;K00558;COG0270	DNA-methyltransferase (dcm)
+NC_009012.1|provirus_2022140_2067593_1818	2050674	2051909	1236	-1	0.358	11	GGAGG	GENOMAD.038338.VV	2.311e-33	137	0	0	0	2561	Caudoviricetes	NA	NA	COG3392	NA
+NC_009012.1|provirus_2022140_2067593_1819	2051914	2052339	426	-1	0.350	11	AGGAGG	GENOMAD.133740.VV	1.401e-16	78	0	0	0	2561	Caudoviricetes	NA	NA	PF07750;COG5352;K13583;TIGR00721	GcrA cell cycle regulator
+NC_009012.1|provirus_2022140_2067593_1820	2052752	2053132	381	-1	0.404	11	GGAGG	GENOMAD.208831.VV	4.697e-14	70	0	0	0	2561	Caudoviricetes	NA	NA	PF13395	HNH endonuclease
+NC_009012.1|provirus_2022140_2067593_1821	2053313	2053558	246	-1	0.260	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1822	2053627	2054031	405	-1	0.304	11	AGGAGG	GENOMAD.159035.VP	6.65e-39	142	0	0	0	2561	Caudoviricetes	NA	NA	PF07374;TIGR01636;COG2739	phage transcriptional activator, RinA family
+NC_009012.1|provirus_2022140_2067593_1823	2054033	2054335	303	-1	0.340	11	AGxAGG/AGGxGG	GENOMAD.212426.VP	1.787e-21	90	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1824	2054533	2056407	1875	-1	0.297	11	AGxAGG/AGGxGG	GENOMAD.024099.VV	3.13e-70	254	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1825	2056608	2058299	1692	-1	0.303	11	GGAG/GAGG	GENOMAD.102034.VP	2.393e-111	373	0	0	0	2561	Caudoviricetes	NA	NA	TIGR01636	NA
+NC_009012.1|provirus_2022140_2067593_1826	2058302	2058760	459	-1	0.316	11	AGGAGG	GENOMAD.031678.VV	2.327e-33	127	0	0	0	2561	Caudoviricetes	NA	NA	PF05037	NA
+NC_009012.1|provirus_2022140_2067593_1827	2058779	2060209	1431	-1	0.311	11	GGA/GAG/AGG	GENOMAD.016341.VV	4.675e-134	435	0	0	1	2561	Caudoviricetes	NA	NA	PF13479;PF12684;TIGR01618;K07465;COG1468	phage nucleotide-binding protein
+NC_009012.1|provirus_2022140_2067593_1828	2060293	2060658	366	-1	0.314	11	AGGAG	GENOMAD.010330.VV	1.124e-51	178	0	0	0	2561	Caudoviricetes	NA	NA	PF03838;COG3331;TIGR00648	Recombination protein U
+NC_009012.1|provirus_2022140_2067593_1829	2060655	2061833	1179	-1	0.314	11	GGA/GAG/AGG	GENOMAD.014802.VV	1.234e-10	66	0	0	0	2561	Caudoviricetes	NA	NA	PF00176;K20093;COG1061;TIGR04095	Superfamily II DNA or RNA helicase
+NC_009012.1|provirus_2022140_2067593_1830	2061823	2061912	90	-1	0.367	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1831	2061942	2062706	765	-1	0.319	11	GGAGG	GENOMAD.171549.VP	1.527e-13	73	0	0	0	2561	Caudoviricetes	NA	NA	COG3617	Prophage antirepressor
+NC_009012.1|provirus_2022140_2067593_1832	2062722	2062973	252	-1	0.286	11	AGGAGG	GENOMAD.222352.VV	3.867e-07	48	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1833	2062994	2063317	324	-1	0.340	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1834	2063536	2063763	228	-1	0.272	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1835	2063973	2064683	711	-1	0.336	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1836	2064700	2065068	369	-1	0.271	11	GGAGG	GENOMAD.213960.VV	6.573e-66	219	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1837	2065083	2065463	381	-1	0.333	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1838	2065520	2066308	789	-1	0.324	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1839	2066610	2067026	417	-1	0.312	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2022140_2067593_1840	2067186	2067593	408	1	0.350	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2581	2931283	2932395	1113	-1	0.436	11	AGGAGG	GENOMAD.016861.VV	8.63e-05	47	0	0	0	2561	Caudoviricetes	NA	NA	PF13671;COG2019;TIGR01359;K13829	AAA domain
+NC_009012.1|provirus_2931283_2970170_2582	2932453	2932875	423	-1	0.350	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2583	2932954	2933160	207	1	0.406	11	GGxGG	GENOMAD.087773.VV	6.92e-17	75	0	0	0	2561	Caudoviricetes	NA	NA	PF14083	PGDYG protein
+NC_009012.1|provirus_2931283_2970170_2584	2933136	2933600	465	-1	0.353	11	AGxAGG/AGGxGG	GENOMAD.170160.VC	7.688e-09	56	0	0	0	2561	Caudoviricetes	NA	NA	PF18184	SMODS and SLOG-associating 2TM effector domain 3
+NC_009012.1|provirus_2931283_2970170_2585	2933630	2934070	441	-1	0.401	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2586	2934086	2934514	429	-1	0.408	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2587	2934642	2934881	240	1	0.358	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2588	2934900	2935646	747	1	0.383	11	AGxAGG/AGGxGG	GENOMAD.132419.VP	5.435e-24	104	0	0	0	2561	Caudoviricetes	NA	NA	PF03374;COG3645	Phage antirepressor protein YoqD, KilAC domain
+NC_009012.1|provirus_2931283_2970170_2589	2935649	2935867	219	1	0.507	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2590	2935963	2936175	213	1	0.460	11	AGxAGG/AGGxGG	GENOMAD.209016.VC	1.289e-41	146	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2591	2936162	2936335	174	1	0.477	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2592	2936351	2936569	219	1	0.411	11	GGA/GAG/AGG	GENOMAD.088748.VV	2.403e-36	131	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2593	2936562	2937113	552	1	0.404	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2594	2937114	2938019	906	1	0.429	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2595	2938109	2938396	288	1	0.444	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2596	2938386	2938574	189	1	0.450	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2597	2938591	2939673	1083	1	0.437	11	GGAGG	GENOMAD.021533.VV	5.011e-133	426	0	0	1	2561	Caudoviricetes	NA	NA	TIGR01714	phage replisome organizer, putative, N-terminal region
+NC_009012.1|provirus_2931283_2970170_2598	2939670	2940506	837	1	0.458	11	GGAGG	GENOMAD.034827.VV	1.47e-07	55	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2599	2940508	2940882	375	1	0.477	11	GGAG/GAGG	GENOMAD.151656.VP	2.586e-44	157	0	0	1	2561	Caudoviricetes	NA	NA	PF17288;K06909;TIGR01547;COG1783	phage terminase, large subunit, PBSX family
+NC_009012.1|provirus_2931283_2970170_2600	2940930	2941352	423	1	0.414	11	AGxAGG/AGGxGG	GENOMAD.221128.VP	8.436e-64	214	0	0	0	2561	Caudoviricetes	NA	NA	PF05263;TIGR01636;COG2739	phage transcriptional activator, RinA family
+NC_009012.1|provirus_2931283_2970170_2601	2941501	2941743	243	1	0.374	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2602	2941811	2942653	843	1	0.323	11	GGAG/GAGG	GENOMAD.178342.VP	1.96e-33	133	0	0	0	2561	Caudoviricetes	NA	NA	PF02086;PF06576;PF06147;K21507;TIGR00571;COG0338	DNA adenine methylase (dam)
+NC_009012.1|provirus_2931283_2970170_2603	2942646	2943926	1281	1	0.304	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2604	2944119	2944964	846	1	0.301	11	AGGAGG	GENOMAD.225783.VP	6.425e-63	219	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2605	2945034	2945183	150	1	0.280	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2606	2945216	2945665	450	1	0.413	11	GGA/GAG/AGG	GENOMAD.026460.VV	5.098e-23	97	0	0	1	2561	Caudoviricetes	NA	NA	PF03592;COG3728;K07474	Phage terminase, small subunit
+NC_009012.1|provirus_2931283_2970170_2607	2945652	2946899	1248	1	0.421	11	AGxAG	GENOMAD.141197.VP	5.699e-78	269	0	0	1	2561	Caudoviricetes	NA	NA	PF17288;K06909;TIGR01547;COG1783	Terminase RNAseH like domain
+NC_009012.1|provirus_2931283_2970170_2608	2946915	2948348	1434	1	0.371	11	AGxAGG/AGGxGG	GENOMAD.006049.VV	7.501e-107	356	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2609	2948345	2948494	150	1	0.340	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2610	2948505	2949914	1410	1	0.362	11	AGxAGG/AGGxGG	GENOMAD.003968.VV	2.731e-31	132	0	0	1	2561	Caudoviricetes	NA	NA	PF06152;COG5585;TIGR01641	NAD+--asparagine ADP-ribosyltransferase
+NC_009012.1|provirus_2931283_2970170_2611	2949911	2950117	207	1	0.348	11	AGGAG	GENOMAD.066155.VV	6.191e-11	58	0	0	0	2561	Caudoviricetes	NA	NA	PF06372	NA
+NC_009012.1|provirus_2931283_2970170_2612	2950161	2950847	687	1	0.339	11	None	GENOMAD.007545.VV	1.038e-29	120	0	0	0	2561	Caudoviricetes	NA	NA	PF06810	Phage minor structural protein GP20
+NC_009012.1|provirus_2931283_2970170_2613	2950866	2951789	924	1	0.394	11	AGGAG	GENOMAD.092843.VP	1.736e-163	511	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2614	2951802	2951948	147	1	0.388	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2615	2951926	2952327	402	1	0.443	11	AGGA/GGAG/GAGG	GENOMAD.047671.VV	6.175e-72	237	0	0	0	2561	Caudoviricetes	NA	NA	PF11436	NA
+NC_009012.1|provirus_2931283_2970170_2616	2952324	2952659	336	1	0.464	11	GGAGG	GENOMAD.074010.VV	3.139e-52	179	0	0	0	2561	Caudoviricetes	NA	NA	PF12206	NA
+NC_009012.1|provirus_2931283_2970170_2617	2952656	2953066	411	1	0.416	11	GGxGG	GENOMAD.019155.VV	1.438e-72	239	0	0	1	2561	Caudoviricetes	NA	NA	PF11114;TIGR01725	phage protein, HK97 gp10 family
+NC_009012.1|provirus_2931283_2970170_2618	2953056	2953475	420	1	0.438	11	4Base/6BMM	GENOMAD.025660.VV	2.016e-70	233	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2619	2953638	2954927	1290	-1	0.420	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2620	2955379	2956425	1047	1	0.393	11	AGGAG	GENOMAD.118787.VV	2.086e-155	490	0	0	1	2561	Caudoviricetes	NA	NA	PF04984;PF17482;COG3497	Phage tail sheath protein subtilisin-like domain; Phage tail sheath C-terminal domain
+NC_009012.1|provirus_2931283_2970170_2621	2956446	2956922	477	1	0.392	11	AGGAGG	GENOMAD.018728.VV	4.047e-72	239	0	0	1	2561	Caudoviricetes	NA	NA	PF09393	Phage tail tube protein
+NC_009012.1|provirus_2931283_2970170_2622	2956939	2957352	414	1	0.377	11	GGAG/GAGG	GENOMAD.009389.VV	1.083e-59	202	0	0	1	2561	Caudoviricetes	NA	NA	PF08890;PF17482	Phage XkdN-like tail assembly chaperone protein, TAC; Phage tail sheath C-terminal domain
+NC_009012.1|provirus_2931283_2970170_2623	2957352	2957543	192	1	0.391	11	3Base/5BMM	GENOMAD.059912.VV	9.647e-19	80	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2624	2957545	2959380	1836	1	0.406	11	AGxAGG/AGGxGG	GENOMAD.118787.VV	2.585e-124	413	0	0	1	2561	Caudoviricetes	NA	NA	PF04984;PF17482;COG3497	Phage tail sheath protein subtilisin-like domain; Phage tail sheath C-terminal domain
+NC_009012.1|provirus_2931283_2970170_2625	2959377	2960036	660	1	0.374	11	AGxAGG/AGGxGG	GENOMAD.017357.VV	6.647e-18	85	0	0	0	2561	Caudoviricetes	NA	NA	PF06995;COG1652	Nucleoid-associated protein YgaU, contains BON and LysM domains
+NC_009012.1|provirus_2931283_2970170_2626	2960033	2960977	945	1	0.403	11	3Base/5BMM	GENOMAD.018966.VV	1.564e-77	263	0	0	1	2561	Caudoviricetes	NA	NA	PF14594;COG4379;TIGR03361;K06905	Mu-like prophage tail protein gpP
+NC_009012.1|provirus_2931283_2970170_2627	2960974	2961207	234	1	0.427	11	GGA/GAG/AGG	GENOMAD.096038.VV	2.254e-39	140	0	0	0	2561	Caudoviricetes	NA	NA	PF10844	NA
+NC_009012.1|provirus_2931283_2970170_2628	2961204	2961599	396	1	0.376	11	GGAGG	GENOMAD.016318.VV	1.625e-52	181	0	0	0	2561	Caudoviricetes	NA	NA	PF10934;COG4381;TIGR03357	Mu-like prophage protein gp46
+NC_009012.1|provirus_2931283_2970170_2629	2961599	2962657	1059	1	0.432	11	GGAGG	GENOMAD.004833.VV	7.052e-52	190	0	0	1	2561	Caudoviricetes	NA	NA	PF04865;COG3299	Baseplate J-like protein
+NC_009012.1|provirus_2931283_2970170_2630	2962647	2963249	603	1	0.420	11	GGA/GAG/AGG	GENOMAD.015577.VV	8.917e-17	81	0	0	1	2561	Caudoviricetes	NA	NA	PF10076;COG3778;TIGR02242	Uncharacterized protein YmfQ in lambdoid prophage, DUF2313 family
+NC_009012.1|provirus_2931283_2970170_2631	2963259	2963543	285	1	0.407	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2632	2963546	2964928	1383	1	0.513	11	AGGAGG	GENOMAD.087125.VV	1.015e-11	70	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2633	2964993	2965253	261	1	0.402	11	AGGA	GENOMAD.213587.VP	4.024e-30	114	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2634	2965254	2965406	153	1	0.386	11	AGGAG	GENOMAD.065816.VV	5.681e-11	57	0	0	0	2561	Caudoviricetes	NA	NA	PF09693;TIGR01669	phage uncharacterized protein, XkdX family
+NC_009012.1|provirus_2931283_2970170_2635	2965495	2965785	291	1	0.354	11	AGxAGG/AGGxGG	GENOMAD.171716.VV	1.182e-08	53	0	0	0	1	NA	NA	NA	PF07439	NA
+NC_009012.1|provirus_2931283_2970170_2636	2965801	2966457	657	1	0.482	11	AGxAGG/AGGxGG	GENOMAD.220135.VV	1.55e-13	72	0	0	0	2561	Caudoviricetes	NA	NA	COG5632	N-acetylmuramoyl-L-alanine amidase CwlA
+NC_009012.1|provirus_2931283_2970170_2637	2966597	2966896	300	1	0.450	11	GGAGG	GENOMAD.151236.VC	1.963e-43	153	0	0	1	1	NA	NA	NA	PF06946	Bacteriophage A118-like holin, Hol118
+NC_009012.1|provirus_2931283_2970170_2638	2967070	2967705	636	1	0.332	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2639	2967690	2968121	432	1	0.315	11	AGGAGG	GENOMAD.206152.VV	2.957e-68	227	0	0	0	1	NA	NA	NA	PF01845;COG2337;K07171	mRNA-degrading endonuclease, toxin component of the MazEF toxin-antitoxin module
+NC_009012.1|provirus_2931283_2970170_2640	2968641	2969126	486	1	0.440	11	AGGAG/GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2641	2969366	2969530	165	1	0.352	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_2931283_2970170_2642	2969562	2970170	609	1	0.417	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2977	3339258	3339497	240	1	0.429	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2978	3339748	3340554	807	1	0.446	11	AGGAGG	GENOMAD.197438.VP	4.39e-23	102	0	0	0	2561	Caudoviricetes	NA	NA	PF09250	Bifunctional DNA primase/polymerase, N-terminal
+NC_009012.1|provirus_3339258_3389049_2979	3340946	3342793	1848	1	0.414	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2980	3342816	3344054	1239	1	0.348	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2981	3344263	3344400	138	1	0.333	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2982	3344462	3344791	330	1	0.382	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2983	3344804	3345274	471	1	0.376	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2984	3345548	3345952	405	-1	0.410	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2985	3346045	3346803	759	-1	0.451	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2986	3346803	3348287	1485	-1	0.436	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2987	3348393	3349109	717	-1	0.392	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2988	3349682	3350029	348	1	0.405	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2989	3350172	3351857	1686	1	0.419	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2990	3351870	3352448	579	1	0.304	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2991	3352630	3353019	390	1	0.415	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2992	3353012	3353149	138	1	0.406	11	GGxGG	GENOMAD.223510.VP	6.369e-08	48	0	0	0	1	NA	NA	NA	PF10122;TIGR04104;COG4530	Mu-like prophage protein Com
+NC_009012.1|provirus_3339258_3389049_2993	3353530	3354081	552	1	0.457	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2994	3354477	3356318	1842	1	0.410	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2995	3356345	3357583	1239	1	0.350	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2996	3358087	3358431	345	1	0.336	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2997	3358458	3358892	435	1	0.315	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2998	3358867	3359211	345	1	0.397	11	AGxAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_2999	3359399	3359644	246	1	0.435	11	4Base/6BMM	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3000	3360040	3360228	189	1	0.370	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3001	3360466	3361671	1206	1	0.440	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3002	3361685	3361972	288	1	0.292	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3003	3362170	3362559	390	1	0.441	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3004	3362549	3362689	141	1	0.440	11	GGAGG	GENOMAD.223510.VP	2.986e-08	49	0	0	0	1	NA	NA	NA	PF10122;TIGR04104;COG4530	Mu-like prophage protein Com
+NC_009012.1|provirus_3339258_3389049_3005	3362816	3364975	2160	1	0.468	11	AGGAGG	GENOMAD.169139.VV	4.569e-22	105	0	0	0	2561	Caudoviricetes	NA	NA	PF09250	Bifunctional DNA primase/polymerase, N-terminal
+NC_009012.1|provirus_3339258_3389049_3006	3365247	3366560	1314	1	0.453	11	GGAGG	GENOMAD.093418.VV	1.24e-13	76	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;TIGR01554;COG4653	phage major capsid protein, HK97 family
+NC_009012.1|provirus_3339258_3389049_3007	3366819	3367121	303	1	0.432	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3008	3367461	3368705	1245	1	0.441	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3009	3369138	3369425	288	1	0.299	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3010	3369641	3369937	297	1	0.434	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3011	3370188	3370994	807	1	0.454	11	AGGAGG	GENOMAD.197438.VP	2.102e-21	97	0	0	0	2561	Caudoviricetes	NA	NA	PF09250	Bifunctional DNA primase/polymerase, N-terminal
+NC_009012.1|provirus_3339258_3389049_3012	3371390	3373237	1848	1	0.403	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3013	3373261	3374499	1239	1	0.351	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3014	3374708	3375235	528	1	0.358	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3015	3375248	3375718	471	1	0.374	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3016	3375991	3377127	1137	-1	0.403	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3017	3377700	3378047	348	1	0.408	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3018	3378190	3378969	780	1	0.442	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3019	3378971	3379900	930	1	0.413	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3020	3379902	3380144	243	1	0.358	11	GGxGG	GENOMAD.227820.VP	6.79e-08	50	0	0	0	1	NA	NA	NA	PF15597	Immunity protein 59
+NC_009012.1|provirus_3339258_3389049_3021	3380249	3380851	603	1	0.274	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3022	3381065	3382069	1005	1	0.392	11	3Base/5BMM	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3023	3382076	3382312	237	1	0.308	11	AGGAGG	GENOMAD.218640.VC	3.123e-07	48	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3024	3382430	3382819	390	1	0.428	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3025	3382812	3382949	138	1	0.399	11	GGAGG	GENOMAD.223510.VP	6.369e-08	48	0	0	0	1	NA	NA	NA	PF10122;TIGR04104;COG4530	Mu-like prophage protein Com
+NC_009012.1|provirus_3339258_3389049_3026	3383070	3385229	2160	1	0.468	11	AGGAGG	GENOMAD.169139.VV	2.257e-22	106	0	0	0	2561	Caudoviricetes	NA	NA	PF09250	Bifunctional DNA primase/polymerase, N-terminal
+NC_009012.1|provirus_3339258_3389049_3027	3385500	3386813	1314	1	0.451	11	GGAGG	GENOMAD.093418.VV	6.053e-14	77	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;TIGR01554;COG4653	phage major capsid protein, HK97 family
+NC_009012.1|provirus_3339258_3389049_3028	3387138	3387440	303	1	0.436	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_009012.1|provirus_3339258_3389049_3029	3387805	3389049	1245	1	0.449	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_012982.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014008.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014168.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,99 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_014168.1|provirus_27479_67296_28	27479	28375	897	1	0.672	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_29	28372	28920	549	1	0.667	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_30	28917	29114	198	1	0.712	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_31	29111	29863	753	1	0.671	11	GGAG/GAGG	GENOMAD.032144.VV	1.48e-35	138	0	0	0	2561	Caudoviricetes	NA	NA	PF12684	NA
+NC_014168.1|provirus_27479_67296_32	29860	30516	657	1	0.658	11	GGA/GAG/AGG	GENOMAD.124252.VP	2.931e-32	127	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;TIGR01913	phage recombination protein Bet
+NC_014168.1|provirus_27479_67296_33	30516	30917	402	1	0.649	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_34	30923	31276	354	1	0.638	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_35	31280	31432	153	1	0.660	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_36	31426	31845	420	1	0.662	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_37	31842	32357	516	1	0.698	11	GGAG/GAGG	GENOMAD.033304.VV	2.452e-10	61	0	0	0	2561	Caudoviricetes	NA	NA	PF13395	NA
+NC_014168.1|provirus_27479_67296_38	32357	33292	936	1	0.661	11	GGxGG	GENOMAD.028141.VV	1.19e-25	111	0	0	1	2561	Caudoviricetes	NA	NA	PF09681;TIGR01714	N-terminal phage replisome organiser (Phage_rep_org_N)
+NC_014168.1|provirus_27479_67296_39	33289	33654	366	1	0.658	11	GGAGG	GENOMAD.087217.VV	8.175e-05	43	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_40	33651	34037	387	1	0.674	11	AGGAG	GENOMAD.018151.VV	4.881e-23	96	0	0	0	2561	Caudoviricetes	NA	NA	PF01870;COG1591	Holliday junction resolvase, archaeal type
+NC_014168.1|provirus_27479_67296_41	34034	34234	201	1	0.672	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_42	34231	34542	312	1	0.670	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_43	34539	34751	213	1	0.596	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_44	34748	34984	237	1	0.578	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_45	35011	35331	321	1	0.617	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_46	35328	35798	471	1	0.620	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_47	35795	36223	429	1	0.653	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_48	36220	36798	579	1	0.585	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_49	36795	37106	312	1	0.647	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_50	37103	37882	780	1	0.663	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_51	37879	38100	222	1	0.676	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_52	38249	40009	1761	1	0.681	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_53	40017	40673	657	1	0.636	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_54	40670	40990	321	1	0.632	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_55	41205	41459	255	1	0.663	11	GGAGG	GENOMAD.083226.VV	1.61e-08	52	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_56	41512	41895	384	1	0.620	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_57	41892	42371	480	1	0.640	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_58	42274	42642	369	-1	0.672	11	AGGAG	GENOMAD.215374.PC	1.387e-08	54	0	0	0	1	NA	NA	NA	PF13827	NA
+NC_014168.1|provirus_27479_67296_59	42807	43085	279	1	0.674	11	AGGAG	GENOMAD.014408.VV	1.177e-14	70	0	0	0	2561	Caudoviricetes	NA	NA	PF13395;TIGR02646	HNH endonuclease
+NC_014168.1|provirus_27479_67296_60	43082	43267	186	1	0.602	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_61	43504	43767	264	1	0.655	11	AGGAG	GENOMAD.047538.VV	9.427e-15	70	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_62	43751	45166	1416	1	0.663	11	AGGAG/GGAGG	GENOMAD.002060.VV	1.733e-134	436	0	0	1	2561	Caudoviricetes	NA	NA	PF20441;PF04466;COG4626;TIGR01547;K06909	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014168.1|provirus_27479_67296_63	45190	46566	1377	1	0.687	11	GGAGG	GENOMAD.080886.VV	1.496e-47	181	0	0	1	2561	Caudoviricetes	NA	NA	PF05133;TIGR01538	phage portal protein, SPP1 family
+NC_014168.1|provirus_27479_67296_64	46550	47233	684	1	0.697	11	GGAG/GAGG	GENOMAD.097054.VV	4.565e-30	121	0	0	1	2561	Caudoviricetes	NA	NA	PF04233;TIGR01641	phage putative head morphogenesis protein, SPP1 gp7 family
+NC_014168.1|provirus_27479_67296_65	47285	47761	477	1	0.644	11	GGA/GAG/AGG	GENOMAD.040462.VV	2.062e-54	188	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_66	47788	48696	909	1	0.636	11	GGAG/GAGG	GENOMAD.013023.VV	2.718e-53	192	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;TIGR01554;COG4653	phage major capsid protein, HK97 family
+NC_014168.1|provirus_27479_67296_67	48696	48869	174	1	0.724	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_68	48841	49308	468	1	0.686	11	GGAG/GAGG	GENOMAD.062537.VV	2.534e-42	153	0	0	1	2561	Caudoviricetes	NA	NA	PF09355	Phage protein Gp19/Gp15/Gp42
+NC_014168.1|provirus_27479_67296_69	49305	49646	342	1	0.702	11	None	GENOMAD.038727.VV	1.417e-21	91	0	0	1	2561	Caudoviricetes	NA	NA	PF12206;COG5614;TIGR01563	Minor capsid protein
+NC_014168.1|provirus_27479_67296_70	49647	49955	309	1	0.673	11	GGAGG	GENOMAD.087122.VV	2.723e-10	58	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_71	49959	50357	399	1	0.714	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_72	50395	51042	648	1	0.657	11	AGGA	GENOMAD.004252.VV	6.372e-16	79	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_73	51039	51371	333	1	0.658	11	GGA/GAG/AGG	GENOMAD.187636.VV	2.624e-05	44	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_74	51380	51763	384	1	0.693	11	3Base/5BMM	GENOMAD.056037.VV	4.163e-06	47	0	0	0	2561	Caudoviricetes	NA	NA	PF17318;PF08765;TIGR02417	Mor transcription activator family
+NC_014168.1|provirus_27479_67296_75	51744	55466	3723	1	0.706	11	AGGAG	GENOMAD.016295.VV	2.211e-48	193	0	0	0	2561	Caudoviricetes	NA	NA	COG3953	SLT domain protein
+NC_014168.1|provirus_27479_67296_76	55466	56728	1263	1	0.678	11	GGAGG	GENOMAD.053786.VV	4.118e-58	211	0	0	0	2561	Caudoviricetes	NA	NA	COG4722	Phage-related protein
+NC_014168.1|provirus_27479_67296_77	56728	58500	1773	1	0.679	11	GGA/GAG/AGG	GENOMAD.019112.VV	3.356e-155	502	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_78	58500	58751	252	1	0.675	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_79	58751	59812	1062	1	0.658	11	GGAGG	GENOMAD.059914.VV	2.914e-67	235	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_80	59814	61079	1266	1	0.682	11	None	GENOMAD.079434.VV	5.593e-20	96	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_81	61144	62403	1260	1	0.683	11	AGGAG	GENOMAD.047467.VV	2.371e-19	94	0	0	0	2561	Caudoviricetes	NA	NA	COG5632	N-acetylmuramoyl-L-alanine amidase CwlA
+NC_014168.1|provirus_27479_67296_82	62400	62756	357	1	0.669	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_83	62756	63031	276	1	0.656	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_84	63031	63237	207	1	0.705	11	GGxGG	GENOMAD.158505.VV	1.14e-05	43	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_85	63230	63589	360	1	0.689	11	AGGAG	GENOMAD.073706.VV	2.772e-08	53	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_86	63716	64087	372	-1	0.570	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_87	64298	64633	336	-1	0.560	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_88	64630	64902	273	-1	0.615	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_89	64902	66164	1263	-1	0.621	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_27479_67296_90	66247	67296	1050	-1	0.604	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1152	1141631	1141948	318	-1	0.736	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1153	1142010	1142369	360	-1	0.742	11	GGA/GAG/AGG	GENOMAD.082050.VV	3.69e-22	93	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1154	1142366	1142698	333	-1	0.685	11	GGA/GAG/AGG	GENOMAD.076859.VV	2.776e-13	67	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1155	1142709	1143020	312	-1	0.740	11	AGGAGG	GENOMAD.103239.VV	2.089e-13	67	0	0	1	2561	Caudoviricetes	NA	NA	PF10665;TIGR01563;COG5614	Minor capsid protein
+NC_014168.1|provirus_1141631_1162952_1156	1143056	1143292	237	1	0.633	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1157	1143298	1143807	510	-1	0.716	11	GGAG/GAGG	GENOMAD.028700.VV	2.384e-22	96	0	0	0	2561	Caudoviricetes	NA	NA	TIGR02215	phage conserved hypothetical protein, phiE125 gp8 family
+NC_014168.1|provirus_1141631_1162952_1158	1143813	1144004	192	-1	0.609	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1159	1144022	1145302	1281	-1	0.680	11	AGGAG	GENOMAD.098207.VP	2.112e-87	297	0	0	1	2561	Caudoviricetes	NA	NA	PF06673;TIGR01554;COG1659	Lactococcus lactis bacteriophage major capsid protein
+NC_014168.1|provirus_1141631_1162952_1160	1145299	1145991	693	-1	0.700	11	AGGAG	GENOMAD.207278.VV	3.963e-19	89	0	0	1	2561	Caudoviricetes	NA	NA	PF04586;COG3740;K06904;TIGR01543	Phage head maturation protease
+NC_014168.1|provirus_1141631_1162952_1161	1145948	1147249	1302	-1	0.707	11	GGAG/GAGG	GENOMAD.138175.VV	2.9e-86	294	0	0	1	2561	Caudoviricetes	NA	NA	PF04860;TIGR01537;COG4695	phage portal protein, HK97 family
+NC_014168.1|provirus_1141631_1162952_1162	1147274	1148770	1497	-1	0.707	11	GGAGG	GENOMAD.037086.VV	2.935e-120	396	0	0	1	2561	Caudoviricetes	NA	NA	PF20441;PF03354;COG4626;TIGR01547	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014168.1|provirus_1141631_1162952_1163	1148787	1149077	291	-1	0.735	11	GGAG/GAGG	GENOMAD.064187.VV	3.239e-06	46	0	0	1	2561	Caudoviricetes	NA	NA	TIGR01558	NA
+NC_014168.1|provirus_1141631_1162952_1164	1149335	1149841	507	1	0.677	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1165	1150029	1150580	552	1	0.661	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1166	1150720	1151001	282	-1	0.645	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1167	1151045	1151320	276	-1	0.703	11	None	GENOMAD.041582.VV	4.527e-16	74	0	0	0	2561	Caudoviricetes	NA	NA	PF13395;TIGR02646	TIGR02646 family protein
+NC_014168.1|provirus_1141631_1162952_1168	1151326	1152444	1119	-1	0.718	11	GGAGG	GENOMAD.064801.VV	2.016e-15	81	0	0	0	2561	Caudoviricetes	NA	NA	PF00145;TIGR00675;COG0270;K15336	DNA-methyltransferase (dcm)
+NC_014168.1|provirus_1141631_1162952_1169	1152853	1153509	657	-1	0.702	11	AGGAG	GENOMAD.066690.VV	1.852e-101	327	0	0	0	2561	Caudoviricetes	NA	NA	PF10122;COG5349;TIGR01206	Uncharacterized conserved protein, DUF983 family
+NC_014168.1|provirus_1141631_1162952_1170	1153506	1153754	249	-1	0.683	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1171	1153751	1154008	258	-1	0.698	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1172	1154012	1154389	378	-1	0.675	11	GGAG/GAGG	GENOMAD.063447.VV	9.173e-15	72	0	0	0	2561	Caudoviricetes	NA	NA	PF11417	NA
+NC_014168.1|provirus_1141631_1162952_1173	1154389	1155183	795	-1	0.659	11	AGGAG	GENOMAD.049678.VV	1.151e-06	52	0	0	1	2561	Caudoviricetes	NA	NA	PF09681;TIGR01714	phage replisome organizer, putative, N-terminal region
+NC_014168.1|provirus_1141631_1162952_1174	1155187	1155612	426	-1	0.732	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1175	1155609	1155995	387	-1	0.700	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1176	1156014	1156796	783	-1	0.706	11	GGAGG	GENOMAD.021092.VV	7.29e-40	151	0	0	0	2561	Caudoviricetes	NA	NA	PF12684;TIGR00372;COG1468;K07465	CRISPR-associated protein Cas4
+NC_014168.1|provirus_1141631_1162952_1177	1156793	1157083	291	-1	0.698	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1178	1157080	1157307	228	-1	0.693	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1179	1157304	1157678	375	-1	0.739	11	GGAG/GAGG	GENOMAD.067886.VV	1.484e-08	54	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1180	1157757	1158599	843	-1	0.706	11	AGGA	GENOMAD.161352.VP	5.904e-23	102	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1181	1158605	1159525	921	-1	0.701	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1182	1159522	1159776	255	-1	0.729	11	GGA/GAG/AGG	GENOMAD.222641.VP	1.01e-05	44	0	0	0	1	NA	NA	NA	PF08667;COG5606;TIGR02612;K07727	Predicted DNA-binding protein, XRE-type HTH domain
+NC_014168.1|provirus_1141631_1162952_1183	1159861	1160289	429	1	0.713	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1184	1160403	1161263	861	1	0.700	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1185	1161230	1161493	264	1	0.746	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014168.1|provirus_1141631_1162952_1186	1161597	1162952	1356	1	0.684	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014211.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014212.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,120 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_014212.1|provirus_1170297_1209132_1203	1170297	1171460	1164	-1	0.588	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1204	1171538	1171798	261	-1	0.452	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1205	1171872	1173071	1200	-1	0.613	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1206	1173072	1173524	453	-1	0.587	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1207	1173812	1174465	654	-1	0.567	11	GGAGG	GENOMAD.212789.VC	7.003e-10	61	0	0	0	1	NA	NA	NA	PF08667;TIGR00673;COG1974;K22299	cyanase
+NC_014212.1|provirus_1170297_1209132_1208	1174604	1174783	180	1	0.517	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1209	1174780	1175010	231	1	0.623	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1210	1175054	1175242	189	1	0.614	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1211	1175242	1175514	273	1	0.648	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1212	1175507	1175629	123	1	0.618	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1213	1175629	1175847	219	1	0.689	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1214	1175875	1176492	618	1	0.544	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1215	1176556	1178289	1734	1	0.577	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1216	1178289	1178624	336	1	0.610	11	None	GENOMAD.004598.VV	3.185e-12	64	0	0	0	2561	Caudoviricetes	NA	NA	PF18743;COG1591	REase_AHJR-like
+NC_014212.1|provirus_1170297_1209132_1217	1178621	1181314	2694	1	0.628	11	GGAG/GAGG	GENOMAD.106709.VV	1.101e-06	55	0	0	0	2561	Caudoviricetes	NA	NA	PF16793	RepB DNA-primase from phage plasmid
+NC_014212.1|provirus_1170297_1209132_1218	1181304	1181546	243	1	0.424	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1219	1181649	1182485	837	1	0.568	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1220	1182591	1183058	468	1	0.645	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1221	1183055	1183510	456	1	0.596	11	GGAGG	GENOMAD.172137.VP	1.504e-54	188	0	0	1	2561	Caudoviricetes	NA	NA	PF07141;COG3728;TIGR02036	Putative bacteriophage terminase small subunit
+NC_014212.1|provirus_1170297_1209132_1222	1183500	1184804	1305	1	0.611	11	AGGA/GGAG/GAGG	GENOMAD.190694.VP	5.526e-100	334	0	0	1	2561	Caudoviricetes	NA	NA	PF04466;PF17288;TIGR01547;COG1783;K06909	phage terminase, large subunit, PBSX family
+NC_014212.1|provirus_1170297_1209132_1223	1184801	1186228	1428	1	0.680	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1224	1186209	1187081	873	1	0.667	11	None	GENOMAD.064248.VV	1.444e-15	80	0	0	1	2561	Caudoviricetes	NA	NA	PF04233;TIGR01641	phage putative head morphogenesis protein, SPP1 gp7 family
+NC_014212.1|provirus_1170297_1209132_1225	1187022	1187201	180	-1	0.578	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1226	1187232	1188875	1644	1	0.609	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1227	1188995	1189195	201	1	0.627	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1228	1189265	1190137	873	1	0.649	11	GGA/GAG/AGG	GENOMAD.063287.VV	0.0001126	46	0	0	1	2561	Caudoviricetes	NA	NA	PF04586;TIGR01543;COG3740;K06904	phage prohead protease, HK97 family
+NC_014212.1|provirus_1170297_1209132_1229	1190337	1190996	660	-1	0.620	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1230	1191039	1192691	1653	1	0.683	11	None	GENOMAD.196129.VP	5.652e-07	55	0	0	1	2561	Caudoviricetes	NA	NA	PF05125;TIGR01551;COG4653	phage major capsid protein, P2 family
+NC_014212.1|provirus_1170297_1209132_1231	1192702	1192935	234	1	0.662	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1232	1192937	1193491	555	1	0.686	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1233	1193488	1193814	327	1	0.670	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1234	1193804	1194343	540	1	0.704	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1235	1194336	1194770	435	1	0.674	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1236	1194779	1195567	789	1	0.646	11	AGGAGG	GENOMAD.154545.VV	0.0001874	45	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1237	1195567	1196052	486	1	0.693	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1238	1196182	1199919	3738	1	0.622	11	AGxAGG/AGGxGG	GENOMAD.183233.VP	3.13e-19	97	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1239	1199916	1200356	441	1	0.599	11	4Base/6BMM	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1240	1200353	1201429	1077	1	0.550	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1241	1201432	1203336	1905	1	0.602	11	None	GENOMAD.084202.VV	0.0003846	46	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1242	1203346	1203888	543	1	0.645	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1243	1203979	1204518	540	1	0.696	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1244	1204529	1204840	312	1	0.580	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1245	1204843	1206681	1839	1	0.591	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1246	1206689	1207249	561	1	0.667	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1247	1207242	1207553	312	1	0.647	11	GGAG/GAGG	GENOMAD.103334.VV	2.089e-13	67	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1248	1207563	1208354	792	1	0.635	11	GGAGG	GENOMAD.024392.VV	1.495e-72	246	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1249	1208354	1208902	549	1	0.608	11	None	GENOMAD.052331.VV	1.732e-50	178	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1170297_1209132_1250	1208917	1209132	216	1	0.579	11	GGAGG	GENOMAD.199026.VV	1.153e-06	46	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1776	1746722	1747702	981	-1	0.630	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1777	1747716	1748285	570	-1	0.400	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1778	1748294	1749001	708	-1	0.552	11	AGxAGG/AGGxGG	GENOMAD.190987.VC	3.906e-07	53	0	0	0	2561	Caudoviricetes	NA	NA	PF00717;COG1974;TIGR00498	SOS-response transcriptional repressor LexA (RecA-mediated autopeptidase)
+NC_014212.1|provirus_1746722_1764354_1779	1749082	1749270	189	1	0.582	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1780	1749263	1749469	207	1	0.614	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1781	1749504	1749674	171	1	0.614	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1782	1749664	1749942	279	1	0.609	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1783	1749935	1750057	123	1	0.650	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1784	1750057	1750149	93	1	0.613	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1785	1750146	1750445	300	1	0.623	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1786	1750442	1750786	345	1	0.600	11	4Base/6BMM	GENOMAD.138277.VP	0.0001458	42	0	0	0	9913	Herelleviridae	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1787	1750786	1751118	333	1	0.583	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1788	1751069	1752535	1467	1	0.571	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1789	1752532	1752741	210	1	0.595	11	GGA/GAG/AGG	GENOMAD.127419.VV	5.309e-06	44	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1790	1752729	1753061	333	1	0.616	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1791	1753134	1753376	243	1	0.626	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1792	1753373	1753642	270	1	0.507	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1793	1753645	1753848	204	1	0.539	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1794	1753930	1754400	471	1	0.590	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1795	1754397	1754762	366	1	0.653	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1796	1755173	1755850	678	1	0.599	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1797	1755852	1756052	201	1	0.622	11	GGAG/GAGG	GENOMAD.187456.VV	2.238e-19	82	0	0	0	4181	Sphaerolipoviridae	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1798	1756052	1756789	738	1	0.608	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1799	1756850	1757281	432	1	0.586	11	None	GENOMAD.226936.VP	5.158e-29	114	0	0	0	4181	Sphaerolipoviridae	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1800	1757291	1757752	462	1	0.576	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1801	1757761	1758645	885	1	0.631	11	AGGA	GENOMAD.175220.VV	1.243e-35	140	0	0	0	4181	Sphaerolipoviridae	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1802	1758645	1758887	243	1	0.551	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1803	1758899	1759534	636	1	0.616	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1804	1759531	1759830	300	1	0.573	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1805	1759827	1760003	177	1	0.582	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1806	1759994	1760500	507	1	0.649	11	GGA/GAG/AGG	GENOMAD.201673.VV	2.522e-06	49	0	0	0	4181	Sphaerolipoviridae	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1807	1760511	1760699	189	1	0.587	11	GGAGG	GENOMAD.131894.VV	1.707e-06	45	0	0	1	1	NA	NA	NA	PF04531;TIGR01598;COG5546	NA
+NC_014212.1|provirus_1746722_1764354_1808	1760702	1760875	174	1	0.569	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1809	1760863	1761318	456	1	0.581	11	GGAG/GAGG	GENOMAD.199413.VV	4.785e-15	74	0	0	0	4181	Sphaerolipoviridae	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1810	1761318	1762367	1050	1	0.577	11	4Base/6BMM	GENOMAD.107709.VV	1.275e-125	404	0	0	0	4181	Sphaerolipoviridae	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1811	1762357	1763370	1014	1	0.537	11	AGGAG	GENOMAD.109373.VV	8.278e-11	66	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1812	1763367	1763630	264	1	0.610	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1746722_1764354_1813	1763605	1764354	750	1	0.620	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1936	1893193	1893432	240	1	0.600	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1937	1893580	1893810	231	1	0.567	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1938	1893803	1894078	276	1	0.641	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1939	1894071	1894289	219	1	0.603	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1940	1894299	1894694	396	1	0.667	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1941	1894780	1895259	480	1	0.635	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1942	1895256	1895957	702	1	0.660	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1943	1895947	1896387	441	1	0.639	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1944	1896444	1896692	249	1	0.586	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1945	1896702	1897043	342	1	0.617	11	AGGAG	GENOMAD.188989.VV	8.584e-67	221	0	0	0	1	NA	NA	NA	PF10711	Hypothetical protein (DUF2513)
+NC_014212.1|provirus_1893193_1914973_1946	1897045	1897365	321	1	0.604	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1947	1897376	1897837	462	1	0.632	11	GGA/GAG/AGG	GENOMAD.102149.VV	7.093e-30	117	0	0	1	1	NA	NA	NA	PF11985	Bacteriophage Mu, Gp27
+NC_014212.1|provirus_1893193_1914973_1948	1897824	1899107	1284	1	0.639	11	GGA/GAG/AGG	GENOMAD.025283.VV	5.515e-85	290	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1949	1899107	1900642	1536	1	0.645	11	AGGAG	GENOMAD.116653.VV	5.637e-33	138	0	0	0	2561	Caudoviricetes	NA	NA	PF06074;COG4383	Mu-like prophage protein gp29
+NC_014212.1|provirus_1893193_1914973_1950	1900644	1901816	1173	1	0.660	11	GGAG/GAGG	GENOMAD.169564.VP	1.859e-13	75	0	0	0	2561	Caudoviricetes	NA	NA	COG2369	Uncharacterized conserved protein, contains phage Mu gpF-like domain
+NC_014212.1|provirus_1893193_1914973_1951	1901828	1903027	1200	-1	0.613	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1952	1903028	1903480	453	-1	0.587	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1953	1903664	1904203	540	1	0.667	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1954	1904257	1904703	447	1	0.691	11	None	GENOMAD.191448.VP	4.904e-23	97	0	0	1	2561	Caudoviricetes	NA	NA	PF05069;TIGR01635;COG5005	phage virion morphogenesis (putative tail completion) protein
+NC_014212.1|provirus_1893193_1914973_1955	1904784	1905284	501	1	0.679	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1956	1905295	1905507	213	1	0.648	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1957	1905504	1906925	1422	1	0.675	11	AGGAGG	GENOMAD.041181.VV	9.292e-41	161	0	0	1	2561	Caudoviricetes	NA	NA	PF10758;COG3497	Phage tail sheath protein FI
+NC_014212.1|provirus_1893193_1914973_1958	1906936	1907367	432	1	0.595	11	AGGAGG	GENOMAD.115837.VV	7.589e-83	269	0	0	0	2561	Caudoviricetes	NA	NA	PF10772	Bacteriophage HP1, Orf24
+NC_014212.1|provirus_1893193_1914973_1959	1907426	1907800	375	1	0.629	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1960	1907805	1907936	132	-1	0.712	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1961	1907951	1910032	2082	1	0.691	11	GGAGG	GENOMAD.113463.VP	1.273e-12	74	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1962	1910032	1910610	579	1	0.646	11	AGGAGG	GENOMAD.163406.VV	9.335e-105	335	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1963	1910607	1911272	666	1	0.715	11	GGA/GAG/AGG	GENOMAD.068883.VV	3.569e-104	335	0	0	0	2561	Caudoviricetes	NA	NA	TIGR03361;COG3500	type VI secretion system Vgr family protein
+NC_014212.1|provirus_1893193_1914973_1964	1911274	1911750	477	1	0.671	11	AGGAGG	GENOMAD.068883.VV	1.244e-15	76	0	0	0	2561	Caudoviricetes	NA	NA	TIGR03361;COG3500	type VI secretion system Vgr family protein
+NC_014212.1|provirus_1893193_1914973_1965	1911750	1912124	375	1	0.651	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014212.1|provirus_1893193_1914973_1966	1912117	1913199	1083	1	0.664	11	GGAGG	GENOMAD.106861.VV	2.93e-22	102	0	0	1	2561	Caudoviricetes	NA	NA	PF04865;COG3299	Baseplate J-like protein
+NC_014212.1|provirus_1893193_1914973_1967	1913200	1913811	612	1	0.667	11	GGAGG	GENOMAD.067612.VV	1.972e-93	303	0	0	1	2561	Caudoviricetes	NA	NA	PF10076;COG4385;TIGR01634	Bacteriophage P2-related tail formation protein
+NC_014212.1|provirus_1893193_1914973_1968	1913819	1914973	1155	1	0.602	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014363.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_014364.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,170 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_014364.1|provirus_2121424_2157334_1980	2121424	2123298	1875	-1	0.279	11	AATAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1981	2123295	2124836	1542	-1	0.291	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1982	2124849	2126519	1671	-1	0.313	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1983	2126533	2127723	1191	-1	0.296	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1984	2128349	2128567	219	1	0.425	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1985	2128620	2128988	369	1	0.512	11	AAAAAA	GENOMAD.048210.VV	0.0001851	42	0	0	0	2561	Caudoviricetes	NA	NA	PF05263;TIGR01636;COG1737;K03481	phage transcriptional activator, RinA family
+NC_014364.1|provirus_2121424_2157334_1986	2129017	2129205	189	1	0.439	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1987	2129348	2129836	489	1	0.462	11	AAAA	GENOMAD.053051.VV	1.914e-10	61	0	0	0	2561	Caudoviricetes	NA	NA	PF10772;PF02086;TIGR00571;COG0338	Bacteriophage HP1, Orf24; D12 class N6 adenine-specific DNA methyltransferase
+NC_014364.1|provirus_2121424_2157334_1988	2130317	2130664	348	1	0.483	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1989	2130715	2131533	819	1	0.548	11	AACAA	GENOMAD.177891.VP	2.239e-15	79	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;TIGR01913;COG3723	phage recombination protein Bet
+NC_014364.1|provirus_2121424_2157334_1990	2131552	2132241	690	1	0.470	11	AAA	GENOMAD.183319.VP	1.282e-26	111	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1991	2132238	2132714	477	1	0.564	11	None	GENOMAD.111167.VV	2.064e-79	260	0	0	0	2561	Caudoviricetes	NA	NA	PF16784	Putative HNHc nuclease
+NC_014364.1|provirus_2121424_2157334_1992	2132711	2133103	393	1	0.506	11	None	GENOMAD.002027.VV	4.172e-17	79	0	0	1	2561	Caudoviricetes	NA	NA	PF05766	Bacteriophage Lambda NinG protein
+NC_014364.1|provirus_2121424_2157334_1993	2133113	2133715	603	1	0.557	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1994	2133728	2134816	1089	1	0.573	11	None	GENOMAD.018355.VV	8.801e-10	63	0	0	1	2561	Caudoviricetes	NA	NA	PF09681;TIGR01714	phage replisome organizer, putative, N-terminal region
+NC_014364.1|provirus_2121424_2157334_1995	2134821	2135222	402	1	0.537	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1996	2135206	2135424	219	1	0.438	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1997	2135387	2135821	435	-1	0.522	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1998	2135946	2136674	729	1	0.442	11	AAAAAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_1999	2137384	2137893	510	1	0.539	11	AAA	GENOMAD.170837.VV	9.661e-13	68	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_014364.1|provirus_2121424_2157334_2000	2137890	2139611	1722	1	0.564	11	None	GENOMAD.194580.VP	1.811e-50	193	0	0	1	2561	Caudoviricetes	NA	NA	PF03354;PF05521;PF20441;COG4626;TIGR01563	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014364.1|provirus_2121424_2157334_2001	2139608	2140849	1242	1	0.576	11	None	GENOMAD.120555.VV	2.308e-46	176	0	0	1	2561	Caudoviricetes	NA	NA	K21511	NA
+NC_014364.1|provirus_2121424_2157334_2002	2140839	2141672	834	1	0.574	11	None	GENOMAD.096083.VP	2.363e-26	112	0	0	0	2561	Caudoviricetes	NA	NA	PF00574;K01358;TIGR00493;COG0740	ATP-dependent Clp endopeptidase, proteolytic subunit ClpP
+NC_014364.1|provirus_2121424_2157334_2003	2141673	2142872	1200	1	0.563	11	None	GENOMAD.080602.VV	1.495e-11	69	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR02215	phage conserved hypothetical protein, phiE125 gp8 family
+NC_014364.1|provirus_2121424_2157334_2004	2142889	2143311	423	1	0.582	11	None	GENOMAD.129880.VV	8.259e-56	191	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2005	2143390	2143947	558	1	0.570	11	None	GENOMAD.080176.VV	6.661e-14	72	0	0	0	2561	Caudoviricetes	NA	NA	PF11436;TIGR02215	phage conserved hypothetical protein, phiE125 gp8 family
+NC_014364.1|provirus_2121424_2157334_2006	2143917	2144369	453	1	0.574	11	None	GENOMAD.060383.VV	2.955e-10	60	0	0	1	1	NA	NA	NA	PF04883;TIGR01725;COG5005	phage protein, HK97 gp10 family
+NC_014364.1|provirus_2121424_2157334_2007	2144347	2144745	399	1	0.534	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2008	2144749	2145444	696	1	0.519	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2009	2145447	2145848	402	1	0.530	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2010	2145869	2146144	276	1	0.554	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2011	2146125	2148398	2274	1	0.563	11	None	GENOMAD.009561.VV	4.996e-38	157	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2012	2148401	2151679	3279	1	0.526	11	None	GENOMAD.109300.VV	0.0	2070	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2013	2151676	2152287	612	1	0.547	11	None	GENOMAD.007262.VV	1.557e-22	98	0	0	1	1	NA	NA	NA	PF16778	Phage tail assembly chaperone protein
+NC_014364.1|provirus_2121424_2157334_2014	2152292	2152525	234	1	0.483	11	AAAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2015	2152527	2152997	471	1	0.507	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2016	2152994	2153242	249	1	0.478	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2017	2153244	2153633	390	1	0.538	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2018	2153947	2154315	369	1	0.360	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2019	2154472	2154795	324	1	0.349	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2020	2155168	2155953	786	1	0.392	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2121424_2157334_2021	2156093	2157334	1242	-1	0.475	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2174	2329685	2330950	1266	1	0.534	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2175	2331412	2331927	516	-1	0.260	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2176	2331924	2332307	384	-1	0.333	11	AATAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2177	2332404	2333627	1224	-1	0.283	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2178	2333802	2334419	618	-1	0.278	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2179	2334416	2335450	1035	-1	0.266	11	AAAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2180	2335637	2336704	1068	-1	0.370	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2181	2336829	2337170	342	-1	0.450	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2182	2337251	2337481	231	1	0.407	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2183	2337478	2337723	246	1	0.504	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2184	2337961	2338164	204	1	0.534	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2185	2338728	2339270	543	1	0.492	11	None	GENOMAD.112664.VP	5.227e-63	214	0	0	0	2561	Caudoviricetes	NA	NA	PF11195	NA
+NC_014364.1|provirus_2329685_2350621_2186	2339267	2339521	255	1	0.486	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2187	2339518	2340633	1116	1	0.544	11	None	GENOMAD.090362.VV	6.936e-21	98	0	0	1	2561	Caudoviricetes	NA	NA	PF13479;TIGR01618;COG2087	phage nucleotide-binding protein
+NC_014364.1|provirus_2329685_2350621_2188	2340648	2341298	651	1	0.498	11	None	GENOMAD.025041.VV	1.179e-20	93	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2189	2341303	2341941	639	1	0.535	11	None	GENOMAD.067346.VV	8.792e-124	391	0	0	0	2561	Caudoviricetes	NA	NA	PF06023;TIGR00372;COG4343	CRISPR-associated protein Cas4
+NC_014364.1|provirus_2329685_2350621_2190	2341938	2342411	474	1	0.527	11	None	GENOMAD.111167.VV	1.217e-84	275	0	0	0	2561	Caudoviricetes	NA	NA	PF16784	Putative HNHc nuclease
+NC_014364.1|provirus_2329685_2350621_2191	2342625	2342858	234	1	0.500	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2192	2342868	2343407	540	1	0.554	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2193	2343420	2344475	1056	1	0.536	11	None	GENOMAD.018355.VV	3.86e-05	48	0	0	1	2561	Caudoviricetes	NA	NA	PF09681;TIGR01714	phage replisome organizer, putative, N-terminal region
+NC_014364.1|provirus_2329685_2350621_2194	2344481	2344894	414	1	0.551	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2195	2344878	2345096	219	1	0.438	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2196	2345093	2345284	192	1	0.505	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2197	2345287	2345487	201	1	0.542	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2198	2345630	2346916	1287	1	0.431	11	AAAA	GENOMAD.185015.VV	0.0001092	47	0	0	0	2561	Caudoviricetes	NA	NA	PF18692;PF14466;TIGR03066;COG3187;K03668	Gemmata obscuriglobus paralogous family TIGR03066
+NC_014364.1|provirus_2329685_2350621_2199	2347200	2348180	981	1	0.448	11	AAAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2329685_2350621_2200	2348796	2349302	507	1	0.550	11	AAA	GENOMAD.170837.VV	4.939e-10	60	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_014364.1|provirus_2329685_2350621_2201	2349299	2350621	1323	1	0.550	11	None	GENOMAD.194580.VP	1.831e-53	198	0	0	1	2561	Caudoviricetes	NA	NA	PF03354;PF05521;PF20441;COG4626;TIGR01563	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014364.1|provirus_2666253_2703772_2490	2666253	2667515	1263	1	0.469	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2491	2667512	2667952	441	-1	0.458	11	None	GENOMAD.167054.PV	6.452e-08	53	0	0	0	1	NA	NA	NA	PF06892;TIGR02612;COG3655	mobile mystery protein A
+NC_014364.1|provirus_2666253_2703772_2492	2667949	2668332	384	-1	0.474	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2493	2668604	2668852	249	-1	0.414	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2494	2668815	2669231	417	-1	0.465	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2495	2669290	2669850	561	-1	0.381	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2496	2670024	2670449	426	-1	0.528	11	AAAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2497	2670476	2670724	249	-1	0.518	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2498	2670721	2670822	102	-1	0.539	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2499	2670819	2671190	372	-1	0.527	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2500	2671197	2671430	234	-1	0.487	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2501	2671435	2672046	612	-1	0.560	11	None	GENOMAD.007262.VV	7.521e-22	96	0	0	1	1	NA	NA	NA	PF16778	Phage tail assembly chaperone protein
+NC_014364.1|provirus_2666253_2703772_2502	2672043	2675357	3315	-1	0.506	11	None	GENOMAD.109300.VV	0.0	2147	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2503	2675360	2677537	2178	-1	0.555	11	None	GENOMAD.040051.VV	1.304e-19	97	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2504	2677518	2677793	276	-1	0.558	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2505	2677814	2678215	402	-1	0.520	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2506	2678218	2678973	756	-1	0.511	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2507	2678912	2679310	399	-1	0.526	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2508	2679288	2679713	426	-1	0.561	11	None	GENOMAD.060383.VV	4.591e-11	62	0	0	1	1	NA	NA	NA	PF04883;TIGR01725;COG5005	phage protein, HK97 gp10 family
+NC_014364.1|provirus_2666253_2703772_2509	2679710	2680267	558	-1	0.534	11	None	GENOMAD.080176.VV	1.118e-18	86	0	0	0	2561	Caudoviricetes	NA	NA	PF11436;TIGR02215	phage conserved hypothetical protein, phiE125 gp8 family
+NC_014364.1|provirus_2666253_2703772_2510	2680271	2680684	414	-1	0.534	11	None	GENOMAD.210649.VV	1.155e-06	49	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2511	2680638	2681888	1251	-1	0.552	11	None	GENOMAD.090434.VV	2.489e-32	134	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;TIGR01554;COG4653	phage major capsid protein, HK97 family
+NC_014364.1|provirus_2666253_2703772_2512	2681903	2682610	708	-1	0.556	11	None	GENOMAD.126169.VV	1.014e-33	132	0	0	1	2561	Caudoviricetes	NA	NA	PF04586;K06904;COG3740;TIGR01543	Phage head maturation protease
+NC_014364.1|provirus_2666253_2703772_2513	2682607	2684223	1617	-1	0.557	11	None	GENOMAD.179073.VP	3.772e-33	139	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2514	2684220	2685944	1725	-1	0.556	11	None	GENOMAD.194580.VP	1.898e-51	196	0	0	1	2561	Caudoviricetes	NA	NA	PF03354;PF05521;PF20441;COG4626;TIGR01563	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_014364.1|provirus_2666253_2703772_2515	2685941	2686450	510	-1	0.561	11	AAA	GENOMAD.170837.VV	2.224e-11	64	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_014364.1|provirus_2666253_2703772_2516	2686454	2686852	399	-1	0.549	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2517	2687097	2687804	708	-1	0.381	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2518	2687794	2688030	237	-1	0.359	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2519	2688024	2688701	678	-1	0.412	11	None	GENOMAD.222821.VP	3.109e-116	370	0	0	0	2561	Caudoviricetes	NA	NA	TIGR03116	CRISPR type IV/AFERR-associated protein Csf3
+NC_014364.1|provirus_2666253_2703772_2520	2688698	2689639	942	-1	0.429	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2521	2689612	2689965	354	-1	0.387	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2522	2689910	2690650	741	-1	0.406	11	None	GENOMAD.222446.VP	5.477e-146	457	0	0	0	1	NA	NA	NA	TIGR03114	CRISPR type AFERR-associated protein Csf1
+NC_014364.1|provirus_2666253_2703772_2523	2690719	2690904	186	-1	0.425	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2524	2690927	2691118	192	-1	0.490	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2525	2691115	2691333	219	-1	0.425	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2526	2691317	2691718	402	-1	0.557	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2527	2691723	2692811	1089	-1	0.567	11	None	GENOMAD.018355.VV	8.801e-10	63	0	0	1	2561	Caudoviricetes	NA	NA	PF09681;TIGR01714	phage replisome organizer, putative, N-terminal region
+NC_014364.1|provirus_2666253_2703772_2528	2692824	2693420	597	-1	0.554	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2529	2693430	2693843	414	-1	0.500	11	None	GENOMAD.002027.VV	5.448e-17	79	0	0	1	2561	Caudoviricetes	NA	NA	PF05766	Bacteriophage Lambda NinG protein
+NC_014364.1|provirus_2666253_2703772_2530	2693840	2696353	2514	-1	0.494	11	None	GENOMAD.126436.VP	5.738e-126	427	0	0	0	2561	Caudoviricetes	NA	NA	PF13872	NA
+NC_014364.1|provirus_2666253_2703772_2531	2696356	2696832	477	-1	0.570	11	None	GENOMAD.111167.VV	6.951e-83	270	0	0	0	2561	Caudoviricetes	NA	NA	PF16784	Putative HNHc nuclease
+NC_014364.1|provirus_2666253_2703772_2532	2696829	2697434	606	-1	0.464	11	AAA	GENOMAD.176983.VP	4.38e-16	79	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2533	2697453	2698265	813	-1	0.534	11	AACAA	GENOMAD.177891.VP	4.712e-16	81	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;TIGR01913;COG3723	phage recombination protein Bet
+NC_014364.1|provirus_2666253_2703772_2534	2698316	2699071	756	-1	0.516	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2535	2699141	2699344	204	-1	0.554	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2536	2699404	2700138	735	-1	0.509	11	None	GENOMAD.014438.VV	2.838e-34	134	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2537	2700139	2700486	348	-1	0.517	11	AAAA	GENOMAD.100208.VV	1.289e-06	48	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2538	2700598	2700861	264	-1	0.379	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2539	2700891	2701232	342	1	0.456	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2540	2701372	2701794	423	-1	0.492	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2541	2701796	2702014	219	-1	0.457	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2542	2702096	2702443	348	1	0.405	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2543	2702566	2703069	504	1	0.357	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2544	2703117	2703407	291	1	0.392	11	None	GENOMAD.219421.VC	7.977e-05	42	0	0	0	9067	Straboviridae	NA	NA	NA	NA
+NC_014364.1|provirus_2666253_2703772_2545	2703410	2703772	363	1	0.377	11	AAAA	GENOMAD.227798.VP	1.946e-45	160	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2796	2976748	2977998	1251	1	0.455	11	None	GENOMAD.225071.VP	8.645e-08	57	0	0	0	1	NA	NA	NA	PF00589;PF13102;TIGR02225;COG4973;K14059	tyrosine recombinase XerD
+NC_014364.1|provirus_2976748_3014759_2797	2978103	2978576	474	-1	0.432	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2798	2978601	2978786	186	1	0.441	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2799	2978805	2979119	315	1	0.410	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2800	2979484	2979939	456	-1	0.355	11	AATAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2801	2980070	2980450	381	-1	0.454	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2802	2981023	2981250	228	1	0.544	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2803	2981859	2982401	543	1	0.488	11	None	GENOMAD.112664.VP	2.835e-61	209	0	0	0	2561	Caudoviricetes	NA	NA	PF11195	NA
+NC_014364.1|provirus_2976748_3014759_2804	2982398	2982652	255	1	0.467	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2805	2982649	2983740	1092	1	0.552	11	None	GENOMAD.032961.VV	1.703e-27	118	0	0	1	2561	Caudoviricetes	NA	NA	PF13479;TIGR01618;COG2087;K04484	phage nucleotide-binding protein
+NC_014364.1|provirus_2976748_3014759_2806	2983755	2984405	651	1	0.498	11	None	GENOMAD.025041.VV	1.179e-20	93	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2807	2984410	2985048	639	1	0.546	11	None	GENOMAD.067346.VV	1.619e-125	396	0	0	0	2561	Caudoviricetes	NA	NA	PF06023;TIGR00372;COG4343	CRISPR-associated protein Cas4
+NC_014364.1|provirus_2976748_3014759_2808	2985045	2985518	474	1	0.540	11	None	GENOMAD.111167.VV	7.301e-82	267	0	0	0	2561	Caudoviricetes	NA	NA	PF16784	Putative HNHc nuclease
+NC_014364.1|provirus_2976748_3014759_2809	2985528	2985974	447	1	0.506	11	None	GENOMAD.002027.VV	2.633e-21	92	0	0	1	2561	Caudoviricetes	NA	NA	PF05766	Bacteriophage Lambda NinG protein
+NC_014364.1|provirus_2976748_3014759_2810	2985984	2986526	543	1	0.562	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2811	2986554	2987651	1098	1	0.533	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2812	2987656	2988057	402	1	0.545	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2813	2988041	2988259	219	1	0.447	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2814	2988256	2988462	207	1	0.507	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2815	2988462	2989181	720	1	0.528	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2816	2989159	2990028	870	1	0.553	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2817	2990048	2990725	678	1	0.527	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2818	2990697	2990873	177	1	0.525	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2819	2990900	2991442	543	1	0.499	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2820	2991609	2991938	330	1	0.521	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2821	2991948	2993630	1683	1	0.551	11	None	GENOMAD.060970.VV	1.975e-99	338	0	0	1	2561	Caudoviricetes	NA	NA	PF12236	Bacteriophage head to tail connecting protein
+NC_014364.1|provirus_2976748_3014759_2822	2993627	2993929	303	1	0.545	11	None	GENOMAD.118268.VV	1.689e-06	47	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2823	2993926	2994732	807	1	0.545	11	None	GENOMAD.072294.VV	2.192e-115	370	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2824	2994744	2995730	987	1	0.532	11	None	GENOMAD.004790.VV	4.85e-58	207	0	0	1	2561	Caudoviricetes	NA	NA	PF19307	Phage capsid-like protein
+NC_014364.1|provirus_2976748_3014759_2825	2995745	2996119	375	1	0.565	11	None	GENOMAD.013948.VV	1.528e-25	103	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2826	2996128	2996442	315	1	0.556	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2827	2996452	2997045	594	1	0.532	11	None	GENOMAD.061091.VV	8.908e-15	75	0	0	1	2561	Caudoviricetes	NA	NA	PF17212	Tail tubular protein
+NC_014364.1|provirus_2976748_3014759_2828	2997042	2998754	1713	1	0.537	11	None	GENOMAD.063463.VV	3.739e-12	72	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2829	2998751	2999638	888	1	0.484	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2830	2999654	3001600	1947	1	0.500	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2831	3001597	3007842	6246	1	0.505	11	None	GENOMAD.224557.VP	0.0001899	49	0	0	0	2561	Caudoviricetes	NA	NA	PF18819	Phage MuF-C-terminal domain
+NC_014364.1|provirus_2976748_3014759_2832	3007790	3011446	3657	1	0.470	11	AAA	GENOMAD.113444.VC	1.137e-11	72	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2833	3011443	3012054	612	1	0.554	11	None	GENOMAD.007262.VV	3.024e-24	103	0	0	1	1	NA	NA	NA	PF16778	Phage tail assembly chaperone protein
+NC_014364.1|provirus_2976748_3014759_2834	3012059	3012292	234	1	0.487	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2835	3012298	3012777	480	1	0.479	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2836	3012774	3012995	222	1	0.419	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2837	3013047	3013463	417	1	0.540	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_014364.1|provirus_2976748_3014759_2838	3013650	3014759	1110	1	0.259	11	AAA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_015761.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,112 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_015761.1|provirus_847397_862760_745	847397	847636	240	-1	0.438	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_847397_862760_746	847705	848118	414	1	0.611	11	None	GENOMAD.138177.VP	1.107e-17	81	0	0	1	2561	Caudoviricetes	NA	NA	PF04717;PF18715;COG4540;TIGR01644	Phage P2 baseplate assembly protein gpV
+NC_015761.1|provirus_847397_862760_747	848177	848536	360	1	0.553	11	GGAGG	GENOMAD.121581.VP	1.359e-07	51	0	0	1	2561	Caudoviricetes	NA	NA	PF04965;COG3628;K06903;TIGR03357	Phage baseplate assembly protein W
+NC_015761.1|provirus_847397_862760_748	848523	849431	909	1	0.590	11	AGGAG	GENOMAD.105501.VV	2.367e-122	392	0	0	1	2561	Caudoviricetes	NA	NA	PF03434;COG3948	Phage-related baseplate assembly protein
+NC_015761.1|provirus_847397_862760_749	849424	850029	606	1	0.578	11	GGxGG	GENOMAD.114503.VV	2.832e-71	239	0	0	1	2561	Caudoviricetes	NA	NA	PF09684;COG4385;TIGR01634	Bacteriophage P2-related tail formation protein
+NC_015761.1|provirus_847397_862760_750	850026	850943	918	1	0.548	11	GGA/GAG/AGG	GENOMAD.118528.VP	8.226e-145	457	0	0	1	2561	Caudoviricetes	NA	NA	PF12571;COG5301	Phage-related tail fibre protein
+NC_015761.1|provirus_847397_862760_751	851338	852495	1158	1	0.306	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_847397_862760_752	852717	853181	465	-1	0.447	11	AGGA	GENOMAD.168001.VP	6.793e-48	169	0	0	1	2561	Caudoviricetes	NA	NA	PF16778	Phage tail assembly chaperone protein
+NC_015761.1|provirus_847397_862760_753	853514	853768	255	-1	0.424	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_847397_862760_754	853798	854055	258	1	0.508	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_847397_862760_755	854436	854621	186	1	0.586	11	AGGAG	GENOMAD.120968.VV	2.238e-24	96	0	0	1	2561	Caudoviricetes	NA	NA	COG3497	Phage tail sheath protein FI
+NC_015761.1|provirus_847397_862760_756	854942	855244	303	1	0.558	11	AGGA	GENOMAD.135969.VP	5.864e-25	100	0	0	1	2561	Caudoviricetes	NA	NA	PF10109	Phage tail assembly chaperone proteins, E, or 41 or 14
+NC_015761.1|provirus_847397_862760_757	855371	856519	1149	1	0.586	11	None	GENOMAD.130201.VP	2.372e-43	166	0	0	1	2561	Caudoviricetes	NA	NA	COG5283	Phage-related tail protein
+NC_015761.1|provirus_847397_862760_758	856462	858486	2025	1	0.583	11	None	GENOMAD.145447.VP	1.422e-33	142	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_847397_862760_759	858446	858832	387	1	0.535	11	None	GENOMAD.116424.VV	2.281e-14	71	0	0	0	2561	Caudoviricetes	NA	NA	PF06995;K06906;COG3499	Phage protein U
+NC_015761.1|provirus_847397_862760_760	858829	859881	1053	1	0.531	11	GGAGG	GENOMAD.209614.VP	3.524e-49	182	0	0	1	2561	Caudoviricetes	NA	NA	PF05954;K06905;COG3500;TIGR03361	Phage protein D
+NC_015761.1|provirus_847397_862760_761	859972	860190	219	1	0.461	11	GGAG/GAGG	GENOMAD.222803.VP	3.752e-10	56	0	0	0	2561	Caudoviricetes	NA	NA	PF04606;TIGR04165;COG1326	Ogr/Delta-like zinc finger
+NC_015761.1|provirus_847397_862760_762	860426	862111	1686	-1	0.537	11	AGxAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_847397_862760_763	862383	862760	378	1	0.508	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_886	1007223	1008242	1020	-1	0.473	11	GGAG/GAGG	GENOMAD.212993.VP	2.024e-35	141	0	0	0	2561	Caudoviricetes	NA	NA	PF14659;K21039	Phage integrase, N-terminal SAM-like domain
+NC_015761.1|provirus_1007223_1045009_887	1008243	1008467	225	-1	0.502	11	GGAG/GAGG	GENOMAD.151670.VV	1.037e-08	52	0	0	0	2561	Caudoviricetes	NA	NA	PF13986	NA
+NC_015761.1|provirus_1007223_1045009_888	1008909	1009049	141	1	0.532	11	GGAG/GAGG	GENOMAD.224144.VP	3.211e-14	66	0	0	0	2561	Caudoviricetes	NA	NA	PF10798;K21975	Biofilm development protein YmgB/AriR
+NC_015761.1|provirus_1007223_1045009_889	1009155	1009961	807	-1	0.337	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_890	1009958	1010806	849	-1	0.418	11	GGAG/GAGG	GENOMAD.212816.VV	1.518e-152	478	0	0	0	2561	Caudoviricetes	NA	NA	PF20613;TIGR03843	HipA-like kinase
+NC_015761.1|provirus_1007223_1045009_891	1010978	1011445	468	-1	0.476	11	AGGA	GENOMAD.091484.VV	0.0004177	42	0	0	0	2561	Caudoviricetes	NA	NA	PF13411;COG3415;K22302;TIGR00721	Transposase
+NC_015761.1|provirus_1007223_1045009_892	1011459	1011686	228	1	0.425	11	AGGAGG	GENOMAD.151341.VV	0.0001753	40	0	0	1	2561	Caudoviricetes	NA	NA	PF11242;TIGR00673;COG5606;K18830	cyanase
+NC_015761.1|provirus_1007223_1045009_893	1011706	1012026	321	1	0.539	11	GGAG/GAGG	GENOMAD.069430.VV	6.718e-58	195	0	0	1	2561	Caudoviricetes	NA	NA	PF18010;TIGR00721;COG4220	Cry35Ab1 HTH C-terminal domain
+NC_015761.1|provirus_1007223_1045009_894	1012118	1013023	906	1	0.475	11	AGGAG	GENOMAD.208204.VP	3.298e-81	273	0	0	0	2561	Caudoviricetes	NA	NA	PF04492;TIGR01610	phage replication protein O, N-terminal domain
+NC_015761.1|provirus_1007223_1045009_895	1013020	1013712	693	1	0.551	11	GGAG/GAGG	GENOMAD.194512.VV	1.29e-76	256	0	0	1	2561	Caudoviricetes	NA	NA	PF06992	NA
+NC_015761.1|provirus_1007223_1045009_896	1013726	1013983	258	1	0.488	11	AGGAG	GENOMAD.072808.VV	9.932e-44	153	0	0	0	2561	Caudoviricetes	NA	NA	PF15944	NA
+NC_015761.1|provirus_1007223_1045009_897	1013980	1014891	912	1	0.498	11	GGAGG	GENOMAD.068933.VV	1.147e-200	618	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_898	1014993	1015319	327	1	0.462	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_899	1015319	1015426	108	1	0.454	11	AGGA/GGAG/GAGG	GENOMAD.226031.VP	2.127e-06	43	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_900	1015606	1016037	432	-1	0.389	11	GGA/GAG/AGG	GENOMAD.213484.VP	5.7e-53	183	0	0	0	2561	Caudoviricetes	NA	NA	PF05509;COG4877	Plasmid stability protein
+NC_015761.1|provirus_1007223_1045009_901	1016160	1016327	168	1	0.411	11	AGxAGG/AGGxGG	GENOMAD.168832.VV	8.581e-31	114	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_902	1016314	1017228	915	1	0.462	11	GGA/GAG/AGG	GENOMAD.222649.VP	4.345e-08	57	0	0	0	2561	Caudoviricetes	NA	NA	PF10548;PF10547;COG3617	Prophage antirepressor
+NC_015761.1|provirus_1007223_1045009_903	1017301	1018047	747	1	0.475	11	AGGA	GENOMAD.167364.VP	3.729e-134	423	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_904	1018233	1018466	234	1	0.462	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_905	1018866	1019468	603	1	0.526	11	GGAG/GAGG	GENOMAD.040195.VV	1.554e-77	257	0	0	0	2561	Caudoviricetes	NA	NA	PF07105	NA
+NC_015761.1|provirus_1007223_1045009_906	1019857	1020528	672	1	0.512	11	GGA/GAG/AGG	GENOMAD.058019.VV	7.177e-33	129	0	0	0	2561	Caudoviricetes	NA	NA	PF06323	Phage antitermination protein Q
+NC_015761.1|provirus_1007223_1045009_907	1020797	1021369	573	1	0.471	11	GGAG/GAGG	GENOMAD.209828.VP	1.159e-20	92	0	0	0	2561	Caudoviricetes	NA	NA	PF10543;COG3646	ORF6N domain
+NC_015761.1|provirus_1007223_1045009_908	1021511	1022011	501	-1	0.465	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_909	1022022	1022201	180	-1	0.472	11	GGAG/GAGG	GENOMAD.175300.VV	1.174e-29	111	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_910	1023134	1023559	426	1	0.352	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_911	1023588	1024331	744	1	0.423	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_912	1024569	1024958	390	1	0.482	11	GGAG/GAGG	GENOMAD.222896.VP	4.488e-57	194	0	0	1	2561	Caudoviricetes	NA	NA	PF16931	Putative phage holin
+NC_015761.1|provirus_1007223_1045009_913	1024945	1025226	282	1	0.514	11	GGAGG	GENOMAD.214895.VP	1.105e-15	73	0	0	1	2561	Caudoviricetes	NA	NA	PF05449	Putative 3TM holin, Phage_holin_3
+NC_015761.1|provirus_1007223_1045009_914	1025226	1025840	615	1	0.528	11	GGAG/GAGG	GENOMAD.021660.VV	3.743e-21	94	0	0	0	2561	Caudoviricetes	NA	NA	COG3179;K18950	Predicted chitinase
+NC_015761.1|provirus_1007223_1045009_915	1025837	1026379	543	1	0.534	11	None	GENOMAD.108518.VV	1.733e-31	123	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_916	1026641	1027171	531	1	0.448	11	GGA/GAG/AGG	GENOMAD.068419.VV	7.247e-49	173	0	0	0	2561	Caudoviricetes	NA	NA	PF10549	ORF11CD3 domain
+NC_015761.1|provirus_1007223_1045009_917	1027137	1027496	360	1	0.506	11	GGA/GAG/AGG	GENOMAD.062288.VV	1.85e-37	137	0	0	0	2561	Caudoviricetes	NA	NA	PF10721	NA
+NC_015761.1|provirus_1007223_1045009_918	1027571	1027981	411	1	0.353	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_919	1028070	1028375	306	1	0.392	11	GGAG/GAGG	GENOMAD.210890.VV	1.177e-49	171	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_920	1028478	1028828	351	1	0.510	11	AGGA	GENOMAD.179073.VP	2.39e-17	79	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_921	1028913	1029170	258	1	0.523	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_922	1029172	1030284	1113	1	0.524	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_923	1030383	1030499	117	1	0.436	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_924	1030656	1031234	579	1	0.402	11	AGGA	GENOMAD.222575.VP	5.62e-21	93	0	0	0	2561	Caudoviricetes	NA	NA	PF06416	Effector protein NleG
+NC_015761.1|provirus_1007223_1045009_925	1031568	1033916	2349	-1	0.456	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_926	1034271	1035401	1131	-1	0.546	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_927	1035640	1035837	198	1	0.510	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_928	1036394	1036723	330	-1	0.476	11	AGGA	GENOMAD.182552.PC	9.486e-56	189	0	0	0	1	NA	NA	NA	PF15781;COG3668;TIGR00053;K06218	Plasmid stabilization system protein ParE
+NC_015761.1|provirus_1007223_1045009_929	1036749	1036979	231	-1	0.450	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_930	1037060	1037353	294	-1	0.476	11	GGA/GAG/AGG	GENOMAD.221919.VP	3.483e-21	89	0	0	0	2561	Caudoviricetes	NA	NA	PF00589	Phage integrase family
+NC_015761.1|provirus_1007223_1045009_931	1038122	1038700	579	1	0.402	11	AGGA	GENOMAD.222575.VP	5.62e-21	93	0	0	0	2561	Caudoviricetes	NA	NA	PF06416	Effector protein NleG
+NC_015761.1|provirus_1007223_1045009_932	1039093	1039440	348	1	0.534	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_933	1039590	1040444	855	1	0.385	11	4Base/6BMM	GENOMAD.120636.VV	2.17e-58	206	0	0	0	2561	Caudoviricetes	NA	NA	PF09612;TIGR02192	protein YibB
+NC_015761.1|provirus_1007223_1045009_934	1040507	1040737	231	-1	0.320	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_935	1040933	1043740	2808	-1	0.577	11	AGGAGG	GENOMAD.054026.VV	1.896e-05	51	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_1007223_1045009_936	1044602	1045009	408	1	0.451	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2808	3084741	3084959	219	-1	0.507	11	GGAG/GAGG	GENOMAD.223866.VP	4.224e-09	53	0	0	0	2561	Caudoviricetes	NA	NA	PF04606;TIGR02098	Ogr/Delta-like zinc finger
+NC_015761.1|provirus_3084741_3115735_2809	3085026	3086195	1170	-1	0.548	11	GGAGG	GENOMAD.209614.VP	1.088e-49	185	0	0	1	2561	Caudoviricetes	NA	NA	PF05954;K06905;COG3500;TIGR03361	Phage protein D
+NC_015761.1|provirus_3084741_3115735_2810	3086192	3086677	486	-1	0.543	11	GGAG/GAGG	GENOMAD.116424.VV	2.262e-19	87	0	0	0	2561	Caudoviricetes	NA	NA	PF06995;K06906;COG3499	Phage protein U
+NC_015761.1|provirus_3084741_3115735_2811	3086692	3089133	2442	-1	0.566	11	GGA/GAG/AGG	GENOMAD.130201.VP	4.265e-179	582	0	0	1	2561	Caudoviricetes	NA	NA	COG5283	Phage-related tail protein
+NC_015761.1|provirus_3084741_3115735_2812	3089278	3089613	336	-1	0.571	11	GGA/GAG/AGG	GENOMAD.135969.VP	1.933e-25	102	0	0	1	2561	Caudoviricetes	NA	NA	PF10109	Phage tail assembly chaperone proteins, E, or 41 or 14
+NC_015761.1|provirus_3084741_3115735_2813	3089676	3090194	519	-1	0.586	11	AGGAG/GGAGG	GENOMAD.222086.VV	9.473e-26	106	0	0	1	2561	Caudoviricetes	NA	NA	PF04985;K06908;TIGR01611;COG3498	phage contractile tail tube protein, P2 family
+NC_015761.1|provirus_3084741_3115735_2814	3090210	3091397	1188	-1	0.549	11	GGAG/GAGG	GENOMAD.102019.VV	3.796e-60	216	0	0	1	2561	Caudoviricetes	NA	NA	PF10758;COG3497	Phage tail sheath protein FI
+NC_015761.1|provirus_3084741_3115735_2815	3091532	3092080	549	-1	0.475	11	AGGA	GENOMAD.209102.VP	2.721e-113	359	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2816	3092093	3094069	1977	-1	0.518	11	GGA/GAG/AGG	GENOMAD.151930.VP	1.701e-178	573	0	0	1	2561	Caudoviricetes	NA	NA	PF12571;COG5301	Phage-related tail fibre protein
+NC_015761.1|provirus_3084741_3115735_2817	3094080	3094610	531	-1	0.539	11	GGxGG	GENOMAD.114503.VV	2.848e-76	252	0	0	1	2561	Caudoviricetes	NA	NA	PF09684;COG4385;TIGR01634	Bacteriophage P2-related tail formation protein
+NC_015761.1|provirus_3084741_3115735_2818	3094603	3095511	909	-1	0.554	11	GGA/GAG/AGG	GENOMAD.105501.VV	5.746e-121	388	0	0	1	2561	Caudoviricetes	NA	NA	PF03434;COG3948	Phage-related baseplate assembly protein
+NC_015761.1|provirus_3084741_3115735_2819	3095518	3095865	348	-1	0.549	11	GGAGG	GENOMAD.121581.VP	1.186e-07	51	0	0	1	2561	Caudoviricetes	NA	NA	PF04965;COG3628;K06903;TIGR03357	Phage baseplate assembly protein W
+NC_015761.1|provirus_3084741_3115735_2820	3095862	3096503	642	-1	0.615	11	AGGA/GGAG/GAGG	GENOMAD.166314.VP	7.564e-57	198	0	0	1	2561	Caudoviricetes	NA	NA	K22111;TIGR01644;COG4540	phage baseplate assembly protein V
+NC_015761.1|provirus_3084741_3115735_2821	3096572	3097021	450	-1	0.596	11	GGA/GAG/AGG	GENOMAD.134219.VP	5.44e-48	169	0	0	1	2561	Caudoviricetes	NA	NA	PF05069;TIGR01635;COG5005	phage virion morphogenesis (putative tail completion) protein
+NC_015761.1|provirus_3084741_3115735_2822	3097014	3097481	468	-1	0.568	11	AGGA	GENOMAD.125799.VP	3.104e-65	219	0	0	1	2561	Caudoviricetes	NA	NA	PF06891	P2 phage tail completion protein R (GpR)
+NC_015761.1|provirus_3084741_3115735_2823	3097444	3097602	159	-1	0.572	11	GGA/GAG/AGG	GENOMAD.116277.VV	5.069e-27	103	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2824	3097589	3098002	414	-1	0.594	11	GGxGG	GENOMAD.191084.VP	1.984e-28	112	0	0	0	2561	Caudoviricetes	NA	NA	PF10828;TIGR03495	phage lysis regulatory protein, LysB family
+NC_015761.1|provirus_3084741_3115735_2825	3097999	3098496	498	-1	0.572	11	AGxAGG/AGGxGG	GENOMAD.123113.VP	0.0005094	42	0	0	0	2561	Caudoviricetes	NA	NA	PF19846	NA
+NC_015761.1|provirus_3084741_3115735_2826	3098483	3098779	297	-1	0.549	11	GGAG/GAGG	GENOMAD.177230.VP	7.699e-37	134	0	0	1	2561	Caudoviricetes	NA	NA	PF04550;TIGR01594	Phage holin family 2
+NC_015761.1|provirus_3084741_3115735_2827	3098783	3098971	189	-1	0.571	11	GGA/GAG/AGG	GENOMAD.159179.VP	4.593e-18	78	0	0	1	2561	Caudoviricetes	NA	NA	COG5004;K06370	P2-like prophage tail protein X
+NC_015761.1|provirus_3084741_3115735_2828	3098986	3099492	507	-1	0.586	11	GGAG/GAGG	GENOMAD.119083.VV	9.468e-51	178	0	0	0	2561	Caudoviricetes	NA	NA	PF05926	Phage head completion protein (GPL)
+NC_015761.1|provirus_3084741_3115735_2829	3099586	3100335	750	-1	0.615	11	GGAG/GAGG	GENOMAD.034571.VV	3.734e-44	163	0	0	1	2561	Caudoviricetes	NA	NA	PF05944	Phage small terminase subunit
+NC_015761.1|provirus_3084741_3115735_2830	3100339	3101406	1068	-1	0.529	11	AGGA	GENOMAD.125799.VP	2.236e-60	215	0	0	1	2561	Caudoviricetes	NA	NA	PF06891	P2 phage tail completion protein R (GpR)
+NC_015761.1|provirus_3084741_3115735_2831	3101482	3102336	855	-1	0.538	11	AGGA	GENOMAD.042716.VV	2.893e-146	460	0	0	0	2561	Caudoviricetes	NA	NA	COG4388	Mu-like prophage I protein
+NC_015761.1|provirus_3084741_3115735_2832	3102502	3104271	1770	1	0.572	11	GGAG/GAGG	GENOMAD.151636.VP	8.559e-104	352	0	0	0	2561	Caudoviricetes	NA	NA	COG5484	Uncharacterized protein YjcR, contains N-terminal HTH domain
+NC_015761.1|provirus_3084741_3115735_2833	3104271	3105317	1047	1	0.538	11	GGAG/GAGG	GENOMAD.073411.VV	2.533e-07	55	0	0	1	2561	Caudoviricetes	NA	NA	PF04860;TIGR01540;COG4695	phage portal protein, PBSX family
+NC_015761.1|provirus_3084741_3115735_2834	3105395	3106399	1005	1	0.375	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2835	3106779	3107327	549	-1	0.341	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2836	3107438	3108169	732	-1	0.455	11	AGGA	GENOMAD.226160.VP	4.122e-139	437	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2837	3108252	3108692	441	-1	0.454	11	GGAGG	GENOMAD.137104.VV	8.416e-25	102	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2838	3108810	3111029	2220	-1	0.516	11	None	GENOMAD.182861.VP	4.397e-89	314	0	0	1	2561	Caudoviricetes	NA	NA	PF05840	Bacteriophage replication gene A protein (GPA)
+NC_015761.1|provirus_3084741_3115735_2839	3111152	3111673	522	-1	0.481	11	None	GENOMAD.170058.VV	8.762e-113	357	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2840	3111670	3111894	225	-1	0.573	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2841	3111894	3112121	228	-1	0.509	11	AGGAG	GENOMAD.071646.VV	8.539e-33	121	0	0	0	2561	Caudoviricetes	NA	NA	PF10809	NA
+NC_015761.1|provirus_3084741_3115735_2842	3112191	3112391	201	-1	0.403	11	GGA/GAG/AGG	GENOMAD.167874.VV	2.606e-40	142	0	0	0	1	NA	NA	NA	NA	NA
+NC_015761.1|provirus_3084741_3115735_2843	3112378	3112605	228	-1	0.482	11	GGAG/GAGG	GENOMAD.087231.VV	3.1e-35	128	0	0	0	2561	Caudoviricetes	NA	NA	PF10893	Bacteriophage 186, Fil
+NC_015761.1|provirus_3084741_3115735_2844	3112613	3113122	510	-1	0.539	11	GGAG/GAGG	GENOMAD.170830.VP	4.59e-76	251	0	0	1	2561	Caudoviricetes	NA	NA	PF06892	Phage regulatory protein CII (CP76)
+NC_015761.1|provirus_3084741_3115735_2845	3113153	3113416	264	-1	0.530	11	GGA/GAG/AGG	GENOMAD.120542.VV	1.195e-50	173	0	0	0	1	NA	NA	NA	PF07618;COG3311;TIGR02405	Putative transcription regulator (DUF1323)
+NC_015761.1|provirus_3084741_3115735_2846	3113547	3114125	579	1	0.454	11	GGA/GAG/AGG	GENOMAD.069724.VV	5.35e-42	154	0	0	0	2561	Caudoviricetes	NA	NA	PF16452	Bacteriophage CI repressor C-terminal domain
+NC_015761.1|provirus_3084741_3115735_2847	3114125	3115162	1038	1	0.489	11	GGAG/GAGG	GENOMAD.212346.VP	5.632e-52	190	0	0	1	2561	Caudoviricetes	NA	NA	PF16452;PF06892;COG1974	Bacteriophage CI repressor C-terminal domain; Phage regulatory protein CII (CP76)
+NC_015761.1|provirus_3084741_3115735_2848	3115400	3115735	336	-1	0.473	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_017033.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,163 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_017033.1|provirus_1052334_1094910_930	1052334	1052537	204	-1	0.647	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_931	1053148	1054167	1020	-1	0.611	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_932	1054169	1054387	219	-1	0.594	11	GGAG/GAGG	GENOMAD.180717.VC	2.645e-13	65	0	0	0	2561	Caudoviricetes	NA	NA	PF13986	NA
+NC_017033.1|provirus_1052334_1094910_933	1054387	1054635	249	-1	0.554	11	GGAGG	GENOMAD.104567.VV	3.707e-07	48	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_934	1054637	1054864	228	-1	0.548	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_935	1054857	1055138	282	-1	0.681	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_936	1055135	1055392	258	-1	0.593	11	GGA/GAG/AGG	GENOMAD.178404.VP	6.067e-41	145	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_937	1055389	1056072	684	-1	0.611	11	GGAGG	GENOMAD.171154.VP	4.943e-50	179	0	0	0	2561	Caudoviricetes	NA	NA	PF13986;PF05551	NA
+NC_017033.1|provirus_1052334_1094910_938	1056069	1056419	351	-1	0.661	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_939	1056446	1056697	252	-1	0.579	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_940	1056715	1057194	480	-1	0.652	11	None	GENOMAD.061727.VV	9.654e-06	47	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_941	1057194	1057496	303	-1	0.571	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_942	1057582	1057857	276	-1	0.620	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_943	1057854	1057982	129	-1	0.636	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_944	1058637	1059326	690	1	0.528	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_945	1059393	1059671	279	1	0.591	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_946	1060095	1060526	432	-1	0.544	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_947	1061139	1061330	192	1	0.542	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_948	1061475	1061768	294	1	0.595	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_949	1061876	1062043	168	-1	0.595	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_950	1062409	1062666	258	1	0.469	11	GGAG/GAGG	GENOMAD.209492.VC	7.51e-09	53	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_951	1062672	1063235	564	1	0.426	11	AGGA	GENOMAD.193207.VC	1.694e-10	62	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_952	1063880	1064236	357	-1	0.594	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_953	1064740	1065435	696	-1	0.593	11	None	GENOMAD.223691.VP	7.797e-07	52	0	0	0	2561	Caudoviricetes	NA	NA	PF16452;COG1974;K22300;TIGR02612	SOS-response transcriptional repressor LexA (RecA-mediated autopeptidase)
+NC_017033.1|provirus_1052334_1094910_954	1065731	1065943	213	1	0.606	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_955	1066043	1066552	510	-1	0.573	11	GGA/GAG/AGG	GENOMAD.177794.VC	4.267e-34	130	0	0	0	2561	Caudoviricetes	NA	NA	PF09639	YjcQ protein
+NC_017033.1|provirus_1052334_1094910_956	1066578	1067204	627	1	0.614	11	None	GENOMAD.120202.VV	1.214e-07	54	0	0	1	1	NA	NA	NA	PF06892	NA
+NC_017033.1|provirus_1052334_1094910_957	1067201	1068190	990	1	0.614	11	GGAGG	GENOMAD.105893.VV	9.514e-13	72	0	0	0	2561	Caudoviricetes	NA	NA	PF07120;COG3756	Uncharacterized conserved protein YdaU, DUF1376 family
+NC_017033.1|provirus_1052334_1094910_958	1068177	1068839	663	1	0.621	11	AGGAG	GENOMAD.073619.VV	0.0005392	43	0	0	0	1	NA	NA	NA	PF11417	Loader and inhibitor of phage G40P
+NC_017033.1|provirus_1052334_1094910_959	1068836	1069036	201	1	0.652	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_960	1069033	1069539	507	1	0.641	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_961	1069536	1069925	390	1	0.672	11	GGAGG	GENOMAD.022482.VV	2.349e-31	120	0	0	0	2561	Caudoviricetes	NA	NA	PF16786	Recombination enhancement, RecA-dependent nuclease
+NC_017033.1|provirus_1052334_1094910_962	1069922	1070419	498	1	0.542	11	GGAGG	GENOMAD.159849.VP	2.603e-19	87	0	0	0	2561	Caudoviricetes	NA	NA	PF07102;PF13264	Putative nuclease YbcO
+NC_017033.1|provirus_1052334_1094910_963	1070416	1070799	384	1	0.669	11	GGAG/GAGG	GENOMAD.194195.VV	4.071e-16	76	0	0	0	2561	Caudoviricetes	NA	NA	PF08774	VRR-NUC domain
+NC_017033.1|provirus_1052334_1094910_964	1070975	1071658	684	1	0.640	11	3Base/5BMM	GENOMAD.069895.VV	4.278e-31	124	0	0	0	2561	Caudoviricetes	NA	NA	PF17302;TIGR02642	Tryptophan RNA-binding attenuator protein inhibitory protein
+NC_017033.1|provirus_1052334_1094910_965	1071772	1072077	306	-1	0.565	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_966	1072058	1072372	315	-1	0.543	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_967	1072433	1072939	507	1	0.615	11	GGA/GAG/AGG	GENOMAD.219399.VP	4.416e-42	153	0	0	0	2561	Caudoviricetes	NA	NA	PF10549;COG3646;TIGR02681	Phage regulatory protein Rha
+NC_017033.1|provirus_1052334_1094910_968	1073003	1073221	219	1	0.612	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_969	1073205	1073681	477	1	0.671	11	GGAG/GAGG	GENOMAD.083189.VV	3.344e-12	66	0	0	1	2561	Caudoviricetes	NA	NA	PF00959;COG3772;K01185	Phage-related lysozyme (muramidase), GH24 family
+NC_017033.1|provirus_1052334_1094910_970	1073681	1074163	483	1	0.656	11	GGAG/GAGG	GENOMAD.077452.VV	3.762e-11	63	0	0	1	2561	Caudoviricetes	NA	NA	PF03245;K14744	Bacteriophage Rz lysis protein
+NC_017033.1|provirus_1052334_1094910_971	1074160	1074501	342	1	0.675	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_972	1074715	1075245	531	1	0.629	11	GGA/GAG/AGG	GENOMAD.161251.VP	3.022e-32	125	0	0	1	2561	Caudoviricetes	NA	NA	PF07471;K22014;COG4220	Phage DNA packaging protein, Nu1 subunit of terminase
+NC_017033.1|provirus_1052334_1094910_973	1075220	1077124	1905	1	0.637	11	AGGA	GENOMAD.129396.VP	3.658e-61	227	0	0	1	2561	Caudoviricetes	NA	NA	PF20454	Terminase large subunit gpA, endonuclease domain
+NC_017033.1|provirus_1052334_1094910_974	1077125	1077361	237	1	0.662	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_975	1077361	1078962	1602	1	0.670	11	None	GENOMAD.019804.VV	6.033e-91	312	0	0	1	2561	Caudoviricetes	NA	NA	PF05136;TIGR01539;COG5511	phage portal protein, lambda family
+NC_017033.1|provirus_1052334_1094910_976	1078962	1080191	1230	1	0.686	11	AGGAG	GENOMAD.160855.VP	4.845e-09	61	0	0	0	2561	Caudoviricetes	NA	NA	PF00574;TIGR00706;COG0740	signal peptide peptidase SppA, 36K type
+NC_017033.1|provirus_1052334_1094910_977	1080191	1080607	417	1	0.686	11	AGGAG	GENOMAD.191487.VP	3.287e-14	71	0	0	0	1	NA	NA	NA	PF02924	Bacteriophage lambda head decoration protein D
+NC_017033.1|provirus_1052334_1094910_978	1080672	1081673	1002	1	0.618	11	GGA/GAG/AGG	GENOMAD.124233.VP	2.33e-71	246	0	0	1	2561	Caudoviricetes	NA	NA	PF03864	Phage major capsid protein E
+NC_017033.1|provirus_1052334_1094910_979	1081673	1081981	309	1	0.650	11	None	GENOMAD.092349.VV	3.404e-39	141	0	0	0	1	NA	NA	NA	PF13856	ATP-binding sugar transporter from pro-phage
+NC_017033.1|provirus_1052334_1094910_980	1081978	1082574	597	1	0.657	11	GGAG/GAGG	GENOMAD.066423.VV	4.833e-81	267	0	0	1	2561	Caudoviricetes	NA	NA	PF06763	Prophage minor tail protein Z (GPZ)
+NC_017033.1|provirus_1052334_1094910_981	1082571	1083152	582	1	0.634	11	GGA/GAG/AGG	GENOMAD.065270.VV	5.57e-42	154	0	0	1	2561	Caudoviricetes	NA	NA	PF09646	Gp37 protein
+NC_017033.1|provirus_1052334_1094910_982	1083127	1083714	588	1	0.675	11	AGGAG	GENOMAD.162066.VP	1.032e-44	162	0	0	1	2561	Caudoviricetes	NA	NA	PF04717;COG4540;TIGR01644	Phage P2 baseplate assembly protein gpV
+NC_017033.1|provirus_1052334_1094910_983	1083725	1084081	357	1	0.672	11	GGA/GAG/AGG	GENOMAD.099345.VV	3.147e-06	47	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_984	1084078	1084407	330	1	0.636	11	GGA/GAG/AGG	GENOMAD.136378.VP	5.237e-38	138	0	0	1	2561	Caudoviricetes	NA	NA	PF05136;PF04965;TIGR01539;K06903;COG5511	phage portal protein, lambda family
+NC_017033.1|provirus_1052334_1094910_985	1084404	1085288	885	1	0.655	11	GGA/GAG/AGG	GENOMAD.105501.VV	4.427e-74	252	0	0	1	2561	Caudoviricetes	NA	NA	PF03434;COG3948	Phage-related baseplate assembly protein
+NC_017033.1|provirus_1052334_1094910_986	1085281	1085826	546	1	0.663	11	GGA/GAG/AGG	GENOMAD.114503.VV	4.33e-30	119	0	0	1	2561	Caudoviricetes	NA	NA	PF09684;COG4385;TIGR01634	Bacteriophage P2-related tail formation protein
+NC_017033.1|provirus_1052334_1094910_987	1085826	1087793	1968	1	0.613	11	GGAG/GAGG	GENOMAD.208390.VP	2.441e-59	222	0	0	1	2561	Caudoviricetes	NA	NA	COG5301	Phage-related tail fibre protein
+NC_017033.1|provirus_1052334_1094910_988	1087794	1088279	486	1	0.646	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1052334_1094910_989	1088349	1089569	1221	1	0.649	11	GGAG/GAGG	GENOMAD.218214.VV	7.277e-53	195	0	0	1	2561	Caudoviricetes	NA	NA	PF17541;COG3497	Phage tail sheath protein FI
+NC_017033.1|provirus_1052334_1094910_990	1089579	1090082	504	1	0.647	11	AGGAG	GENOMAD.099825.VV	1.006e-10	62	0	0	1	2561	Caudoviricetes	NA	NA	PF04985;K06908;COG3498;TIGR01611	Phage tail tube protein FII
+NC_017033.1|provirus_1052334_1094910_991	1090092	1090415	324	1	0.623	11	AGGAG	GENOMAD.073828.VV	1.34e-19	85	0	0	1	2561	Caudoviricetes	NA	NA	PF10109	Phage tail assembly chaperone proteins, E, or 41 or 14
+NC_017033.1|provirus_1052334_1094910_992	1090522	1092840	2319	1	0.658	11	GGA/GAG/AGG	GENOMAD.141796.VV	3.591e-106	366	0	0	1	11124	Peduoviridae	NA	NA	COG3941	Phage tail tape-measure protein, controls tail length
+NC_017033.1|provirus_1052334_1094910_993	1092844	1093686	843	1	0.637	11	None	GENOMAD.124222.VP	1.683e-115	371	0	0	0	2561	Caudoviricetes	NA	NA	K06906;COG3499	Phage protein U
+NC_017033.1|provirus_1052334_1094910_994	1093661	1093867	207	1	0.614	11	GGA/GAG/AGG	GENOMAD.159179.VP	5.502e-12	61	0	0	1	2561	Caudoviricetes	NA	NA	COG5004;K06370	P2-like prophage tail protein X
+NC_017033.1|provirus_1052334_1094910_995	1093858	1094910	1053	1	0.633	11	GGAG/GAGG	GENOMAD.158351.VP	2.572e-37	147	0	0	1	2561	Caudoviricetes	NA	NA	PF05954;K06905;COG3500;TIGR03361	Phage protein D
+NC_017033.1|provirus_1557694_1600481_1419	1557694	1557981	288	-1	0.594	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1420	1557981	1558169	189	-1	0.598	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1421	1558169	1558477	309	-1	0.511	11	GGAG/GAGG	GENOMAD.060822.VV	8.986e-06	45	0	0	0	10823	Zobellviridae	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1422	1558474	1558842	369	-1	0.547	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1423	1558835	1559113	279	-1	0.692	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1424	1559113	1559442	330	-1	0.542	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1425	1559439	1561094	1656	-1	0.650	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1426	1561091	1561423	333	-1	0.604	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1427	1561433	1561660	228	-1	0.623	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1428	1561663	1563417	1755	-1	0.613	11	GGAGG	GENOMAD.151126.VP	2.362e-52	199	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1429	1563414	1564154	741	-1	0.592	11	AGGAG	GENOMAD.119436.VP	4.501e-07	53	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;TIGR00616;K07455;COG3723	recombinase, phage RecT family
+NC_017033.1|provirus_1557694_1600481_1430	1564207	1564491	285	-1	0.614	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1431	1564488	1564682	195	-1	0.579	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1432	1564679	1564894	216	-1	0.560	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1433	1564891	1565016	126	-1	0.619	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1434	1565064	1565897	834	-1	0.625	11	GGAG/GAGG	GENOMAD.115107.VV	1.94e-45	168	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1435	1566063	1566449	387	-1	0.618	11	AGGAG	GENOMAD.094188.VV	1.81e-25	103	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1436	1566860	1567096	237	1	0.624	11	AGGAGG	GENOMAD.189851.VV	5.539e-09	53	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1437	1567124	1567516	393	-1	0.555	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1438	1567963	1568715	753	-1	0.463	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1439	1568715	1569317	603	-1	0.580	11	GGA/GAG/AGG	GENOMAD.205774.CP	1.338e-70	237	0	0	0	1	NA	NA	NA	PF08000;PF20612	Bacterial PH domain; SHOCT domain
+NC_017033.1|provirus_1557694_1600481_1440	1569343	1569669	327	-1	0.557	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1441	1569750	1569992	243	1	0.560	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1442	1570044	1570337	294	-1	0.565	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1443	1570557	1570766	210	1	0.581	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1444	1570759	1571061	303	1	0.644	11	GGAG/GAGG	GENOMAD.045996.VV	6.818e-47	163	0	0	0	2561	Caudoviricetes	NA	NA	PF09012;TIGR02702;COG1777	FeoC like transcriptional regulator
+NC_017033.1|provirus_1557694_1600481_1445	1571058	1571933	876	1	0.604	11	None	GENOMAD.208559.VP	0.0002331	45	0	0	0	2561	Caudoviricetes	NA	NA	PF13730;COG5529;TIGR01610	Pyocin large subunit
+NC_017033.1|provirus_1557694_1600481_1446	1571920	1572411	492	1	0.673	11	GGA/GAG/AGG	GENOMAD.166457.VP	3.827e-75	248	0	0	1	2561	Caudoviricetes	NA	NA	PF06992	Replication protein P
+NC_017033.1|provirus_1557694_1600481_1447	1572408	1572614	207	1	0.628	11	GGAG/GAGG	GENOMAD.063929.VV	1.765e-08	51	0	0	0	2561	Caudoviricetes	NA	NA	PF05810;COG4068	Predicted nucleic acid-binding protein, contains Zn-ribbon domain
+NC_017033.1|provirus_1557694_1600481_1448	1572611	1572808	198	1	0.535	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1449	1572805	1572999	195	1	0.651	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1450	1572996	1573445	450	1	0.631	11	GGAG/GAGG	GENOMAD.061349.VV	2.093e-91	294	0	0	0	2561	Caudoviricetes	NA	NA	PF05772	NinB protein
+NC_017033.1|provirus_1557694_1600481_1451	1573594	1573941	348	1	0.609	11	GGAG/GAGG	GENOMAD.036842.VV	1.144e-24	100	0	0	0	2561	Caudoviricetes	NA	NA	PF07102	Putative nuclease YbcO
+NC_017033.1|provirus_1557694_1600481_1452	1573938	1574111	174	1	0.672	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1453	1574111	1574446	336	1	0.631	11	GGAGG	GENOMAD.040593.VV	7.087e-28	109	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1454	1574449	1575066	618	1	0.638	11	GGA/GAG/AGG	GENOMAD.069895.VV	4.385e-31	123	0	0	0	2561	Caudoviricetes	NA	NA	PF17302;TIGR02642	Tryptophan RNA-binding attenuator protein inhibitory protein
+NC_017033.1|provirus_1557694_1600481_1455	1575159	1575422	264	-1	0.462	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1456	1575504	1576007	504	1	0.631	11	None	GENOMAD.044304.VV	3.936e-34	130	0	0	0	5262	Schitoviridae	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1457	1575998	1576297	300	1	0.623	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1458	1576294	1576560	267	1	0.596	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1459	1576756	1577097	342	1	0.591	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1460	1577111	1577446	336	1	0.652	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1461	1577458	1577721	264	1	0.633	11	AGxAGG/AGGxGG	GENOMAD.077615.VV	2.28e-06	46	0	0	0	7278	Salasmaviridae	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1462	1577734	1578405	672	1	0.613	11	GGAG/GAGG	GENOMAD.076022.VV	5.673e-65	222	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1463	1578350	1579906	1557	1	0.615	11	AGxAGG/AGGxGG	GENOMAD.013124.VV	7.041e-150	483	0	0	1	377	Drexlerviridae	NA	NA	PF13262;COG5410	NA
+NC_017033.1|provirus_1557694_1600481_1464	1579903	1581441	1539	1	0.640	11	AGGA/GGAG/GAGG	GENOMAD.003432.VV	5.04e-57	211	0	0	1	2561	Caudoviricetes	NA	NA	PF06381;K09961;TIGR01555;COG3567	phage-related protein, HI1409 family
+NC_017033.1|provirus_1557694_1600481_1465	1581398	1582051	654	1	0.636	11	3Base/5BMM	GENOMAD.083949.VV	7.556e-40	149	0	0	1	2561	Caudoviricetes	NA	NA	PF04233;COG2369;TIGR01641	Uncharacterized conserved protein, contains phage Mu gpF-like domain
+NC_017033.1|provirus_1557694_1600481_1466	1582189	1582368	180	1	0.517	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1467	1582429	1583739	1311	1	0.652	11	None	GENOMAD.099067.VP	2.252e-113	373	0	0	0	2561	Caudoviricetes	NA	NA	PF09979;K09960;COG3566	NA
+NC_017033.1|provirus_1557694_1600481_1468	1583749	1584243	495	1	0.657	11	AGGAG	GENOMAD.033203.VV	1.156e-46	166	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1469	1584321	1585328	1008	1	0.626	11	GGAG/GAGG	GENOMAD.085797.VV	1.048e-165	519	0	0	0	2561	Caudoviricetes	NA	NA	PF09950;COG4834	Encapsulating protein for peroxidase
+NC_017033.1|provirus_1557694_1600481_1470	1585339	1585563	225	1	0.649	11	AGGAG	GENOMAD.170487.VV	4.114e-10	56	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1471	1585541	1585936	396	1	0.634	11	GGAG/GAGG	GENOMAD.005453.VV	5.437e-56	191	0	0	1	2561	Caudoviricetes	NA	NA	PF11863;COG4386	Mu-like prophage tail sheath protein gpL
+NC_017033.1|provirus_1557694_1600481_1472	1585933	1586475	543	1	0.641	11	GGxGG	GENOMAD.008778.VV	5.955e-53	185	0	0	1	2561	Caudoviricetes	NA	NA	PF05069;COG5005;TIGR01635	NA
+NC_017033.1|provirus_1557694_1600481_1473	1586475	1586858	384	1	0.630	11	GGAGG	GENOMAD.040078.VV	2.69e-45	160	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1474	1586851	1587405	555	1	0.632	11	GGAGG	GENOMAD.023692.VV	7.854e-43	156	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1475	1587409	1588893	1485	1	0.640	11	GGAG/GAGG	GENOMAD.005453.VV	4.878e-99	334	0	0	1	2561	Caudoviricetes	NA	NA	PF11863;COG4386	Mu-like prophage tail sheath protein gpL
+NC_017033.1|provirus_1557694_1600481_1476	1588902	1589342	441	1	0.603	11	GGAG/GAGG	GENOMAD.017010.VV	3.75e-67	224	0	0	0	2561	Caudoviricetes	NA	NA	PF11681	Bacteriophage KPP10, Structural protein ORF10
+NC_017033.1|provirus_1557694_1600481_1477	1589353	1589742	390	1	0.633	11	GGAG/GAGG	GENOMAD.055746.VV	7.707e-27	107	0	0	1	2561	Caudoviricetes	NA	NA	PF10876	Phage tail assembly chaperone protein, TAC
+NC_017033.1|provirus_1557694_1600481_1478	1589936	1592188	2253	1	0.603	11	GGA/GAG/AGG	GENOMAD.015777.VV	2.615e-80	288	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1479	1592185	1592805	621	1	0.589	11	GGA/GAG/AGG	GENOMAD.017318.VV	4.715e-50	178	0	0	0	2561	Caudoviricetes	NA	NA	COG3499	NA
+NC_017033.1|provirus_1557694_1600481_1480	1592809	1593123	315	1	0.571	11	GGAGG	GENOMAD.105312.VV	3.054e-41	147	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1481	1593120	1594067	948	1	0.593	11	None	GENOMAD.123309.VP	2.371e-34	137	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1482	1594067	1594726	660	1	0.621	11	None	GENOMAD.006053.VV	1.581e-30	122	0	0	1	2561	Caudoviricetes	NA	NA	PF18352;COG4540;TIGR01644	Phage protein Gp138 N-terminal domain
+NC_017033.1|provirus_1557694_1600481_1483	1594729	1595076	348	1	0.575	11	GGA/GAG/AGG	GENOMAD.009002.VV	2.079e-42	151	0	0	1	2561	Caudoviricetes	NA	NA	PF10934;COG3628	Phage baseplate assembly protein W
+NC_017033.1|provirus_1557694_1600481_1484	1595073	1596251	1179	1	0.611	11	GGAGG	GENOMAD.005285.VV	1.352e-45	173	0	0	0	2561	Caudoviricetes	NA	NA	PF03434;COG3299	Uncharacterized phage protein gp47/JayE
+NC_017033.1|provirus_1557694_1600481_1485	1596248	1596832	585	1	0.581	11	GGxGG	GENOMAD.008482.VV	3.01e-67	227	0	0	1	2561	Caudoviricetes	NA	NA	PF11041;TIGR02242	Bacteriophage Mu-like, Gp48
+NC_017033.1|provirus_1557694_1600481_1486	1596899	1598707	1809	1	0.603	11	GGAG/GAGG	GENOMAD.051520.VV	3.018e-18	92	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1487	1598708	1599193	486	1	0.652	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1488	1599313	1599489	177	1	0.548	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_1557694_1600481_1489	1599510	1600481	972	-1	0.571	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1926	2089294	2090280	987	-1	0.612	11	GGA/GAG/AGG	GENOMAD.147153.VV	7.117e-20	94	0	0	0	2561	Caudoviricetes	NA	NA	PF07120;COG3756	Uncharacterized conserved protein YdaU, DUF1376 family
+NC_017033.1|provirus_2089294_2107522_1927	2090277	2090723	447	-1	0.649	11	GGA/GAG/AGG	GENOMAD.220574.VP	9.96e-24	99	0	0	1	2561	Caudoviricetes	NA	NA	PF06892	Phage regulatory protein CII (CP76)
+NC_017033.1|provirus_2089294_2107522_1928	2090810	2091313	504	1	0.597	11	None	GENOMAD.226021.VP	3.576e-86	280	0	0	0	2561	Caudoviricetes	NA	NA	PF14205	NA
+NC_017033.1|provirus_2089294_2107522_1929	2091539	2092288	750	1	0.575	11	GGA/GAG/AGG	GENOMAD.179157.VV	8.047e-05	46	0	0	0	1	NA	NA	NA	PF18090;TIGR00673;K22300;COG5606	cyanase
+NC_017033.1|provirus_2089294_2107522_1930	2092428	2093327	900	1	0.390	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1931	2093272	2093736	465	1	0.443	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1932	2094023	2094286	264	1	0.549	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1933	2094513	2095400	888	1	0.418	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1934	2096207	2096452	246	1	0.610	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1935	2096599	2096730	132	1	0.568	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1936	2096727	2097047	321	1	0.626	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1937	2097044	2097382	339	1	0.540	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1938	2097379	2097660	282	1	0.621	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1939	2097713	2098534	822	1	0.584	11	AGGAG	GENOMAD.192631.VV	3.816e-31	126	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;TIGR01913	RecT family
+NC_017033.1|provirus_2089294_2107522_1940	2098531	2100282	1752	1	0.619	11	GGAGG	GENOMAD.151126.VP	1.22e-60	224	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1941	2100285	2100512	228	1	0.623	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1942	2100522	2100854	333	1	0.568	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1943	2100851	2101072	222	1	0.622	11	GGAG/GAGG	GENOMAD.224342.VP	6.345e-06	44	0	0	0	2561	Caudoviricetes	NA	NA	PF09035;COG3311	Predicted DNA-binding transcriptional regulator AlpA
+NC_017033.1|provirus_2089294_2107522_1944	2101069	2101995	927	-1	0.592	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1945	2102598	2104394	1797	-1	0.681	11	GGAG/GAGG	GENOMAD.005687.VV	3.84e-08	59	0	0	0	2561	Caudoviricetes	NA	NA	COG5519;K02334	NA
+NC_017033.1|provirus_2089294_2107522_1946	2104375	2105307	933	-1	0.681	11	GGAGG	GENOMAD.166800.VP	1.166e-23	105	0	0	0	2561	Caudoviricetes	NA	NA	COG4643	Uncharacterized domain associated with phage/plasmid primase
+NC_017033.1|provirus_2089294_2107522_1947	2105304	2105672	369	-1	0.629	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1948	2105669	2106016	348	-1	0.655	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1949	2106013	2106468	456	-1	0.623	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_017033.1|provirus_2089294_2107522_1950	2106551	2107522	972	-1	0.631	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_017095.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_018014.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_018068.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,86 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_018068.1|provirus_1361108_1399802_1216	1361108	1361524	417	-1	0.372	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1217	1361850	1362134	285	1	0.456	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1218	1362138	1362350	213	1	0.465	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1219	1362514	1363338	825	1	0.421	11	AGGAG(G)/GGAGG	GENOMAD.133073.VP	4.745e-26	111	0	0	0	2561	Caudoviricetes	NA	NA	PF03374;COG3645	Phage antirepressor protein YoqD, KilAC domain
+NC_018068.1|provirus_1361108_1399802_1220	1363335	1364579	1245	1	0.426	11	3Base/5BMM	GENOMAD.014802.VV	5.219e-14	77	0	0	0	2561	Caudoviricetes	NA	NA	PF00176;K20093;COG1061;TIGR04095	Superfamily II DNA or RNA helicase
+NC_018068.1|provirus_1361108_1399802_1221	1364572	1364856	285	1	0.456	11	AGGA	GENOMAD.062524.VV	5.888e-30	114	0	0	0	2561	Caudoviricetes	NA	NA	PF03838;COG3331;TIGR00648;K03552	Penicillin-binding protein-related factor A, putative recombinase
+NC_018068.1|provirus_1361108_1399802_1222	1364853	1366520	1668	1	0.430	11	3Base/5BMM	GENOMAD.016341.VV	2.768e-209	657	0	0	1	2561	Caudoviricetes	NA	NA	PF13479;PF12684;TIGR01618;K07465;COG1468	phage nucleotide-binding protein
+NC_018068.1|provirus_1361108_1399802_1223	1366538	1366987	450	1	0.389	11	AGGAG/GGAGG	GENOMAD.031678.VV	6.602e-29	114	0	0	0	2561	Caudoviricetes	NA	NA	PF05037	NA
+NC_018068.1|provirus_1361108_1399802_1224	1367256	1368950	1695	1	0.433	11	GGAG/GAGG	GENOMAD.102034.VP	2.969e-108	364	0	0	0	2561	Caudoviricetes	NA	NA	TIGR01636	NA
+NC_018068.1|provirus_1361108_1399802_1225	1369137	1371011	1875	1	0.415	11	GGAGG	GENOMAD.024099.VV	5.474e-55	208	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1226	1371524	1371904	381	1	0.428	11	GGAGG	GENOMAD.192072.VP	2.313e-13	68	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1227	1372021	1372473	453	1	0.406	11	AGGAGG	GENOMAD.076519.VV	2.465e-40	147	0	0	0	2561	Caudoviricetes	NA	NA	PF05263;TIGR01636;COG2739;K01994	phage transcriptional activator, RinA family
+NC_018068.1|provirus_1361108_1399802_1228	1372631	1372819	189	1	0.402	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1229	1372954	1373160	207	1	0.469	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1230	1373168	1373524	357	1	0.473	11	AGxAGG/AGGxGG	GENOMAD.045242.VV	1.014e-10	60	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1231	1373710	1374237	528	1	0.460	11	AGxAGG/AGGxGG	GENOMAD.098194.VV	3.009e-58	200	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_018068.1|provirus_1361108_1399802_1232	1374300	1375553	1254	1	0.433	11	GGAG/GAGG	GENOMAD.038338.VV	1.076e-29	126	0	0	0	2561	Caudoviricetes	NA	NA	COG3392	NA
+NC_018068.1|provirus_1361108_1399802_1233	1375834	1376358	525	1	0.375	11	None	GENOMAD.133508.VP	1.117e-12	68	0	0	0	2561	Caudoviricetes	NA	NA	PF13392	HNH endonuclease
+NC_018068.1|provirus_1361108_1399802_1234	1376401	1376586	186	1	0.489	11	GGA/GAG/AGG	GENOMAD.209016.VC	3.22e-07	47	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1235	1376590	1377405	816	1	0.433	11	AGxAGG/AGGxGG	GENOMAD.105515.VV	4.177e-12	69	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1236	1377405	1377644	240	1	0.442	11	AGGAGG	GENOMAD.225559.VP	1.638e-13	66	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1237	1377747	1377998	252	-1	0.413	11	AGGAGG	GENOMAD.197050.CP	0.0001087	41	0	0	0	1	NA	NA	NA	PF19124	NA
+NC_018068.1|provirus_1361108_1399802_1238	1378174	1378383	210	1	0.348	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1239	1378503	1380050	1548	1	0.468	11	GGA/GAG/AGG	GENOMAD.190509.VP	4.55e-66	238	0	0	1	2561	Caudoviricetes	NA	NA	PF03354;COG4626	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_018068.1|provirus_1361108_1399802_1240	1380176	1381339	1164	1	0.456	11	None	GENOMAD.179073.VP	5.583e-45	171	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1241	1381339	1382406	1068	1	0.465	11	GGA/GAG/AGG	GENOMAD.158277.VP	6.708e-34	137	0	0	0	2561	Caudoviricetes	NA	NA	PF00574;PF19602;K01358;TIGR00493;COG3904	ATP-dependent Clp endopeptidase, proteolytic subunit ClpP
+NC_018068.1|provirus_1361108_1399802_1242	1382396	1383670	1275	1	0.469	11	AGGAG	GENOMAD.092606.VV	1.506e-40	159	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;COG4653;TIGR01554	Predicted phage phi-C31 gp36 major capsid-like protein
+NC_018068.1|provirus_1361108_1399802_1243	1383704	1384180	477	1	0.486	11	AGGAGG	GENOMAD.077304.VV	2.485e-35	133	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1244	1384255	1384848	594	1	0.468	11	AGGA	GENOMAD.067701.VV	2.482e-44	161	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR02215	phage conserved hypothetical protein, phiE125 gp8 family
+NC_018068.1|provirus_1361108_1399802_1245	1384864	1385193	330	1	0.412	11	GGxGG	GENOMAD.027939.VV	2.94e-20	87	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;COG5614;TIGR01563	Bacteriophage head-tail adaptor
+NC_018068.1|provirus_1361108_1399802_1246	1385186	1385599	414	1	0.435	11	GGAG/GAGG	GENOMAD.018908.VV	5.448e-17	79	0	0	1	2561	Caudoviricetes	NA	NA	PF04883;TIGR01725;COG5005	Bacteriophage HK97-gp10, putative tail-component
+NC_018068.1|provirus_1361108_1399802_1247	1385599	1386033	435	1	0.414	11	GGA/GAG/AGG	GENOMAD.029331.VV	3.675e-58	198	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1248	1386037	1387104	1068	1	0.463	11	AGGAGG	GENOMAD.014203.VV	9.347e-74	254	0	0	1	2561	Caudoviricetes	NA	NA	PF04984;PF17482;COG4386	Mu-like prophage tail sheath protein gpL
+NC_018068.1|provirus_1361108_1399802_1249	1387116	1387544	429	1	0.471	11	GGAGG	GENOMAD.008035.VV	8.025e-49	171	0	0	1	2561	Caudoviricetes	NA	NA	PF09393	Phage tail tube protein
+NC_018068.1|provirus_1361108_1399802_1250	1387599	1388000	402	1	0.443	11	GGAGG	GENOMAD.020710.VV	1.165e-40	147	0	0	1	2561	Caudoviricetes	NA	NA	PF08890	Phage XkdN-like tail assembly chaperone protein, TAC
+NC_018068.1|provirus_1361108_1399802_1251	1388204	1390375	2172	1	0.472	11	GGA/GAG/AGG	GENOMAD.117212.VP	4.285e-62	232	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1252	1390388	1390792	405	1	0.432	11	AGxAGG/AGGxGG	GENOMAD.025221.VV	2.91e-72	238	0	0	0	2561	Caudoviricetes	NA	NA	PF06995;COG1652	Nucleoid-associated protein YgaU, contains BON and LysM domains
+NC_018068.1|provirus_1361108_1399802_1253	1390789	1391781	993	1	0.438	11	GGA/GAG/AGG	GENOMAD.020668.VV	8.021e-51	186	0	0	1	2561	Caudoviricetes	NA	NA	PF05954;COG4379;K06905;TIGR03361	Mu-like prophage tail protein gpP
+NC_018068.1|provirus_1361108_1399802_1254	1391791	1392159	369	1	0.439	11	GGAG/GAGG	GENOMAD.046601.VV	4.306e-46	162	0	0	0	2561	Caudoviricetes	NA	NA	PF10844	NA
+NC_018068.1|provirus_1361108_1399802_1255	1392156	1392587	432	1	0.431	11	GGA/GAG/AGG	GENOMAD.015505.VV	4.579e-47	166	0	0	0	2561	Caudoviricetes	NA	NA	PF10934;COG4381	Mu-like prophage protein gp46
+NC_018068.1|provirus_1361108_1399802_1256	1392580	1393653	1074	1	0.465	11	GGAG/GAGG	GENOMAD.110264.VV	3.326e-30	126	0	0	1	2561	Caudoviricetes	NA	NA	PF04865;COG3948	Phage-related baseplate assembly protein
+NC_018068.1|provirus_1361108_1399802_1257	1393646	1394167	522	1	0.423	11	GGxGG	GENOMAD.018612.VV	1.342e-21	94	0	0	1	2561	Caudoviricetes	NA	NA	PF10076;COG3778;TIGR02242	Uncharacterized protein YmfQ in lambdoid prophage, DUF2313 family
+NC_018068.1|provirus_1361108_1399802_1258	1394168	1394734	567	1	0.497	11	GGAGG	GENOMAD.069954.VV	8.47e-44	159	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1259	1394734	1395069	336	1	0.476	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1260	1395078	1396721	1644	1	0.485	11	GGA/GAG/AGG	GENOMAD.140563.VP	5.937e-15	81	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1261	1396735	1397073	339	1	0.416	11	AGxAGG/AGGxGG	GENOMAD.213587.VP	1.005e-16	77	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1262	1397074	1397211	138	1	0.348	11	AGGAGG	GENOMAD.042441.VV	4.212e-05	40	0	0	0	2561	Caudoviricetes	NA	NA	PF09693;TIGR01669	phage uncharacterized protein, XkdX family
+NC_018068.1|provirus_1361108_1399802_1263	1397268	1397507	240	1	0.475	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1264	1397695	1398015	321	1	0.442	11	AGGAGG	GENOMAD.130222.VV	2.136e-14	70	0	0	0	2561	Caudoviricetes	NA	NA	COG3105	NA
+NC_018068.1|provirus_1361108_1399802_1265	1397993	1398478	486	1	0.440	11	GGA/GAG/AGG	GENOMAD.151608.VV	2.569e-36	136	0	0	0	2561	Caudoviricetes	NA	NA	PF19988	NA
+NC_018068.1|provirus_1361108_1399802_1266	1398599	1399372	774	1	0.464	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_1361108_1399802_1267	1399389	1399802	414	1	0.415	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1928	2072558	2072734	177	1	0.429	11	AGGAGG	GENOMAD.222548.VP	1.604e-05	42	0	0	0	1	NA	NA	NA	PF06806;COG3311;TIGR01764	Predicted DNA-binding transcriptional regulator AlpA
+NC_018068.1|provirus_2072558_2098541_1929	2072878	2073066	189	1	0.386	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1930	2073461	2073664	204	1	0.446	11	4Base/6BMM	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1931	2073775	2073921	147	1	0.388	11	AGGAG(G)/GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1932	2073908	2074774	867	1	0.468	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1933	2074771	2077260	2490	1	0.472	11	AGGAG/GGAGG	GENOMAD.021366.VV	4.949e-07	56	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1934	2077248	2077511	264	1	0.383	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1935	2078510	2078722	213	1	0.418	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1936	2078760	2078948	189	1	0.381	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1937	2078967	2079275	309	1	0.463	11	None	GENOMAD.037442.VV	3.636e-15	72	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1938	2081715	2081849	135	1	0.222	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1939	2081855	2081998	144	1	0.250	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1940	2082018	2082221	204	1	0.353	11	AGGAG/GGAGG	GENOMAD.220824.VP	3.347e-09	53	0	0	0	2561	Caudoviricetes	NA	NA	PF18903	NA
+NC_018068.1|provirus_2072558_2098541_1941	2082224	2082352	129	1	0.271	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1942	2082428	2082634	207	1	0.329	11	GGAG/GAGG	GENOMAD.207723.VP	1.947e-14	68	0	0	1	2561	Caudoviricetes	NA	NA	PF10960	BhlA holin family
+NC_018068.1|provirus_2072558_2098541_1943	2082649	2083065	417	1	0.336	11	AGGAG	GENOMAD.126365.VV	7.377e-48	168	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1944	2083107	2083994	888	1	0.370	11	AGxAGG/AGGxGG	GENOMAD.136497.VV	4.06e-55	197	0	0	0	2561	Caudoviricetes	NA	NA	PF17236	Phage capsid-like protein
+NC_018068.1|provirus_2072558_2098541_1945	2084087	2084278	192	1	0.344	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1946	2084442	2085254	813	1	0.332	11	None	GENOMAD.225339.VP	2.875e-113	364	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1947	2085426	2086922	1497	1	0.279	11	AGGA	GENOMAD.225126.VP	2.658e-245	758	0	0	0	2561	Caudoviricetes	NA	NA	PF06862;TIGR01587;COG4098;K17677	CRISPR-associated helicase Cas3
+NC_018068.1|provirus_2072558_2098541_1948	2087352	2087744	393	1	0.308	11	AGGAG	GENOMAD.142024.VV	3.756e-43	154	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1949	2087741	2089312	1572	1	0.344	11	3Base/5BMM	GENOMAD.180947.VP	4.422e-38	154	0	0	1	2561	Caudoviricetes	NA	NA	PF04466;COG5323;TIGR01547;K21523	Large terminase phage packaging protein
+NC_018068.1|provirus_2072558_2098541_1950	2089329	2090789	1461	1	0.332	11	GGA/GAG/AGG	GENOMAD.003260.VV	2.398e-204	639	0	0	1	2561	Caudoviricetes	NA	NA	PF05133;TIGR01538;COG3567	phage portal protein, SPP1 family
+NC_018068.1|provirus_2072558_2098541_1951	2091361	2091654	294	-1	0.344	11	AGGAGG	GENOMAD.213863.VC	0.00091	39	0	0	0	1	NA	NA	NA	PF05810;COG4068;TIGR01206;K21463	Predicted nucleic acid-binding protein, contains Zn-ribbon domain
+NC_018068.1|provirus_2072558_2098541_1952	2091691	2092041	351	-1	0.325	11	AGGAG	GENOMAD.223401.VP	5.93e-32	121	0	0	0	2561	Caudoviricetes	NA	NA	PF09851	NA
+NC_018068.1|provirus_2072558_2098541_1953	2092685	2093926	1242	1	0.465	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1954	2094078	2094944	867	-1	0.330	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1955	2095132	2095350	219	1	0.311	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1956	2095375	2095635	261	1	0.257	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1957	2095704	2096051	348	1	0.307	11	AGGAGG	GENOMAD.220167.VP	1.032e-41	149	0	0	0	2561	Caudoviricetes	NA	NA	PF20449	NA
+NC_018068.1|provirus_2072558_2098541_1958	2096068	2097186	1119	1	0.344	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1959	2097227	2097439	213	-1	0.315	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018068.1|provirus_2072558_2098541_1960	2097555	2098541	987	-1	0.330	11	GGA/GAG/AGG	GENOMAD.214049.VP	0.0005959	44	0	0	0	2561	Caudoviricetes	NA	NA	PF00589;TIGR02224;COG4973;K03733	tyrosine recombinase XerC
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_018515.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,75 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_018515.1|provirus_3418112_3436097_3127	3418112	3418687	576	-1	0.474	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3128	3418979	3419323	345	-1	0.412	11	GGAGG	GENOMAD.178485.VV	8.068e-52	178	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3129	3419421	3420176	756	-1	0.463	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3130	3420203	3420451	249	-1	0.434	11	AGGA	GENOMAD.042597.VV	2.985e-31	117	0	0	0	2561	Caudoviricetes	NA	NA	PF10779	Haemolysin XhlA
+NC_018515.1|provirus_3418112_3436097_3131	3420532	3420702	171	-1	0.316	11	AGGAGG	GENOMAD.019319.VV	0.0001663	39	0	0	0	2561	Caudoviricetes	NA	NA	PF09693;TIGR01669	phage uncharacterized protein, XkdX family
+NC_018515.1|provirus_3418112_3436097_3132	3420716	3421015	300	-1	0.360	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3133	3421030	3422109	1080	-1	0.488	11	AGGAG	GENOMAD.010477.VV	1.931e-16	84	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3134	3422122	3422733	612	-1	0.431	11	AGxAGG/AGGxGG	GENOMAD.018612.VV	2.241e-57	199	0	0	1	2561	Caudoviricetes	NA	NA	PF10076;COG3778;TIGR02242	Uncharacterized protein YmfQ in lambdoid prophage, DUF2313 family
+NC_018515.1|provirus_3418112_3436097_3135	3422739	3423455	717	-1	0.480	11	GGAGG	GENOMAD.072355.VV	1.988e-75	253	0	0	0	5262	Schitoviridae	NA	NA	PF18454	Major tropism determinant N-terminal domain
+NC_018515.1|provirus_3418112_3436097_3136	3423468	3424490	1023	-1	0.475	11	AGGAGG	GENOMAD.072355.VV	2.41e-07	55	0	0	0	5262	Schitoviridae	NA	NA	PF18454	Major tropism determinant N-terminal domain
+NC_018515.1|provirus_3418112_3436097_3137	3424494	3424907	414	-1	0.435	11	GGxGG	GENOMAD.105081.VV	2.709e-66	221	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3138	3424912	3425949	1038	-1	0.480	11	AGGAGG	GENOMAD.004833.VV	1.671e-45	171	0	0	1	2561	Caudoviricetes	NA	NA	PF04865;COG3299	Baseplate J-like protein
+NC_018515.1|provirus_3418112_3436097_3139	3425949	3426350	402	-1	0.440	11	AGxAGG/AGGxGG	GENOMAD.016318.VV	3.473e-37	137	0	0	0	2561	Caudoviricetes	NA	NA	PF10934;COG4381;TIGR03357	Mu-like prophage protein gp46
+NC_018515.1|provirus_3418112_3436097_3140	3426347	3426703	357	-1	0.457	11	GGA/GAG/AGG	GENOMAD.020599.VV	1.753e-21	91	0	0	0	2561	Caudoviricetes	NA	NA	PF10844	NA
+NC_018515.1|provirus_3418112_3436097_3141	3426703	3427689	987	-1	0.443	11	AGGAGG	GENOMAD.018966.VV	5.985e-106	346	0	0	1	2561	Caudoviricetes	NA	NA	PF14594;COG4379;TIGR03361;K06905	Mu-like prophage tail protein gpP
+NC_018515.1|provirus_3418112_3436097_3142	3427706	3428368	663	-1	0.448	11	AGxAGG/AGGxGG	GENOMAD.015578.VV	2.506e-23	101	0	0	0	2561	Caudoviricetes	NA	NA	PF06995;COG1652	Nucleoid-associated protein YgaU, contains BON and LysM domains
+NC_018515.1|provirus_3418112_3436097_3143	3428368	3430056	1689	-1	0.436	11	AGGAGG	GENOMAD.032671.VV	1.142e-122	406	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3144	3430684	3431106	423	-1	0.437	11	GGAGG	GENOMAD.001212.VV	8.9e-47	165	0	0	1	2561	Caudoviricetes	NA	NA	PF08890	Phage XkdN-like tail assembly chaperone protein, TAC
+NC_018515.1|provirus_3418112_3436097_3145	3431161	3431628	468	-1	0.459	11	GGA/GAG/AGG	GENOMAD.011307.VV	3.196e-73	242	0	0	1	2561	Caudoviricetes	NA	NA	PF09393	Phage tail tube protein
+NC_018515.1|provirus_3418112_3436097_3146	3431632	3432948	1317	-1	0.455	11	GGAGG	GENOMAD.013578.VV	4.449e-94	317	0	0	1	2561	Caudoviricetes	NA	NA	PF17481;PF04984;PF17482;COG4386	Mu-like prophage tail sheath protein gpL
+NC_018515.1|provirus_3418112_3436097_3147	3432950	3433132	183	-1	0.388	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3148	3433125	3433544	420	-1	0.448	11	AGGAG	GENOMAD.023771.VV	1.411e-24	101	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3149	3434218	3434688	471	-1	0.410	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3150	3435000	3435596	597	1	0.405	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_3418112_3436097_3151	3435618	3436097	480	1	0.352	11	AGGAG	GENOMAD.123021.VV	8.264e-31	120	0	0	0	2561	Caudoviricetes	NA	NA	PF06114;COG2856	IrrE N-terminal-like domain
+NC_018515.1|provirus_4659544_4694673_4266	4659544	4659789	246	-1	0.398	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4267	4659786	4660568	783	-1	0.415	11	AGGAGG	GENOMAD.053051.VV	3.635e-13	72	0	0	0	2561	Caudoviricetes	NA	NA	PF10772;PF02086;TIGR00571;COG0338	Bacteriophage HP1, Orf24; D12 class N6 adenine-specific DNA methyltransferase
+NC_018515.1|provirus_4659544_4694673_4268	4660808	4661533	726	1	0.310	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4269	4661559	4662848	1290	-1	0.354	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4270	4662851	4663681	831	-1	0.357	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4271	4663834	4664334	501	-1	0.435	11	AGGAGG	GENOMAD.220913.VP	9.323e-12	65	0	0	1	2561	Caudoviricetes	NA	NA	PF09682;TIGR01673	Bacteriophage holin of superfamily 6 (Holin_LLH)
+NC_018515.1|provirus_4659544_4694673_4272	4664379	4665224	846	-1	0.488	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4273	4665235	4665600	366	-1	0.413	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4274	4665683	4665937	255	-1	0.412	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4275	4666125	4666301	177	-1	0.429	11	GGAGG	GENOMAD.202651.VV	1.242e-28	108	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4276	4666298	4666576	279	-1	0.423	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4277	4666573	4667667	1095	-1	0.525	11	GGAG/GAGG	GENOMAD.135924.VV	5.173e-50	185	0	0	0	4312	Hafunaviridae	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4278	4667682	4669058	1377	-1	0.439	11	GGAG/GAGG	GENOMAD.007293.VV	1.173e-76	267	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4279	4669065	4670156	1092	-1	0.412	11	GGxGG	GENOMAD.006687.VV	4.266e-78	267	0	0	1	2561	Caudoviricetes	NA	NA	PF14594;COG4926;TIGR01665	Siphovirus ReqiPepy6 Gp37-like protein
+NC_018515.1|provirus_4659544_4694673_4280	4670159	4671022	864	-1	0.403	11	AGxAGG/AGGxGG	GENOMAD.009232.VV	5.496e-87	289	0	0	0	2561	Caudoviricetes	NA	NA	PF16774;COG4722;TIGR01633	Phage-related protein
+NC_018515.1|provirus_4659544_4694673_4281	4671033	4673771	2739	-1	0.449	11	None	GENOMAD.110013.VP	2.08e-93	332	0	0	1	2561	Caudoviricetes	NA	NA	COG5280	Phage-related minor tail protein
+NC_018515.1|provirus_4659544_4694673_4282	4673768	4673995	228	-1	0.430	11	None	GENOMAD.095592.VV	3.087e-06	45	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4283	4674073	4674399	327	-1	0.404	11	GGAGG	GENOMAD.044337.VV	2.719e-52	179	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4284	4674442	4675005	564	-1	0.502	11	GGA/GAG/AGG	GENOMAD.009652.VV	1.45e-80	265	0	0	1	2561	Caudoviricetes	NA	NA	TIGR01537	NA
+NC_018515.1|provirus_4659544_4694673_4285	4675011	4675370	360	-1	0.444	11	AGGAGG	GENOMAD.058243.VV	1.023e-51	178	0	0	1	2561	Caudoviricetes	NA	NA	PF11367	NA
+NC_018515.1|provirus_4659544_4694673_4286	4675367	4675792	426	-1	0.465	11	GGxGG	GENOMAD.072075.VV	6.875e-16	76	0	0	1	2561	Caudoviricetes	NA	NA	PF11114;TIGR01725;COG5005	phage protein, HK97 gp10 family
+NC_018515.1|provirus_4659544_4694673_4287	4675793	4676104	312	-1	0.458	11	GGA/GAG/AGG	GENOMAD.008635.VV	1.997e-29	113	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;TIGR01563;COG5614	phage head-tail adaptor, putative, SPP1 family
+NC_018515.1|provirus_4659544_4694673_4288	4676101	4676370	270	-1	0.393	11	GGAG/GAGG	GENOMAD.053459.VV	1.209e-43	153	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4289	4676371	4676568	198	-1	0.455	11	GGxGG	GENOMAD.188189.VV	3.555e-29	110	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4290	4676592	4677815	1224	-1	0.483	11	AGGAGG	GENOMAD.088359.VV	4.366e-19	93	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;PF18316;PF17078;TIGR01554;COG4653	phage major capsid protein, HK97 family
+NC_018515.1|provirus_4659544_4694673_4291	4677854	4678474	621	-1	0.470	11	AGGAGG	GENOMAD.116539.VV	2.017e-19	89	0	0	1	2561	Caudoviricetes	NA	NA	PF04586;PF05065;K06904;COG3740;TIGR01543	Phage head maturation protease
+NC_018515.1|provirus_4659544_4694673_4292	4678428	4679657	1230	-1	0.460	11	GGAG/GAGG	GENOMAD.003590.VV	9.884e-09	60	0	0	1	2561	Caudoviricetes	NA	NA	PF04860;TIGR01537;COG4695	phage portal protein, HK97 family
+NC_018515.1|provirus_4659544_4694673_4293	4679878	4681632	1755	-1	0.471	11	AGxAGG/AGGxGG	GENOMAD.194580.VP	2.855e-27	121	0	0	1	2561	Caudoviricetes	NA	NA	PF03354;PF05521;PF20441;COG4626;TIGR01563	Phage terminase-like protein, large subunit, contains N-terminal HTH domain
+NC_018515.1|provirus_4659544_4694673_4294	4681625	4682008	384	-1	0.464	11	GGAGG	GENOMAD.092852.VV	8.987e-49	170	0	0	1	2561	Caudoviricetes	NA	NA	TIGR01558	NA
+NC_018515.1|provirus_4659544_4694673_4295	4682094	4682456	363	-1	0.394	11	AGGA/GGAG/GAGG	GENOMAD.080571.VV	4.962e-76	248	0	0	0	11831	Demerecviridae	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4296	4683479	4684264	786	1	0.359	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4297	4684476	4685324	849	1	0.269	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4298	4685564	4686076	513	-1	0.454	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4299	4686432	4686794	363	-1	0.501	11	AGGAG(G)/GGAGG	GENOMAD.151656.VP	8.696e-38	138	0	0	1	2561	Caudoviricetes	NA	NA	PF17288;K06909;TIGR01547;COG1783	phage terminase, large subunit, PBSX family
+NC_018515.1|provirus_4659544_4694673_4300	4686791	4687312	522	-1	0.454	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4301	4687336	4688310	975	-1	0.463	11	AGGAGG	GENOMAD.017981.VV	2.221e-42	161	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4302	4688325	4688492	168	-1	0.494	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4303	4688511	4689254	744	-1	0.440	11	GGA/GAG/AGG	GENOMAD.129273.VC	1.957e-41	155	0	0	0	2561	Caudoviricetes	NA	NA	PF12706;TIGR02651;COG1234;K06167	ribonuclease Z
+NC_018515.1|provirus_4659544_4694673_4304	4689256	4690083	828	-1	0.447	11	AGGAGG	GENOMAD.121864.VP	4.873e-26	111	0	0	0	2561	Caudoviricetes	NA	NA	PF03837;COG3723;K07455;TIGR00616	Recombinational DNA repair protein RecT
+NC_018515.1|provirus_4659544_4694673_4305	4690183	4690290	108	-1	0.426	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4306	4690287	4692251	1965	-1	0.439	11	GGA/GAG/AGG	GENOMAD.182234.VP	4.932e-58	218	0	0	0	2561	Caudoviricetes	NA	NA	PF13175;TIGR00634;COG1195;K03546	DNA repair protein RecN
+NC_018515.1|provirus_4659544_4694673_4307	4692248	4692634	387	-1	0.429	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4308	4692650	4692922	273	-1	0.502	11	None	GENOMAD.199250.VV	1.281e-05	44	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4309	4692957	4693220	264	-1	0.432	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4310	4693210	4693476	267	-1	0.449	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4311	4693491	4693604	114	-1	0.465	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4312	4693681	4693836	156	-1	0.436	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_018515.1|provirus_4659544_4694673_4313	4693815	4694144	330	-1	0.415	11	None	GENOMAD.169643.VC	1.05e-06	48	0	0	1	1	NA	NA	NA	PF11242;TIGR02612;COG4197;K22299	mobile mystery protein A
+NC_018515.1|provirus_4659544_4694673_4314	4694266	4694673	408	1	0.395	11	AGGAGG	GENOMAD.053307.VV	0.0005741	41	0	0	0	2561	Caudoviricetes	NA	NA	PF13744;COG3655;TIGR02612;K18830	DNA-binding transcriptional regulator, XRE family
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_019897.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_019904.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_019936.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,50 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_019936.1|provirus_2347508_2361929_2122	2347508	2347720	213	-1	0.521	11	GGAG/GAGG	GENOMAD.221461.VP	1.082e-35	129	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2123	2347848	2349110	1263	1	0.571	11	GGA/GAG/AGG	GENOMAD.223897.VP	6.327e-42	163	0	0	0	8016	Inoviridae	NA	NA	PF05155	Phage X family
+NC_019936.1|provirus_2347508_2361929_2124	2349110	2349256	147	1	0.510	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2125	2349354	2349698	345	1	0.528	11	GGAG/GAGG	GENOMAD.215295.VP	5.435e-24	98	0	0	0	8016	Inoviridae	NA	NA	PF17426	Putative Gamma DNA binding protein G5P
+NC_019936.1|provirus_2347508_2361929_2126	2349942	2350088	147	1	0.565	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2127	2350223	2351734	1512	1	0.511	11	GGAGG	GENOMAD.222416.VP	9.094e-24	109	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2128	2351737	2352003	267	1	0.532	11	GGAGG	GENOMAD.197598.VP	3.988e-31	117	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2129	2352007	2353200	1194	1	0.550	11	None	GENOMAD.056690.VV	1.152e-05	50	0	0	1	8016	Inoviridae	NA	NA	PF05707;COG4128;K10954	Zona occludens toxin, predicted ATPase
+NC_019936.1|provirus_2347508_2361929_2130	2353258	2353545	288	-1	0.587	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2131	2353940	2354152	213	-1	0.521	11	GGAG/GAGG	GENOMAD.221461.VP	1.082e-35	129	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2132	2354280	2355542	1263	1	0.571	11	GGA/GAG/AGG	GENOMAD.223897.VP	6.327e-42	163	0	0	0	8016	Inoviridae	NA	NA	PF05155	Phage X family
+NC_019936.1|provirus_2347508_2361929_2133	2355542	2355688	147	1	0.510	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2134	2355786	2356130	345	1	0.528	11	GGAG/GAGG	GENOMAD.215295.VP	5.435e-24	98	0	0	0	8016	Inoviridae	NA	NA	PF17426	Putative Gamma DNA binding protein G5P
+NC_019936.1|provirus_2347508_2361929_2135	2356374	2356520	147	1	0.565	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2136	2356655	2358166	1512	1	0.511	11	GGAGG	GENOMAD.222416.VP	9.094e-24	109	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2137	2358169	2358435	267	1	0.532	11	GGAGG	GENOMAD.197598.VP	3.988e-31	117	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2138	2358439	2359632	1194	1	0.550	11	None	GENOMAD.056690.VV	1.152e-05	50	0	0	1	8016	Inoviridae	NA	NA	PF05707;COG4128;K10954	Zona occludens toxin, predicted ATPase
+NC_019936.1|provirus_2347508_2361929_2139	2359690	2359977	288	-1	0.587	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2140	2360944	2361303	360	1	0.511	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2141	2361300	2361584	285	1	0.586	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_2347508_2361929_2142	2361642	2361929	288	-1	0.587	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2952	3233292	3234299	1008	-1	0.619	11	None	GENOMAD.212346.VP	4.357e-26	113	0	0	1	2561	Caudoviricetes	NA	NA	PF16452;PF06892;COG1974	Bacteriophage CI repressor C-terminal domain; Phage regulatory protein CII (CP76)
+NC_019936.1|provirus_3233292_3242961_2953	3234281	3235558	1278	-1	0.596	11	GGAG/GAGG	GENOMAD.226808.VP	8.692e-257	787	0	0	0	8016	Inoviridae	NA	NA	PF02486	Replication initiation factor
+NC_019936.1|provirus_3233292_3242961_2954	3235706	3236890	1185	-1	0.617	11	AGGAG	GENOMAD.090645.VV	1.347e-06	53	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2955	3236903	3237229	327	-1	0.572	11	AGGAG	GENOMAD.224290.VP	3.685e-65	216	0	0	0	1	NA	NA	NA	PF10734	NA
+NC_019936.1|provirus_3233292_3242961_2956	3237229	3238722	1494	-1	0.586	11	GGxGG	GENOMAD.222416.VP	3.831e-276	847	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2957	3238725	3238853	129	-1	0.558	11	3Base/5BMM	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2958	3238873	3239082	210	-1	0.638	11	GGAG/GAGG	GENOMAD.224287.VP	6.332e-33	121	0	0	1	1	NA	NA	NA	PF05356	Inovirus Coat protein B
+NC_019936.1|provirus_3233292_3242961_2959	3239093	3239308	216	-1	0.597	11	AGxAGG/AGGxGG	GENOMAD.225528.VP	1.222e-42	149	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2960	3239305	3239484	180	-1	0.672	11	GGAGG	GENOMAD.226094.VP	6.522e-28	106	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2961	3239500	3239859	360	-1	0.611	11	GGAG/GAGG	GENOMAD.225482.VP	6.187e-49	170	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2962	3240152	3240922	771	-1	0.641	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2963	3240938	3241081	144	-1	0.660	11	GGxGG	GENOMAD.213484.VP	1.701e-13	64	0	0	0	2561	Caudoviricetes	NA	NA	PF05509;COG4877	Plasmid stability protein
+NC_019936.1|provirus_3233292_3242961_2964	3241086	3241229	144	-1	0.611	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2965	3241226	3241441	216	-1	0.616	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_3233292_3242961_2966	3241921	3242961	1041	1	0.386	11	AGGA/GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_4295725_4304306_3986	4295725	4295985	261	-1	0.567	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_4295725_4304306_3987	4296137	4296352	216	1	0.574	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_4295725_4304306_3988	4296349	4296930	582	1	0.662	11	AGGAG	GENOMAD.226428.VP	0.0008059	42	0	0	0	8016	Inoviridae	NA	NA	PF17525	NA
+NC_019936.1|provirus_4295725_4304306_3989	4297106	4297477	372	1	0.597	11	GGAG/GAGG	GENOMAD.225482.VP	2.427e-28	111	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_4295725_4304306_3990	4297493	4297672	180	1	0.644	11	GGAGG	GENOMAD.226094.VP	7.27e-27	103	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_4295725_4304306_3991	4297669	4297884	216	1	0.588	11	AGxAGG/AGGxGG	GENOMAD.225528.VP	1.222e-42	149	0	0	0	1	NA	NA	NA	NA	NA
+NC_019936.1|provirus_4295725_4304306_3992	4297895	4298104	210	1	0.657	11	GGAG/GAGG	GENOMAD.224287.VP	5.695e-34	124	0	0	1	1	NA	NA	NA	PF05356	Inovirus Coat protein B
+NC_019936.1|provirus_4295725_4304306_3993	4298256	4299749	1494	1	0.583	11	GGxGG	GENOMAD.222416.VP	3.831e-276	847	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_4295725_4304306_3994	4299749	4300075	327	1	0.566	11	AGGAG	GENOMAD.224290.VP	3.685e-65	216	0	0	0	1	NA	NA	NA	PF10734	NA
+NC_019936.1|provirus_4295725_4304306_3995	4300088	4301272	1185	1	0.619	11	AGGAG	GENOMAD.090645.VV	5.588e-06	51	0	0	0	8016	Inoviridae	NA	NA	NA	NA
+NC_019936.1|provirus_4295725_4304306_3996	4301420	4302700	1281	1	0.596	11	GGAG/GAGG	GENOMAD.226808.VP	9.102e-257	787	0	0	0	8016	Inoviridae	NA	NA	PF02486	Replication initiation factor
+NC_019936.1|provirus_4295725_4304306_3997	4302682	4303740	1059	1	0.590	11	AGGA/GGAG/GAGG	GENOMAD.212346.VP	6.393e-29	122	0	0	1	2561	Caudoviricetes	NA	NA	PF16452;PF06892;COG1974	Bacteriophage CI repressor C-terminal domain; Phage regulatory protein CII (CP76)
+NC_019936.1|provirus_4295725_4304306_3998	4303989	4304306	318	1	0.613	11	AGGAG	GENOMAD.200462.VV	1.519e-09	56	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_genes/NC_021184.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,144 @@
+gene	start	end	length	strand	gc_content	genetic_code	rbs_motif	marker	evalue	bitscore	uscg	plasmid_hallmark	virus_hallmark	taxid	taxname	annotation_conjscan	annotation_amr	annotation_accessions	annotation_description
+NC_021184.1|provirus_19778_35564_13	19778	21046	1269	1	0.465	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_14	21861	23045	1185	-1	0.483	11	AGGAG	GENOMAD.016861.VV	4.71e-05	48	0	0	0	2561	Caudoviricetes	NA	NA	PF13671;COG2019;TIGR01359;K13829	AAA domain
+NC_021184.1|provirus_19778_35564_15	23045	23500	456	-1	0.342	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_16	23641	23904	264	1	0.481	11	AGxAGG/AGGxGG	GENOMAD.221988.VV	2.546e-05	43	0	0	0	1	NA	NA	NA	PF06806;COG3311;TIGR01764	Predicted DNA-binding transcriptional regulator AlpA
+NC_021184.1|provirus_19778_35564_17	23960	24580	621	1	0.435	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_18	24568	25845	1278	1	0.462	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_19	26129	26368	240	1	0.412	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_20	26390	26560	171	1	0.532	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_21	26565	26771	207	1	0.449	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_22	26935	27291	357	1	0.409	11	AGxAGG/AGGxGG	GENOMAD.096257.VV	5.932e-08	52	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_23	27269	27457	189	1	0.434	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_24	27482	28054	573	1	0.447	11	AGxAGG/AGGxGG	GENOMAD.103011.VV	5.601e-31	122	0	0	1	2561	Caudoviricetes	NA	NA	PF04586;COG3740;K06904;TIGR01543	Phage head maturation protease
+NC_021184.1|provirus_19778_35564_25	28056	29300	1245	1	0.491	11	AGGAGG	GENOMAD.113164.VP	4.496e-51	190	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;COG5614;TIGR01563	Bacteriophage head-tail adaptor
+NC_021184.1|provirus_19778_35564_26	29533	31557	2025	1	0.486	11	GGAG/GAGG	GENOMAD.110013.VP	2.142e-73	265	0	0	1	2561	Caudoviricetes	NA	NA	COG5280	Phage-related minor tail protein
+NC_021184.1|provirus_19778_35564_27	31554	32714	1161	1	0.414	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_28	32727	33191	465	-1	0.391	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_29	33713	34003	291	1	0.405	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_30	34327	34608	282	-1	0.465	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_31	34601	34831	231	-1	0.390	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_32	35121	35261	141	1	0.411	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_33	35242	35364	123	1	0.398	11	AGGAG/GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_19778_35564_34	35394	35564	171	1	0.380	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4217	4466413	4467399	987	1	0.396	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4218	4467522	4470317	2796	1	0.406	11	None	GENOMAD.104116.VV	8.672e-09	62	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4219	4471023	4471277	255	-1	0.451	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4220	4471243	4473018	1776	-1	0.420	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4221	4473008	4473463	456	-1	0.384	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4222	4473456	4474466	1011	-1	0.409	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4223	4474820	4475086	267	1	0.416	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4224	4475312	4475857	546	1	0.419	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4225	4475973	4476248	276	1	0.457	11	GGA/GAG/AGG	GENOMAD.222700.VP	1.456e-50	173	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4226	4476302	4477498	1197	1	0.426	11	3Base/5BMM	GENOMAD.014802.VV	5.286e-15	80	0	0	0	2561	Caudoviricetes	NA	NA	PF00176;K20093;COG1061;TIGR04095	Superfamily II DNA or RNA helicase
+NC_021184.1|provirus_4466413_4519129_4227	4477794	4479494	1701	1	0.453	11	AGGAGG	GENOMAD.016341.VV	2.929e-155	501	0	0	1	2561	Caudoviricetes	NA	NA	PF13479;PF12684;TIGR01618;K07465;COG1468	phage nucleotide-binding protein
+NC_021184.1|provirus_4466413_4519129_4228	4479516	4479968	453	1	0.413	11	AGGAGG	GENOMAD.031678.VV	1.272e-30	119	0	0	0	2561	Caudoviricetes	NA	NA	PF05037	NA
+NC_021184.1|provirus_4466413_4519129_4229	4479970	4481664	1695	1	0.436	11	AGxAGG/AGGxGG	GENOMAD.102034.VP	2.19e-113	379	0	0	0	2561	Caudoviricetes	NA	NA	TIGR01636	NA
+NC_021184.1|provirus_4466413_4519129_4230	4481661	4482314	654	1	0.428	11	AGGA	GENOMAD.171549.VP	2.774e-19	89	0	0	0	2561	Caudoviricetes	NA	NA	COG3617	Prophage antirepressor
+NC_021184.1|provirus_4466413_4519129_4231	4482602	4484512	1911	1	0.425	11	GGAG/GAGG	GENOMAD.024099.VV	5.934e-52	199	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4232	4484713	4485057	345	1	0.507	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4233	4485047	4485271	225	1	0.418	11	GGAGG	GENOMAD.212426.VP	2.242e-30	114	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4234	4485261	4485629	369	1	0.455	11	GGAGG	GENOMAD.159035.VP	2.564e-27	108	0	0	0	2561	Caudoviricetes	NA	NA	PF07374;TIGR01636;COG2739	phage transcriptional activator, RinA family
+NC_021184.1|provirus_4466413_4519129_4235	4485801	4486007	207	1	0.435	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4236	4486094	4486492	399	1	0.501	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4237	4486710	4486982	273	-1	0.410	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4238	4486969	4487244	276	-1	0.435	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4239	4487505	4488899	1395	1	0.507	11	AGGAGG	GENOMAD.005053.VV	3.055e-18	91	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4240	4488903	4490126	1224	1	0.455	11	AGGAGG	GENOMAD.038338.VV	3.758e-27	118	0	0	0	2561	Caudoviricetes	NA	NA	COG3392	NA
+NC_021184.1|provirus_4466413_4519129_4241	4490195	4490959	765	1	0.492	11	AGGAGG	GENOMAD.105515.VV	3.381e-15	78	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4242	4490960	4491148	189	1	0.471	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4243	4491287	4492195	909	1	0.528	11	AGxAGG/AGGxGG	GENOMAD.105515.VV	1.222e-10	65	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4244	4492256	4492594	339	1	0.475	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4245	4492686	4493117	432	1	0.509	11	AGxAGG/AGGxGG	GENOMAD.191984.VP	5.92e-08	53	0	0	0	2561	Caudoviricetes	NA	NA	PF07128	NA
+NC_021184.1|provirus_4466413_4519129_4246	4493183	4493389	207	1	0.444	11	AGxAGG/AGGxGG	GENOMAD.225559.VP	7.754e-16	72	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4247	4493440	4493913	474	1	0.502	11	GGAGG	GENOMAD.168120.VP	1.382e-13	70	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_021184.1|provirus_4466413_4519129_4248	4493942	4495498	1557	1	0.489	11	GGAGG	GENOMAD.181434.VP	5.884e-56	208	0	0	1	2561	Caudoviricetes	NA	NA	PF20441	Terminase large subunit, endonuclease domain
+NC_021184.1|provirus_4466413_4519129_4249	4495568	4495879	312	1	0.356	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4250	4495869	4496198	330	1	0.348	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4251	4496274	4497509	1236	1	0.493	11	AGGAG(G)/GGAGG	GENOMAD.179073.VP	1.101e-41	162	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4252	4497502	4498215	714	1	0.475	11	AGGAGG	GENOMAD.028909.VV	1.007e-19	91	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR01560	Phage gp6-like head-tail connector protein
+NC_021184.1|provirus_4466413_4519129_4253	4498222	4499157	936	1	0.495	11	GGAGG	GENOMAD.168658.VV	2.457e-20	95	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;PF04586;PF12518;COG4653;TIGR01554;K06904	Predicted phage phi-C31 gp36 major capsid-like protein
+NC_021184.1|provirus_4466413_4519129_4254	4499866	4501686	1821	1	0.440	11	3Base/5BMM	GENOMAD.036196.VV	0.0007312	45	0	0	0	2561	Caudoviricetes	NA	NA	PF01824	MatK/TrnK amino terminal region
+NC_021184.1|provirus_4466413_4519129_4255	4501705	4502046	342	1	0.523	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4256	4502057	4502743	687	1	0.504	11	GGA/GAG/AGG	GENOMAD.111513.VV	1.908e-15	78	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4257	4502765	4503067	303	1	0.439	11	GGAGG	GENOMAD.041843.VV	4.112e-13	66	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR01560	Phage gp6-like head-tail connector protein
+NC_021184.1|provirus_4466413_4519129_4258	4503067	4503399	333	1	0.477	11	GGA/GAG/AGG	GENOMAD.142742.VP	1.864e-17	79	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;COG5614;TIGR01563	Bacteriophage head-tail adaptor
+NC_021184.1|provirus_4466413_4519129_4259	4503392	4503763	372	1	0.503	11	GGAGG	GENOMAD.137411.VP	1.962e-22	94	0	0	1	2561	Caudoviricetes	NA	NA	PF11114;TIGR01725;COG5005	phage protein, HK97 gp10 family
+NC_021184.1|provirus_4466413_4519129_4260	4503760	4504086	327	1	0.407	11	AGxAGG/AGGxGG	GENOMAD.018077.VV	6.075e-44	155	0	0	0	2561	Caudoviricetes	NA	NA	PF05657	NA
+NC_021184.1|provirus_4466413_4519129_4261	4504087	4504653	567	1	0.487	11	AGGAGG	GENOMAD.003250.VV	2.873e-56	195	0	0	1	2561	Caudoviricetes	NA	NA	PF04630;TIGR01603	phage major tail protein, phi13 family
+NC_021184.1|provirus_4466413_4519129_4262	4504658	4504957	300	1	0.453	11	GGAGG	GENOMAD.063000.VV	7.958e-45	157	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4263	4504969	4505124	156	1	0.378	11	GGAG/GAGG	GENOMAD.108553.VV	1.339e-24	96	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4264	4505209	4505475	267	1	0.333	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4265	4505462	4505782	321	1	0.293	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4266	4505833	4509261	3429	1	0.498	11	AGxAGG/AGGxGG	GENOMAD.181727.VP	1.385e-58	226	0	0	1	2561	Caudoviricetes	NA	NA	COG5280	Phage-related minor tail protein
+NC_021184.1|provirus_4466413_4519129_4267	4509272	4510123	852	1	0.472	11	AGGAGG	GENOMAD.008827.VV	2.998e-171	532	0	0	0	2561	Caudoviricetes	NA	NA	PF20195;COG4722;TIGR01633	Phage-related protein
+NC_021184.1|provirus_4466413_4519129_4268	4510138	4511208	1071	1	0.486	11	AGGAG	GENOMAD.007754.VV	4.216e-63	223	0	0	1	2561	Caudoviricetes	NA	NA	PF08931	Receptor-binding protein of phage tail base-plate Siphoviridae, head
+NC_021184.1|provirus_4466413_4519129_4269	4511210	4512007	798	1	0.501	11	GGAGG	GENOMAD.078804.VV	2.471e-67	231	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4270	4512000	4513862	1863	1	0.436	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4271	4513877	4514155	279	1	0.502	11	AGGAGG	GENOMAD.169028.VV	1.692e-49	170	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4272	4514155	4514295	141	1	0.468	11	GGAGG	GENOMAD.166984.VP	1.613e-13	64	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4273	4514369	4515079	711	1	0.332	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4274	4515106	4516203	1098	1	0.476	11	GGAG/GAGG	GENOMAD.006687.VV	1.779e-36	145	0	0	1	2561	Caudoviricetes	NA	NA	PF14594;COG4926;TIGR01665	Siphovirus ReqiPepy6 Gp37-like protein
+NC_021184.1|provirus_4466413_4519129_4275	4516251	4516661	411	1	0.448	11	AGxAGG/AGGxGG	GENOMAD.083633.VV	1.122e-06	49	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4276	4516654	4517340	687	1	0.483	11	GGAGG	GENOMAD.058849.VV	0.0002819	44	0	0	0	2561	Caudoviricetes	NA	NA	PF01520;COG0860;TIGR02883	N-acetylmuramoyl-L-alanine amidase
+NC_021184.1|provirus_4466413_4519129_4277	4517472	4518329	858	1	0.480	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4466413_4519129_4278	4518344	4519129	786	1	0.485	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4319	4563831	4564775	945	-1	0.388	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4320	4565036	4565629	594	-1	0.325	11	AGxAGG/AGGxGG	GENOMAD.221500.PV	0.0001909	44	0	0	0	1	NA	NA	NA	PF19503	NA
+NC_021184.1|provirus_4563831_4615358_4321	4567530	4570109	2580	-1	0.437	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4322	4570230	4570469	240	-1	0.358	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4323	4570482	4570748	267	-1	0.382	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4324	4570820	4571578	759	-1	0.484	11	AGGAG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4325	4571594	4572604	1011	-1	0.459	11	3Base/5BMM	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4326	4572601	4573257	657	-1	0.492	11	AGGAGG	GENOMAD.055867.VV	1.36e-18	87	0	0	0	2561	Caudoviricetes	NA	NA	COG5632	N-acetylmuramoyl-L-alanine amidase CwlA
+NC_021184.1|provirus_4563831_4615358_4327	4573241	4573663	423	-1	0.449	11	AGxAGG/AGGxGG	GENOMAD.083633.VV	1.257e-06	49	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4328	4573711	4574808	1098	-1	0.476	11	AGGA/GGAG/GAGG	GENOMAD.006687.VV	8.567e-33	134	0	0	1	2561	Caudoviricetes	NA	NA	PF14594;COG4926;TIGR01665	Siphovirus ReqiPepy6 Gp37-like protein
+NC_021184.1|provirus_4563831_4615358_4329	4574832	4574972	141	-1	0.504	11	AGGAGG	GENOMAD.166984.VP	1.819e-12	61	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4330	4574972	4575250	279	-1	0.477	11	GGAGG	GENOMAD.169028.VV	3.079e-51	175	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4331	4575265	4577127	1863	-1	0.430	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4332	4577120	4577917	798	-1	0.490	11	GGAGG	GENOMAD.078804.VV	1.766e-71	243	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4333	4577919	4578995	1077	-1	0.476	11	AGGAGG	GENOMAD.007754.VV	1.197e-59	213	0	0	1	2561	Caudoviricetes	NA	NA	PF08931	Receptor-binding protein of phage tail base-plate Siphoviridae, head
+NC_021184.1|provirus_4563831_4615358_4334	4579010	4579861	852	-1	0.465	11	AGGAGG	GENOMAD.008827.VV	2.146e-166	518	0	0	0	2561	Caudoviricetes	NA	NA	PF20195;COG4722;TIGR01633	Phage-related protein
+NC_021184.1|provirus_4563831_4615358_4335	4579873	4583292	3420	-1	0.488	11	AGxAGG/AGGxGG	GENOMAD.207179.VP	1.909e-93	337	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;COG5283;TIGR01563	Phage-related tail protein
+NC_021184.1|provirus_4563831_4615358_4336	4583330	4583485	156	-1	0.410	11	GGA/GAG/AGG	GENOMAD.108553.VV	1.339e-24	96	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4337	4583497	4583790	294	-1	0.459	11	AGGAGG	GENOMAD.063000.VV	3.242e-45	158	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4338	4583794	4584600	807	-1	0.496	11	AGGAGG	GENOMAD.003250.VV	3.053e-56	199	0	0	1	2561	Caudoviricetes	NA	NA	PF04630;TIGR01603	phage major tail protein, phi13 family
+NC_021184.1|provirus_4563831_4615358_4339	4584601	4584927	327	-1	0.407	11	AGxAGG/AGGxGG	GENOMAD.018077.VV	6.075e-44	155	0	0	0	2561	Caudoviricetes	NA	NA	PF05657	NA
+NC_021184.1|provirus_4563831_4615358_4340	4584924	4585295	372	-1	0.508	11	GGAGG	GENOMAD.137411.VP	1.962e-22	94	0	0	1	2561	Caudoviricetes	NA	NA	PF11114;TIGR01725;COG5005	phage protein, HK97 gp10 family
+NC_021184.1|provirus_4563831_4615358_4341	4585288	4585620	333	-1	0.477	11	GGA/GAG/AGG	GENOMAD.142742.VP	1.686e-18	82	0	0	1	2561	Caudoviricetes	NA	NA	PF05521;COG5614;TIGR01563	Bacteriophage head-tail adaptor
+NC_021184.1|provirus_4563831_4615358_4342	4585620	4585922	303	-1	0.439	11	GGAGG	GENOMAD.041843.VV	4.112e-13	66	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR01560	Phage gp6-like head-tail connector protein
+NC_021184.1|provirus_4563831_4615358_4343	4585944	4586630	687	-1	0.505	11	GGA/GAG/AGG	GENOMAD.111513.VV	1.908e-15	78	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4344	4586641	4587825	1185	-1	0.499	11	GGAGG	GENOMAD.168658.VV	3.396e-31	130	0	0	1	2561	Caudoviricetes	NA	NA	PF05065;PF04586;PF12518;COG4653;TIGR01554;K06904	Predicted phage phi-C31 gp36 major capsid-like protein
+NC_021184.1|provirus_4563831_4615358_4345	4587832	4588530	699	-1	0.478	11	AGGAGG	GENOMAD.028909.VV	1.64e-23	102	0	0	1	2561	Caudoviricetes	NA	NA	PF05135;TIGR01560	Phage gp6-like head-tail connector protein
+NC_021184.1|provirus_4563831_4615358_4346	4588523	4589815	1293	-1	0.497	11	None	GENOMAD.179073.VP	7.993e-40	157	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4347	4589828	4590154	327	-1	0.401	11	AGGA	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4348	4590144	4590455	312	-1	0.426	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4349	4590525	4592081	1557	-1	0.482	11	GGAGG	GENOMAD.181434.VP	1.249e-57	213	0	0	1	2561	Caudoviricetes	NA	NA	PF20441	Terminase large subunit, endonuclease domain
+NC_021184.1|provirus_4563831_4615358_4350	4592110	4592583	474	-1	0.511	11	GGAGG	GENOMAD.168120.VP	1.382e-13	70	0	0	1	2561	Caudoviricetes	NA	NA	PF05119;COG3747;TIGR01558	Phage terminase, small subunit
+NC_021184.1|provirus_4563831_4615358_4351	4592638	4592844	207	-1	0.473	11	AGxAGG/AGGxGG	GENOMAD.225559.VP	7.754e-16	72	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4352	4592896	4593348	453	-1	0.510	11	AGxAGG/AGGxGG	GENOMAD.191984.VP	7.214e-08	53	0	0	0	2561	Caudoviricetes	NA	NA	PF07128	NA
+NC_021184.1|provirus_4563831_4615358_4353	4593440	4593778	339	-1	0.475	11	GGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4354	4593839	4594747	909	-1	0.530	11	AGxAGG/AGGxGG	GENOMAD.105515.VV	1.222e-10	65	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4355	4594886	4595074	189	-1	0.476	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4356	4595075	4595839	765	-1	0.498	11	AGGAGG	GENOMAD.105515.VV	7.138e-14	74	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4357	4595908	4597131	1224	-1	0.462	11	AGGAGG	GENOMAD.038338.VV	3.932e-28	121	0	0	0	2561	Caudoviricetes	NA	NA	COG3392	NA
+NC_021184.1|provirus_4563831_4615358_4358	4597135	4598529	1395	-1	0.491	11	AGGAGG	GENOMAD.005053.VV	3.988e-20	97	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4359	4598987	4599307	321	-1	0.505	11	GGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4360	4599480	4600436	957	-1	0.357	11	GGA/GAG/AGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4361	4600429	4601187	759	-1	0.362	11	None	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4362	4601556	4601987	432	-1	0.444	11	GGxGG	GENOMAD.159035.VP	1.815e-23	98	0	0	0	2561	Caudoviricetes	NA	NA	PF07374;TIGR01636;COG2739	phage transcriptional activator, RinA family
+NC_021184.1|provirus_4563831_4615358_4363	4601984	4602181	198	-1	0.424	11	AGGAGG	GENOMAD.212426.VP	2.201e-26	102	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4364	4602184	4603536	1353	-1	0.474	11	None	GENOMAD.116250.VP	4.087e-30	128	0	0	0	2561	Caudoviricetes	NA	NA	PF00270;COG1111;TIGR04095;K17677	ERCC4-related helicase
+NC_021184.1|provirus_4563831_4615358_4365	4603517	4603798	282	-1	0.454	11	AGGAGG	GENOMAD.004000.VV	3.23e-20	86	0	0	0	2561	Caudoviricetes	NA	NA	COG1591	NA
+NC_021184.1|provirus_4563831_4615358_4366	4603951	4606197	2247	-1	0.477	11	AGGAGG	GENOMAD.016441.VV	9.643e-11	68	0	0	0	2561	Caudoviricetes	NA	NA	TIGR01613	phage/plasmid primase, P4 family, C-terminal domain
+NC_021184.1|provirus_4563831_4615358_4367	4606225	4606872	648	-1	0.414	11	AGGAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4368	4606860	4607267	408	-1	0.529	11	GGAGG	GENOMAD.220271.VP	0.0002632	42	0	0	0	2561	Caudoviricetes	NA	NA	PF09152;COG3613;TIGR03646	Nucleoside 2-deoxyribosyltransferase
+NC_021184.1|provirus_4563831_4615358_4369	4607213	4607470	258	-1	0.496	11	AGGAGG	GENOMAD.159187.VV	1.664e-38	138	0	0	0	2561	Caudoviricetes	NA	NA	PF14205;TIGR02098;COG1996	MJ0042 family finger-like domain
+NC_021184.1|provirus_4563831_4615358_4370	4607722	4610022	2301	-1	0.501	11	AGGAG	GENOMAD.038590.VV	7.582e-125	421	0	0	0	2561	Caudoviricetes	NA	NA	PF00476;PF13482;K02334;COG0749;TIGR01388	DNA polymerase I - 3'-5' exonuclease and polymerase domains
+NC_021184.1|provirus_4563831_4615358_4371	4610081	4610638	558	-1	0.518	11	AGGAGG	GENOMAD.039702.VV	2.165e-40	149	0	0	0	2561	Caudoviricetes	NA	NA	PF10991	NA
+NC_021184.1|provirus_4563831_4615358_4372	4610652	4611773	1122	-1	0.529	11	GGAG/GAGG	GENOMAD.136786.VV	3.244e-49	183	0	0	0	2561	Caudoviricetes	NA	NA	PF10926;TIGR01896;COG2887;K07465	CRISPR-associated exonuclease Csa1
+NC_021184.1|provirus_4563831_4615358_4373	4611766	4612083	318	-1	0.494	11	GGAG/GAGG	GENOMAD.222352.VV	4.487e-22	92	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4374	4612061	4612222	162	-1	0.506	11	GGAGG	GENOMAD.116519.VV	3.339e-10	55	0	0	0	2561	Caudoviricetes	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4375	4612350	4612847	498	-1	0.448	11	GGA/GAG/AGG	GENOMAD.204246.VV	1.065e-07	53	0	0	0	2561	Caudoviricetes	NA	NA	PF03333;K01994;TIGR03879	Adhesin biosynthesis transcription regulatory protein
+NC_021184.1|provirus_4563831_4615358_4376	4613153	4615015	1863	-1	0.444	11	AGxAGG/AGGxGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
+NC_021184.1|provirus_4563831_4615358_4377	4615155	4615358	204	1	0.422	11	GGAG/GAGG	NA	NA	NA	0	0	0	1	NA	NA	NA	NA	NA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_000913.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,6 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_000913.3|provirus_1412000_1434224	22225	Provirus	1412000-1434224	28	11	0.9653	NA	4	27.1536	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_000913.3|provirus_2461306_2476510	15205	Provirus	2461306-2476510	19	11	0.9611	NA	2	18.3692	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_000913.3|provirus_1196867_1213107	16241	Provirus	1196867-1213107	24	11	0.9605	NA	6	22.4142	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_000913.3|provirus_563848_584430	20583	Provirus	563848-584430	30	11	0.9007	NA	6	14.4709	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_000913.3|provirus_1627517_1653915	26399	Provirus	1627517-1653915	42	11	0.8949	NA	4	21.7953	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_002737.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_002737.2|provirus_529627_569283	39657	Provirus	529627-569283	49	11	0.9801	NA	13	76.8805	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_002737.2|provirus_777501_820593	43093	Provirus	777501-820593	68	11	0.9796	NA	10	90.5047	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_002737.2|provirus_1186916_1222544	35629	Provirus	1186916-1222544	54	11	0.9770	NA	8	73.4096	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_003450.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_008261.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_008261.1|provirus_1784095_1821197	37103	Provirus	1784095-1821197	44	11	0.9669	NA	13	47.9680	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_008261.1|provirus_1070550_1127691	57142	Provirus	1070550-1127691	68	11	0.9536	NA	12	61.5635	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_009012.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_009012.1|provirus_2931283_2970170	38888	Provirus	2931283-2970170	62	11	0.9595	NA	14	62.6553	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_009012.1|provirus_1938476_1983993	45518	Provirus	1938476-1983993	52	11	0.9466	NA	14	58.8179	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_009012.1|provirus_2022140_2067593	45454	Provirus	2022140-2067593	55	11	0.9296	NA	12	56.7329	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_009012.1|provirus_3339258_3389049	49792	Provirus	3339258-3389049	53	11	0.9122	NA	2	13.1702	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_012982.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014008.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014168.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_014168.1|provirus_27479_67296	39818	Provirus	27479-67296	63	11	0.9641	NA	7	44.2001	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014168.1|provirus_1141631_1162952	21322	Provirus	1141631-1162952	35	11	0.9457	NA	7	27.6971	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014211.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014212.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_014212.1|provirus_1746722_1764354	17633	Provirus	1746722-1764354	38	11	0.9025	NA	1	16.7440	Viruses;Varidnaviria;Helvetiavirae;Dividoviricota;Laserviricetes;Halopanivirales;Sphaerolipoviridae
+NC_014212.1|provirus_1893193_1914973	21781	Provirus	1893193-1914973	33	11	0.8895	NA	5	22.1216	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014212.1|provirus_1170297_1209132	38836	Provirus	1170297-1209132	48	11	0.8869	NA	5	21.9558	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014363.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_014364.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_014364.1|provirus_2666253_2703772	37520	Provirus	2666253-2703772	56	11	0.9674	NA	8	31.3276	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014364.1|provirus_2976748_3014759	38012	Provirus	2976748-3014759	43	11	0.9540	NA	6	25.4448	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014364.1|provirus_2121424_2157334	35911	Provirus	2121424-2157334	42	11	0.9330	NA	8	27.2215	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_014364.1|provirus_2329685_2350621	20937	Provirus	2329685-2350621	28	11	0.8720	NA	4	13.7214	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_015761.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_015761.1|provirus_3084741_3115735	30995	Provirus	3084741-3115735	41	11	0.9788	NA	20	51.6697	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_015761.1|provirus_1007223_1045009	37787	Provirus	1007223-1045009	51	11	0.9585	NA	5	39.7532	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_015761.1|provirus_847397_862760	15364	Provirus	847397-862760	19	11	0.9561	NA	10	16.7146	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_017033.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_017033.1|provirus_1557694_1600481	42788	Provirus	1557694-1600481	71	11	0.9788	NA	11	61.4099	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_017033.1|provirus_1052334_1094910	42577	Provirus	1052334-1094910	66	11	0.9602	NA	20	58.7796	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_017033.1|provirus_2089294_2107522	18229	Provirus	2089294-2107522	25	11	0.9392	NA	1	11.4432	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_017095.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_018014.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_018068.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_018068.1|provirus_1361108_1399802	38695	Provirus	1361108-1399802	52	11	0.9631	NA	13	58.9401	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_018068.1|provirus_2072558_2098541	25984	Provirus	2072558-2098541	33	11	0.9473	NA	3	21.6083	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_018515.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_018515.1|provirus_3418112_3436097	17986	Provirus	3418112-3436097	25	11	0.9523	NA	6	32.1738	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_018515.1|provirus_4659544_4694673	35130	Provirus	4659544-4694673	49	11	0.9431	NA	14	45.8652	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_019897.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_019904.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_019936.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_019936.1|provirus_4295725_4304306	8582	Provirus	4295725-4304306	13	11	0.9664	NA	2	10.7145	Viruses;Monodnaviria;Loebvirae;Hofneiviricota;Faserviricetes;Tubulavirales;Inoviridae
+NC_019936.1|provirus_2347508_2361929	14422	Provirus	2347508-2361929	21	11	0.9596	NA	2	12.9957	Viruses;Monodnaviria;Loebvirae;Hofneiviricota;Faserviricetes;Tubulavirales;Inoviridae
+NC_019936.1|provirus_3233292_3242961	9670	Provirus	3233292-3242961	15	11	0.9092	NA	2	8.9242	Viruses;Monodnaviria;Loebvirae;Hofneiviricota;Faserviricetes;Tubulavirales;Inoviridae
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/genomad_virus_summary/NC_021184.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+seq_name	length	topology	coordinates	n_genes	genetic_code	virus_score	fdr	n_hallmarks	marker_enrichment	taxonomy
+NC_021184.1|provirus_4563831_4615358	51528	Provirus	4563831-4615358	59	11	0.9554	NA	11	60.5769	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_021184.1|provirus_4466413_4519129	52717	Provirus	4466413-4519129	62	11	0.9421	NA	12	58.6292	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
+NC_021184.1|provirus_19778_35564	15787	Provirus	19778-35564	22	11	0.9155	NA	3	8.5756	Viruses;Duplodnaviria;Heunggongvirae;Uroviricota;Caudoviricetes;;
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/gtdbtk.bac120.summary	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,23 @@
+user_genome	classification	closest_genome_reference	closest_genome_reference_radius	closest_genome_taxonomy	closest_genome_ani	closest_genome_af	closest_placement_reference	closest_placement_radius	closest_placement_taxonomy	closest_placement_ani	closest_placement_af	pplacer_taxonomy	classification_method	note	other_related_references(genome_id,species_name,radius,ANI,AF)	msa_percent	translation_table	red_value	warnings
+NC_000913.fasta	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli	GCF_003697165.2	95.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli	96.74	0.856	GCF_000026225.1	95.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii	91.54	0.56	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__	taxonomic classification defined by topology and ANI	N/A	GCF_000194175.1, s__Escherichia coli_F, 95.0, 95.46, 0.89; GCF_002965065.1, s__Escherichia sp002965065, 95.0, 94.52, 0.691; GCF_004211955.1, s__Escherichia sp004211955, 95.0, 93.12, 0.774; GCF_005843885.1, s__Escherichia sp005843885, 95.0, 92.76, 0.782; GCF_011881725.1, s__Escherichia coli_E, 95.0, 92.37, 0.807; GCF_029876145.1, s__Escherichia ruysiae, 95.0, 92.28, 0.788; GCF_014836715.1, s__Escherichia whittamii, 95.0, 91.78, 0.782; GCF_002900365.1, s__Escherichia marmotae, 95.0, 90.92, 0.738; GCF_000759775.1, s__Escherichia albertii, 95.0, 90.18, 0.68	98.47	11	N/A	N/A
+NC_002737.fasta	d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes	GCF_002055535.1	95.0	d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes	99.7	0.968	GCF_002055535.1	95.0	d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes	99.7	0.968	d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_900459225.1, s__Streptococcus dysgalactiae, 95.0, 88.16, 0.456; GCF_900636575.1, s__Streptococcus canis, 95.0, 86.81, 0.468	98.31	11	N/A	N/A
+NC_003450.fasta	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Corynebacterium;s__Corynebacterium glutamicum	GCF_000011325.1	95.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Corynebacterium;s__Corynebacterium glutamicum	100.0	1.0	GCF_000011325.1	95.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Corynebacterium;s__Corynebacterium glutamicum	100.0	1.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Corynebacterium;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_002355155.1, s__Corynebacterium suranareeae, 95.0, 86.55, 0.531; GCF_001643015.1, s__Corynebacterium crudilactis, 95.0, 84.07, 0.363; GCF_001277995.1, s__Corynebacterium deserti, 95.0, 83.77, 0.275	96.43	11	N/A	N/A
+NC_008261.fasta	d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens	GCF_000013285.1	95.0	d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens	100.0	1.0	GCF_000013285.1	95.0	d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens	100.0	1.0	d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_029258205.1, s__Sarcina sp029258205, 95.0, 92.75, 0.744; GCF_029267215.1, s__Sarcina sp029267215, 95.0, 84.03, 0.29	94.4	11	N/A	N/A
+NC_009012.fasta	d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum	GCF_000015865.1	95.0	d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum	100.0	1.0	GCF_000015865.1	95.0	d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum	100.0	1.0	d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000521465.1, s__Hungateiclostridium straminisolvens, 95.0, 84.49, 0.429; GCF_004102745.1, s__Hungateiclostridium mesophilum, 95.0, 81.39, 0.257	94.22	11	N/A	N/A
+NC_012982.fasta	d__Bacteria;p__Pseudomonadota;c__Alphaproteobacteria;o__Caulobacterales;f__Hyphomonadaceae;g__Hirschia;s__Hirschia baltica	GCF_000023785.1	95.0	d__Bacteria;p__Pseudomonadota;c__Alphaproteobacteria;o__Caulobacterales;f__Hyphomonadaceae;g__Hirschia;s__Hirschia baltica	100.0	1.0	GCF_000023785.1	95.0	d__Bacteria;p__Pseudomonadota;c__Alphaproteobacteria;o__Caulobacterales;f__Hyphomonadaceae;g__Hirschia;s__Hirschia baltica	100.0	1.0	d__Bacteria;p__Pseudomonadota;c__Alphaproteobacteria;o__Caulobacterales;f__Hyphomonadaceae;g__Hirschia;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	98.25	11	N/A	N/A
+NC_014008.fasta	d__Bacteria;p__Verrucomicrobiota;c__Verrucomicrobiae;o__Opitutales;f__Coraliomargaritaceae;g__Coraliomargarita;s__Coraliomargarita akajimensis	GCF_000025905.1	95.0	d__Bacteria;p__Verrucomicrobiota;c__Verrucomicrobiae;o__Opitutales;f__Coraliomargaritaceae;g__Coraliomargarita;s__Coraliomargarita akajimensis	100.0	1.0	GCF_000025905.1	95.0	d__Bacteria;p__Verrucomicrobiota;c__Verrucomicrobiae;o__Opitutales;f__Coraliomargaritaceae;g__Coraliomargarita;s__Coraliomargarita akajimensis	100.0	1.0	d__Bacteria;p__Verrucomicrobiota;c__Verrucomicrobiae;o__Opitutales;f__Coraliomargaritaceae;g__;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	90.76	11	N/A	N/A
+NC_014168.fasta	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus	GCF_000092825.1	95.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus	100.0	1.0	GCF_000092825.1	95.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus	100.0	1.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000185725.2, s__Segniliparus rugosus, 95.0, 80.18, 0.178	96.56	11	N/A	N/A
+NC_014211.fasta	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Streptosporangiales;f__Streptosporangiaceae;g__Nocardiopsis;s__Nocardiopsis dassonvillei	GCF_000092985.1	95.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Streptosporangiales;f__Streptosporangiaceae;g__Nocardiopsis;s__Nocardiopsis dassonvillei	100.0	1.0	GCF_000092985.1	95.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Streptosporangiales;f__Streptosporangiaceae;g__Nocardiopsis;s__Nocardiopsis dassonvillei	100.0	1.0	d__Bacteria;p__Actinomycetota;c__Actinomycetes;o__Streptosporangiales;f__Streptosporangiaceae;g__Nocardiopsis;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_012396365.1, s__Nocardiopsis alborubida, 95.0, 94.89, 0.822; GCA_000340945.1, s__Nocardiopsis synnemataformans, 95.0, 94.67, 0.838; GCA_002529455.1, s__Nocardiopsis fusca, 95.0, 93.48, 0.743; GCF_000341065.1, s__Nocardiopsis halotolerans, 95.0, 89.3, 0.575; GCF_001905145.1, s__Nocardiopsis sp001905145, 95.0, 89.08, 0.554; GCF_008638415.1, s__Nocardiopsis sinuspersici, 95.0, 88.61, 0.531; GCF_008638365.1, s__Nocardiopsis quinghaiensis, 95.0, 88.23, 0.498; GCF_009830945.1, s__Nocardiopsis sp009830945, 95.0, 87.99, 0.442; GCA_937957845.1, s__Nocardiopsis sp937957845, 95.0, 87.38, 0.277; GCF_026642255.1, s__Nocardiopsis nanhaiensis_A, 95.0, 86.06, 0.436; GCF_030271535.1, s__Nocardiopsis sp030271535, 95.0, 84.81, 0.338; GCF_013410755.1, s__Nocardiopsis aegyptia, 95.0, 84.69, 0.277; GCF_018316655.1, s__Nocardiopsis changdeensis, 95.0, 84.65, 0.301; GCF_000341125.1, s__Nocardiopsis lucentensis, 95.0, 84.45, 0.226; GCF_001279585.1, s__Nocardiopsis sp001279585, 95.0, 84.4, 0.267; GCA_018388625.1, s__Nocardiopsis eucommiae, 95.0, 84.39, 0.264; GCF_014201115.1, s__Nocardiopsis metallicus, 95.0, 84.3, 0.268; GCF_003634495.1, s__Nocardiopsis sp003634495, 95.0, 84.18, 0.288; GCF_030766825.1, s__Nocardiopsis sp030766825, 95.0, 84.18, 0.286; GCF_000341085.1, 
s__Nocardiopsis ganjiahuensis, 95.0, 84.16, 0.28; GCF_030555055.1, s__Nocardiopsis sp030555055, 95.0, 84.06, 0.267; GCF_024134545.1, s__Nocardiopsis exhalans, 95.08, 84.04, 0.267; GCF_900141985.1, s__Nocardiopsis flavescens, 95.0, 83.82, 0.272; GCF_003386285.1, s__Nocardiopsis sp003386285, 95.0, 83.73, 0.264; GCF_014651695.1, s__Nocardiopsis terrae, 95.0, 83.6, 0.27; GCF_014203695.1, s__Nocardiopsis algeriensis, 95.0, 83.59, 0.238; GCF_020741345.1, s__Nocardiopsis listeri_A, 95.0, 83.53, 0.202; GCF_000341225.1, s__Nocardiopsis alba, 95.0, 83.47, 0.217; GCF_018207095.1, s__Nocardiopsis sp018207095, 95.0, 83.32, 0.229; GCF_028882275.1, s__Nocardiopsis sp028882275, 95.0, 83.25, 0.266; GCF_900143625.1, s__Nocardiopsis sp900143625, 95.0, 83.09, 0.229; GCF_000515115.1, s__Nocardiopsis sp000515115, 95.0, 83.02, 0.181; GCF_014892575.1, s__Nocardiopsis coralli, 95.0, 82.85, 0.213; GCF_000341265.1, s__Nocardiopsis prasina, 95.0, 82.63, 0.245; GCF_001942255.1, s__Nocardiopsis sp001942255, 95.0, 82.61, 0.248; GCF_000341005.1, s__Nocardiopsis alkaliphila, 95.0, 82.53, 0.186; GCF_001570765.1, s__Nocardiopsis listeri, 95.0, 82.26, 0.198; GCF_000341025.1, s__Nocardiopsis salina, 95.0, 82.22, 0.158; GCF_000341145.1, s__Nocardiopsis xinjiangensis, 95.0, 81.14, 0.168	26.24	11	N/A	N/A
+NC_014212.fasta	d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Allomeiothermus;s__Allomeiothermus silvanus	GCF_000092125.1	95.0	d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Allomeiothermus;s__Allomeiothermus silvanus	100.0	0.999	GCF_000092125.1	95.0	d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Allomeiothermus;s__Allomeiothermus silvanus	100.0	0.999	d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Allomeiothermus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_003226535.1, s__Allomeiothermus sp003226535, 95.0, 87.73, 0.485	93.82	11	N/A	N/A
+NC_014363.fasta	d__Bacteria;p__Actinomycetota;c__Coriobacteriia;o__Coriobacteriales;f__Atopobiaceae;g__Olsenella;s__Olsenella uli	GCF_000143845.1	95.0	d__Bacteria;p__Actinomycetota;c__Coriobacteriia;o__Coriobacteriales;f__Atopobiaceae;g__Olsenella;s__Olsenella uli	100.0	1.0	GCF_000143845.1	95.0	d__Bacteria;p__Actinomycetota;c__Coriobacteriia;o__Coriobacteriales;f__Atopobiaceae;g__Olsenella;s__Olsenella uli	100.0	1.0	d__Bacteria;p__Actinomycetota;c__Coriobacteriia;o__Coriobacteriales;f__Atopobiaceae;g__;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	95.47	11	N/A	N/A
+NC_014364.fasta	d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae	GCF_000143985.1	95.0	d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae	100.0	1.0	GCF_000143985.1	95.0	d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae	100.0	1.0	d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000378205.1, s__Sediminispirochaeta bajacaliforniensis, 95.0, 94.41, 0.82	88.42	11	N/A	N/A
+NC_015761.fasta	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori	GCF_000252995.1	95.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori	100.0	1.0	GCF_000252995.1	95.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori	100.0	1.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000006945.2, s__Salmonella enterica, 95.0, 90.34, 0.758; GCA_900478215.1, s__Salmonella houtenae, 95.0, 90.05, 0.755; GCF_008692785.1, s__Salmonella diarizonae, 95.0, 89.91, 0.746; GCF_008692845.1, s__Salmonella arizonae, 95.0, 89.51, 0.704	97.58	11	N/A	N/A
+NC_017033.fasta	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia	GCF_000242255.2	95.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia	100.0	1.0	GCF_000242255.2	95.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia	100.0	1.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	98.45	11	N/A	N/A
+NC_017095.fasta	d__Bacteria;p__Thermotogota;c__Thermotogae;o__Thermotogales;f__Fervidobacteriaceae;g__Fervidobacterium;s__Fervidobacterium pennivorans	GCF_000235405.2	95.0	d__Bacteria;p__Thermotogota;c__Thermotogae;o__Thermotogales;f__Fervidobacteriaceae;g__Fervidobacterium;s__Fervidobacterium pennivorans	100.0	1.0	GCF_000235405.2	95.0	d__Bacteria;p__Thermotogota;c__Thermotogae;o__Thermotogales;f__Fervidobacteriaceae;g__Fervidobacterium;s__Fervidobacterium pennivorans	100.0	1.0	d__Bacteria;p__Thermotogota;c__Thermotogae;o__Thermotogales;f__Fervidobacteriaceae;g__Fervidobacterium;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_001644665.1, s__Fervidobacterium pennivorans_A, 95.0, 92.25, 0.827	90.82	11	N/A	N/A
+NC_018014.fasta	d__Bacteria;p__Acidobacteriota;c__Terriglobia;o__Terriglobales;f__Acidobacteriaceae;g__Terriglobus;s__Terriglobus roseus	GCF_000265425.1	95.0	d__Bacteria;p__Acidobacteriota;c__Terriglobia;o__Terriglobales;f__Acidobacteriaceae;g__Terriglobus;s__Terriglobus roseus	100.0	1.0	GCF_000265425.1	95.0	d__Bacteria;p__Acidobacteriota;c__Terriglobia;o__Terriglobales;f__Acidobacteriaceae;g__Terriglobus;s__Terriglobus roseus	100.0	1.0	d__Bacteria;p__Acidobacteriota;c__Terriglobia;o__Terriglobales;f__Acidobacteriaceae;g__Terriglobus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_900105625.1, s__Terriglobus roseus_B, 95.0, 82.2, 0.254	94.06	11	N/A	N/A
+NC_018068.fasta	d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus	GCF_000255115.2	95.0	d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus	100.0	1.0	GCF_000255115.2	95.0	d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus	100.0	1.0	d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_002196705.1, s__Desulfosporosinus sp002196705, 95.0, 81.15, 0.156	93.92	11	N/A	N/A
+NC_018515.fasta	d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei	GCF_000231385.2	95.0	d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei	100.0	1.0	GCF_000231385.2	95.0	d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei	100.0	1.0	d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_900100785.1, s__Desulfosporosinus hippei, 95.0, 94.11, 0.765; GCF_000765145.1, s__Desulfosporosinus sp000765145, 95.0, 92.48, 0.692	94.5	11	N/A	N/A
+NC_019897.fasta	d__Bacteria;p__Bacillota;c__Bacilli;o__Paenibacillales;f__Paenibacillaceae;g__Thermobacillus;s__Thermobacillus xylanilyticus	GCF_907165215.1	95.0	d__Bacteria;p__Bacillota;c__Bacilli;o__Paenibacillales;f__Paenibacillaceae;g__Thermobacillus;s__Thermobacillus xylanilyticus	97.81	0.815	GCF_907165215.1	95.0	d__Bacteria;p__Bacillota;c__Bacilli;o__Paenibacillales;f__Paenibacillaceae;g__Thermobacillus;s__Thermobacillus xylanilyticus	97.81	0.815	d__Bacteria;p__Bacillota;c__Bacilli;o__Paenibacillales;f__Paenibacillaceae;g__Thermobacillus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_002159085.1, s__Thermobacillus sp002159085, 95.0, 85.65, 0.466	95.97	11	N/A	N/A
+NC_019904.fasta	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Cytophagales;f__Cyclobacteriaceae;g__Echinicola;s__Echinicola vietnamensis	GCF_000325705.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Cytophagales;f__Cyclobacteriaceae;g__Echinicola;s__Echinicola vietnamensis	100.0	1.0	GCF_000325705.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Cytophagales;f__Cyclobacteriaceae;g__Echinicola;s__Echinicola vietnamensis	100.0	1.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Cytophagales;f__Cyclobacteriaceae;g__Echinicola;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_005281475.1, s__Echinicola rosea, 95.0, 83.28, 0.288; GCF_006575665.1, s__Echinicola soli, 95.0, 81.29, 0.203; GCF_003260975.1, s__Echinicola strongylocentroti, 95.0, 80.38, 0.164	96.96	11	N/A	N/A
+NC_019936.fasta	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE	GCF_000327065.1	95.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE	100.0	1.0	GCF_000327065.1	95.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE	100.0	1.0	d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_003696315.1, s__Stutzerimonas songnenensis, 95.0, 93.2, 0.909; GCF_000661915.1, s__Stutzerimonas decontaminans, 95.0, 91.33, 0.803; GCF_900114065.1, s__Stutzerimonas kunmingensis, 96.6, 90.17, 0.753; GCF_024397475.1, s__Stutzerimonas xanthomarina_A, 97.0, 90.15, 0.746; GCA_007713455.1, s__Stutzerimonas sp007713455, 95.0, 90.03, 0.748; GCF_014764705.1, s__Stutzerimonas sp002692525, 96.82, 90.01, 0.736; GCA_003530955.1, s__Stutzerimonas sp003530955, 96.79, 89.98, 0.727; GCF_002929225.1, s__Stutzerimonas stutzeri_U, 97.04, 89.97, 0.743; GCF_000935215.1, s__Stutzerimonas stutzeri_AD, 96.98, 89.84, 0.723; GCF_000495915.1, s__Stutzerimonas chloritidismutans, 96.78, 89.84, 0.717; GCA_018823765.1, s__Stutzerimonas sp018823765, 97.02, 89.77, 0.71; GCA_003488145.1, s__Stutzerimonas sp003488145, 96.59, 89.74, 0.666; GCF_000341615.1, s__Stutzerimonas stutzeri_G, 95.0, 89.32, 0.697; GCF_002890795.1, s__Stutzerimonas stutzeri_AA, 95.0, 89.28, 0.735; GCF_024448335.1, s__Stutzerimonas frequens, 95.0, 88.75, 0.714; GCF_015291885.1, s__Stutzerimonas stutzeri_AC, 95.0, 88.59, 0.662; GCF_000219605.1, s__Stutzerimonas stutzeri, 95.0, 88.34, 0.673; GCF_002909485.1, s__Stutzerimonas stutzeri_AH, 95.0, 88.19, 0.688; GCF_000307775.2, s__Stutzerimonas stutzeri_B, 95.0, 86.95, 
0.549; GCF_002890915.1, s__Stutzerimonas stutzeri_AF, 95.0, 85.91, 0.472; GCF_025966695.1, s__Stutzerimonas sp025966695, 95.0, 85.39, 0.44; GCA_000263395.1, s__Stutzerimonas stutzeri_C, 95.0, 85.38, 0.392; GCF_024448505.1, s__Stutzerimonas degradans, 96.08, 85.26, 0.426; GCF_021432765.1, s__Stutzerimonas phenolilytica, 95.0, 85.11, 0.435; GCF_015070855.1, s__Stutzerimonas lopnurensis, 95.0, 85.07, 0.41; GCF_021726475.1, s__Stutzerimonas oligotrophica, 95.0, 84.76, 0.419; GCF_000818015.1, s__Stutzerimonas balearica, 95.0, 83.88, 0.33; GCF_003696285.1, s__Stutzerimonas nitrititolerans, 95.0, 82.51, 0.26; GCF_018138085.1, s__Stutzerimonas stutzeri_AI, 95.0, 82.03, 0.245; GCF_005876855.1, s__Stutzerimonas nosocomialis, 95.0, 81.99, 0.242; GCF_019090095.1, s__Stutzerimonas stutzeri_AN, 95.0, 81.91, 0.245; GCF_013522825.1, s__Stutzerimonas stutzeri_AK, 95.0, 81.91, 0.2; GCA_002339675.1, s__Stutzerimonas stutzeri_O, 95.0, 81.89, 0.253; GCF_019355055.1, s__Stutzerimonas sp004331835, 95.0, 81.83, 0.222; GCF_024448955.1, s__Stutzerimonas stutzeri_AQ, 95.0, 81.79, 0.232; GCF_024448695.1, s__Stutzerimonas stutzeri_T, 95.0, 81.71, 0.242; GCF_022810315.1, s__Stutzerimonas marianensis, 95.0, 81.66, 0.218; GCF_024448935.1, s__Stutzerimonas stutzeri_AO, 95.0, 81.57, 0.177; GCF_009789555.1, s__Stutzerimonas stutzeri_R, 95.0, 81.41, 0.22; GCA_022448005.1, s__Stutzerimonas sp022448005, 95.0, 81.35, 0.194; GCF_003325755.1, s__Stutzerimonas sp003325755, 95.0, 81.28, 0.206; GCA_004010935.1, s__Stutzerimonas sp004010935, 95.0, 81.27, 0.216; GCA_002387205.1, s__Stutzerimonas stutzeri_N, 95.0, 81.26, 0.195; GCF_024448985.1, s__Stutzerimonas stutzeri_AP, 95.0, 81.22, 0.203; GCF_000425625.1, s__Stutzerimonas azotifigens, 95.0, 81.18, 0.187; GCF_000756775.1, s__Stutzerimonas saudiphocaensis, 95.0, 81.13, 0.219; GCF_000952685.1, s__Stutzerimonas stutzeri_E, 95.0, 81.08, 0.216; GCF_000235745.1, s__Stutzerimonas stutzeri_H, 95.0, 81.07, 0.199; GCF_013522725.1, s__Stutzerimonas azotifigens_A, 
95.0, 80.99, 0.203; GCA_900766265.1, s__Stutzerimonas sp900766265, 95.0, 80.94, 0.196; GCF_024448895.1, s__Stutzerimonas stutzeri_Q, 95.0, 80.91, 0.193; GCF_900129835.1, s__Stutzerimonas xanthomarina, 95.0, 80.89, 0.2; GCF_002890895.1, s__Stutzerimonas stutzeri_AB, 95.0, 80.87, 0.198; GCF_019880365.1, s__Stutzerimonas stutzeri_P, 95.0, 80.81, 0.187; GCA_002345575.1, s__Stutzerimonas stutzeri_S, 95.0, 80.74, 0.191; GCF_013620795.1, s__Stutzerimonas sp013620795, 95.0, 80.74, 0.187; GCF_024448715.1, s__Stutzerimonas stutzeri_AR, 95.0, 80.6, 0.18; GCF_000590475.1, s__Stutzerimonas stutzeri_D, 95.0, 80.4, 0.167; GCF_003696365.1, s__Stutzerimonas zhaodongensis, 95.0, 79.95, 0.152	97.72	11	N/A	N/A
+NC_021184.fasta	d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae	GCF_000233715.2	95.0	d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae	100.0	1.0	GCF_000233715.2	95.0	d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae	100.0	1.0	d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	95.73	11	N/A	N/A
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_000913.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,50 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_000913.3|provirus_1196867_1213107,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;92.80
+NC_000913.3|provirus_1196867_1213107,RS_GCF_000026225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii,blast,96.90,iPHoP-RF;92.40
+NC_000913.3|provirus_1196867_1213107,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;93.40
+NC_000913.3|provirus_1196867_1213107,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;96.40
+NC_000913.3|provirus_1196867_1213107,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;93.70
+NC_000913.3|provirus_1196867_1213107,RS_GCF_004211955.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp004211955,iPHoP-RF,96.40,None
+NC_000913.3|provirus_1196867_1213107,RS_GCF_005843885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp005843885,iPHoP-RF,96.40,None
+NC_000913.3|provirus_1196867_1213107,RS_GCF_011881725.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_E,iPHoP-RF,96.40,None
+NC_000913.3|provirus_1196867_1213107,RS_GCF_002965065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp002965065,iPHoP-RF,96.10,None
+NC_000913.3|provirus_1196867_1213107,RS_GCF_014836715.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia whittamii,iPHoP-RF,95.10,None
+NC_000913.3|provirus_1412000_1434224,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;93.70
+NC_000913.3|provirus_1412000_1434224,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;93.10
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002075345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter;s__Citrobacter braakii,blast,96.90,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;95.40
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002925905.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Klebsiella;s__Klebsiella michiganensis,blast,96.90,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;95.40
+NC_000913.3|provirus_1412000_1434224,RS_GCF_005843885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp005843885,iPHoP-RF,96.10,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002965065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp002965065,iPHoP-RF,95.40,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_014836715.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia whittamii,iPHoP-RF,95.40,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_000026225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii,iPHoP-RF,95.10,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_011881725.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_E,iPHoP-RF,95.10,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_002042885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter;s__Citrobacter portucalensis,blast,94.90,None
+NC_000913.3|provirus_1412000_1434224,RS_GCF_004211955.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp004211955,iPHoP-RF,92.40,None
+NC_000913.3|provirus_1627517_1653915,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;95.10
+NC_000913.3|provirus_1627517_1653915,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;96.10
+NC_000913.3|provirus_1627517_1653915,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;96.70
+NC_000913.3|provirus_1627517_1653915,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;96.10
+NC_000913.3|provirus_1627517_1653915,RS_GCF_011881725.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_E,blast,96.90,iPHoP-RF;96.10
+NC_000913.3|provirus_1627517_1653915,RS_GCF_000026225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii,iPHoP-RF,96.40,None
+NC_000913.3|provirus_1627517_1653915,RS_GCF_004211955.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp004211955,iPHoP-RF,96.10,None
+NC_000913.3|provirus_1627517_1653915,RS_GCF_005843885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp005843885,iPHoP-RF,96.10,None
+NC_000913.3|provirus_1627517_1653915,RS_GCF_002965065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp002965065,iPHoP-RF,95.70,None
+NC_000913.3|provirus_1627517_1653915,RS_GCF_014836715.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia whittamii,iPHoP-RF,95.70,None
+NC_000913.3|provirus_2461306_2476510,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;93.10
+NC_000913.3|provirus_2461306_2476510,RS_GCF_000026225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia fergusonii,blast,96.90,iPHoP-RF;94.40
+NC_000913.3|provirus_2461306_2476510,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;94.10
+NC_000913.3|provirus_2461306_2476510,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;93.40
+NC_000913.3|provirus_2461306_2476510,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;92.80
+NC_000913.3|provirus_2461306_2476510,RS_GCF_011881725.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli_E,blast,96.90,iPHoP-RF;96.40
+NC_000913.3|provirus_2461306_2476510,RS_GCF_002965065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp002965065,iPHoP-RF,95.10,None
+NC_000913.3|provirus_2461306_2476510,RS_GCF_004211955.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp004211955,iPHoP-RF,95.10,None
+NC_000913.3|provirus_2461306_2476510,RS_GCF_005843885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia sp005843885,iPHoP-RF,93.70,None
+NC_000913.3|provirus_2461306_2476510,RS_GCF_014836715.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia whittamii,iPHoP-RF,93.40,None
+NC_000913.3|provirus_563848_584430,GB_GCA_021307345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia ruysiae,blast,96.90,iPHoP-RF;88.20
+NC_000913.3|provirus_563848_584430,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.90,iPHoP-RF;89.20
+NC_000913.3|provirus_563848_584430,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,96.90,iPHoP-RF;88.50
+NC_000913.3|provirus_563848_584430,RS_GCF_002925905.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Klebsiella;s__Klebsiella michiganensis,blast,96.90,None
+NC_000913.3|provirus_563848_584430,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;87.00
+NC_000913.3|provirus_563848_584430,RS_GCF_002075345.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter;s__Citrobacter braakii,blast,96.50,None
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_002737.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,133 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000186445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus agalactiae,CRISPR,97.80,blast;91.00 iPHoP-RF;88.90
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900459225.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus dysgalactiae,iPHoP-RF,97.10,blast;96.90
+NC_002737.2|provirus_1186916_1222544,RS_GCF_002055535.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes,blast,96.90,iPHoP-RF;96.40
+NC_002737.2|provirus_1186916_1222544,RS_GCF_022354845.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_AA,CRISPR,96.80,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900459405.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis,CRISPR,96.80,iPHoP-RF;89.50
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900636575.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus canis,iPHoP-RF,96.70,blast;96.60
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000425025.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus castoreus,iPHoP-RF,94.70,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_001598035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halotolerans,iPHoP-RF,93.70,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000154985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus infantarius,iPHoP-RF,93.40,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900475675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus lutetiensis,iPHoP-RF,93.10,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000187265.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equinus,iPHoP-RF,92.80,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_900101445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equinus_B,iPHoP-RF,92.80,None
+NC_002737.2|provirus_1186916_1222544,GB_GCA_000283635.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus macedonicus,iPHoP-RF,92.40,None
+NC_002737.2|provirus_1186916_1222544,GB_GCA_934196125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp934196125,iPHoP-RF,92.40,None
+NC_002737.2|provirus_1186916_1222544,GB_GCA_900637675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equi,iPHoP-RF,92.10,blast;62.80
+NC_002737.2|provirus_1186916_1222544,RS_GCF_004843545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pasteurianus,iPHoP-RF,91.80,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_003337175.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus_B,iPHoP-RF,91.40,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_009870755.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halichoeri,iPHoP-RF,91.10,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_002000985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus,iPHoP-RF,90.80,None
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000188015.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ictaluri,iPHoP-RF,90.50,blast;62.80
+NC_002737.2|provirus_1186916_1222544,RS_GCF_000188055.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus urinalis,iPHoP-RF,90.50,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000960035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus oralis_G,CRISPR,98.60,iPHoP-RF;97.10
+NC_002737.2|provirus_529627_569283,RS_GCF_002055535.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes,CRISPR,98.60,blast;97.50 iPHoP-RF;96.10
+NC_002737.2|provirus_529627_569283,RS_GCF_002093545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus oralis_C,CRISPR,98.60,iPHoP-RF;96.10
+NC_002737.2|provirus_529627_569283,RS_GCF_900636575.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus canis,CRISPR,98.40,iPHoP-RF;97.10 blast;96.70
+NC_002737.2|provirus_529627_569283,RS_GCF_001937065.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp001937065,CRISPR,98.20,iPHoP-RF;96.70
+NC_002737.2|provirus_529627_569283,RS_GCF_902729355.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp902729355,CRISPR,98.10,iPHoP-RF;95.40
+NC_002737.2|provirus_529627_569283,RS_GCF_000186445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus agalactiae,CRISPR,97.60,iPHoP-RF;91.40 blast;67.70
+NC_002737.2|provirus_529627_569283,RS_GCF_000188035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pseudoporcinus,CRISPR,97.60,iPHoP-RF;96.40
+NC_002737.2|provirus_529627_569283,RS_GCF_000220065.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp000220065,iPHoP-RF,97.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000379985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus caballi,iPHoP-RF,97.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000380105.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus orisratti,iPHoP-RF,97.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000380125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ovis,iPHoP-RF,97.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_900459225.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus dysgalactiae,blast,96.90,iPHoP-RF;93.10
+NC_002737.2|provirus_529627_569283,RS_GCF_000423745.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus plurextorum,iPHoP-RF,96.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_002953735.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pluranimalium,iPHoP-RF,96.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_006739205.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus mutans,iPHoP-RF,96.70,None
+NC_002737.2|provirus_529627_569283,GB_GCA_945876895.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp945876895,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000425025.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus castoreus,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_002000985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_002355215.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus troglodytae,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_003337175.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus_B,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_900475415.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus porcinus,iPHoP-RF,96.40,None
+NC_002737.2|provirus_529627_569283,GB_GCA_900637675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equi,iPHoP-RF,96.10,blast;78.70
+NC_002737.2|provirus_529627_569283,GB_GCA_934196125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp934196125,iPHoP-RF,96.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000420785.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyovaginalis,iPHoP-RF,96.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_004843545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pasteurianus,iPHoP-RF,96.10,None
+NC_002737.2|provirus_529627_569283,GB_GCA_000283635.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus macedonicus,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000423765.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus porci,iPHoP-RF,95.70,blast;72.00
+NC_002737.2|provirus_529627_569283,RS_GCF_003686955.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hillyeri,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_011039275.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis_A,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_012277075.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus alactolyticus,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_900459405.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_901542335.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus porcinus_A,iPHoP-RF,95.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000187995.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus macacae,iPHoP-RF,95.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000380145.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus thoraltensis,iPHoP-RF,95.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_012396585.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ovuberis,iPHoP-RF,95.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_016908655.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus saliviloxodontae,iPHoP-RF,95.40,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000188055.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus urinalis,iPHoP-RF,95.10,blast;66.30
+NC_002737.2|provirus_529627_569283,RS_GCF_001598035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halotolerans,iPHoP-RF,95.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_009870755.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halichoeri,iPHoP-RF,95.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_024814375.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp024814375,iPHoP-RF,95.10,None
+NC_002737.2|provirus_529627_569283,RS_GCF_011421425.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus catagoni,iPHoP-RF,94.70,blast;66.30
+NC_002737.2|provirus_529627_569283,RS_GCF_000380085.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus merionis,iPHoP-RF,93.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_000785785.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus uberis_A,iPHoP-RF,93.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_003674745.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus iniae,iPHoP-RF,93.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_900475595.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus uberis,iPHoP-RF,93.70,None
+NC_002737.2|provirus_529627_569283,RS_GCF_019794555.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_AB,iPHoP-RF,91.10,None
+NC_002737.2|provirus_777501_820593,MGYG000003717,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__,CRISPR,98.40,iPHoP-RF;96.70
+NC_002737.2|provirus_777501_820593,RS_GCF_004843545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pasteurianus,CRISPR,98.40,iPHoP-RF;94.10
+NC_002737.2|provirus_777501_820593,GB_GCA_000283635.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus macedonicus,CRISPR,98.30,iPHoP-RF;88.50
+NC_002737.2|provirus_777501_820593,RS_GCF_000186445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus agalactiae,CRISPR,98.30,iPHoP-RF;80.30 blast;76.70
+NC_002737.2|provirus_777501_820593,RS_GCF_002055535.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pyogenes,blast,98.00,iPHoP-RF;93.70
+NC_002737.2|provirus_777501_820593,RS_GCF_900636575.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus canis,CRISPR,98.00,blast;96.50 iPHoP-RF;95.40
+NC_002737.2|provirus_777501_820593,RS_GCF_010120595.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus thermophilus,CRISPR,97.90,iPHoP-RF;96.10
+NC_002737.2|provirus_777501_820593,RS_GCF_000220065.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp000220065,iPHoP-RF,97.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_001697145.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus anginosus_C,iPHoP-RF,97.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_009717815.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus parasanguinis_F,iPHoP-RF,97.10,blast;83.70
+NC_002737.2|provirus_777501_820593,RS_GCF_016648925.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp900766505,iPHoP-RF,97.10,blast;83.70
+NC_002737.2|provirus_777501_820593,RS_GCF_900636475.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus anginosus,iPHoP-RF,97.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_902167705.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus constellatus_A,iPHoP-RF,97.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_943193075.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus parasanguinis_E,iPHoP-RF,97.10,blast;83.70
+NC_002737.2|provirus_777501_820593,RS_GCF_900459225.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus dysgalactiae,blast,96.90,iPHoP-RF;95.10
+NC_002737.2|provirus_777501_820593,RS_GCF_000380125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ovis,iPHoP-RF,96.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000423765.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus porci,iPHoP-RF,96.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_001598035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus halotolerans,iPHoP-RF,96.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_023109675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus parasanguinis_I,iPHoP-RF,96.70,blast;83.70
+NC_002737.2|provirus_777501_820593,RS_GCF_023167545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus constellatus,iPHoP-RF,96.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000423745.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus plurextorum,iPHoP-RF,96.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_003686955.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hillyeri,iPHoP-RF,96.40,blast;70.10
+NC_002737.2|provirus_777501_820593,RS_GCF_011039275.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis_A,iPHoP-RF,96.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000380025.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus entericus,iPHoP-RF,96.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000380145.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus thoraltensis,iPHoP-RF,96.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_900475675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus lutetiensis,iPHoP-RF,96.10,blast;68.90
+NC_002737.2|provirus_777501_820593,RS_GCF_000154985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus infantarius,iPHoP-RF,95.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000420785.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyovaginalis,iPHoP-RF,95.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000425025.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus castoreus,iPHoP-RF,95.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_002000985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus,iPHoP-RF,95.40,blast;68.90
+NC_002737.2|provirus_777501_820593,GB_GCA_000440235.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_F,iPHoP-RF,95.10,None
+NC_002737.2|provirus_777501_820593,GB_GCA_934196125.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp934196125,iPHoP-RF,95.10,None
+NC_002737.2|provirus_777501_820593,GB_GCA_002831545.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_P,iPHoP-RF,94.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000785515.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus salivarius,iPHoP-RF,94.70,blast;68.90
+NC_002737.2|provirus_777501_820593,RS_GCF_003337175.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus gallolyticus_B,iPHoP-RF,94.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_900101445.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equinus_B,iPHoP-RF,94.70,None
+NC_002737.2|provirus_777501_820593,GB_GCA_945876895.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp945876895,iPHoP-RF,94.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_002760245.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_I,iPHoP-RF,94.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_002953735.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pluranimalium,iPHoP-RF,94.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000380105.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus orisratti,iPHoP-RF,94.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_902702775.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_W,iPHoP-RF,94.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_902729355.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp902729355,iPHoP-RF,94.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000376985.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus henryi,iPHoP-RF,93.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_012396585.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus ovuberis,iPHoP-RF,93.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_016743335.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_Y,iPHoP-RF,93.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_900459405.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus hyointestinalis,iPHoP-RF,93.70,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000294495.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis,iPHoP-RF,93.40,blast;65.20
+NC_002737.2|provirus_777501_820593,RS_GCF_000380085.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus merionis,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_001302265.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus phocae,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_016908655.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus saliviloxodontae,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_019794555.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_AB,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_021654455.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus parasuis,iPHoP-RF,93.40,None
+NC_002737.2|provirus_777501_820593,GB_GCA_900637675.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus equi,iPHoP-RF,93.10,blast;70.70
+NC_002737.2|provirus_777501_820593,RS_GCF_000440115.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_L,iPHoP-RF,93.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_003595525.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus respiraculi,iPHoP-RF,93.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_015594605.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp015594605,iPHoP-RF,92.80,blast;68.90
+NC_002737.2|provirus_777501_820593,RS_GCF_000188055.2,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus urinalis,iPHoP-RF,92.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_012277075.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus alactolyticus,iPHoP-RF,92.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_001578805.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus sp001578805,iPHoP-RF,91.80,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000785785.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus uberis_A,iPHoP-RF,91.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_022354845.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus suis_AA,iPHoP-RF,91.40,None
+NC_002737.2|provirus_777501_820593,RS_GCF_900475595.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus uberis,iPHoP-RF,91.10,None
+NC_002737.2|provirus_777501_820593,RS_GCF_003674745.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus iniae,iPHoP-RF,90.80,None
+NC_002737.2|provirus_777501_820593,RS_GCF_000188035.1,d__Bacteria;p__Bacillota;c__Bacilli;o__Lactobacillales;f__Streptococcaceae;g__Streptococcus;s__Streptococcus pseudoporcinus,iPHoP-RF,90.50,None
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_008261.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_008261.1|provirus_1070550_1127691,RS_GCF_000013285.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens,blast,97.50,iPHoP-RF;76.60 CRISPR;50.20
+NC_008261.1|provirus_1784095_1821197,RS_GCF_000013285.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Clostridiales;f__Clostridiaceae;g__Sarcina;s__Sarcina perfringens,blast,96.90,CRISPR;93.40 iPHoP-RF;85.40
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_009012.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,5 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_009012.1|provirus_1938476_1983993,RS_GCF_000015865.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum,blast,94.90,iPHoP-RF;71.30
+NC_009012.1|provirus_2022140_2067593,RS_GCF_000015865.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum,blast,93.90,None
+NC_009012.1|provirus_2931283_2970170,RS_GCF_000015865.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum,blast,91.80,None
+NC_009012.1|provirus_3339258_3389049,RS_GCF_000015865.1,d__Bacteria;p__Bacillota_A;c__Clostridia;o__Acetivibrionales;f__Acetivibrionaceae;g__Hungateiclostridium;s__Hungateiclostridium thermocellum,blast,95.50,iPHoP-RF;69.10
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_014168.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_014168.1|provirus_1141631_1162952,RS_GCF_000092825.1,d__Bacteria;p__Actinomycetota;c__Actinomycetia;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus,blast,95.70,iPHoP-RF;68.00
+NC_014168.1|provirus_27479_67296,RS_GCF_000092825.1,d__Bacteria;p__Actinomycetota;c__Actinomycetia;o__Mycobacteriales;f__Mycobacteriaceae;g__Segniliparus;s__Segniliparus rotundus,blast,96.00,iPHoP-RF;79.30
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_014212.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,9 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_014212.1|provirus_1170297_1209132,RS_GCF_000092125.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Meiothermus_B;s__Meiothermus_B silvanus,blast,95.50,iPHoP-RF;80.80
+NC_014212.1|provirus_1170297_1209132,RS_GCF_003226535.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Meiothermus_B;s__Meiothermus_B sp003226535,blast,92.20,iPHoP-RF;72.60
+NC_014212.1|provirus_1170297_1209132,RS_GCF_000430045.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Calidithermus;s__Calidithermus chliarophilus,blast,90.90,CRISPR;76.20 iPHoP-RF;73.70
+NC_014212.1|provirus_1746722_1764354,RS_GCF_000092125.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Meiothermus_B;s__Meiothermus_B silvanus,blast,95.20,iPHoP-RF;86.00
+NC_014212.1|provirus_1893193_1914973,RS_GCF_000092125.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Meiothermus_B;s__Meiothermus_B silvanus,blast,94.80,iPHoP-RF;66.00
+NC_014212.1|provirus_1893193_1914973,RS_GCF_003574095.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Calidithermus;s__Calidithermus roseus,blast,91.00,None
+NC_014212.1|provirus_1893193_1914973,RS_GCF_000430045.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Calidithermus;s__Calidithermus chliarophilus,blast,90.80,iPHoP-RF;57.10
+NC_014212.1|provirus_1893193_1914973,RS_GCF_000373205.1,d__Bacteria;p__Deinococcota;c__Deinococci;o__Deinococcales;f__Thermaceae;g__Calidithermus;s__Calidithermus timidus,blast,90.40,None
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_014364.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,7 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_014364.1|provirus_2121424_2157334,RS_GCF_000143985.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae,blast,96.20,CRISPR;95.40 iPHoP-RF;68.40
+NC_014364.1|provirus_2121424_2157334,RS_GCF_000378205.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta bajacaliforniensis,CRISPR,93.40,blast;91.30 iPHoP-RF;63.50
+NC_014364.1|provirus_2329685_2350621,RS_GCF_000143985.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae,blast,95.70,iPHoP-RF;65.10
+NC_014364.1|provirus_2329685_2350621,RS_GCF_000378205.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta bajacaliforniensis,blast,92.10,iPHoP-RF;52.80
+NC_014364.1|provirus_2666253_2703772,RS_GCF_000143985.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae,blast,96.20,CRISPR;74.20 iPHoP-RF;72.60
+NC_014364.1|provirus_2976748_3014759,RS_GCF_000143985.1,d__Bacteria;p__Spirochaetota;c__Spirochaetia;o__DSM-16054;f__Sediminispirochaetaceae;g__Sediminispirochaeta;s__Sediminispirochaeta smaragdinae,blast,96.20,iPHoP-RF;69.80
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_015761.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,21 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_015761.1|provirus_1007223_1045009,GB_GCA_900446925.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter_B;s__Citrobacter_B koseri,blast,96.90,iPHoP-RF;83.30
+NC_015761.1|provirus_1007223_1045009,GB_GCA_900478215.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella houtenae,blast,96.90,iPHoP-RF;90.80
+NC_015761.1|provirus_1007223_1045009,RS_GCF_000006945.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella enterica,blast,96.90,iPHoP-RF;88.50
+NC_015761.1|provirus_1007223_1045009,RS_GCF_000252995.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori,blast,96.90,iPHoP-RF;91.10
+NC_015761.1|provirus_1007223_1045009,RS_GCF_008692785.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella diarizonae,blast,96.90,iPHoP-RF;93.40
+NC_015761.1|provirus_1007223_1045009,RS_GCF_008692845.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella arizonae,blast,96.90,iPHoP-RF;90.50
+NC_015761.1|provirus_1007223_1045009,RS_GCF_006874705.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Leclercia;s__Leclercia adecarboxylata_C,blast,91.00,None
+NC_015761.1|provirus_3084741_3115735,RS_GCF_000006945.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella enterica,CRISPR,98.50,blast;96.80 iPHoP-RF;89.80
+NC_015761.1|provirus_3084741_3115735,RS_GCF_008692785.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella diarizonae,CRISPR,98.10,iPHoP-RF;90.80
+NC_015761.1|provirus_3084741_3115735,RS_GCF_000252995.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori,blast,96.90,iPHoP-RF;90.10
+NC_015761.1|provirus_3084741_3115735,RS_GCF_002918555.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter_C;s__Citrobacter_C amalonaticus_A,blast,93.20,None
+NC_015761.1|provirus_3084741_3115735,GB_GCA_900446925.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Citrobacter_B;s__Citrobacter_B koseri,iPHoP-RF,92.10,CRISPR;67.50
+NC_015761.1|provirus_847397_862760,RS_GCF_003697165.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia coli,blast,96.90,iPHoP-RF;88.90
+NC_015761.1|provirus_847397_862760,RS_GCF_000759775.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia albertii,blast,96.30,iPHoP-RF;86.70
+NC_015761.1|provirus_847397_862760,RS_GCF_001729745.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Enterobacter;s__Enterobacter hormaechei_A,blast,96.20,iPHoP-RF;73.00
+NC_015761.1|provirus_847397_862760,RS_GCF_000252995.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella bongori,blast,93.90,iPHoP-RF;71.50
+NC_015761.1|provirus_847397_862760,GB_GCA_900478215.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella houtenae,blast,91.90,iPHoP-RF;73.70
+NC_015761.1|provirus_847397_862760,RS_GCF_000006945.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella enterica,blast,91.70,iPHoP-RF;88.50
+NC_015761.1|provirus_847397_862760,RS_GCF_008692845.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Salmonella;s__Salmonella arizonae,blast,91.70,iPHoP-RF;84.50
+NC_015761.1|provirus_847397_862760,RS_GCF_002900365.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Enterobacterales;f__Enterobacteriaceae;g__Escherichia;s__Escherichia marmotae,blast,90.00,iPHoP-RF;87.00
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_017033.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,4 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_017033.1|provirus_1052334_1094910,RS_GCF_000242255.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia,blast,98.40,None
+NC_017033.1|provirus_1557694_1600481,RS_GCF_000242255.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia,blast,98.40,iPHoP-RF;64.30
+NC_017033.1|provirus_2089294_2107522,RS_GCF_000242255.2,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Xanthomonadales;f__Rhodanobacteraceae;g__Frateuria;s__Frateuria aurantia,blast,95.20,None
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_018068.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,13 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_018068.1|provirus_1361108_1399802,RS_GCF_000255115.2,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus,blast,96.40,iPHoP-RF;53.60
+NC_018068.1|provirus_1361108_1399802,RS_GCF_001707885.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp001707885,iPHoP-RF,95.40,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_001936615.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus metallidurans,iPHoP-RF,95.40,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_000224515.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp000224515,iPHoP-RF,95.10,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_000960765.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp000960765,iPHoP-RF,93.40,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_004766055.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp004766055,iPHoP-RF,93.10,None
+NC_018068.1|provirus_1361108_1399802,3300011997_21,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__,iPHoP-RF,92.10,None
+NC_018068.1|provirus_1361108_1399802,GB_GCA_002404215.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp002404215,iPHoP-RF,91.80,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_001029285.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acididurans,blast,91.80,None
+NC_018068.1|provirus_1361108_1399802,RS_GCF_002196705.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp002196705,blast,91.20,iPHoP-RF;78.30
+NC_018068.1|provirus_1361108_1399802,GB_GCA_900290375.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus infrequens,blast,90.30,iPHoP-RF;73.50
+NC_018068.1|provirus_2072558_2098541,RS_GCF_000255115.2,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acidiphilus,blast,93.60,iPHoP-RF;69.50
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_018515.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,22 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_018515.1|provirus_3418112_3436097,RS_GCF_000231385.2,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei,blast,95.90,iPHoP-RF;79.80
+NC_018515.1|provirus_3418112_3436097,RS_GCF_004766055.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp004766055,iPHoP-RF,95.70,None
+NC_018515.1|provirus_3418112_3436097,GB_GCA_002404215.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp002404215,iPHoP-RF,95.10,None
+NC_018515.1|provirus_3418112_3436097,3300011997_21,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__,iPHoP-RF,94.70,None
+NC_018515.1|provirus_3418112_3436097,GB_GCA_021779415.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp021779415,iPHoP-RF,92.80,None
+NC_018515.1|provirus_3418112_3436097,RS_GCF_023897015.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus nitroreducens,blast,91.80,iPHoP-RF;73.20
+NC_018515.1|provirus_3418112_3436097,GB_GCA_003132105.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp003132105,iPHoP-RF,91.40,None
+NC_018515.1|provirus_3418112_3436097,RS_GCF_020595055.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp020595055,blast,91.40,iPHoP-RF;74.10
+NC_018515.1|provirus_3418112_3436097,RS_GCF_000235605.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus orientis,blast,90.70,iPHoP-RF;73.00
+NC_018515.1|provirus_3418112_3436097,RS_GCF_900100785.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus hippei,blast,90.30,iPHoP-RF;71.70
+NC_018515.1|provirus_4659544_4694673,RS_GCF_000231385.2,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus meridiei,blast,96.40,iPHoP-RF;77.30
+NC_018515.1|provirus_4659544_4694673,RS_GCF_023897015.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus nitroreducens,blast,95.70,iPHoP-RF;86.00
+NC_018515.1|provirus_4659544_4694673,GB_GCA_002404215.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp002404215,iPHoP-RF,94.40,None
+NC_018515.1|provirus_4659544_4694673,GB_GCA_900290375.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus infrequens,iPHoP-RF,94.40,None
+NC_018515.1|provirus_4659544_4694673,3300011997_21,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__,iPHoP-RF,94.10,None
+NC_018515.1|provirus_4659544_4694673,RS_GCF_900100785.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus hippei,blast,93.30,iPHoP-RF;73.50
+NC_018515.1|provirus_4659544_4694673,GB_GCA_003132105.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp003132105,iPHoP-RF,92.40,None
+NC_018515.1|provirus_4659544_4694673,GB_GCA_016278585.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp016278585,iPHoP-RF,92.10,None
+NC_018515.1|provirus_4659544_4694673,RS_GCF_001707885.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus sp001707885,blast,90.80,iPHoP-RF;85.70
+NC_018515.1|provirus_4659544_4694673,RS_GCF_000244895.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus youngiae,blast,90.40,iPHoP-RF;83.30
+NC_018515.1|provirus_4659544_4694673,RS_GCF_001029285.1,d__Bacteria;p__Bacillota_B;c__Desulfitobacteriia;o__Desulfitobacteriales;f__Desulfitobacteriaceae;g__Desulfosporosinus;s__Desulfosporosinus acididurans,blast,90.40,iPHoP-RF;85.70
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_019936.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,45 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_019936.1|provirus_2347508_2361929,RS_GCF_015291885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AC,CRISPR,97.40,blast;95.00 iPHoP-RF;87.30
+NC_019936.1|provirus_2347508_2361929,RS_GCF_003640395.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas urumqiensis,CRISPR,96.90,iPHoP-RF;51.70
+NC_019936.1|provirus_2347508_2361929,RS_GCF_000219605.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri,blast,96.10,CRISPR;90.50 iPHoP-RF;84.20
+NC_019936.1|provirus_2347508_2361929,RS_GCF_000327065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE,blast,95.90,iPHoP-RF;69.30
+NC_019936.1|provirus_2347508_2361929,RS_GCF_002929225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_U,blast,94.10,iPHoP-RF;89.50
+NC_019936.1|provirus_2347508_2361929,RS_GCF_003935375.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas xanthomarina_A,blast,94.10,iPHoP-RF;86.70 CRISPR;82.70
+NC_019936.1|provirus_2347508_2361929,GB_GCA_007713455.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp007713455,blast,93.10,iPHoP-RF;77.10
+NC_019936.1|provirus_2347508_2361929,RS_GCF_021432085.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis_A,blast,93.00,iPHoP-RF;89.20
+NC_019936.1|provirus_2347508_2361929,RS_GCF_000341615.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_G,blast,91.80,iPHoP-RF;75.00
+NC_019936.1|provirus_2347508_2361929,RS_GCF_003696285.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas nitrititolerans,blast,90.60,iPHoP-RF;51.50
+NC_019936.1|provirus_2347508_2361929,RS_GCF_015070855.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas lopnurensis,blast,90.10,iPHoP-RF;73.50
+NC_019936.1|provirus_3233292_3242961,RS_GCF_003696285.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas nitrititolerans,blast,96.90,iPHoP-RF;70.40
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000219605.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri,blast,96.80,iPHoP-RF;95.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000495915.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas chloritidismutans,blast,96.80,iPHoP-RF;88.90
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000818015.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas balearica,blast,96.80,iPHoP-RF;65.30
+NC_019936.1|provirus_3233292_3242961,RS_GCF_002929225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_U,blast,96.80,iPHoP-RF;92.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_003935375.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas xanthomarina_A,blast,96.80,iPHoP-RF;88.90
+NC_019936.1|provirus_3233292_3242961,RS_GCF_900114065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis,blast,96.80,iPHoP-RF;92.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_002890795.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AA,iPHoP-RF,96.70,blast;91.70
+NC_019936.1|provirus_3233292_3242961,RS_GCF_015291885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AC,blast,96.70,iPHoP-RF;93.70
+NC_019936.1|provirus_3233292_3242961,RS_GCF_021432085.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis_A,blast,96.70,iPHoP-RF;93.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_003696315.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas songnenensis,blast,96.20,iPHoP-RF;94.70
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000327065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE,blast,95.70,iPHoP-RF;94.10
+NC_019936.1|provirus_3233292_3242961,RS_GCF_002909485.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AH,blast,94.30,iPHoP-RF;91.80
+NC_019936.1|provirus_3233292_3242961,RS_GCF_014764705.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp002692525,iPHoP-RF,92.40,None
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000661915.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_A,iPHoP-RF,92.10,blast;91.90
+NC_019936.1|provirus_3233292_3242961,RS_GCF_000935215.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AD,iPHoP-RF,91.10,None
+NC_019936.1|provirus_4295725_4304306,RS_GCF_003696285.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas nitrititolerans,blast,96.90,iPHoP-RF;85.40
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000219605.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri,blast,96.80,iPHoP-RF;96.10
+NC_019936.1|provirus_4295725_4304306,RS_GCF_015291885.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AC,blast,96.60,iPHoP-RF;96.10
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000818015.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas balearica,blast,96.20,iPHoP-RF;85.70
+NC_019936.1|provirus_4295725_4304306,RS_GCF_002909485.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AH,iPHoP-RF,95.70,blast;92.80
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000495915.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas chloritidismutans,iPHoP-RF,94.10,blast;89.90
+NC_019936.1|provirus_4295725_4304306,RS_GCF_002929225.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_U,iPHoP-RF,94.10,blast;89.90
+NC_019936.1|provirus_4295725_4304306,RS_GCF_003935375.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas xanthomarina_A,iPHoP-RF,94.10,blast;90.30
+NC_019936.1|provirus_4295725_4304306,RS_GCF_003696315.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas songnenensis,blast,93.90,iPHoP-RF;86.30
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000327065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AE,blast,93.80,iPHoP-RF;85.70
+NC_019936.1|provirus_4295725_4304306,RS_GCF_014764705.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp002692525,iPHoP-RF,93.70,None
+NC_019936.1|provirus_4295725_4304306,RS_GCF_900114065.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis,iPHoP-RF,93.70,blast;91.00
+NC_019936.1|provirus_4295725_4304306,GB_GCA_003488145.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp003488145,iPHoP-RF,93.40,None
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000935215.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_AD,iPHoP-RF,92.40,blast;90.60
+NC_019936.1|provirus_4295725_4304306,RS_GCF_021432085.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas kunmingensis_A,iPHoP-RF,92.40,blast;89.90
+NC_019936.1|provirus_4295725_4304306,GB_GCA_007713455.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas sp007713455,iPHoP-RF,91.80,None
+NC_019936.1|provirus_4295725_4304306,RS_GCF_000661915.1,d__Bacteria;p__Pseudomonadota;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Stutzerimonas;s__Stutzerimonas stutzeri_A,blast,91.70,iPHoP-RF;83.10
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/iphop_host_prediction_to_genome/NC_021184.fasta.csv	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,9 @@
+Virus,Host genome,Host taxonomy,Main method,Confidence score,Additional methods
+NC_021184.1|provirus_19778_35564,RS_GCF_000233715.2,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae,blast,95.50,iPHoP-RF;84.20
+NC_021184.1|provirus_19778_35564,RS_GCF_008124625.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum thermosapovorans,iPHoP-RF,93.40,blast;90.30
+NC_021184.1|provirus_19778_35564,GB_GCA_016841645.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum geothermicum_B,blast,90.90,iPHoP-RF;74.80
+NC_021184.1|provirus_19778_35564,GB_GCA_016841205.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum geothermicum_A,blast,90.60,iPHoP-RF;70.90
+NC_021184.1|provirus_19778_35564,GB_GCA_016841905.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum geothermicum_C,blast,90.40,iPHoP-RF;51.20
+NC_021184.1|provirus_19778_35564,RS_GCF_009932395.1,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum syntrophicum,blast,90.30,iPHoP-RF;83.30
+NC_021184.1|provirus_4466413_4519129,RS_GCF_000233715.2,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae,blast,98.40,iPHoP-RF;68.90
+NC_021184.1|provirus_4563831_4615358,RS_GCF_000233715.2,d__Bacteria;p__Bacillota_B;c__Desulfotomaculia;o__Desulfotomaculales;f__Desulfallaceae;g__Sporotomaculum;s__Sporotomaculum gibsoniae,blast,98.20,iPHoP-RF;76.80
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_000913.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
+NC_000913.3|provirus_1196867_1213107_23	NC_000913.3|provirus_1196867_1213107	K00031	"IDH1, IDH2, icd; isocitrate dehydrogenase [EC:1.1.1.42]"	PF00180.20	Isocitrate/isopropylmalate dehydrogenase
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_002737.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
+NC_002737.2|provirus_777501_820593_1	NC_002737.2|provirus_777501_820593	K01710	"E4.2.1.46, rfbB, rffG; dTDP-glucose 4,6-dehydratase [EC:4.2.1.46]"	PF16363.5	"GDP-mannose 4,6 dehydratase"
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_008261.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_009012.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
+NC_009012.1|provirus_2022140_2067593_32	NC_009012.1|provirus_2022140_2067593	K00558	"DNMT1, dcm; DNA (cytosine-5)-methyltransferase 1 [EC:2.1.1.37]"	PF00145.17	C-5 cytosine-specific DNA methylase
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_014168.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
+NC_014168.1|provirus_1141631_1162952_17	NC_014168.1|provirus_1141631_1162952	K00558	"DNMT1, dcm; DNA (cytosine-5)-methyltransferase 1 [EC:2.1.1.37]"	PF00145.17	C-5 cytosine-specific DNA methylase
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_014212.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_014364.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
+NC_014364.1|provirus_2666253_2703772_28	NC_014364.1|provirus_2666253_2703772	K00390	cysH; phosphoadenosine phosphosulfate reductase [EC:1.8.4.8 1.8.4.10]	PF01507.19	Phosphoadenosine phosphosulfate reductase family
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_015761.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_017033.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,2 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
+NC_017033.1|provirus_1557694_1600481_7	NC_017033.1|provirus_1557694_1600481	K00558	"DNMT1, dcm; DNA (cytosine-5)-methyltransferase 1 [EC:2.1.1.37]"	PF00145.17	C-5 cytosine-specific DNA methylase
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_018068.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_018515.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,3 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
+NC_018515.1|provirus_4659544_4694673_38	NC_018515.1|provirus_4659544_4694673	K06167	"phnP; phosphoribosyl 1,2-cyclic phosphate phosphodiesterase [EC:3.1.4.55]"	PF00753.27	Metallo-beta-lactamase superfamily
+NC_018515.1|provirus_3418112_3436097_1	NC_018515.1|provirus_3418112_3436097	K00106	XDH; xanthine dehydrogenase/oxidase [EC:1.17.1.4 1.17.3.2]	PF02738.18	Molybdopterin-binding domain of aldehyde dehydrogenase
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_019936.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vibrant_amg_individuals/NC_021184.fasta.tabular	Wed Jun 04 17:36:40 2025 +0000
@@ -0,0 +1,1 @@
+protein	scaffold	AMG KO	AMG KO name	Pfam	Pfam name