changeset 0:52d69f74b19e draft

planemo upload for repository https://github.com/phac-nml/galaxy_tools/tree/master/tools/spatyper commit a211c27b9f7386f8e43419ec22b88403498da26e
author nml
date Mon, 20 Mar 2023 20:16:56 +0000
parents
children 2c353e0dacae
files spatyper.xml test-data/input.fasta test-data/output.txt test-data/sparepeats.fasta
diffstat 4 files changed, 2594 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/spatyper.xml	Mon Mar 20 20:16:56 2023 +0000
@@ -0,0 +1,64 @@
+<tool id="spatyper" name="Generate spa type identification" version="@VERSION@+galaxy0" profile="21.01">
+    <macros> <!-- one token feeds both the tool version above and the package pin below -->
+        <token name="@VERSION@">0.3.3</token>
+    </macros>
+    <requirements>
+        <requirement type="package" version="@VERSION@">spatyper</requirement>
+    </requirements>
+    <command detect_errors="aggressive"> <![CDATA[
+        spaTyper -f '${input1}' -r '${input2}' > '${output1}'
+    ]]> </command> <!-- stdout (spaTyper's progress log plus the results table) becomes output1. No -o file is passed, so spaTyper locates or downloads spatypes.txt itself, as its help below describes. -->
+    <inputs>
+        <param type="data" name="input1" format="fasta" label="SPA Fasta file" help="Staphylococcus aureus - staphylococcal protein A fasta file. This will be assigned a type based on its repeat region."/>
+        <param type="data" name="input2" format="fasta" label="Repeats Library Multifasta" help="A multifasta representing a set of known repeat regions found in staphylococcal protein A. This can be downloaded at (http://spa.ridom.de/dynamic/sparepeats.fasta)"/>
+    </inputs>
+    <outputs>
+        <data name="output1" format="txt" />
+    </outputs>
+    <tests> <!-- fixtures live in test-data/; the expected repeats and type match the results row in test-data/output.txt -->
+        <test>
+            <param name="input1" value="input.fasta"/>
+            <param name="input2" value="sparepeats.fasta"/>
+            <output name="output1">
+                <assert_contents>
+                    <has_text_matching expression="99-20-69-31-70-13-17-16-16-16-16\s+t11215" />
+                </assert_contents>
+            </output>
+        </test>
+    </tests>
+    <help><![CDATA[
+::
+
+    USAGE: spaTyper [-h] [-r REPEAT_FILE] [-o REPEAT_ORDER_FILE] [-d FOLDER] [-f FASTA [FASTA ...]] [-g GLOB] [-e] [--output OUTPUT] [--version] [--debug] [--info]
+
+    spaTyper.py: Get spa types
+
+    Version: 0.3.3
+    License: GPLv3
+    Prints spa type to stdout
+
+    It will download sparepeats.fasta and spatypes.txt to repository directory 
+    if files not provided or already in directory. It can be loaded as a python
+    module. Python 3 version only.
+
+    Options: -h     show this help message and exit
+             -r     REPEAT_FILE (http://spa.ridom.de/dynamic/sparepeats.fasta)
+             -o     REPEAT_ORDER_FILE (http://spa.ridom.de/dynamic/spatypes.txt)
+             -d     Folder to save downloaded files from Ridom/Spa server
+             -f     List of one or more fasta files.
+             -g     Uses unix style pathname expansion to run spa typing on all files. If your shell autoexpands wildcards use -f.
+             -e     Do PCR product enrichment. [Default: False]
+
+    ]]></help>
+    <citations>
+        <citation type="bibtex">
+@misc{githubspatyper,
+  author = {HCGB},
+  year = {2020},
+  title = {spaTyper},
+  publisher = {GitHub},
+  journal = {GitHub repository},
+  url = {https://github.com/HCGB-IGTP/spaTyper},
+}</citation>
+    </citations>
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input.fasta	Mon Mar 20 20:16:56 2023 +0000
@@ -0,0 +1,16 @@
+>AJ829762.1 Staphylococcus aureus subsp. aureus partial spa gene for protein A
+TGCTGCGCAACACGATGAAGCTCAACAAAATGCTTTTTATCAAGTGTTAAATATGCCTAACTTAAACGCT
+GATCAACGTAATGGTTTTATCCAAAGCCTTAAAGATGATCCAAGCCAAAGTGCTAACGTTTTAGGTGAAG
+CTAAAAAACTTAATGACTCTCAAGCTCCAAAAGCTGATGCGCAACAAAATAACTTCAACAAAGATCAACA
+AAGCGCCTTCTATGAAATTTTGAACATGCCTAACTTAAACGAAGCGCAACGCAATGGTTTCATTCAAAGT
+CTTAAAGACGATCCAAGCCAAAGCACTAACGTTTTAGGTGAAGCTAAAAAATTAAATGAATCTCAAGCAC
+CGAAAGCTGACAACAATTTCAACAAAGAACAACAAAATGCTTTCTATGAAATCTTGAACATGCCTAACTT
+GAACGAAGAACAACGCAATGGTTTCATCCAAAGCTTAAAAGATGACCCAAGTCAAAGTGCTAACCTATTG
+TCAGAAGCTAAAAAGTTAAATGAATCTCAAGCACCGAAAGCTGATAACAAATTCAACAAAGAACAACAAA
+ATGCTTTCTATGAAATCTTACATTTACCTAACTTAAACGAAGAACAACAAAATGCTTTCTATGAAATTTT
+ACATTTACCTAACTTAACTGAAGAACAACGTAACGGCTTCATCCAAAGCCTTAAAGACGATCCTTCAGTG
+AGCAAAGAAATTTTAGCAGAAGCTAAAAAGCTAAACGATGCTCAAGCACCAAAAGAGGAAGACAATAACA
+AGCCTAGTAAAGAAGACAACAACAAACCTGGCAAAGATGACGGCAACAAGCCTGGTAAAGAAGATGGCAA
+CAAACCTGGCAAAGATGACGGCAACAAACCTGGTAAAGAAGACAACAACAAACCTGGTAAAGAAGACGGC
+AACAAGCCTGGTAAAGAAGACGGCAACAAACCTGGTAAAGAAGACGGCAACAAACCTGGTAAAGAAGACG
+GCAACAAACCTGGTAAAGAAGACGGCAACAAACCTGGTAAAGAAGACGGCA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output.txt	Mon Mar 20 20:16:56 2023 +0000
@@ -0,0 +1,10 @@
+Start the identification of repeats in Spa protein:
++ Repeats fasta file provided:  ~/tools/spaTyper/test-data/sparepeats.fasta
++ Check or download repeats types file in folder:  ~/planemo/bin
+	A previous download created spatypes.txt on: 2023-03-15 17:43:58
+
+-----------------
+Results:
+Sequence name	Repeats	Type
+AJ829762.1 Staphylococcus aureus subsp. aureus partial spa gene for protein A	99-20-69-31-70-13-17-16-16-16-16	t11215
+-----------------
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sparepeats.fasta	Mon Mar 20 20:16:56 2023 +0000
@@ -0,0 +1,2504 @@
+>r01
+GAGGAAGACAACAACAAGCCTAGC
+
+>r02
+AAAGAAGACAACAAAAAACCTGGC
+
+>r03
+GAGGAAGACAATAACAAACCTGGT
+
+>r04
+GAGGAAGACAATAACAAGCCTGGT
+
+>r05
+AAAGAAGACAACAAAAAGCCTGGC
+
+>r06
+AAAGAAGACGGCAAAAAACCTGGC
+
+>r07
+GAGGAAGACAACAACAAACCTGGT
+
+>r08
+GAGGAAGACAACAACAAGCCTGGT
+
+>r09
+GAGGAAGACGGCAACAAACCTGGT
+
+>r10
+AAAGAAGACAATAACAAGCCTGGT
+
+>r11
+GAGGAAGACAATAACAAGCCTGGC
+
+>r12
+AAAGAAGACAACAACAAGCCTGGT
+
+>r13
+AAAGAAGACAACAACAAACCTGGT
+
+>r14
+GAGGAAGACAACAACAAACCTGGC
+
+>r15
+GAGGAAGACAACAACAAGCCTGGC
+
+>r16
+AAAGAAGACGGCAACAAACCTGGT
+
+>r17
+AAAGAAGACGGCAACAAGCCTGGT
+
+>r18
+AAAGAAGATGGCAACAAGCCTAGT
+
+>r19
+AAAGAAGACAATAACAAGCCTGGC
+
+>r20
+AAAGAAGACAACAACAAACCTGGC
+
+>r21
+AAAGAAGACAACAACAAGCCTGGC
+
+>r22
+AAAGAAGACGGCAACAAGCCTGGC
+
+>r23
+AAAGAAGACGGCAACAAACCTGGC
+
+>r24
+AAAGAAGATGGCAACAAGCCTGGT
+
+>r25
+AAAGAAGATGGCAACAAACCTGGT
+
+>r26
+GAGGAAGACAACAAAAAACCTGGT
+
+>r28
+AAAGAAGATGGTAACAAACCTGGC
+
+>r29
+AAAGAAGACAACAAAAAGCCTAGC
+
+>r30
+AAAGAAGACGGCAACAAAAAACCTGGT
+
+>r31
+AAAGAAGATGGCAACAAACCTGGC
+
+>r32
+AAAGAAGACAGCAACAAGCCTGGC
+
+>r33
+AAAGAAGATGGCAACAAGCCTGGC
+
+>r34
+AAAGAAGACAACAAAAAACCTGGT
+
+>r35
+GAGGAAGACAACAAAAAACCTGGC
+
+>r36
+AAAGAAGACAACAAAAAGCCTGGT
+
+>r37
+AAAGAAGACGGCAACAACAAACCTGGC
+
+>r38
+AAAGAAGACTACAAAAAACCTGGT
+
+>r39
+AAAGAAGACAGCAACAAACCTGGT
+
+>r41
+CAAGAAGACGGCAACAAGCCTGGT
+
+>r42
+AAAGAAGACAACATCAAACCTGGT
+
+>r43
+AAAGAAGACGGTAACAAACCTGGT
+
+>r44
+AAAGAAGACAACAAGCCTGGT
+
+>r45
+AAAGAAGATGGCAACAGACCTGGC
+
+>r46
+AAACAAGACAACAAAAAACCTGGT
+
+>r47
+AAAGAAGACAACAACAAAAAACCTGGC
+
+>r48
+CAAGAAGACAACAACAAGCCTGGT
+
+>r49
+GAGGAAGACAACAAACCTGGC
+
+>r50
+AAAGAAGACGGCAACAAGCCTAGT
+
+>r51
+AAAGAAGACAACAAACCTGGT
+
+>r52
+AAAGAAGACAACAAAAAACTTGGC
+
+>r53
+AAAGAAGACGTCAACAAACCTGGC
+
+>r54
+AAAGAAGACAACAAGCCTGGC
+
+>r55
+CAAGAAGACAACAACAAACCTGGC
+
+>r56
+AAGGAAGACAACAACAAGCCTGGT
+
+>r57
+AAAGAAGACAACAATAAGCCTGGC
+
+>r58
+AAAGAATACGGCAACAAGCCTGGT
+
+>r59
+AAAGAAGACAGTAACAAACCTGGC
+
+>r60
+GAGGAAGACAACAAACCTGGT
+
+>r61
+AAAGGAGATGGCAACAAGCCTGGC
+
+>r62
+AAAGAAGACGGCAATAAACCTGGC
+
+>r63
+GAGGAAAACAACAACAAGCCTGGT
+
+>r64
+AAAGAAGACAATAAAAAACCTGGT
+
+>r65
+AAAGAAGATGGCAAAAAACCTGGT
+
+>r66
+AAAGAAGACAGCAACAAGCCTGGT
+
+>r68
+AAAGAAGACGGTAACAAGCCTGGT
+
+>r69
+AAAGATGACGGCAACAAGCCTGGT
+
+>r70
+AAAGATGACGGCAACAAACCTGGT
+
+>r71
+AAAGAAGATGGAAACAAGCCTGGT
+
+>r72
+AAAGAATACAACAACAAGCCTGGT
+
+>r73
+AAAGAAGATAACAACAAGCCTGGC
+
+>r74
+AATGAAGATGGCAACAAGCCTGGC
+
+>r75
+AAAGAAGATGGTAACAAACCTGGT
+
+>r76
+AAAGAAGACGACAACAAACCTGGT
+
+>r77
+AAAGAAGACGGCAACAAGCCTGAT
+
+>r78
+AAAGAATACGGCAACAAACCTGGT
+
+>r80
+AAAGAAGACAACAATAAACCTGGT
+
+>r81
+AAAGAAGACAGCAAAAAACCTGGT
+
+>r82
+AAAGAAGACAGCAACAAACCTGGC
+
+>r83
+AAAGAAGACGGCAAAAAACCTGGT
+
+>r84
+AAAGAAGATGGCAACAAACCTGAC
+
+>r85
+AAAGAAGACGGCAATAAACCTGGT
+
+>r86
+AAAGAAGACGACAAAAAACCTGGC
+
+>r87
+AAAGAAGATGGCAACAAGCCTGAT
+
+>r88
+AAAGAAGACGGCAGCAAGCCTGGT
+
+>r89
+GAAGAAGACGGCAACAAACCTGGT
+
+>r90
+AAAGAAGGCAACAAAAAACCTGGT
+
+>r91
+AAATAAGACAACAAAAAACCTGGT
+
+>r92
+AAAGAAGACAACAACAAACATGGC
+
+>r93
+CAAGAAGACAACAACAAGCCTGGC
+
+>r94
+CAAGAAGACAACAACAAACCTGGT
+
+>r95
+GAGGAATACAATAACAAGCCTGGC
+
+>r96
+AAAGAAGACGGCAACAAAACTGGT
+
+>r97
+AAAGAAGACACCAACAAGCCTGGT
+
+>r98
+AAAAAAGACGGCAACAAACCTGGT
+
+>r99
+GAGGAAGACAATAACAAGCCTAGT
+
+>r100
+AAAGAAGACAACAAAAAACCTGAC
+
+>r101
+AAATAAGACAACAACAAGCCTGGT
+
+>r102
+AAAGAAGACAACAACAAACCTGAT
+
+>r103
+AAAGAAGACGGCAACAAACCTGGG
+
+>r104
+AAAGAAGGCGGCAACAAACCTGGT
+
+>r105
+AAAGAAGATAACAAAAAACCTGGT
+
+>r106
+GAGCAAGACAACAACAAGCCTGGT
+
+>r107
+AAAGAAGACGGCAACAAACCTGAC
+
+>r108
+AAAAAAGACAACAACAAACCTGGT
+
+>r109
+AAAGAAGACGGCAACAAACCTAGC
+
+>r110
+AAAGAAGACGACAACAAGCCTGGT
+
+>r111
+AAAGAAGATGGCAACAAACTTGGT
+
+>r112
+AAAGAAGATGGAAACAAGCCTGGC
+
+>r113
+AAAGAAGACAACAAAAAACCCGGT
+
+>r114
+AAAGAAGACGGTAACAAACCTGGC
+
+>r115
+AAAGAAGACAACAAAAAGCCTACC
+
+>r116
+AAATAAGACAATAACAAGCCTGGC
+
+>r117
+AAAGAAGATGGTAACAAGCCTGGT
+
+>r118
+AAAGAAGACGTCAACAAGCCTGGT
+
+>r119
+AAATAAGACGGCAACAAGCCTGGT
+
+>r120
+AAAGAAGACAACAAAAAACCTGAT
+
+>r121
+GAGGAAGACAACAAGCCTGGT
+
+>r122
+GAGGAAGACAACAAAAAACCTGGA
+
+>r123
+GAGGAAGACAACAACAATCCTGGC
+
+>r124
+GAGGAAGGCAACAAAAAACCTGGT
+
+>r125
+GAGGAAGACGGCAACAAACCTGGC
+
+>r126
+GAGGAAGACAACAAAAAGCCTAGC
+
+>r127
+AAAGAAGACAACAAAAAACCTGTC
+
+>r128
+AAAGAAGACAACAACAAGCCTAGT
+
+>r129
+AAAGAACACAACAAAAAACCTGGT
+
+>r130
+AAAGAAGACGGCAACAAGTCTGGT
+
+>r131
+AAAGAAGACAACAACAAGCTTGGC
+
+>r132
+AAAGAAGACGGCAACAAGCCTAGC
+
+>r133
+AAAAAAGACGGCAACAAGCCTGGT
+
+>r134
+AAAGAAGGCAACAAGCCTGGC
+
+>r135
+GAGGAAGACAACAAAAAGCCTGGT
+
+>r136
+GAGGAAGACAACAACAAATCTGGT
+
+>r137
+GAGGAAGGCAATAACAAGCCTGGC
+
+>r138
+AAAGAAGACAACAAAAAACTTGGT
+
+>r139
+AAAGAAGACAACAACAACCCTGGT
+
+>r140
+GGAGAAGACAACAAAAAACCTGGT
+
+>r141
+AAAGAAGACGGCAACCAGCCTGGT
+
+>r142
+GAGAAAGACAACAACAAGCCTAGC
+
+>r143
+AAAGAAGACAACAAAAAGCCTAGT
+
+>r144
+AAAGAAGACACCAACAAACCTGGT
+
+>r145
+AAAGAAGACGGCAACAAGCCTGGA
+
+>r146
+AAAGAAGATGGTAACAAACCTGGA
+
+>r147
+AAAGAATACAACAAAAAACCTGGT
+
+>r148
+AAAGAAGACAACAACAAGACTGGT
+
+>r149
+AAAGAAGACGGCAACAATCCTGGT
+
+>r150
+AAAGAAGAAGGCAACAAACCTGGT
+
+>r151
+AAAGAAGACGGCAAGAAGCCTGGT
+
+>r152
+AAAGAAGACAACAACAACAAGCCTGGC
+
+>r153
+AAAGAAGATGGCAATAAGCCTGGT
+
+>r154
+AAAGAAGACAACAAAAAACCTGTA
+
+>r155
+AAAGAAGACGGCAACAAGCCTTGT
+
+>r156
+AAAGAAGACAACAACAAGCCTAGC
+
+>r157
+AAAAAAGACAACAAAAAACCTGGC
+
+>r158
+AAAGAAGACGGAAACAAACCTGGT
+
+>r159
+AAAGAAGACAACAAAAAACCTAGC
+
+>r160
+GAGGAAGACAACAAAAAGCCTGGC
+
+>r161
+AAAGAAGAGGGCAACAAGCCTGGT
+
+>r162
+AAAGAAGATAGCAACAAACCTGGT
+
+>r163
+GAGGAAGACAACTACAAGCCTGGT
+
+>r164
+GAGGAAGACGGCAACAAGCCTGGT
+
+>r165
+AAAGAAGACGGCAACAAAGCTGGC
+
+>r166
+AAAGAAGACGTCAACAAACCTGGT
+
+>r167
+AAAGAAGACGGCAACAAAAAGCCTAGC
+
+>r168
+AAAGAAGATGGCAACCAGCCTGGC
+
+>r169
+AAAGAAGACGACAAAAAGCCTAGC
+
+>r170
+AAAGAAGATCGCAACAAACCTGGT
+
+>r171
+AAAGAAGACGGGAACAAACCTGGC
+
+>r172
+AAAGGAGACAACAAAAAACCTGGT
+
+>r173
+CAAGAAGACAACAAAAAACCTGGT
+
+>r174
+AAAGAAGATAACAACAAGCCTGGT
+
+>r175
+AAAGAAGATAGCAACAAACCTGGC
+
+>r176
+AAAGAAGACGGCAACGGCAACAAACCTGGC
+
+>r177
+AAAGAAGACAACAGAAAACCTGGT
+
+>r178
+AAAAAAGACAACAACAAGCCTGGT
+
+>r179
+AAAAAAGACAACAACAAGCCTGGC
+
+>r180
+AAAGAAGATGACAACAAGCCTGGT
+
+>r181
+AAAGAAGACGGCATCAAACCTGGT
+
+>r182
+AAAGAAGACACCAAAAAACCTGGC
+
+>r183
+AAAGAAGACAACAACAAACCTAGC
+
+>r184
+AAAGAAGAAAACAACAAGCCTGGT
+
+>r185
+AAAGAAGACAACAAAAAACATGGC
+
+>r186
+GAGGAAGATAACAACAAACCTGGT
+
+>r187
+AAAGAAGACGGCAACTAACCTGGC
+
+>r188
+CAAGAAGACGGCAACAAACCTGGT
+
+>r189
+AAAGAAGATAACAAGCCTGGT
+
+>r190
+TAGGAAGACAACAACAAGCCTGGC
+
+>r191
+AAAGAAGATGCCAACAAGCCTAGT
+
+>r192
+AAAGAAGACAACTACAAACCTGGT
+
+>r193
+GAGGAAGACAACAACAAGCCTAGT
+
+>r194
+AAAGAAGACAACAAAAAAACTGGT
+
+>r195
+AAAGAAGACGGCAACAAGCCTCGT
+
+>r196
+AAAGAAGACAACAACAAGCCTGCC
+
+>r197
+AAAGAAGACAACAACAATCCTGGC
+
+>r198
+AAAGAAGACAATAACAAGCCAGGC
+
+>r199
+GAAGAAGACAACAAAAAACCTGGT
+
+>r200
+AAAGAAGACAATAACAGGCCTGGC
+
+>r201
+AAAGGAGACAACAACAAACCTGGC
+
+>r202
+AAAGAAGACGACAACAAACCTGGC
+
+>r203
+AAAGAAGGCAACAACAAACCTGGT
+
+>r204
+AAAGAAGACAACAAAAAACATGGT
+
+>r205
+AAAGAAGACGGCAAAAAGCCTAGC
+
+>r206
+AAAGAAGACAACAACAATCCTGGT
+
+>r207
+AAAGAAGACGATAACAAGCCTGGT
+
+>r208
+AAAGAAGATAACAAAAAACCTGGC
+
+>r209
+AAAGAAGACAACAACAAGTCTGGC
+
+>r210
+GAGGAAGACAACAACAATCCTGGT
+
+>r211
+AAAGAAGACGGCAACAAGCCCGGT
+
+>r212
+AAAGAAGACGACAAAAAACCTGGT
+
+>r213
+AAAGAAAACAACAACAAACCTGGT
+
+>r214
+AAAGAAGAAGACAACAAGCCTGGT
+
+>r215
+AAAGAAGACAACAACAAGCCTGAT
+
+>r216
+AAAGAAGACAACGAAAAACCTGGT
+
+>r217
+AAAGAAGATGGCAACAAAAAGCCTGGC
+
+>r218
+AAAGAAGAGAACAACAAACCTGGT
+
+>r219
+AAAGAAGACGGCAACAAACTTGGC
+
+>r220
+AAAGAAGCCGGCAACAAACCTGGT
+
+>r221
+GAGGAAGACAACAACAAGCCTGAC
+
+>r222
+AAAGAAGACAACAAAAAATCTGGT
+
+>r223
+AAAGAAGACGGCAACAAACCCGGC
+
+>r224
+AAAGAAGACAACAAAAATCCTGGC
+
+>r225
+AAAGAAGACGGCAACAAGACTGGT
+
+>r226
+AAAGAAGACAAAAAAAAACCTGGT
+
+>r227
+AAAGAAGATGGCAACAAACCCGGT
+
+>r228
+AAAGAAGACAATAACAAACCTGGT
+
+>r229
+AAAGAAGAAGGCAACAAACCTGGC
+
+>r230
+AAAGAAGATGGCAACAAGTCTGGT
+
+>r231
+AAAGAAGATGGTAACAAACCTCGC
+
+>r232
+AAAGAAGACAACAAAAAAACTGGC
+
+>r233
+GAGGAAGACAACAAAAAAACTGGT
+
+>r234
+GAGGAAGACAGCAACAAACCTGGT
+
+>r235
+AAAGAAGACAACAAAAAACCCGGC
+
+>r236
+CAAGAAGACGGCAACAAACCTGGC
+
+>r237
+AAAGAAGACAACGACAAGCCTGGT
+
+>r238
+AAAGAAGATGGCAACAAGCCTAGC
+
+>r239
+AAAGAAGATGGCTACAAACCTGGC
+
+>r240
+GAGGAAGACAGCAAAAAACCTGGT
+
+>r241
+AAATAAGACGGCAACAAACCTGGT
+
+>r242
+AAAGAAGACGGCAACAAACCTGTT
+
+>r243
+AAATAAGACAACAAAAAACCTGGC
+
+>r244
+AAAGAAGACGGCAACAAATCTGGC
+
+>r245
+GAGGAAGACAACAACAAGCTTGGC
+
+>r246
+AAAGAATATGGCAACAAACCTGGC
+
+>r247
+AAAGAAGATGGCAACAAATCTGGT
+
+>r248
+AAAAAAGACGGCAACAAGCCTGGC
+
+>r249
+AAAGAAGATGGTAACAAGCCTGGC
+
+>r250
+AAAGAAGATGGTAACAAACCTGCA
+
+>r251
+GAGGAAGACAACAAAAAACCTGAT
+
+>r252
+AAAGAGGATGGTAACAAACCTGGC
+
+>r253
+TAAGAAGACGGCAACAAACCTGGC
+
+>r254
+AAAGAAAACAACAAAAAACCTGGT
+
+>r255
+GAGGGAGACAATAACAAGCCTGGT
+
+>r256
+AAAGAAGACAACAAAAAACCTAGT
+
+>r257
+AAAGAAGACAACAACAAACCAGGC
+
+>r258
+GAAGAAGACAATAACAAGCCTGGT
+
+>r259
+GATGAAGACAACAACAAGCCTGGT
+
+>r260
+AAAGAAGACTCCAACAAACCTGGT
+
+>r261
+AAAGAGGACGGCAACAAGCCTGGT
+
+>r262
+AAAGAAGACGGCAAAAAGCCTGGC
+
+>r263
+AAAGAAGACAACAAAAAATCTGGC
+
+>r264
+AAAGAAGACGACAACAAGCCTGGC
+
+>r265
+AAAGAAGACGGCAACAAACCTGAT
+
+>r266
+AAAGAAGACGGCAACAAACCTGTC
+
+>r267
+AAAGAAGATAACAACAAACCTGGC
+
+>r268
+GAGGAAGACAACAATAAACCTGGT
+
+>r269
+AAAGAGGACAACAACAAGCCTGGC
+
+>r270
+AAAGAAGGCGGCAACAAGCCTGGT
+
+>r271
+AAATAAGACAGCAACAAACCTGGT
+
+>r272
+CAAGAAGACGGCAACAAGCCTGGC
+
+>r273
+AAAGAAGACGGCAACAAACCTGGA
+
+>r274
+AAAGAAGACGGCAACAAACCTGTA
+
+>r275
+AAAGAAGACGGCAACAAACTTGGT
+
+>r276
+AATGAAGACGGCAACAAGCCTGGT
+
+>r277
+CAAGAAGACGACAACAAGCCTGGT
+
+>r278
+GAGGAAGACAACAACAAGCCAGGT
+
+>r279
+AAAGAAAATGGCAACAAACCTGGT
+
+>r280
+AAAGAAGATGGTAACAAACCTAGC
+
+>r281
+AAAGAAGATGGCAACAAACCTGAT
+
+>r282
+AAAGAAGACAACAACAAACCTGGA
+
+>r283
+GAGGAAGACAACAACAAACTTGGT
+
+>r284
+AAAGAAGACAACAAAAAACCTGCC
+
+>r285
+AAAGAAGATGGCAACAAACCTAGT
+
+>r286
+AAAAAAGACAACAAAAAACCTGGT
+
+>r287
+AAAGAAGACGGCAACAAGCTTGGT
+
+>r288
+AAGGAAGACAATAACAAGCCTGGT
+
+>r289
+AAAGAAGAAAACAAAAAACCTGGT
+
+>r290
+CAAGAAGATGGTAACAAACCTGGC
+
+>r291
+AAAGTAGACGGCAACAAGCCTGGT
+
+>r292
+GAGGAAGACAACAACAAAAAACCTGGC
+
+>r293
+AAAGAAGACGGCAATAAGCCTGGT
+
+>r294
+AAAGAAGATGGCAACATACCTGGT
+
+>r295
+AAAGAAGATGGCAACAAACCTAGC
+
+>r296
+AAAGAAGATGGCAACAAAAAACCTGGC
+
+>r297
+AAAGAAGACGGAAACAAGCCTGGT
+
+>r298
+AAAGAAAACGGCAACAAGCCTGGT
+
+>r299
+GATGAAGACAACAACAAACCTGGC
+
+>r300
+GAGAAAGACAACAAAAAACCTGGT
+
+>r301
+AAAGAAGACAACAACAAGTCTGGT
+
+>r302
+GAGAAAGACAACAACAAGCCTGGC
+
+>r303
+AAAGAGGACGGCAACAAACCTGGT
+
+>r304
+AAAGAAAACGGCAACAAACCTGGC
+
+>r305
+GAGGAAGACAACAACAAGCGTGGC
+
+>r306
+AAAGAAGATGGGAACAAGCCTGGC
+
+>r307
+AAAGAAGACGGCAACAACCCTGGT
+
+>r308
+AAAGAAGACAACAAAAATCCTGGT
+
+>r309
+AAAGAAGACGCCAACAAGCCTGGT
+
+>r310
+AAAGAAGATGGCAACAATCCTGGC
+
+>r311
+AAAGAAGATGACAACAAACCTGGT
+
+>r312
+AAAGAAGATAGTAACAAACCTGGC
+
+>r313
+AAAGAAGGCAACAACAAGCCTGGT
+
+>r314
+AAAGAAAACGGCAACAAACCTGGT
+
+>r315
+CAAGAAGACAACAAAAAACCTGGC
+
+>r316
+GAGGAAGACAACAAAAATCCTGGT
+
+>r317
+GAGTAAGACAACAAAAAACCTGGT
+
+>r318
+CAAGAAGATGGCAACAAGCCTGGC
+
+>r319
+AAAGAAGATGGCAACAAGCCTCGC
+
+>r320
+AAAGAAGATGGCAACAAGCCCGGT
+
+>r321
+AAAGAAGGCGGTAACAAACCTGGT
+
+>r322
+AAAGAAGACAACAACAAGCTTGGT
+
+>r323
+AAAGAAGACTGCAACAAGCCTGGT
+
+>r324
+TAGGAAGACAACAACAAGCCTGGT
+
+>r325
+AAAGAAGACTACAAAAAACCTGGC
+
+>r326
+AAAGAAGATGGAAACAAACCTGGT
+
+>r327
+AAAGAAGACGGCAACAAACATGGT
+
+>r328
+AAAGATGGCAACAAACCTGGT
+
+>r329
+AAAGAAGACAACAACAACAAACCTGGT
+
+>r330
+AAAGAAGACAACAGCAAGCCTGGT
+
+>r331
+GAAGAAGACGGCAACAAGCCTGGT
+
+>r332
+AAAGAATATGGCAACAAACCTGGT
+
+>r333
+CAGGAAGACAATAACAAGCCTGGC
+
+>r334
+GAAGAAGATGGCAACAAGCCTGGC
+
+>r335
+GAGGAAGACGGCAACAAACCTAGT
+
+>r336
+GAGGAAGATAACAACAAGCCTGGC
+
+>r337
+AAAGAAGACCGCAACAAACCTGGT
+
+>r338
+AAAGAAGACCACAACAAGCCTGGT
+
+>r339
+AAAGAAGACTACAACAAACCTGGT
+
+>r340
+AAAGAAGACAGCAAAAAGCCTAGC
+
+>r341
+GAGGAAGACAATAATAAGCCTGGT
+
+>r342
+AAAGAAGACGGCAACAAATCTGGT
+
+>r343
+AAAGAAGATGGCAACAAGCCAGGT
+
+>r344
+GAGGAAGGCAACAACAAGCCTGGC
+
+>r345
+GAGGAAGACAACAACAAACCAGGT
+
+>r346
+AAAGAAGACTACAACAAGCCTGGT
+
+>r347
+AAAGAAGACAACAAAAAGTCTAGC
+
+>r348
+AAAGAAGATGGCAACAGACCTGGT
+
+>r349
+AAAGAAGATGGCAGCAAGCCTGGT
+
+>r350
+AAAGAAGATGGTAACAAGCCTAGT
+
+>r351
+AAAGAAGACAACAAACCTGGC
+
+>r352
+GAGGAAGACATTAACAAGCCTGGC
+
+>r353
+GAGGAAGACAACAACAAGTCTGGT
+
+>r354
+AAAGAAGACAACAAAAACCCTGGT
+
+>r355
+AAAGAAGACGGCAACAAACCTTGC
+
+>r356
+GAGGCAGACAATAACAAACCTGGT
+
+>r357
+AAAGAAGATGGCAAAAAACCTGGC
+
+>r358
+AAAGAAGGCGGCAACAAACCTGGC
+
+>r359
+AAAGAAGATGGCGACAAACCTGGT
+
+>r360
+AAAGAAGATGGCAACAACCCTGGT
+
+>r361
+GAGGAAGACAGCAACAAGCCTGGT
+
+>r362
+AAGGAAGACGGCAACAAGCCTGGT
+
+>r363
+AAAGAAGATGGCAATAAACCTGGT
+
+>r364
+GAGGAAGACAATAACAAGCCTAGC
+
+>r365
+GAAGAAGATGGCAACAAGCCTGGT
+
+>r366
+AAAGAAGACCGCAACAAACCTGGC
+
+>r367
+AATGAAAACGGCAACAAGCCTGGT
+
+>r368
+AATGAAGACGGCAACAAACCTGGC
+
+>r369
+ACAGAAGACGGCAACAAACCTGGT
+
+>r370
+GATGAAGACAACAAGCCTGGT
+
+>r371
+AAAGAAGATAACAACAAACCTGGT
+
+>r372
+AAAGAAGATAGCAACAAGCCTGGT
+
+>r373
+GAGGAAGACGGCAAAAAACCTGGT
+
+>r374
+AAAGAAGACACCAACAAACCTGGC
+
+>r375
+AAAGAAGACGGCAACAATCCTGGC
+
+>r376
+GAGGAAGACAATAACAAGCCTGCC
+
+>r377
+AAAGAAAACAACAACAAACCTGGC
+
+>r378
+GAGGAAGACAACAACAAGCCCGGC
+
+>r379
+AAAGCAGACAACAAAAAACCTGGT
+
+>r380
+AAAGAAGACAACAACTAGCCTGGT
+
+>r381
+GAGGAAGACAACAACAAACCCGGC
+
+>r382
+AAAGAAGACGGCAACAAGCCAGGT
+
+>r383
+AAAGAAGACAACAAAAAACCAGGT
+
+>r384
+AAAGAAGATGGCAACAAACCTGTA
+
+>r385
+GAGGAAGACAACAACAAGCCTGAT
+
+>r386
+AAAGAAGACAACAATAAGCCTAGC
+
+>r387
+AGAGAAGACAACAAAAAACCTGGT
+
+>r388
+GAGGAAGATAATAACAAACCTGGT
+
+>r389
+AAAGAAGATAGCAACAAGCCTGGC
+
+>r390
+AAAGAAGATGGTAACAAACCCGGC
+
+>r391
+GAGGAAGATAATAACAAGCCTGGT
+
+>r392
+AAAGAAGACGGCAACATACCTGGT
+
+>r393
+AAAGAAGATGGCAACAAGCCTGCC
+
+>r394
+AAAGAAGATAGCAACAAGCCTAGT
+
+>r395
+AAAGAAGACAACAACAAGCCCGGT
+
+>r396
+AAGGAAGACGGCAACAAACCTGGT
+
+>r397
+AAAGAAGACAACAAAAAACCTCGT
+
+>r398
+GAGGAAGACAATAACAATCCTGGC
+
+>r399
+GAGGAAGATAACAAAAAACCTGGT
+
+>r400
+AAAGAAGACGGCAACAAAAAGCCTGGT
+
+>r401
+GAGGAAGACAACAACAAGCTTGGT
+
+>r402
+GAGGAAGGCAACAACAAGCCTGGT
+
+>r403
+AAGGAAGACAACAAGCCTGGT
+
+>r404
+AAAGAGGACAACAAAAAACCTGGC
+
+>r405
+TAAGAAGACGGCAACAAACCTGGT
+
+>r406
+AAAGAAGACGGCTACAAACCTGGT
+
+>r407
+AAAGAAGACGGTAACAAGCCTGGC
+
+>r408
+AAAGAAGACGGCAATAAGCCTGGC
+
+>r409
+AAGTAAGACAACAAAAAACCTGGT
+
+>r410
+GAGTAAGACAACAACAAGCCTGGC
+
+>r411
+GAGGAAGACACCAACAAGCCTGGT
+
+>r412
+AAGGAAGACAACAACAAGCCTGGC
+
+>r413
+AAAGAAGACAACAACACGCCTGGC
+
+>r414
+AAAGAAGACAACAATAAGCCTGGT
+
+>r415
+AAAGAAGATGGCAACATGCCTGGC
+
+>r416
+AAAGAAGACAACAACCAACCTGGC
+
+>r417
+GAAGAAGATGGCAACAAACCTGGC
+
+>r418
+AAAGAAGATGACAACAAGCCTGGC
+
+>r419
+AAAAAAGATGGCAACAAACCTGGC
+
+>r420
+AAATAAGACAACAACAAACCTGGC
+
+>r421
+AAAGAAGACAACAACAAACCTGTT
+
+>r422
+AAAGAAGACGACAACAACAAGCCTGGT
+
+>r423
+AAATAAGACGGCAACAAACCTGGC
+
+>r424
+AAAGAAGACAACAACACGCCTGGT
+
+>r425
+AAAGAAAACAACAAAAAACCTGGC
+
+>r426
+AAAGAAGACGACAACAAAAAACCTGGT
+
+>r427
+AAAGAAGGCAACAACAAACCTGGC
+
+>r428
+GAGGAAGACAGCAACAAGCCTGGC
+
+>r429
+GAGGAAGACAATAACAAGACTGGC
+
+>r430
+AAAGAATACAACAACAAGCCTGGC
+
+>r431
+AAAGAACACGGCAACAAGCCTGGT
+
+>r432
+AAAGAAGACGGCATCAAACCTGGC
+
+>r433
+AAAGAAGACAACAACAAGCCTCGT
+
+>r434
+AAAGAAAACAACAACAAGCCTGGT
+
+>r435
+AAAGAAGACAGCAAAAAACCTGGC
+
+>r436
+AAAGAAGACTGCAACAAACCTGGT
+
+>r437
+AAAGAAGACAACAACAAGCCTGAC
+
+>r438
+AAAGAAGACGGCAAGAAACCTGGC
+
+>r439
+AAAGAAGACAACAACAAACTTGGT
+
+>r440
+AAAGAAGACGGCAGCAAACCTGGT
+
+>r441
+AAAGAAGATGGAAACAAACCTGGC
+
+>r442
+AAAGAAGACAACAACAAACTTGGC
+
+>r443
+AAATAAGACAACAAAAAGCCTAGC
+
+>r444
+AAAGAAGTCAACAACAAGCCTGGT
+
+>r445
+AAAGAAGACGGCAACAAGCATGGT
+
+>r446
+AAAGAAAATGGCAACAAACCTGGC
+
+>r447
+AAAGAAGACAACAACAAGCCTGGA
+
+>r448
+AAAGAAGATGGCAACAATCCTGGT
+
+>r449
+GGGGAAGACAATAACAAGCCTGGT
+
+>r450
+ACAGAAGACGGCAACAAGCCTGGC
+
+>r451
+AAAGAAGACAACAAAAAGCCTATT
+
+>r452
+AAAGAAGACGGCAACAAACCCGGT
+
+>r453
+AAAGAAGATGGCAACAAAGCTGGC
+
+>r454
+AAAGCAGACAACAAAAAACCTGGC
+
+>r455
+AAAAAAGACGGCAACAAACCTGGC
+
+>r456
+GAGGAAGACAACAACAAGTCTGGC
+
+>r457
+AAAGAAGACAACAAAAAAGCTGGT
+
+>r458
+AAAGAAGACGGCAGCAAACCTGGC
+
+>r459
+AAAGAAGACAACAACAACAAGCCTGGT
+
+>r460
+AAAGAAGACAACAACAAGGCTGGT
+
+>r461
+AAAGAAGACAACAACAAAACTGGT
+
+>r462
+AAAGAAGACATCAACAAACCTGGT
+
+>r463
+AAAGGAGACGGCAACAAACCTGGT
+
+>r464
+AAAGATGACGGCAACAAACCTGGC
+
+>r465
+GAGGAATACAATAACAAGCCTGGT
+
+>r466
+AAAGAAGACGGCAACAAACCTGCC
+
+>r467
+AAAGAAGACAACAAAAAGCCTAAC
+
+>r468
+GAAGAAGACAACAACAAGCCTGGT
+
+>r469
+AAAGAAGACAACAACAAGCATGGC
+
+>r470
+AAAGAAGACAACAAAAGACCTGGT
+
+>r471
+AAAGAAGACAACAAAAAGCCTGAC
+
+>r472
+GAGGAAAACAACAACAAACCTGGC
+
+>r473
+AAAGAAGACGGCAACAGGCCTGGT
+
+>r474
+AAAGAAGACGGCAACAAGCCGGGT
+
+>r475
+AAAGAAGACGGCAACAAACCTAGT
+
+>r476
+AAAGCAGATGGCAACAAACCTGGT
+
+>r477
+AAAGAAGACAACGACAAGCCTGGC
+
+>r478
+GGGGAAGACAACAACAAGCCTGGC
+
+>r479
+GAGGAAGACAATAACAAACCTGGC
+
+>r480
+GCTGACAACAAAAAACCTGGT
+
+>r481
+AAAGAAGATTGCAACAAGCCTGGC
+
+>r482
+AAAGAAGACGGCAACGAGCCTGGT
+
+>r483
+GAGGAAGACAACAACAAGCCGGGC
+
+>r484
+AAAGAAGATTGCAACAAACCTGGT
+
+>r485
+AAAGAAAACAACAAAAAGCCTAGC
+
+>r486
+AAAGAAGACAACAACAAACCTGAC
+
+>r487
+AAAGAAGATGGCAACAAGACTGGT
+
+>r488
+AAAGAAGACAACAACGAGCCTGGT
+
+>r489
+AAATAAGACAATAACAAGCCTGGT
+
+>r490
+AAAGAAGACAACCACAAGCCTGGT
+
+>r491
+AAAGAAGATGGCAACCAGCCTGGT
+
+>r492
+ATAGAAGACAACAACAAGCCTGGC
+
+>r493
+AAAGAAGATGGCAACTAACCTGGT
+
+>r494
+AAAGAAGACAGCAACAAGTCTGGC
+
+>r495
+AAAGAAGACAACAAAAAACCAGGC
+
+>r496
+GAAGAAGACAATAACAAGCCTGGC
+
+>r497
+AAAGAAGACGGCAACAAGGCTGGT
+
+>r498
+AAAGAAGATGGCAACCAACCTGGT
+
+>r499
+GAGGAAGATAATAACAAGCCTGGC
+
+>r500
+AAAGAGGACGGCAACAAACCTGGC
+
+>r501
+AAAGAAGATGGCAACAAACCTGTT
+
+>r502
+AAAGAAGACAACAACAAACCCGGT
+
+>r503
+AAAGAAGACCGCAACAAGCCTGGT
+
+>r504
+AAAGAAGATGGCAACAAACCCGGC
+
+>r505
+AAAGAATACAACAAAAAACCTGGC
+
+>r506
+AAAGAAGACGGCATCAAGCCTGGT
+
+>r507
+AAAGAAGACAACAACCCTGGT
+
+>r508
+GAGGAAGACAACAAAAAACCTAGC
+
+>r509
+AGAGAAGATGGCAACAAACCTGGT
+
+>r510
+AAAGAAGGTGGCAACAAACCTGGT
+
+>r511
+AAAGAAGATGTCAACAAGCCTGGT
+
+>r512
+AAAGAAGATAACAAAAAGCCTGGC
+
+>r513
+AAAGAAGACTGCAACAAACCTGGC
+
+>r514
+AAAGAAGACAAGAACAAGCCTGGT
+
+>r515
+AAAGAAGATGGCAACAAGCTTGGT
+
+>r516
+GAGGAAGACAACAACAAACCTGTT
+
+>r517
+AAAGAAGACTCCAACAAACCTGGC
+
+>r518
+AAAGAAGATGGCAAAAAGCCTAGC
+
+>r519
+AAAGAAGACAACAGCAAGCCTGGC
+
+>r520
+AGAGAAGACGGCAACAAACCTGGT
+
+>r521
+GAGGAAGACAACAACAAGCCTGCC
+
+>r522
+AAAGAAGACAACAATAAACCTGGC
+
+>r523
+AAATAAGATGGCAACAAACCTGGT
+
+>r524
+GAGAAAGACAATAACAAGCCTGGC
+
+>r525
+AAAGAAGATGGCAACAAAACTGGT
+
+>r526
+AAAGAAGACGCCAACAAACCTGGT
+
+>r527
+AAAGAATATGGCAACAAGCCTGGT
+
+>r528
+AAAGAAGACAACCAAAAACCTGGC
+
+>r529
+AAAGAAGGTGGTAACAAACCTGGC
+
+>r530
+GAGGAGGACAATAACAAGCCTGGT
+
+>r531
+AAAGTAGATGGTAACAAACCTGGC
+
+>r532
+AAAGAAGACAACAAAAAACCGGGT
+
+>r533
+AAAGAATACGGCAACAAACCTGGC
+
+>r534
+AAAAAAGATGGTAACAAACCTGGC
+
+>r535
+GAGGAAGACAACAATAAGCCTGGT
+
+>r536
+AAAGAAGAGGGCAACAAACCTGGC
+
+>r537
+AAATAAGACAACAACAAGCCTGGC
+
+>r538
+AAAGGAGACAACAACAAGCCTGGT
+
+>r539
+AAAGAAGACAACAACAAACCACCT
+
+>r540
+AAAGAAAACGGCAACAAGCCTGGC
+
+>r541
+GAGAAAGACAACAACAAACCTGGT
+
+>r542
+AAAGAAGACAACAACGAACCTGGT
+
+>r543
+AAAGAAGATGGCAACAAAAAACCTGGT
+
+>r544
+GAGGAAGACGGCAAAAAACCTGGC
+
+>r545
+GAGGAAGGCAACAAACCTGGT
+
+>r546
+AAAGAAGACAACAAGAAACCTGGT
+
+>r547
+AAAGAAGATAACAAAAAGCCTAGC
+
+>r548
+GAGAAAGACGGCAACAAACCTGGT
+
+>r549
+AAGGAAGACAACAAAAAACCTGGT
+
+>r550
+GAAGAAGATGGTAACAAACCTGGC
+
+>r551
+GAGGAAGACAAAAACAAGCCTGGC
+
+>r552
+AACGAAGATGGCAACAAGCCTGGC
+
+>r553
+AAAGAAGACAACAACCAGCCTGGT
+
+>r554
+AAATAAGACAACAACAAACCTGGT
+
+>r555
+GAGGAAGACACTAACAAGCCTGGT
+
+>r556
+AAAGAAGACGATAACAAGCCTGGC
+
+>r557
+AAAGAAGACATCAACAAGCCTGGT
+
+>r558
+AAGGAAGACGGCAACAAGCCTGGC
+
+>r559
+AAAGAGGATGGCAACAAGCCTGGT
+
+>r560
+AAAGAAGATGACAACAAACCTGGC
+
+>r561
+GAGGAAGACAACAACAAACATGGT
+
+>r562
+AAAGAAGAGAACAAAAAACCTGGT
+
+>r563
+AAGGAAGACAATAACAAGCCTGGC
+
+>r564
+AAAGAAGAAAACAAAAAACCTGGC
+
+>r565
+AAAGAAGATAGCAACAGACCTGGC
+
+>r566
+GAGGAAGACAATAAGCCTGGT
+
+>r567
+TAAGAAGACGGCAACAAGCCTGGT
+
+>r568
+AAAGAAGACAACAAAAAACCTTGT
+
+>r569
+AAGGAAGACAACAACAAACCTGGT
+
+>r570
+GAGGAAGGCAATAACAAGCCTGGT
+
+>r571
+AAAGAAGGCAACAAAAAACCTGGC
+
+>r572
+AAAGAAGATGGCAACAAGCCTGGG
+
+>r573
+GAGGAAGACAATAACAGGCCTGGT
+
+>r574
+AAAGAAGATGGCAACAAGCCTTGC
+
+>r575
+AAAGAAGATGGCAACAAGGCTGGC
+
+>r576
+AGAGAAGATGGCAACAAGCCTAGT
+
+>r577
+AAAGAAGATGGCAACAAACCAGGT
+
+>r578
+AAAGAAGACTGCAACAAGCCTGGC
+
+>r579
+AAAGAAGACAACAAAAATCCTAGC
+
+>r580
+GAGGAAGACAACAACAAACCTCGG
+
+>r581
+AAAGAAGATAATAACAAGCCTGGC
+
+>r582
+AAAGAAGACGGCAACAAGCCTGTT
+
+>r583
+AAAGAAGACAACAACATGCCTGGC
+
+>r584
+GAGGAAGACAAGAACAAACCTGGT
+
+>r585
+GAGGAAGAGAATAACAAGCCTGGC
+
+>r586
+GAGGAAGACAATAAAAAACCTGGT
+
+>r587
+AAAGAAGACAACAACAGGCCTGGT
+
+>r588
+CAAGAAGACAACAAGCCTGGT
+
+>r589
+GAAGAAGACAACAAAAAACCTGGC
+
+>r590
+AAAGAAGGTGGCAACAAGCCTAGT
+
+>r591
+GAGGAAGACAACAAGCCTGGC
+
+>r592
+GAGTAAGACAATAACAAGCCTGGT
+
+>r593
+AAAGAAGACGGCAACCAGCCTGGC
+
+>r594
+AAAGGAGATGGCAACAAACCTGGC
+
+>r595
+GAGGAAGACCATAACAAGCCTGGC
+
+>r596
+AAAGAAGACAACAACAAGACTGGC
+
+>r597
+GATGAAGACAACAAGCCTGGC
+
+>r598
+AAAGAAGACAACAAAACACCTGGC
+
+>r599
+CAAGAAGATGGCAACAAGCCTGGT
+
+>r600
+AAAGAAGACAATAACAAACCTGGC
+
+>r601
+AAAGCAGACAACAACAAACCTGGC
+
+>r602
+AAAGAAGACGGCACCAAGCCTGGT
+
+>r603
+GAGTAAGACAATAACAAGCCTGGC
+
+>r604
+AAAGAAGACAACACAAAACCTGGT
+
+>r605
+AAAGAAGACAAGAACAAGCCTGGC
+
+>r606
+AAAGAAGACGATAACAAACCTGGT
+
+>r607
+GAGGAAGACAGCAACAAGCCCCTG
+
+>r608
+GAGGAAGACAATAAAAAGCCTGGT
+
+>r609
+GAGGAAGACAATAACAAGCCTGTT
+
+>r610
+AAAGAAGATGACAACAAGCCTAGT
+
+>r611
+GCTGACAACAACAAGCCTGGT
+
+>r612
+AAAGAAGACAATAACTAGCCTGGC
+
+>r613
+AAAGAAGACAACTACAAGCCTGGC
+
+>r614
+AAAGAAGACAATAACAAGCCCGGC
+
+>r615
+AAAGAAGATGTCAACAAACCTGGC
+
+>r616
+AAAGAATACGGCAACAAGCCTGGC
+
+>r617
+GAGGAAGACAACAACAAAAAACCTGGT
+
+>r618
+CAAGAAGATGGCAACAAACCTGGT
+
+>r619
+GAGTAAGACAACAACAAGCCTGGT
+
+>r620
+AAAGAAGATGGCAACAAGCCTGGA
+
+>r621
+TAGGAAGACAACAACAAACCTGGT
+
+>r622
+AAAGAAGATGGCAATAAGCCTGGC
+
+>r623
+AAAGCAGACGGCAACAAACCTGGT
+
+>r624
+GAGGAAGACAATAACAAGACTGGT
+
+>r625
+AAAGAAGACAACAACAAACCTAGT
+
+>r626
+AAAGAAGACAACAACAAGCCAGGT
+
+>r627
+AAAGAAGACGGCAAGAAACCTGGT
+
+>r628
+AAAGAAGATGGCAACGAGCCTGGT
+
+>r629
+GAGGAAGACAGCAACAAACCTGGC
+
+>r630
+GAGGAATACAACAAGCCTGGT
+
+>r631
+AAAGAAGACAACAACAAGCCTGTT
+
+>r632
+AAAGAAGACGGCAACAACCCTGGC
+
+>r633
+AAATAAGATGGCAACAAGCCTGGT
+
+>r634
+AAAGAAGACGGCAACAAACCTCGT
+
+>r635
+AAAGAAGACGGCAACAAGCCTGCT
+
+>r636
+GAGGAAGACAATAAGAAGCCTGGT
+
+>r637
+GAGGAAGAAAATAACAAGCCTGGC
+
+>r638
+AAAGAAGAAAACAACAAGCCTGGC
+
+>r639
+AAAGAAGACGGCAACAGACCTGGC
+
+>r640
+AAAGAAGAGGGTAACAAACCTGGC
+
+>r641
+GCTGACAACAACAAGCCTGGC
+
+>r642
+AAAGAAGACAATAACAAGACTGGC
+
+>r643
+AAAAAAGATGGCAACAAGCCTGGT
+
+>r644
+GAGGAAGACAACAACAAACCCGGT
+
+>r645
+GAGGAATACAACAAAAAACCTGGT
+
+>r646
+AATGAAGACAACAACAAGCCTGGT
+
+>r647
+AACGAAGACGGCAACAAGCCTGGC
+
+>r648
+AAAGAAGACGGCAACAAGCAGCCTGGT
+
+>r649
+AAAGAAGACAACAACAAAAAACCTGGT
+
+>r650
+AAAGAAGATGGCAACAAACCTTGT
+
+>r651
+AAAGAAGACAACAACAAGCCTTGT
+
+>r652
+AAAGAAGACAACAAAATACCTGGT
+
+>r653
+GAGAAAGACAATAACAAACCTGGT
+
+>r654
+AAAGAAGACAACCAAAAACCTGGT
+
+>r655
+AAAGAGGACAACAACAAGCCTGGT
+
+>r656
+GAAGAAGACAACAACAAACCTGGC
+
+>r657
+AAAGAAGACAGAAACAAACCTGGC
+
+>r658
+AAAGAAGACGGCAACAAGCCTGTC
+
+>r659
+AAAGAAGATGGCAACAAGTCTGGC
+
+>r660
+AAAGAAGGCAACAACAAGCCTGGC
+
+>r661
+AAACAAGACGGCAACAAGCCTGGC
+
+>r663
+AAAGAAGACGGCAAAAAGCCTGGT
+
+>r664
+AAAGAAGATGGCAACAAGCCTGTT
+
+>r665
+AAAGAAGACAGCAAAAAGCCTATC
+
+>r666
+AAAGAAGATGGCAACAAACCGGGT
+
+>r667
+AAAGAAGATCGCAACAAGCCTGGT
+
+>r668
+AAAGAAGACGTCAACAAGCCTGGC
+
+>r669
+AAAGAAGAGAACAACAAGCCTGGC
+
+>r670
+AAAGAAGACAACAAAAGACCTGGC
+
+>r671
+AAAGAAGTCAACAAAAAACCTGGT
+
+>r672
+AAAGAAGGCAACAAACCTGGT
+
+>r673
+AAAAAAGACAACAACAAACCTGGC
+
+>r674
+GAGGAAGACAATAACAAGCTTGGC
+
+>r675
+GAGGAAGACAATAACAAGCCTGAT
+
+>r676
+AAAGAAGATGGCAACAAACCTGGA
+
+>r677
+AAAGAAGACGGGAACAAACCTGGT
+
+>r678
+AAAGAAGACAATAACAAGGCTGGC
+
+>r679
+AAAGAGGATGGCAACAAACCTGGT
+
+>r680
+TAAGAAGACAACAACAAGCCTGGT
+
+>r681
+GAGGAAGACGACAACAAACCTGGT
+
+>r682
+GAAGAAGACAACAACAAGCCTGGC
+
+>r683
+AAAGAAGGCAACAAGCCTGGT
+
+>r684
+AAAGAAGACGGAAACAAACCTGGC
+
+>r685
+AAAGAAGATGGCAAGAAACCTGGT
+
+>r686
+AAAGAAGACAACAACAAATCTGGT
+
+>r687
+AAAGAAGACGACAACAAGCCCGGT
+
+>r688
+AAAGAAGACAACAAAAAACCTGCT
+
+>r689
+AAAGAAGATGGTAACAAAGCTGGC
+
+>r690
+AAATAAGACGGCAACAAGCCTGGC
+
+>r691
+AAAGAAGACAACAACAAACCTGTC
+
+>r692
+AAAGAAGCCGGCAACAAACCTGGC
+
+>r693
+AATGAAGACAACAAAAAACCTGGT
+
+>r694
+AAAGAAGACAACAACAAATCTGGC
+
+>r695
+AAAGAAGACAACAAAAAGCCCAGC
+
+>r696
+AAAGAAGACGGCAACAAGCCTGAC
+
+>r697
+AAAGAAGACAACAACAAACCCGGC
+
+>r698
+AACGAAGACAACAAAAAACCTGGT
+
+>r699
+TAGGAAGACAATAACAAGCCTGGC
+
+>r700
+AAAGAAGATGGCAACAAGCCTGAC
+
+>r701
+AAAGAAGACCCCAACAAACCTGGT
+
+>r702
+GAGGAAGATGGCAACAAACCTGGT
+
+>r703
+AAAGAAGACAAGAAAAAACCTGGT
+
+>r705
+GAGGAAGACAACAAAAAACCCGGT
+
+>r706
+AAAGAAGACAACAAAAAACCGGGC
+
+>r707
+GAGTAAGACAACAACAAACCTGGT
+
+>r708
+AAAGAAGACAATGACAAGCCTGGC
+
+>r709
+AAAGAAGACAACAAAAAATTTGGT
+
+>r710
+AGAGAAGACGGCAACAAACCTGGC
+
+>r711
+AAAGAAGACGGCAACAAAACTGGC
+
+>r712
+GAGGAAGACAAAAACAAACCTGGT
+
+>r713
+AAAGAGGATAACAACAAACCTGGT
+
+>r714
+AAAGAAGACAACAACAAGCCCGGC
+
+>r715
+AAAGAAGACGGCAACAAACCTCGC
+
+>r716
+AAAGAAGACAAAAACAAACCTGGT
+
+>r717
+AAACAAGATGGCAACAAGCCTGGC
+
+>r718
+AAAGAAGATGGCAATAAACCTGGC
+
+>r719
+AAAGAAGACTGCAAAAAACCTGGT
+
+>r720
+AAAGAAGTCGGCAACAAACCTGGC
+
+>r721
+AAAGAAGATGGCAACAAACCTGCT
+
+>r722
+AAAGAAGACAACAACAAAGCTGGC
+
+>r723
+AAAGGAGACGGCAACAAGCCTGGC
+
+>r724
+GAGGAAAACAACAACAAACCTGGT
+
+>r725
+AAAGAAGACAACAACAAACCGGGT
+
+>r726
+GAAGAAGACAACAACAAACCTGGT
+
+>r727
+AAAGAAAACAACAACAAGCCTGGC
+
+>r728
+AAAGAAAATGGCAACAAGCCTGGT
+
+>r729
+AAAGATGACAACAACAAGCCTGGT
+
+>r730
+AAAGAAGACGGAAAAAAACCTGGC
+
+>r731
+AAAGAAGATGGCAACAAAAAGCCTAGC
+
+>r732
+AAAAAAGACAATAACAAGCCTGGC
+
+>r733
+GAGGAAGACAACAACATGCCTGGT
+
+>r734
+AAAGAAGACACCAAAAAACCTGGT
+
+>r735
+GAGGAAGACAACAATAAGCCTGGC
+
+>r736
+AAAGAAGATGGTAACAAACTTGGC
+
+>r737
+AAAGGAGATGGCAACAAGCCTGGT
+
+>r738
+AAAGGAGATGGCAACAAACCTGGT
+
+>r739
+AAACAAGACGGCAACAAACCTGGT
+
+>r740
+GAGAAAGACAACAACAAACCTGGC
+
+>r741
+GAGGAAGACAAAAACAAACCTAGT
+
+>r742
+GAGGAAGACAAAAACAAGCCTGGT
+
+>r743
+AAAGAAGACAAAAACAAGCCTGGT
+
+>r744
+AAAGAAGACAACAATAAGCCTGAC
+
+>r745
+AAAGAAGACAATAACAGGCCTGGT
+
+>r746
+AAAGGAGACGGCAACAAGCCTGGT
+
+>r747
+AAAGAAGACATCAAAAAACCTGGC
+
+>r748
+AAAGGAGACAACAAAAAACCTGGC
+
+>r749
+GAGGGAGACAACAAAAAACCTGGT
+
+>r750
+GGGGAAGACAACAAAAAACCTGGT
+
+>r751
+GAGGAAGACAACAACAACCCTGGT
+
+>r752
+AAAGAAGACCACAAAAAACCTGGC
+
+>r753
+AAAGAAGACAACAACAAACCTTGC
+
+>r754
+AAAGAAGACAACAAGAAGCCTGGT
+
+>r755
+AAACAAGACGGCAACAAACCTGGC
+
+>r756
+GAGGAAGACAACAACAAACCTTGT
+
+>r757
+GAGGAAGACAATAACAATCCTGGT
+
+>r758
+AAAAAAGACAACAAAAAGCCTGGC
+
+>r759
+AAAGAAGACAACAACAGACCTGGC
+
+>r760
+CAAGAAGTCGGCAACAAGCCTGGT
+
+>r761
+GAGGAAGACAACAACGAGCCTGGC
+
+>r762
+GAGGGAGACAACAACAAACCTGGT
+
+>r763
+AAAGAAGGCAATAACAAGCCTGGT
+
+>r764
+GAGGAAGACAACAACAAGCCTTGT
+
+>r765
+AAAGAAGACGGCAACAAACCTGCA
+
+>r766
+AAAGAAGACAGCAACAAGCCTGAC
+
+>r767
+AAAGAAGACGGCAACAAACCGGGT
+
+>r768
+AAAGAAGTTGGCAACAAGCCTGGT
+
+>r769
+AAAGCAGACAACAACAAGCCTGGT
+
+>r770
+AAAGAAGATGGCAACAAACCTCGT
+
+>r771
+GAGGAAGAAAACAACAAACCTGGT
+
+>r772
+GAGGAAGACAACAACAAATCTGGC
+
+>r773
+AAAGAAGAGGGCAACAAACCTGGT
+
+>r774
+AAAAAAGACAATAACAAGCCTGGT
+
+>r775
+GAGGAAAACAATAACAAGCCTGGC
+
+>r776
+AAAGAAGACAACGACAAACCTGGC
+
+>r777
+AAAGAAGGTGGCAACAAACCTGGC
+
+>r778
+GAGGAAGACAATAACAAGCCTGAC
+
+>r779
+AAAGAAGACAACAACAAGCGTGGC
+
+>r780
+GAGGAAGACAATAACAAGTCTGGC
+
+>r781
+GAGGAAGAGAACAACAAACCTGGT
+
+>r782
+GAGGAAGATAACAACAAACCTGGC
+
+>r783
+AAAGAAGACAACAAAAACCCTGGC
+
+>r784
+AAAGAAGACAAAAAAAAACCTGGC
+
+>r785
+AGAGAAGACAACAACAAACCTGGC
+
+>r786
+GAGGAAGACAACAACAAGCCTGTT
+
+>r787
+GAGGAAGACAACAACAAACCTAGT
+
+>r788
+GAGGAAGACAACAACAAACCTGAC
+
+>r789
+AAAGAAGGTGGCAACAAGCCTGGC
+
+>r790
+GAGGAAGACAACAACCAACCTGGT
+
+>r791
+AAAGAAGATGGCAACACACCTGGT
+
+>r792
+GAGGAAGACAACAAAAAACCTGGG
+
+>r793
+GAGGAAGACATCAAAAAACCTGGT
+
+>r794
+AAAGAAGACAATAACAAGCCTAGC
+
+>r795
+AAAGAAGACAACAAGAAGCCTGGC
+
+>r796
+AAAGAAGACGGCAACAAGCCTGTA
+
+>r797
+AAAGAAGACAATAACAAGACTGGT
+
+>r798
+AAAGAAGACAACAAAGAACCTGGC
+
+>r799
+AAAGACGACAACAACAAGCCTGGT
+
+>r800
+AAAGAAGACAATAAAAAACCTGGC
+
+>r801
+AAAGAAGACAATAACAAGCCTGGA
+
+>r802
+GAGGAAGACAACAACAAGCCTGGA
+
+>r803
+AAAGAAGACGGCAACAAACATGGC
+
+>r804
+AAAGAAGAAGGCAACAAGCCTGGT
+
+>r805
+AAAGAGGACAACAAAAAACCTGGT
+
+>r806
+AAAGAAGACAACAACAAGCCTGCT
+
+>r807
+AAAGAAGACAACAAAAAACCTCGC
+
+>r808
+AAAGAAGACAATAACAAGCCTGAT
+
+>r809
+GAGGAAGATGGCAACAAGCCTGGT
+
+>r810
+AAAGAAGACAACAAATAACCTGGT
+
+>r811
+AAAGAAGGCAATAACAAGCCTGGC
+
+>r812
+AAAGAAGATGGCAAAAAGCCTGGT
+
+>r813
+GAGGAAGACAACAACAAACCTGAT
+
+>r814
+AAAGAAGACAACAACAACCCTGGC
+
+>r815
+GAGGAAGATAACAACAAGCCTGGT
+
+>r816
+GAGGAAGACAACAAAAAAACTGTT
+
+>r817
+AAAGAAGATGGCAACTCGCCTGGT
+
+>r818
+AAGGAAGACAACAACAAACCTGGC
+
+>r819
+AAAGAAGCCGGCAACAAGCCTGGT
+
+>r820
+AAAGAAGGCAACAAACCTGGC
+
+>r821
+TAGGAAGACAACAAAAAACCTGGT
+
+>r822
+AAAGAAGACGGCGACAAACCTGGT
+
+>r823
+AAAGAAGACAACAAAAAACCTGTT
+
+>r824
+GAGAAAGACAACAACAAGCCTGGT
+
+>r825
+AAAGAAGACAACAAAAAACCTGGA
+
+>r826
+AAAGAACATGGTAACAAACCTGGC
+
+>r827
+AAAGAAGACAGCAAAAAGCCTAGT
+
+>r828
+GAGGAAGACAACAACAACAAGCCTGGT
+
+>r829
+AAAGAAGATGTCAACAAACCTGGT
+
+>r830
+AAAGAAGAAGACAACAAGCCTGGC
+
+>r831
+GAGGAAGACAACCAAAAACCTGGT
+
+>r832
+AAAGAAGCCAACAAAAAACCTGGT
+
+>r833
+AAGGAAGACAACAACAACAAGCCTGGT
+
+>r834
+AAAGAAGACGGCAACTAACCTGGT
+
+>r835
+GAGGAAGACAACAACAAACCTGCT
+
+>r836
+CAAGAAGACAACAAAAAGCCTGGC
+
+>r837
+GAGGAAGACGGTAACAAACCTGGT
+
+>r838
+AAAGAAGACATCAAAAAACCTGGT
+
+>r839
+GAGGAAGACGGCAACAAACCTGAT
+
+>r840
+AAAGAGGATGGCAACAAACCTGGC
+
+>r841
+AAAGAAGATGCCAACAAGCCTGGT