Mercurial > repos > bgruening > blobtoolkit
changeset 0:7d9ee8cd14b8 draft
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/blobtoolkit commit 7c0db48ffd4dbee68fb2320fc5a064bc9c3219d9
author | bgruening |
---|---|
date | Mon, 30 Jan 2023 12:39:40 +0000 |
parents | |
children | 840822c1e84a |
files | blobtoolkit.xml macros.xml test-data/assembly.fasta.gz test-data/assembly.yaml test-data/bam_file.bam test-data/blast_results.tabular test-data/busco_full_table.tabular test-data/contig.fasta test-data/reads.fastq test-data/small_taxdump.tar.gz test-data/test01_blobdir.tar.gz test-data/test02_blobdir.tar.gz test-data/test04_circle.png test-data/test04_cumulative.png test-data/test04_snail.png |
diffstat | 15 files changed, 968 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
<!--
    blobtoolkit.xml: Galaxy tool wrapper around the `blobtools` command line.

    The tool exposes four modes through the `mode_conditional` selector:
      * create: build a new BlobDir from an assembly FASTA (+ optional metadata) and a taxdump.
      * add:    unpack an existing BlobDir archive and add BUSCO / hits / coverage / text fields.
      * filter: unpack a BlobDir archive, run `blobtools filter`, optionally followed by `blobtools remove`.
      * plots:  unpack a BlobDir archive and render blob, cumulative and snail views.

    create/add/filter emit ./Blobdir.tgz; plots emits three image files.
-->
<tool id="blobtoolkit" name="BlobToolKit" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.05">
    <description>genome assembly QC</description>
    <macros>
        <import>macros.xml</import>
    </macros>
    <expand macro='requirements' />
    <command detect_errors="exit_code"><![CDATA[
        #if $mode_conditional.selector == 'create'
            mkdir -p './Blobdir' &&
            mkdir -p './taxdump' &&
            ln -s '${mode_conditional.taxdump}' 'taxdump.tar' &&
            tar -xf 'taxdump.tar' -C './taxdump' &&
            ln -s '${mode_conditional.fasta}' 'assembly.fasta' &&
            #if $mode_conditional.meta
                ln -s '${mode_conditional.meta}' 'assembly.yaml' &&
            #end if
            blobtools create
                --fasta 'assembly.fasta'
                #if $mode_conditional.meta
                    --meta 'assembly.yaml'
                #end if
                --taxid $mode_conditional.taxid
                --taxdump './taxdump'
                './Blobdir'
            ## The taxdump is copied into the BlobDir so that the 'add' mode can read it from './Blobdir/taxdump'.
            && cp -r './taxdump' './Blobdir/'
            && tar -zcf './Blobdir.tgz' './Blobdir'

        #else if $mode_conditional.selector == 'add'
            #if $mode_conditional.blobdir.is_of_type("tgz")
                tar -zxf '${mode_conditional.blobdir}' -C './' &&
            #else
                tar -xf '${mode_conditional.blobdir}' -C './' &&
            #end if
            #if $mode_conditional.busco
                ln -s '${mode_conditional.busco}' './busco_results.tab' &&
            #end if
            #if $mode_conditional.blast_input.selector == 'enabled'
                ln -s '$mode_conditional.blast_input.hits' './blast_results.tab' &&
            #end if
            #if $mode_conditional.cov
                ln -s '$mode_conditional.cov' './input.bam' &&
                ln -s '$mode_conditional.cov.metadata.bam_index' './input.bam.bai' &&
            #end if
            #if $mode_conditional.bed
                mkdir -p './bed_files' &&
                #import re
                ## Each BED dataset gets a shell-safe name; the loop index keeps names unique.
                #for $i, $input in enumerate($mode_conditional.bed):
                    #set $safename = re.sub('[^\w\-_]', '_', $input.element_identifier) + "." + str($i)
                    ln -sf '${input}' './bed_files/${safename}.bed' &&
                #end for
            #end if
            blobtools add
                --threads \${GALAXY_SLOTS:-8}
                --taxdump './Blobdir/taxdump'
                #if $mode_conditional.busco
                    --busco './busco_results.tab'
                #end if
                #if $mode_conditional.blast_input.selector == 'enabled'
                    --hits './blast_results.tab'
                    #if $mode_conditional.blast_input.hits_cols
                        --hits-cols '${mode_conditional.blast_input.hits_cols}'
                    #end if
                    --taxrule $mode_conditional.blast_input.taxrule
                    --evalue $mode_conditional.blast_input.evalue
                    ## hit_count is optional: only emit the flag when a value is set, otherwise
                    ## an empty value would make '--hit-count' swallow the next option.
                    #if str($mode_conditional.blast_input.hit_count) != ''
                        --hit-count $mode_conditional.blast_input.hit_count
                    #end if
                    --bitscore $mode_conditional.blast_input.bitscore
                #end if
                #if $mode_conditional.bed
                    --beddir './bed_files'
                #end if
                #if $mode_conditional.cov
                    --cov './input.bam'
                #end if
                #if $mode_conditional.fasta
                    --fasta '${mode_conditional.fasta}'
                #end if
                #if $mode_conditional.trnascan
                    --trnascan '${mode_conditional.trnascan}'
                #end if
                #if $mode_conditional.text_input.selector == 'enabled'
                    --text '${mode_conditional.text_input.text}'
                    --text-cols '${mode_conditional.text_input.text_cols}'
                    $mode_conditional.text_input.text_header
                    $mode_conditional.text_input.text_no_array
                    ## Quoted so that the '\t' option value reaches blobtools intact instead of being reduced to 't' by the shell.
                    --text-delimiter '$mode_conditional.text_input.text_delimiter'
                #end if
                #if $mode_conditional.advanced_options.blobdb
                    --blobdb '${mode_conditional.advanced_options.blobdb}'
                #end if
                #if $mode_conditional.advanced_options.synonyms
                    --synonyms '${mode_conditional.advanced_options.synonyms}'
                #end if
                $mode_conditional.advanced_options.update_plot
                #if $mode_conditional.advanced_options.pileup_args
                    --pileup-args '${mode_conditional.advanced_options.pileup_args}'
                #end if
                $mode_conditional.advanced_options.replace
                './Blobdir'
            && tar -zcf './Blobdir.tgz' './Blobdir'

        #else if $mode_conditional.selector == 'filter'
            #if $mode_conditional.blobdir.is_of_type("tgz")
                tar -zxf '${mode_conditional.blobdir}' -C './' &&
            #else
                tar -xf '${mode_conditional.blobdir}' -C './' &&
            #end if
            #if $mode_conditional.filter_options.fasta
                ln -s '${mode_conditional.filter_options.fasta}' './input.fasta' &&
            #end if
            #if $mode_conditional.filter_options.fastq_filter.selector == 'enabled'
                ## 'fastq' and 'cov' are declared inside the 'fastq_filter' conditional, so they must be addressed through it.
                ln -s '${mode_conditional.filter_options.fastq_filter.fastq}' './input.fastq' &&
                ln -s '$mode_conditional.filter_options.fastq_filter.cov' './input.bam' &&
                ## NOTE(review): the 'add' mode links the same metadata index as './input.bam.bai'; confirm that '.csi' is intended here.
                ln -s '$mode_conditional.filter_options.fastq_filter.cov.metadata.bam_index' './input.bam.csi' &&
            #end if
            blobtools filter
                #if $mode_conditional.filter_options.param
                    --param '$mode_conditional.filter_options.param'
                #end if
                #if $mode_conditional.filter_options.json
                    --json '$mode_conditional.filter_options.json'
                #end if
                #if $mode_conditional.filter_options.list
                    ## The sanitizer of this parameter allows spaces, so the value has to be quoted to stay a single argument.
                    --list '$mode_conditional.filter_options.list'
                #end if
                $mode_conditional.filter_options.invert
                #if $mode_conditional.filter_options.fasta
                    --fasta './input.fasta'
                #end if
                #if $mode_conditional.filter_options.fastq_filter.selector == 'enabled'
                    --fastq './input.fastq'
                    --cov './input.bam'
                #end if
                #if $mode_conditional.filter_options.text_input.selector == 'enabled'
                    --text '${mode_conditional.filter_options.text_input.text}'
                    --text-cols '${mode_conditional.filter_options.text_input.text_cols}'
                    $mode_conditional.filter_options.text_input.text_header
                    ## Quoted for the same reason as in the 'add' mode ('\t' must survive the shell).
                    --text-delimiter '$mode_conditional.filter_options.text_input.text_delimiter'
                #end if
                ./Blobdir
            ## 'blobtools remove' only runs when at least one removal flag or a field ID was given.
            #if $mode_conditional.remove_options.remove_selector or $mode_conditional.remove_options.field
                && blobtools remove
                    #for $param in $mode_conditional.remove_options.remove_selector
                        $param
                    #end for
                    #if $mode_conditional.remove_options.field
                        --field '$mode_conditional.remove_options.field'
                    #end if
                    ./Blobdir
            #end if
            && tar -zcf './Blobdir.tgz' './Blobdir'

        #else if $mode_conditional.selector == 'plots'
            #if $mode_conditional.blobdir.is_of_type("tgz")
                tar -zxf '${mode_conditional.blobdir}' -C './' &&
            #else
                tar -xf '${mode_conditional.blobdir}' -C './' &&
            #end if
            ## Each view is rendered and then renamed to the extension-less path that the matching output collects via from_work_dir.
            blobtools view
                --format $mode_conditional.format
                --view 'blob'
                ./Blobdir
            && mv ./Blobdir.blob.circle* ./Blobdir.blob.circle
            && blobtools view
                --format $mode_conditional.format
                --view 'cumulative'
                ./Blobdir
            && mv ./Blobdir.cumulative* Blobdir.cumulative
            && blobtools view
                --format $mode_conditional.format
                --view 'snail'
                ./Blobdir
            && mv ./Blobdir.snail* Blobdir.snail
        #end if
    ]]></command>
    <inputs>
        <conditional name="mode_conditional">
            <param name="selector" type="select" label="Select mode" help="Select a BlobToolKit module">
                <option value="create">Create a BlobToolKit dataset</option>
                <option value="add">Add data to a BlobToolKit dataset</option>
                <option value="filter">Edit a BlobToolKit dataset</option>
                <option value="plots">Generate plots</option>
            </param>
            <!-- create: inputs for `blobtools create` -->
            <when value="create">
                <param argument="--fasta" type="data" format="fasta" label="Genome assembly file" help="FASTA sequence file" />
                <param argument="--meta" type="data" format="yaml" label="Metadata file" optional="true" help="Optional metadata dataset"/>
                <param argument="--taxid" type="integer" value="" label="NCBI taxonomy ID" help="Add ranks to metadata for a taxid"/>
                <param argument="--taxdump" type="data" format="tar,tgz,gz" label="NCBI taxdump directory" help="It should be compressed in tar.gz format"/>
            </when>
            <!-- add: inputs for `blobtools add` -->
            <when value="add">
                <param name="blobdir" type="data" format="tgz" label="Blobdir.tgz file" help="This file should be generated by Blobtool create" />
                <param argument="--busco" type="data" format="tsv,tabular,txt" optional="true" label="BUSCO full table file"/>
                <conditional name="blast_input">
                    <param name="selector" type="select" label="BLAST/Diamond hits">
                        <option value="enabled">Enabled</option>
                        <option value="disabled" selected="true">Disabled</option>
                    </param>
                    <when value="enabled">
                        <param argument="--hits" type="data" format="tsv,tabular" optional="true" label="BLAST/Diamond hits dataset" help="Tabular BLAST/Diamond output file"/>
                        <param argument="--taxrule" type="select" label="BLAST hits to taxa rule" help="Rule to use when assigning BLAST hits to taxa">
                            <option value="bestsum">Bestsum</option>
                            <option value="bestsumorder">Bestsumorder</option>
                            <option value="bestdistsum">Bestdistsum</option>
                            <option value="bestdistsumorder">Bestdistsumorder</option>
                            <option value="blastp">Blastp</option>
                        </param>
                        <param argument="--evalue" type="float" min="0" value="1" label="E-value cutoff"
                            help="The smaller the E-value, the better the match. Any hits with an evalue weaker than the value specified will be excluded"/>
                        <param argument="--bitscore" type="float" min="0" value="1" label="Bitscore cutoff"
                            help="The higher the bit-score, the better the sequence similarity. Any hits with a bitscore lower than the value specified will be excluded"/>
                        <param argument="--hit-count" type="integer" min="1" value="10" label="Hits to a given taxon" optional="true"
                            help="By default the 10 highest scoring hits to a given taxon will be used when applying the --taxrule"/>
                        <param argument="--hits-cols" type="text" value="1=qseqid,2=staxids,3=bitscore,5=sseqid,10=qstart,11=qend,14=evalue" optional="true"
                            label="BLAST/Diamond file column order" help="More information in the help section">
                            <sanitizer invalid_char="">
                                <valid initial="string.letters,string.digits">
                                    <add value="=" />
                                    <add value="," />
                                </valid>
                            </sanitizer>
                            <validator type="regex">[0-9a-z=,]+</validator>
                        </param>
                    </when>
                    <when value="disabled"/>
                </conditional>
                <param argument="--bed" type="data" format="bed" multiple="true" optional="true" label="BED file of coverages per scaffold"/>
                <param argument="--cov" type="data" format="bam,sam,cram" optional="true" label="BAM/SAM/CRAM read alignment file"/>
                <param argument="--fasta" type="data" format="fasta" optional="true" label="FASTA sequence" help="FASTA sequence file" />
                <param argument="--trnascan" type="data" format="tsv,tabular" optional="true" label="tRNAscan2-SE"
                    help="tRNAscan-SE is employed for identifying and annotating tRNA genes in genomes"/>
                <!-- The nested param is injected into the macro at its yield point, so it is only offered in this mode. -->
                <expand macro="macro_text_input">
                    <param argument="--text-no-array" type="boolean" truevalue="--text-no-array" falsevalue="" checked="false" label="Prevent duplicated identifiers"
                        help="Prevent fields in files with duplicate identifiers being loaded as array fields" />
                </expand>
                <section name="advanced_options" title="Advanced options">
                    <param argument="--blobdb" type="data" format="json" optional="true" label="Blobtools v1 database" help="This file should have been generated with the previous Blobtools tool version"/>
                    <param argument="--synonyms" type="data" format="tsv" optional="true" label="Identifier and synonyms" help="TSV file containing current identifiers and synonyms"/>
                    <param argument="--update-plot" type="boolean" truevalue="--update-plot" falsevalue="" checked="false" label="Update plot" help="Flag to use new taxrule as default category" />
                    <param argument="--pileup-args" type="text" value="" optional="true" label="Samtools Pileup" help="Key/value pairs to pass to samtools pileup">
                        <sanitizer invalid_char="">
                            <valid initial="string.letters,string.digits">
                                <add value="=" />
                                <add value="," />
                                <add value="-" />
                            </valid>
                        </sanitizer>
                        <validator type="regex">[0-9a-zA-Z=,-]+</validator>
                    </param>
                    <param argument="--replace" type="boolean" truevalue="--replace" falsevalue="" checked="false" label="Replace fields" help="Allow existing fields to be overwritten" />
                </section>
            </when>
            <!-- filter: inputs for `blobtools filter` and the optional `blobtools remove` step -->
            <when value="filter">
                <param name="blobdir" type="data" format="tgz" label="Blobdir file" help="This file should be generated by the module create" />
                <section name="filter_options" title="Filter mode options" expanded="true">
                    <param argument="--param" type="text" value="" optional="true" label="Parameter value" help="String of type param=value. Individual param=value pairs can be specified to filter based on Variable or Category fields">
                        <sanitizer invalid_char="">
                            <valid initial="string.letters,string.digits">
                                <add value="=" />
                                <add value="," />
                                <add value="-" />
                            </valid>
                        </sanitizer>
                        <validator type="regex">[0-9a-zA-Z=,-]+</validator>
                    </param>
                    <param argument="--list" type="text" value="" optional="true" label="List of identifiers" help="Space separated list of identifiers">
                        <sanitizer invalid_char="">
                            <valid initial="string.letters,string.digits">
                                <add value=" " />
                                <add value="-" />
                                <add value="_" />
                            </valid>
                        </sanitizer>
                        <validator type="regex">[0-9a-zA-Z _-]+</validator>
                    </param>
                    <param argument="--json" type="data" format="json" optional="true" label="JSON format list file" help="JSON format list file as generated by BlobtoolKit Viewer"/>
                    <!-- NOTE(review): declared multiple="true", but the command links this value to a single './input.fasta'; confirm whether several datasets are meant to be supported. -->
                    <param argument="--fasta" type="data" format="fasta" multiple="true" optional="true" label="Assembly to be filtered" help="FASTA format assembly file to be filtered"/>
                    <conditional name="fastq_filter">
                        <param name="selector" type="select" label="Filter FASTQ reads">
                            <option value="disabled">Disabled</option>
                            <option value="enabled">Enabled</option>
                        </param>
                        <when value="disabled"/>
                        <when value="enabled">
                            <param argument="--fastq" type="data" format="fastq" optional="true" label="Reads to be filtered" help="FASTQ format read file to be filtered"/>
                            <param argument="--cov" type="data" format="bam,sam,cram" optional="true" label="BAM/SAM/CRAM read alignment file" />
                        </when>
                    </conditional>
                    <expand macro="macro_text_input"/>
                    <!-- NOTE(review): this value is not referenced by the command template above; confirm whether it should be passed to blobtools. -->
                    <param argument="--summary-rank" type="text" value="phylum" label="Summary rank" help="Taxonomic level for summary">
                        <sanitizer invalid_char="">
                            <valid initial="string.letters"/>
                        </sanitizer>
                        <validator type="regex">[a-zA-Z]+</validator>
                    </param>
                    <param argument="--invert" type="boolean" truevalue="--invert" falsevalue="" checked="false" label="Invert filter"
                        help="Invert the filter (exclude matching records)"/>
                </section>
                <section name="remove_options" title="Remove mode options" expanded="true">
                    <!-- Option values are the literal blobtools flags; the command template emits them verbatim. -->
                    <param name="remove_selector" type="select" multiple="true" display="checkboxes" label="Fields to remove">
                        <option value="--all">Remove all fields except identifiers (--all)</option>
                        <option value="--busco">Remove all BUSCO fields (--busco)</option>
                        <option value="--cov">Remove all cov and read_cov fields (--cov)</option>
                        <option value="--fasta">Remove gc, length and ncount fields (--fasta)</option>
                        <option value="--hits">Remove all taxonomy fields (--hits)</option>
                    </param>
                    <param argument="--field" type="text" value="" optional="true" label="Remove fields by ID">
                        <sanitizer invalid_char="">
                            <valid initial="string.letters,string.digits"/>
                        </sanitizer>
                        <validator type="regex">[0-9a-zA-Z]+</validator>
                    </param>
                </section>
            </when>
            <!-- plots: inputs for the three `blobtools view` calls -->
            <when value="plots">
                <param name="blobdir" type="data" format="tgz" label="Blobdir file" help="This file should be generated by the module create" />
                <param argument="--format" type="select" label="Image format">
                    <option value="png">PNG</option>
                    <option value="svg">SVG</option>
                </param>
                <!-- NOTE(review): this value is not referenced by the command template above; confirm whether it should be passed to blobtools view. -->
                <param argument="--param" type="text" optional="true" label="Query parameter" help="Query string parameter."/>
            </when>
        </conditional>
    </inputs>
    <outputs>
        <!-- Archive produced by the create, add and filter modes. -->
        <data name="blobdir" format="tgz" from_work_dir="./Blobdir.tgz" label="${tool.name} on ${on_string}: Blobdir.tgz">
            <filter>mode_conditional['selector'] == 'create' or mode_conditional['selector'] == 'add' or mode_conditional['selector'] == 'filter'</filter>
        </data>
        <!-- Plot outputs default to png and switch to svg when that image format is selected. -->
        <data name="plot_circle" format="png" from_work_dir="./Blobdir.blob.circle" label="${tool.name} on ${on_string}: blob plot">
            <filter>mode_conditional['selector'] == 'plots'</filter>
            <change_format>
                <when input="$mode_conditional.format" value="svg" format="svg"/>
            </change_format>
        </data>
        <data name="plot_cumulative" format="png" from_work_dir="./Blobdir.cumulative" label="${tool.name} on ${on_string}: cumulative plot">
            <filter>mode_conditional['selector'] == 'plots'</filter>
            <change_format>
                <when input="$mode_conditional.format" value="svg" format="svg"/>
            </change_format>
        </data>
        <data name="plot_snail" format="png" from_work_dir="./Blobdir.snail" label="${tool.name} on ${on_string}: snail plot">
            <filter>mode_conditional['selector'] == 'plots'</filter>
            <change_format>
                <when input="$mode_conditional.format" value="svg" format="svg"/>
            </change_format>
        </data>
    </outputs>
    <tests>
        <!-- Test 1: create mode -->
        <test expect_num_outputs="1">
            <conditional name="mode_conditional">
                <param name="selector" value="create"/>
                <param name="fasta" value="assembly.fasta.gz"/>
                <param name="meta" value="assembly.yaml"/>
                <param name="taxid" value="801"/>
                <param name="taxdump" value="small_taxdump.tar.gz"/>
            </conditional>
            <output name="blobdir" file="test01_blobdir.tar.gz" compare="sim_size" delta="1000"/>
        </test>
        <!-- Test 2: add mode with BUSCO, coverage, FASTA and BLAST hits -->
        <test expect_num_outputs="1">
            <conditional name="mode_conditional">
                <param name="selector" value="add"/>
                <param name="blobdir" value="test01_blobdir.tar.gz"/>
                <param name="busco" value="busco_full_table.tabular"/>
                <param name="cov" value="bam_file.bam"/>
                <param name="fasta" value="contig.fasta"/>
                <section name="advanced_options">
                    <param name="update_plot" value="false"/>
                </section>
                <conditional name="blast_input">
                    <param name="selector" value="enabled"/>
                    <param name="hits" value="blast_results.tabular"/>
                    <param name="taxrule" value="bestsum"/>
                    <param name="evalue" value="1"/>
                    <param name="bitscore" value="1"/>
                    <param name="hit_count" value="10"/>
                    <param name="hits_cols" value="1=qseqid,2=staxids,3=bitscore,5=sseqid,10=qstart,11=qend,14=evalue"/>
                </conditional>
            </conditional>
            <output name="blobdir" file="test02_blobdir.tar.gz" compare="sim_size" delta="1000"/>
        </test>
        <!-- Test 3: filter mode followed by remove (all fields) -->
        <test expect_num_outputs="1">
            <conditional name="mode_conditional">
                <param name="selector" value="filter"/>
                <param name="blobdir" value="test02_blobdir.tar.gz"/>
                <section name="filter_options">
                    <param name="fasta" value="contig.fasta"/>
                    <param name="summary_rank" value="phylum"/>
                    <param name="invert" value="false"/>
                </section>
                <section name="remove_options">
                    <param name="remove_selector" value="--all"/>
                </section>
            </conditional>
            <output name="blobdir">
                <assert_contents>
                    <has_size value="672428" delta="1000"/>
                </assert_contents>
            </output>
        </test>
        <!-- Test 4: plots mode, PNG output -->
        <test expect_num_outputs="3">
            <conditional name="mode_conditional">
                <param name="selector" value="plots"/>
                <param name="blobdir" value="test02_blobdir.tar.gz"/>
                <param name="format" value="png"/>
            </conditional>
            <output name="plot_circle" file="test04_circle.png" ftype="png"/>
            <output name="plot_cumulative" file="test04_cumulative.png" ftype="png"/>
            <output name="plot_snail" file="test04_snail.png" ftype="png"/>
        </test>
    </tests>
    <help><![CDATA[
        BlobToolKit is a software suite to aid researchers in identifying and isolating non-target data in draft and publicly available genome assemblies. It can be used to process assembly,
        read and analysis files for fully reproducible interactive exploration in the browser-based Viewer. BlobToolKit can be used during assembly to filter non-target DNA, helping researchers produce assemblies with high biological credibility.
    ]]></help>
    <expand macro="citations"/>
</tool>
<!--
    macros.xml: shared tokens and XML macros imported by blobtoolkit.xml.
-->
<macros>
    <!-- Version tokens; the tool version string is built as @TOOL_VERSION@+galaxy@VERSION_SUFFIX@. -->
    <token name="@TOOL_VERSION@">3.4.0</token>
    <token name="@VERSION_SUFFIX@">0</token>

    <!-- Runtime dependency: a Docker container tagged with the tool version. -->
    <xml name="requirements">
        <requirements>
            <container type="docker">genomehubs/blobtoolkit:@TOOL_VERSION@</container>
        </requirements>
    </xml>
    <xml name="citations">
        <citations>
            <citation type="doi">10.1534/g3.119.400908</citation>
        </citations>
    </xml>
    <!--
        Conditional block for the generic text file options (text, text-cols, text-header, text-delimiter).
        Callers may nest extra params inside the expand element; they are inserted at the yield point
        and therefore only shown when the selector is "enabled".
    -->
    <xml name="macro_text_input" >
        <conditional name="text_input">
            <param name="selector" type="select" label="Generic text file" help="Include a generic text file as input">
                <option value="enabled">Enabled</option>
                <option value="disabled" selected="true">Disabled</option>
            </param>
            <when value="enabled">
                <param argument="--text" type="data" format="txt" label="Generic text file"/>
                <param argument="--text-cols" type="text" value="" label="Column specification" help="Example: 1=identifiers,2,3=score,total=total_score">
                    <sanitizer invalid_char="">
                        <valid initial="string.letters,string.digits">
                            <add value="_" />
                            <add value="," />
                            <add value="=" />
                            <add value="-" />
                            <add value="#" />
                        </valid>
                    </sanitizer>
                    <validator type="regex">[0-9a-zA-Z=,_#-]+</validator>
                </param>
                <param argument="--text-header" type="boolean" truevalue="--text-header" falsevalue="" checked="false" label="Text has header row" help="Set the flag if a text file contains a header row" />
                <param argument="--text-delimiter" type="select" label="Text delimiter" help="Character used as delimiter in the text file">
                    <option value=",">Comma</option>
                    <option value="\t">Tabulation</option>
                    <option value="whitespace">Whitespace</option>
                </param>
                <yield/>
            </when>
            <when value="disabled"/>
        </conditional>

    </xml>
</macros>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/assembly.yaml Mon Jan 30 12:39:40 2023 +0000 @@ -0,0 +1,9 @@ +assembly: + accession: GCA_018777385.1 + alias: Candidatus Symbiopectobacterium + bioproject: PRJEB12068 + biosample: SAMN17910462 + record_type: assembly +taxon: + name: SAMN17910462 + id: 801 \ No newline at end of file
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/blast_results.tabular Mon Jan 30 12:39:40 2023 +0000 @@ -0,0 +1,2 @@ +NZ_JAFJYB010000008.1 P08504.1 87.030 771 98 1 108971 111277 222 992 0.0 1402 gi|136134|sp|P08504.1|TNP5_ECOLX 3628 671 721 2 93.51 2 0 VVYETDRLNAIESLALPDGIALSVHQNRLLKLAREGRKMSSRDLAKFTDIRRYASLVCIISEARATLTDEVIDLHERILGSLFNRAKRTQAERLQQTGKLIQSKLKQFITVGQALLNARESGEDPWAAIEDVIPWQEFINSVEETRFLSRKDNFDPLHLITEKYSTLRKYAPRMLSALQFRAAPAAIQLSDALDTVREMYRKQLRKVPSSAPIGFIPESWRKVVITPSGIDRKYYEFCVLNELKGALRSGDIWVKGSRRYRNFDDYLIPSDDFEKSLRDNQLSLAILTDCHEY--NRMTLLASRLEEVNTMALAGDLPDVDISDKGVKITPLDNSVPSAASPFADLVYGMLPHPKITEMLDEVDGWTGFTRHFTHLKNNHVRPKDRKLLLTTILADGINLGLTKMAESCPGTTKLSLEGIQAWYIRDETYSAALAELVNAQKKRHLSAFWGDGTTSSSDGQNFLVGSHGRYAGQVNLKYGQEPGVQIYTHISDQYSPFYTKVISRVRDSTHVLDGLLYHESDLEITEHYTDTAGFTEHVFALMHLLGFAFAPRIRDLHDKRIFIHGKAERYPGLQSVISTTQLNLKDIETHWNEVLRLASSIKQGTVTASLMMKKLASYPKQNGLVKALREIGRIERTLFMLD*FRDPSLRRRVQAGLNKGEARNALARAVFMHRLGEVRDLGPENQNYWASGLTLLTAVISLWNTVYIERAIDSLRRKGLPINEQLISHLSPLGWEHINLSGDYVWRTNLKLGQGKYRSLRSVDSGLYKK VLQHIDRLNSIAALGLPDGITLSIHQNRLLKLAREGRKMSSRDLAKFTDVRRYATLVCVIQEAQATLTDEVIELHERILGTLFSRAKRTQAERLQLTGKLIQSKLKQYVTVGQALLHARESGEDPWAAIEDVLPWQEFINSLEETQFLSRKGNFDPLHLITEKYSTLRKYAPRMLSALQFIATPPAQTLSDALDTIRDMYRKQLRKVPPAAPTGFIPESWRKLVLTPSGIDRKYYEFCVMNELKGALRSGDIWVKGSRRYRNFDDYLIPAAEFEKSRHNDQLQLAVQTDCRAYLQARMTLLASRLEEVNAMALAGDLPDVDISDKGVKITPLENSVPSGASPFADLVYGMLPHPKITEILEEVDNWTGFTRHFAHLKNNNVRPKDGRLLLTTILADGINLGLTKMAESCPGATKSSLEGIQAWYIRDETYSAALAELVNAQKARPLAAFWGDGTTSSSDGQNFRVGSHGRYAGQVNLKYGQEPGVQIYTHISDQYSPFYAKVISRVRDSTHVLDGLLYHESDLEITEHYTDTAGFTEHVFALMHLLGFAFAPRIRDLHDKRLFIHGKAERYPGLQSVISTTSLNIKDIEAHWDEILRLAASIKQGTVTASLMIKKLASYPKQNGLAKALREIGRIERTLFMLDWFRDPGLRRRVQAGLNKGEARNALARAVFMHRLGEIRDRGLENQSYRASGLTLLTAAITLWNTVYIERAIESLKRKGIPINNQLVSHLSPLGWEHINLSGDYVWRNNIKLGSGKYRSLRTVDTELYKK 148954 994 RecName: Full=Transposase for transposon Tn2501 +NZ_JAFJYB010000008.1 P27302.5 83.861 663 107 0 85932 87920 1 663 0.0 1110 gi|54042066|sp|P27302.5|TKT1_ECOLI 2872 556 610 0 92.01 
3 0 MSSRKERANAIRALSMDGVQKAKSGHPGAPMGMADIAEVLWRDYLNHNPANPHWANRDRFVLSNGHASMLIYSLLHLTGYNLPIEELKNFRQLHSKTPGHPEYGYTDGVETTTGPLGQGIANAVGMALAERTLAAQFNRPGHDIVDHFTYVFMGDGCMMEGISHEVCSLAGTLKLGKLVAFYDDNGISIDGHVEGWFTDDTAARFEAYGWHVVRGVDGHDADAITRAIEQARAVTDKPSLLMCKTVIGFGSPNKAGTHDSHGAPLGDAEVAASREQLGWKYPPFEIPAEIYAAWDAKAAGAQKESVWNETFAAYARAYPELAAEFKRRTVGDLPANWQADAQKFIEDLQASPAKIASRKASQNALEAYGKLLPEFLGGSADLAPSNLTIWSGSVSRDKDPAGNYIHYGVREFGMTAIANGLALYGGFLPYTATFLMFVEYARNAVRMAALMKIRSIYVYTHDPIGLGEDGPTHQPVEQLASLRVTPNMSTWRPTDQVETAVAWKYAIERKDGPTALILSRQNLAQQARTAQQLADVAKGAYVLKDSDGQPDLILIATGSEVELAVAASDVLSAQGHKVRVVSMPSTDAFDKQDAAYREAVLPKAVSARVAIEAGIADYWYKYVGLNGAIVGMTSFGESAPAEKLFEVFGFTVDNVVAKASALL MSSRKELANAIRALSMDAVQKAKSGHPGAPMGMADIAEVLWRDFLKHNPQNPSWADRDRFVLSNGHGSMLIYSLLHLTGYDLPMEELKNFRQLHSKTPGHPEVGYTAGVETTTGPLGQGIANAVGMAIAEKTLAAQFNRPGHDIVDHYTYAFMGDGCMMEGISHEVCSLAGTLKLGKLIAFYDDNGISIDGHVEGWFTDDTAMRFEAYGWHVIRDIDGHDAASIKRAVEEARAVTDKPSLLMCKTIIGFGSPNKAGTHDSHGAPLGDAEIALTREQLGWKYAPFEIPSEIYAQWDAKEAGQAKESAWNEKFAAYAKAYPQEAAEFTRRMKGEMPSDFDAKAKEFIAKLQANPAKIASRKASQNAIEAFGPLLPEFLGGSADLAPSNLTLWSGSKAINEDAAGNYIHYGVREFGMTAIANGISLHGGFLPYTSTFLMFVEYARNAVRMAALMKQRQVMVYTHDSIGLGEDGPTHQPVEQVASLRVTPNMSTWRPCDQVESAVAWKYGVERQDGPTALILSRQNLAQQERTEEQLANIARGGYVLKDCAGQPELIFIATGSEVELAVAAYEKLTAEGVKARVVSMPSTDAFDKQDAAYRESVLPKAVTARVAVEAGIADYWYKYVGLNGAIVGMTTFGESAPAELLFEEFGFTVDNVVAKAKELL 148954 663 RecName: Full=Transketolase 1; Short=TK 1
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/busco_full_table.tabular Mon Jan 30 12:39:40 2023 +0000 @@ -0,0 +1,197 @@ +# BUSCO version is: 5.3.2 +# The lineage dataset is: archaea_odb10 (Creation date: 2021-02-23, number of genomes: 404, number of BUSCOs: 194) +# Busco id Status Sequence Gene Start Gene End Strand Score Length OrthoDB url Description +860at2157 Missing +1642at2157 Missing +3905at2157 Missing +6590at2157 Complete NZ_JAFJYB010000003.1 350058 352109 - 294.1 364 https://www.orthodb.org/v10?query=6590at2157 Methionine--tRNA ligase +6736at2157 Missing +7046at2157 Complete NZ_JAFJYB010000002.1 796689 798419 - 198.1 387 https://www.orthodb.org/v10?query=7046at2157 Arginine--tRNA ligase +7724at2157 Missing +7896at2157 Complete NZ_JAFJYB010000002.1 521516 524143 + 230.5 399 https://www.orthodb.org/v10?query=7896at2157 Alanine--tRNA ligase +8899at2157 Missing +8922at2157 Missing +10236at2157 Missing +13010at2157 Missing +13531at2157 Missing +13565at2157 Missing +14061at2157 Missing +14454at2157 Missing +14889at2157 Missing +17053at2157 Missing +17629at2157 Missing +18705at2157 Missing +19750at2157 Fragmented NZ_JAFJYB010000001.1 942014 943066 - 36.0 113 https://www.orthodb.org/v10?query=19750at2157 ATPase +21317at2157 Missing +22545at2157 Missing +22747at2157 Fragmented NZ_JAFJYB010000001.1 563445 564428 + 232.3 231 https://www.orthodb.org/v10?query=22747at2157 phenylalanine--tRNA ligase subunit alpha +22842at2157 Missing +23182at2157 Missing +23221at2157 Missing +24257at2157 Missing +24288at2157 Missing +25592at2157 Missing +25871at2157 Complete NZ_JAFJYB010000002.1 529172 530533 + 231.0 344 https://www.orthodb.org/v10?query=25871at2157 signal recognition particle protein +29893at2157 Missing +30130at2157 Missing +31316at2157 Fragmented NZ_JAFJYB010000002.1 770147 771136 + 138.9 205 https://www.orthodb.org/v10?query=31316at2157 Dihydroorotate dehydrogenase +31722at2157 Missing +32079at2157 Missing +32191at2157 Missing +32623at2157 Missing 
+35648at2157 Complete NZ_JAFJYB010000008.1 72373 73671 + 270.4 266 https://www.orthodb.org/v10?query=35648at2157 Adenylosuccinate synthetase +35861at2157 Missing +36028at2157 Missing +37207at2157 Missing +37299at2157 Complete NZ_JAFJYB010000003.1 83351 84868 + 371.7 386 https://www.orthodb.org/v10?query=37299at2157 Amidophosphoribosyltransferase +39322at2157 Complete NZ_JAFJYB010000002.1 861947 863317 - 291.9 395 https://www.orthodb.org/v10?query=39322at2157 Adenylosuccinate lyase +41214at2157 Missing +41305at2157 Complete NZ_JAFJYB010000008.1 61495 63021 + 186.3 366 https://www.orthodb.org/v10?query=41305at2157 Bifunctional NAD(P)H-hydrate repair enzyme +43727at2157 Missing +44076at2157 Missing +46017at2157 Complete NZ_JAFJYB010000002.1 437560 438723 + 225.2 353 https://www.orthodb.org/v10?query=46017at2157 Phosphoglycerate kinase +47919at2157 Complete NZ_JAFJYB010000001.1 1093397 1094671 + 232.2 356 https://www.orthodb.org/v10?query=47919at2157 Histidine--tRNA ligase +48934at2157 Missing +50844at2157 Complete NZ_JAFJYB010000001.1 245664 246425 + 196.6 205 https://www.orthodb.org/v10?query=50844at2157 di-trans,poly-cis-decaprenylcistransferase +51351at2157 Missing +52427at2157 Missing +54988at2157 Complete NZ_JAFJYB010000001.1 959054 960073 + 146.3 218 https://www.orthodb.org/v10?query=54988at2157 S-methyl-5-thioribose-1-phosphate isomerase +55024at2157 Missing +56027at2157 Missing +57545at2157 Missing +58019at2157 Missing +58022at2157 Missing +58340at2157 Missing +59062at2157 Missing +59314at2157 Complete NZ_JAFJYB010000001.1 745036 745983 + 111.3 169 https://www.orthodb.org/v10?query=59314at2157 Ribose-phosphate pyrophosphokinase +59861at2157 Missing +60366at2157 Missing +60670at2157 Missing +60954at2157 Missing +61613at2157 Missing +61936at2157 Missing +62508at2157 Complete NZ_JAFJYB010000003.1 214280 215317 - 137.7 179 https://www.orthodb.org/v10?query=62508at2157 Phosphoribosylformylglycinamidine cyclo-ligase +63341at2157 Missing +64860at2157 Missing 
+65833at2157 Missing +66209at2157 Missing +66811at2157 Missing +69351at2157 Missing +70269at2157 Missing +70525at2157 Missing +70865at2157 Missing +72726at2157 Missing +73593at2157 Missing +74812at2157 Missing +75288at2157 Missing +76134at2157 Missing +76877at2157 Missing +78046at2157 Missing +79065at2157 Missing +79845at2157 Missing +80498at2157 Missing +80501at2157 Missing +80629at2157 Missing +82104at2157 Missing +82755at2157 Missing +82853at2157 Missing +83050at2157 Missing +84219at2157 Missing +84684at2157 Complete NZ_JAFJYB010000002.1 717347 719023 + 127.1 387 https://www.orthodb.org/v10?query=84684at2157 Translation initiation factor 2 subunit alpha +85023at2157 Missing +85279at2157 Missing +85293at2157 Missing +87367at2157 Missing +87520at2157 Missing +88531at2157 Complete NZ_JAFJYB010000003.1 105180 105644 + 65.6 96 https://www.orthodb.org/v10?query=88531at2157 6,7-dimethyl-8-ribityllumazine synthase +89321at2157 Missing +89943at2157 Missing +90096at2157 Missing +90641at2157 Missing +90817at2157 Complete NZ_JAFJYB010000001.1 1045496 1049383 + 71.6 176 https://www.orthodb.org/v10?query=90817at2157 phosphoribosylformylglycinamidine synthase I +90882at2157 Missing +91154at2157 Missing +91297at2157 Missing +91632at2157 Missing +91936at2157 Missing +92409at2157 Missing +92795at2157 Missing +93236at2157 Missing +93256at2157 Missing +94875at2157 Fragmented NZ_JAFJYB010000001.1 247306 248658 + 65.3 255 https://www.orthodb.org/v10?query=94875at2157 PDZ domain-containing protein +94889at2157 Missing +95578at2157 Missing +96138at2157 Missing +97230at2157 Missing +98179at2157 Missing +98187at2157 Missing +98221at2157 Missing +98657at2157 Complete NZ_JAFJYB010000002.1 444459 445115 + 149.0 181 https://www.orthodb.org/v10?query=98657at2157 Ribose-5-phosphate isomerase A +99236at2157 Missing +99734at2157 Complete NZ_JAFJYB010000002.1 505471 506289 - 135.2 173 https://www.orthodb.org/v10?query=99734at2157 16S rRNA (adenine(1518)-N(6)/adenine(1519)-N(6))- 
dimethyltransferase +99842at2157 Missing +101957at2157 Missing +102178at2157 Missing +102360at2157 Missing +102399at2157 Missing +103467at2157 Missing +104254at2157 Missing +104636at2157 Missing +104702at2157 Fragmented NZ_JAFJYB010000002.1 442619 442915 + 14.8 65 https://www.orthodb.org/v10?query=104702at2157 GHMP kinase +104786at2157 Missing +105095at2157 Missing +105165at2157 Missing +105421at2157 Missing +105604at2157 Missing +105851at2157 Missing +106462at2157 Complete NZ_JAFJYB010000001.1 1088327 1088758 + 126.1 121 https://www.orthodb.org/v10?query=106462at2157 Nucleoside diphosphate kinase +106603at2157 Missing +107015at2157 Missing +107212at2157 Missing +107993at2157 Missing +108145at2157 Missing +108717at2157 Missing +109335at2157 Missing +110798at2157 Missing +111803at2157 Missing +112466at2157 Missing +112720at2157 Missing +113971at2157 Missing +114285at2157 Missing +114541at2157 Missing +115384at2157 Missing +115425at2157 Missing +115808at2157 Fragmented NZ_JAFJYB010000003.1 268875 270056 + 56.1 143 https://www.orthodb.org/v10?query=115808at2157 Geranylgeranyl reductase +115947at2157 Missing +116294at2157 Missing +116732at2157 Missing +116879at2157 Fragmented NZ_JAFJYB010000002.1 490837 491310 + 59.6 80 https://www.orthodb.org/v10?query=116879at2157 Peptidyl-prolyl cis-trans isomerase +117225at2157 Missing +117241at2157 Missing +119044at2157 Missing +119723at2157 Missing +121171at2157 Missing +121548at2157 Missing +121943at2157 Missing +122290at2157 Missing +123463at2157 Missing +123503at2157 Missing +123853at2157 Missing +123859at2157 Missing +124073at2157 Missing +124429at2157 Missing +124805at2157 Missing +124913at2157 Missing +124973at2157 Missing +125162at2157 Missing +125788at2157 Missing +126193at2157 Missing +127293at2157 Missing +128227at2157 Missing +128960at2157 Missing +129321at2157 Missing +129447at2157 Missing +129924at2157 Missing +130316at2157 Missing +130364at2157 Missing +131584at2157 Missing
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/contig.fasta Mon Jan 30 12:39:40 2023 +0000 @@ -0,0 +1,100 @@ +>NZ_JAFJYB010000008.1 Candidatus Symbiopectobacterium endolongispinus isolate SYM 10, whole genome shotgun sequence +AGACGATGGAGTTGATTTGCCCTTCATCCAAGGCACGGCCAGGTTGCAAGTTCAACGTTACGGACGCAGAGGGTGCCCTC +TGTTCGCGAACAAACAGTGAGGGCTTAGGTATCGCCAGATGCACTCGTGCTGTTTGCACGGGTCCGAGCGTTTCAATGGT +CCGTGACAGTTCGCCTTCTAGCGCCCGCTGATAGTTGATCTGCTCGCTAAATTGGCTGATGCCAAACTTTTCCTGATCGA +GCAATTCAAAACCAACCGCCCCGCCTTTGGGAAGTCCCAGTTGAGCCAGGCGTAAACGGGTTTCATACACGTTTTTTGAA +GGGATCAGGATTGCACTGCCACCTTCAGCAAATCGGTAAGGGATATTTATTTTTGTCAGTTCGCTGACAATGGCTCCACC +ATCACGGTCATTGACGTTATTGTAGAGCACCCGGTAATCAGGGCCTTTTGCCCATAGTACCATAGCGACAACAATTGCAA +TTGCAGCGGCCGCCGCAACTAACAGGGGAATTTTAGGATTGGCGCGCAAGCGGTTGAGTATCTCGCCAAACCCTTTTCCA +CCGGACATAAAACCGGTTGCGGCGTTCATACTCGTCCTCTGCTTGGTTGTTGAGCGATAAAATTAACGTTGGTACGTAAC +AAAACAGCACTCCCTGATTGCGCAATCGTTAATACGTGCACCTACTTTTGTCAGCATAGTATTATTTTCCGTAACGGCAA +AAACGATGCTCCGATAAGGTGGCATTTTCCCCGTCTTTTACGCCTTTTAGGATAAGACTGATATGGTAGTTTAGTGCACT +GTGTTAATTGGGTGGTTTTTGTGCGATTAGGAAAAGTGGGGCAATAAGCCCCTTGTCGCAAAATCATTTGCGAAAGATGG +TGCTGTTGTGGGGCATTCCTGTCGGAAAAGGTGAGAGACAATGTCAGTTCAAGGTATTGAGAGCGTAGTGCAGCAATTGC +AGGCTACCGCGTTACAAGCGGGGAACAATCCTGGCGTTAAACCGACTATCGAACCTGGTTTTGCGAGTGAGCTAGAGTCT +GCATTGGATAACATTAGTGGCACTCAACAAGCCGCACGTGAGCAAGCGCAAAAGTTCACCTTGGGTACACCTGGCGTTGA +ATTGAATGATGTGATGGTGGATTTACAGAAATCCTCAATCAATATGCAAATGGGTATCCAGGTACGTAACAAGCTGGTTG +CTGCTTATCAGGAAATAATGAGTCTTTCCGTCTGAGCCGGTATCTGGCTAAATCGAGTTGGTAGGCTTCAGTGTAAAAAA +ACCATTCCGACGACGTCAGAATGGTTTTTTATTGCATGCGGCAAATTGCCCCGGCACCGTCACTCTTGAGGATTAATATT +GCCAGGAATAACACCTTGGGGTGAGAATTCACCGTAGGCTGCATTGACACTATGCTGCTTAACTGACGTTTGCATTAATG +AACTCAGCTCATCCATGCGTTTTTGCAGTAACTCTTTTATTTGCGCTTCACTTTCTACGATTTCTCGCAAAATTTTGCGA +AATTGCAACCGCATCACACTGTCCAGATTATCGGGGATCGGCATCTTGCTCAGATTCTCCACCGACTGGATGTAGATAAT +CTCTTGTTCGACCACTTCATCCCATGCGCCGTTGTTAGCCAGAGCCAATATATGTCGGCTCAGTAGCTGAAGCTGCTGAT 
+AATCCTTTAGCAGTTGCGAAGGCGTTGTCATTTATGCTGCTCCGCTCTGTACCGCTTGCGGTGTAGGGCCAATCTGGCGC +CAGGCATCAGAGATGCTGTTAAGCAATGTTTCAACTTCGTCGATAACTTTTGCATCATTATGCAAGTTGGCAATCATTAA +ACGTTGAACCATGTAATCATAAAGGGCTGCAAGATTCTCTGCCAACTCACCGCCTTTTTCTATGTCTAAGTCCGCTTTAA +GGCCATTCGTGATGATATCGATAGCTTTGGATAAAGCGTAACCTTTACCAGCAATATCATTCTGCTGTAATAAAATCCGC +GCACGGACCAACGCACTGCGCGCACCGTCAAAAAGCAGAACAATGAGCTGATGTGGGCTGGCGCTCATCACACTGCTTTC +CAGGCCAACTTGGGCATAGGCCTGGCTGCCGTTTCTGCTGTACATCAGTGACTTTCTCCATTAACTACCTTTTGTTTAAG +GCAGCGAGTTGTGTTGTCAGATAATCGCCGGTGCTATTCATTTTAGAAACCAACGTATCCAACTGGGCAAACTGTGCTTT +ATAGCGCGCAATAGTATCTTCGATACTTTGCTGAGTGAGATCGTAGGTTTTCTTAATGGTTTTCAGCGTCGCTGCAATAC +TGTCTTTCGCGGTTTGGATTGCCACTTTGCTGGAATCAAGAACGTTGTCTAAATAATTAGTGACTTGTGTAGCGTAGCCG +GTGGTTTTTCCATCGCCAACGAAGAAATCTAATACCTGACTGGAATTATCTGTCAGTGCAGTTGTTAGCTTATCGCTATC +AATCTCAAGCATGCCGGTTTTGGGGTTTTGTTTAACACCCATTTCGTTAAGCGTACTGATATCCATACCGCTCTGAGCGT +AGGAGATTTGTGTTTTCAGTGAGGTCTGGATACCTCTGACAGTACTGTTACCAAGCAATACACCGTTACTGGTGCTTTGT +GCATCAGAACCAGAATCTACCTCTGTGTATTTGGTCAAGGTACCAATTGTCGTCTGCAGTGCATTGTACGCATCGACGTA +ATTTTGAACGGCTGTCTTCATCGGTGCAATATCACTGGCGATTGATAATGTCTCTGATGAGTTCGTCGCTGTTTGGGGTT +TCAAGATTAGTGTAACGCCGTCAATAGCGTCAGAAATGTGTTACTTTGACGCTCAATCGTCATGCCATTGAGCTTTATTG +ATGCATTTTGCGCGGCAGTCTGCTGCGTCATTGCACCACTGCCAGCACCTGTATCGGAGGTATAATTCAATTTGCCATTC +AGCGTGCCATCACCGGTGACGCTGATAGTCATCTTGGCATCGGTGCCAGTGTCTTTGGCCGTGATAGACAAATAATAAGT +ATCGTCATCCACTTTGATGATACTCGCACCAACATTGCCATTAGCCTTATTAATTGCATCACGGATGCCCACTAATGATG +TTTGGTCATCGGTCAGTTTGATTTCAAGTGGTTTATCCTGACCTGGCTGGCTGATAGTTAGGGTCCGGGTATTGTTTTTT +GTCGCTGATCCCTGCTGTGCTGTATTGCTGGCAAATTCACCCGAGATCAAGGATTGCGCGGTAGCAAGTGTCTTCACTTC +TACACTGTAATTGCCGTTAGTTGCTTTGCTATCCGTTGTTGCAGTGAAGGCGGTATTGGTGCTGCTGACACTGGTTTTAT +TGATACTGCTTGCTTTGGTCAATGCTTCTGCGGCAGTGTTCAGCTTTTCTAGTGCACTCTTAAGGGTGTCAAAGGCTTTA +TCTCGGTTTTCTTAAAGCGTTTGTTGTGCCTTTACCGGGGTTAAGCGAGTCTGTTCATTGGTTGTTAATTGCGAAAGAAT +ATCGCTCATTTCGCTGGTGGAACCTGTGAAGCTGATGCTTGCCATGGTAATTCCTTATGAATAGGTTAATGCCTTCTAGA 
+AGCTTATCGGCAAATAATGAACAAAGTTTAGTATAATCTTTCAGTAGAACTGAGATGGCACGATGGCATCCGCTACAGCG +TATTTTAATCAGTAATCCACCTCGAAGGAAATTTTAAAAAATCATTAAAGCTTTTGAAAGGAGCGCCGATATCAGGTAGG +ACGGTGATGAAACCGTGGGCGGCAGACGCTGTCCCCCCTAACTGACTTGAATTGAGAAAGGAATACAACTATGGCAGTGA +TCAACACTAACAGCCTGTCTCTGGTAGCACAAAATAACCTGAATAAATCTCAGTCCGCACTGGGGACAGCTATTGAACGT +CTGTCTTCAGGCTATCGCATCAACAACGCTAAAGATGATGCTGCTGGTCAGGCGATTGCTAACCGTTTCACCGCGAACAT +CAAAAGTCTGACTCAGGCTGCTCGTAACGCCAACGACGGTATCTCAATCGCGCAGACTGCTGAAGGTTCTCTGAACGAAA +TCAACAACAACCTGCAACGTATCCGTGAACTGTCTGTTCAGGCGCGGAATGGTACTAACTCTGCATCTGACATCGACTCC +ATCCAGTCTGAAGTTAACCAACGTTTGGAAGAAATTGACCGCGTTGCTTCTCAGACTCAGTTCAACGGTATCAAAGTGCT +GTCCAAAACCAGTGCTGATACGTCTATTTCCATCCAGGTCGGTGCTAACGATAGAGAAACTATCAGCATCACCCTGAAAG +GCAACTCTGGCTGGAACAAATTTTATTCCGCTGGTTCTGCCGCTGCTTCTGGTGGTCAGGTTACTGTTTCCGGTACCGGT +ACTGCTGCTGGTCAACGTCAAGTTGGCGCGAAAGGTGTTGACGTTCTGGATACTACCGTATTGGCTGATGTTGACGCTGC +ACTGAAAGCCGTTGATACGCAACGTAGTGATCTGGGTGCGATTCAGAACCGTTTTGAATCCACCATCAATAACCTGAACA +ACACCGTAACTAACCTGACTGCTGCACGTAGCCGTATTGAAGATGCTGATGTGGCGACCGAAGTGTCTAACATGAGCAAA +AACCAGATTCTGCAACAGGCTGGTACTGCTGTATTGGCCCAAGCCAACCAGGTTCCGCAGACTGTTCTGTCTCTGCTGCG +TTAATTGCTATACTCAGTTTTCAAAGCCAGTCTCCGGGCTGGCTTTTTTTGTTTAAAAGCACAAGTTTTTATTTTTTACG +TTAGTGCCGGATAAACGGCTAGAAGAATAACGTCCTTGCTGGATTGTGCGTGTACCAAGGTTGATAGTCCACAGATTGGT +TTAATTGGGAGTTGGTCAAATGGCGGCTTTAGACAGTAAGTTGGACAACAAGAACAATAGTGACGTAAAGAACACCACGG +CTGAGGACATTGCTCCAACCCCAATGGAACGAGTCTATGGTTCGGTTGAACATATTCGGGCTGTTTCGTGGCTGTACGGC +ATCGACACTGTGCCTGCTGAATATTCGCGTACTTTAGTGCTTGGGTGTGAAGACGGATTAAACTTACTGCCTTTTGCCTC +CGCTTACCCTTCTGCGCAGATCGTTGGGGTCGAATTAGCATCAGAGCCTCTCCCTGAAAAACAGAAAAATGCAGATATCC +TGTTGCCGACCAACCTACATCTTTACAGTTTGTCTCTGGAGGCATTACTGGGCAACTCGTGGGAGAATTTTGATTACATC +ATTGTTCATGGGAGCTTTTCTCTGCTTGCCAATGAGGTGACCGATCTCTTGCTGGCGTTTTTTCAACAAAAGTTGAGTGC +GAAAGGCATTATTGCTCTAGATTGGTTTTGCCAGCCCGGAGCTAAATCCATGGAGGCACTACGCGATGCGATCCAACTTC +ACAGTTGTCGGGGAGAAAATTTTACCGAGCAAGTCGAGCAGGGAAAAGCGATGTTGTCTTGGCTTAATCAGGTATCCCCG 
+ATGTCAACTGCTACCGAAAGCAGTCTTGGCTTACCTCTGAAGAAAGCGAATGCACTGTCAGACGATTTATTCATACACTA +TTTTCTGGAAAGCAAAAACGAATCCAGTTATTTAGTCGAATTTAATAACCGTATCGAAAATTGCGGTTTGGCCTACGTGG +GTGATGTGAGGCCTGAAACAGAAACGCCCGATTTTTACAATAAAGCGTTAGATGAGCGGTGGCAGGATATCGCCTTTGGA +TGTGGAAAGGTGATGGGTCAGCAATATTTGGATATTGCAGTAAATCGTAGTCAGCGTTTTAGTTTATTGGTATCGCAGAG +TAGGGCTCCAGAAGTATCTGAACAGATTGATTATTCCCGATTGGCGGATATGCGTTGGGCTGGAGGGTTCCGCCGTCAGA +CTTCCGATCTTCGTGTTATTCATAACTCGCTCGCCAGTCATGATAGTGTCGCTGTTTCTACAGACAATATTCTGGCGATG +TGTATCCTTGACACCCTCGGAGATGCTTGGCCGTATAGTGTCAGCTTTGACCAACTCGTCTTTCATTATCGATTGCCAGA +TGATGATCCAGAATCGCCTTTTTCGGCCGATCTTGAGAAGAAAATAATCAATGCCCTGAAAGCATTGCTGAATAAAGGCA +TCTCAAGCCTCCATTTTCAGTTGGACAAAGATCGCCACAGTTTGTGCAATGAGCACCAAGTTGCAGCCAGCGAGAGTGTT +AAGCTCCAGTTGCAGAGTGCGCCAGGATCGCTGTCTGTGATTAATCTGTGGCAAGAAGTGGTGGGGCTTACGGAAGAAGA +ACGGGAACAACTGTTACTTCCAAGCTTAACCCTTACAGCAACCAACCGAACGTTGGTTGACAGCCTTCACCATAAAGGCG +TGTTAAATGCATCTGCACTGGGCTGGAAACGCTATTATCAGCAGGTCGCGCGCAATGCCGAATTGGTTGATCTTAATCGA +GTACCTTGTGCGTTATTACTGTTCTCCAGCGATGTTTCGGCAGGGGGATTCTATACTCGCACCTTTGAACTCCTGGCCAA +TGAAACAGATACAAACGCTGCGAATCAGGATGAAGACTCGATAGATGGTAAGTTGGTTGTTGAAATCAATAGTCTTCTGA +TTAAAAGTAAAAATGAAAAAGCGATCGCGCTGGTAGAGCATGAACGAGAGCGACTTCTGAAAACTATAAATGGTTGTTAT +TATTTATCACGATTTTATCGGCGGGTTGCGGATGATGCATCAACTGCACTGATGCTAACGCGTATATTATCTTATAACTC +AACGAGTTTATTTGTTTACTCAGGGTTGGCTATGGCGCTCTACCAACACCGAGTGTTTTGGACTGCTGGGCGGTTAGCCC +GTGCAATTTTGCGCTGTAACCGGAAAAGCTCGCCAGATTGGTTTTTGCTTGGACTCTTACATAAAGAGAGTAAAACATTA +GATCATGCCGAATACTGTGCACGACAGGCGATGGCATTAGTGCCAAATAGTCAGCAAATCGTTGGTCTATTGGGGGGATG +CCTTTGCGAACAGGCAAAGACCGATGAGGGAATTGCGTTTCTACGTAAAACGATAAGAGATCCGATTTCTGATTACTATG +TCTACAGCCAATTAGCATTTATTCTTTCTCACAGTAAAAATGCGACTGCCCAAGAGCTTATGGATTGTCATTTAGCCTAT +GCCAAAGGCGAAATGGCATGGGCAGCGCATCAGACGTTCGAAGGTTATCAACCTCTCGATAAATCTTTCGATAGGAAACT +GCGTATCGGTTTTGTATCTGGTGACCTTAGAGATTGGCATCCTGCGGGCTTTTTCTTCACACCGATTTGGGATAAGTTAG +ATCGGGAACAGTTTGAATTATACTGCTACAACAACAGCCCCTCCTATTTGTGCAATGCGGGTACGGATCACTTCGAAGCA 
+ACCGCAGATGCCTGGCGAGATATTCAACATGTCAACCCAATTGAATTAGCCGAAATGATAAAGACGGATAAGATTGATAT +ATTGATCGATCTTTCTGGGCATACCGGGTACAACCGGTTAAGTACCTTTGCGTTAAAACCTGCGCCGATACAAATTTCTT +GGGTTGGCTATCATGCTACCACGGGATTGCCTGTAATGGATTATTACGCGACTATTTTCCCTGTGGCGAAAGATCCCTTA +ATTGAGGCGCAATTTACGGGAAAATTGATCTACCTTTCTCTGCCGAATAGTTTTGACAACAAGGAAGCCACGATCCCCGT +CAACCCATTGCCCGCACTTAAGAACGGCTATTTCACCTTTGGCAGTTTCAACCGCCCGAATAAGGTCAATGATGATGTGT +TAGATGCGTGGGCGGAGATATTAAAACGCGTTCCAACGTCAAGAATGCGTATTGGCAACATGCCGAGCGCTATTTGGGCT
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/reads.fastq Mon Jan 30 12:39:40 2023 +0000 @@ -0,0 +1,200 @@ +@NZ_JAFJYB010000008.1_0_1/1 +GATCTAAAAGCTATATGGTTAAAGCTAGCAAAAGAAAGAGGGAATGAATAATACGTTCCAAATTGGAACAAGAGTCCACTATTGATAGTGGACTCTGTACGATTTTTAACCACCATATCCGCTAGGAAAGGTATCACTGAATGCCTGACGA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000008.1_0_0/1 +CGTTATGCCTTGGTTAATGGGGTTGTTCGCAATGACTCTGGTGCCCAACTGGATTTGGGGCTGCAAGGCAAAGCGACCTTGGATGATGTGCGGCAGATTTTGTAACTGAAAGACAGCATTGAACACAGAATTTGGCCTACCTCGAAACCCG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000009.1_0_0/1 +ATGAGGGCCAGGAGAGATGCATCGCCGCCGATACCATCATCGTCTGTGCAGAACAGGATTCACGGCGCGAGTTCTATGCGCCATTGCAGGCCAACTGGTGCGCCGTGCATCTGATTGGCGGTGCGGATGTCGCCGCCGAACTGGATGCCCG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000009.1_0_1/1 +CTTAAGCAAGGAGTCGCCTTCCTTTCCTGATGGTGTGGCCAATTAAGGCCACACTGTTGGGTAGCATCTCGTGATAAAAATCACGCCTTGCGGCAGACGAACGTCTGCCGTTATTGGTAACCAATCACCACTACTTTGACCGTTTCGCTTA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000010.1_0_1/1 +TAAACAGGTACTTATGCAGCTCGCTCTTGTCTTTGTGGCGCACATAGTGCGGGAAGTAATGTTCGACAAAATAGTCATACCCGCTGACCGGGTCGAATACGCGTGCGCGTCGTTCAGCTATGGCCGCCGCAGACGGGTCAAAACCAACACA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_6_1/1 +GCGGTTATCCAGGTTGTAACGGTGTGCCAGCGTGATGGCAGCCGGGCCGATAAACTCAGGATTAAGGCCAAGCTGCGGGCACGCGGCGTAGCACAGGCCACAGTTGATGCAGTCGGAGAACTGATGGTATTTCGCCATTTGCGCCAGTGTC ++ 
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_7_0/1 +GCGATGGCGTGGCGATAAACGCTGTGCGTGAATGGGATGGCATTCCCTGGCAAGATAACGTGGACAAGCCAGCAATACTGCGCGCCAGTGAATGTAAGCGCCCGCTTACTAATAATTGGCGAGTGACCAGCTATTCTGGTTTACAACAGCA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_6_0/1 +AGGATTGATCTCTGTGCCAGCCTCGCCAAAACAGTGGCGGCGGCTTGATGGAGACGGGTTTATACGCGTTGGTTGTTGTGGATTGCCTGCTTAGGCTGGCGTAAAATCCTTATTTGCGGCCTGCCAGATGATCCTCCTTTTGGGATCTCGC ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_8_1/1 +TGGCGCAGGCAGATGTCGGGCTGGCCATGAACCAGAGCACCGAGCTGGCACAGCAGGCGGCGGATGCGGTGTTGATGTAGGATAGTCTGCACGGCGTGGTGCTGGCGCGTGAACTGGCGCTGGAAGCGATGAAACTGGTGCACAGCAACAT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_3_0/1 +TTGGCGAGCGGAGTCACGCGGCGTCAAACGCAGATACTGGGTGCTGAATTTCACTTGCTCATCATAGCGATAGTGCGTGAGATGATTAATGGTCAGTTTCATACCGTCTCCAGATAGGTTTGTCGCACGCTGTCAGCCAGCGCGTTGATTC ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_2_1/1 +CACCCACCTGCGTGCGACCTGTCGCGAGCAGAACCCGAAAACCTTCCACGAAGCGGCGCATCTGGGCGGCGACGTGAATATGGTGGCAGTGGTGAAAGCGATCCTGACGGAAGAATCACGCCGTAAAGCGGCGGGCGATCCGCGTACGATT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_4_1/1 
+GCGAACAGGGCACGCCACAGTACGGCAATGGCTACGCTACTACCGAGAATAGACGGTACATAGTAAGCAGTACGGAAGAAACCGATACCACGCAATTTGAAATTGAGCACAAATGCAATAAGCAGTGCGAAAATCAATTTCAACGGAATGG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_0_0/1 +GCTTCATGCCGCCGCCCTGTTTCAACGCTGGTTGCAGGACAATCATGCTGTCAATGCCACCGCCGTTACCAGCAATGCCGCAGGCAAACGACTTGATAGCGTGCAATCGCTGTTTTTCAACAGCTATGACTGGATGTGTAAGACACCGTAT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_9_1/1 +GATCTTCAGGGCACTGTTCCACGAAGTAGCTTAAATCAGACACCGCGATATGGTCGCAGTCCAACTGTGCATAGATCAAGCCGCGATCGCGAATTCCATAAGGGTCTTCCGGATCGAATTGCAGCACGGCTTCACTGGCCCGCAACGCAAG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_7_1/1 +GTGCCACTGCGGGTAATGTCGCCCGAATATCCGACCAGCTTTTTTCCGCAATACCCTGAGATATCGCCCAGGCAATAACGGTAGCGCCAGCCACCGCAATATTTGATTTGTGAGTAGGGCTAGACGCGAGCGCCACGGCATCAATGAAATC ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_1_0/1 +GGCTGTCACCACCGTCGCCCGCTTCGCCAATGTCAGTATTACCCGCTGCTGGCGCTTCCAGGACTTGAGTCGGGTCTGCGCCTTGTGCGAGCATCCTGTAACGCTGCCACATCCTGAGCGTCTTGTGCTGTGGCCTGCGGCATTACGTTGG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_3_1/1 +GTCAGGTCGACCGTTTCAACCGACGGTGTCGTCAGCAATGGCGGTAACCCTTCGCTTAATAATGGGCGTAACGTCTCACGGATATCATCACTGACCACCAGCGATGTCACCAGAAATTGCTCCATTCGTTCCCCATTGCGATCCTACAAGT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII 
+@NZ_JAFJYB010000001.1_0_1/1 +ACCGGAGGCTTGCTGTCCAGAATTTTACGCAGTTCACCCAGATTCTGCACCGGCTGCTGGTTCACACTGAGGATAACGTCATCCTTCTTCAAGCCGATTTTCGCGGCCGCCGATCCGGCTTTCACCTCGTCCACTTTCACGCCTTTCTGGC ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_5_1/1 +TGGGCAATCAGCGCATCGACTTTGACTTGCAGCGTTGCTTCCCCTTTCTTGATGCCGATATAACACGGTGAGTCTTTCAGCATAAATTTGGCAACCGGAGCCTTGGCGGGGTTTTGTGCCGCAATGGCGGCCACCACCAGGTTACCAGTAG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_4_0/1 +TGATAGCGTATGCAAGCGGCGGGCATACTCCAACGCAGCATCCGTGTCGTGAATGGAACAGGGTCCACACACCACCAATAACCGGTTATCGCGACCGTGGATAATATCGGAAATGGTACAACGTGCCGTGGCAATGGCCTGCTCTTCTTGC ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_5_0/1 +TGGAGATAGCGATGGTGGCGATAACCGGCGCCAGATAGGCCATGACTGGGTTATTAAAGTGGTTTGCCAGGTAAGACAAAATGGAAATGTTTTGCGTTTTGGCTTCCATCAGTTCTGCAGGGGACAGGCTCAGTACACAACTGAACACAAA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_2_0/1 +GTAAATGAAGTTGGTGCGTAATAAAACTGTCTACCGTATTGGTTATCGCTACGCTATAAACCAACAAAATAGGGTAAATAGCAAAAAAGTAGAGCAGCGTGATTAATTTCCCTGCGCCGACACCGAAATGTTCTTCGACCACTTCAGTAAT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_8_0/1 +CTCGTTGTCCAGCAATCGCATCGCTGTGCTGGCGGCGGATAAGCAGCGCGGCGCGGTAGTTGGCTTCGTGGCGCTGACGCTCCATGTTCAGATGACGCAGTGGTGAACCTATCCACTGCGTTAACGCCATACCCAGCAGGGTATAGAGAAT ++ 
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000001.1_1_1/1 +TGGGTGTTGTCGGGGCGATCATGTTGTTTGCCACCTGGAGCTGGGTGCCAGAGAGTCTGCCGCGAGATCAGCGCATGCAGGGCAATATTGGTTCGGCTTTTGTAGGTTATGCCGCGCTTTTTCGCCAACGTATCTACATGGGGTATACCCT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_0_0/1 +AAAATTGACGCCGGGCTGCCTGTTTATCGCTCTGCGCGATGAAAAGTTTGATGCCCATGATTATGCCCATCAGGCAGTACGCGGTGGTGCGGCGGCTCTGTTGGTCAGTAAGCACTTACCTATCGACGTGCCACAACTGTTGGTGGGGGAT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_5_1/1 +GCAGCATAAAGTCACCGAATTTATTGATGACATGGCGCAAGCCTACAGTTGGGCCGACGTGGTGGTGTGCCGCTCTGGTGCGCTTACCGTCAGTGAAATTGCCGCCGCCGGTTTGCCTGCGCTGTTTGTGCCCTTTCAGCATAAAGACCGG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_3_1/1 +GCACCGACGTCGTTACAGGCCACCAGCGCCAGCAAATCGCCTTCGACCTGCTCCGGTTCACGCACGTTGGCGCGAATAATATCCAGCACCACCTGATTGATCTGGCCGCCATCGATAAAGCGCAGCAGCTGCAAAAACAACCCTTCGTGAT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_2_0/1 +ACACCCGCATCCTCAAACTGCGCCAGCACACAGATATCAAAGCTGTTTGAGCAGGTGAAAAAATGGCGTGTACCCATGGTGAGCCAGCCGTTTTTTAATCTGCTTAAGTCTTCTTTATGGGGGAGTGTCAGGGAACCGAAGGTTTGGTAGG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_1_0/1 
+GTTACACAGCGAAGGAAACGAGGGCGTTCGGTCATCTATTGAATCTTGAAACGAGGACAACGGCAGTGAGGAGTCCACAAAGCAATGGAATGGCTGAGAGCTTCGTGAAGACGATGAAGCGCGACTATATCAGTATAATGCCCAAACCGAA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_4_1/1 +GTCACCGGTAATGACGCAGGCGGCATGTACGGCGACAATTACGATCTGCTGTTAGGCGGTGGCGCCTTCGGTTTTGCCATGAACTCAGGCCGTATTGCCGCAGAAAGTGCGTTGGATTACATGCACTTCAAAAAACAATAATACTGCTCGC ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_6_0/1 +GGAGATGGTAAGGGCGAGGTAACGCCAGGGGAAACATGCGGGATGTGCTTTGAACGCGCAGAAACAAAAAACCGGCCAGAGCCGGTTTTTTCTTACAACGAGGAAGACAGATGTCTACGCAAGCAATGATTACAGTGCGTTGATCTGAGCA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_6_1/1 +CCGCTGAAACTGTCTCGTGCGCTGGAAGCTGCGGGTGTGCCGGTTATTGGCACCAGCCCGGATGCTATTGACCGTGCAGAATATCGTGAGCGTTTCCAACAGGCGGTGAATCGTCTGGGCCTGAAACAGCCGGAAAATGCCACCGTCACCT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_4_0/1 +GCCTTAGCCTGCTGGATGAAGAGATCAAAAACCTGAAAGGGAACGTACTGGACGGTGAGACGGCGTTCCGGCTGTATGACACTTACGGCTTCCCGTTCGATTTAACGGAAGACGTGTGCCGTGAGCACGATCTTACGGTGGATAAGGACGG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_2_1/1 +AGGCGTGGTCATTGAGCAGTTCCGCCACTTTATGCAGCAGTCAGAAGAGCAGATCTCCATGGTTATTCTGGAAGCCTGTGCTAACAATATGCTGTTTCTCGGTGAAGAAGAAGAGACCTCTCCTGCGCGCACTCTGTCACACAGTCTGCAT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII 
+@NZ_JAFJYB010000002.1_1_1/1 +CAGTGGTGATAAAACGAAATTAGAACTGATAAGTTATACCAACAGCAACTTTGTCATCATCATTGATGCCGTAGAGGTTGTCAGATTTGATCAGGTTAATTTCGTACTCAGAGTATACGGAGAAGTTTTTGTTGAATGCGTAGGTTGCACC ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_3_0/1 +AAATGGTGGCCAGCGCGTTGACTTCAGGTGAGACACCCACTTTGACCATGGAATAGATTTTCAGCGGCAAGATTTCATAAGAAGGACCCGTGACAAAGGATGATACCACCACATCATCCATGGACAGGGTGAAGCTCAGCAGCCAGCGGCA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_0_1/1 +CCTTTTGTCAGCGGTGGGGTGAACCCGTTGGCGCTGAATTCGACTGAGCTTATTCAGCGTCGAATGCATGCCGACAGTGAATTAGTGGCGGCGTCGTATACCTCCCCCCGCGCCGCCGCACAAGCGTTACAACCGGTAATACAGCGACTGT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_7_1/1 +TTTGTTCCTCAATCAGATAGTAATTACCCAGTAACCATTCCCCTGCGGGCGTAATACTGGCTTTATCGGCGGCACTAAGCATCGAGCAATGCCGCGTGATGACCGCTTCATTCTCCGCCAGACGCCGGGTTAAATGGTAAGGCATTTATGT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000002.1_5_0/1 +TATCCTGCCTACGTGTTGCATACGGTTGCTTTGCTGCTGTTTTTTATCGCCATGTCAGTGCAAATCTGGATACCCGCTTATTTGCATCGCGTTTTTGCGCTCACCAATCCGCAGGCTTCAGGCTTTTTGGCGCAGGTGTTGCTGTATACGT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_2_0/1 +CAGTAATAAAAATTTCTGATTTTAAGACGTATTGAATACGTAATTGAAATTTCCAAGAGGTGAGGTATGTCAGGTGTAACTATAAATTTAAATGTTGCAGCTCCTTATTTATCTCTAAAAGAATATGCCAGAGTAACCGGCATACCCTTTG ++ 
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_4_0/1 +TGGGATCACATCGAAGTCCGCGCCAAAGAGGAAAGCCAACGCGAAGAGATTCGCGATGCGTTAACCCGTATTCCCGGCATTCATCATATTCTGGACGTTGAAGACCACGCTTACACCGACGTGCACGACATTTTTGAACAAACGTTGGCGC ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_4_1/1 +TCCTGTTACTTTCTCGTCGATGGGGGCAATTAAGCCTATGGCATCGGTCGGCTCAAAAATTGTAATGGCGTCTCAATTATAGAACCGCGCATTAAAAATGAAAACCATGGGATGTTAACAATACCGTCCCCATAAAGAAAGTGAGCATTCG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_3_0/1 +TGGCTTTAATGGATATTCCGGATAGCTCACTGATTTTACTGTTATTTAGTCCATGTTTGTAGCCCCATAATACCTCCCGCTCGCGTGGACTGAGGCACTGCACGATATTATATTGCTGTACGTGGGGTGGAATCCCAGACGATAAAGGGCT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_1_0/1 +TACCATTCGGGGCTATACTTGCAGCAAGTTTATTTGCCCATAAAACCATAAGTTATATTCATGAAACATATATCAAACCACGCGCATTGATGCTGTTTTTGACGATGATAGCTAATCGATGTGCGGATGAGATTATTTACGTCTCTCATTA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_0_0/1 +GGAGGTTCCGTCAGAGGCGATAGCAAACACGGTTTCTGCCACCGAAGGGGATAATACAATATTGTCCAGAAACGTACTGATATGCTGTTTAAATTCAGAAGAGTGAATAACGACATCACAGGCTCTGAGTTTGCTCAAAAATTGGGAAAAT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_2_1/1 
+GATCCGCTTTCGCTCAAAGGCTCCTATGCGGGTGCCATGGGTTACGGTCAGTTTATGCCATCGTCATTTAAGCAGTATGCCGTCGATTTTAACGGTGACGGACATATCAACTTGTGGGATCCGGTTGATGCTATCGGCAGTGTGGCCAACT ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_5_1/1 +ACGGTTTTGTCTGTTAGTTCCATGCCGGATAATCCGTCAATAAACTCCTGCCAGGACTCGCCTTCGCACCCGGCATCCATACCCGGTAGCTGTCCTTGCCCCAGCGTTGGCGTGCCGAGCAGCAGCACGGGATAGGACAGAAAACTGTCCA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_0_1/1 +CCGCAATGGCCTGGTGCCTGAACAGGTCATTGTTGAAGTGACGGAGGATGAAGTCATTTCCAGTTTCGACGCATTTTCCTCTGCTATCCAGCAATTACGTTCGGCGGGGATTGGTGTGGCTATCGCTGCTTGCGAAGTTTCAGCCAGGCAA ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_3_1/1 +CTTGGCGACGGTGAACCGCTGACGCTCTATCCCGGTGAAGTGCCCGCGCGTTTGCCCGGTGCCGCCTTTTGGCAGCAACAGGGCTTCCATTTTGAAGATTTTCGACCTCAAGCGATGAACGTTGATACGCCGCTGCCGCACATTCGGCTGG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII +@NZ_JAFJYB010000003.1_1_1/1 +CGTCGGCAGAAACCGCCGGCAGCTCTAAGGTGATGCACGGCAACTGACGCTCCGCGCACCAACTGCCAAAAGAACCCGGCGTGGGGTAACCAATATGCTAGACCTGTGGCAATGAGAAAGCCCGTGAAAGCCATCCTGCCAGCGAAGAACG ++ +IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII