# HG changeset patch # User iuc # Date 1605131691 0 # Node ID 60573349e9aeec709b78066044afad7603c0e3af "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/shasta commit 6d14992ea4fb1af09373d51b3a48166afcbd3a74" diff -r 000000000000 -r 60573349e9ae configs/Nanopore-Dec2019.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/Nanopore-Dec2019.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,51 @@ +# This file contains Shasta options that, as of December 2019, +# are known to work with Oxford Nanopore reads under the following +# circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. +# - Reads from Guppy 3.0.5 base caller. Also known to work with +# reads from other Guppy releases 3.0.x and 3.1.x. + +# To use this configuration file, specify Shasta option "--config PathToThisFile". +# If you specify any conflicting values on the command line, +# the values specified on the command line take precedence. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options require root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + + + +[Reads] +# If you have extra coverage, use this option to adjust coverage. +minReadLength = 10000 + +[MinHash] +minBucketSize = 5 +maxBucketSize = 30 +minFrequency = 5 + +[Align] +minAlignedFraction = 0.4 + +[Assembly] +consensusCaller = Bayesian:guppy-3.0.5-a + diff -r 000000000000 -r 60573349e9ae configs/Nanopore-Jun2020.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/Nanopore-Jun2020.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,74 @@ +# DO NOT USE THIS FILE IF YOU HAVE READS CREATED BY A +# GUPPY VERSION OLDER THAN 3.6.0. + +# This file contains Shasta options that, as of June 2020, +# are known to work with Oxford Nanopore reads under the following +# circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. +# - Reads from Guppy 3.6.0 base caller. If you have reads +# from an older version of Guppy, use configuration file +# Nanopore-Dec2019.conf instead. + +# To use this configuration file, specify Shasta option +# "--config AbsolutePathToThisFile". +# If you specify any conflicting values on the command line, +# the values specified on the command line take precedence. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options requires root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + + + +[Reads] +# If you have extra coverage, use this option to adjust coverage. +minReadLength = 10000 +noCache = True + +[Kmers] +# Due to the higher accuracy of Guppy 3.6.0 we use longer +# markers than usual. +k = 14 + +[MinHash] +minBucketSize = 5 +maxBucketSize = 30 +minFrequency = 5 + +[Align] +alignMethod = 3 +downsamplingFactor = 0.05 +matchScore = 6 +minAlignedFraction = 0.55 +minAlignedMarkerCount = 400 +sameChannelReadAlignment.suppressDeltaThreshold = 30 + +[MarkerGraph] +simplifyMaxLength = 10,100,1000,10000,100000 +refineThreshold = 6 +crossEdgeCoverageThreshold = 3 + +[Assembly] +consensusCaller = Bayesian:guppy-3.6.0-a +detangleMethod = 1 + + diff -r 000000000000 -r 60573349e9ae configs/Nanopore-OldGuppy-Sep2020.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/Nanopore-OldGuppy-Sep2020.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,83 @@ +# This file contains Shasta options which attempt to partially automate +# parameter selection. It is based on an earlier config, which, as of Jun 2020, +# was known to work with Oxford Nanopore reads under the following circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. +# - Reads from Guppy 3.0.5 base caller. Also known to work with +# reads from other Guppy releases 3.0.x and 3.1.x. + +# The automation provided by this config is particularly applicable to +# low coverage or non-human samples. It also matches or exceeds continuity +# in human samples, relative to the appropriately chosen config file. +# Updating to guppy 3.6.0 or higher will greatly improve assembly +# quality and is therefore strongly recommended. + +# To use this configuration file, specify Shasta option +# "--config AbsolutePathToThisFile". +# If you specify any conflicting values on the command line, +# the values specified on the command line take precedence. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options requires root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + + + +[Reads] +# If you have extra coverage, use this option to adjust coverage. +minReadLength = 10000 +noCache = True + +[MinHash] +minBucketSize = 5 +maxBucketSize = 30 +minFrequency = 5 + +[Align] +alignMethod = 3 +downsamplingFactor = 0.05 +matchScore = 6 +sameChannelReadAlignment.suppressDeltaThreshold = 30 + +# The following Align parameters are set to very permissive values to allow the majority of alignments +# to be assessed during the initial stage of automatic alignment parameter selection +maxSkip = 100 +maxDrift = 100 +maxTrim = 100 +minAlignedMarkerCount = 10 +minAlignedFraction = 0.1 + +[ReadGraph] +# This method uses the observed distribution of alignment stats to choose a cutoff for +# maxSkip, maxDrift, maxTrim, minAlignedMarkerCount, and minAlignedFraction +creationMethod = 2 + +[MarkerGraph] +simplifyMaxLength = 10,100,1000,10000,100000 +crossEdgeCoverageThreshold = 3 + +# Automatically determine this using PeakFinder +minCoverage = 0 + +[Assembly] +consensusCaller = Bayesian:guppy-3.0.5-a +detangleMethod = 2 + diff -r 000000000000 -r 60573349e9ae configs/Nanopore-Sep2020.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/Nanopore-Sep2020.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,94 @@ +# DO NOT USE THIS FILE IF YOU HAVE READS CREATED BY A +# GUPPY VERSION OLDER THAN 3.6.0. + +# This file contains Shasta options which attempt to partially automate +# parameter selection. It is based on an earlier config, which, as of Jun 2020, +# was known to work with Oxford Nanopore reads under the following circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. +# - Reads from Guppy 3.6.0 base caller. If you have reads +# from an older version of Guppy, use configuration file +# Nanopore-Dec2019.conf instead. + +# The automation provided by this config is particularly applicable to +# low coverage or non-human samples. It also matches or exceeds continuity +# in human samples, relative to the appropriately chosen 3.6.0 or 3.6.0-UL conf. +# Automation can also be activated with parameters designed for earlier basecallers, +# if needed, but updating to guppy 3.6.0 or higher will greatly improve assembly +# quality and is therefore strongly recommended. + +# To use this configuration file, specify Shasta option +# "--config AbsolutePathToThisFile". +# If you specify any conflicting values on the command line, +# the values specified on the command line take precedence. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options requires root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + + + +[Reads] +# If you have extra coverage, use this option to adjust coverage. +minReadLength = 10000 +noCache = True + +[Kmers] +# Due to the higher accuracy of Guppy 3.6.0 we use longer +# markers than usual. +k = 14 + +[MinHash] +minBucketSize = 5 +maxBucketSize = 30 +minFrequency = 5 + +[Align] +alignMethod = 3 +downsamplingFactor = 0.05 +matchScore = 6 +sameChannelReadAlignment.suppressDeltaThreshold = 30 + +# The following Align parameters are set to very permissive values to allow the majority of alignments +# to be assessed during the initial stage of automatic alignment parameter selection +maxSkip = 100 +maxDrift = 100 +maxTrim = 100 +minAlignedMarkerCount = 10 +minAlignedFraction = 0.1 + +[ReadGraph] +# This method uses the observed distribution of alignment stats to choose a cutoff for +# maxSkip, maxDrift, maxTrim, minAlignedMarkerCount, and minAlignedFraction +creationMethod = 2 + +[MarkerGraph] +simplifyMaxLength = 10,100,1000,10000,100000 +crossEdgeCoverageThreshold = 3 + +# Automatically determine this using PeakFinder +minCoverage = 0 + +[Assembly] +consensusCaller = Bayesian:guppy-3.6.0-a +detangleMethod = 2 + + diff -r 000000000000 -r 60573349e9ae configs/Nanopore-UL-Dec2019.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/Nanopore-UL-Dec2019.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,53 @@ +# This file contains Shasta options that, as of December 2019, +# are known to work with Ultra-Long (UL) Oxford Nanopore reads +# under the following circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. +# - Reads from Guppy 3.0.5 base caller. Also known to work with +# reads from other Guppy releases 3.0.x and 3.1.x. + +# To use this configuration file, specify Shasta option "--config PathToThisFile". +# If you specify any conflicting values on the command line, +# the values specified on the command line take precedence. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options require root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + + + +[Reads] +# If you have extra coverage, use this option to adjust coverage. +minReadLength = 50000 + +[MinHash] +minBucketSize = 5 +maxBucketSize = 40 +minFrequency = 10 + +[Align] +maxSkip = 60 +maxDrift = 60 +minAlignedMarkerCount = 400 + +[Assembly] +consensusCaller = Bayesian:guppy-3.0.5-a + diff -r 000000000000 -r 60573349e9ae configs/Nanopore-UL-Jun2020.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/Nanopore-UL-Jun2020.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,78 @@ +# DO NOT USE THIS FILE IF YOU HAVE READS CREATED BY A +# GUPPY VERSION OLDER THAN 3.6.0. + +# This file contains Shasta options that, as of June 2020, +# are known to work with Ultra-Long (UL) Oxford Nanopore reads +# under the following circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. +# - Reads from Guppy 3.6.0 base caller. If you have reads +# from an older version of Guppy, use configuration file +# Nanopore-UL-Dec2019.conf instead. + +# To use this configuration file, specify Shasta option +# "--config AbsolutePathToThisFile". +# If you specify any conflicting values on the command line, +# the values specified on the command line take precedence. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options requires root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + + + +[Reads] +# If you have extra coverage, use this option to adjust coverage. +minReadLength = 50000 +noCache = True + +[Kmers] +# Due to the higher accuracy of Guppy 3.6.0 we use longer +# markers than usual. +k = 14 + +[MinHash] +minBucketSize = 10 +maxBucketSize = 30 +minFrequency = 5 + +[Align] +alignMethod = 3 +downsamplingFactor = 0.05 +matchScore = 6 +minAlignedFraction = 0.55 +minAlignedMarkerCount = 600 +sameChannelReadAlignment.suppressDeltaThreshold = 30 + +[ReadGraph] +maxAlignmentCount = 12 + + +[MarkerGraph] +simplifyMaxLength = 10,100,1000,10000,100000 +refineThreshold = 6 +crossEdgeCoverageThreshold = 3 + +[Assembly] +consensusCaller = Bayesian:guppy-3.6.0-a +detangleMethod = 1 + + diff -r 000000000000 -r 60573349e9ae configs/Nanopore-UL-Sep2020.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/Nanopore-UL-Sep2020.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,89 @@ +# DO NOT USE THIS FILE IF YOU HAVE READS CREATED BY A +# GUPPY VERSION OLDER THAN 3.6.0. + +# This file contains Shasta options which attempt to partially automate +# parameter selection. It is based on an earlier config, which, as of Jun 2020, +# was known to work with Oxford Nanopore reads under the following circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. +# - Reads from Guppy 3.6.0 base caller. If you have reads +# from an older version of Guppy, use configuration file +# Nanopore-UL-Dec2019.conf instead. + +# The automation provided by this config is particularly applicable to +# low coverage or non-human samples. It also matches or exceeds continuity +# in human samples, relative to the appropriately chosen 3.6.0 or 3.6.0-UL conf. +# Automation can be activated with parameters designed for earlier basecallers, +# if needed, but updating to guppy 3.6.0 or higher will greatly improve assembly +# quality and is therefore strongly recommended. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options requires root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + + + +[Reads] +# If you have extra coverage, use this option to adjust coverage. +minReadLength = 50000 +noCache = True + +[Kmers] +# Due to the higher accuracy of Guppy 3.6.0 we use longer +# markers than usual. +k = 14 + +[MinHash] +minBucketSize = 10 +maxBucketSize = 30 +minFrequency = 5 + +[Align] +alignMethod = 3 +downsamplingFactor = 0.05 +matchScore = 6 +sameChannelReadAlignment.suppressDeltaThreshold = 30 + +# The following Align parameters are set to very permissive values to allow the majority of alignments +# to be assessed during the initial stage of automatic alignment parameter selection +maxSkip = 100 +maxDrift = 100 +maxTrim = 100 +minAlignedMarkerCount = 10 +minAlignedFraction = 0.1 + +[ReadGraph] +# This method uses the observed distribution of alignment stats to choose a cutoff for +# maxSkip, maxDrift, maxTrim, minAlignedMarkerCount, and minAlignedFraction +creationMethod = 2 + +[MarkerGraph] +simplifyMaxLength = 10,100,1000,10000,100000 +crossEdgeCoverageThreshold = 3 + +# Automatically determine this using PeakFinder +minCoverage = 0 + +[Assembly] +consensusCaller = Bayesian:guppy-3.6.0-a +detangleMethod = 2 + + diff -r 000000000000 -r 60573349e9ae configs/Nanopore-UL-iterative-Sep2020.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/Nanopore-UL-iterative-Sep2020.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,46 @@ +# This configuration file is EXPERIMENTAL and should only +# be used under the following conditions: +# - Nanopore reads created by Guppy 3.6.0 or newer. +# - Ultra-Long (UL) reads with typical N50 80Kb or more. +# - High coverage 80X. +# Iterative assembly results in some separation of haplotypes +# and does better at resolving segmental duplications. + +[Reads] +minReadLength = 30000 +noCache = True + +[Kmers] +k = 10 + +[MinHash] +minBucketSize = 10 +maxBucketSize = 40 +minFrequency = 5 + +[Align] +alignMethod = 3 +matchScore = 6 +gapScore = -3 +downsamplingFactor = 0.05 +maxSkip = 100 +maxDrift = 100 +maxTrim = 100 +minAlignedMarkerCount = 10 +minAlignedFraction = 0.1 +sameChannelReadAlignment.suppressDeltaThreshold = 30 + +[ReadGraph] +maxAlignmentCount = 12 +creationMethod = 2 + +[MarkerGraph] +minCoveragePerStrand = 3 +simplifyMaxLength = 10,100 +crossEdgeCoverageThreshold = 3 + +[Assembly] +detangleMethod = 2 +consensusCaller = Bayesian:guppy-3.6.0-a +iterative = True + diff -r 000000000000 -r 60573349e9ae configs/PacBio-CCS-Dec2019.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/PacBio-CCS-Dec2019.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,50 @@ +# This file contains Shasta options that, as of December 2019, +# are known to work with PacBio CCS reads under the following +# circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. + +# To use this configuration file, specify Shasta option "--config PathToThisFile". +# If you specify any conflicting values on the command line, +# the values specified on the command line take precedence. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options require root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + +[Kmers] +k = 15 +probability = 0.02 + +[MinHash] +m = 12 +minBucketSize = 20 +maxBucketSize = 100 +minHashIterationCount = 25 +minFrequency = 10 + +[ReadGraph] +maxAlignmentCount = 20 + +[Assembly] +consensusCaller = Modal + + diff -r 000000000000 -r 60573349e9ae configs/PacBio-CLR-Dec2019.conf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/configs/PacBio-CLR-Dec2019.conf Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,45 @@ +# This file contains Shasta options that, as of December 2019, +# are known to work with PacBio CLR reads under the following +# circumstances: + +# - Human genome assembly. +# - Coverage between 40x and 80x. If you have more coverage than that, +# you can use option "--Reads.minReadLength" to adjust coverage as desired. + +# To use this configuration file, specify Shasta option "--config PathToThisFile". +# If you specify any conflicting values on the command line, +# the values specified on the command line take precedence. + +# In most cases, for best performance on a large assembly +# you will usually also want to use the following options, which +# cannot be specified in a configuration file: +# --memoryMode filesystem +# --memoryBacking 2M +# Using these options require root access. + +# For detailed information on all available options see here: +# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html + +# For information on running a small assembly for which +# performance is not essential see here: +# https://chanzuckerberg.github.io/shasta/QuickStart.html + +# For more information on running an assembly see here: +# https://chanzuckerberg.github.io/shasta/Running.html + +# For information on optimizing assembly performance see here: +# https://chanzuckerberg.github.io/shasta/Performance.html + + +[Reads] +# Use this option to adjust coverage. +minReadLength = 10000 + +[ReadGraph] +maxAlignmentCount = 20 + +[Assembly] +consensusCaller = Modal + + + diff -r 000000000000 -r 60573349e9ae macros.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/macros.xml Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,82 @@ + + + 0.6.0 + 18.01 + + + shasta + + + + shasta --version + + + + 10.1038/s41587-020-0503-6 + @online{shasta, + author = {TODOLastName,TODOFirstName}, + title = {shasta}, + year = 2020, + url = {https://github.com/chanzuckerberg/shasta}, + urldate = {2020-11-05} + } + + + + ./input_${counter}.${ext} && + #elif $input.is_of_type("fastq.gz","fastqsanger.gz") + #set $ext = "fastq" + gzip -dcf '$input' > ./input_${counter}.${ext} && + #elif $input.is_of_type("fastqsanger", "fastq"): + #set $ext = "fastq" + ### I tried symlinking but shasta still complained about file extensions + cp '$input' ./input_${counter}.${ext} && + #elif $input.is_of_type("fasta"): + #set $ext = "fasta" + ### I tried symlinking but shasta still complained about file extensions + cp '$input' ./input_${counter}.${ext} && + #end if +#end for + ]]> + + + + + + + + + + + + + + + + + + + + + + + `_ or the `github `_ . + ]]> + diff -r 000000000000 -r 60573349e9ae shasta.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/shasta.xml Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,832 @@ + + + De novo assembly of long read sequencing data + + macros.xml + + + + + + + &2 + ]]> + + + + + + + + + + + + + + + + + +
+ + + +
+
+ + + ^([0-9]*)?([KMG]bp?)?$ + + + + +
+ + + + + + + + + + +
+ +
+
+ + + + + + + + + + +
+
+ + + + + + + + + + + + + + + +
+
+ + + + + + + + + + + + + + + + + + + + + + + +
+ +
+
+
+ + + + + + + + + + + + + + + + + + + +
+
+ + + + + + + + + + ^[0-9]+(,[0-9]+)*$ + + + + + + + + +
+ + +
+ +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + + +
+ +
+ + + + + + + + + + + + + +
+ +
+
+ + + outputs["report_graphical_fragment_assembly"] + + + outputs["report_config"] + + + outputs["report_log"] + + + + + assembly["write_reads_by_assembled_segment"] + + + + + + + + + + + +
+ + + +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+ + + + + + + +
+ + + +
+ + + + + +
+ + + + + + + +
+ + + +
+ + + + + +
+ + + + + + +
+ + + +
+
+ + +
+ + + + + + + +
+
+
+ + + + + +
+
+ + + + + + + + + +
+
+ + + + + + + + + + + + + + +
+ +
+
+
+ + + + + + + + + + + +
+
+ + + + + + + + + + + + +
+ + +
+
+
+ + + + + + + + +
+ + + + +
+
+ + + + + + + + + + +
+
+ + + + + + + + + + +
+
+ `_ (these files correspond to the packaged config files available for this tool). + +**Output** + +- Assembled genome (FASTA) +- Graphical fragment assembly (optional) (.gfa1) +- Log file (optional) (.txt) +- Config file (optional) (.txt) +- Read CSV detailing which reads align to which assembly fragments (optional) (.csv) +- Coverage CSV List (optional) (list:.csv) + +**References** + +@REFERENCES@ + ]]> + +
diff -r 000000000000 -r 60573349e9ae test-data/nanopore.fasta.gz Binary file test-data/nanopore.fasta.gz has changed diff -r 000000000000 -r 60573349e9ae test-data/out_config.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/out_config.txt Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,100 @@ +[Reads] +minReadLength = 10000 +desiredCoverage = 0 +noCache = False +palindromicReads.skipFlagging = False +palindromicReads.maxSkip = 100 +palindromicReads.maxDrift = 100 +palindromicReads.maxMarkerFrequency = 10 +palindromicReads.alignedFractionThreshold = 0.1 +palindromicReads.nearDiagonalFractionThreshold = 0.1 +palindromicReads.deltaThreshold = 100 + +[Kmers] +generationMethod = 0 +k = 10 +probability = 0.1 +enrichmentThreshold = 100 +file = + +[MinHash] +version = 0 +m = 4 +hashFraction = 0.01 +minHashIterationCount = 10 +alignmentCandidatesPerRead = 20 +minBucketSize = 5 +maxBucketSize = 30 +minFrequency = 5 +allPairs = False + +[Align] +alignMethod = 3 +maxSkip = 30 +maxDrift = 30 +maxTrim = 30 +maxMarkerFrequency = 10 +minAlignedMarkerCount = 100 +minAlignedFraction = 0.4 +matchScore = 6 +mismatchScore = -1 +gapScore = -1 +downsamplingFactor = 0.1 +bandExtend = 10 +maxBand = 1000 +sameChannelReadAlignment.suppressDeltaThreshold = 0 +suppressContainments = False + +[ReadGraph] +creationMethod = 0 +maxAlignmentCount = 6 +minComponentSize = 100 +maxChimericReadDistance = 2 +crossStrandMaxDistance = 6 +containedNeighborCount = 6 +uncontainedNeighborCountPerDirection = 3 +removeConflicts = False +markerCountPercentile = 0.015 +alignedFractionPercentile = 0.12 +maxSkipPercentile = 0.12 +maxDriftPercentile = 0.12 +maxTrimPercentile = 0.015 + +[MarkerGraph] +minCoverage = 10 +maxCoverage = 100 +minCoveragePerStrand = 0 +lowCoverageThreshold = 0 +highCoverageThreshold = 256 +maxDistance = 30 +edgeMarkerSkipThreshold = 100 +pruneIterationCount = 6 +simplifyMaxLength = 10,100,1000 +crossEdgeCoverageThreshold = 0 +refineThreshold = 0 +reverseTransitiveReduction = False +peakFinder.minAreaFraction = 0.08 +peakFinder.areaStartIndex = 2 + +[Assembly] +crossEdgeCoverageThreshold = 3 +markerGraphEdgeLengthThresholdForConsensus = 1000 +consensusCaller = Bayesian:guppy-3.0.5-a +storeCoverageData = False +storeCoverageDataCsvLengthThreshold = 0 +writeReadsByAssembledSegment = True +detangleMethod = 0 +detangle.diagonalReadCountMin = 1 +detangle.offDiagonalReadCountMax = 2 +detangle.offDiagonalRatio = 0.3 +iterative = False +iterative.iterationCount = 3 +iterative.pseudoPathAlignMatchScore = 1 +iterative.pseudoPathAlignMismatchScore = -1 +iterative.pseudoPathAlignGapScore = -1 +iterative.mismatchSquareFactor = 3 +iterative.minScore = 0 +iterative.maxAlignmentCount = 6 +iterative.bridgeRemovalIterationCount = 3 +iterative.bridgeRemovalMaxDistance = 2 + diff -r 000000000000 -r 60573349e9ae test-data/out_config2.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/out_config2.txt Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,100 @@ +[Reads] +minReadLength = 10000 +desiredCoverage = 0 +noCache = False +palindromicReads.skipFlagging = False +palindromicReads.maxSkip = 100 +palindromicReads.maxDrift = 100 +palindromicReads.maxMarkerFrequency = 10 +palindromicReads.alignedFractionThreshold = 0.1 +palindromicReads.nearDiagonalFractionThreshold = 0.1 +palindromicReads.deltaThreshold = 100 + +[Kmers] +generationMethod = 0 +k = 10 +probability = 0.1 +enrichmentThreshold = 100 +file = + +[MinHash] +version = 0 +m = 4 +hashFraction = 0.01 +minHashIterationCount = 10 +alignmentCandidatesPerRead = 20 +minBucketSize = 5 +maxBucketSize = 30 +minFrequency = 5 +allPairs = False + +[Align] +alignMethod = 3 +maxSkip = 30 +maxDrift = 30 +maxTrim = 30 +maxMarkerFrequency = 10 +minAlignedMarkerCount = 100 +minAlignedFraction = 0.4 +matchScore = 6 +mismatchScore = -1 +gapScore = -1 +downsamplingFactor = 0.1 +bandExtend = 10 +maxBand = 1000 +sameChannelReadAlignment.suppressDeltaThreshold = 0 +suppressContainments = False + +[ReadGraph] +creationMethod = 0 +maxAlignmentCount = 6 +minComponentSize = 100 +maxChimericReadDistance = 2 +crossStrandMaxDistance = 6 +containedNeighborCount = 6 +uncontainedNeighborCountPerDirection = 3 +removeConflicts = False +markerCountPercentile = 0.015 +alignedFractionPercentile = 0.12 +maxSkipPercentile = 0.12 +maxDriftPercentile = 0.12 +maxTrimPercentile = 0.015 + +[MarkerGraph] +minCoverage = 10 +maxCoverage = 100 +minCoveragePerStrand = 0 +lowCoverageThreshold = 0 +highCoverageThreshold = 256 +maxDistance = 30 +edgeMarkerSkipThreshold = 100 +pruneIterationCount = 6 +simplifyMaxLength = 10,100,1000 +crossEdgeCoverageThreshold = 0 +refineThreshold = 0 +reverseTransitiveReduction = False +peakFinder.minAreaFraction = 0.08 +peakFinder.areaStartIndex = 2 + +[Assembly] +crossEdgeCoverageThreshold = 3 +markerGraphEdgeLengthThresholdForConsensus = 1000 +consensusCaller = Bayesian:guppy-3.0.5-a +storeCoverageData = False +storeCoverageDataCsvLengthThreshold = 0 +writeReadsByAssembledSegment = False +detangleMethod = 0 +detangle.diagonalReadCountMin = 1 +detangle.offDiagonalReadCountMax = 2 +detangle.offDiagonalRatio = 0.3 +iterative = False +iterative.iterationCount = 3 +iterative.pseudoPathAlignMatchScore = 1 +iterative.pseudoPathAlignMismatchScore = -1 +iterative.pseudoPathAlignGapScore = -1 +iterative.mismatchSquareFactor = 3 +iterative.minScore = 0 +iterative.maxAlignmentCount = 6 +iterative.bridgeRemovalIterationCount = 3 +iterative.bridgeRemovalMaxDistance = 2 + diff -r 000000000000 -r 60573349e9ae test-data/out_fasta.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/out_fasta.fasta Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,2 @@ +>0 length 16594 +TCACCTTTCTGCGTTCTCCGGATTTTTTCGCACGTGACTGCCCAGTTCGCTAAGGCTCGATTCCGATCTTAGCTTCCGAAGCATCTCTGCGTACGAAGCCTCCTCCTGTCTTTTTTTTTACGATGAGTGCCTCTGCACCCGTGCTAGCATTCTTGGCGACAGATGCATAGCTGCCTCGGCTTGGACTCGTTAGGTATGGATGTCGCCTTTTCTTCACCGCTTGCCATCCAACGTAGGGTTGCTCTGCTTCGGCGCCTGGACTTTGGCACCTGCACCGTGGGTACCTGCGCATTTTGTGGAGCCTTTTGGTAGGCTTTGTACCTCCGTCTGGGTAGCGCTGCTCTTCAAGCGGTGCTCGCTAGTAGTACCTTCTTGTACAGCTCTATCGCCCCTGTTGTTAAGGGCTGAGAGTTCGGAAGCTATGCCCTTTGTCTCTCATGTGTGTCGTTGGGTCTCGAATGCGGATAGAAGGGGGGCTGATCTTGCCATTCATCCTGGTAAGTATGCCCCTCAGGTCCTCGTTCTGGAGAGCAGTGGTCAAGTCCGAAGACCGATGAGGGGAACCAGCTGGGGACTTCCCTCCCGTCTTTTGCGATGGCACGGCGATGTGGTCCATCGTCTTCTGACTTGTCGCGGTCGTAGATGCTGTAGGAGCCAATTTCTCCACCTCTACAGCATCGCTGCAGTCGATAGTCAACGGCGGCTGGGGCCTGCGTGCTCACCCCCTTTGCCACCGACGGGACCGAGATTCCGTCACCATGGGTCGGGTTACCGACTCCTCTGGTGGGGGATCTCGAAAGTCGGGAGCTCCTCCTGAACGGGTCGTTGCGATCAGGGGACTGCCCCCACTGCGCTGTCCATCAACCGAAGGATGGCCTAAGGTTACCTAGGGTCACGTAGGCCACGGATTTCCCCGGCTTTTACGGATGGAGGTTTGTACCGCCTCGACTCGGACACCAGAGCCTCTGCTTAGGCACCAGCACGGTGAGAGGATGATATTTGGTCTGTCCGCGACCTTTGTGCCTTTTCCTTTTCCCCTTTCTTAAAGACTTGTGCGCTCCCCAGTTACCAGAATCAAAATTAAATTAAATTAAAAAATTTCAACGGCTTAATTTTTAAATTTAATTTTGAATTTCGCGCCCTACTGTCGCAACACAACACTGATCACACGGTTGATCTGGCAACGCCCCTCCCTCTCCAGATCGTCCCGCTGCGCTATCAGCTGTTTATCCGCTGCAACAATCGCAAGATAATAAATTACCTATTTACATGAAACAGGCGCACAATTAACTTCGCGTGATTGCAGCGCAGAACTATGGCGCGACTCCACCGTGTGATTTTGCCAGTTTGCCGCACACACCGGCCGACACAACTTCTATGGTTTCGAGTATTTCGCGCCGCGTAATTTAAGACGTCCGTCTTCACGGCGATGTAGACTTGGTCTCCGCACCAGGATTGAGTGTCTAAGCCTGTGCGTTCAGGATTAAACTTTGGCAATACGACAGCATTGAGTTTTTGGGTCTCTTTGTGAGTTTTGCACTTCTTTTAACAGTTCAGAAAAATGGCGATTCTGCGACTCTAGAATTGTCAGCAAATTGTTTTCACTATTGTAGTATGCACACATATCGGTTAAGCACTGTACCTATGTGTATTCATAATTGTAGCACTCTGTTGCAATGTGTACATAAACAGTCCAGCACAAGTGTATACGTAATACGAGCACCCACTTGAGGGGCTAACATACATAATTGCCTGGTCAGCAGTTCTCCCGCTGGCCAAGCGCTGATCGCTTATATGTGTGCCTATACCACTCCTCCTCCAGCACCATCGCTCGGCGACAGTACATATATATATACATATATATAAGATACGCATATAAGCGTTGCTGCGCTGCAGGCTATGCCGGCAGCGCTGCTCCTCGACTTAGGCTAAGAAACCTTTGTATGTAGATCATAAGAGGATTGACGAATTAATTTCGAATGGAGCGGGACCTTCCCTGTTCCTCAAATTGGATCAAATAAAGAACAGCTAAAACACAAATGATCTATGACACAATGAAACTACAGGAAGTTGGAGTAGGCGGTCCCACTTCTGATGTCGGATCTGAATCACTTTATACTCGGCATCACTCTCTACAGCGGACACAAAGTAACAGAAAACGGTCGTTAACTTGAAATTAAAAATAAATCTGCGACAAGTACAGTTTGTCAAGAAACTGTTTACACACCGTGAAATAAGATGAATTTTTGATTTTAACGGTCAAAATTAAGGGTTATTTGCTTAATTAAACGCAATTTTTTTTTTAGGAAATATAATTAAACAATATTTATTTTACTTATAAATTAAAAAACAAATTCAAAATATCAAATATACAAGAAAATAAATAACAAACTTCCAAGTTTACACACTTTTGAGAGTGTCACTCTGCCCAAACCGTCATCTCTGGGATGAGCTGATAGGTCCACCTCCCCCCGTCGCGACGTTTGCCATCTGCTCTGCCATTCACCTAATAGCCACTCGTGTGCCTCTTGCCTGGAAGCGCCACTCCGCATAAGGCTGAGAGCCTTGATCTCCAGATCAATCGGCAGGCCTGCCAGCGCTAGCGCCGCGTCTTCGGATATGGTCCTGAATCCTCTAATGAGCCTGAGGGCCATTGACCGTAGCACCGAACGAGCTCCTTTCAGGTATGAGACCCTGCAAGTGGCATTGCTCCAGACTGGTGCAGCGTATAGCAGCGAAGCCTTTGCTACTGACACCAGCAGTTTCCTGGCCGGGTGTCTTGGGCCTCCGACGTTGGGCATGCCTCGCCAACGAAGAGGATGTGACTGCTGTCTTCTTGCTGGCGTAGCTCGCGTGGTCCTTGAACGATAGTCTGCGATCTATCATTACCCCCAGGTACTTTAGGGACTCTTGAGAGGTCCCCTGAGTACCCTTGACGGAGACCAGCATGTTCTCCATCTTTTCCTGCTGCTTAGTAGGACTGCTTCGGTCTTGTGAGCCGCTATTGCTAGCCCGGCTGTGATTGCCACATCGTCAGCGAAACAGCTGCCTCGACGACTTCAAGTTCTGTGACGCACGGGAAATCTGGGGCAGGGGCTGCCTCTGTTGGCCTCCATAGTGTGGTCTGCTTTGGAAATAGCTCCCCTAGTATGTTAGCCAGGACCCCCGGGTCGGATGGGGTTGCCGCTCCTCCTCCTCCTTAGCTGCTTGGTAACAAGCTTGTAGGCGAGGCCCCAGATATCGCTGTCTACGCCATCCTGCAGCTCCTTAAACGACCGCGCTTTGGCAGCCGCGATGCCGTGCTTGAACTCTAGGCGTTTGCTTCTGAAAGCCTCCAAGAGTTCCGCGTGGTGGAGTACTGCCTCTGGCTCGTTGCGCCGTTCTCTTAGCCCTGAGGCAATCAGACCGTAGTTGGCTTAGGGAGGCACTCCACCAGTAAACGGGTGGTTTGCGCTGTGCCTTATTTTTTCCTTGGCATGATTGCGTCGCAGATTCTTCCCAGCATATTCATGAGGCCTGCCGCCATACTCTCTGCGTCCACATTTGGGATTTCCAGGGGAATTGATCTGATAGGCCAGCATGGCCTCATCGATCTTCCTGGTGTCCCATGTTTTCCCGGCTGTTCTACTCTGCCGTCTTTTGGGCATGTCCCTCCGGGGAGAAGGAGATCAGGGCATGGTCGCTCAGCGTCATGACGTCATGGACCATCCAGTTGTTGTTGTCTACTAGCCCTCTGCTGACAAAGGTAACGTCAATAAAGGACGTACCCCTATCGTTGTTAAACGTCGGCTTCCGTCCATCGTTCAGCAGTATGAGGTCCAGCATTCGCATGGCGTCAATCACAGCTCGTCCTCTGGTGTTGGATGTCCTGCTGCCCCATTCCACTGTCCAGGCATTAAAGTCGCCGGTATGACCTTCGGGCTTGCCCTCTCGCATGGTCCACGAGCGCCTCCAGAAGCCCTCGAACTGATCGGGGGTGTCGCTCGGCGGAGCGTAGCAGCTGTACATGTGCACGTGTTTTAACTTCGCATAAGCGATACCCCGCATGGGTAAAGCAGCCAGTTCCTGGACTTGAGAGAGCTGCAGCATTTGATAGCTGCTTTTACCTGCCTCGTCAAGGATCATGGACGATTGTCCACTACCAGAGACGTAGGGTTCGCTTAGGAGCATGATGTCTACATTGCGCTCAACCGCAGTCTGGGCCAGGAGGCTCTGAGCTGCTGCGCAATGATTGACATTGAGCTGTACTACGCTAATATGAGCGTGCATTAAGGTGGCTCTTGGCATCTTTTAGTGTCGCTCTGTAAGTCGGGCACGCAAAGCTACCCGTCGGGTGGTTTCTGTCCACCTCGCTGCTGCAGATCAGGCATTTTGGTGCAGCAACGCACCCCTTTGCCTTGTGCCCACGCTCACCGCATCTAAGACAGCAGTCTGCCCTGTCAGTGTCCTTGCAGGTTGCTGATCGATGCCCATAGCCGAGACACCTGTAGCATCTCGTGGGTCGGACGTCCTGGGTGATACGACATCTTGACCATCCAACGATTATGGTGCCCTGTTTAAGGACTGGTATCGCAACGTTCGCGTTCAGCAGCACTGAGGCTATTTGCTTTGCAATTCCGCATACTGCGAAGGCCCCTGATATCTTCAGGATTTATCTGCAGGCCCTGGAATTGGGCGACCAAGCAGCTGTGGAGCTTCTCTGCTGTCGTAGCCTCGTCCAATCCGCTGCAAGATAGAGCTATTCTTTGCGCTCCCTGTGCGCACAGAGGTTAAGTCATTGAGCGCCGCTTCCAGGTCGCTCTTAAACTTGGGAACGCTTTCGAAGCTTTCCCCTCTACCTCAAGCAACAGATCACCTTTCTGCGTTCTCTCCGGATTTTTTCGCACGTGACTGCCCAGTTCGCTAAGGCTCGATTCCGATCTTAGCTTCCGAAGCATCTCTGCGTACGAAGCCTCTCCTGTCTTTTTACGATGAGTGCCTCTGCACCCGTGCTAGCATTCTTGGCGACAGATGCATAGCTGCCTGGCTTGGACTCGTTAGGTATGGATGTCGCCTTTTCTTCACCGTTGCCATCCAACGTAGGGTTGCTCTGCTTCGGCGCCTGGACTTTGGCACCTGCACCGTGGGTACCTGCGCATTTTGTGGAGCCTTTTGGTAGGCTTTTGTACCTCCGTCTGGGTAGCGCTGCTCTTCAAGCGGTGCTCGCTAAGTAGTACCTTCGTACAGCTCTATCGCCCTGTTGTTAAGGGCTGAGAGTTCGGAAGCTATGCCCTTTGTCTCATGTGTGTCGTTGGGTCTCGAATGCGGATAGAAGGGGGCTGATCTTGCCATTCATCCTGGTAAGTATGCCCCTCAGGTCTCGTTCTGGAGAGCAGTGGTCAAGTCCGAAGACCGATGAGGGGAACAAGCTGGGGACTTCCCTCCCGTCTTTTGCGATGGCACGGCGATGTGGTCCATCGTCTTCTGACTTGTCGCGGTCGTAGATGCTGTAGGAGCCAATTTCTCCACCTCTACAGCATCGCTGCAGTCGATAGTCAACGGCGGCTGGGGGCCTGCGTGCTCACCCCTTGCCACCGACGGGACCGAGATTCCGTCACCATGGGTCGGGTTACCGACTCCTCTGGTGGGGGGATCTCGAAAGTCGGGAGCTCCTCCTGAACGGGTCGTTGCGATCAGGGGACTGCCCCCCACTGCGCTGTCCATCAACTGAAGGATGGCCTAAGGTTACCTAGGGTCACGTAGGCCACGGATTTCCCCCTGGCTTTTACGGATGGAGGTTTGTACCGCCTCGACTCGGACACCAGAGCCTCTGCTTAGGCACCAGCACGGTGAGAGGATGATATTTGGTCTGTCCGCGACCTTTGTGCCTTTTCCCCTTTCTTAAAGACTTGTGCGCTCCCAGTTACCAGAATCAAAATTAAATTAAATTAAATTTCAACGGCTTAATTTTAAATTTAATTTTGAATTTCGCGCCCTACTGTCGCAACACAACACTGATCACACGGTTGATCTGGCAACGCCTCCCTCTCCAGATCGCCCGCTGCGCTATCAGCTGTTTATCCGCTGCAACAATCGCAAGATAATAAATTACCTATTTACATGAAACAGGCGCACAATTAACTCGCGTGATTGCAGCGCAGAACTATGGCGCGACTCCACCGTGTGATTTTGCCAGTTTGCCGCACACACCGGCCGACACAACTTCTATGGTTTCGAGTATTTCGCGCCGCGTAATTTAAGACGTCCGTCTTCACGGCGATGTAGACTTGGTCTCCGCACCAGGATTGAGTGTCTAAGCCTGTGCGTTCAGGATTAAACTTTGGCAATACGACAGCATTGAGTTTTTTGGGTCTCTTTGTGAGTTTTGCACTTCTTTTAACAGTTCAGAAAAATGGCGATTCTGCGACTCTAGAATTGTCAGCAAATTGTTTTCACTATTGTAGTATGCACACATATCGGTTAAGCACTGTACCTATGTGTATTCATAATTGTAGCACTCTGTTGCAATGTGTACATAAACAGTCCAGCACAAGTGTATACGTAATACGAGCACCCACTTGAGGGCTAACATACATAATTGCCTGGTCAGCAGTTCTCCCTGCTGGCAAGCGCTGATCGCTTATATGTGTGCCTATACCACTCCTCCTCCAGCACCATCGCTCGGCGACAGTACATATATATATACATATATATAAGATACGCATATAAGCGTTGCTGCGCTGCAGGCTATGCCGGCAGCGCTGCTCCTCGACTTAGGCTAAGAAACCTTTGTATGTAGATCATAAGAGGATTGACGAATTAATTTCGAATGGAGCGGGACCTTCCCTGTTCCTCAAATTGGATCAAATAAAGAACAGCTAAAACACAAATGATCTATGACACAATGAAACTACAGGAAGTTGGAGTAGGCGGTCCCACTTCTGATGTCGGATCTGAATCACTTTATACTCGGCATCACTCTCTACAGCGGACACAAAGTAACAGAAAACGGTCGTTAACTTGAAATTAAAATAAATCTGCGACAAGTACAGTTTGTCAAGAAACTGTTTACACACCGTGAAATAAGATGAATTTTTTGATTTTTAACGGTCAAAATTAAGGGTTATTTGCTTAATTAAACGCAATTTTTTTTTAGGAAATATAATTAAACAATATTTATTTTACTTATAAATTAAAAAACAAATTCAAAATATCAAATATACAAGAAAATAAACAACGAATTCCAAGTTTAAAGCACTTTTGAGAGTTTCAAGAAACTCTTTACACAAAAACACTAAACCTAAGTTTAATCCTAAATTTTTAAATTATTTTGTTAAAATTTGAAAAGTTGTAGTATTTAGTATGACCCCCCATTGGCTTTGGCTACAAGTTGAAGCTTTTTTTTCATGGAATGGATGAGTTTTTTTTAGGTCATATTCAAGCGGGATCTTTTCCCACTCTATCGCAGCCATGAGCTGTTGTCGTGTTTTGGTGCCCCTTTTGCCACATTCTTCTTTAAGTAGGCCCACAAATTTTCAATGGGGTTCAGATCAAGACTCTGAGGGGGCGTATCGATCACCTTGCCACAGTTATAAAGGAGCCAGTTGCGTACATTGCACTCTTTATGTTTTGGGATCATTGTCCTGATAAAACTTAAAATTTGGCTTGTTGTTGCTAAATAGACCAAATTTTTTCTGCACTGGCCTTCAAATTTGATTTTAAAATATCTAGATATTGCACGGCATTCATAGTGCTTTCAATAAAGGCTAATTTGCCCACTCCATGGCTTGAGATACAGCCCCAAATCATCACTGATAATTTTCCAAATTTGATTGTTGGAATGATATTTTGTTTTTTCTAGCGCACTCAACAGCTTGCGCCATACTCTGCTTGGCCCATCGTTATAATAGAGCATCATTTTTGTTTCGTCACAAAATATTACGTCATCCCAGTACTCTTCCGCATGATCCATCATGCTCACAGCGAATGAATGACGCTTTTCTATATTGACCTCTGATAGCAAAGGCTTTTTTTCTTGCAACTCTTGAAGAGTACCTATGGCGTAGAATGACTTGGCGCACAGTTTTGTGTGGCACAACTAGGTCACATTCTTGCCTGATATCCTGAGCAAGTGATCTGACCGAGATTCAGGGGGGTTCGCAATCACTTTTCGCATAATAAGGCGGTCTACACGCTTGCTAATTTTAGTTTTGCGCCCACCACTCTTAGGTTCAAGCCTGTTCTCTTTTTTCAAGCGATTAAAACATTGTAGACGGTCTTACGGGATACAGAAAACATTTATACTAATTCTGGAATAGATTTTCCCAACTGGTGGTTTTAGTATATTATTTGGGTCACTTCAAAAGCTAATCTATTTCCAGGCATTTTTATTAAATTTAATAACTCATTCGATCAGCAAAATTTCACAAGCAAAGTAAAAAAAATTTCAATAGAAGCGTTGTAAAAAGGAATGCAAATGCCAAAAATAACGGAAAAATCGAGTTCGTTCTAAGAAAAGAGCAAAACAAAGTAGGAAAACAAAATGTGTAAGGAGTTTCTTGCCACTCTCAAAAGTGTGTAAACTTGGAATTTGTTGTTTAATTTCTTGTATATTTGATATTTTGAATTTGTTTTTTTAATTTATAAGTAAAATAAATATTGTTTAATTATATTTCATTAAAAAATTGCGTTTAATTAAAGAAATAACCCTTAATTTTGATTTAAACCTTTAAAATGAAAAATTCAACTTATTTCACGGCGTGTAAATAGTTTCTTGACAAACTGTATATATCTACAAATTTACAACTTGCCGGTACCATCTGCAAGATTCATTACATTGAGAAGTGGACTTTGACTCTCAGAATGAATTAAAACATTATATTCTTAGATTGAACTGACGAGGAACCAGACTGAACTAACTAAACTAACTATCATTTAACTAAATTTAATTGTTTGCTGATAATTTTGAGTTTCTTACAAAGATGACTAATATTAATTTTTAGTTAAAATAGTTTGCAAAACTGAATTTATGTAAATAATATGTTCAATTGATCTGGTTGGGTTTTCTGGGTCTCCCCAACACCTCGCAACGAATGCTGGATCAAAATTATTCGTCAGAAGGACGTGCACAGTCTCGTGAGTAATAAAAGTACAGCAATCTTACTTTGAGGTGGCGTGTTGGAAAGTATGTACACATTTAAGCAAAAGTCACATGGCCTGCATCAAAGACACTAGAATAATAAGATGCGTAACAGCCATACACTGGTTTGGCACTATGCAGCCACTTTTTTTTGGTGACGGCCAAAATTGCTCTCTTTCCGCTCGCTCACGCTGAGCGTAAGAAATCTAAAATAGAATTTGCTTGCTTGTGTGAGTAAAAACAAAAGACGAGAACGCGTATATGTGTGCGTGTTGTGCTAGAAGGCGATTTTCGGGCCGAAATCAATTCTGATCGCAGTAACGAATTTACATATGTACATACATATTTGGGGAGTTTTGGCCAATTTCGTAGAATATGATGAAATTGCGCGCTGTTTAAGATATCAAATTGGAATATAAAAAAAACTGAAAAGAAGTCATTACACTGAGAAAAAATATTTCATAAAAAAATAATACGAAGTAGAAAATAAAAATTTATAAAATAAAAAAAAATGTTAACTGTTTATTGCAAACGTCATATCAAATTAGAATTATTCTAGTGTCTTTGCTTTGGTCATATCTTGAGGCACGAAGTGCGGACCAAAGCACTCAACAATCATTGTCTTCTTAATACTCAAGCAGAGCGACACCGACGAAGACCCTAACTGCTTTGAAATGGCGAAGTAAAATAAAATCAAAAAAAGAGACCAAGCCCCTCCCGAAGTTCAAAGAAAACAGGATTCCCTGGACAATTCATCAAGCACCAGCGCAAATAATTTCGCTCTCTTAAGCGACGGATTGCCCGACAAAACAGGAAACAAATATAACAAAACGAAGATCTCGAAATGGTAAAGTGAAGACAGTGCAACTGATTTTGCTAAGCCCCACCTATCTTTCTCTCTGACGTCAATGGTATAAGTGAAAAGCTAACCTATCTTAAAACTAAAATTAAGAGAACTTTTTTTTATTATAAGACTCAACGTTATGGACATGTAGAGGTAATGGTTAAAAGTATTGAAGAATTCTGAAAATTAGTCAAAACACTTAATAATGATTGTGTGCAGTACCACACATACCAGCTTAAGGATGACAGAGCATTTAGAGTTGTTATTAAGAATTTGCATTTTCCACAAATTTAGATGAAATTAAAAGTGATGAAGAGTCAAAAGGTCATGTTGTTAGAAACATAAGTAATATTAAAAAGCCGTGCGACCAAAACGTCACTGAACATGTTTTATGTAGATATTGAGCCTAACAAAAAAAACCTAGACATATATAATGTAAATAAAATATTGAGCCTCCCCACAATGAAATCGTTCAATGCTATAGCTGCCAGGAATTCGGACATACTAAATCATATTGTACCAAAACGTACCGCTGTGTAAAATCCTCTTCTCGACACCCAAGCAACATTTGCCCGAAAAATACAGAACAACCAGCAAAATGTGCCAACTGCTACGAAGAACACGCCGCCAGCTACAAAGGGTGTAGAATTTATCAGGAACTCTTGTCCAAAAAAAAATAGAAAATAGAAATAATGATCTGAGTAAAATGATTTAGGAATCCAGCAAAGTTTGTTCCGCCTAACAAGCCAACATATACCCAACAAAGTAACGATTATCAATCTTATGCCCAAATTGCTGCAGGAAATAGCAAAACAAACACATCACTGGAGAGAATAGAGCAACTATTAGGAAAACAGTCTGAACTTACAAATAATTTACTTAACATGATAATGTTACTTGTAAACAAATTATGCAAGTAAATCCTAACCTTGGAATATGGAAGCGTAGTAGGAGGTGACTTCAATGCTAAGCTTCCGAAGGGAAGAAACGAACTGTACAAATGCATAGTAAACAACAGCATAACAACACTTTCAACCGGCAAGCCTACATACTGGCCTACTGATAGTAGAAAGATACCAAACTTAACCCTTTCGCACCCAACGTTGCTTGTGAGCAATTTCTATGTTTTCAGAGCTAACTGTAAGTGTGCCTTTTGTTTTTATCTGCTGATTCTTTATGATAACGGTGCTTTTATGTGTCTACTCTAAATATAAAAGCAAAAAACGCATTTGGAGATTAATTGCAGGAATTATTTGCAATAAATAGCACGCGCATCACAATAATTATTGTTTCGATATTCGGTGCAACTTTTGGAATTATTAATTTACTTTTATAATACTTTAAAAAGAACCTAAAGTATAAACAGCAAAGAGTTAACAAGACAGTGATTTAGTCAAACTTAGTAAGTAGTGAACAATAAGTAAGTAAATAATTTTCTAAGTTGCTTGTGAGCAACCTTGGGCATTCGTGATAATAATTTTCACCGAAAGTGAAAGGTTTGTCTAACGAAAGAAATTGAACAGGGATTTAAACTTCGATTGGGATATTTCTACTGACGAAGAAAGTGGTGAGGAGATGAAAGACATTTCTACGGTACTGGAGAAGAATTTAGAAGGAATTCTTGAAAGGGGAGAAAGTATCGACATTGACCTTCTGGAAAATACAGTGATTGAAGGATGTGAACCTGACTCTTGCGTTGTTGTTGACAGTTGCTTAGAGAAAATTGATCCAAAGAGGCTAAAGTGGAGAACAAGGCCGTTTGTAGCTCCAGAGAGTATTTGGGAAGATGACAAAACTTTTGATGTCGGGGACATAAAGACGACCGTGGAGTTCTTCTACACACTTTTGATACTCAGCTAATTCATTTAATGGCTAGGCAAACTGATATACAGTCATGGTCAAAATTATTTTCACAAAGTGCATTTTTGTGCATGGGTCACAAACAGTTGCTTGTGCAGCAAGTGGGGGAGGTGAAATGCAAAAAAAACTTTTGCTTTTGCAAATTCAAACCTATGCAGAGTCAGATGAAAGAAGAATTGAAAAAATAACTGTTCCTATGCGCAAGGAAGAGGCAAATGAAGAGATCTTTATCAGTTGTCAGAAGTATTTGCACACGGTTTCGTCGCATCACAATTATTTTCACAACGCAATTTCTTCTTCAGTGATTGGTTTAGAGTGACAAGTGCCGGTTTGTTTGCTTAAATACATTTAAATTATTGAATAAAAAATTAGATTTAATCATTTTCCTATTACAGTTATTAAATAAAATGCCCAAAACAAAAGAGTTAACAGTTGAGGCCCGGGCTGGTATTGTTGCTAGGTTTAAAGCCGGTACACCTGCGGCCAAAATAGCTGAAATATATCAAATTTCGCGTAGAACTGTCTACTACTTAATAAAAAAAGTTTGATACAGTTGGCACATTAAAAAATAAAAAAAAGATCAGGCCGAAAACCTGTGCTGGACCAAAAGGCAATGCAGGCAAATACTTGGAGTTGTGGCGAAGAATCCTAGTGCCAGTCCGGTAAAAAATTGCCTTAGAATCAAAAAAATACAATTGGCAAACAAGTTAGTAGTTCTACAATTCGTCGCAGGCTAAAAGAAGCTGATTTTAAGACATACTTTGTTCGCAAAACGATTGAGATCACACCAACCAACAAAACAAAACGTCTTCGATTTGCGTTGGAATATGTTAAGAAGCCTCTTGACTTTTGGTTTAATATTTTATGGACTGATGAGTCTGCATTTCAGTACCAGGGGTCATACAGCAAGCATTTTATGCATTTGAAAAATAATCAAAAGCATTTGGCAGCCCAACCAACCAATAGATTTGGTGGTGGGGGCACAGTCATGTTTTGGGGATGTCTTTCCTATTATGGATTCGGAGACTTGGTACCGATAGAAGGTACTTTAAATCAGAACGGATACCTTCTTATCTTAAACAACCATGCTTTTACGTCTGGAAATAGACTTTTTCCAACTACTGAATGGATTCTTCAGCAGGACAATGCTCCATGCCATAAGGGTAGGATACCAACAAAATTTTTAAACGACCTTAATCTGGCGGTTCTTCCGTGGCCCCCCCCCAAAGCCCAGACCTTAATATCATTGAAAACGTTTGGGCTTTTATTAAAACCAACGAACTATTGATAAAAATAGAAAACGAGAGGGAGCCATCATTGAAATAGCGGAGATTTGGTCCAAATTGACATTAGAATTTGCACAAACTTTGGTAAGGTCAATACCAAAAGACTTCAAGCAGTTATTGATGCCAAAGGTGGTGTTACAAAATATTAGTATTGTATTTATATAAAATAAAGAAATTCTTATGTTGAAATTAGATGTTAAGCTGAAATTTACTAAATTAAGTTGAGTGAAAATACTTTTGAAGCGCAATAAACATGTGAAAATACTATTGACAACTTGCATGCATATTTTCTTTTGCTTTTAAGCTTTGTACTATGAACCGTTATCTTTCGTATTTCTTTTCGACTACCTTCTGCATAGATCAAGCTAAGCGATAAGAACTATTTCAGGCAAATCGGACAACAACAAGAAGAAATATAACAAAAGAAGTTGAAGTTTGCAAATATTGTGCGTTGTGAAAATACTTTGACCACCTCTGTATATAGTTTGCAGGAGCACGGTATTGAACTTAAATGTACTGATGAGGAAATCAAACGCTACATTGGCATTTTATTGTACTTTGGTGTTTTAAAACTACCGCAATTCAGAATGGCGTGGTCAAAGTATTTAAAGATTACCGCAATAACTGATTCAATGCCGCGTGGGAGATTTAAAAAAATAAAACAATGCTTACATTTCAACGACAACGCCAAACAATTAAAAAAAGGGGATTGCAACTATGATAAACTCTACAAGATCCGCCCTTTGTTCAGAATTCTCAAAGAAAATTTTGGAAAAACTAACGCAGGAAGAGCATCAAAGTGTCGATGAGCAAATAATTGCATTCAAAGGTACGTTTTAATTTTCTTTTAAATTAGCTTTATTTTTTAATAATTGCTTTTGTTGCAGGTCGATCCACGCTTAGGCAATATAATCCAAACCTCATAAATGGGGTCTTAAAATGTTTACGCGGGCTGGAATATCTGGATTAGTTTATGATTTTATTGCTATATGTTGGAGAAGGCACTTCTCCTTCTTATGGCTTGGGAATATCATCTTATGTTGTCTTATATTTGGCAGAAAGTCTTCCCAAAGACAAAATTTTAAACTGTATTTTGATAATTGGTTTACGTCTGTAATCCTTCTGATTTCGTTGAAGGAAATAGGAATCTTTGCAACAGGTACCTGTACGTATGATAAAGTTGAACATTGGGTAGTTTTTTGGAGAAAGAGGACGTTGCAGACTGTGCAAAATTGCAACACCGATGACCAAATGCCTTACATGCAAAGTCCATCTGTGCTGCAATAACAATAAAAACTGTTTTTTGTCATACCACACTTAAATTGTCATTATAAAGAAAAATATTTCATATTCTGTGATTTATAAAAAAAAAACAATGCTTACACATCACTACTGCCCGACGTTGCTCACAAGAAAACTTTTGCTACCGCCCAAACTAATGGGCGTGGCATACCTAAAATTTTGCTAAATTTTTTCTAAAATAAATGTAAAACATTAATGATAAAACAAAATTTCACGGGTAAAAAAGTTGGGCGCGAAAGGGTTAAAAGACTTCTGTAGCATACTTTGGAATCCCAGAATCTCACATGCGAATAATGGAAAGTTTTGATCTAAGCTCAGATCATTCTCTAATAATAGTGACATACAGTACAGTAGCTCATATATTGCAAATACAGATATCAATGCATTTAAAAGTTATCTGGAAACAGCTATCAGCCTGGATATCTCGCTAAAATCAGGAGAGGAGAGCTACTGTGGAGCTACTCACAAACAAGATCCATAAAGCAAGCTATATATGTACGAAGCTACCAGCCAGAAACTCACAATCAAATCAGCTCTATCTCTCAGCTGAAACTCCGACAACAAATACAACACAAGAGAAATTTGCGTAAGAGATGGCAAGAAACTCTCTACCCTGCCGACAAAAGATCGTATAACAAGGCTGCATCTGATCGCAGAAAACTACTGTCAACTTTAAGAAATTAATCTCTCGCTGAATATCTTAGAAATCTAGATCCACATTCTTGTAACCACGAACATAATTTATGGAGTAACCAAATATCTCAAGCGACCTGCAAAAGAAACACAGTAGTCCGAAACTCTAATGGCGAATGGCGTAGATCTGATGATGAACAAGCCAAAGCATTTGCTTAACACCTGCACTCTGTATTTCAGCCAAATGATATTGATAACCCGCAAACAGAAAGGGAAGTAGATAACTTTTTTCGAGTCACCGCCAAATGAGCTTACCCATTCGTAAAATCAGTATTAATGAAGTTTCATCAGAAATGGCTAAAAAGTAAAAAGGCTCCAGATTGGGACAAAATAGATGGCATAGCCTTGAAAAAAAAAATGGGCGGTTAGAGTTGACCACTTCCCAAGCCAATGGAAATGTGCAGAAATTATAGGAATCCTTAAACCAAACAAGGCAGAAAATGAAGTGACATTGTACCGTCCCATTAGTTTGTTGTCAATATTTTCTAAAGTATTTAAAAAAAATAATTTTAAAGAGAATGTTGTCAATCTTGGAAGAATTGCTATCATACCCAAACACCAGTTTGGATTCGAAGAGGCCACGGAACCCCTGAGCAATGTCACAGGATTAAAAAATGAAATTTCGTCAGCATTTGAGAGCAAAAAATACTGCACTGCTAAATTTCTTGACGTTTAACAAGCGTTTGATCGAGTCTGGCATGATGGCTTATCATATAAAACCATATTTTATATTATTAAAGTCATACTTAACCAATAGACAATTTTATTTGCAACAAAAAAATGAATACTCGCCCTTGCACTTTATAAAAGCTGGAGTCCCACAAGGAAGAGTCTTAGTAACTGTCTTATACACCCTGTAACGGCAGATATGCCGGTAACAAATACCGCCTGTAACAAATGATACAGCTATATTAGCTACAAGCTCATCTAAAGAGGAAGCCTCACAACTCCTGCAAGCAGAGCTACGCCTTATTGAAAGCTGGTTTCTTATTTGGAAAATTAAAGTCAACGCCCTGAAATCTGCGCAAATAACTTTTGCATTAAGAAGAGGTAACTGCCCAGAAGTGTCATTTAATGGATCAGCAATCCCACAAAGTATCGATCGCAGACTAACGTGGAAACACATAAACATAAAAGCAAAGCGCCAGCAACTAAATCAAAAAAGTTTGAAGATGACCTGGTTGCTTGGCCGAAAATCTGCAACCACTCGGAAAATAAAGTCCGTTTATACAAAGCTATACTAAAGCCCATGTGGACTTATGACATACAGCTTTGGGGTACTGCCAGCAACTCAAATATTGAGATTCTACAATGCTACCAATCAAAAAATATTAAGACAAATTGTTAATGCTCCATTTTATATTTCAAATGCAAGTATCTATAAAGACTTAGGAATCCCTTATGTTAAAGAAGAAATAGCAAAACATATTAAAAATATATAGACAGACCAAGAACACATGAAAATAACTTAGCCTTAAATTTGGTAAATAA diff -r 000000000000 -r 60573349e9ae test-data/out_gfa.gfa1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/out_gfa.gfa1 Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,2 @@ +H VN:Z:1.0 +S 0 TCACCTTTCTGCGTTCTCCGGATTTTTTCGCACGTGACTGCCCAGTTCGCTAAGGCTCGATTCCGATCTTAGCTTCCGAAGCATCTCTGCGTACGAAGCCTCCTCCTGTCTTTTTTTTTACGATGAGTGCCTCTGCACCCGTGCTAGCATTCTTGGCGACAGATGCATAGCTGCCTCGGCTTGGACTCGTTAGGTATGGATGTCGCCTTTTCTTCACCGCTTGCCATCCAACGTAGGGTTGCTCTGCTTCGGCGCCTGGACTTTGGCACCTGCACCGTGGGTACCTGCGCATTTTGTGGAGCCTTTTGGTAGGCTTTGTACCTCCGTCTGGGTAGCGCTGCTCTTCAAGCGGTGCTCGCTAGTAGTACCTTCTTGTACAGCTCTATCGCCCCTGTTGTTAAGGGCTGAGAGTTCGGAAGCTATGCCCTTTGTCTCTCATGTGTGTCGTTGGGTCTCGAATGCGGATAGAAGGGGGGCTGATCTTGCCATTCATCCTGGTAAGTATGCCCCTCAGGTCCTCGTTCTGGAGAGCAGTGGTCAAGTCCGAAGACCGATGAGGGGAACCAGCTGGGGACTTCCCTCCCGTCTTTTGCGATGGCACGGCGATGTGGTCCATCGTCTTCTGACTTGTCGCGGTCGTAGATGCTGTAGGAGCCAATTTCTCCACCTCTACAGCATCGCTGCAGTCGATAGTCAACGGCGGCTGGGGCCTGCGTGCTCACCCCCTTTGCCACCGACGGGACCGAGATTCCGTCACCATGGGTCGGGTTACCGACTCCTCTGGTGGGGGATCTCGAAAGTCGGGAGCTCCTCCTGAACGGGTCGTTGCGATCAGGGGACTGCCCCCACTGCGCTGTCCATCAACCGAAGGATGGCCTAAGGTTACCTAGGGTCACGTAGGCCACGGATTTCCCCGGCTTTTACGGATGGAGGTTTGTACCGCCTCGACTCGGACACCAGAGCCTCTGCTTAGGCACCAGCACGGTGAGAGGATGATATTTGGTCTGTCCGCGACCTTTGTGCCTTTTCCTTTTCCCCTTTCTTAAAGACTTGTGCGCTCCCCAGTTACCAGAATCAAAATTAAATTAAATTAAAAAATTTCAACGGCTTAATTTTTAAATTTAATTTTGAATTTCGCGCCCTACTGTCGCAACACAACACTGATCACACGGTTGATCTGGCAACGCCCCTCCCTCTCCAGATCGTCCCGCTGCGCTATCAGCTGTTTATCCGCTGCAACAATCGCAAGATAATAAATTACCTATTTACATGAAACAGGCGCACAATTAACTTCGCGTGATTGCAGCGCAGAACTATGGCGCGACTCCACCGTGTGATTTTGCCAGTTTGCCGCACACACCGGCCGACACAACTTCTATGGTTTCGAGTATTTCGCGCCGCGTAATTTAAGACGTCCGTCTTCACGGCGATGTAGACTTGGTCTCCGCACCAGGATTGAGTGTCTAAGCCTGTGCGTTCAGGATTAAACTTTGGCAATACGACAGCATTGAGTTTTTGGGTCTCTTTGTGAGTTTTGCACTTCTTTTAACAGTTCAGAAAAATGGCGATTCTGCGACTCTAGAATTGTCAGCAAATTGTTTTCACTATTGTAGTATGCACACATATCGGTTAAGCACTGTACCTATGTGTATTCATAATTGTAGCACTCTGTTGCAATGTGTACATAAACAGTCCAGCACAAGTGTATACGTAATACGAGCACCCACTTGAGGGGCTAACATACATAATTGCCTGGTCAGCAGTTCTCCCGCTGGCCAAGCGCTGATCGCTTATATGTGTGCCTATACCACTCCTCCTCCAGCACCATCGCTCGGCGACAGTACATATATATATACATATATATAAGATACGCATATAAGCGTTGCTGCGCTGCAGGCTATGCCGGCAGCGCTGCTCCTCGACTTAGGCTAAGAAACCTTTGTATGTAGATCATAAGAGGATTGACGAATTAATTTCGAATGGAGCGGGACCTTCCCTGTTCCTCAAATTGGATCAAATAAAGAACAGCTAAAACACAAATGATCTATGACACAATGAAACTACAGGAAGTTGGAGTAGGCGGTCCCACTTCTGATGTCGGATCTGAATCACTTTATACTCGGCATCACTCTCTACAGCGGACACAAAGTAACAGAAAACGGTCGTTAACTTGAAATTAAAAATAAATCTGCGACAAGTACAGTTTGTCAAGAAACTGTTTACACACCGTGAAATAAGATGAATTTTTGATTTTAACGGTCAAAATTAAGGGTTATTTGCTTAATTAAACGCAATTTTTTTTTTAGGAAATATAATTAAACAATATTTATTTTACTTATAAATTAAAAAACAAATTCAAAATATCAAATATACAAGAAAATAAATAACAAACTTCCAAGTTTACACACTTTTGAGAGTGTCACTCTGCCCAAACCGTCATCTCTGGGATGAGCTGATAGGTCCACCTCCCCCCGTCGCGACGTTTGCCATCTGCTCTGCCATTCACCTAATAGCCACTCGTGTGCCTCTTGCCTGGAAGCGCCACTCCGCATAAGGCTGAGAGCCTTGATCTCCAGATCAATCGGCAGGCCTGCCAGCGCTAGCGCCGCGTCTTCGGATATGGTCCTGAATCCTCTAATGAGCCTGAGGGCCATTGACCGTAGCACCGAACGAGCTCCTTTCAGGTATGAGACCCTGCAAGTGGCATTGCTCCAGACTGGTGCAGCGTATAGCAGCGAAGCCTTTGCTACTGACACCAGCAGTTTCCTGGCCGGGTGTCTTGGGCCTCCGACGTTGGGCATGCCTCGCCAACGAAGAGGATGTGACTGCTGTCTTCTTGCTGGCGTAGCTCGCGTGGTCCTTGAACGATAGTCTGCGATCTATCATTACCCCCAGGTACTTTAGGGACTCTTGAGAGGTCCCCTGAGTACCCTTGACGGAGACCAGCATGTTCTCCATCTTTTCCTGCTGCTTAGTAGGACTGCTTCGGTCTTGTGAGCCGCTATTGCTAGCCCGGCTGTGATTGCCACATCGTCAGCGAAACAGCTGCCTCGACGACTTCAAGTTCTGTGACGCACGGGAAATCTGGGGCAGGGGCTGCCTCTGTTGGCCTCCATAGTGTGGTCTGCTTTGGAAATAGCTCCCCTAGTATGTTAGCCAGGACCCCCGGGTCGGATGGGGTTGCCGCTCCTCCTCCTCCTTAGCTGCTTGGTAACAAGCTTGTAGGCGAGGCCCCAGATATCGCTGTCTACGCCATCCTGCAGCTCCTTAAACGACCGCGCTTTGGCAGCCGCGATGCCGTGCTTGAACTCTAGGCGTTTGCTTCTGAAAGCCTCCAAGAGTTCCGCGTGGTGGAGTACTGCCTCTGGCTCGTTGCGCCGTTCTCTTAGCCCTGAGGCAATCAGACCGTAGTTGGCTTAGGGAGGCACTCCACCAGTAAACGGGTGGTTTGCGCTGTGCCTTATTTTTTCCTTGGCATGATTGCGTCGCAGATTCTTCCCAGCATATTCATGAGGCCTGCCGCCATACTCTCTGCGTCCACATTTGGGATTTCCAGGGGAATTGATCTGATAGGCCAGCATGGCCTCATCGATCTTCCTGGTGTCCCATGTTTTCCCGGCTGTTCTACTCTGCCGTCTTTTGGGCATGTCCCTCCGGGGAGAAGGAGATCAGGGCATGGTCGCTCAGCGTCATGACGTCATGGACCATCCAGTTGTTGTTGTCTACTAGCCCTCTGCTGACAAAGGTAACGTCAATAAAGGACGTACCCCTATCGTTGTTAAACGTCGGCTTCCGTCCATCGTTCAGCAGTATGAGGTCCAGCATTCGCATGGCGTCAATCACAGCTCGTCCTCTGGTGTTGGATGTCCTGCTGCCCCATTCCACTGTCCAGGCATTAAAGTCGCCGGTATGACCTTCGGGCTTGCCCTCTCGCATGGTCCACGAGCGCCTCCAGAAGCCCTCGAACTGATCGGGGGTGTCGCTCGGCGGAGCGTAGCAGCTGTACATGTGCACGTGTTTTAACTTCGCATAAGCGATACCCCGCATGGGTAAAGCAGCCAGTTCCTGGACTTGAGAGAGCTGCAGCATTTGATAGCTGCTTTTACCTGCCTCGTCAAGGATCATGGACGATTGTCCACTACCAGAGACGTAGGGTTCGCTTAGGAGCATGATGTCTACATTGCGCTCAACCGCAGTCTGGGCCAGGAGGCTCTGAGCTGCTGCGCAATGATTGACATTGAGCTGTACTACGCTAATATGAGCGTGCATTAAGGTGGCTCTTGGCATCTTTTAGTGTCGCTCTGTAAGTCGGGCACGCAAAGCTACCCGTCGGGTGGTTTCTGTCCACCTCGCTGCTGCAGATCAGGCATTTTGGTGCAGCAACGCACCCCTTTGCCTTGTGCCCACGCTCACCGCATCTAAGACAGCAGTCTGCCCTGTCAGTGTCCTTGCAGGTTGCTGATCGATGCCCATAGCCGAGACACCTGTAGCATCTCGTGGGTCGGACGTCCTGGGTGATACGACATCTTGACCATCCAACGATTATGGTGCCCTGTTTAAGGACTGGTATCGCAACGTTCGCGTTCAGCAGCACTGAGGCTATTTGCTTTGCAATTCCGCATACTGCGAAGGCCCCTGATATCTTCAGGATTTATCTGCAGGCCCTGGAATTGGGCGACCAAGCAGCTGTGGAGCTTCTCTGCTGTCGTAGCCTCGTCCAATCCGCTGCAAGATAGAGCTATTCTTTGCGCTCCCTGTGCGCACAGAGGTTAAGTCATTGAGCGCCGCTTCCAGGTCGCTCTTAAACTTGGGAACGCTTTCGAAGCTTTCCCCTCTACCTCAAGCAACAGATCACCTTTCTGCGTTCTCTCCGGATTTTTTCGCACGTGACTGCCCAGTTCGCTAAGGCTCGATTCCGATCTTAGCTTCCGAAGCATCTCTGCGTACGAAGCCTCTCCTGTCTTTTTACGATGAGTGCCTCTGCACCCGTGCTAGCATTCTTGGCGACAGATGCATAGCTGCCTGGCTTGGACTCGTTAGGTATGGATGTCGCCTTTTCTTCACCGTTGCCATCCAACGTAGGGTTGCTCTGCTTCGGCGCCTGGACTTTGGCACCTGCACCGTGGGTACCTGCGCATTTTGTGGAGCCTTTTGGTAGGCTTTTGTACCTCCGTCTGGGTAGCGCTGCTCTTCAAGCGGTGCTCGCTAAGTAGTACCTTCGTACAGCTCTATCGCCCTGTTGTTAAGGGCTGAGAGTTCGGAAGCTATGCCCTTTGTCTCATGTGTGTCGTTGGGTCTCGAATGCGGATAGAAGGGGGCTGATCTTGCCATTCATCCTGGTAAGTATGCCCCTCAGGTCTCGTTCTGGAGAGCAGTGGTCAAGTCCGAAGACCGATGAGGGGAACAAGCTGGGGACTTCCCTCCCGTCTTTTGCGATGGCACGGCGATGTGGTCCATCGTCTTCTGACTTGTCGCGGTCGTAGATGCTGTAGGAGCCAATTTCTCCACCTCTACAGCATCGCTGCAGTCGATAGTCAACGGCGGCTGGGGGCCTGCGTGCTCACCCCTTGCCACCGACGGGACCGAGATTCCGTCACCATGGGTCGGGTTACCGACTCCTCTGGTGGGGGGATCTCGAAAGTCGGGAGCTCCTCCTGAACGGGTCGTTGCGATCAGGGGACTGCCCCCCACTGCGCTGTCCATCAACTGAAGGATGGCCTAAGGTTACCTAGGGTCACGTAGGCCACGGATTTCCCCCTGGCTTTTACGGATGGAGGTTTGTACCGCCTCGACTCGGACACCAGAGCCTCTGCTTAGGCACCAGCACGGTGAGAGGATGATATTTGGTCTGTCCGCGACCTTTGTGCCTTTTCCCCTTTCTTAAAGACTTGTGCGCTCCCAGTTACCAGAATCAAAATTAAATTAAATTAAATTTCAACGGCTTAATTTTAAATTTAATTTTGAATTTCGCGCCCTACTGTCGCAACACAACACTGATCACACGGTTGATCTGGCAACGCCTCCCTCTCCAGATCGCCCGCTGCGCTATCAGCTGTTTATCCGCTGCAACAATCGCAAGATAATAAATTACCTATTTACATGAAACAGGCGCACAATTAACTCGCGTGATTGCAGCGCAGAACTATGGCGCGACTCCACCGTGTGATTTTGCCAGTTTGCCGCACACACCGGCCGACACAACTTCTATGGTTTCGAGTATTTCGCGCCGCGTAATTTAAGACGTCCGTCTTCACGGCGATGTAGACTTGGTCTCCGCACCAGGATTGAGTGTCTAAGCCTGTGCGTTCAGGATTAAACTTTGGCAATACGACAGCATTGAGTTTTTTGGGTCTCTTTGTGAGTTTTGCACTTCTTTTAACAGTTCAGAAAAATGGCGATTCTGCGACTCTAGAATTGTCAGCAAATTGTTTTCACTATTGTAGTATGCACACATATCGGTTAAGCACTGTACCTATGTGTATTCATAATTGTAGCACTCTGTTGCAATGTGTACATAAACAGTCCAGCACAAGTGTATACGTAATACGAGCACCCACTTGAGGGCTAACATACATAATTGCCTGGTCAGCAGTTCTCCCTGCTGGCAAGCGCTGATCGCTTATATGTGTGCCTATACCACTCCTCCTCCAGCACCATCGCTCGGCGACAGTACATATATATATACATATATATAAGATACGCATATAAGCGTTGCTGCGCTGCAGGCTATGCCGGCAGCGCTGCTCCTCGACTTAGGCTAAGAAACCTTTGTATGTAGATCATAAGAGGATTGACGAATTAATTTCGAATGGAGCGGGACCTTCCCTGTTCCTCAAATTGGATCAAATAAAGAACAGCTAAAACACAAATGATCTATGACACAATGAAACTACAGGAAGTTGGAGTAGGCGGTCCCACTTCTGATGTCGGATCTGAATCACTTTATACTCGGCATCACTCTCTACAGCGGACACAAAGTAACAGAAAACGGTCGTTAACTTGAAATTAAAATAAATCTGCGACAAGTACAGTTTGTCAAGAAACTGTTTACACACCGTGAAATAAGATGAATTTTTTGATTTTTAACGGTCAAAATTAAGGGTTATTTGCTTAATTAAACGCAATTTTTTTTTAGGAAATATAATTAAACAATATTTATTTTACTTATAAATTAAAAAACAAATTCAAAATATCAAATATACAAGAAAATAAACAACGAATTCCAAGTTTAAAGCACTTTTGAGAGTTTCAAGAAACTCTTTACACAAAAACACTAAACCTAAGTTTAATCCTAAATTTTTAAATTATTTTGTTAAAATTTGAAAAGTTGTAGTATTTAGTATGACCCCCCATTGGCTTTGGCTACAAGTTGAAGCTTTTTTTTCATGGAATGGATGAGTTTTTTTTAGGTCATATTCAAGCGGGATCTTTTCCCACTCTATCGCAGCCATGAGCTGTTGTCGTGTTTTGGTGCCCCTTTTGCCACATTCTTCTTTAAGTAGGCCCACAAATTTTCAATGGGGTTCAGATCAAGACTCTGAGGGGGCGTATCGATCACCTTGCCACAGTTATAAAGGAGCCAGTTGCGTACATTGCACTCTTTATGTTTTGGGATCATTGTCCTGATAAAACTTAAAATTTGGCTTGTTGTTGCTAAATAGACCAAATTTTTTCTGCACTGGCCTTCAAATTTGATTTTAAAATATCTAGATATTGCACGGCATTCATAGTGCTTTCAATAAAGGCTAATTTGCCCACTCCATGGCTTGAGATACAGCCCCAAATCATCACTGATAATTTTCCAAATTTGATTGTTGGAATGATATTTTGTTTTTTCTAGCGCACTCAACAGCTTGCGCCATACTCTGCTTGGCCCATCGTTATAATAGAGCATCATTTTTGTTTCGTCACAAAATATTACGTCATCCCAGTACTCTTCCGCATGATCCATCATGCTCACAGCGAATGAATGACGCTTTTCTATATTGACCTCTGATAGCAAAGGCTTTTTTTCTTGCAACTCTTGAAGAGTACCTATGGCGTAGAATGACTTGGCGCACAGTTTTGTGTGGCACAACTAGGTCACATTCTTGCCTGATATCCTGAGCAAGTGATCTGACCGAGATTCAGGGGGGTTCGCAATCACTTTTCGCATAATAAGGCGGTCTACACGCTTGCTAATTTTAGTTTTGCGCCCACCACTCTTAGGTTCAAGCCTGTTCTCTTTTTTCAAGCGATTAAAACATTGTAGACGGTCTTACGGGATACAGAAAACATTTATACTAATTCTGGAATAGATTTTCCCAACTGGTGGTTTTAGTATATTATTTGGGTCACTTCAAAAGCTAATCTATTTCCAGGCATTTTTATTAAATTTAATAACTCATTCGATCAGCAAAATTTCACAAGCAAAGTAAAAAAAATTTCAATAGAAGCGTTGTAAAAAGGAATGCAAATGCCAAAAATAACGGAAAAATCGAGTTCGTTCTAAGAAAAGAGCAAAACAAAGTAGGAAAACAAAATGTGTAAGGAGTTTCTTGCCACTCTCAAAAGTGTGTAAACTTGGAATTTGTTGTTTAATTTCTTGTATATTTGATATTTTGAATTTGTTTTTTTAATTTATAAGTAAAATAAATATTGTTTAATTATATTTCATTAAAAAATTGCGTTTAATTAAAGAAATAACCCTTAATTTTGATTTAAACCTTTAAAATGAAAAATTCAACTTATTTCACGGCGTGTAAATAGTTTCTTGACAAACTGTATATATCTACAAATTTACAACTTGCCGGTACCATCTGCAAGATTCATTACATTGAGAAGTGGACTTTGACTCTCAGAATGAATTAAAACATTATATTCTTAGATTGAACTGACGAGGAACCAGACTGAACTAACTAAACTAACTATCATTTAACTAAATTTAATTGTTTGCTGATAATTTTGAGTTTCTTACAAAGATGACTAATATTAATTTTTAGTTAAAATAGTTTGCAAAACTGAATTTATGTAAATAATATGTTCAATTGATCTGGTTGGGTTTTCTGGGTCTCCCCAACACCTCGCAACGAATGCTGGATCAAAATTATTCGTCAGAAGGACGTGCACAGTCTCGTGAGTAATAAAAGTACAGCAATCTTACTTTGAGGTGGCGTGTTGGAAAGTATGTACACATTTAAGCAAAAGTCACATGGCCTGCATCAAAGACACTAGAATAATAAGATGCGTAACAGCCATACACTGGTTTGGCACTATGCAGCCACTTTTTTTTGGTGACGGCCAAAATTGCTCTCTTTCCGCTCGCTCACGCTGAGCGTAAGAAATCTAAAATAGAATTTGCTTGCTTGTGTGAGTAAAAACAAAAGACGAGAACGCGTATATGTGTGCGTGTTGTGCTAGAAGGCGATTTTCGGGCCGAAATCAATTCTGATCGCAGTAACGAATTTACATATGTACATACATATTTGGGGAGTTTTGGCCAATTTCGTAGAATATGATGAAATTGCGCGCTGTTTAAGATATCAAATTGGAATATAAAAAAAACTGAAAAGAAGTCATTACACTGAGAAAAAATATTTCATAAAAAAATAATACGAAGTAGAAAATAAAAATTTATAAAATAAAAAAAAATGTTAACTGTTTATTGCAAACGTCATATCAAATTAGAATTATTCTAGTGTCTTTGCTTTGGTCATATCTTGAGGCACGAAGTGCGGACCAAAGCACTCAACAATCATTGTCTTCTTAATACTCAAGCAGAGCGACACCGACGAAGACCCTAACTGCTTTGAAATGGCGAAGTAAAATAAAATCAAAAAAAGAGACCAAGCCCCTCCCGAAGTTCAAAGAAAACAGGATTCCCTGGACAATTCATCAAGCACCAGCGCAAATAATTTCGCTCTCTTAAGCGACGGATTGCCCGACAAAACAGGAAACAAATATAACAAAACGAAGATCTCGAAATGGTAAAGTGAAGACAGTGCAACTGATTTTGCTAAGCCCCACCTATCTTTCTCTCTGACGTCAATGGTATAAGTGAAAAGCTAACCTATCTTAAAACTAAAATTAAGAGAACTTTTTTTTATTATAAGACTCAACGTTATGGACATGTAGAGGTAATGGTTAAAAGTATTGAAGAATTCTGAAAATTAGTCAAAACACTTAATAATGATTGTGTGCAGTACCACACATACCAGCTTAAGGATGACAGAGCATTTAGAGTTGTTATTAAGAATTTGCATTTTCCACAAATTTAGATGAAATTAAAAGTGATGAAGAGTCAAAAGGTCATGTTGTTAGAAACATAAGTAATATTAAAAAGCCGTGCGACCAAAACGTCACTGAACATGTTTTATGTAGATATTGAGCCTAACAAAAAAAACCTAGACATATATAATGTAAATAAAATATTGAGCCTCCCCACAATGAAATCGTTCAATGCTATAGCTGCCAGGAATTCGGACATACTAAATCATATTGTACCAAAACGTACCGCTGTGTAAAATCCTCTTCTCGACACCCAAGCAACATTTGCCCGAAAAATACAGAACAACCAGCAAAATGTGCCAACTGCTACGAAGAACACGCCGCCAGCTACAAAGGGTGTAGAATTTATCAGGAACTCTTGTCCAAAAAAAAATAGAAAATAGAAATAATGATCTGAGTAAAATGATTTAGGAATCCAGCAAAGTTTGTTCCGCCTAACAAGCCAACATATACCCAACAAAGTAACGATTATCAATCTTATGCCCAAATTGCTGCAGGAAATAGCAAAACAAACACATCACTGGAGAGAATAGAGCAACTATTAGGAAAACAGTCTGAACTTACAAATAATTTACTTAACATGATAATGTTACTTGTAAACAAATTATGCAAGTAAATCCTAACCTTGGAATATGGAAGCGTAGTAGGAGGTGACTTCAATGCTAAGCTTCCGAAGGGAAGAAACGAACTGTACAAATGCATAGTAAACAACAGCATAACAACACTTTCAACCGGCAAGCCTACATACTGGCCTACTGATAGTAGAAAGATACCAAACTTAACCCTTTCGCACCCAACGTTGCTTGTGAGCAATTTCTATGTTTTCAGAGCTAACTGTAAGTGTGCCTTTTGTTTTTATCTGCTGATTCTTTATGATAACGGTGCTTTTATGTGTCTACTCTAAATATAAAAGCAAAAAACGCATTTGGAGATTAATTGCAGGAATTATTTGCAATAAATAGCACGCGCATCACAATAATTATTGTTTCGATATTCGGTGCAACTTTTGGAATTATTAATTTACTTTTATAATACTTTAAAAAGAACCTAAAGTATAAACAGCAAAGAGTTAACAAGACAGTGATTTAGTCAAACTTAGTAAGTAGTGAACAATAAGTAAGTAAATAATTTTCTAAGTTGCTTGTGAGCAACCTTGGGCATTCGTGATAATAATTTTCACCGAAAGTGAAAGGTTTGTCTAACGAAAGAAATTGAACAGGGATTTAAACTTCGATTGGGATATTTCTACTGACGAAGAAAGTGGTGAGGAGATGAAAGACATTTCTACGGTACTGGAGAAGAATTTAGAAGGAATTCTTGAAAGGGGAGAAAGTATCGACATTGACCTTCTGGAAAATACAGTGATTGAAGGATGTGAACCTGACTCTTGCGTTGTTGTTGACAGTTGCTTAGAGAAAATTGATCCAAAGAGGCTAAAGTGGAGAACAAGGCCGTTTGTAGCTCCAGAGAGTATTTGGGAAGATGACAAAACTTTTGATGTCGGGGACATAAAGACGACCGTGGAGTTCTTCTACACACTTTTGATACTCAGCTAATTCATTTAATGGCTAGGCAAACTGATATACAGTCATGGTCAAAATTATTTTCACAAAGTGCATTTTTGTGCATGGGTCACAAACAGTTGCTTGTGCAGCAAGTGGGGGAGGTGAAATGCAAAAAAAACTTTTGCTTTTGCAAATTCAAACCTATGCAGAGTCAGATGAAAGAAGAATTGAAAAAATAACTGTTCCTATGCGCAAGGAAGAGGCAAATGAAGAGATCTTTATCAGTTGTCAGAAGTATTTGCACACGGTTTCGTCGCATCACAATTATTTTCACAACGCAATTTCTTCTTCAGTGATTGGTTTAGAGTGACAAGTGCCGGTTTGTTTGCTTAAATACATTTAAATTATTGAATAAAAAATTAGATTTAATCATTTTCCTATTACAGTTATTAAATAAAATGCCCAAAACAAAAGAGTTAACAGTTGAGGCCCGGGCTGGTATTGTTGCTAGGTTTAAAGCCGGTACACCTGCGGCCAAAATAGCTGAAATATATCAAATTTCGCGTAGAACTGTCTACTACTTAATAAAAAAAGTTTGATACAGTTGGCACATTAAAAAATAAAAAAAAGATCAGGCCGAAAACCTGTGCTGGACCAAAAGGCAATGCAGGCAAATACTTGGAGTTGTGGCGAAGAATCCTAGTGCCAGTCCGGTAAAAAATTGCCTTAGAATCAAAAAAATACAATTGGCAAACAAGTTAGTAGTTCTACAATTCGTCGCAGGCTAAAAGAAGCTGATTTTAAGACATACTTTGTTCGCAAAACGATTGAGATCACACCAACCAACAAAACAAAACGTCTTCGATTTGCGTTGGAATATGTTAAGAAGCCTCTTGACTTTTGGTTTAATATTTTATGGACTGATGAGTCTGCATTTCAGTACCAGGGGTCATACAGCAAGCATTTTATGCATTTGAAAAATAATCAAAAGCATTTGGCAGCCCAACCAACCAATAGATTTGGTGGTGGGGGCACAGTCATGTTTTGGGGATGTCTTTCCTATTATGGATTCGGAGACTTGGTACCGATAGAAGGTACTTTAAATCAGAACGGATACCTTCTTATCTTAAACAACCATGCTTTTACGTCTGGAAATAGACTTTTTCCAACTACTGAATGGATTCTTCAGCAGGACAATGCTCCATGCCATAAGGGTAGGATACCAACAAAATTTTTAAACGACCTTAATCTGGCGGTTCTTCCGTGGCCCCCCCCCAAAGCCCAGACCTTAATATCATTGAAAACGTTTGGGCTTTTATTAAAACCAACGAACTATTGATAAAAATAGAAAACGAGAGGGAGCCATCATTGAAATAGCGGAGATTTGGTCCAAATTGACATTAGAATTTGCACAAACTTTGGTAAGGTCAATACCAAAAGACTTCAAGCAGTTATTGATGCCAAAGGTGGTGTTACAAAATATTAGTATTGTATTTATATAAAATAAAGAAATTCTTATGTTGAAATTAGATGTTAAGCTGAAATTTACTAAATTAAGTTGAGTGAAAATACTTTTGAAGCGCAATAAACATGTGAAAATACTATTGACAACTTGCATGCATATTTTCTTTTGCTTTTAAGCTTTGTACTATGAACCGTTATCTTTCGTATTTCTTTTCGACTACCTTCTGCATAGATCAAGCTAAGCGATAAGAACTATTTCAGGCAAATCGGACAACAACAAGAAGAAATATAACAAAAGAAGTTGAAGTTTGCAAATATTGTGCGTTGTGAAAATACTTTGACCACCTCTGTATATAGTTTGCAGGAGCACGGTATTGAACTTAAATGTACTGATGAGGAAATCAAACGCTACATTGGCATTTTATTGTACTTTGGTGTTTTAAAACTACCGCAATTCAGAATGGCGTGGTCAAAGTATTTAAAGATTACCGCAATAACTGATTCAATGCCGCGTGGGAGATTTAAAAAAATAAAACAATGCTTACATTTCAACGACAACGCCAAACAATTAAAAAAAGGGGATTGCAACTATGATAAACTCTACAAGATCCGCCCTTTGTTCAGAATTCTCAAAGAAAATTTTGGAAAAACTAACGCAGGAAGAGCATCAAAGTGTCGATGAGCAAATAATTGCATTCAAAGGTACGTTTTAATTTTCTTTTAAATTAGCTTTATTTTTTAATAATTGCTTTTGTTGCAGGTCGATCCACGCTTAGGCAATATAATCCAAACCTCATAAATGGGGTCTTAAAATGTTTACGCGGGCTGGAATATCTGGATTAGTTTATGATTTTATTGCTATATGTTGGAGAAGGCACTTCTCCTTCTTATGGCTTGGGAATATCATCTTATGTTGTCTTATATTTGGCAGAAAGTCTTCCCAAAGACAAAATTTTAAACTGTATTTTGATAATTGGTTTACGTCTGTAATCCTTCTGATTTCGTTGAAGGAAATAGGAATCTTTGCAACAGGTACCTGTACGTATGATAAAGTTGAACATTGGGTAGTTTTTTGGAGAAAGAGGACGTTGCAGACTGTGCAAAATTGCAACACCGATGACCAAATGCCTTACATGCAAAGTCCATCTGTGCTGCAATAACAATAAAAACTGTTTTTTGTCATACCACACTTAAATTGTCATTATAAAGAAAAATATTTCATATTCTGTGATTTATAAAAAAAAAACAATGCTTACACATCACTACTGCCCGACGTTGCTCACAAGAAAACTTTTGCTACCGCCCAAACTAATGGGCGTGGCATACCTAAAATTTTGCTAAATTTTTTCTAAAATAAATGTAAAACATTAATGATAAAACAAAATTTCACGGGTAAAAAAGTTGGGCGCGAAAGGGTTAAAAGACTTCTGTAGCATACTTTGGAATCCCAGAATCTCACATGCGAATAATGGAAAGTTTTGATCTAAGCTCAGATCATTCTCTAATAATAGTGACATACAGTACAGTAGCTCATATATTGCAAATACAGATATCAATGCATTTAAAAGTTATCTGGAAACAGCTATCAGCCTGGATATCTCGCTAAAATCAGGAGAGGAGAGCTACTGTGGAGCTACTCACAAACAAGATCCATAAAGCAAGCTATATATGTACGAAGCTACCAGCCAGAAACTCACAATCAAATCAGCTCTATCTCTCAGCTGAAACTCCGACAACAAATACAACACAAGAGAAATTTGCGTAAGAGATGGCAAGAAACTCTCTACCCTGCCGACAAAAGATCGTATAACAAGGCTGCATCTGATCGCAGAAAACTACTGTCAACTTTAAGAAATTAATCTCTCGCTGAATATCTTAGAAATCTAGATCCACATTCTTGTAACCACGAACATAATTTATGGAGTAACCAAATATCTCAAGCGACCTGCAAAAGAAACACAGTAGTCCGAAACTCTAATGGCGAATGGCGTAGATCTGATGATGAACAAGCCAAAGCATTTGCTTAACACCTGCACTCTGTATTTCAGCCAAATGATATTGATAACCCGCAAACAGAAAGGGAAGTAGATAACTTTTTTCGAGTCACCGCCAAATGAGCTTACCCATTCGTAAAATCAGTATTAATGAAGTTTCATCAGAAATGGCTAAAAAGTAAAAAGGCTCCAGATTGGGACAAAATAGATGGCATAGCCTTGAAAAAAAAAATGGGCGGTTAGAGTTGACCACTTCCCAAGCCAATGGAAATGTGCAGAAATTATAGGAATCCTTAAACCAAACAAGGCAGAAAATGAAGTGACATTGTACCGTCCCATTAGTTTGTTGTCAATATTTTCTAAAGTATTTAAAAAAAATAATTTTAAAGAGAATGTTGTCAATCTTGGAAGAATTGCTATCATACCCAAACACCAGTTTGGATTCGAAGAGGCCACGGAACCCCTGAGCAATGTCACAGGATTAAAAAATGAAATTTCGTCAGCATTTGAGAGCAAAAAATACTGCACTGCTAAATTTCTTGACGTTTAACAAGCGTTTGATCGAGTCTGGCATGATGGCTTATCATATAAAACCATATTTTATATTATTAAAGTCATACTTAACCAATAGACAATTTTATTTGCAACAAAAAAATGAATACTCGCCCTTGCACTTTATAAAAGCTGGAGTCCCACAAGGAAGAGTCTTAGTAACTGTCTTATACACCCTGTAACGGCAGATATGCCGGTAACAAATACCGCCTGTAACAAATGATACAGCTATATTAGCTACAAGCTCATCTAAAGAGGAAGCCTCACAACTCCTGCAAGCAGAGCTACGCCTTATTGAAAGCTGGTTTCTTATTTGGAAAATTAAAGTCAACGCCCTGAAATCTGCGCAAATAACTTTTGCATTAAGAAGAGGTAACTGCCCAGAAGTGTCATTTAATGGATCAGCAATCCCACAAAGTATCGATCGCAGACTAACGTGGAAACACATAAACATAAAAGCAAAGCGCCAGCAACTAAATCAAAAAAGTTTGAAGATGACCTGGTTGCTTGGCCGAAAATCTGCAACCACTCGGAAAATAAAGTCCGTTTATACAAAGCTATACTAAAGCCCATGTGGACTTATGACATACAGCTTTGGGGTACTGCCAGCAACTCAAATATTGAGATTCTACAATGCTACCAATCAAAAAATATTAAGACAAATTGTTAATGCTCCATTTTATATTTCAAATGCAAGTATCTATAAAGACTTAGGAATCCCTTATGTTAAAGAAGAAATAGCAAAACATATTAAAAATATATAGACAGACCAAGAACACATGAAAATAACTTAGCCTTAAATTTGGTAAATAA RC:i:105426 diff -r 000000000000 -r 60573349e9ae test-data/out_reads.csv --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/out_reads.csv Wed Nov 11 21:54:51 2020 +0000 @@ -0,0 +1,59 @@ +AssembledSegmentId,EdgeCount,OrientedReadCount,OrientedReadId,VertexCount,EdgeCount +0,478,29,1-0,138,109 +0,478,29,2-1,137,115 +0,478,29,3-1,85,69 +0,478,29,6-1,146,114 +0,478,29,8-1,161,130 +0,478,29,9-1,167,141 +0,478,29,10-1,223,196 +0,478,29,11-0,231,188 +0,478,29,13-0,292,229 +0,478,29,15-1,274,246 +0,478,29,16-1,262,213 +0,478,29,17-1,305,255 +0,478,29,19-0,139,103 +0,478,29,22-0,232,172 +0,478,29,23-0,360,330 +0,478,29,24-1,282,233 +0,478,29,26-0,346,301 +0,478,29,27-0,147,100 +0,478,29,28-0,245,230 +0,478,29,29-0,220,198 +0,478,29,30-1,179,149 +0,478,29,31-0,166,140 +0,478,29,33-1,140,126 +0,478,29,36-1,105,91 +0,478,29,38-0,90,82 +0,478,29,39-1,68,62 +0,478,29,40-1,85,76 +0,478,29,41-1,87,81 +0,478,29,42-1,77,69 +1,478,29,1-1,138,109 +1,478,29,2-0,137,115 +1,478,29,3-0,85,69 +1,478,29,6-0,146,114 +1,478,29,8-0,161,130 +1,478,29,9-0,167,141 +1,478,29,10-0,223,196 +1,478,29,11-1,231,188 +1,478,29,13-1,292,229 +1,478,29,15-0,274,246 +1,478,29,16-0,262,213 +1,478,29,17-0,305,255 +1,478,29,19-1,139,103 +1,478,29,22-1,232,172 +1,478,29,23-1,360,330 +1,478,29,24-0,282,233 +1,478,29,26-1,346,301 +1,478,29,27-1,147,100 +1,478,29,28-1,245,230 +1,478,29,29-1,220,198 +1,478,29,30-0,179,149 +1,478,29,31-1,166,140 +1,478,29,33-0,140,126 +1,478,29,36-0,105,91 +1,478,29,38-1,90,82 +1,478,29,39-0,68,62 +1,478,29,40-0,85,76 +1,478,29,41-0,87,81 +1,478,29,42-0,77,69