Repository 'spades'
hg clone https://toolshed.g2.bx.psu.edu/repos/nml/spades

Changeset 14:74f20c988994 (2022-01-23)
Previous changeset 13:b7829778729f (2021-09-20) Next changeset 15:a39c4cb6ab7f (2022-01-24)
Commit message:
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/spades commit 8734db131db6f76697b500b30f18ee7723d61813"
modified:
macros.xml
spades.xml
added:
test-data/A_R1.fastq.gz
test-data/A_R2.fastq.gz
test-data/B_R1.fastq.gz
test-data/B_R2.fastq.gz
test-data/corona_scaffold.fasta
test-data/covid.fastq.gz
test-data/ecoli_1K.fasta.gz
test-data/ecoli_1K.fastq.gz
test-data/ecoli_1K_1.fasta.gz
test-data/ecoli_1K_1.fastq.gz
test-data/ecoli_1K_2.fasta.gz
test-data/ecoli_1K_2.fastq.gz
test-data/pl1.fq.gz
test-data/pl2.fq.gz
removed:
test-data/auto_kmer_output.fa
test-data/ecoli_1K_1.fasta
test-data/ecoli_1K_1.fq
test-data/ecoli_1K_1.fq.gz
test-data/ecoli_1K_2.fasta
test-data/ecoli_1K_2.fq
test-data/ecoli_1K_2.fq.gz
test-data/kmer_33_output.fa
test-data/kmer_77_output.fa
test-data/reference_1K.fa
b
diff -r b7829778729f -r 74f20c988994 macros.xml
--- a/macros.xml Mon Sep 20 09:55:41 2021 +0000
+++ b/macros.xml Sun Jan 23 21:31:26 2022 +0000
[
b'@@ -1,4 +1,749 @@\n <macros>\n-    <token name="@TOOL_VERSION@">3.12.0</token>\n-    <token name="@INTYPES@">fasta,fasta.gz,fastq,fastq.gz</token>\n+    <token name="@TOOL_VERSION@">3.15.3</token>\n+    <token name="@VERSION_SUFFIX@">0</token>\n+    <xml name="requirements">\n+        <requirements>\n+            <requirement type="package" version="@TOOL_VERSION@">spades</requirement>\n+            <requirement type="package" version="3.0">zip</requirement>\n+            <yield/>\n+        </requirements>\n+    </xml>\n+    <xml name="stdio">\n+        <stdio>\n+            <exit_code range="1:"/>\n+            <regex match="Cannot allocate memory"\n+               source="stdout"\n+               level="fatal_oom"\n+               description="Out of memory error occurred"/>\n+            <regex match="The reads contain too many k-mers to fit into available memory"\n+               source="stdout"\n+               level="fatal_oom"\n+               description="Out of memory error occurred"/>\n+        </stdio>\n+    </xml>\n+    <xml name="version_command">\n+        <version_command><![CDATA[spades.py --version 2>&1 | awk -F \'v\' \'{print $2}\']]></version_command>\n+    </xml>\n+    <token name="@INTYPES@">\n+        \n+    </token>\n+    <xml name="citations">\n+        <citations>\n+            <citation type="doi">10.1093/bioinformatics/btv688</citation>\n+            <citation type="doi">10.1093/bioinformatics/btu266</citation>\n+            <citation type="doi">10.1093/bioinformatics/btv337</citation>\n+            <yield/>\n+          </citations>\n+    </xml>\n+    <xml name="operation_mode" token_help="">\n+        <param name="operation_mode" type="select" label="Operation mode" help="@HELP@">\n+            <option value="">Assembly and error correction</option>\n+            <option value="--only-assembler">Only assembler (--only-assembler)</option>\n+            <option value="--only-error-correction">Only error correction (--only-error-correction)</option>\n+        </param>\n+    </xml>\n+    \n+\n+<!-- PREPARE INPUT FILES-->\n+\n+<token name="@PREPROCESS_INPUT_FILES_MAIN@"><![CDATA[\n+#if $singlePaired.sPaired == "single" or $singlePaired.sPaired == "paired_interlaced"\n+    mkdir -p reads1 &&\n+    #set file_paths1 = []\n+    #for $input_file in $singlePaired.input1\n+        #set $ext = $input_file.ext.replace(\'fastqsanger\', \'fastq\')\n+        #set $fname = $input_file.element_identifier.replace(" ","_") + \'.\' + $ext\n+        #set $file_path = \'reads1/\' + $fname\n+        ln -s \'$input_file\' $file_path &&\n+        $file_paths1.append($file_path)\n+    #end for\n+#else if $singlePaired.sPaired == "paired"\n+    mkdir -p paired_reads1 &&\n+    #set fw_reads1 = []\n+    #for $input_file in $singlePaired.input1\n+        #set $ext = $input_file.ext.replace(\'fastqsanger\', \'fastq\')\n+        #set $fname = $input_file.element_identifier.replace(" ","_") + \'.\' + $ext\n+        #set $file_path = \'paired_reads1/\' + str($fname)\n+        ln -s \'$input_file\' $file_path &&\n+        $fw_reads1.append($file_path)\n+    #end for\n+    #set rv_reads1 = []\n+    #for $input_file in $singlePaired.input2\n+        #set $ext = $input_file.ext.replace(\'fastqsanger\', \'fastq\')\n+        #set $fname = $input_file.element_identifier.replace(" ","_") + \'.\' + $ext\n+        #set $file_path = \'paired_reads1/\' + str($fname)\n+        ln -s \'$input_file\' $file_path &&\n+        $rv_reads1.append($file_path)\n+    #end for\n+    #silent $fw_reads1.sort()\n+    #silent $rv_reads1.sort()\n+#else\n+    mkdir -p paired_reads1 &&\n+    #set fw_reads1 = []\n+    #set rv_reads1 = []\n+    #for $i, $input_file in enumerate($singlePaired.input)\n+        #set $ext = $input_file.forward.ext.replace(\'fastqsanger\', \'fastq\')\n+        #set $file_path = \'paired_reads1/fw\' + str($i) + \'.\' + $ext\n+        ln -s \'$input_file.forward\' $file_path &&\n+        $fw_reads1.append($file_path)\n+        #set $file_path = \'paired_reads1/rv\' + str($i) + \'.\' + $ext\n+        ln -s \'$input_file.reverse\' $file_path &&\n+        $rv_reads1.append($file_pat'..b'</filter>\n+        </data>\n+    </xml>\n+    <!--\n+      help\n+    -->\n+\n+    <token name="@HELP_IN@"><![CDATA[\n+\n+SPAdes takes as input paired-end reads, mate-pairs and single (unpaired) reads in FASTA and FASTQ. For IonTorrent data SPAdes also supports unpaired reads in unmapped BAM format (like the one produced by Torrent Server). However, in order to run read error correction, reads should be in FASTQ or BAM format. Sanger, Oxford Nanopore and PacBio CLR reads can be provided in both formats since SPAdes does not run error correction for these types of data.\n+\n+To run SPAdes 3.15.3 you need at least one library of the following types:\n+\n+- Illumina paired-end/high-quality mate-pairs/unpaired reads\n+- IonTorrent paired-end/high-quality mate-pairs/unpaired reads\n+- PacBio CCS reads\n+- Illumina and IonTorrent libraries should not be assembled together. All other types of input data are compatible. SPAdes should not be used if only PacBio CLR, Oxford Nanopore, Sanger reads or additional contigs are available.\n+\n+SPAdes supports mate-pair only assembly. However, we recommend to use only high-quality mate-pair libraries in this case (e.g. that do not have a paired-end part). We tested mate-pair only pipeline using Illumina Nextera mate-pairs. \n+\n+Notes:\n+\n+- It is strongly suggested to provide multiple paired-end and mate-pair libraries according to their insert size (from smallest to longest).\n+- It is not recommended to run SPAdes on PacBio reads with low coverage (less than 5).\n+- We suggest not to run SPAdes on PacBio reads for large genomes.\n+- SPAdes accepts gzip-compressed files.\n+\n+A detailed description can be found in the `input section <https://github.com/ablab/spades/#sec3.1>`_ of the manual.\n+    ]]></token>\n+    <token name="@HELP_OUT_AG@">\n+- Assembly graph\n+    </token>\n+    <token name="@HELP_OUT_AGS@">\n+- Assembly graph with scaffolds\n+    </token>\n+    <token name="@HELP_OUT_C@">\n+- Contigs\n+    </token>\n+    <token name="@HELP_OUT_CP@">\n+- Contigs paths in the assembly graph\n+    </token>\n+    <token name="@HELP_OUT_CS@">\n+- Contigs stats\n+    </token>\n+    <token name="@HELP_OUT_CR@">   \n+- Corrected reads by BayesHammer\n+    </token>\n+    <token name="@HELP_OUT_L@">\n+- Log file\n+    </token>\n+    <token name="@HELP_OUT_S@">\n+- Scaffolds (recommended for use as resulting sequences)\n+    </token>\n+    <token name="@HELP_OUT_SP@">\n+- Scaffolds paths in the assembly graph\n+    </token>\n+    <token name="@HELP_OUT_SS@">\n+- Scaffolds stats\n+    </token>\n+    <token name="@HELP_WID@">\n+SPAdes - St. Petersburg genome assembler - is an assembly toolkit containing various assembly pipelines.\n+    </token>\n+    <token name="@IONTORRENT@"><![CDATA[\n+The selection of k-mer length is non-trivial for IonTorrent. If the dataset is more or less conventional (good coverage, not high GC, etc), then use our `recommendation for long reads <https://cab.spbu.ru/files/release3.12.0/manual.html#sec3.4>`_ (e.g. assemble using k-mer lengths 21,33,55,77,99,127). However, due to increased error rate some changes of k-mer lengths (e.g. selection of shorter ones) may be required. For example, if you ran SPAdes with k-mer lengths 21,33,55,77 and then decided to assemble the same data set using more iterations and larger values of K, you can run SPAdes once again specifying the same output folder and the following options: --restart-from k77 -k 21,33,55,77,99,127 --mismatch-correction -o <previous_output_dir>. Do not forget to copy contigs and scaffolds from the previous run. We\'re planning to tackle issue of selecting k-mer lengths for IonTorrent reads in next versions.\n+\n+You may need no error correction for Hi-Q enzyme at all. However, we suggest trying to assemble your data with and without error correction and select the best variant.\n+\n+For non-trivial datasets (e.g. with high GC, low or uneven coverage) we suggest to enable single-cell mode (setting --sc option) and use k-mer lengths of 21,33,55.\n+\n+    ]]></token>    \n+\n </macros>\n'
b
diff -r b7829778729f -r 74f20c988994 spades.xml
--- a/spades.xml Mon Sep 20 09:55:41 2021 +0000
+++ b/spades.xml Sun Jan 23 21:31:26 2022 +0000
[
b'@@ -1,359 +1,720 @@\n-<tool id="spades" name="SPAdes" version="@TOOL_VERSION@+galaxy1">\n-    <description>genome assembler for regular and single-cell projects</description>\n-    <xrefs>\n-        <xref type="bio.tools">spades</xref>\n-    </xrefs>\n+<tool id="spades" name="SPAdes" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="20.01">\n+    <description>genome assembler for genomes of regular and single-cell projects</description>\n     <macros>\n         <import>macros.xml</import>\n     </macros>\n-    <requirements>\n-        <requirement type="package" version="@TOOL_VERSION@">spades</requirement>\n-    </requirements>\n-    <stdio>\n-        <exit_code range="1:" />\n-        <regex match="Cannot allocate memory"\n-           source="stdout"\n-           level="fatal_oom"\n-           description="Out of memory error occurred" />\n-        <regex match="The reads contain too many k-mers to fit into available memory"\n-           source="stdout"\n-           level="fatal_oom"\n-           description="Out of memory error occurred" />\n-    </stdio>\n-    <command>\n-    <![CDATA[\n-    ## A real command looks like: spades.py -k 21,33,55,77,99,127 --careful -1 Y.fastq.gz -2 X.fastq.gz -t 24 -o output\n+    <expand macro="requirements"/>\n+    <expand macro="stdio"/>\n+    <expand macro="version_command"/>\n+    <command detect_errors="exit_code"><![CDATA[\n+\n+#set $library = 1\n \n-    if [ -n "\\$GALAXY_MEMORY_MB" ]; then\n-        GALAXY_MEMORY_GB=\\$(( GALAXY_MEMORY_MB / 1024 ));\n-    fi &&\n+@PREPROCESS_INPUT_FILES_MAIN@\n+#if $additional_reads.selector == \'true\'\n+    @PREPROCESS_INPUT_FILES_ADDITIONAL@\n+#end if\n+@PREPROCESS_NANOPORE_PACBIO_FILES@\n+@PREPROCESS_CONTIGS_FILES@\n+@PREPROCESS_SANGER_FILES@\n \n-    spades.py -o . --tmp-dir "\\${TMPDIR:-.}" --disable-gzip-output $sc $onlyassembler $careful -t \\${GALAXY_SLOTS:-16} -m \\${GALAXY_MEMORY_GB:-250}\n-    #if not $kmer_choice.auto_kmer_choice:\n-        -k "$kmer_choice.kmers"\n-    #end if\n-    #if $cov.state == "auto":\n-        --cov-cutoff \'auto\'\n-    #elif $cov.state == "value":\n-        --cov-cutoff \'$cov.cutoff\'\n+## run\n+spades.py\n+    $operation_mode\n+    -o \'output\'    \n+    @RESOURCES@\n+    @INPUT_READS_MAIN@\n+    #if $additional_reads.selector == \'true\'\n+        @INPUT_READS_ADDITIONAL@\n     #end if\n-    $iontorrent\n-    ## Sequence files, libraries\n-    #for $i, $library in enumerate( $libraries, start=1 )\n-        #if str( $library.lib_type ) == "paired_end":\n-            #set prefix = \'pe\'\n-        #elif str( $library.lib_type ) == "mate_paired":\n-            #set prefix = \'mp\'\n-        #elif str( $library.lib_type ) == "nxmate_paired":\n-            #set prefix = \'nxmate\'\n-        #else:\n-            #set prefix = \'hqmp\'\n-        #end if\n-        --$prefix$i-$library.orientation\n-        #for $file in $library.files\n-            #if $file.file_type.type == "separate"\n-                --$prefix$i-1 $file.file_type.fwd_reads.extension.replace(\'fastqsanger\', \'fastq\'):$file.file_type.fwd_reads\n-                --$prefix$i-2 $file.file_type.fwd_reads.extension.replace(\'fastqsanger\', \'fastq\'):$file.file_type.rev_reads\n-            #elif $file.file_type.type == "interleaved"\n-                --$prefix$i-12 $file.file_type.interleaved_reads.extension.replace(\'fastqsanger\', \'fastq\'):$file.file_type.interleaved_reads\n-            #elif $file.file_type.type == "merged"\n-                --$prefix$i-m $file.file_type.merged_reads.extension.replace(\'fastqsanger\', \'fastq\'):$file.file_type.merged_reads\n-            #elif $file.file_type.type == "unpaired"\n-                --$prefix$i-s $file.file_type.unpaired_reads.extension.replace(\'fastqsanger\', \'fastq\'):$file.file_type.unpaired_reads\n-            #elif $file.file_type.type == "paired-collection"\n-                --$prefix$i-1 $file.file_type.fastq_collection.forward.extension.replace(\'fastqsanger\', \'fastq\'):$file.file_type.fastq_collection.forward\n-                --$prefix$i-2 $file.file_type.fastq_collection.reverse.extension.replace(\'fastqsang'..b'ame="sPaired" value="paired_collection"/>\n+                <param name="input">\n+                    <collection type="list:paired">\n+                        <element name="ecoli.fastq">\n+                            <collection type="paired">\n+                                <element name="forward" value="ecoli_1K_1.fastq.gz" ftype="fastqsanger.gz"/>\n+                                <element name="reverse" value="ecoli_1K_2.fastq.gz" ftype="fastqsanger.gz"/>\n+                            </collection>\n+                        </element>\n+                    </collection>\n+                </param>\n+                <param name="type_paired" value="hqmp"/>\n+            </conditional>\n+            <output name="out_ag">\n+                <assert_contents>\n+                    <has_n_lines n="36"/>\n+                    <has_text_matching expression=">EDGE_.+"/>\n+                </assert_contents>\n+            </output>\n+            <output name="out_ags">\n+                <assert_contents>\n+                    <has_n_lines n="2"/>\n+                    <has_text_matching expression="S.+"/>\n+                </assert_contents>\n+            </output>\n+            <output name="out_cn">\n+                <assert_contents>\n+                    <has_n_lines n="18"/>\n+                    <has_text_matching expression=">NODE\\_1\\_length\\_1000\\_cov\\_.+"/>\n+                </assert_contents>\n+            </output>\n+            <output name="out_sc">\n+                <assert_contents>\n+                    <has_n_lines n="18"/>\n+                    <has_text_matching expression=">NODE\\_1\\_length\\_1000.+"/>\n                 </assert_contents>\n             </output>\n         </test>\n     </tests>\n-    <help>\n-<![CDATA[\n+    <help><![CDATA[\n+.. class:: infomark\n+\n **What it does**\n \n-SPAdes \xe2\x80\x93 St. Petersburg genome assembler \xe2\x80\x93 is intended for both standard isolates and single-cell MDA bacteria assemblies. See http://bioinf.spbau.ru/en/spades for more details on SPAdes.\n+@HELP_WID@\n+\n+**Input**\n \n-This wrapper runs SPAdes, collects the output, and throws away all the temporary files. It also produces a tab file with contig names, length and coverage.\n+@HELP_IN@\n \n-**License**\n+**Output**\n \n-SPAdes is developed by and copyrighted to Saint-Petersburg Academic University, and is released under GPLv2.\n-\n-This wrapper is copyrighted by Philip Mabon and is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version.\n+@HELP_OUT_AG@\n+@HELP_OUT_AGS@\n+@HELP_OUT_C@\n+@HELP_OUT_CP@\n+@HELP_OUT_CR@\n+@HELP_OUT_CS@\n+@HELP_OUT_L@\n+@HELP_OUT_S@\n+@HELP_OUT_SP@\n+@HELP_OUT_SS@\n \n-This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.\n-\n-You should have received a copy of the GNU General Public License along with this program.  If not, see http://www.gnu.org/licenses/.\n \n-** Acknowledgments **\n+-------------------\n \n-Original wrapper developed by Lionel Guy.\n+.. class:: infomark\n \n-Anton Korobeynikov greatlty helped understanding how SPAdes work, and integrated handy features into SPAdes.\n+**IonTorrent data**\n \n-Nicola Soranzo fixed various bugs.\n+@IONTORRENT@\n+\n+-------------------\n \n-Simon Gladman added fastg optional outputs.\n-]]>\n-    </help>\n-    <citations>\n-        <citation type="doi">10.1089/cmb.2012.0021</citation>\n-    </citations>\n+.. class:: infomark\n+\n+**References**\n+\n+More information are available on `github <https://github.com/ablab/spades>`_ and on the `project website <http://cab.spbu.ru/software/spades>`_.\n+    ]]></help>\n+    <expand macro="citations">\n+            <citation type="doi">10.1089/cmb.2012.0021</citation>\n+            <citation type="doi">10.1007/978-3-642-37195-0_13</citation>\n+    </expand>\n </tool>\n'
b
diff -r b7829778729f -r 74f20c988994 test-data/A_R1.fastq.gz
b
Binary file test-data/A_R1.fastq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/A_R2.fastq.gz
b
Binary file test-data/A_R2.fastq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/B_R1.fastq.gz
b
Binary file test-data/B_R1.fastq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/B_R2.fastq.gz
b
Binary file test-data/B_R2.fastq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/auto_kmer_output.fa
--- a/test-data/auto_kmer_output.fa Mon Sep 20 09:55:41 2021 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,18 +0,0 @@
->NODE_1_length_1000_cov_140.62
-AGCTTTTCATTCTGACTGCAACGGGCAATATGTCTCTGTGTGGATTAAAAAAAGAGTGTC
-TGATAGCAGCTTCTGAACTGGTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGG
-TCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTAC
-ACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGT
-AACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCACCTGACAGTGCGGG
-CTTTTTTTTTCGACCAAAGGTAACGAGGTAACAACCATGCGAGTGTTGAAGTTCGGCGGT
-ACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCC
-AGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTG
-GCGATGATTGAAAAAACCATTAGCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAA
-CGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCG
-CAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATT
-AGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAA
-ATGTCGATCGCCATTATGGCCGGCGTATTAGAAGCGCGCGGTCACAACGTTACTGTTATC
-GATCCGGTCGAAAAACTGCTGGCAGTGGGGCATTACCTCGAATCTACCGTCGATATTGCT
-GAGTCCACCCGCCGTATTGCGGCAAGCCGCATTCCGGCTGATCACATGGTGCTGATGGCA
-GGTTTCACCGCCGGTAATGAAAAAGGCGAACTGGTGGTGCTTGGACGCAACGGTTCCGAC
-TACTCTGCTGCGGTGCTGGCTGCCTGTTTACGCGCCGATT
b
diff -r b7829778729f -r 74f20c988994 test-data/corona_scaffold.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/corona_scaffold.fasta Sun Jan 23 21:31:26 2022 +0000
b
@@ -0,0 +1,18 @@
+>NODE_1_length_1009_cluster_1_candidate_1_domains_2
+GTTCAAGCTGAGGCAAAACGCCTTTTTCAACTTCTACTAAGCCACAAGTGCCATCTTTAG
+GATGTTGACGTGCCTCTGATAAGACCGCCTCCACTGGAGGATACACAGGTTTAAAGGTTT
+ATACCTTCCCAGGTAACAAACCAACCAACTTTCGATCTCTTGTAGATCTGTTCTCTAAAC
+GAACTTTAAAATCTGTGTGGCTGTCACTCGGCTGCATGCTTAGTGCACTCACGCAGTATA
+ATTAATAACTAATTACTGTCGTTGACAGGACACGAGTAACTCGTCTATCTTCTGCAGGCT
+GCTTACGGTTTCGTCCGTGTTGCAGCCGATCATCAGCACATCTAGGTTTCGTCCGGGTGT
+GACCGAAAGGTAAGATGGAGAGCCTTGTCCCTGGTTTCAACGAGAAAACACACGTCCAAC
+TCAGTTTGCCTGTTTTACAGGTTCGCGACGTGCTCGTACGTGGCTTTGGAGACTCCGTGG
+AGGAGGTCTTATCAGAGGCACGTCAACATCTTAAAGATGGCACTTGTGGCTTAGTAGAAG
+TTGAAAAAGGCGTTTTGCCTCAACTTGAACAGCCCTATGTGTTCATCAAACGTTCGGATG
+CTCGAACTGCACCTCATGGTCATGTTATGGTTGAGCTGGTAGCAGAACTCGAAGGCATTC
+AGTACGGTCGTAGTGGTGAGACACTTGGTGTCCTTGTCCCTCATGTGGGCGAAATACCAG
+TGGCTTACCGCAAGGTTCTTCTTCGTAAGAACGGTAATAAAGGAGCTGGTGGCCATAGTT
+ACGGCGCCGATCTAAAGTCATTTGACTTAGGCGACGAGCTTGGCACTGATCCTTATGAAG
+ATTTAAGATGGCACTTGTGGCTTAGTAGAAGTTGAAAAAGGCGTTTTGCCTCAACTTGAA
+CAGCCCTATGTGTTCATCAAACGTTCGGATGCTCGAACTGCACCTCCTGGTCATGTTGAG
+CTGGTAGCAGAACTCGAAGGCATTCAGTACGGTCGTAGTGGTGAGACAC
b
diff -r b7829778729f -r 74f20c988994 test-data/covid.fastq.gz
b
Binary file test-data/covid.fastq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K.fasta.gz
b
Binary file test-data/ecoli_1K.fasta.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K.fastq.gz
b
Binary file test-data/ecoli_1K.fastq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_1.fasta
--- a/test-data/ecoli_1K_1.fasta Mon Sep 20 09:55:41 2021 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,4108 +0,0 @@\n->EAS20_8_6_1_9_1972/1 trim=6\n-ACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCACCTGACAGTGCG\n->EAS20_8_6_1_163_1521/1\n-GCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTG\n->EAS20_8_6_1_178_1948/1\n-ATTCGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGA\n->EAS20_8_6_1_318_1522/1 trim=5\n-AAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCAC\n->EAS20_8_6_1_348_1372/1\n-AAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAAC\n->EAS20_8_6_1_389_646/1 trim=2\n-ACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAAC\n->EAS20_8_6_1_513_951/1\n-TTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGG\n->EAS20_8_6_1_530_1080/1 trim=1\n-AAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAG\n->EAS20_8_6_1_546_406/1\n-AAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCAT\n->EAS20_8_6_1_553_1132/1 correct\n-CGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAG\n->EAS20_8_6_1_594_142/1 trim=11\n-GGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCAGGTGCGGGCTTTTTTCTGTGTTTCCTGTACGCGTCAGCCCG\n->EAS20_8_6_1_641_1277/1 trim=50\n-GGGCTTTTTTCTGTGTTTCCTGTACGCGTCAGCCCGCACCGTTACCTGTG\n->EAS20_8_6_1_660_979/1 trim=5\n-AGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTGGCGATGATTGAAAAAACCATTAGCGGCCAGGATGCTTTACCCAAT\n->EAS20_8_6_1_763_241/1 trim=42\n-TTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCAGGTGCGGGCTTT\n->EAS20_8_6_1_789_699/1\n-GCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGT\n->EAS20_8_6_1_802_355/1 correct\n-AGCAGCTTCTGAACTGGTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGAT\n->EAS20_8_6_1_807_1707/1 trim=15\n-TCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTTTGGCGG\n->EAS20_8_6_1_918_1054/1 correct trim=10\n-AACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCA\n->EAS20_8_6_1_1078_254/1 correct trim=20\n-CACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCAGGTGCGGGCTTTTTTCTGTGTTT\n->EAS20_8_6_1_1107_1548/1\n-ATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTG\n->EAS20_8_6_1_1173_908/1 trim=15\n-GAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATA\n->EAS20_8_6_1_1216_1097/1\n-ATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTA\n->EAS20_8_6_1_1393_1905/1 trim=5\n-TACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACA\n->EAS20_8_6_1_1477_92/1\n-ACCGTTACCTGTGGTAATGGTGATGGTGGTGGTAATGGTGGTGCTAATGCGTTTCATGGATGTTGTGTACTCTGTAATTTTTATCTGTCTGTGCGCTATG\n->EAS20_8_6_1_1556_445/1 trim=29\n-ACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAA\n->EAS20_8_6_1_1669_38/1 trim=17\n-GTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCG\n->EAS20_8_6_1_1692_295/1\n-TCGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACA\n->EAS20_8_6_1_1713_508/1 trim=70\n-CGGGCTGACGCGTACAGGAAACACAGAAAA\n->EAS20_8_6_1_1752_449/1 correct trim=4\n-TTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCA\n->EAS20_8_6_2_17_2016/1 trim=33\n-TGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCG\n->EAS20_8_6_2_30_542/1 trim=3\n-CTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCG\n->EAS20_8_6_2_65_168/1\n-GGGTGGACTCAGCAATATCGACGGTAGATTCGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTC\n->EAS20_8_6_2_79_54/1 correct trim=11\n-GAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAA'..b'1\n-CGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTTATTTGGGC\n->EAS20_8_6_99_900_1246/1 trim=20\n-ATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTGGC\n->EAS20_8_6_99_1005_429/1 trim=10\n-TCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGT\n->EAS20_8_6_99_1058_1002/1 trim=5\n-GAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTC\n->EAS20_8_6_99_1438_1524/1\n-AGTAAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGA\n->EAS20_8_6_99_1487_1757/1 trim=1\n-TTTTCTGTGTTTCCTGTACGCGTCAGCCCGCACCGTTACCTGTGGTAATGGTGATGGTGGTGGTAATGGTGGTGCTAATGCGTTTCATGGATGTTGTGT\n->EAS20_8_6_99_1633_42/1 trim=60\n-CACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAG\n->EAS20_8_6_99_1638_1013/1 trim=6\n-GACAGTGCGGGCTTTTTTTTTCGACCAAAGGTAACGAGGTAACAACCATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACG\n->EAS20_8_6_99_1753_1845/1\n-TTCCAGAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTC\n->EAS20_8_6_99_1777_785/1 correct\n-CGCTGGCGCAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAA\n->EAS20_8_6_100_27_710/1\n-AAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTT\n->EAS20_8_6_100_177_1949/1\n-TATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCC\n->EAS20_8_6_100_187_1683/1\n-CAAAGGTAACGAGGTAACAACCATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGC\n->EAS20_8_6_100_238_819/1\n-ATGGCCGGCGTATTAGAAGCGCGCGGTCACAACGTTACTGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGGCATTACCTCGAATCTACCGTCGATA\n->EAS20_8_6_100_346_1515/1\n-TAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGC\n->EAS20_8_6_100_434_840/1 trim=47\n-ACCTGCCATCAGCACCATGTGATCAGCCGGAATGCGGCTTGCCGCAATACGGC\n->EAS20_8_6_100_451_465/1 correct\n-CGCCATTATGGCCGGCGTATTAGAAGCGCGCGGTCACAACGTTACTGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGGCATTACCTCGAATCTACC\n->EAS20_8_6_100_452_1846/1 correct\n-CGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTA\n->EAS20_8_6_100_723_1564/1\n-TCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCAT\n->EAS20_8_6_100_776_1749/1 trim=5\n-GGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAAT\n->EAS20_8_6_100_779_871/1 trim=20\n-GTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAA\n->EAS20_8_6_100_816_1759/1 correct trim=47\n-AAAAAGCCCGCACTGTCAGGTGCGGGCTTTTTTCTGTGTTTCCTGTACGCGTC\n->EAS20_8_6_100_993_1119/1\n-GTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACC\n->EAS20_8_6_100_1153_966/1\n-AGCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGC\n->EAS20_8_6_100_1183_226/1 correct trim=26\n-TTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCG\n->EAS20_8_6_100_1263_900/1 correct trim=1\n-AGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCAC\n->EAS20_8_6_100_1277_357/1 trim=5\n-ACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTTTGGCGGGGGCAG\n->EAS20_8_6_100_1337_252/1 correct trim=16\n-GCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGG\n->EAS20_8_6_100_1432_436/1 trim=3\n-GTAGATTCGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGG\n->EAS20_8_6_100_1457_1209/1 correct trim=7\n-TTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAAT\n->EAS20_8_6_100_1609_245/1\n-GGTGGCCACCTGCCCCTGCCTGGCATTGCTTTCCAGAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACT\n->EAS20_8_6_100_1637_1332/1\n-TGGTGCTAATGCGTTTCATGGATGTTGTGTACTCTGTAATTTTTATCTGTCTGTGCGCTATGCCTATATTGGTTAAAGTATTTAGTGACCTAAGTCAATA\n'
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_1.fasta.gz
b
Binary file test-data/ecoli_1K_1.fasta.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_1.fastq.gz
b
Binary file test-data/ecoli_1K_1.fastq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_1.fq
--- a/test-data/ecoli_1K_1.fq Mon Sep 20 09:55:41 2021 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,8216 +0,0 @@\n-@EAS20_8_6_1_9_1972/1 trim=6\n-ACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCACCTGACAGTGCG\n-+\n-HHHHHHGHHHHFHHGGHHFHHHHHFHHFHFHHHHHFHHHHHFHHHHHHHHFHHFHFDHHGG@BGGHCDHE:;3)7.A973A:AA5>AD9G=D<D\n-@EAS20_8_6_1_163_1521/1\n-GCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTG\n-+\n-HGHHIHHHDHHHHHIHHIHHHHHHHHHBHHHHHFHCFHHHHHHHGHHHHHEHHFHHHGHHIHHHGHGHHHIHFHHHHHGH?5<<;BD>6>?BGEHHGHFG\n-@EAS20_8_6_1_178_1948/1\n-ATTCGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGA\n-+\n-GHHHHHHHHHGGHHHHHHGHHHHHHHEHHHHHHHHHHHHHFHHHEHHHHHHHFHFHIHHIHHHIHHHGHIIGGHBGGGHHFFGBHIFFGCIGGEFDG@AG\n-@EAS20_8_6_1_318_1522/1 trim=5\n-AAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCAC\n-+\n-HHHHHHHHHHIHHHHHHHHHHHHHHHHHGEHHHHHEHHHHHHIHHHHGHHEHHGHBHDDEHHEGH?HEGGGIHDIGFFFEHE;EE;=AFE;AB/B\n-@EAS20_8_6_1_348_1372/1\n-AAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAAC\n-+\n-HHHHHHHHHHHHHHHHHHHEHHGHHIHHHDHHHHHHHHHHFHHHGHHFHHH@HHHFHHHEHH<HH?@D>DHDEBEEGDFDCHECGB:?43CCCFG?90<6\n-@EAS20_8_6_1_389_646/1 trim=2\n-ACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAAC\n-+\n-HBHGGHHIGHHHGDHHGHHDHHHGDHFGGHHHHHHHHHHHHIHHGFGHHHHHGHGGHGGDHHEFHDDHGGGHHH=HDDB9FHGGEIEHICEB?DBBAE\n-@EAS20_8_6_1_513_951/1\n-TTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGG\n-+\n-HHHHHDHHHHHHIHGHGIEEDFHBDDHGGGBC?C?IHD>GFHGHG?DDGEB?;?,DCF=D??F=BDBGE=DDGDG.>76?>EB>54+?;=5;BEBDAGGA\n-@EAS20_8_6_1_530_1080/1 trim=1\n-AAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAG\n-+\n-EHHHHHHGHHFEHHHHHGHHHHHHGHH=BHHHEHHHHHHHEHFEEHHFDHHHHHHFGHHHHFHFHHEHFHFEHEEHB>EG=F?E=>FHE@CH5HB:81@\n-@EAS20_8_6_1_546_406/1\n-AAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCAT\n-+\n-HHHHHHGGGHHHHHHHHHHHHHIHHHHHHHHHHHHIFHHHHHHHHHHHIFHHHHHHHHHHHHHGHHHHFHHHHFHHHHEHHDH@8GFHHGHEFBHHGG5G\n-@EAS20_8_6_1_553_1132/1 correct\n-CGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAG\n-+\n-HHHHHIHHHHHHGHHHHHHHHHDHHHHHHHHHHHIGHH@HHHHHGHHFHDHHHHHHHHGGGHH=HDHHHFHHHGHHHFHH55445#A@@:55555EGGDE\n-@EAS20_8_6_1_594_142/1 trim=11\n-GGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCAGGTGCGGGCTTTTTTCTGTGTTTCCTGTACGCGTCAGCCCG\n-+\n-HIHHHHHHHHHHHHHHHHHHHHHIHHFHDHHGEBEEEHHGHIIHHFHHEG@FAFHD;DEFHHH@E.:82=??:=:F5?E6;4<:@B?AE\n-@EAS20_8_6_1_641_1277/1 trim=50\n-GGGCTTTTTTCTGTGTTTCCTGTACGCGTCAGCCCGCACCGTTACCTGTG\n-+\n-HHE=GHHHHHECGHHHG@FDHEFF7@@CAA?FA>FA?9;;>@;5=1AA+D\n-@EAS20_8_6_1_660_979/1 trim=5\n-AGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTGGCGATGATTGAAAAAACCATTAGCGGCCAGGATGCTTTACCCAAT\n-+\n-HHEGHHHHHHHHHHHHHHHHGFFHHHFEEAHEHHGHHEHDFGHIHHHGGD<9F:FHFHHBC4EEEDEBGHHGE@BCBEDGGFFGACFG=4C39:B\n-@EAS20_8_6_1_763_241/1 trim=42\n-TTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCAGGTGCGGGCTTT\n-+\n-GHHHIG@HHHHHHGHGIHHHHHHHEDDFEHCBGGHHHHH@HFFGGAGE;B+>3223;D\n-@EAS20_8_6_1_789_699/1\n-GCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGT\n-+\n-HGHHHHHHHHGHF@GHHGHHFHF@FD??F>CDHHFHHHHHBEFHHAHCHHHEHH@HHHDFHH;HGHGFHHF>1DDFF?FFEHFEHF0AE.2061585=@/\n-@EAS20_8_6_1_802_355/1 correct\n-AGCAGCTTCTGAACTGGTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGAT\n-+\n-HIHHHHHHIGHDHHHHH#HHFDFBB?DDA>EFGDFHHFHFHHHHHHHEGFHHHFGHBH=;FF@;FEGHHHHHFHCHHEHDFHEHHFHDH=?HEFEHEHAH\n-@EAS20_8_6_1_807_1707/1 trim=15\n-TCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTTTGGCGG\n-+\n-FHCEHGFHHHHGEEHHHHGHHFFHFHGHHHGHGFHH=HFCHHHHHEHEHHDFHHFFHHHHAHHBHA4>C6?@=8>5FBBFE?EEB\n-@EAS20_8_6_1_918_1054/1 correct trim=10\n-AACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCA\n-+\n-HHGHHHHHHHHHHHHHHHHHHHHEHHFHHHHGHHHEHHHFIHGHFHHHFHGGFHC>D1D<AFD:CGGGGAB=FCECE23B/#8>=DD:EC\n-@EAS20_8'..b'<@>@8BG9G9\n-@EAS20_8_6_100_346_1515/1\n-TAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGC\n-+\n-FGDHEHHHHHHGHHHHHHHHBG?GEHHDDGHHHDH@GEEH?CHHFF?FDFEEFHEEFHGHHFFHEIHHGBGGEGDIGFEDEHBEHGEAFHGFH@HGGA?H\n-@EAS20_8_6_100_434_840/1 trim=47\n-ACCTGCCATCAGCACCATGTGATCAGCCGGAATGCGGCTTGCCGCAATACGGC\n-+\n-HGHHHGHHHHHHGGHHHGHHHEGFHHHFHHDGHHEHGGHE:5=>9-<<.-BGB\n-@EAS20_8_6_100_451_465/1 correct\n-CGCCATTATGGCCGGCGTATTAGAAGCGCGCGGTCACAACGTTACTGTTATCGATCCGGTCGAAAAACTGCTGGCAGTGGGGCATTACCTCGAATCTACC\n-+\n-FHHEHHHGHHHHHGFDHHBHBBDDDHEHHHGHIHHDHHEHHHHHEFHHHHHHI@HE=@FBFFCC#HHDHHEHHHH@HGADFF,=FB@F?F?FB4F?F@BB\n-@EAS20_8_6_100_452_1846/1 correct\n-CGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTA\n-+\n-HFHHEHHHGHEEFEHHHHHHHGFHHHHHDHFGHFHGHHGH@B5>BAEHEHFF#?;-54457HHFAFACEFFCFAFGGGECGEEG#@@@AAFGGCDBHEE=\n-@EAS20_8_6_100_723_1564/1\n-TCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCAT\n-+\n-HHHHHHGHGHHHHHHHHDHHHGGHGFFHD=DFHHHFHHGGHHFHHHHHHHHDHGGHHHCHEHHGHGFHHHHGEG3H@HEDHHGHHFGEGGGGFFFGEGAG\n-@EAS20_8_6_100_776_1749/1 trim=5\n-GGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAAT\n-+\n-H,/E8;GH88;?8AA=CFHFCF/F7FE0EA@1.=;ACFF>C=HFFFD=D=HFBFH1FFFG>@CD;GGFGBGAGGF8HHHHHHEHIHEH8H??,<A\n-@EAS20_8_6_100_779_871/1 trim=20\n-GTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAA\n-+\n-GHHGGHGHHHHHHHCHHHFHHHFHHHHDFHHEHGHHEDHF?GG@::FGCDCB6E@F6:F<BFAC?EDF-:FEHFB:226A\n-@EAS20_8_6_100_816_1759/1 correct trim=47\n-AAAAAGCCCGCACTGTCAGGTGCGGGCTTTTTTCTGTGTTTCCTGTACGCGTC\n-+\n-#GGHHHBHCGHHHHB@>DA@0#?8>/:/<=FFF/@,3/444(555<5/?3A,A\n-@EAS20_8_6_100_993_1119/1\n-GTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACC\n-+\n-?@FDBEFGF8BFGFGHHHHEHHHHEHBFHHHHGGHHH@HGFHHHDH5HB?GHDGDFDHEHIFHFHFFHFE?HDFCFGEHEGBE=HHGGGGGHFHHGGIEG\n-@EAS20_8_6_100_1153_966/1\n-AGCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGC\n-+\n-HHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHHDHHCHHHHGBFHHDHDHHHHFCHBHEGEHEHGGEHH@GEG8FFBEHFF:FBFDA+DFC;C3\n-@EAS20_8_6_100_1183_226/1 correct trim=26\n-TTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCG\n-+\n-CFCCF?DCCDHEGHFHHHHFFFHD@HGEHHHGHHHGHHFHHHHGEEH:H>HHHDCFF#EADA366=A0A+8<AA\n-@EAS20_8_6_100_1263_900/1 correct trim=1\n-AGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCAC\n-+\n-HGHHHHHHIHHHIHFBD?BCHHHHHDGHHHHEHHFCHFHHBHEHHHFHHDHHFEHHHGH=HEFFFHH@CFHBHEHHBGHGBCDBGFDH<EAF#9F#?@A\n-@EAS20_8_6_100_1277_357/1 trim=5\n-ACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTTTGGCGGGGGCAG\n-+\n-DEHHHHIEHHHHHHHHGIGHHHHHHHGHHHHEFEHHHHHHHHFEHHHHHHHHH@CGHGCHFHHE@FB<=F=FFFFFFDG;BFDFFGFEG@9B24C\n-@EAS20_8_6_100_1337_252/1 correct trim=16\n-GCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGG\n-+\n-GBHHHHHHGGHHBHEG@BEHHDHAHGBHGHDGDDEH#EBEDBFDHHC2EDF9?@EEHHE?CCH=EHEGAGGGEE4AGA6E1G?F\n-@EAS20_8_6_100_1432_436/1 trim=3\n-GTAGATTCGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGG\n-+\n-HHHHHIHHGGHDGHHHHHEGHHHGHHDHHHEHHGHHHHGHHFHGDGHHDHECHDEGGFGGFGFFBGGEGEG?GBGHEHB9EGEDGDAEDEDE?DFBF\n-@EAS20_8_6_100_1457_1209/1 correct trim=7\n-TTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAAT\n-+\n-HGHFFDBCBD#BBFFEDDFCHGHHEHCHHHEHHHHHHEAHHHGHBDGHEHEEGHGEE@GGGGFG?5C;A5:0;A4988-/>8@5>;<-37<?B\n-@EAS20_8_6_100_1609_245/1\n-GGTGGCCACCTGCCCCTGCCTGGCATTGCTTTCCAGAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACT\n-+\n-BCBBDFHHHHHHEHHHHGHHHHHHDHHHHHHHGHHHGIHHHHHEHIDHGGIHHHFGHFHHGHHBGFFHHHHFHHFHHGHHIHHEHGFF=HGFHHBFFGBH\n-@EAS20_8_6_100_1637_1332/1\n-TGGTGCTAATGCGTTTCATGGATGTTGTGTACTCTGTAATTTTTATCTGTCTGTGCGCTATGCCTATATTGGTTAAAGTATTTAGTGACCTAAGTCAATA\n-+\n-FHFHHFGGHGHFHGHHGHHHFEHHHGFFDFHFHHHGEDCGHHHHHG9HDGHFHGHHHEHEFGF=GAHEHHFEGFFGEHFHHHHFHHEBE?HHFHEGFDHH\n'
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_1.fq.gz
b
Binary file test-data/ecoli_1K_1.fq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_2.fasta
--- a/test-data/ecoli_1K_2.fasta Mon Sep 20 09:55:41 2021 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,4108 +0,0 @@\n->EAS20_8_6_1_9_1972/2 correct\n-GGTGGCCACCTGCCCCTGCCTGGCATTGCTTTCCAGAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACT\n->EAS20_8_6_1_163_1521/2\n-GGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACG\n->EAS20_8_6_1_178_1948/2\n-ATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTG\n->EAS20_8_6_1_318_1522/2\n-AGAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAA\n->EAS20_8_6_1_348_1372/2\n-GGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGC\n->EAS20_8_6_1_389_646/2 trim=17\n-TGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTC\n->EAS20_8_6_1_513_951/2 correct\n-ATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCG\n->EAS20_8_6_1_530_1080/2\n-GAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCA\n->EAS20_8_6_1_546_406/2\n-CGGGTGGACTCAGCAATATCGACGGTAGATTCGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTT\n->EAS20_8_6_1_553_1132/2 trim=6\n-GGCGATGATTGAAAAAACCATTAGCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCC\n->EAS20_8_6_1_594_142/2\n-AACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACC\n->EAS20_8_6_1_641_1277/2\n-GGTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTA\n->EAS20_8_6_1_660_979/2\n-CCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAA\n->EAS20_8_6_1_763_241/2\n-TATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGT\n->EAS20_8_6_1_789_699/2 correct trim=20\n-TGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCC\n->EAS20_8_6_1_802_355/2 correct\n-CTGTACGCGTCAGCCCGCACCGTTACCTGTGGTAATGGTGATGGTGGTGGTAATGGTGGTGCTAATGCGTTTCATGGATGTTGTGTACTCTGTAATTTTT\n->EAS20_8_6_1_807_1707/2 trim=1\n-GAGGTAACAACCATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGG\n->EAS20_8_6_1_918_1054/2 correct\n-GCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAA\n->EAS20_8_6_1_1078_254/2\n-GGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCAC\n->EAS20_8_6_1_1107_1548/2 trim=7\n-GGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCG\n->EAS20_8_6_1_1173_908/2\n-ACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCC\n->EAS20_8_6_1_1216_1097/2 trim=16\n-GCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCAG\n->EAS20_8_6_1_1393_1905/2 trim=11\n-CGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTC\n->EAS20_8_6_1_1477_92/2\n-GGCAATATGTCTCTGTGTGGATTAAAAAAAGAGTGTCTGATAGCAGCTTCTGAACTGGTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGGTCA\n->EAS20_8_6_1_1556_445/2\n-TTTCCAGAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGT\n->EAS20_8_6_1_1669_38/2 trim=8\n-CAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAA\n->EAS20_8_6_1_1692_295/2\n-TTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGT\n->EAS20_8_6_1_1713_508/2 correct trim=30\n-TGATTTTGGCGGGGGCAGAGAGGACGGTGGCCACCTGCCCCTGCCTGGCATTGCTTTCCAGAATATCGGC\n->EAS20_8_6_1_1752_449/2\n-AACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGC\n->EAS20_8_6_2_17_2016/2 correct\n-CGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACT\n->EAS20_8_6_2_30_542/2 trim=65\n-GATCAGCCGGAATGCGGCTTGCCGCAATACGGCGG\n->EAS20_8_6_2_65_168/2 correct\n-AAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTT'..b'9_809_1613/2\n-CATTAGCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTG\n->EAS20_8_6_99_900_1246/2 trim=1\n-GGACATGTTTTATTTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAAGTTCGG\n->EAS20_8_6_99_1005_429/2 trim=5\n-CACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGA\n->EAS20_8_6_99_1058_1002/2 trim=18\n-CATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAA\n->EAS20_8_6_99_1438_1524/2 correct trim=26\n-CCCGCACTGTCAGGTGCGGGCTTTTTTCTGTGTTTCCTGTACGCGTCAGCCCGCACCGTTACCTGTGGTAATGG\n->EAS20_8_6_99_1487_1757/2\n-TGTCTGATAGCAGCTTCTGAACTGGTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCAC\n->EAS20_8_6_99_1633_42/2 correct trim=40\n-GCGGGGGCAGAGAGGACGGTGGCCACCTGCCCCTGCCTGGCATTGCTTTCCAGAATATCG\n->EAS20_8_6_99_1638_1013/2 trim=12\n-TTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTTTGGCGGGGGCAGAGAGGACGGTGGCCACCTGCCCCTGCCTGGCATTGCTTTC\n->EAS20_8_6_99_1753_1845/2 correct trim=2\n-CGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCACCTGACA\n->EAS20_8_6_99_1777_785/2 correct\n-CCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGAT\n->EAS20_8_6_100_27_710/2\n-AATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACATTTTCTC\n->EAS20_8_6_100_177_1949/2 trim=25\n-CCAAAATCACCAACCACCTGGTGGCGATGATTGAAAAAACCATTAGCGGCCAGGATGCTTTACCCAATATCAGCG\n->EAS20_8_6_100_187_1683/2 correct trim=1\n-GCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTTTGGCGGGGGCAGAGAGGACGGTGGCCAC\n->EAS20_8_6_100_238_819/2 trim=46\n-AGAGTAGTCGGAACCGTTGCGTCCAAGCACCACCAGTTCGCCTTTTTCATTACC\n->EAS20_8_6_100_346_1515/2\n-TGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTC\n->EAS20_8_6_100_434_840/2\n-AGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTATTAGAAGCGCGCGGTCACAACGTTAC\n->EAS20_8_6_100_451_465/2 correct trim=22\n-GTTGCGTCCAAGCACCACCAGTTCGCCTTTTTCATTACCGGCGGTGAAACCTGCCATCAGCACCATGTGATCAGCCGG\n->EAS20_8_6_100_452_1846/2 correct\n-CTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTGGCGATGA\n->EAS20_8_6_100_723_1564/2 correct trim=2\n-TGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAATTGAAAACTTTCGTCGATCAGGAATTTG\n->EAS20_8_6_100_776_1749/2\n-TCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATC\n->EAS20_8_6_100_779_871/2\n-AAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAG\n->EAS20_8_6_100_816_1759/2\n-AAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAAC\n->EAS20_8_6_100_993_1119/2 trim=60\n-TGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCC\n->EAS20_8_6_100_1153_966/2\n-TCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATCGA\n->EAS20_8_6_100_1183_226/2 correct trim=40\n-AATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCAC\n->EAS20_8_6_100_1263_900/2\n-AAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTTTG\n->EAS20_8_6_100_1277_357/2 trim=5\n-GCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGG\n->EAS20_8_6_100_1337_252/2 correct\n-CATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTT\n->EAS20_8_6_100_1432_436/2\n-CAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGC\n->EAS20_8_6_100_1457_1209/2 correct trim=11\n-GCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTGGCGATGATTGAAAAAACCATTAGCGGCCAGG\n->EAS20_8_6_100_1609_245/2 correct trim=16\n-TCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCACCTGACAGTGCGGGCTTTTTT\n->EAS20_8_6_100_1637_1332/2\n-ATTCTGACTGCAACGGGCAATATGTCTCTGTGTGGATTAAAAAAAGAGTGTCTGATAGCAGCTTCTGAACTGGTTACCTGCCGTGAGTAAATTAAAATTT\n'
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_2.fasta.gz
b
Binary file test-data/ecoli_1K_2.fasta.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_2.fastq.gz
b
Binary file test-data/ecoli_1K_2.fastq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_2.fq
--- a/test-data/ecoli_1K_2.fq Mon Sep 20 09:55:41 2021 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,8216 +0,0 @@\n-@EAS20_8_6_1_9_1972/2 correct\n-GGTGGCCACCTGCCCCTGCCTGGCATTGCTTTCCAGAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACT\n-+\n-HFHHHGHHHHHHHHHHHHGHHHHHHGHHHHHHHHHHHFHHGHHGHEHHHHHHEH;G?F<F?GDFF/EEFBD:DCHHH7A@?EEH@HH96:4F@#76=C@@\n-@EAS20_8_6_1_163_1521/2\n-GGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGTAACG\n-+\n-HHGGFHHGHHHHHHHGFHHHHHHHCGHFHFHFHHHHHHGHHGHHDHHIEGEDFEHHCHHHHGCCGF>GFEFEGGFGGEIG1ACBCF?CD1?CADCD.DFB\n-@EAS20_8_6_1_178_1948/2\n-ATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTG\n-+\n-HGHIHHHIHGGHHHHGHHFHHFDHHHHHGHHBHHHHHHGGGHHHHHHHHHFHHHHGHHFHFEDHGDHH>HGEFCHHCHHH=GGHBEGFFHEGGD@HHEEH\n-@EAS20_8_6_1_318_1522/2\n-AGAATATCGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAA\n-+\n-IGHFHHHDEHGHHEHHHEGHDHHHGHHHHHHEHHHHHDHHHHHGHHHHEGFAEHDGHFHHFDHFGHHHIGHIEGHHGGHFGFAHGHGFEHDHEEEB7<3<\n-@EAS20_8_6_1_348_1372/2\n-GGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGC\n-+\n-HHHHHH@HGHHEHGHGHHHHDHHHHFHEHDDHHDHHHEEHHDHHHBFHCEGEHGGGDHHE@EFDAHHGHEDFGG:FDB<>=BDG?D=3BB>G?GGEGGD;\n-@EAS20_8_6_1_389_646/2 trim=17\n-TGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTC\n-+\n-HGGGDHHHAHGHHHHGHIHHEHHHGHFHHHHHFHHEG=GHEEFEHEHHEEEDGHGHFHDFFFADDHHF:>0&D0A4?,?AE=?\n-@EAS20_8_6_1_513_951/2 correct\n-ATAACAGTAACGTTGTGACCGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCG\n-+\n-GHFHGHDHGHHHHHHFHHHEFHHHHHGHFHBHEHHHFDHHGGHHBEHHGHHHFFFBHHHHHGEGDHFIHHHHEEC?GEGDFE;<E+@5@>?E;=?#A)?=\n-@EAS20_8_6_1_530_1080/2\n-GAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTCGCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCA\n-+\n-D?D?DG;FAFFGDGFDF?F:>=DD>GGGGGDAD:D+DD>DDFAFFDGFG4FFFFC<FF>BGCG/CFF59AFBD6DG@BA1.53;-:9:FG::F-:><>96\n-@EAS20_8_6_1_546_406/2\n-CGGGTGGACTCAGCAATATCGACGGTAGATTCGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGACCGCGCGCTT\n-+\n-HHHHEHHHHHHHIHHFHHHHHHHHHGHHHIHHHHHFGHHGHHHHHBHHGBHHEHGHCGGGGHAGHEGGGGHEDECGGFE8GGE=EGGC>FGE@DDECGDD\n-@EAS20_8_6_1_553_1132/2 trim=6\n-GGCGATGATTGAAAAAACCATTAGCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCC\n-+\n-HHHHHHHHHHHHFHHHHHHHHHHHHHHHHHHHEGHHHHHABGEEHHDHAGHDHGGHFFFGH@HDGGHGHEEFIIBFFFIEGD@EFG<E@EC<6B\n-@EAS20_8_6_1_594_142/2\n-AACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACC\n-+\n-GGHHHHHHHHHFGHHHHHGHHHDGDHHHHHHHFH?EHHHHGDGEHHHHDHHHIHHGIHHEFFHHHHFGFHGEHCGGGEGA;HFH@DEFEBEEAHE??=?C\n-@EAS20_8_6_1_641_1277/2\n-GGTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTA\n-+\n-FFE?FEBFG?EHFHDHDFHDEHGAEEFGFHHH?GH;HAGGFF7AEHCCBH?0FG=2FAB4EHGB>BC0<?EE=9C=E;F;:;AAAA+,=,6E@2AC3?<>\n-@EAS20_8_6_1_660_979/2\n-CCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAA\n-+\n-HDHHEFHH@FHHHEHHGGGGEEEHFFHHFGHHHHHGGHHDBFBF;FFFGFDFGGHHHHG<FHCHHA9=B?=G@@?EHED9F8DHEDD3EBC&GD3)-000\n-@EAS20_8_6_1_763_241/2\n-TATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGT\n-+\n-HHFDFGHHHHHEHHCHHFGHBEEAGHBCGEGHHEHDHEHH=HHHHHHHHGHHDBFGHHDGBIHHHHCHEHBE>HHGHBHHFHEGEHGHBDEHEH=F:E??\n-@EAS20_8_6_1_789_699/2 correct trim=20\n-TGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCC\n-+\n-H=BHHFAECGAHHHF<AF@FFEEEEHHHHFCHHHHHGHH=FEHHHEHH4E1DAA=FEG?AHDEH#*F;1/AA7(D<?)FF\n-@EAS20_8_6_1_802_355/2 correct\n-CTGTACGCGTCAGCCCGCACCGTTACCTGTGGTAATGGTGATGGTGGTGGTAATGGTGGTGCTAATGCGTTTCATGGATGTTGTGTACTCTGTAATTTTT\n-+\n-HHHHHHHHHHHGGGGHHHHIHGGIHHHHGHHEAEBFFBCF=GGD?D@2C;?<6?BFBFF>BCCE?BBDGDBD>2HF?8?C?:19?0&5-#=:/;6DHGD>\n-@EAS20_8_6_1_807_1707/2 trim=1\n-GAGGTAACAACCATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGG\n-+\n-FCFF2FBBFBEHGHH?D=AAFDGGCCHHHHBHEEHDEFAFFGGGDGGABIGECHEBBBHFHHHDDFEGGEEFD=1=BDDDCCGEEDDJCBBDDE;BEAG\n-@EAS20_8_6_1_918_1054/2 correct\n-GCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGT'..b'6_100_346_1515/2\n-TGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTC\n-+\n-AADA@BBFBDHCGGBHHHGHH=HEHFHHH@HFHHFFDHFE;HHEHGF<CGHHH@FGGG1F<B9BDHHHH=H?HE6GFADFEBHBDFD/BGF1F??HGHGF\n-@EAS20_8_6_100_434_840/2\n-AGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTATTAGAAGCGCGCGGTCACAACGTTAC\n-+\n-HHHGHHFHGGHHEFHHH>FHHHHHFHFHHEHHHFFHHHHDHHGHHBAHHHFHHEHFHHGBIHHEFIFGEDGGC;FE80>ABC4CAEGG;A182;916>98\n-@EAS20_8_6_100_451_465/2 correct trim=22\n-GTTGCGTCCAAGCACCACCAGTTCGCCTTTTTCATTACCGGCGGTGAAACCTGCCATCAGCACCATGTGATCAGCCGG\n-+\n-HIHHDHHHHGHIGHHHHGHHHFHHIHIHHHHHIHHHHHGIH@HH>A;AD95#+43=?C:35:6865/9;13=<:?B?C\n-@EAS20_8_6_100_452_1846/2 correct\n-CTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTGGCGATGA\n-+\n-HHHHHGHHHHGHHHFHHHHGHGHDHHFHBEHHHFHFGHHGHHHDHE#HEDF?CF?DFD:E252+7CBF?14:*:AA;:C9;9;+ABAD8#64<::;3+<7\n-@EAS20_8_6_100_723_1564/2 correct trim=2\n-TGCCGAACGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCGCAATTGAAAACTTTCGTCGATCAGGAATTTG\n-+\n-HHHEHEHEH?HHEEHEEGHHBEFEEHHHFHHHHHHFHEHFEHHFHGHHGHED/EHDHEH@A88D@C(E6BEEHD@5?CE:AG;D@C;;2@>#8.95?C\n-@EAS20_8_6_100_776_1749/2\n-TCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATC\n-+\n-F3G30CEG?GDD4D=H<8BFEF8HDGHHH1HHFFEHDHB1;5>;<8EDC8??@ADEHH@HEEEHFHHHHHHEHHHG:@FFFGA6AEHH@=EHH;HFC/FF\n-@EAS20_8_6_100_779_871/2\n-AAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCTGGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAG\n-+\n-FGEFCEHFFFBHHFHHHHEEHHHBCFAFEHGHGHH7B@:EDFHDE5CAABBHCB7@8?A8?FB3BBADBDG>;;CF=FGGD52B0?A2A?;;=;BA5DAE\n-@EAS20_8_6_100_816_1759/2\n-AAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTACACAACATCCATGAAAC\n-+\n-63;=>>3>>?DECADBBDCG?@7?5DCEEEGGGECGGGCGGGDCGGFCG6FGBCGGGGG>DGCGGBEGG>4E7?GFGG<GGGGEG;,GBADD8ADG>2EF\n-@EAS20_8_6_100_993_1119/2 trim=60\n-TGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCC\n-+\n-B>BBB=F:FGFHFBHHHHHHHDHDGHEH=HHHHGE>8DC=\n-@EAS20_8_6_100_1153_966/2\n-TCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTTATTTGGGCAAATTCCTGATCGA\n-+\n-HHGHHHHHHGHHHHHGHHHHHHHHHHGHHHHHHHHHGHGHHHHH;HFDEHFDHDHHHHHGDHHHHDGHFGBGHHCGGHFH>ECGGHGECFFDFFD?DDDB\n-@EAS20_8_6_100_1183_226/2 correct trim=40\n-AATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCAC\n-+\n-DDBBD@EEEGDHHEHBCBB0=GCGC4?.6=D8CF89:DFBGG5==*83<#?/:;+E@ABB\n-@EAS20_8_6_100_1263_900/2\n-AAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGGGTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTTTG\n-+\n-HHHEHHHEGIHHHGHGGHHHHHHHHHHHHHH=HFHHHHHFHHHGEHHFHHHGEBHHHBCHHDEGHGGF@G@HGEE=F;C9H39H=FEHFHHEFH?=AEFE\n-@EAS20_8_6_100_1277_357/2 trim=5\n-GCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGG\n-+\n-FFFHFHHHHHHHHGHHDHHBBHHHHHHEEEH<GHGH@FHHHHGGHGHHHFGHHGGHGGHHHFBEFFEHHHECGIIFHEGEEDFEEH//EBD4=EF\n-@EAS20_8_6_100_1337_252/2 correct\n-CATAATGGCGATCGACATTTTCTCGCCACGGCAAATCAGCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTTTT\n-+\n-HHHHBHEECG=FEEFH.HHH=GEGE@HEF<BFHHBHHAHHBBBB>DGHH8HDF/=F=FF==;/FFCGGHDGBHG-B<@BFE=:FE5=E98E=E-H=@C#C\n-@EAS20_8_6_100_1432_436/2\n-CAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGC\n-+\n-HHHHHFHHGHHHHHGGHHHHGHHHHHHHHGHHHGHHHGGGEEEHHHHHHFHEDGGGHHFHHHDGHBFGFF>BHH8FBF0F@>DFGHHBBEH>FBD@DHEG\n-@EAS20_8_6_100_1457_1209/2 correct trim=11\n-GCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTGGCGATGATTGAAAAAACCATTAGCGGCCAGG\n-+\n-HHHHBGHHHFH?HHHHCCFDB=?D=HHEEAEFEHGEB=HHC68C5??B==B=F<;C7=ECH=HE:?CE>@?<EB1.-87<<#3C9@>??\n-@EAS20_8_6_100_1609_245/2 correct trim=16\n-TCACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCACCTGACAGTGCGGGCTTTTTT\n-+\n-HHEHHHGHHGHHHHDIHHHHHHHHHFHAFHFHHEIFDHFH8HHHFHHHGHHHEEB<8FFFCG>FE==9D9#0:?45/<#;B8=D\n-@EAS20_8_6_100_1637_1332/2\n-ATTCTGACTGCAACGGGCAATATGTCTCTGTGTGGATTAAAAAAAGAGTGTCTGATAGCAGCTTCTGAACTGGTTACCTGCCGTGAGTAAATTAAAATTT\n-+\n-HHGEHGHHHHGHIGHAHEHEHEIHGGHHHHHHHGGHHHHFHEGDGCCCHHHGHHDHHIHFEEHHHHHGHIHHHFHHIEIHHHHFAEEEHHIEHDHFFHFH\n'
b
diff -r b7829778729f -r 74f20c988994 test-data/ecoli_1K_2.fq.gz
b
Binary file test-data/ecoli_1K_2.fq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/kmer_33_output.fa
--- a/test-data/kmer_33_output.fa Mon Sep 20 09:55:41 2021 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,18 +0,0 @@
->NODE_1_length_1000_cov_225.838676
-AATCGGCGCGTAAACAGGCAGCCAGCACCGCAGCAGAGTAGTCGGAACCGTTGCGTCCAA
-GCACCACCAGTTCGCCTTTTTCATTACCGGCGGTGAAACCTGCCATCAGCACCATGTGAT
-CAGCCGGAATGCGGCTTGCCGCAATACGGCGGGTGGACTCAGCAATATCGACGGTAGATT
-CGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGAC
-CGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCA
-GCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTT
-TTATTTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCT
-GGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGG
-GTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTT
-TGGCGGGGGCAGAGAGGACGGTGGCCACCTGCCCCTGCCTGGCATTGCTTTCCAGAATAT
-CGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTC
-GCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCAGGTGCGGG
-CTTTTTTCTGTGTTTCCTGTACGCGTCAGCCCGCACCGTTACCTGTGGTAATGGTGATGG
-TGGTGGTAATGGTGGTGCTAATGCGTTTCATGGATGTTGTGTACTCTGTAATTTTTATCT
-GTCTGTGCGCTATGCCTATATTGGTTAAAGTATTTAGTGACCTAAGTCAATAAAATTTTA
-ATTTACTCACGGCAGGTAACCAGTTCAGAAGCTGCTATCAGACACTCTTTTTTTAATCCA
-CACAGAGACATATTGCCCGTTGCAGTCAGAATGAAAAGCT
b
diff -r b7829778729f -r 74f20c988994 test-data/kmer_77_output.fa
--- a/test-data/kmer_77_output.fa Mon Sep 20 09:55:41 2021 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,18 +0,0 @@
->NODE_1_length_976_cov_64.459399
-AGCTTTTCATTCTGACTGCAACGGGCAATATGTCTCTGTGTGGATTAAAAAAAGAGTGTC
-TGATAGCAGCTTCTGAACTGGTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGG
-TCACTAAATACTTTAACCAATATAGGCATAGCGCACAGACAGATAAAAATTACAGAGTAC
-ACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCATTACCACAGGT
-AACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCACCTGACAGTGCGGG
-CTTTTTTTTTCGACCAAAGGTAACGAGGTAACAACCATGCGAGTGTTGAAGTTCGGCGGT
-ACATCAGTGGCAAATGCAGAACGTTTTCTGCGTGTTGCCGATATTCTGGAAAGCAATGCC
-AGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAATCACCAACCACCTGGTG
-GCGATGATTGAAAAAACCATTAGCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAA
-CGTATTTTTGCCGAACTTTTGACGGGACTCGCCGCCGCCCAGCCGGGGTTCCCGCTGGCG
-CAATTGAAAACTTTCGTCGATCAGGAATTTGCCCAAATAAAACATGTCCTGCATGGCATT
-AGTTTGTTGGGGCAGTGCCCGGATAGCATCAACGCTGCGCTGATTTGCCGTGGCGAGAAA
-ATGTCGATCGCCATTATGGCCGGCGTATTAGAAGCGCGCGGTCACAACGTTACTGTTATC
-GATCCGGTCGAAAAACTGCTGGCAGTGGGGCATTACCTCGAATCTACCGTCGATATTGCT
-GAGTCCACCCGCCGTATTGCGGCAAGCCGCATTCCGGCTGATCACATGGTGCTGATGGCA
-GGTTTCACCGCCGGTAATGAAAAAGGCGAACTGGTGGTGCTTGGACGCAACGGTTCCGAC
-TACTCTGCTGCGGTGC
b
diff -r b7829778729f -r 74f20c988994 test-data/pl1.fq.gz
b
Binary file test-data/pl1.fq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/pl2.fq.gz
b
Binary file test-data/pl2.fq.gz has changed
b
diff -r b7829778729f -r 74f20c988994 test-data/reference_1K.fa
--- a/test-data/reference_1K.fa Mon Sep 20 09:55:41 2021 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,18 +0,0 @@
->NODE_1_length_1000_cov_140.641_ID_29
-AATCGGCGCGTAAACAGGCAGCCAGCACCGCAGCAGAGTAGTCGGAACCGTTGCGTCCAA
-GCACCACCAGTTCGCCTTTTTCATTACCGGCGGTGAAACCTGCCATCAGCACCATGTGAT
-CAGCCGGAATGCGGCTTGCCGCAATACGGCGGGTGGACTCAGCAATATCGACGGTAGATT
-CGAGGTAATGCCCCACTGCCAGCAGTTTTTCGACCGGATCGATAACAGTAACGTTGTGAC
-CGCGCGCTTCTAATACGCCGGCCATAATGGCGATCGACATTTTCTCGCCACGGCAAATCA
-GCGCAGCGTTGATGCTATCCGGGCACTGCCCCAACAAACTAATGCCATGCAGGACATGTT
-TTATTTGGGCAAATTCCTGATCGACGAAAGTTTTCAATTGCGCCAGCGGGAACCCCGGCT
-GGGCGGCGGCGAGTCCCGTCAAAAGTTCGGCAAAAATACGTTCGGCATCGCTGATATTGG
-GTAAAGCATCCTGGCCGCTAATGGTTTTTTCAATCATCGCCACCAGGTGGTTGGTGATTT
-TGGCGGGGGCAGAGAGGACGGTGGCCACCTGCCCCTGCCTGGCATTGCTTTCCAGAATAT
-CGGCAACACGCAGAAAACGTTCTGCATTTGCCACTGATGTACCGCCGAACTTCAACACTC
-GCATGGTTGTTACCTCGTTACCTTTGGTCGAAAAAAAAAGCCCGCACTGTCAGGTGCGGG
-CTTTTTTCTGTGTTTCCTGTACGCGTCAGCCCGCACCGTTACCTGTGGTAATGGTGATGG
-TGGTGGTAATGGTGGTGCTAATGCGTTTCATGGATGTTGTGTACTCTGTAATTTTTATCT
-GTCTGTGCGCTATGCCTATATTGGTTAAAGTATTTAGTGACCTAAGTCAATAAAATTTTA
-ATTTACTCACGGCAGGTAACCAGTTCAGAAGCTGCTATCAGACACTCTTTTTTTAATCCA
-CACAGAGACATATTGCCCGTTGCAGTCAGAATGAAAAGCT