# HG changeset patch
# User iuc
# Date 1632344500 0
# Node ID 71adaaace3360d1ffabe92ba15762acea4aebdce
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/amplican commit 48a91cdf44f4d7e332b852bb2ced6cd180147fdc"
diff -r 000000000000 -r 71adaaace336 amplican.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/amplican.xml Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,438 @@
+
+ analysis tool for genome editing
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ Use both FASTQ files
+ Use both FASTQ files, but only one of the reads (forward or reverse) is required to have its primer perfectly matched to the sequence
+ Use only the forward FASTQ file
+ Use only the reverse FASTQ file
+
+
+
+
+
+
+
+
+ None: don't write any alignments to files
+ Text file: read information followed by forward read and amplicon sequence followed by reverse read with its amplicon sequence
+ FASTA file: outputs alignments in fasta format where header indicates experiment ID, read id and number of reads
+
+
+ Configuration summary (config_summary.csv)
+ Barcode reads filters (barcode_reads_filters.csv)
+ Knitr HTML report
+ Parameters (RunParameters.txt)
+ Alignments Rda file (AlignmentsExperimentSet.rds)
+ Events filtered shifted (events_filtered_shifted.csv)
+ Events filtered shifted normalized (events_filtered_shifted_normalized.csv)
+ Raw events (raw_events.csv)
+ Unassigned reads (unassigned_reads.csv)
+
+
+
+
+
+ "config_summary" in output_options["outputs"]
+
+
+ "barcode_reads" in output_options["outputs"]
+
+
+ "knit_reports" in output_options["outputs"]
+
+
+ "parameters" in output_options["outputs"]
+
+
+ "alignments_rds" in output_options["outputs"]
+
+
+ output_options["write_alignment_format"] == "fasta"
+
+
+ output_options["write_alignment_format"] == "txt"
+
+
+ "events_filtered_shifted" in output_options["outputs"]
+
+
+ "events_filtered_shifted_normalized" in output_options["outputs"]
+
+
+ "raw_events" in output_options["outputs"]
+
+
+ "unassigned_reads" in output_options["outputs"]
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff -r 000000000000 -r 71adaaace336 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,19 @@
+
+ 1.14.0
+ 0
+
+
+ amplican
+
+
+
+
+ bioconductor-amplican
+
+
+
+
+ 10.1101/gr.244293.118
+
+
+
diff -r 000000000000 -r 71adaaace336 test-data/R1_001.fastq
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/R1_001.fastq Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,80 @@
+@ID_1_valid_cut_biggest_1
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTTCCAGAAAAAAAAAAAAAAAAAAAATTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_biggest_2
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTTCCAGAAAAAAAAAAAAAAAAAAAATTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_biggest_3
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTTCCAGAAAAAAAAAAAAAAAAAAAATTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_medium_1
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTTAAAAAAAAAAAAAAAAAAAACACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_medium_2
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTTAAAAAAAAAAAAAAAAAAAACACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_small
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAAATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@primer_dimer
+AAGCTGACGGCTAAATGAAAAAGCCTCGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@bad_quality32
+AAGCTGACGGCTAAATGAAAAATATCTGAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGAAGAAGGTCAGGGAAGGTCACTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCA
++
+9999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999
+@bad_quality32
+AAGCTGACGGCTAAATGAAAAATATCTGAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGAAGAAGGTCAGGGAAGGTCACTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCA
++
+9999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999
+@bad_bases
+AAGCTGACGGCTAAATNNNAAATATCTGAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGAAGAAGGTCAGGGAAGGTCACTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCA
++
+AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+@bad_bases
+AAGCTNGCGGCTAAATGAAAAATATCTGAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGAAGAAGGTCAGGGAAGGTCACTGGAGGTCACTGGGATACCCTTTCTTCCCACACCANNNGGGAAAGGAGTCCTGCCAGATGACCA
++
+AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+@next_id_nocut6_bad_alphabet
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTGTTTTGATGATNNNCTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTATATGTAGTGATAAAA
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@next_id_nocut7_bad_quality
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTGTTTTGATGATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTATATGTAGTGATAAAA
++
+9999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999
+@next_id_nocut8_bad_quality
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTGTTTTGATGATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTATATGTAGTGATAAAA
++
+9999999999999999999999999999999999999999999999999999999999999999IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_biggest_1
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAGGATGAT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_biggest_2
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAGGATGAT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_biggest_3
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAGGATGAT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_medium_1
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAGGATGAT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_medium_2
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAGGATGAT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_small
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAGGATGAT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
diff -r 000000000000 -r 71adaaace336 test-data/R1_001.fastq.gz
Binary file test-data/R1_001.fastq.gz has changed
diff -r 000000000000 -r 71adaaace336 test-data/R1_002.fastq
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/R1_002.fastq Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,84 @@
+@ID_3_valid_cut_biggest_1
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCATTTTTGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_biggest_2
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCATTTTTGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_biggest_3
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCATTTTTGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_biggest_4
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCATTTTTGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_biggest_5
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCATTTTTGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_medium_1
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGTGGTCAGGGAACAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_medium_2
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGTGGTCAGGGAACAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_PD_1
+AAGCTGACGGCTAAATGAAAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_not_valid_insertion_deletion
+AAGCTGACGGCTAAATGAAAAATGTTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCCCCCCCCCCCCCCCCCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_1
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAGTAACTTGTGCTTGCATTGTGTAACAACTGACTGCTGTTAAAGGCCGGAAGTCTAAGAACTCACATGAAAGAGGGTATAATCCTGCCTCAGCGCTC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_2
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAGTAACTTGTGCTTGCATTGTGTAACAACTGACTGCTGTTAAAGGCCGGAAGTCTAAGAACTCACATGAAAGAGGGTATAATCCTGCCTCAGCGCTC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_3
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAGTAACTTGTGCTTGCATTGTGTAACAACTGACTGCTGTTAAAGGCCGGAAGTCTAAGAACTCACATGAAAGAGGGTATAATCCTGCCTCAGCGCTC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_4
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAGTAACTTGTGCTTGCATTGTGTAACAACTGACTGCTGTTAAAGGCCGGAAGTCTAAGAACTCACATGAAAGAGGGTATAATCCTGCCTCAGCGCTC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_medium_1
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAATCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTGGGGGGGGAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGAGTGCATGTAGAGGGTATAATCCTGCCTCAGCGCTC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_medium_2
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAATCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTGGGGGGGGAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGAGTGCATGTAGAGGGTATAATCCTGCCTCAGCGCTC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_small_1
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCACCACACGTGCATCGTACTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTCCTTGGAGAGGGTATAATCCTGCCTCAGCGCTC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfect1
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfect2
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfect3
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfectHDR1
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAAGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfectHDR2
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAAGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
diff -r 000000000000 -r 71adaaace336 test-data/R1_002.fastq.gz
Binary file test-data/R1_002.fastq.gz has changed
diff -r 000000000000 -r 71adaaace336 test-data/R2_001.fastq
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/R2_001.fastq Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,80 @@
+@ID_1_valid_cut_biggest_1
+AATTACACAAGCGCAAACACACCTGGATCTGGCTGCTGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAATTTTTTTTTTTTTTTTTTTTCTGGAACAGACGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_biggest_2
+AATTACACAAGCGCAAACACACCTGGATCTGGCTGCTGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAATTTTTTTTTTTTTTTTTTTTCTGGAACAGACGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_biggest_3
+AATTACACAAGCGCAAACACACCTGGATCTGGCTGCTGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAATTTTTTTTTTTTTTTTTTTTCTGGAACAGACGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_medium_1
+AATTACACAAGCGCAAACACACCTGGATCTGGCTGCTGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGTTTTTTTTTTTTTTTTTTTTAACAGACGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_medium_2
+AATTACACAAGCGCAAACACACCTGGATCTGGCTGCTGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGTTTTTTTTTTTTTTTTTTTTAACAGACGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_1_valid_cut_small
+AATTACACAAGCGCAAACACACCTGGATTTGGCTGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGACGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@primer_dimer
+AATTACACAAGCGCAAACACACGAGGCTTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@bad_quality32
+TGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCAGTGACCTTCCCTGACCTTCTTCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTCAGATATTTTTCATTTAGCCGTCAGCTT
++
+9999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999
+@bad_quality32
+AAGCTGACGGCTAAATGAAAAATATCTGAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGAAGAAGGTCAGGGAAGGTCACTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCA
++
+9999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999
+@bad_bases
+TGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCAGTGACCTTCCCTGACCTTCTTCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTCAGATATTTTTCATTTAGCCGTCAGCTT
++
+AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+@bad_bases
+TGGTCATCNNNNAGGACTCCTTTCCCCATTGGTGTGGGAAGNNNGGGTATCCCAGTGACCTCCAGTGACCTTCCCTGACCTTCTTCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTCAGATATTTTTCATTTAGCCGTCAGNNN
++
+AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+@next_id_nocut6_bad_alphabet
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTGTTTTGATGATNNNCTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTATATGTAGTGATAAAA
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@next_id_nocut7_bad_quality
+TGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCAGTGACCTTCCCTGACCTTCTTCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTCAGATATTTTTCATTTAGCCGTCAGCTT
++
+9999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999999
+@next_id_nocut8_bad_quality
+TGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCAGTGACCTTCCCTGACCTTCTTCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTCAGATATTTTTCATTTAGCCGTCAGCTT
++
+9999999999999999999999999999999999999999999999999999999999999999IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_biggest_1
+ATCATCCTCTGCTGCAAAATGCAAGGCAAAAAAAAACATTTAATTTTAATTTAACATTTTTTTATCACTACACATAAATAAAAGAAATTGAGAAGACTTACTGGTCTGCTGACCAGGGGCACAACTACAAAAGCACAATAAAGTTTATTATCAAAATAGCACCTTAAGAAGGTTTGGTCACAAGACAGTATTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_biggest_2
+ATCATCCTCTGCTGCAAAATGCAAGGCAAAAAAAAACATTTAATTTTAATTTAACATTTTTTTATCACTACACATAAATAAAAGAAATTGAGAAGACTTACTGGTCTGCTGACCAGGGGCACAACTACAAAAGCACAATAAAGTTTATTATCAAAATAGCACCTTAAGAAGGTTTGGTCACAAGACAGTATTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_biggest_3
+ATCATCCTCTGCTGCAAAATGCAAGGCAAAAAAAAACATTTAATTTTAATTTAACATTTTTTTATCACTACACATAAATAAAAGAAATTGAGAAGACTTACTGGTCTGCTGACCAGGGGCACAACTACAAAAGCACAATAAAGTTTATTATCAAAATAGCACCTTAAGAAGGTTTGGTCACAAGACAGTATTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_medium_1
+ATCATCCTCTGCTGCAAAATGCAAGGCAAAAAAAAACATTTAATTTTAATTTAACATTTTTTTATCACTACACATAAATAAAAGAAATTGAGAAGACTTACTGGTCTCTGCCAACACAAGGGGCACAACTACAAAAGCACAATAAAGTTTATTATCAAAATAGCACCTTAAGAAGGTTTGGTCACAAGACAGTATTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_medium_2
+ATCATCCTCTGCTGCAAAATGCAAGGCAAAAAAAAACATTTAATTTTAATTTAACATTTTTTTATCACTACACATAAATAAAAGAAATTGAGAAGACTTACTGGTCTCTGCCAACACAAGGGGCACAACTACAAAAGCACAATAAAGTTTATTATCAAAATAGCACCTTAAGAAGGTTTGGTCACAAGACAGTATTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_2_valid_cut_small
+ATCATCCTCTGCTGCAAAATGCAAGGCAAAAAAAAACATTTAATTTTAATTTAACATTTTTTTATCACTACACATAAATAAAAGAAATTGAGAAGACTTACTGCTGACCCTCTGCCAACACAAGGGGCACAACTACAAAAGCACAATAAAGTTTATTATCAAAATAGCACCTTAAGAAGGTTTGGTCACAAGACAGTATTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
diff -r 000000000000 -r 71adaaace336 test-data/R2_001.fastq.gz
Binary file test-data/R2_001.fastq.gz has changed
diff -r 000000000000 -r 71adaaace336 test-data/R2_002.fastq
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/R2_002.fastq Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,84 @@
+@ID_3_valid_cut_biggest_1
+AATTACACAAGCGCAAACACACCTGGATCAAAAATGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCACCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_biggest_2
+AATTACACAAGCGCAAACACACCTGGATCAAAAATGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCACCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_biggest_3
+AATTACACAAGCGCAAACACACCTGGATCAAAAATGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCACCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_biggest_4
+AATTACACAAGCGCAAACACACCTGGATCAAAAATGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCACCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_biggest_5
+AATTACACAAGCGCAAACACACCTGGATCAAAAATGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCACCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_medium_1
+AATTACACAAGCGCAAACACACCTGGATCTGGCTGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTGTTCCCTGACCACTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_valid_cut_medium_2
+AATTACACAAGCGCAAACACACCTGGATCTGGCTGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTGTTCCCTGACCACTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTGACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_PD_1
+AATTACACAAGCGCAAACACACCTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_3_not_valid_insertion_deletion
+AATTACACAAGCGCAAACACACCTGGATCTGGCTGCAGCAACACAGTTGGGATGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCACCAGTTCCCTGGGGGGGGGGGGGGGGGACCACCTCCTCTGCCCTGGCATACGCAGCAACATTTTTCATTTAGCCGTCAGCTT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_1
+GAGCGCTGAGGCAGGATTATACCCTCTTTCATGTGAGTTCTTAGACTTCCGGCCTTTAACAGCAGTCAGTTGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_2
+GAGCGCTGAGGCAGGATTATACCCTCTTTCATGTGAGTTCTTAGACTTCCGGCCTTTAACAGCAGTCAGTTGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_3
+GAGCGCTGAGGCAGGATTATACCCTCTTTCATGTGAGTTCTTAGACTTCCGGCCTTTAACAGCAGTCAGTTGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_4
+GAGCGCTGAGGCAGGATTATACCCTCTTTCATGTGAGTTCTTAGACTTCCGGCCTTTAACAGCAGTCAGTTGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_medium_1
+GAGCGCTGAGGCAGGATTATACCCTCTACATGCACTCTTGACACCTGCTGATGTGAGTTCTTAGACTTCCGGCCTTTCCCCCCCCAATGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACATTAGATTTTTACGTAAATTACTGGTAGGAATGTTGCCAGC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_medium_2
+GAGCGCTGAGGCAGGATTATACCCTCTACATGCACTCTTGACACCTGCTGATGTGAGTTCTTAGACTTCCGGCCTTTCCCCCCCCAATGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACATTAGATTTTTACGTAAATTACTGGTAGGAATGTTGCCAGC
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_4_not_valid_insertion_deletion_small_1
+GAGCGCTGAGGCAGGATTATACCCTCTCCAAGGACACTTGACACCTGCTGATGTGAGTTCTTAGACTTCCGGCCTTTAATGTTGCAGTACGATGCACGTGTGGTGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACATTAGCACATTTTATAGCATTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfect1
+ACTGGCTGAGGCAGGATTATACCCTCTTCATGCACACTTGACACCTGCTGATGTGAGTTCTTAGACTTCCGGCCTTTAATGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACATTAGACTGGAGAGCTACACATTTTATAGCATTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfect2
+ACTGGCTGAGGCAGGATTATACCCTCTTCATGCACACTTGACACCTGCTGATGTGAGTTCTTAGACTTCCGGCCTTTAATGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACATTAGACTGGAGAGCTACACATTTTATAGCATTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfect3
+ACTGGCTGAGGCAGGATTATACCCTCTTCATGCACACTTGACACCTGCTGATGTGAGTTCTTAGACTTCCGGCCTTTAATGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACATTAGACTGGAGAGCTACACATTTTATAGCATTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfectHDR1
+ACTGGCTGAGGCAGGATTATACCCTCTTCATGCACACTTGACACCTGCTGATGTGAGTTCTTAGACTTCCGGCTTTTAATGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACATTAGACTGGAGAGCTACACATTTTATAGCATTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
+@ID_5_perfectHDR2
+ACTGGCTGAGGCAGGATTATACCCTCTTCATGCACACTTGACACCTGCTGATGTGAGTTCTTAGACTTCCGGCTTTTAATGTTGCAGGGACTGGTTTCCTGTAAACACAATGCAAGCACAAGTTACATTAGACTGGAGAGCTACACATTTTATAGCATTTTTTTACGTAAATTACTGGTAGGAATGTTGCCAGT
++
+IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII
diff -r 000000000000 -r 71adaaace336 test-data/R2_002.fastq.gz
Binary file test-data/R2_002.fastq.gz has changed
diff -r 000000000000 -r 71adaaace336 test-data/RunParameters.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/RunParameters.txt Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,17 @@
+Config file: /tmp/tmpg3fcuksp/files/f/0/2/dataset_f0207835-503b-4340-b985-c28af77332e6.dat
+Average Quality: 0
+Minimum Quality: 20
+Write Alignments: txt
+Fastq files Mode: 0
+Gap Opening: 25
+Gap Extension: 0
+Consensus: TRUE
+Normalize: guideRNA, Group
+PRIMER DIMER buffer: 30
+Cut buffer: 5
+Scoring Matrix:
+,A,C,G,T
+A,5,-4,-4,-4
+C,-4,5,-4,-4
+G,-4,-4,5,-4
+T,-4,-4,-4,5
diff -r 000000000000 -r 71adaaace336 test-data/alignments.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/alignments.txt Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,112 @@
+ID: ID_1 read_id: 1 Count: 3
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTTCCAG------------------------------------------------------------------AAAAAAAAAAAAAAAAAAAATTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTC--------------------TTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTTCCAG------------------------------------------------------------------AAAAAAAAAAAAAAAAAAAATTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTC--------------------TTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+ID: ID_1 read_id: 2 Count: 2
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTT--------------------------------------------------------------------------AAAAAAAAAAAAAAAAAAAACACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCC--------------------CACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTCTGTT--------------------------------------------------------------------------AAAAAAAAAAAAAAAAAAAACACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCAGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCC--------------------CACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+ID: ID_1 read_id: 3 Count: 1
+AAGCTGACGGCTAAATGAAAAAG------------------------------------------------------------------------------------------------------------------------------------------------------CCTCGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+AAGCTGACGGCTAAATGAAAAAG------------------------------------------------------------------------------------------------------------------------------------------------------CCTCGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+ID: ID_1 read_id: 4 Count: 1
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTC------------------------------------------------------------------------------------AATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAAATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+AAGCTGACGGCTAAATGAAAAATGTCAAACGTC------------------------------------------------------------------------------------AATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAAATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+ID: ID_2 read_id: 1 Count: 3
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCT-------------GGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCT-------------GGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+
+ID: ID_2 read_id: 2 Count: 2
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAG---------ACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAG---------ACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+
+ID: ID_2 read_id: 3 Count: 1
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAG-----TAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAG-----TAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+TGACCAAACCTTCTTAAGGTGCTATTTTGATAATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTGTAGTGATAAAAAAATGTTAAATTAAAATTAAATGTTTTTTTTTGCCTTGCATTTTGCAGCAGAG
+
+ID: ID_3 read_id: 1 Count: 5
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGG------------------TGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCATTTTTGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCA-GATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGG------------------TGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCATTTTTGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCA-GATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+ID: ID_3 read_id: 2 Count: 2
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAG------TGGTCAGGGAAC------AGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAG------TGGTCAGGGAAC------AGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+ID: ID_3 read_id: 3 Count: 1
+AAGCTGACGGCTAAATGAAAAATGT-----------------TGCTGCGTATGCCAGGGCAGAGGAGGTGGTCCCCCCCCCCCCCCCCCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTC----------------AGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+AAGCTGACGGCTAAATGAAAAATGT-----------------TGCTGCGTATGCCAGGGCAGAGGAGGTGGTCCCCCCCCCCCCCCCCCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTC----------------AGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+ID: ID_3 read_id: 4 Count: 1
+AAGCTGACGGCTAAATGAAA------------------------------------------------------------------------------------------------------------------------------------------------------------GGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+AAGCTGACGGCTAAATGAAA------------------------------------------------------------------------------------------------------------------------------------------------------------GGTGTGTTTGCGCTTGTGTAATT
+AAGCTGACGGCTAAATGAAAAATGTCAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGGAGGTGGTCAGGGAACTGGTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCATCCCAACTGTGTTGCTGCAGCCAGATCCAGGTGTGTTTGCGCTTGTGTAATT
+
+ID: ID_4 read_id: 1 Count: 4
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAA--------------------------------GTAACTTGTGCTTGCATTGTGT--------AACAACTGACTGCTG--TTAAAGGCCGGAAGTCTAAGAACTCACATGA--------------------AAGAGGGTATAATCCTGCCTCAGCGCTC
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCGCTC
+
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAA--------------------------------GTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACAACTGACTGCTGTTAAAGGCCGGAAGTCTAAGAACTCACATGA--------------------AAGAGGGTATAATCCTGCCTCAGCGCTC
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACA-----------TTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCGCTC
+
+ID: ID_4 read_id: 2 Count: 2
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAA---------------------------TCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTGGGGGGGGAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGAGTGCATGTAGAGGGTATAATCCTGCCTCAGCGCTC
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATT--------AAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCGCTC
+
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAA---------------------------TCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTGGGGGGGGAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGAGTGCATGTAGAGGGTATAATCCTGCCTCAGCGCTC
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATT--------AAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCGCTC
+
+ID: ID_4 read_id: 3 Count: 1
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTG------------CTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCACCACACGTGCATCGTACTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTCCTTGGAGAGGGTATAATCCTGCCTCAGCGCTC
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCC------------------TGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCGCTC
+
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTG------------CTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCACCACACGTGCATCGTACTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTCCTTGGAGAGGGTATAATCCTGCCTCAGCGCTC
+GCTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCC------------------TGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCGCTC
+
+ID: ID_5 read_id: 1 Count: 3
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
+
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
+
+ID: ID_5 read_id: 2 Count: 2
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAAGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
+
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAAGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
+ACTGGCAACATTCCTACCAGTAATTTACGTAAAAAAATGCTATAAAATGTGTAGCTCTCCAGTCTAATGTAACTTGTGCTTGCATTGTGTTTACAGGAAACCAGTCCCTGCAACATTAAAGGCCGGAAGTCTAAGAACTCACATCAGCAGGTGTCAAGTGTGCATGAAGAGGGTATAATCCTGCCTCAGCCAGT
+
diff -r 000000000000 -r 71adaaace336 test-data/barcode_reads_filtered.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/barcode_reads_filtered.csv Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,3 @@
+Barcode,experiment_count,read_count,bad_base_quality,bad_average_quality,bad_alphabet,filtered_read_count,unique_reads,unassigned_reads,assigned_reads
+barcode_1,2,20,0,0,3,17,10,3,7
+barcode_2,3,21,0,0,0,21,9,0,9
diff -r 000000000000 -r 71adaaace336 test-data/config.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/config.csv Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,6 @@
+ID,Barcode,Forward_Reads,Reverse_Reads,Group,Control,guideRNA,Forward_Primer,Reverse_Primer,Direction,Amplicon,Donor
+ID_1,barcode_1,R1_001.fastq,R2_001.fastq,Betty,0,AGGTGGTCAGGGAACTGG,AAGCTGACGGCTAAATGA,AATTACACAAGCGCAAACACAC,0,aagctgacggctaaatgaaaaatgtcaaacatctgttccaggtgctgcgtatgccagggcagaggAGGTGGTCAGGGAACTGGtggaggtcactgggataccctttcttcccacaccaatggggaaaggagtcctgccagatgaccatcccaactgtgttgctgcagccagatccaggtgtgtttgcgcttgtgtaatt,
+ID_2,barcode_1,R1_001.fastq,R2_001.fastq,Tom,0,TGACCCTCTGCCAACACAAGGGG,TGACCAAACCTTCTTAAGGTGC,CTCTGCTGCAAAATGCAAGG,1,aaatactgtcttgtgaccaaaccttcttaaggtgctattttgataataaactttattgtgcttttgtagttgtgCCCCTTGTGTTGGCAGAGGGTCAgcagaccagtaagtcttctcaatttcttttatttatgtgtagtgataaaaaaatgttaaattaaaattaaatgtttttttttgccttgcattttgcagcagaggatgat,
+ID_3,barcode_2,R1_002.fastq,R2_002.fastq,Tom,0,AGGTGGTCAGGGAACTGG,AAGCTGACGGCTAAATGA,AATTACACAAGCGCAAACACAC,0,aagctgacggctaaatgaaaaatgtcaaacatctgttccaggtgctgcgtatgccagggcagaggAGGTGGTCAGGGAACTGGtggaggtcactgggataccctttcttcccacaccaatggggaaaggagtcctgccagatgaccatcccaactgtgttgctgcagccagatccaggtgtgtttgcgcttgtgtaatt,
+ID_4,barcode_2,R1_002.fastq,R2_002.fastq,Betty,1,GTCCCTGCAACATTAAAGGCCGG,GCTGGCAACATTCCTACCAGT,GAGCGCTGAGGCAGGATTAT,0,gctggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAGGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagcgctc,
+ID_5,barcode_2,R1_002.fastq,R2_002.fastq,Betty,0,GTCCCTGCAACATTAAAGGCCGG,ACTGGCAACATTCCTACCAGT,ACTGGCTGAGGCAGGATTAT,0,actggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAGGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagccagt,actggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAAGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagccagt
diff -r 000000000000 -r 71adaaace336 test-data/config_gzip.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/config_gzip.csv Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,6 @@
+ID,Barcode,Forward_Reads,Reverse_Reads,Group,Control,guideRNA,Forward_Primer,Reverse_Primer,Direction,Amplicon,Donor
+ID_1,barcode_1,R1_001.fastq.gz,R2_001.fastq.gz,Betty,0,AGGTGGTCAGGGAACTGG,AAGCTGACGGCTAAATGA,AATTACACAAGCGCAAACACAC,0,aagctgacggctaaatgaaaaatgtcaaacatctgttccaggtgctgcgtatgccagggcagaggAGGTGGTCAGGGAACTGGtggaggtcactgggataccctttcttcccacaccaatggggaaaggagtcctgccagatgaccatcccaactgtgttgctgcagccagatccaggtgtgtttgcgcttgtgtaatt,
+ID_2,barcode_1,R1_001.fastq.gz,R2_001.fastq.gz,Tom,0,TGACCCTCTGCCAACACAAGGGG,TGACCAAACCTTCTTAAGGTGC,CTCTGCTGCAAAATGCAAGG,1,aaatactgtcttgtgaccaaaccttcttaaggtgctattttgataataaactttattgtgcttttgtagttgtgCCCCTTGTGTTGGCAGAGGGTCAgcagaccagtaagtcttctcaatttcttttatttatgtgtagtgataaaaaaatgttaaattaaaattaaatgtttttttttgccttgcattttgcagcagaggatgat,
+ID_3,barcode_2,R1_002.fastq.gz,R2_002.fastq.gz,Tom,0,AGGTGGTCAGGGAACTGG,AAGCTGACGGCTAAATGA,AATTACACAAGCGCAAACACAC,0,aagctgacggctaaatgaaaaatgtcaaacatctgttccaggtgctgcgtatgccagggcagaggAGGTGGTCAGGGAACTGGtggaggtcactgggataccctttcttcccacaccaatggggaaaggagtcctgccagatgaccatcccaactgtgttgctgcagccagatccaggtgtgtttgcgcttgtgtaatt,
+ID_4,barcode_2,R1_002.fastq.gz,R2_002.fastq.gz,Betty,1,GTCCCTGCAACATTAAAGGCCGG,GCTGGCAACATTCCTACCAGT,GAGCGCTGAGGCAGGATTAT,0,gctggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAGGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagcgctc,
+ID_5,barcode_2,R1_002.fastq.gz,R2_002.fastq.gz,Betty,0,GTCCCTGCAACATTAAAGGCCGG,ACTGGCAACATTCCTACCAGT,ACTGGCTGAGGCAGGATTAT,0,actggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAGGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagccagt,actggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAAGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagccagt
diff -r 000000000000 -r 71adaaace336 test-data/config_summary.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/config_summary.csv Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,6 @@
+ID,Barcode,Forward_Reads_File,Reverse_Reads_File,Group,guideRNA,Found_Guide,Control,Forward_Primer,Reverse_Primer,Direction,Amplicon,Donor,fwdPrPosEnd,rvePrPos,Reads,PRIMER_DIMER,Low_Score,Reads_Filtered,Reads_Del,Reads_In,Reads_Edited,Reads_Frameshifted,HDR
+ID_1,barcode_1,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R1_001.fastq,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R2_001.fastq,Betty,AGGTGGTCAGGGAACTGG,TRUE,FALSE,AAGCTGACGGCTAAATGA,AATTACACAAGCGCAAACACAC,FALSE,aagctgacggctaaatgaaaaatgtcaaacatctgttccaggtgctgcgtatgccagggcagaggAGGTGGTCAGGGAACTGGtggaggtcactgggataccctttcttcccacaccaatggggaaaggagtcctgccagatgaccatcccaactgtgttgctgcagccagatccaggtgtgtttgcgcttgtgtaatt,"",18,178,7,1,0,6,6,0,6,2,0
+ID_2,barcode_1,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R1_001.fastq,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R2_001.fastq,Tom,TGACCCTCTGCCAACACAAGGGG,TRUE,FALSE,TGACCAAACCTTCTTAAGGTGC,CTCTGCTGCAAAATGCAAGG,TRUE,aaatactgtcttgtgaccaaaccttcttaaggtgctattttgataataaactttattgtgcttttgtagttgtgCCCCTTGTGTTGGCAGAGGGTCAgcagaccagtaagtcttctcaatttcttttatttatgtgtagtgataaaaaaatgttaaattaaaattaaatgtttttttttgccttgcattttgcagcagaggatgat,"",35,181,6,0,0,6,6,0,6,4,0
+ID_3,barcode_2,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R1_002.fastq,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R2_002.fastq,Tom,AGGTGGTCAGGGAACTGG,TRUE,FALSE,AAGCTGACGGCTAAATGA,AATTACACAAGCGCAAACACAC,FALSE,aagctgacggctaaatgaaaaatgtcaaacatctgttccaggtgctgcgtatgccagggcagaggAGGTGGTCAGGGAACTGGtggaggtcactgggataccctttcttcccacaccaatggggaaaggagtcctgccagatgaccatcccaactgtgttgctgcagccagatccaggtgtgtttgcgcttgtgtaatt,"",18,178,9,1,0,8,7,1,8,1,0
+ID_4,barcode_2,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R1_002.fastq,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R2_002.fastq,Betty,GTCCCTGCAACATTAAAGGCCGG,TRUE,TRUE,GCTGGCAACATTCCTACCAGT,GAGCGCTGAGGCAGGATTAT,FALSE,gctggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAGGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagcgctc,"",21,175,7,0,0,7,4,7,7,2,0
+ID_5,barcode_2,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R1_002.fastq,/tmp/tmpg3fcuksp/job_working_directory/000/6/working/fastq_folder/R2_002.fastq,Betty,GTCCCTGCAACATTAAAGGCCGG,TRUE,FALSE,ACTGGCAACATTCCTACCAGT,ACTGGCTGAGGCAGGATTAT,FALSE,actggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAGGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagccagt,actggcaacattcctaccagtaatttacgtaaaaaaatgctataaaatgtgtagctctccagtctaatgtaacttgtgcttgcattgtgtttacaggaaaccaGTCCCTGCAACATTAAAAGCCGGaagtctaagaactcacatcagcaggtgtcaagtgtgcatgaagagggtataatcctgcctcagccagt,21,175,5,0,0,5,0,0,2,0,2
diff -r 000000000000 -r 71adaaace336 test-data/events_filtered_shifted.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/events_filtered_shifted.csv Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,84 @@
+seqnames,start,end,width,strand,originally,replacement,type,read_id,score,counts,readType,overlaps,consensus
+ID_1,42,61,20,+,"",AAAAAAAAAAAAAAAAAAAA,insertion,1,597,3,FALSE,FALSE,TRUE
+ID_1,46,65,20,+,"",AAAAAAAAAAAAAAAAAAAA,insertion,2,557,2,FALSE,FALSE,TRUE
+ID_1,-24,41,66,+,"","",deletion,1,597,3,FALSE,TRUE,TRUE
+ID_1,-28,45,74,+,"","",deletion,2,557,2,FALSE,TRUE,TRUE
+ID_1,-32,51,84,+,"","",deletion,4,532,1,FALSE,TRUE,TRUE
+ID_1,-35,-35,1,+,A,G,mismatch,1,597,3,FALSE,FALSE,TRUE
+ID_1,97,97,1,+,T,A,mismatch,1,597,3,FALSE,FALSE,TRUE
+ID_1,-35,-35,1,+,A,G,mismatch,2,557,2,FALSE,FALSE,TRUE
+ID_1,97,97,1,+,T,A,mismatch,2,557,2,FALSE,FALSE,TRUE
+ID_1,-35,-35,1,+,A,G,mismatch,4,532,1,FALSE,FALSE,TRUE
+ID_1,105,105,1,+,G,A,mismatch,4,532,1,FALSE,FALSE,TRUE
+ID_1,42,61,20,-,"",AAAAAAAAAAAAAAAAAAAA,insertion,1,597,3,FALSE,FALSE,FALSE
+ID_1,46,65,20,-,"",AAAAAAAAAAAAAAAAAAAA,insertion,2,557,2,FALSE,FALSE,FALSE
+ID_1,-24,41,66,-,"","",deletion,1,597,3,FALSE,TRUE,FALSE
+ID_1,-28,45,74,-,"","",deletion,2,557,2,FALSE,TRUE,FALSE
+ID_1,-32,51,84,-,"","",deletion,4,532,1,FALSE,TRUE,FALSE
+ID_1,-35,-35,1,-,A,G,mismatch,1,597,3,FALSE,FALSE,FALSE
+ID_1,97,97,1,-,T,A,mismatch,1,597,3,FALSE,FALSE,FALSE
+ID_1,-35,-35,1,-,A,G,mismatch,2,557,2,FALSE,FALSE,FALSE
+ID_1,97,97,1,-,T,A,mismatch,2,557,2,FALSE,FALSE,FALSE
+ID_1,-35,-35,1,-,A,G,mismatch,4,532,1,FALSE,FALSE,FALSE
+ID_1,105,105,1,-,G,A,mismatch,4,532,1,FALSE,FALSE,FALSE
+ID_2,5,17,13,-,"","",deletion,1,845,3,FALSE,TRUE,FALSE
+ID_2,-4,4,9,-,"","",deletion,2,865,2,FALSE,TRUE,FALSE
+ID_2,-9,-5,5,-,"","",deletion,3,885,1,FALSE,TRUE,FALSE
+ID_2,5,17,13,+,"","",deletion,1,845,3,FALSE,TRUE,TRUE
+ID_2,-4,4,9,+,"","",deletion,2,865,2,FALSE,TRUE,TRUE
+ID_2,-9,-5,5,+,"","",deletion,3,885,1,FALSE,TRUE,TRUE
+ID_3,105,105,1,+,"",T,insertion,1,819,5,FALSE,FALSE,TRUE
+ID_3,8,23,16,+,"",CCCCCCCCCCCCCCCC,insertion,3,860,1,FALSE,TRUE,TRUE
+ID_3,0,17,18,+,"","",deletion,1,819,5,FALSE,TRUE,TRUE
+ID_3,-3,2,6,+,"","",deletion,2,885,2,FALSE,TRUE,TRUE
+ID_3,15,20,6,+,"","",deletion,2,885,2,FALSE,TRUE,TRUE
+ID_3,-40,-24,17,+,"","",deletion,3,860,1,FALSE,FALSE,TRUE
+ID_3,101,101,1,+,G,T,mismatch,1,819,5,FALSE,FALSE,TRUE
+ID_3,102,102,1,+,C,T,mismatch,1,819,5,FALSE,FALSE,TRUE
+ID_3,103,103,1,+,C,T,mismatch,1,819,5,FALSE,FALSE,TRUE
+ID_3,104,104,1,+,A,T,mismatch,1,819,5,FALSE,FALSE,TRUE
+ID_3,105,105,1,-,"",T,insertion,1,819,5,FALSE,FALSE,FALSE
+ID_3,8,23,16,-,"",CCCCCCCCCCCCCCCC,insertion,3,860,1,FALSE,TRUE,FALSE
+ID_3,0,17,18,-,"","",deletion,1,819,5,FALSE,TRUE,FALSE
+ID_3,-3,2,6,-,"","",deletion,2,885,2,FALSE,TRUE,FALSE
+ID_3,15,20,6,-,"","",deletion,2,885,2,FALSE,TRUE,FALSE
+ID_3,-40,-24,17,-,"","",deletion,3,860,1,FALSE,FALSE,FALSE
+ID_3,101,101,1,-,G,T,mismatch,1,819,5,FALSE,FALSE,FALSE
+ID_3,102,102,1,-,C,T,mismatch,1,819,5,FALSE,FALSE,FALSE
+ID_3,103,103,1,-,C,T,mismatch,1,819,5,FALSE,FALSE,FALSE
+ID_3,104,104,1,-,A,T,mismatch,1,819,5,FALSE,FALSE,FALSE
+ID_4,14,21,8,+,"",GGGGGGGG,insertion,2,767,2,FALSE,TRUE,TRUE
+ID_4,5,22,18,+,"",ACCACACGTGCATCGTAC,insertion,3,833,1,FALSE,TRUE,TRUE
+ID_4,-67,-36,32,+,"","",deletion,1,497,4,FALSE,FALSE,TRUE
+ID_4,-13,-6,8,+,"","",deletion,1,497,4,FALSE,FALSE,FALSE
+ID_4,10,11,2,+,"","",deletion,1,497,4,FALSE,TRUE,TRUE
+ID_4,43,62,20,+,"","",deletion,1,497,4,FALSE,FALSE,TRUE
+ID_4,-68,-42,27,+,"","",deletion,2,767,2,FALSE,FALSE,TRUE
+ID_4,-52,-41,12,+,"","",deletion,3,833,1,FALSE,FALSE,TRUE
+ID_4,-2,-2,1,+,C,A,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,0,0,1,+,G,C,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,41,41,1,+,C,G,mismatch,1,497,4,FALSE,FALSE,TRUE
+ID_4,55,55,1,+,T,A,mismatch,2,767,2,FALSE,FALSE,TRUE
+ID_4,63,63,1,+,A,T,mismatch,2,767,2,FALSE,FALSE,TRUE
+ID_4,58,58,1,+,G,C,mismatch,3,833,1,FALSE,FALSE,TRUE
+ID_4,60,60,1,+,A,T,mismatch,3,833,1,FALSE,FALSE,TRUE
+ID_4,63,63,1,+,A,G,mismatch,3,833,1,FALSE,FALSE,TRUE
+ID_4,2,2,1,+,C,G,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,3,3,1,+,C,A,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,8,8,1,+,A,T,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,9,9,1,+,A,G,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,12,22,11,-,"",ACTGACTGCTG,insertion,1,626,4,FALSE,TRUE,TRUE
+ID_4,14,21,8,-,"",GGGGGGGG,insertion,2,767,2,FALSE,TRUE,FALSE
+ID_4,5,22,18,-,"",ACCACACGTGCATCGTAC,insertion,3,824,1,FALSE,TRUE,FALSE
+ID_4,-67,-36,32,-,"","",deletion,1,626,4,FALSE,FALSE,FALSE
+ID_4,43,62,20,-,"","",deletion,1,626,4,FALSE,FALSE,FALSE
+ID_4,-68,-42,27,-,"","",deletion,2,767,2,FALSE,FALSE,FALSE
+ID_4,-52,-41,12,-,"","",deletion,3,824,1,FALSE,FALSE,FALSE
+ID_4,41,41,1,-,C,G,mismatch,1,626,4,FALSE,FALSE,FALSE
+ID_4,55,55,1,-,T,A,mismatch,2,767,2,FALSE,FALSE,FALSE
+ID_4,63,63,1,-,A,T,mismatch,2,767,2,FALSE,FALSE,FALSE
+ID_4,58,58,1,-,G,C,mismatch,3,824,1,FALSE,FALSE,FALSE
+ID_4,60,60,1,-,A,T,mismatch,3,824,1,FALSE,FALSE,FALSE
+ID_4,63,63,1,-,A,G,mismatch,3,824,1,FALSE,FALSE,FALSE
+ID_5,17,17,1,+,G,A,mismatch,2,961,2,TRUE,TRUE,TRUE
+ID_5,17,17,1,-,G,A,mismatch,2,961,2,TRUE,TRUE,FALSE
diff -r 000000000000 -r 71adaaace336 test-data/events_filtered_shifted_normalized.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/events_filtered_shifted_normalized.csv Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,84 @@
+seqnames,start,end,width,strand,originally,replacement,type,read_id,score,counts,readType,overlaps,consensus
+ID_3,-40,-24,17,+,"","",deletion,3,860,1,FALSE,FALSE,TRUE
+ID_3,-40,-24,17,-,"","",deletion,3,860,1,FALSE,FALSE,FALSE
+ID_1,-35,-35,1,+,A,G,mismatch,1,597,3,FALSE,FALSE,TRUE
+ID_1,-35,-35,1,+,A,G,mismatch,2,557,2,FALSE,FALSE,TRUE
+ID_1,-35,-35,1,+,A,G,mismatch,4,532,1,FALSE,FALSE,TRUE
+ID_1,-35,-35,1,-,A,G,mismatch,1,597,3,FALSE,FALSE,FALSE
+ID_1,-35,-35,1,-,A,G,mismatch,2,557,2,FALSE,FALSE,FALSE
+ID_1,-35,-35,1,-,A,G,mismatch,4,532,1,FALSE,FALSE,FALSE
+ID_1,-32,51,84,+,"","",deletion,4,532,1,FALSE,TRUE,TRUE
+ID_1,-32,51,84,-,"","",deletion,4,532,1,FALSE,TRUE,FALSE
+ID_1,-28,45,74,+,"","",deletion,2,557,2,FALSE,TRUE,TRUE
+ID_1,-28,45,74,-,"","",deletion,2,557,2,FALSE,TRUE,FALSE
+ID_1,-24,41,66,+,"","",deletion,1,597,3,FALSE,TRUE,TRUE
+ID_1,-24,41,66,-,"","",deletion,1,597,3,FALSE,TRUE,FALSE
+ID_2,-9,-5,5,-,"","",deletion,3,885,1,FALSE,TRUE,FALSE
+ID_2,-9,-5,5,+,"","",deletion,3,885,1,FALSE,TRUE,TRUE
+ID_2,-4,4,9,-,"","",deletion,2,865,2,FALSE,TRUE,FALSE
+ID_2,-4,4,9,+,"","",deletion,2,865,2,FALSE,TRUE,TRUE
+ID_3,-3,2,6,+,"","",deletion,2,885,2,FALSE,TRUE,TRUE
+ID_3,-3,2,6,-,"","",deletion,2,885,2,FALSE,TRUE,FALSE
+ID_3,0,17,18,+,"","",deletion,1,819,5,FALSE,TRUE,TRUE
+ID_3,0,17,18,-,"","",deletion,1,819,5,FALSE,TRUE,FALSE
+ID_2,5,17,13,-,"","",deletion,1,845,3,FALSE,TRUE,FALSE
+ID_2,5,17,13,+,"","",deletion,1,845,3,FALSE,TRUE,TRUE
+ID_3,8,23,16,+,"",CCCCCCCCCCCCCCCC,insertion,3,860,1,FALSE,TRUE,TRUE
+ID_3,8,23,16,-,"",CCCCCCCCCCCCCCCC,insertion,3,860,1,FALSE,TRUE,FALSE
+ID_3,15,20,6,+,"","",deletion,2,885,2,FALSE,TRUE,TRUE
+ID_3,15,20,6,-,"","",deletion,2,885,2,FALSE,TRUE,FALSE
+ID_5,17,17,1,+,G,A,mismatch,2,961,2,TRUE,TRUE,TRUE
+ID_5,17,17,1,-,G,A,mismatch,2,961,2,TRUE,TRUE,FALSE
+ID_1,42,61,20,+,"",AAAAAAAAAAAAAAAAAAAA,insertion,1,597,3,FALSE,FALSE,TRUE
+ID_1,42,61,20,-,"",AAAAAAAAAAAAAAAAAAAA,insertion,1,597,3,FALSE,FALSE,FALSE
+ID_1,46,65,20,+,"",AAAAAAAAAAAAAAAAAAAA,insertion,2,557,2,FALSE,FALSE,TRUE
+ID_1,46,65,20,-,"",AAAAAAAAAAAAAAAAAAAA,insertion,2,557,2,FALSE,FALSE,FALSE
+ID_1,97,97,1,+,T,A,mismatch,1,597,3,FALSE,FALSE,TRUE
+ID_1,97,97,1,+,T,A,mismatch,2,557,2,FALSE,FALSE,TRUE
+ID_1,97,97,1,-,T,A,mismatch,1,597,3,FALSE,FALSE,FALSE
+ID_1,97,97,1,-,T,A,mismatch,2,557,2,FALSE,FALSE,FALSE
+ID_3,101,101,1,+,G,T,mismatch,1,819,5,FALSE,FALSE,TRUE
+ID_3,101,101,1,-,G,T,mismatch,1,819,5,FALSE,FALSE,FALSE
+ID_3,102,102,1,+,C,T,mismatch,1,819,5,FALSE,FALSE,TRUE
+ID_3,102,102,1,-,C,T,mismatch,1,819,5,FALSE,FALSE,FALSE
+ID_3,103,103,1,+,C,T,mismatch,1,819,5,FALSE,FALSE,TRUE
+ID_3,103,103,1,-,C,T,mismatch,1,819,5,FALSE,FALSE,FALSE
+ID_3,104,104,1,+,A,T,mismatch,1,819,5,FALSE,FALSE,TRUE
+ID_3,104,104,1,-,A,T,mismatch,1,819,5,FALSE,FALSE,FALSE
+ID_3,105,105,1,+,"",T,insertion,1,819,5,FALSE,FALSE,TRUE
+ID_3,105,105,1,-,"",T,insertion,1,819,5,FALSE,FALSE,FALSE
+ID_1,105,105,1,+,G,A,mismatch,4,532,1,FALSE,FALSE,TRUE
+ID_1,105,105,1,-,G,A,mismatch,4,532,1,FALSE,FALSE,FALSE
+ID_4,-68,-42,27,+,"","",deletion,2,767,2,FALSE,FALSE,TRUE
+ID_4,-68,-42,27,-,"","",deletion,2,767,2,FALSE,FALSE,FALSE
+ID_4,-67,-36,32,+,"","",deletion,1,497,4,FALSE,FALSE,TRUE
+ID_4,-67,-36,32,-,"","",deletion,1,626,4,FALSE,FALSE,FALSE
+ID_4,-52,-41,12,+,"","",deletion,3,833,1,FALSE,FALSE,TRUE
+ID_4,-52,-41,12,-,"","",deletion,3,824,1,FALSE,FALSE,FALSE
+ID_4,-13,-6,8,+,"","",deletion,1,497,4,FALSE,FALSE,FALSE
+ID_4,-2,-2,1,+,C,A,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,0,0,1,+,G,C,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,2,2,1,+,C,G,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,3,3,1,+,C,A,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,5,22,18,+,"",ACCACACGTGCATCGTAC,insertion,3,833,1,FALSE,TRUE,TRUE
+ID_4,5,22,18,-,"",ACCACACGTGCATCGTAC,insertion,3,824,1,FALSE,TRUE,FALSE
+ID_4,8,8,1,+,A,T,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,9,9,1,+,A,G,mismatch,1,497,4,FALSE,TRUE,TRUE
+ID_4,10,11,2,+,"","",deletion,1,497,4,FALSE,TRUE,TRUE
+ID_4,12,22,11,-,"",ACTGACTGCTG,insertion,1,626,4,FALSE,TRUE,TRUE
+ID_4,14,21,8,+,"",GGGGGGGG,insertion,2,767,2,FALSE,TRUE,TRUE
+ID_4,14,21,8,-,"",GGGGGGGG,insertion,2,767,2,FALSE,TRUE,FALSE
+ID_4,41,41,1,+,C,G,mismatch,1,497,4,FALSE,FALSE,TRUE
+ID_4,41,41,1,-,C,G,mismatch,1,626,4,FALSE,FALSE,FALSE
+ID_4,43,62,20,+,"","",deletion,1,497,4,FALSE,FALSE,TRUE
+ID_4,43,62,20,-,"","",deletion,1,626,4,FALSE,FALSE,FALSE
+ID_4,55,55,1,+,T,A,mismatch,2,767,2,FALSE,FALSE,TRUE
+ID_4,55,55,1,-,T,A,mismatch,2,767,2,FALSE,FALSE,FALSE
+ID_4,58,58,1,+,G,C,mismatch,3,833,1,FALSE,FALSE,TRUE
+ID_4,58,58,1,-,G,C,mismatch,3,824,1,FALSE,FALSE,FALSE
+ID_4,60,60,1,+,A,T,mismatch,3,833,1,FALSE,FALSE,TRUE
+ID_4,60,60,1,-,A,T,mismatch,3,824,1,FALSE,FALSE,FALSE
+ID_4,63,63,1,+,A,G,mismatch,3,833,1,FALSE,FALSE,TRUE
+ID_4,63,63,1,-,A,G,mismatch,3,824,1,FALSE,FALSE,FALSE
+ID_4,63,63,1,+,A,T,mismatch,2,767,2,FALSE,FALSE,TRUE
+ID_4,63,63,1,-,A,T,mismatch,2,767,2,FALSE,FALSE,FALSE
diff -r 000000000000 -r 71adaaace336 test-data/output_html.html
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_html.html Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,497 @@
+
+
+
+
+
+
+
+
+
+
+
+
+
+index.knit
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+title: ‘Summary Read Report’
+
+
+author: ‘ampliCan’
+
+
+date: ‘17 September 2021’
+
+
+output:
+
+
+html_document:
+
+
+toc: true
+
+
+theme: paper
+
+
+toc_float: true
+
+
+number_sections: true
+
+
+params:
+
+
+barcode_summary: “/tmp/tmp4obcv1no/job_working_directory/000/6/working/output_folder/barcode_reads_filters.csv”
+
+
+config_summary: “/tmp/tmp4obcv1no/job_working_directory/000/6/working/output_folder/config_summary.csv”
+
+
+links: “1. Report by id
+
+
+2. Report by barcode
+
+
+3. Report by group
+
+
+4. Report by guide
+
+
+5. Report by amplicon ”
+
+
+
+
+
+
+
Explanation of variables
+
+
Experiment Count - how many IDs belongs to this barcode
+Read Count - how many reads belongs to this barcode
+Bad Base Quality - how many reads had base quality worse than specified (default is 0)
+Bad Average Quality - how many reads had average base quality worse than specified (default is 0)
+Bad Alphabet - how many reads had alphabet with bases other than A, C, G, T
+Filtered Read Count - how many reads were left after filtering
+Unique Reads - how many reads (forward and reverse together) for this barcode is unique
+Assigned Reads/Unassigned Reads - how many reads have been assigned/not assigned to any of the experiments
+
+
+
+
Total reads
+
+
+
Read Quality
+
+
+
+
Read assignment
+
+
+
+
Edits
+
+
+
+
+
+
Reads by barcode
+
+
+
+
+
+
+
+
Summary Table
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+barcode_1
+2
+20
+0
+0
+3
+17
+10
+3
+7
+
+
+barcode_2
+3
+21
+0
+0
+0
+21
+9
+0
+9
+
+
+
+
Table 1. Reads distributed for each barcode
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff -r 000000000000 -r 71adaaace336 test-data/raw_events.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/raw_events.csv Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,95 @@
+seqnames,start,end,width,strand,originally,replacement,type,read_id,score,counts,readType
+ID_1,108,127,20,+,"",AAAAAAAAAAAAAAAAAAAA,insertion,1,597,3,FALSE
+ID_1,112,131,20,+,"",AAAAAAAAAAAAAAAAAAAA,insertion,2,557,2,FALSE
+ID_1,42,107,66,+,"","",deletion,1,597,3,FALSE
+ID_1,38,111,74,+,"","",deletion,2,557,2,FALSE
+ID_1,24,173,150,+,"","",deletion,3,193,1,FALSE
+ID_1,34,117,84,+,"","",deletion,4,532,1,FALSE
+ID_1,31,31,1,+,A,G,mismatch,1,597,3,FALSE
+ID_1,163,163,1,+,T,A,mismatch,1,597,3,FALSE
+ID_1,31,31,1,+,A,G,mismatch,2,557,2,FALSE
+ID_1,163,163,1,+,T,A,mismatch,2,557,2,FALSE
+ID_1,23,23,1,+,T,G,mismatch,3,193,1,FALSE
+ID_1,31,31,1,+,A,G,mismatch,4,532,1,FALSE
+ID_1,171,171,1,+,G,A,mismatch,4,532,1,FALSE
+ID_1,176,176,1,+,A,T,mismatch,3,193,1,FALSE
+ID_1,177,177,1,+,G,C,mismatch,3,193,1,FALSE
+ID_1,108,127,20,-,"",AAAAAAAAAAAAAAAAAAAA,insertion,1,597,3,FALSE
+ID_1,112,131,20,-,"",AAAAAAAAAAAAAAAAAAAA,insertion,2,557,2,FALSE
+ID_1,42,107,66,-,"","",deletion,1,597,3,FALSE
+ID_1,38,111,74,-,"","",deletion,2,557,2,FALSE
+ID_1,24,173,150,-,"","",deletion,3,193,1,FALSE
+ID_1,34,117,84,-,"","",deletion,4,532,1,FALSE
+ID_1,31,31,1,-,A,G,mismatch,1,597,3,FALSE
+ID_1,163,163,1,-,T,A,mismatch,1,597,3,FALSE
+ID_1,31,31,1,-,A,G,mismatch,2,557,2,FALSE
+ID_1,163,163,1,-,T,A,mismatch,2,557,2,FALSE
+ID_1,23,23,1,-,T,G,mismatch,3,193,1,FALSE
+ID_1,31,31,1,-,A,G,mismatch,4,532,1,FALSE
+ID_1,171,171,1,-,G,A,mismatch,4,532,1,FALSE
+ID_1,176,176,1,-,A,T,mismatch,3,193,1,FALSE
+ID_1,177,177,1,-,G,C,mismatch,3,193,1,FALSE
+ID_2,115,127,13,-,"","",deletion,1,845,3,FALSE
+ID_2,106,114,9,-,"","",deletion,2,865,2,FALSE
+ID_2,101,105,5,-,"","",deletion,3,885,1,FALSE
+ID_2,115,127,13,+,"","",deletion,1,845,3,FALSE
+ID_2,106,114,9,+,"","",deletion,2,865,2,FALSE
+ID_2,101,105,5,+,"","",deletion,3,885,1,FALSE
+ID_3,171,171,1,+,"",T,insertion,1,819,5,FALSE
+ID_3,74,89,16,+,"",CCCCCCCCCCCCCCCC,insertion,3,860,1,FALSE
+ID_3,66,83,18,+,"","",deletion,1,819,5,FALSE
+ID_3,63,68,6,+,"","",deletion,2,885,2,FALSE
+ID_3,81,86,6,+,"","",deletion,2,885,2,FALSE
+ID_3,26,42,17,+,"","",deletion,3,860,1,FALSE
+ID_3,21,176,156,+,"","",deletion,4,190,1,FALSE
+ID_3,167,167,1,+,G,T,mismatch,1,819,5,FALSE
+ID_3,168,168,1,+,C,T,mismatch,1,819,5,FALSE
+ID_3,169,169,1,+,C,T,mismatch,1,819,5,FALSE
+ID_3,170,170,1,+,A,T,mismatch,1,819,5,FALSE
+ID_3,171,171,1,-,"",T,insertion,1,819,5,FALSE
+ID_3,74,89,16,-,"",CCCCCCCCCCCCCCCC,insertion,3,860,1,FALSE
+ID_3,66,83,18,-,"","",deletion,1,819,5,FALSE
+ID_3,63,68,6,-,"","",deletion,2,885,2,FALSE
+ID_3,81,86,6,-,"","",deletion,2,885,2,FALSE
+ID_3,26,42,17,-,"","",deletion,3,860,1,FALSE
+ID_3,21,176,156,-,"","",deletion,4,190,1,FALSE
+ID_3,167,167,1,-,G,T,mismatch,1,819,5,FALSE
+ID_3,168,168,1,-,C,T,mismatch,1,819,5,FALSE
+ID_3,169,169,1,-,C,T,mismatch,1,819,5,FALSE
+ID_3,170,170,1,-,A,T,mismatch,1,819,5,FALSE
+ID_4,118,125,8,+,"",GGGGGGGG,insertion,2,767,2,FALSE
+ID_4,109,126,18,+,"",ACCACACGTGCATCGTAC,insertion,3,833,1,FALSE
+ID_4,37,68,32,+,"","",deletion,1,497,4,FALSE
+ID_4,91,98,8,+,"","",deletion,1,497,4,FALSE
+ID_4,114,115,2,+,"","",deletion,1,497,4,FALSE
+ID_4,147,166,20,+,"","",deletion,1,497,4,FALSE
+ID_4,36,62,27,+,"","",deletion,2,767,2,FALSE
+ID_4,52,63,12,+,"","",deletion,3,833,1,FALSE
+ID_4,102,102,1,+,C,A,mismatch,1,497,4,FALSE
+ID_4,104,104,1,+,G,C,mismatch,1,497,4,FALSE
+ID_4,145,145,1,+,C,G,mismatch,1,497,4,FALSE
+ID_4,159,159,1,+,T,A,mismatch,2,767,2,FALSE
+ID_4,167,167,1,+,A,T,mismatch,2,767,2,FALSE
+ID_4,162,162,1,+,G,C,mismatch,3,833,1,FALSE
+ID_4,164,164,1,+,A,T,mismatch,3,833,1,FALSE
+ID_4,167,167,1,+,A,G,mismatch,3,833,1,FALSE
+ID_4,106,106,1,+,C,G,mismatch,1,497,4,FALSE
+ID_4,107,107,1,+,C,A,mismatch,1,497,4,FALSE
+ID_4,112,112,1,+,A,T,mismatch,1,497,4,FALSE
+ID_4,113,113,1,+,A,G,mismatch,1,497,4,FALSE
+ID_4,116,126,11,-,"",ACTGACTGCTG,insertion,1,626,4,FALSE
+ID_4,118,125,8,-,"",GGGGGGGG,insertion,2,767,2,FALSE
+ID_4,109,126,18,-,"",ACCACACGTGCATCGTAC,insertion,3,824,1,FALSE
+ID_4,37,68,32,-,"","",deletion,1,626,4,FALSE
+ID_4,147,166,20,-,"","",deletion,1,626,4,FALSE
+ID_4,36,62,27,-,"","",deletion,2,767,2,FALSE
+ID_4,52,63,12,-,"","",deletion,3,824,1,FALSE
+ID_4,145,145,1,-,C,G,mismatch,1,626,4,FALSE
+ID_4,159,159,1,-,T,A,mismatch,2,767,2,FALSE
+ID_4,167,167,1,-,A,T,mismatch,2,767,2,FALSE
+ID_4,1,1,1,-,G,A,mismatch,3,824,1,FALSE
+ID_4,162,162,1,-,G,C,mismatch,3,824,1,FALSE
+ID_4,164,164,1,-,A,T,mismatch,3,824,1,FALSE
+ID_4,167,167,1,-,A,G,mismatch,3,824,1,FALSE
+ID_5,121,121,1,+,G,A,mismatch,2,961,2,TRUE
+ID_5,121,121,1,-,G,A,mismatch,2,961,2,TRUE
diff -r 000000000000 -r 71adaaace336 test-data/unassigned_reads.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/unassigned_reads.csv Wed Sep 22 21:01:40 2021 +0000
@@ -0,0 +1,4 @@
+Forward,Reverse,Total,BarcodeFrequency,Asigned,fwdPrInReadPos,forwardFound,rvePrInReadPos,reverseFound,Barcode
+AAATACTGTCTTGTGACCAAACCTTCTTAAGGTGCTGTTTTGATGATAAACTTTATTGTGCTTTTGTAGTTGTGCCCCTTGTGTTGGCAGAGGGTCAGCAGACCAGTAAGTCTTCTCAATTTCTTTTATTTATGTATATGTAGTGATAAAA,TGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCAGTGACCTTCCCTGACCTTCTTCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTCAGATATTTTTCATTTAGCCGTCAGCTT,2,0.117647058823529,FALSE,14,TRUE,,FALSE,barcode_1
+AAGCTGACGGCTAAATGAAAAATATCTGAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGAAGAAGGTCAGGGAAGGTCACTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCA,AAGCTGACGGCTAAATGAAAAATATCTGAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGAAGAAGGTCAGGGAAGGTCACTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCA,1,0.0588235294117647,FALSE,,FALSE,,FALSE,barcode_1
+AAGCTGACGGCTAAATGAAAAATATCTGAAACATCTGTTCCAGGTGCTGCGTATGCCAGGGCAGAGAAGAAGGTCAGGGAAGGTCACTGGAGGTCACTGGGATACCCTTTCTTCCCACACCAATGGGGAAAGGAGTCCTGCCAGATGACCA,TGGTCATCTGGCAGGACTCCTTTCCCCATTGGTGTGGGAAGAAAGGGTATCCCAGTGACCTCCAGTGACCTTCCCTGACCTTCTTCTCTGCCCTGGCATACGCAGCACCTGGAACAGATGTTTCAGATATTTTTCATTTAGCCGTCAGCTT,1,0.0588235294117647,FALSE,,FALSE,,FALSE,barcode_1