Repository 'seq2hla'
hg clone https://toolshed.g2.bx.psu.edu/repos/jjohnson/seq2hla

Changeset 0:262d5334c786 (2016-12-22)
Next changeset 1:6ecaa71a5aa3 (2019-10-01)
Commit message:
planemo upload for repository https://github.com/jj-umn/galaxytools/tree/master/seq2hla commit fb1e8b800e7dcd411c7281d1ed05e192fba14fcc-dirty
added:
seq2hla.xml
test-data/reads1.fastq
test-data/reads2.fastq
b
diff -r 000000000000 -r 262d5334c786 seq2hla.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/seq2hla.xml Thu Dec 22 09:15:31 2016 -0500
[
@@ -0,0 +1,107 @@
+<tool id="seq2hla" name="seq2HLA" version="0.1.0">
+    <description>HLA genotype and expression from RNA-seq</description>
+    <!-- Pinned package dependencies: seq2HLA (the program run in <command>) and bowtie
+         (the help text below says seq2HLA aligns reads against a bowtie index). -->
+    <requirements>
+        <requirement type="package" version="2.2">seq2HLA</requirement>
+        <requirement type="package" version="1.0.0">bowtie</requirement>
+    </requirements>
+    <!-- Error detection: any exit status of 1 or higher is treated as a fatal job error. -->
+    <stdio>
+        <exit_code range="1:" level="fatal"/>
+    </stdio>
+    <!--
+        Command outline:
+          1. Run seq2HLA on the two FASTQ inputs. The 3' trim option is passed only when the
+             "trim" parameter has a value; the thread count comes from GALAXY_SLOTS
+             (default 1). Standard output is appended to the log dataset.
+          2. Copy the ClassI 2-digit and 4-digit genotype files, the ClassII 4-digit genotype
+             file and the ambiguity report to their Galaxy output datasets.
+          3. Rewrite each "<locus>: <value> ..." line of the ClassI and ClassII expression
+             files as "<locus><TAB><value>" under a "#Locus<TAB>RPKM" header. sed joins the
+             two fields with "_" and tr then turns every "_" (including the one in the
+             header) into a tab.
+        Every step is chained with "&&", so a failing step stops the steps after it.
+    -->
+    <command><![CDATA[
+        seq2HLA --runName="$run_name" -1 "$fastq_input1" -2 "$fastq_input2" 
+        #if str($trim) != '':
+            --trim3=$trim
+        #end if
+        -p \${GALAXY_SLOTS:-1} >> "$seq2hla_log"
+        && cp -p "${run_name}-ClassI.HLAgenotype2digits" "${c1_genotype2digits}"
+        && cp -p "${run_name}-ClassI.HLAgenotype4digits" "${c1_genotype4digits}"
+        && echo "#Locus_RPKM" | cat - "${run_name}-ClassI.expression" | sed 's/^\(.*\): \([0-9.]*\).*$/\1_\2/' | tr '_' '\t' > "${c1_expression}"
+        && cp -p "${run_name}-ClassII.HLAgenotype4digits" "${c2_genotype4digits}"
+        && echo "#Locus_RPKM" | cat - "${run_name}-ClassII.expression" | sed 's/^\(.*\): \([0-9.]*\).*$/\1_\2/' | tr '_' '\t' > "${c2_expression}"
+        && cp -p "${run_name}.ambiguity" "${ambiguity}"
+    ]]></command>
+    <inputs>
+        <!-- Prefix passed to seq2HLA as the run name; the command builds the names of the
+             result files it copies from this value, so the allowed characters are restricted. -->
+        <param name="run_name" type="text" value="sample1" label="Name prefix for this analysis">
+            <!-- The message lists every character the pattern accepts, including "+". -->
+            <validator type="regex" message="Use only letters, digits, and the characters _ - + .">^[A-Za-z0-9_\-+.]+$</validator>
+        </param>
+        <!-- Paired-end reads: forward reads first, reverse reads second. -->
+        <param name="fastq_input1" type="data" format="fastqsanger" label="Select first set of reads" help="Specify dataset with forward reads"/>
+        <param name="fastq_input2" type="data" format="fastqsanger" label="Select second set of reads" help="Specify dataset with reverse reads"/>
+        <!-- Optional; when left empty the command omits the trim option entirely. -->
+        <param name="trim" type="integer" value="" min="0" optional="true" label="Trim bases from 3 prime"
+               help="trim this many bases from the low-quality end of each read" />
+    </inputs>
+    <!-- One dataset per file the command copies or writes. Output names must be unique:
+         the ClassII expression output was previously declared twice, and the duplicate
+         declaration has been removed. -->
+    <outputs>
+        <data format="txt" name="seq2hla_log" label="${tool.name} on ${on_string}: ${run_name} logfile"/>
+        <data format="tabular" name="c1_genotype2digits" label="${tool.name} on ${on_string}: ${run_name}-ClassI.HLAgenotype2digits"/>
+        <data format="tabular" name="c1_genotype4digits" label="${tool.name} on ${on_string}: ${run_name}-ClassI.HLAgenotype4digits"/>
+        <data format="tabular" name="c2_genotype4digits" label="${tool.name} on ${on_string}: ${run_name}-ClassII.HLAgenotype4digits"/>
+        <data format="tabular" name="c1_expression" label="${tool.name} on ${on_string}: ${run_name}-ClassI.expression"/>
+        <data format="tabular" name="c2_expression" label="${tool.name} on ${on_string}: ${run_name}-ClassII.expression"/>
+        <data format="txt" name="ambiguity" label="${tool.name} on ${on_string}: ${run_name}.ambiguity"/>
+    </outputs>
+    <tests>
+        <!-- Runs the tool on the bundled paired FASTQ files with no trimming and checks that
+             the ClassI 4-digit genotype output contains the text A*24:02. -->
+        <test>
+            <param name="run_name" value="test"/>
+            <param name="fastq_input1" value="reads1.fastq" ftype="fastqsanger"/>
+            <param name="fastq_input2" value="reads2.fastq" ftype="fastqsanger"/>
+            <output name="c1_genotype4digits">
+                <assert_contents>
+                    <has_text text="A*24:02"/>
+                </assert_contents>
+            </output>
+        </test>
+    </tests>
+    <help><![CDATA[
+**seq2HLA**  *HLA typing from RNA-Seq sequence reads*
+
+Release: 2.2
+
+seq2HLA_ is an in-silico method, written in Python and R, which takes standard RNA-Seq sequence reads in fastq format
+as input, uses a bowtie index comprising all HLA alleles and outputs the most likely HLA class I and class II genotypes (in 4 digit resolution),
+a p-value for each call, and the expression of each class.
+
+**Inputs** 
+
+    Paired read fastq files with illumina style IDs.  
+
+
+**Outputs** 
+
+    1. <prefix>-ClassI.HLAgenotype2digits => 2 digit result of Class I
+    2. <prefix>-ClassII.HLAgenotype2digits => 2 digit result of Class II (not collected as a Galaxy dataset by this wrapper)
+    3. <prefix>-ClassI.HLAgenotype4digits => 4 digit result of Class I
+    4. <prefix>-ClassII.HLAgenotype4digits => 4 digit result of Class II
+    5. <prefix>.ambiguity => reports typing ambiguities (more than one solution for an allele possible)
+    6. <prefix>-ClassI.expression => expression of Class I alleles
+    7. <prefix>-ClassII.expression => expression of Class II alleles
+
+
+    ClassI.HLAgenotype4digits
+
+       =======  ========  ===========  ========  ============
+        #Locus  Allele 1  Confidence   Allele 2  Confidence
+       =======  ========  ===========  ========  ============
+        A       A*03:01   0.000510333  A*02:01'  0.0005975604
+        B       B*50:01   0.001271273  B*58:02   3.52561e-05
+        C       C*04:01   0.06362723   C*06:02   0.04725865
+       =======  ========  ===========  ========  ============
+
+
+    ClassI.expression
+
+       =======  ======
+        #Locus   RPKM
+       =======  ======
+        A        89.59
+        B       139.66
+        C       184.42
+       =======  ======
+
+
+.. _seq2HLA: https://bitbucket.org/sebastian_boegel/seq2hla
+
+    ]]></help>
+    <!-- Publication to cite when using this tool, referenced by its DOI. -->
+    <citations>
+        <citation type="doi">10.1186/gm403</citation>
+    </citations>
+</tool>
b
diff -r 000000000000 -r 262d5334c786 test-data/reads1.fastq
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/reads1.fastq Thu Dec 22 09:15:31 2016 -0500
b
b'@@ -0,0 +1,1300 @@\n+@D00635:180:CA2WAANXX:5:2306:8104:2905 1:N:0:ATTACTCG+CAGCACGT\n+CCTGTCTCCTCGTCCCAATACTCCGGCCCCTCCTGCTCTATCCACGGCGCCCGCGGCTCCATCCTCTGGCTCGCGGCGTCGCTGTCGAACCGCACGAACTGCGTGTCGTCCACGTAGCCCACGGCG\n++\n+BCCCB1FGGGGGGGGGGGGGGGEGGBGGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGBGDGDGGGGGGGGGGGEBCGG@AGBDGBGGGGGGGGBGDGGGG<@GGGEGGADG\n+@D00635:180:CA2WAANXX:5:2306:17453:9637 1:N:0:ATTACTCG+CAGGACGT\n+CGGCCCCTCCTGCTCCACCCACGGCGCCCGCGGCTCCCCTCTCGGACTCGCGGCGTCGCTGTCGAACCGCACGAACTGCGTGTCGTCCACGTAGCCCAATGCGATGAAGTGGGGCTCCCCGCGGCC\n++\n+AAB@AE=FGB?FFGGGGGFGGGG<EGG<EGGG>GGGDGDGDGGGEGGGE0>/CG<CCGGGGBGGGEBDCCCCECAG<EDGG/CC/DGGDG?D/CDGE:.;/9E..8//7EB=GGG@E6@B>C;..8\n+@D00635:180:CA2WAANXX:5:2306:11733:15515 1:N:0:ATTACTCG+CAGGACGT\n+GCCTCGTGGTCAGAGACGGGATGGTGGGTCACGTGTGTCTTTGGGTGTTCCGCGCGCTGCAGCGTCTCCTTCCCATTCTTCAGGTATCTGCGGAGCCACTCCACGCACAGGCCCTCCAGGTAGGCT\n++\n+BABBCDGGGGGGFFGGGGGGGGGGGGDGGGGGGGGGG:FGGGGCBFGBBGGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGEGGGGEGGA?GGBEGGGGGGGGGGDEGG<BEGEEDDGGGG/\n+@D00635:180:CA2WAANXX:5:2306:13187:20542 1:N:0:ATTACTCG+CAGGACGT\n+CAGGTTTCTGCGGAGCCACTCCACGCACAGGCCCTCCAGGTAGGCTCTCAGCTGCTCCGCCTCACGGGCCGCCTCCCACTTGCGCTGGGTGATCTGAGCCGCCGTGTCCGCGGCGGTCCAGGAGCG\n++\n+CCCCC>FFGGGGGGGGGGGGGGCGGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGEGGGGGGGGGGGGGGGGGG0EGGGGGGGGGGEGG@GGGGDG>CGDBGGGGGGGCGGEGGDDEA\n+@D00635:180:CA2WAANXX:5:2306:3171:34119 1:N:0:ATTACTCG+CAGGACGG\n+CTCTGATGCTCCGCCACATGGGCCGCCTCCCACTTGCGCTTGGTGATCTGAGCCGCCATGTCCGCCGCGGTCCAAGAGCGCAGGTCCTCTTTCAGGGCGATGTAATCCTTGCCGTCGTAGGCGTAC\n++\n+CCCCC1@FGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGCEGGG@GGGGGGGGGGGGCCGGGGGGGG@GGGGGGGGGGGGGGGGGGGGGEGBGGGGGGEGAGGGGGBGGGG.C\n+@D00635:180:CA2WAANXX:5:2306:6928:43996 
1:N:0:ATTACTCG+CACGACGT\n+CTTCACTTTCCCTGTCTCCTCGTCCCAATACTCCGGCCCCTCCTGCTCTATCCACGGCGCCCGCGGCTCCATCCTCTGGCTCGCGGTGTCGCTGTCGAACCGCACGAACTGCGTGTCGTCCACGTA\n++\n+CCCCCGGGGGGGGGGGGGGFGGGGGGFEGGGGGGBGGGGGGGGFGGGGGGGGEGGD<GGGGGFGGGGGGGGGGGGGGGGGGGDGGGGGGGGGGGGGEGGGGBGGGG<DG8EGGGGGGDGGGBEGGD\n+@D00635:180:CA2WAANXX:5:2306:18514:51516 1:N:0:ATTACTCG+CAGGACGT\n+GGCGATGTAATCCTTGCCGTCGTAGGCGTACTGGTCATACCCGCGGAGGAGGCGCCCGTCGGGCCCCACGTCGCAGCCATACATCCTCTGGATGATGTGAGACCCGGCCTCGCTCTGGTTGTAGTA\n++\n+BCCCCGFGGGGGGGGGGGGGGFGGFDEGGGGGGGGEGGGGB@FGGGGGG>FGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGBGGEGGGGGGGGGGGGGGGGGG.CE=G8DC8DB6C\n+@D00635:180:CA2WAANXX:5:2306:19065:61209 1:N:0:ATTACTCG+CAGGACGG\n+GTCAAACATCATCTGGAGGGTGTGAGAACCGGCCTCGCTCTGGTTGTAGTAGCGGAGCGCGATCCGCAGGTTCTCTCGGTCAGTCTGTGAGTGGGCCTTCACTTTCCCTGTCTCCTCGTCCCAATA\n++\n+B<ABBGGGGGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGFGGGGFGGGGGGGGGGGGGGGGGGCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGDGEG@\n+@D00635:180:CA2WAANXX:5:2306:9450:74231 1:N:0:ATTACTCG+CAGGACGT\n+CACGTCGCAGCCAAACATCATCTGGAGGGTGTGAGAACCGGCCTCGCTCTGGTTGTAGTAGCGGAGCGCGATCCGCAGGTTCTCTCGGTCAGTCTGTGAGTGGGCCTTCACTTTCCCTGTCTCCTC\n++\n+=BBBBGE<E>EGGEGGBFGDGGDGG>FGGFBGBCFGEGGG@BGFG=<EF:BF1=FFGGGDFG>9EDG/EGGGGBEGGG<FEGGGGEGGGGGGG=EGGGGGG=.8@.EBG=E=@DGGGGGGEDD/9D\n+@D00635:180:CA2WAANXX:5:2306:10675:81134 1:N:0:ATTACTCG+CAGGACGT\n+GGCTCTCAGCTGCTCCGCCTCACGGGCCGCCTCCCACTTGCGCTGGGTGATCTGAGCCGCCGTGTCCGCGGCGGTCCAGGAGCGCAGATCCTCGTTCAGGGCGATGTAATCCTTGCCGTCGTAGGC\n++\n+?A?AAFGGGGFFGGG1;/FFGEGG<<EGGGGBBGGEGECFFGB<C<GGGE1=@F>F@FGG/<=EBC0CGG<>A//::0CCD<DGGDG/DDEGGGEGBEGGGGGCA?GGBGGGGGGGG@D.CGG<.6\n+@D00635:180:CA2WAANXX:5:2306:14669:88822 1:N:0:ATTACTCG+CAGGACGT\n+CCGCCATGTCCGCCGCGGTCCAAGAGCGCAGGTCCTCTTTCAGGGCGATGTAATCCTTGCCGTCGTAGGCGTACTGGTGGTACCCGCGGAGGAAGCGCCCGTCCGACCCCACGTCGCAGCCAAACA\n++\n+ABBBBGGGGGCGDGGGGGGGGEGGGGGGGGGGGGGGGGGGGGFGGGG<EGGGGGGFGGGEGDBDDGGBGGGGDGGGGFGDGGGGGGGGDD/>/:E<DGGGGGDGDDGG@BGGGGGGGGDGG<GGGD\n+@D00635:180:CA2WAANXX:5:2306:3523:97789 
1:N:0:ATTACTCG+CAGGACGG\n+CTCCGCCACACGGGCCGCCTCCCACTTGCGCTGGGTGATCTGAGCCGCCGTGTCCGCGGCGGTCCAGGAGCGCAGGTCCTCGTTCAGGGCGATGTAATCCTTGCCGTCGTAGGCGTACTGGTTATG\n++\n+ABB@BGGGG@GC/B<GBCGGDEGE@F@@1C/EEDBCBFGGGGGG11E@GGGD@@FE/E/:E;CG;E0E/CEDG;/C/C@DG?/ECGGGE/CCG>C/DGGGBED=GDGD;DB.>=C>A..CE889D/\n+@D00635:180:CA2WAANXX:5:2305:17386:6381 1:N:0:ATTACTCG+CAGGACGG\n+GTGTGTCTTTGGGGGGTCCGC'..b'GGGGGGGGGGGGGGGGGGGGGGGGGGGGDGGGGGGGGGGGGG0CCFGFGFFBFDGGG=GGGGGGGEEGCGCEBGGGGCDBEGGEGGD>GDE/CG=DGDGCGG\n+@D00635:180:CA2WAANXX:5:2111:16885:49734 1:N:0:ATTACTCG+CAGGACGT\n+CGCAGGTTCTCTCGGTCAGTCTGTGAGTGGGCCTTCACTTTCCCTGTCTCCTCGTCCCAATACTCCGGCCCCTCCTGCTCTATCCACGGCGCCCGCGGCTCCATCCTCTGGCTCGCGGCGTCGCTG\n++\n+BA@BBDGFFDCG1FGGGBFFGGGGGEGCGGDGGDGGGFGGEGE1FGCCGEEGGGGGGGEBGGGGGGGDGGBE>BGGGGGFGGGEGGGG/CDGGGGDGGD/CGGGGGGGGB=EGGGGGGGGGGG.CC\n+@D00635:180:CA2WAANXX:5:2111:14007:59060 1:N:0:ATTACTCG+CAGGACGT\n+CTTCACTTTCCCTGTCTCCTCGTCCCAATACTCCGGCCCCTCCTGCTCTATCCACGGCGCCCGCGGCTCCATCCTCTGGCTCGCGGCGTCGCTGTCGAACCGCACGAACTGCGTGTCGTCCACGTA\n++\n+CCCCCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGEGGGGGGGGGGEGGDGGEGGGGGGGFE@F@G>DGCGGGGGGG@EBGGDGGGGDGGGGGGGGGGGGGGGGGGGG\n+@D00635:180:CA2WAANXX:5:2111:15596:66739 1:N:0:ATTACTCG+CAGGACGT\n+GGCATCGCTCTGGTTGTAGTAGCGGAGCGCGATCCGCAGGTTCTCTCGGTCAGTCTGTGAGTGGGCCTTCACTTTCCCTGTCTCCTCGTCCCAATACTCCGGCCCCTCCTGCTCTATCCACGGCGC\n++\n+BBCCCFGGFGGGGGGGGGGGGGGGGGGGGFGGGGGEGGGGGGGGGGGDGGGGGGGGGGGGGGFGGBFGGGGEGGGGGGGGGGCGGGGGGGGGGGGGGF0FGGGGGGGGBDGGGGGEGGGGG.CGGG\n+@D00635:180:CA2WAANXX:5:2111:18215:76603 1:N:0:ATTACTCG+CAGGACGT\n+TGGTGATCTGAGCCGCCATGTCCGCCGCGGTCCAAGAGCGCAGGTCCTCTTTCAGGGCGATGTAATCCTTGCCGTCGTAGGCGTACTGGTGGTACCCGCGGAGGAAGCGCCCGTCCGACCCCACGT\n++\n+CBCCCGGGGCGGGGGGGGBEGGGB@BGGGGGGGGGGGGGGGGGCGGGGGGGGGGGGGGGGGGGGGEGGGGGGFEGGGGGGGGGGG@GGEEGBGGGEGGGGDAGDGGGGGGGGGGGGGGGGGDGGDD\n+@D00635:180:CA2WAANXX:5:2111:14226:83019 
1:N:0:ATTACTCG+CAGGACGT\n+CTCGCTCTGGTTGTAGTAGCCGCGCAGGTTCCGCAGGCTCTCTCGGTAAGTCTGTGTGTTGGTCTTGGAGATCTGTGTCTCCCGGTCCCAATACTCCGGCCCCTCCTGCTCTATCCATGGCGCCCG\n++\n+CCCCCGGGGGGCGGDGGFGGGFGGGFGGGGGGGGGGGGGGGEGGGGGGGGGGGGGGGGGGEGGGEGGGCFGGEGGGGGGGGGGEGEGGGGGFGGGGGGGGGDAEDGDEGGGE/CE=GG=<B.>>C>\n+@D00635:180:CA2WAANXX:5:2111:19289:88648 1:N:0:ATTACTCG+CAGGACGT\n+ATGGTCAGAGATGGGGTGGTGGGTCATATGTGTCTTGGGGGGGTCCGTGCGCTGCAGCGTCTCCTTCCCGTTCTCCAGGTATCTGCGGAGCCCGTCCACGCACGTGCCCTCCAGGTAGGCTCTCTG\n++\n+BBBBCFEGGGFGGGGGGGGGGGGEGGGGGGGGGGGGGGGGGAGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGEGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGEGGGGGEEGGEGG/\n+@D00635:180:CA2WAANXX:5:2111:6549:96971 1:N:0:ATTACTCG+CAGGACGT\n+CCGCCACATGGGCCGCCTCCCACTTGCGCTTGGTGATCTGAGCCGCCATGTCCGCCGCGGTCCAAGAGCGCAGGTCCTCTTTCAGGGCGATGTAATCCTTGCCGTCGTAGGCGTACTGGTGGTACC\n++\n+CCCCCGGGGGGGGGFFDGGGGFGGGGGGGGGGGGB@FGGGGGGGGGGGGGGGDGGGGGGGGGGGGGGGGGGGDGGGGGGGFGGGGGGGGDGGGGGGGGGGGGGGGGGGGGDGAGGGGGGGEGGEGG\n+@D00635:180:CA2WAANXX:5:2109:2641:10752 1:N:0:ATTACTCG+CAGGACGT\n+CCGCGGAGGTAGCGCCCGTCCGACCCCACGTCGCAGCCAAACATCATCTGGAGGGTGTGAGAACCGGCCTCGCTCTGGTTGTAGTAGCGGAGCGCGATCCGCAGGTTCTCTCGGTCAGTCTGTGAG\n++\n+BBBBBGGGG>@GGGDGGAEDGGGGGGGGGDGFGGGGGGGGGGGGGGGGGGGGGGGE/CC@@GGGGGGGGGGGGGGGGGGDGGGCDGGGGGGCGGGGGGGGEGDCGGGEGGGEGGGGGGGGGDDGEG\n+@D00635:180:CA2WAANXX:5:2109:15937:23271 1:N:0:ATTACTCG+CAGGACGT\n+GTACATGCTCTGGAGGGTGTGAGACCCGGCCTCGCTCTGGTTGTAGTAGCCGCGCAGGTTCCGCAGGCTCTCTCGGTAAGTCTGTGTGTTGGTCTTGGAGATCTGTGTCTCCCGGTCCCAATACTC\n++\n+CCCCCGGGEGGGEGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGGFGGEGGGGG@GGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGEGGGGGBGGGGEGGGGGG\n+@D00635:180:CA2WAANXX:5:2109:9613:28877 1:N:0:ATTACTCG+CAGGACGT\n+CCACGTCGCAGCCGTACATGCTCTGGAGGGTGTGAGACCCGGCCTCGCTCTGGTTGTAGTAGCCGCGCAGGTTCCGCAGGCTCTCTCGGTAAGTCTGTGTGTTGGTCTTGGAGATCTGTGTCTCCC\n++\n+CCCBCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGAGGGGGGGGF>FGGGGGGEFGGGGGGGGGGGGGGGGGDGCGGGEGD0CGGGGGGGGGGGGGGGGG<=EGEGEGG<EGGGGGGGGGG\n+@D00635:180:CA2WAANXX:5:2109:13098:35617 
1:N:0:ATTACTCG+CAGGACGT\n+CGGGCCGCCTCCCACTTGCGCTGGGTGATCTGAGCCGCCGTGTCCGCGGCGGTCCAGGAGCGCAGGTCCTCGTTCAGGGCGATGTAATCCTTGCCGTCGTAGGCGTACTGGTTATGCCCGCGGAGG\n++\n+BBBBBEGDGFG>FEGGEGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGBGGGEGGBECGG@D//DEG=GGGEGGGGGGGGGGGGBBGGGGGEGGGDC.9EGGGG...;E7C/CCBGGGGGGGGG\n+@D00635:180:CA2WAANXX:5:2109:3892:46389 1:N:0:ATTACTCG+CAGGACGT\n+CACGCACGTGCCCTCCAGGTAGGCTCTCTGCTGCTCCGCCACATGGGCCGCCTCCCACTTGCGCTTGGTGATCTGAGCCGCCATGTCCGCCGCGGTCCAAGAGCGCAGGTCCTCTTTCAGGGCGAT\n++\n+B?A:BGGAFGB@FGGGFEGGGGGGGGEGGGGFGG1>GBGGGGGB1B>BGGGGGGGGEGGGGGDG/>@FGG@B0CFFGEGGG<DGGFGGGAGGGGGCGGGGGBDGCG...EGDGGG=@DG=8@CGC?\n'
b
diff -r 000000000000 -r 262d5334c786 test-data/reads2.fastq
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/reads2.fastq Thu Dec 22 09:15:31 2016 -0500
b
b'@@ -0,0 +1,1300 @@\n+@D00635:180:CA2WAANXX:5:2306:8104:2905 2:N:0:ATTACTCG+CAGCACGT\n+CCTGGCCCTGACCCAGACCTGGGCAGGCTCCCACTCCATGAGGTATTTCTCCACATCCGTGTCCCGGCCCGGCCGCGGGGAGCCCCGCTTCATCGCCGTGGGCTACGTGGACGACACGCAGTTCGT\n++\n+BCCCBGGGGEEGGGDFGGGEDGBGGG/EFGGGGGGGGG1FFGGGGGGGGGGGCBFDGGDGGGGGGGGGGG<EGGGGGGGGDGGGGGGGGGGGGGGGGGAGCDGGEG?EGGGGGGG.CGG@@C/D<D\n+@D00635:180:CA2WAANXX:5:2306:17453:9637 2:N:0:ATTACTCG+CAGGACGT\n+CTCCCACTCCATGAGGTATTTCTACACCGCTGTGTCCCGGCCCGGCCGCGGGGAGCCCCACTTCATCGCAGTGGGCTACGTGGACGACACGCAGTTCGTGCGGTTCGACAGCGACGCCGCGAGTCC\n++\n+AAB@BG>EFGC>FEFGCCCDFGEGGGGGGGGGGGG>GGGGGGGGED//EB<E@B9CGGG<GFGCGCGEGB/:DDDGGEGGGGBDGGGGGBGGGGGGEDDEDDGBD<GE?EDGG.88?>?A.>DC@6\n+@D00635:180:CA2WAANXX:5:2306:11733:15515 2:N:0:ATTACTCG+CAGGACGT\n+CGTGAGGCGGAGCAGCTGAGAGCCTACCTGGAGGGCCTGTGCGTGGAGTGGCTCCGCAGATACCTGAAGAATGGGAAGGAGACGCTGCAGCGCGCGGAACACCCAAAGACACACGTGACCCACCAT\n++\n+AB<00F0FCBDGGGGGG>GEGDGGGCEBGGGBBFBBGGGGEGGGGFBGCGGGEGGGGGGGDFFGGGGFG0><F>GGEG<FFGEFGGGGGGGGGGGG;>AA<DGGGE<DGGGGGBGG.CGGGBDDG6\n+@D00635:180:CA2WAANXX:5:2306:13187:20542 2:N:0:ATTACTCG+CAGGACGT\n+GCCCTGAACGAGGATCTGCGCTCCTGGACCGCCGCGGACACGGCGGCTCAGATCACCCAGCGCAAGTGGGAGGCGGCCCGTGAGGCGGAGCAGCTGAGAGCCTACCTGGAGGGCCTGTGCGTGGAG\n++\n+CCCCCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGG;GCCDGGGGGGGGGGGGGBBGEGGGGGGGGGGGGGEGGBDGGGGGG@GBCDG.C6DGGGGG.C\n+@D00635:180:CA2WAANXX:5:2306:3171:34119 2:N:0:ATTACTCG+CAGGACGG\n+GATGTTTGGCTGCGACGTGGGGTCGGACGGGCGCTTCCTCCGCGGGTACCACCAGTACGCCTACGACGGCAAGGATTACATCGCCCTGAAAGAGGACCTGCGCTCTTGGACCGCGGCGGACATGGC\n++\n+BBBBBGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGG<DGGEGGGGGEDDGGGGGGGGGGGGGDEGDGGGGGGGGGGG0DGGGGGGGG@BDGDDGEGGGGGGGGGGGGG/7EBG@GGGGD>CD@EED\n+@D00635:180:CA2WAANXX:5:2306:6928:43996 
2:N:0:ATTACTCG+CACGACGT\n+GGTATTTCTCCACATCCGTGTCCCGGCCCGGCCGCGGGGAGCCCCGCTTCATCGCCGTGGGCTACGTGGACGACACGCAGTTCGTGCGGTTCGACAGCGACACCGCGAGCCAGAGGATGGAGCCGC\n++\n+BBBBBGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGDDGGGGGGGGGGGGGGGGDGBGGGGGGGGGGGGGGGGDGGGGGGGGGGGGGGEGEGGA\n+@D00635:180:CA2WAANXX:5:2306:18514:51516 2:N:0:ATTACTCG+CAGGACGT\n+CAGAAGTACAAGCGCCAGGCACAGACTGACCGAGTGAGCCTGCGGAACCTGCGCGGCTACTACAACCAGAGCGAGGCCGGGTCTCACATCATCCAGAGGATGTATGGCTGCGACGTGGGGCCCGAC\n++\n+@@BBCGGGGGGGGGGFGGGGGGGGCGGGGCG/EGGGGGGGFGGGGGGGGGF>EGAGGGGGGGECGGGGGGGGG@@GGGGGDCCGGGGGGGGGGGBGBDGBDEG=GGGBEEGGGGG9CC.CG.CAG.\n+@D00635:180:CA2WAANXX:5:2306:19065:61209 2:N:0:ATTACTCG+CAGGACGG\n+CCGGAGTATTGGGACGAGGAGACAGGGAAAGTGAAGGCCCACTCACAGACTGACCGAGAGAACCTGCGGATCGCGCTCCGCTACTACAACCAGAGCGAGGCCGGTTCTCACACCCTCCAGATGATG\n++\n+BBBBAGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGDGGGGGGGGGGGGGGGGGGCGGDGGGGGGGGGGGGGGEGE=DGGG\n+@D00635:180:CA2WAANXX:5:2306:9450:74231 2:N:0:ATTACTCG+CAGGACGT\n+AGGATGGAGCCGCGGGCGCCGTGGATAGAGCAGGAGGGGCCGGAGTATTGGGACGAGGAGACAGGGAAAGTGAAGGCCCACTCACAGACTGACCGAGAGAACCTGCGGATCGCGCTCCGCTACTAC\n++\n+<AABBGGGBGGGGG<ED/9/CGGG<:FDFCFG1FFGG/9/CBG@GGGGGBGB==/?CCDGG@DED<//C@CB@DBD///:D9;//;D/EGEGGGAGGGG.CD<BGG?G;EGGGB.CC.CC.8.C/8\n+@D00635:180:CA2WAANXX:5:2306:10675:81134 2:N:0:ATTACTCG+CAGGACGT\n+TGCGACGTGGGGCCCGACGGGCGCCTCCTCCGCGGGTATGACCAGTACGCCTACGACGGCAAGGATTACATCGCCCTGAACGAGGATCTGCGCTCCTGGACCGCCGCGGACACGGCGGCTCAGATC\n++\n+BB@BADCC;/EEGG</GGDGGG>/<BFF>1CABG///909B@FCGGGCB//CFG</9/CC?AGG<DDGGGGGGGG<>EG=;/9:?A/C/CDA@GBADGBGGGGGDDG;CDGG<B@G;6..:@C/D@\n+@D00635:180:CA2WAANXX:5:2306:14669:88822 2:N:0:ATTACTCG+CAGGACGT\n+GCTCCGCTACTACAACCAGAGCGAGGCCGGTTCTCACACCCTCCAGATGATGTTTGGCTGCGACGTGGGGTCGGACGGGCGCTTCCTCCGCGGGTACCACCAGTACGCCTACGACGGCAAGGAGTA\n++\n+CC@BCGBBGGE>@DGGGGGBFGDAEAGFCBCCGGGGGGGBGGG<@1@1<EFD=FC1B@1CFGDGG/9EEGGGDGDAG;?/CGDGG/9/DGG?...EE@@EB<.ECD>AAE<.C6DGGD..@.C.98\n+@D00635:180:CA2WAANXX:5:2306:3523:97789 
2:N:0:ATTACTCG+CAGGACGG\n+GTGGGGCCGGACGGGCGCCTCCTCCGCGGGCATAACCAGTACGCCTACGACGGCAAGGATTACATCGCCCTGAACGAGGACCTGCGCTCCTGGACCGCCGCGGACACGGCGGCTCAGATCACCCAG\n++\n+BBBBCGGBDA>BBBEGG///9E@GFB/EGGGDGDG@F<FFGGGBGGC0:/C?GD@GG<90;EGG90/CDBC@C=G<//:CEEGGGGG;.CGDG@@..C?DGGGGB@GDGGA;:?CG<CG@@D.:..\n+@D00635:180:CA2WAANXX:5:2305:17386:6381 2:N:0:ATTACTCG+CAGGACGG\n+GGGCGCCTCCTCCGCGGGCAT'..b'GE>G@GFGGG>/FFGGG@GGGGGG@GGCGEG<:/:DGGBGDDGGGE@DGEGGEDGEEGGGGGGGGEGDEDGGDGD@.8<EED@AC.C6999D>D.6C..6E/\n+@D00635:180:CA2WAANXX:5:2111:16885:49734 2:N:0:ATTACTCG+CAGGACGT\n+ACGCAGTTCGTGCGGTTCGACAGCGACGCCGCGAGCCAGAGGATGGAGCCGCGGGCGCCGTGGATAGAGCAGGAGGGGCCGGAGTATTGGGACGAGGAGACAGGGAAAGTGAAGGCCCACTCACAG\n++\n+BBB=AE/CDFGDGB>GGGGDGGGEGGA>EGGGD<EBGDGBFFFGGGFGBF<C>/C?C/CGG/EGD;@DGG=BDGGG/GDGGGGG<GCDGGGEGDADGCCB.DEB.<DDG@@=EGG.DDBGGG.@G@\n+@D00635:180:CA2WAANXX:5:2111:14007:59060 2:N:0:ATTACTCG+CAGGACGT\n+TGGCCCTGACCCAGACCTGGGCAGGCTCCCACTCCATGAGGTATTTCTCCACATCCGTGTCCCGGCCCGGCCGCGGGGAGCCCCGCTTCATCGCCGTGGGCTACGTGGACGACACGCAGTTCGTGC\n++\n+BBBBCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGEGGGGGGGGGGGGGGGGGGGDGGGGGGGGFGGGGGGGGGGGGGGGGGGG;EG;CGGGGGGGDGGGGDDAGGGG.CEGGGG\n+@D00635:180:CA2WAANXX:5:2111:15596:66739 2:N:0:ATTACTCG+CAGGACGT\n+CAGTTCGTGCGGTTCGACAGCGACGCCGCGAGCCAGAGGATGGAGCCGCGGGCGCCGTGGATAGAGCAGGAGGGGCCGGAGTATTGGGACGAGGAGACAGGGAAAGTGAAGGCCCACTCACAGACT\n++\n+BBB<AGGGGGGGGGGGGGFGGGGGGGGGGGDGGGEEGGGGGFGGG>GAGGGGGGGGGGGGGGGBBGGGGGBGGGGBGGDDD:CEBD@G<EDEGDDBDDGG.:EEGGDGB=GGEGGGGGGGGGEGD:\n+@D00635:180:CA2WAANXX:5:2111:18215:76603 2:N:0:ATTACTCG+CAGGACGT\n+GCTACTACAACCAGAGCGAGGCCGGTTCTCACACCCTCCAGATGATGTTTGGCTGCGACGTGGGGTCGGACGGGCGCTTCCTCCGCGGGTACCACCAGTACGCCTACGACGGCAAGGATTACATCG\n++\n+BB=ABGGGFGGGGFGGGG@GGGGG<BEEGGGFGGGGGBF>DGGGFGG:FGBDGGGGEE<GCDBGDCFGG<CEDDDAA@GDGBGGGGDAGG@EGEGGGEGBGDGBCDGBG@DCDG>GE.8@CDG=E.\n+@D00635:180:CA2WAANXX:5:2111:14226:83019 
2:N:0:ATTACTCG+CAGGACGT\n+CGAGTCCGAGGAAGGAGCCGCGGGCGCCATGGATAGAGCAGGAGGGGCCGGAGTATTGGGACCGGGAGACACAGATCTCCAAGACCAACACACAGACTTACCGAGAGAGCCTGCGGAACCTGCGCG\n++\n+BBBBBGEGGGFGGBGGGGGGGGGGGGGGGGGGCGGDGF11BGGGF@@<>GG@DFGGEGG@FEGBGDGGGGG<E<=BEGEBBGDGGGGGGGG//C@/EGGGGGD.EG?GG<DE@GGGBGDGGGGGGC\n+@D00635:180:CA2WAANXX:5:2111:19289:88648 2:N:0:ATTACTCG+CAGGACGT\n+CTCAGATCACCAAGCGCAAGTGGGAGGCGGCCCATGTGGCGGAGCAGCAGAGAGCCTACCTGGAGGGCACGTGCGTGGACGGGCTCCGCAGATACCTGGAGAACGGGAAGGAGACGCTGCAGCGCA\n++\n+BBBCBGGGGGGGGGGGGGGGCEFGGGGGEGGGGGGGGGFGGGFGGGFGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGDGGGAGGCGGGGGGGGEGDGGEGGEDGGGGEGC?DGGGGGCGGGGGGG.\n+@D00635:180:CA2WAANXX:5:2111:6549:96971 2:N:0:ATTACTCG+CAGGACGT\n+GGTTCTCACACCCTCCAGATGATGTTTGGCTGCGACGTGGGGTCGGACGGGCGCTTCCTCCGCGGGTACCACCAGTACGCCTACGACGGCAAGGATTACATCGCCCTGAAAGAGGACCTGCGCTCT\n++\n+CCBBCGGGGGGDGGGGGGGGGGDFGCGGGGCGGGGGGGGGGGGGGGGGGGCCDGFGGGGGGFGGGGGGGGGGGGGGGGGDAGG/EBD>CGGGGDE@DD=@DGGGGGGGCDDGGGEGGGGGEAGGGG\n+@D00635:180:CA2WAANXX:5:2109:2641:10752 2:N:0:ATTACTCG+CAGGACGT\n+CACTCACAGACTGACCGAGAGAACCTGCGGATCGCGCTCCGCTACTACAACCAGAGCGAGGCCGGTTCTCACACCCTCCAGATGATGTTTGGCTGCGACGTGGGGTCGGACGGGCGCTACCTCCGC\n++\n+B=BBBGGGFEGGBFGG<>EB>G1FGGGGGGGGGGGGGGGGBGGGGGEGGGGGGE>FEGDGGGGGGGDGGGGG=FGGGGGG@EGGGGEGG9@BGGGGG@;CE>DGAGGGG.?CG..6.988@EGG>.\n+@D00635:180:CA2WAANXX:5:2109:15937:23271 2:N:0:ATTACTCG+CAGGACGT\n+GGAAGGAGCCGCGGGCGCCATGGATAGAGCAGGAGGGGCCGGAGTATTGGGACCGGGAGACACAGATCTCCAAGACCAACACACAGACTTACCGAGAGAGCCTGCGGAACCTGCGCGGCTACTACA\n++\n+BBBC@<EGGGGGGGGGGGGGGGFGGGGGGGGGGCGGGGGGGGGGGGGGGCGGFGGGGGGEGGGBGDGGGGGEGGGGEGGGGGEGGGG<DGGGEGDG.8DDEGGGGGCCGGGDGGG@CA:.>GBGDD\n+@D00635:180:CA2WAANXX:5:2109:9613:28877 2:N:0:ATTACTCG+CAGGACGT\n+GCCATGGATAGAGCAGGAGGGGCCGGAGTATTGGGACCGGGAGACACAGATCTCCAAGACCAACACACAGACTTACCGAGAGAGCCTGCGGAACCTGCGCGGCTACTACAACCAGAGCGAGGCCGG\n++\n+CCBCBGGGGF>FDEDGGFDBGGGGGGGGGGGGGGGGEGGGGGGGGGGGGGGGGGGEGCGEFEGGGFGGGGGGGDFCFGD@<DGDGGGBGGGGGGGGGGD?CA.CGGGGG@DGGGB.@D6>6C.@DG\n+@D00635:180:CA2WAANXX:5:2109:13098:35617 
2:N:0:ATTACTCG+CAGGACGT\n+CTCACACCCTCCAGAGCATGTACGGCTGCGACGTGGGGCCGGACGGGCGCCTCCTCCGCGGGCATAACCAGTACGCCTACGACGGCAAGGATTACATCGCCCTGAACGAGGACCTGCGCTCCTGGA\n++\n+BCBBBGGGFGGGEGGGGGGGGGFGGGGGFGGGGGGGGGGGBGGGFGGGGGGDGGGGGGGGGGGGGGGGGGGGG0CGGGGGGGGGCDG@EGGGGGGGGGGGGGGGEGGGBGGDGGEGGGBDGGGCG.\n+@D00635:180:CA2WAANXX:5:2109:3892:46389 2:N:0:ATTACTCG+CAGGACGT\n+CACCAGTACGCCTACGACGGCAAGGATTACATCGCCCTGAAAGAGGACCTGCGCTCTTGGACCGCGGCGGACATGGCGGCTCAGATCACCAAGCGCAAGTGGGAGGCGGCCCATGTGGCGGAGCAG\n++\n+AB@0<CGCFGD<BDG<DDDGGGA@01:BBFGF>FG/FGB1:=B1BD10<=FGDG/<F@000009///9>D>CD@D<DA/9C>E0E;E@/EC@EE.>..8C7/.96.86..8.86.86/@>.666C.\n'