# HG changeset patch # User leomrtns # Date 1557826594 14400 # Node ID e86d1c122ee7e77e61550e6862266903828a166c initial upload diff -r 000000000000 -r e86d1c122ee7 nanostat.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/nanostat.xml Tue May 14 05:36:34 2019 -0400 @@ -0,0 +1,111 @@ + + + Calculate various statistics from a long read sequencing dataset in fastq, bam or albacore sequencing summary format + + + nanostat + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + @misc{githubnanostat, + url = {https://github.com/wdecoster/nanostat} + } + @article{10.1093/bioinformatics/bty149, + author = {De Coster, Wouter and D’Hert, Svenn and Schultz, Darrin T and Cruts, Marc and Van Broeckhoven, Christine}, + title = "{NanoPack: visualizing and processing long-read sequencing data}", + journal = {Bioinformatics}, + volume = {34}, + number = {15}, + pages = {2666-2669}, + year = {2018}, + month = {03}, + abstract = "{Here we describe NanoPack, a set of tools developed for visualization and processing of long-read sequencing data from Oxford Nanopore Technologies and Pacific Biosciences.The NanoPack tools are written in Python3 and released under the GNU GPL3.0 License. The source code can be found at https://github.com/wdecoster/nanopack, together with links to separate scripts and their documentation. The scripts are compatible with Linux, Mac OS and the MS Windows 10 subsystem for Linux and are available as a graphical user interface, a web service at http://nanoplot.bioinf.be and command line tools.Supplementary data are available at Bioinformatics online.}", + issn = {1367-4803}, + doi = {10.1093/bioinformatics/bty149}, + url = {https://doi.org/10.1093/bioinformatics/bty149}, + eprint = {http://oup.prod.sis.lan/bioinformatics/article-pdf/34/15/2666/25230836/bty149.pdf} + } + + + diff -r 000000000000 -r e86d1c122ee7 test-data/input_1.fq.gz Binary file test-data/input_1.fq.gz has changed diff -r 000000000000 -r e86d1c122ee7 test-data/input_2.fq.bz2 Binary file test-data/input_2.fq.bz2 has changed diff -r 000000000000 -r e86d1c122ee7 test-data/out.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/out.txt Tue May 14 05:36:34 2019 -0400 @@ -0,0 +1,26 @@ +General summary: +Mean read length: 144.9 +Mean read quality: 27.8 +Median read length: 151.0 +Median read quality: 28.2 +Number of reads: 18,250.0 +Read length N50: 151.0 +Total bases: 2,645,038.0 +Number, percentage and megabases of reads above quality cutoffs +>Q5: 18247 (100.0%) 2.6Mb +>Q7: 18247 (100.0%) 2.6Mb +>Q10: 18247 (100.0%) 2.6Mb +>Q12: 18247 (100.0%) 2.6Mb +>Q15: 18247 (100.0%) 2.6Mb +Top 5 highest mean basecall quality scores and their read lengths +1: 35.8 (151) +2: 35.8 (151) +3: 35.8 (151) +4: 35.8 (151) +5: 35.8 (151) +Top 5 longest reads and their mean basecall quality score +1: 151 (27.3) +2: 151 (32.2) +3: 151 (20.3) +4: 151 (32.5) +5: 151 (22.5)