comparison nanostat.xml @ 0:e86d1c122ee7 draft

initial upload
author leomrtns
date Tue, 14 May 2019 05:36:34 -0400
parents
children 845458a694e0
comparison
equal deleted inserted replaced
-1:000000000000 0:e86d1c122ee7
1 <tool id="nanostat" name="NanoStat" version="0.1.0">
2 <description>
3 Calculate various statistics from a long read sequencing dataset in fastq, fasta, bam or albacore/guppy sequencing summary format
4 </description> <!-- Names every input type offered by the input_type selector in the inputs section. -->
5 <requirements> <!-- External software the command needs: the nanostat package, pinned to version 1.1.2. -->
6 <requirement type="package" version="1.1.2">nanostat</requirement>
7 </requirements>
8 <command detect_errors="exit_code"><![CDATA[
9 #import re
10 ## Galaxy creates xyz.dat but nanostat relies on suffix to detect compressed fasta/fastq; otoh Galaxy provides 'element_identifier', so fastq/fasta inputs are symlinked under that name
11 ## Each selected dataset becomes its own single-quoted shell word in $named_input_files: bam/summary use the Galaxy path, fastq/fasta the link name (anything but word characters, '-' and '.' replaced by '_' so it cannot break the quoting)
12 #set $named_input_files = ''
13 #for $i_file in $input_type.file
14 #set $_input_file = "'{}'".format(str($i_file))
15 #if str($input_type.type) == "fastq" or str($input_type.type) == "fasta"
16 #set $_input_file = "'{}'".format(re.sub('[^\w\-\.]', '_', str($i_file.element_identifier)))
17 ln -s '${i_file}' ${_input_file} &&
18 #end if
19 #set $named_input_files = $named_input_files + ' ' + $_input_file
20 #end for
21 #### alternative would be something like: x=`file o.xyz.gz; if [[ $x == *gzip* ]]; then echo "found gzip"; fi
22 NanoStat
23 --threads \${GALAXY_SLOTS:-4}
24 #if str($input_type.type) == "fastq"
25 --fastq ${named_input_files}
26 #else if str($input_type.type) == "fasta"
27 --fasta ${named_input_files}
28 #else if str($input_type.type) == "bam"
29 --bam ${named_input_files}
30 #else if str($input_type.type) == "summary"
31 --readtype "${input_type.readtype}"
32 --summary ${named_input_files}
33 #if $input_type.barcoded
34 --barcoded
35 #end if
36 #end if
37 -n "$output1"
38 ]]></command>
39 <inputs> <!-- The value of input_type.type selects which NanoStat input option the command emits; every branch calls its dataset parameter "file". -->
40 <conditional name="input_type">
41 <param name="type" type="select" label="File type of input read files" help="It is not possible to mix distinct file types.">
42 <option value="fastq" selected="true">fastq (compressed or not)</option>
43 <option value="fasta">fasta (compressed or not)</option>
44 <option value="bam">sorted bam</option>
45 <option value="summary">Use albacore or guppy summary file for quality scores</option>
46 </param>
47 <when value="fastq">
48 <param type="data" name="file" format="fastqsanger,fastqsanger.gz,fastqsanger.bz2,fastqsanger.bgz" multiple="true" label="One or more (compressed) fastq file(s)."/>
49 </when>
50 <when value="fasta">
51 <param type="data" name="file" format="fasta,fasta.gz,fasta.bz2,fasta.bgz" multiple="true" label="One or more (compressed) fasta file(s)."/>
52 </when>
53 <when value="bam">
54 <param type="data" name="file" format="bam" label="One or more sorted bam file(s)." multiple="true"/>
55 </when>
56 <when value="summary">
57 <param type="data" name="file" format="tabular" label="Summary file generated by albacore or guppy." multiple="true"/>
58 <param name="barcoded" argument="--barcoded" type="boolean" truevalue="--barcoded" falsevalue="" checked="false" label="Do you want to split the summary file by barcode?" help="Default:No"/>
59 <param name="readtype" argument="--readtype" type="select" label="Which read type to extract information about from summary?">
60 <option value="1D" selected="true">1D</option>
61 <option value="2D">2D</option>
62 <option value="1D2">1D2</option>
63 </param>
64 </when>
65 </conditional>
66 <!-- The dataset parameters are required: the NanoStat usage in the help section shows the input options as a parenthesised group, i.e. one of them must be given. The barcoded truevalue mirrors its argument; the command template only tests the boolean and writes the flag itself. -->
67 </inputs>
68 <outputs> <!-- Single result dataset; the command hands its path to NanoStat through -n "$output1". -->
69 <data name="output1" format="tabular" />
70 </outputs>
71 <tests> <!-- One test: the default fastq branch with two compressed inputs (gz and bz2 suffixes), compared against out.txt. -->
72 <test>
73 <param name="type" value="fastq"/>
74 <param name="file" value="input_1.fq.gz,input_2.fq.bz2"/>
75 <output name="output1" file="out.txt"/>
76 </test>
77 </tests>
78 <help><![CDATA[
79 usage: NanoStat [-h] [-v] [-o OUTDIR] [-p PREFIX] [-n NAME] [-t N]
80 [--barcoded] [--readtype {1D,2D,1D2}]
81 (--fastq file [file ...] | --fasta file [file ...] | --summary file [file ...] | --bam file [file ...])
82
83 Calculate statistics of long read sequencing dataset.
84
85 EXAMPLE usage:
86 NanoStat --fastq reads.fastq.gz --outdir statreports
87
88 ]]> </help> <!-- The help text is NanoStat's own command-line usage. Of the options it lists, the command template passes only the thread count, the output name (-n), one input option and, for summary input, the read type and the barcoded flag. -->
89 <citations> <!-- One BibTeX entry per citation element: first the NanoStat repository, then the NanoPack article. -->
90 <citation type="bibtex">
91 @misc{githubnanostat, url = {https://github.com/wdecoster/nanostat}}
92 </citation>
93 <citation type="bibtex">
94 @article{10.1093/bioinformatics/bty149,
95 author = {De Coster, Wouter and D’Hert, Svenn and Schultz, Darrin T and Cruts, Marc and Van Broeckhoven, Christine},
96 title = "{NanoPack: visualizing and processing long-read sequencing data}",
97 journal = {Bioinformatics},
98 volume = {34},
99 number = {15},
100 pages = {2666-2669},
101 year = {2018},
102 month = {03},
103 abstract = "{Here we describe NanoPack, a set of tools developed for visualization and processing of long-read sequencing data from Oxford Nanopore Technologies and Pacific Biosciences.The NanoPack tools are written in Python3 and released under the GNU GPL3.0 License. The source code can be found at https://github.com/wdecoster/nanopack, together with links to separate scripts and their documentation. The scripts are compatible with Linux, Mac OS and the MS Windows 10 subsystem for Linux and are available as a graphical user interface, a web service at http://nanoplot.bioinf.be and command line tools.Supplementary data are available at Bioinformatics online.}",
104 issn = {1367-4803},
105 doi = {10.1093/bioinformatics/bty149},
106 url = {https://doi.org/10.1093/bioinformatics/bty149},
107 eprint = {http://oup.prod.sis.lan/bioinformatics/article-pdf/34/15/2666/25230836/bty149.pdf}
108 }
109 </citation>
110 </citations>
111 </tool>