comparison convert.xml @ 0:6231ae8f87b8

Uploaded
author wolma
date Wed, 11 Feb 2015 08:29:02 -0500
parents
children a548b3c6ed00
comparison
equal deleted inserted replaced
-1:000000000000 0:6231ae8f87b8
1 <tool id="convert" name="Convert">
2 <description>between different sequence data formats</description>
3 <version_command>mimodd version -q</version_command>
4 <command>
5 mimodd convert
6
7 #for $i in $mode.input_list
8 "${i.file1}"
9 #if $str($mode.iformat) in ("fastq_pe", "gz_pe"):
10 "${i.file2}"
11 #end if
12 #end for
13 #if $str($mode.header) != "None":
14 --header "$(mode.header)"
15 #end if
16 --ofile "$outputname"
17 --iformat $(mode.iformat)
18 --oformat $(mode.oformat)
19 </command>
20
21 <inputs>
22 <conditional name="mode">
23 <param name="iformat" type="select" label="input file format" help="Your choice will update the interface to display further choices appropriate for your type of input data.">
24 <option value="fastq">fastq: single-end (one file)</option>
25 <option value="fastq_pe">fastq: paired-end (two files)</option>
26 <option value="gz">gzip compressed fastq: single-end (one file)</option>
27 <option value="gz_pe">gzip compressed fastq: paired-end (two files)</option>
28 <option value="sam">sam</option>
29 <option value="bam">bam</option>
30 </param>
31 <when value="fastq">
32 <param name="oformat" type="select" label="output file format">
33 <option value="sam">sam</option>
34 <option value="bam">bam</option>
35 </param>
36 <repeat name="input_list" title="fastq input dataset" default="1" min="1">
37 <param name="file1" format="fastq" type="data" label="inputfile"/>
38 </repeat>
39 <param name="header" type="data" format="sam" label="Use Header File" help="A SAM file with header information, as generated, for example, by the NGS Run Annotation Tool, that will be used to attach metainformation to the results file."/>
40 </when>
41 <when value="fastq_pe">
42 <param name="oformat" type="select" label="output file format">
43 <option value="sam">sam</option>
44 <option value="bam">bam</option>
45 </param>
46 <repeat name="input_list" title="fastq input datasets" default="1" min="1">
47 <param format="fastq" name="file1" type="data" label="inputfile with the first set of reads of paired-end data"/>
48 <param format="fastq" name="file2" type="data" label="inputfile with the second set of reads of paired-end data"/>
49 </repeat>
50 <param name="header" type="data" format="sam" label="Use Header File" help="A SAM file with header information, as generated, for example, by the NGS Run Annotation Tool, that will be used to attach metainformation to the results file."/>
51 </when>
52 <when value="gz">
53 <param name="oformat" type="select" label="output file format">
54 <option value="sam">sam</option>
55 <option value="bam">bam</option>
56 </param>
57 <repeat name="input_list" title="fastq.gz input dataset" default="1" min="1">
58 <param name="file1" format="data" type="data" label="inputfile"/>
59 </repeat>
60 <param name="header" type="data" format="sam" label="Use Header File" help="A SAM file with header information, as generated, for example, by the NGS Run Annotation Tool, that will be used to attach metainformation to the results file."/>
61 </when>
62 <when value="gz_pe">
63 <param name="oformat" type="select" label="output file format">
64 <option value="sam">sam</option>
65 <option value="bam">bam</option>
66 </param>
67 <repeat name="input_list" title="fastq.gz input datasets" default="1" min="1">
68 <param format="data" name="file1" type="data" label="inputfile with the first set of reads of paired-end data"/>
69 <param format="data" name="file2" type="data" label="inputfile with the second set of reads of paired-end data"/>
70 </repeat>
71 <param name="header" type="data" format="sam" label="Use Header File" help="A SAM file with header information, as generated, for example, by the NGS Run Annotation Tool, that will be used to attach metainformation to the results file."/>
72 </when>
73 <when value="sam">
74 <param name="oformat" type="select" label="output file format">
75 <option value="bam">bam</option>
76 </param>
77 <repeat name="input_list" title="sam input dataset" default="1" min="1" max="1">
78 <param name="file1" format="sam" type="data" label="inputfile"/>
79 </repeat>
80 <param name="header" type="hidden" value="None"/>
81 </when>
82 <when value="bam">
83 <param name="oformat" type="select" label="output file format">
84 <option value="sam">sam</option>
85 </param>
86 <repeat name="input_list" title="bam input dataset" default="1" min="1" max="1">
87 <param name="file1" format="bam" type="data" label="inputfile"/>
88 </repeat>
89 <param name="header" type="hidden" value="None"/>
90 </when>
91 </conditional>
92 </inputs>
93
94 <outputs>
95 <data name="outputname" format="bam" label="Converted reads from MiModd ${tool.name} on ${on_string}">
96 <change_format>
97 <when input="mode.oformat" value="sam" format="sam" />
98 </change_format>
99 </data>
100 </outputs>
101
102 <help>
103 .. class:: infomark
104
105 **What it does**
106
107 The tool converts between different file formats used for storing next-generation sequencing data.
108
109 As input file types it can handle uncompressed or gzipped fastq, SAM or BAM format, which it can convert to SAM or BAM format.
110
111 **Notes:**
112
113 1) In its standard configuration Galaxy will decompress any .gz files during their upload, so the option to align gzipped fastq input is useful only with customized Galaxy instances or by using linked files as explained in our `recipe for using gzipped fastq files in Galaxy`_ from the `MiModD user guide`_.
114
115 2) The tool can convert fastq files representing data from paired-end sequencing runs to appropriate SAM/BAM format provided that the mate information is split over two fastq files in corresponding order.
116
117 **TIP:** If your paired-end data is arranged differently, you may look into the *fastq splitter* and *fastq de-interlacer* tools for Galaxy from the `Fastq Manipulation category`_ of the Galaxy Tool Shed to see if they can convert your files to the expected format.
118
119 3) Merging partial fastq (or gzipped fastq) files into a single SAM/BAM file is supported both for single-end and paired-end data. Simply add additional input datasets and select the appropriate files (pairs of files in case of paired-end data).
120
121 Concatenation of SAM/BAM file during conversion is currently not supported.
122
123 4) For input in fastq format a SAM header file providing run metadata **has to be specified**. The information in this file will be used as the header data of the new SAM/BAM file. You can use the *NGS Run Annotation* tool to generate a new header file for your data.
124
125 For input in SAM/BAM format the tool will simply copy the existing header data to the new file. To modify the header of an existing SAM/BAM file, use the *Reheader BAM file* tool instead.
126
127 .. _Fastq Manipulation category: https://toolshed.g2.bx.psu.edu/repository/browse_repositories_in_category?id=310ff67d4caf6531
128 .. _recipe for using gzipped fastq files in Galaxy: http://mimodd.readthedocs.org/en/latest/recipes.html#use-gzipped-fastq-files-in-galaxy
129 .. _MiModD user guide: http://mimodd.readthedocs.org/en/latest
130
131 </help>
132 </tool>
133