annotate pileup_interval.xml @ 3:ef11139d4545 draft

planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947
author devteam
date Tue, 21 Jul 2015 15:40:07 -0400
parents 0b4181be05c8
children 9c1c0b947e46
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
ef11139d4545 planemo upload commit 00a7926c285bc4a339bd7deebf40b28f39c7d947
devteam
parents: 2
diff changeset
1 <tool id="pileup_interval" name="Pileup-to-Interval" version="1.0.2">
0
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
2 <description>condenses pileup format into ranges of bases</description>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
3 <command interpreter="python">
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
4 pileup_interval.py
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
5 --input=$input
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
6 --output=$output
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
7 --coverage=$coverage
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
8 --format=$format_type.format
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
9 #if $format_type.format == "ten":
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
10 --base=$format_type.which_base
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
11 --seq_column="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
12 --loc_column="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
13 --base_column="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
14 --cvrg_column="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
15 #elif $format_type.format == "manual":
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
16 --base="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
17 --seq_column=$format_type.seq_column
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
18 --loc_column=$format_type.loc_column
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
19 --base_column=$format_type.base_column
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
20 --cvrg_column=$format_type.cvrg_column
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
21 #else:
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
22 --base="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
23 --seq_column="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
24 --loc_column="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
25 --base_column="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
26 --cvrg_column="None"
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
27 #end if
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
28 </command>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
29 <inputs>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
30 <param name="input" type="data" format="tabular" label="Choose a pileup file to condense:" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
31 <conditional name="format_type">
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
32 <param name="format" type="select" label="which contains:" help="See &quot;Types of pileup datasets&quot; below for examples">
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
33 <option value="six" selected="true">Pileup with six columns (simple)</option>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
34 <option value="ten">Pileup with ten columns (with consensus)</option>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
35 <option value="manual">Set columns manually</option>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
36 </param>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
37 <when value="six" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
38 <when value="ten">
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
39 <param name="which_base" type="select" label="Which base do you want to concatenate">
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
40 <option value="first" selected="true">Reference base (first)</option>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
41 <option value="second">Consensus base (second)</option>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
42 </param>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
43 </when>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
44 <when value="manual">
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
45 <param name="seq_column" label="Select column with sequence name" type="data_column" numerical="false" data_ref="input" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
46 <param name="loc_column" label="Select column with base location" type="data_column" numerical="false" data_ref="input" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
47 <param name="base_column" label="Select column with base to concatenate" type="data_column" numerical="false" data_ref="input" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
48 <param name="cvrg_column" label="Select column with coverage" type="data_column" numerical="true" data_ref="input" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
49 </when>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
50 </conditional>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
51 <param name="coverage" type="integer" value="3" label="Do not report bases with coverage less than:" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
52 </inputs>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
53 <outputs>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
54 <data format="tabular" name="output" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
55 </outputs>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
56 <tests>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
57 <test>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
58 <param name="input" value="pileup_interval_in1.tabular" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
59 <param name="format" value="six" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
60 <param name="coverage" value="3" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
61 <output name="output" file="pileup_interval_out1.tabular" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
62 </test>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
63 <test>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
64 <param name="input" value="pileup_interval_in2.tabular" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
65 <param name="format" value="ten" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
66 <param name="which_base" value="first" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
67 <param name="coverage" value="3" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
68 <output name="output" file="pileup_interval_out2.tabular" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
69 </test>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
70 <test>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
71 <param name="input" value="pileup_interval_in2.tabular" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
72 <param name="format" value="manual" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
73 <param name="seq_column" value="1" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
74 <param name="loc_column" value="2" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
75 <param name="base_column" value="3" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
76 <param name="cvrg_column" value="8" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
77 <param name="coverage" value="3" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
78 <output name="output" file="pileup_interval_out2.tabular" />
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
79 </test>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
80 </tests>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
81 <help>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
82
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
83 **What it does**
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
84
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
85 Reduces the size of a result set by taking a pileup file and producing a condensed version showing consecutive sequences of bases meeting coverage criteria. The tool works on six- and ten-column pileup formats produced with the *samtools pileup* command. You can also specify columns for the input file manually. The tool assumes that the pileup dataset was produced by the *samtools pileup* command (although you can override this by setting column assignments manually).
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
86
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
87 --------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
88
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
89 **Types of pileup datasets**
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
90
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
91 The description of the pileup format below is largely based on information that can be found on the SAMTools_ documentation page. The 6- and 10-column variants are described below.
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
92
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
93 .. _SAMTools: http://samtools.sourceforge.net/pileup.shtml
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
94
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
95 **Six column pileup**::
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
96
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
97 1 2 3 4 5 6
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
98 ---------------------------------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
99 chrM 412 A 2 ., II
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
100 chrM 413 G 4 ..t, IIIH
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
101 chrM 414 C 4 ...a III2
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
102 chrM 415 C 4 TTTt III7
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
103
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
104 where::
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
105
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
106 Column Definition
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
107 ------ ----------------------------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
108 1 Chromosome
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
109 2 Position (1-based)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
110 3 Reference base at that position
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
111 4 Coverage (# reads aligning over that position)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
112 5 Bases within reads (see Galaxy wiki for more info)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
113 6 Quality values (phred33 scale, see Galaxy wiki for more)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
114
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
115 **Ten column pileup**
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
116
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
117 The `ten-column`__ pileup incorporates additional consensus information generated with the *-c* option of the *samtools pileup* command::
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
118
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
119
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
120 1 2 3 4 5 6 7 8 9 10
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
121 ------------------------------------------------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
122 chrM 412 A A 75 0 25 2 ., II
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
123 chrM 413 G G 72 0 25 4 ..t, IIIH
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
124 chrM 414 C C 75 0 25 4 ...a III2
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
125 chrM 415 C T 75 75 25 4 TTTt III7
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
126
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
127 where::
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
128
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
129 Column Definition
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
130 ------- ----------------------------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
131 1 Chromosome
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
132 2 Position (1-based)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
133 3 Reference base at that position
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
134 4 Consensus bases
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
135 5 Consensus quality
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
136 6 SNP quality
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
137 7 Maximum mapping quality
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
138 8 Coverage (# reads aligning over that position)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
139 9 Bases within reads (see Galaxy wiki for more info)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
140 10 Quality values (phred33 scale, see Galaxy wiki for more)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
141
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
142
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
143 .. __: http://samtools.sourceforge.net/cns0.shtml
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
144
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
145 ------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
146
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
147 **The output format**
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
148
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
149 The output file condenses the information in the pileup file so that consecutive bases are listed together as sequences. The starting and ending points of the sequence range are listed, with the starting value converted to a 0-based value.
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
150
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
151 Given the following input with minimum coverage set to 3::
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
152
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
153 1 2 3 4 5 6
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
154 ---------------------------------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
155 chr1 112 G 3 ..Ta III6
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
156 chr1 113 T 2 aT.. III5
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
157 chr1 114 A 5 ,,.. IIH2
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
158 chr1 115 C 4 ,., III
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
159 chrM 412 A 2 ., II
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
160 chrM 413 G 4 ..t, IIIH
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
161 chrM 414 C 4 ...a III2
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
162 chrM 415 C 4 TTTt III7
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
163 chrM 490 T 3 a I
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
164
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
165 the following would be the output::
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
166
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
167 1 2 3 4
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
168 -------------------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
169 chr1 111 112 G
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
170 chr1 113 115 AC
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
171 chrM 412 415 GCC
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
172 chrM 489 490 T
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
173
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
174 where::
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
175
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
176 Column Definition
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
177 ------- ----------------------------
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
178 1 Chromosome
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
179 2 Starting position (0-based)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
180 3 Ending position (1-based)
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
181 4 Sequence of bases
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
182
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
183 </help>
a110f9d6ae24 Uploaded tool tarball.
devteam
parents:
diff changeset
184 </tool>