Mercurial > repos > devteam > pileup_parser
annotate pileup_parser.xml @ 2:85bedbea8a12 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
author | devteam |
---|---|
date | Wed, 05 Oct 2016 06:30:36 -0400 |
parents | 1670f0565000 |
children |
rev | line source |
---|---|
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
1 <tool id="pileup_parser" name="Filter pileup" version="1.0.2"> |
0 | 2 <description>on coverage and SNPs</description> |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
3 <requirements> |
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
4 <requirement type="package" version="5.22.0">perl</requirement> |
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
5 </requirements> |
0 | 6 <command interpreter="perl"> |
7 #if $pileup_type.type_select == "six" #pileup_parser.pl $input "3" "5" "6" "4" $qv_cutoff $cvrg_cutoff $snps_only $interval "2" $out_file1 $diff $qc_base | |
8 #elif $pileup_type.type_select == "ten" #pileup_parser.pl $input "3" "9" "10" "8" $qv_cutoff $cvrg_cutoff $snps_only $interval "2" $out_file1 $diff $qc_base | |
9 #elif $pileup_type.type_select == "manual" #pileup_parser.pl $input $pileup_type.ref_base_column $pileup_type.read_bases_column $pileup_type.read_qv_column $pileup_type.cvrg_column $qv_cutoff $cvrg_cutoff $snps_only $interval $pileup_type.coord_column $out_file1 $diff $qc_base | |
10 #end if# | |
11 </command> | |
12 <inputs> | |
13 <param name="input" type="data" format="pileup" label="Select dataset"/> | |
14 <conditional name="pileup_type"> | |
15 <param name="type_select" type="select" label="which contains" help="See &quot;Types of pileup datasets&quot; below for examples"> | |
16 <option value="six" selected="true">Pileup with six columns (simple)</option> | |
17 <option value="ten">Pileup with ten columns (with consensus)</option> | |
18 <option value="manual">Set columns manually</option> | |
19 </param> | |
20 <when value="manual"> | |
21 <param name="ref_base_column" label="Select column with reference base" type="data_column" numerical="false" data_ref="input" /> | |
22 <param name="read_bases_column" label="Select column with read bases" type="data_column" numerical="false" data_ref="input" help="something like this: ..,a.."/> | |
23 <param name="read_qv_column" label="Select column with base qualities" type="data_column" numerical="false" data_ref="input" help="something like this: IIIGIAI"/> | |
24 <param name="cvrg_column" label="Select column with coverage" type="data_column" numerical="true" data_ref="input" /> | |
25 <param name="coord_column" label="Select coordinate column" type="data_column" numerical="true" data_ref="input" /> | |
26 </when> | |
27 <when value="six"> | |
28 </when> | |
29 <when value="ten"> | |
30 </when> | |
31 </conditional> | |
32 <param name="qv_cutoff" label="Do not consider read bases with quality lower than" type="integer" value="20" help="No variants with quality below this value will be reported"/> | |
33 <param name="cvrg_cutoff" label="Do not report positions with coverage lower than" type="integer" value="3" help="Pileup lines with coverage lower than this value will be skipped"/> | |
34 <param name="snps_only" label="Only report variants?" type="select" help="See &quot;Examples 1 and 2&quot; below for explanation"> | |
35 <option value="No">No</option> | |
36 <option value="Yes" selected="true">Yes</option> | |
37 </param> | |
38 <param name="interval" label="Convert coordinates to intervals?" type="select" help="See &quot;Output format&quot; below for explanation"> | |
39 <option value="No" selected="true">No</option> | |
40 <option value="Yes">Yes</option> | |
41 </param> | |
42 <param name="diff" label="Print total number of differences?" type="select" help="See &quot;Example 3&quot; below for explanation"> | |
43 <option value="No" selected="true">No</option> | |
44 <option value="Yes">Yes</option> | |
45 </param> | |
46 <param name="qc_base" label="Print quality and base string?" type="select" help="See &quot;Example 4&quot; below for explanation"> | |
47 <option value="No">No</option> | |
48 <option value="Yes" selected="true">Yes</option> | |
49 </param> | |
50 </inputs> | |
51 <outputs> | |
52 <data format="tabular" name="out_file1"> | |
53 <change_format> | |
54 <when input="interval" value="Yes" format="interval" /> | |
55 </change_format> | |
56 </data> | |
57 </outputs> | |
58 <tests> | |
59 <test> | |
60 <param name="input" value="pileup_parser.6col.pileup"/> | |
61 <output name="out_file1" file="pileup_parser.6col.20-3-yes-yes.pileup.out"/> | |
62 <param name="type_select" value="six"/> | |
63 <param name="qv_cutoff" value="20" /> | |
64 <param name="cvrg_cutoff" value="3" /> | |
65 <param name="snps_only" value="Yes"/> | |
66 <param name="interval" value="Yes" /> | |
67 <param name="diff" value="No" /> | |
68 <param name="qc_base" value="Yes" /> | |
69 </test> | |
70 <test> | |
71 <param name="input" value="pileup_parser.6col.pileup"/> | |
72 <output name="out_file1" file="pileup_parser.6col.20-3-yes-no.pileup.out"/> | |
73 <param name="type_select" value="six"/> | |
74 <param name="qv_cutoff" value="20" /> | |
75 <param name="cvrg_cutoff" value="3" /> | |
76 <param name="snps_only" value="Yes"/> | |
77 <param name="interval" value="No" /> | |
78 <param name="diff" value="No" /> | |
79 <param name="qc_base" value="Yes" /> | |
80 </test> | |
81 <test> | |
82 <param name="input" value="pileup_parser.6col.pileup"/> | |
83 <output name="out_file1" file="pileup_parser.6col.20-3-no-no.pileup.out"/> | |
84 <param name="type_select" value="six"/> | |
85 <param name="qv_cutoff" value="20" /> | |
86 <param name="cvrg_cutoff" value="3" /> | |
87 <param name="snps_only" value="No"/> | |
88 <param name="interval" value="No" /> | |
89 <param name="diff" value="No" /> | |
90 <param name="qc_base" value="Yes" /> | |
91 </test> | |
92 <test> | |
93 <param name="input" value="pileup_parser.10col.pileup"/> | |
94 <output name="out_file1" file="pileup_parser.10col.20-3-yes-yes.pileup.out"/> | |
95 <param name="type_select" value="ten"/> | |
96 <param name="qv_cutoff" value="20" /> | |
97 <param name="cvrg_cutoff" value="3" /> | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
98 <param name="snps_only" value="Yes"/> |
0 | 99 <param name="interval" value="Yes" /> |
100 <param name="diff" value="No" /> | |
101 <param name="qc_base" value="Yes" /> | |
102 </test> | |
103 <test> | |
104 <param name="input" value="pileup_parser.10col.pileup"/> | |
105 <output name="out_file1" file="pileup_parser.10col.20-3-yes-yes.pileup.out"/> | |
106 <param name="type_select" value="manual"/> | |
107 <param name="ref_base_column" value="3"/> | |
108 <param name="read_bases_column" value="9"/> | |
109 <param name="read_qv_column" value="10"/> | |
110 <param name="cvrg_column" value="8"/> | |
111 <param name="coord_column" value="2"/> | |
112 <param name="qv_cutoff" value="20" /> | |
113 <param name="cvrg_cutoff" value="3" /> | |
114 <param name="snps_only" value="Yes"/> | |
115 <param name="interval" value="Yes" /> | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
116 <param name="diff" value="No" /> |
0 | 117 <param name="qc_base" value="Yes" /> |
118 </test> | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
119 <test> |
0 | 120 <param name="input" value="pileup_parser.10col.pileup"/> |
121 <output name="out_file1" file="pileup_parser.10col.20-3-yes-yes-yes-yes.pileup.out"/> | |
122 <param name="type_select" value="manual"/> | |
123 <param name="ref_base_column" value="3"/> | |
124 <param name="read_bases_column" value="9"/> | |
125 <param name="read_qv_column" value="10"/> | |
126 <param name="cvrg_column" value="8"/> | |
127 <param name="coord_column" value="2"/> | |
128 <param name="qv_cutoff" value="20" /> | |
129 <param name="cvrg_cutoff" value="3" /> | |
130 <param name="snps_only" value="Yes"/> | |
131 <param name="interval" value="Yes" /> | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
132 <param name="diff" value="Yes" /> |
0 | 133 <param name="qc_base" value="Yes" /> |
134 </test> | |
135 <test> | |
136 <param name="input" value="pileup_parser.10col.pileup"/> | |
137 <output name="out_file1" file="pileup_parser.10col.20-3-yes-yes-yes-no.pileup.out"/> | |
138 <param name="type_select" value="manual"/> | |
139 <param name="ref_base_column" value="3"/> | |
140 <param name="read_bases_column" value="9"/> | |
141 <param name="read_qv_column" value="10"/> | |
142 <param name="cvrg_column" value="8"/> | |
143 <param name="coord_column" value="2"/> | |
144 <param name="qv_cutoff" value="20" /> | |
145 <param name="cvrg_cutoff" value="3" /> | |
146 <param name="snps_only" value="Yes"/> | |
147 <param name="interval" value="Yes" /> | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
148 <param name="diff" value="Yes" /> |
0 | 149 <param name="qc_base" value="No" /> |
150 </test> | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
151 </tests> |
0 | 152 <help> |
153 | |
154 **What it does** | |
155 | |
156 Allows one to find sequence variants and/or sites covered by a specified number of reads with bases above a set quality threshold. The tool works on six and ten column pileup formats produced with *samtools pileup* command. However, it also allows you to specify columns in the input file manually. The tool assumes the following: | |
157 | |
158 - the quality scores follow phred33 convention, where input qualities are ASCII characters equal to the Phred quality plus 33. | |
159 - the pileup dataset was produced by the *samtools pileup* command (although you can override this by setting column assignments manually). | |
160 | |
161 -------- | |
162 | |
163 **Types of pileup datasets** | |
164 | |
165 The descriptions of the following pileup formats are largely based on information that can be found on the SAMTools_ documentation page. The 6- and 10-column variants are described below. | |
166 | |
167 .. _SAMTools: http://samtools.sourceforge.net/pileup.shtml | |
168 | |
169 **Six column pileup**:: | |
170 | |
171 1 2 3 4 5 6 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
172 --------------------------------- |
0 | 173 chrM 412 A 2 ., II |
174 chrM 413 G 4 ..t, IIIH | |
175 chrM 414 C 4 ..Ta III2 | |
176 chrM 415 C 4 TTTt III7 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
177 |
0 | 178 where:: |
179 | |
180 Column Definition | |
181 ------- ---------------------------- | |
182 1 Chromosome | |
183 2 Position (1-based) | |
184 3 Reference base at that position | |
185 4 Coverage (# reads aligning over that position) | |
186 5 Bases within reads | |
187 6 Quality values (phred33 scale, see Galaxy wiki for more) | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
188 |
0 | 189 **Ten column pileup** |
190 | |
191 The `ten-column`__ pileup incorporates additional consensus information generated with the *-c* option of the *samtools pileup* command:: | |
192 | |
193 | |
194 1 2 3 4 5 6 7 8 9 10 | |
195 ------------------------------------------------ | |
196 chrM 412 A A 75 0 25 2 ., II | |
197 chrM 413 G G 72 0 25 4 ..t, IIIH | |
198 chrM 414 C C 75 0 25 4 ..Ta III2 | |
199 chrM 415 C T 75 75 25 4 TTTt III7 | |
200 | |
201 where:: | |
202 | |
203 Column Definition | |
204 ------- ---------------------------- | |
205 1 Chromosome | |
206 2 Position (1-based) | |
207 3 Reference base at that position | |
208 4 Consensus bases | |
209 5 Consensus quality | |
210 6 SNP quality | |
211 7 Maximum mapping quality | |
212 8 Coverage (# reads aligning over that position) | |
213 9 Bases within reads | |
214 10 Quality values (phred33 scale, see Galaxy wiki for more) | |
215 | |
216 | |
217 .. __: http://samtools.sourceforge.net/cns0.shtml | |
218 | |
219 ------ | |
220 | |
221 **The output format** | |
222 | |
223 The tool modifies the input dataset in two ways: | |
224 | |
225 1. It appends five columns to the end of every reported line: | |
226 | |
227 - Number of **A** variants | |
228 - Number of **C** variants | |
229 - Number of **G** variants | |
230 - Number of **T** variants | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
231 - Number of read bases covering this position, where quality is equal to or higher than the value set by **Do not consider read bases with quality lower than** option. |
0 | 232 |
233 Optionally, if **Print total number of differences?** is set to **Yes**, the tool will append the sixth column with the total number of deviants (see below). | |
234 | |
235 2. If **Convert coordinates to intervals?** is set to **Yes**, the tool replaces the position column (typically the second column) with a pair of tab-delimited start/end values. | |
236 | |
237 For example, if you are calling variants with base quality above 20 on this dataset:: | |
238 | |
239 chrM 412 A 2 ., II | |
240 chrM 413 G 4 ..t, III2 | |
241 chrM 414 C 4 ..Ta III2 | |
242 chrM 415 C 4 TTTt III7 | |
243 | |
244 you will get:: | |
245 | |
246 chrM 413 G 4 ..t, IIIH 0 0 2 1 3 | |
247 chrM 414 C 4 ..Ta III2 1 1 0 1 3 | |
248 chrM 415 C 4 TTTt III7 0 0 0 4 4 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
249 |
0 | 250 where:: |
251 | |
252 Column Definition | |
253 ------- ---------------------------- | |
254 1 Chromosome | |
255 2 Position (1-based) | |
256 3 Reference base at that position | |
257 4 Coverage (# reads aligning over that position) | |
258 5 Bases within reads | |
259 6 Quality values (phred33 scale, see Galaxy wiki for more) | |
260 7 Number of A variants | |
261 8 Number of C variants | |
262 9 Number of G variants | |
263 10 Number of T variants | |
264 11 Quality adjusted coverage: | |
265 12 Number of read bases (i.e., # of reads) with quality above the set threshold | |
266 13 Total number of deviants (if Print total number of differences? is set to Yes) | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
267 |
0 | 268 if **Print total number of differences?** is set to **Yes**, you will get:: |
269 | |
270 chrM 413 G 4 ..t, IIIH 0 0 2 1 3 1 | |
271 chrM 414 C 4 ..Ta III2 1 2 0 1 3 2 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
272 chrM 415 C 4 TTTt III7 0 0 0 4 4 0 |
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
273 |
0 | 274 Note the additional column 13, that contains the number of deviant reads (e.g., there are two deviants, T and a, for position 414). |
275 | |
276 Finally, if **Convert coordinates to intervals?** is set to **Yes**, you will get one additional column with the end coordinate:: | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
277 |
0 | 278 chrM 412 413 G 4 ..t, III2 0 0 2 1 3 |
279 chrM 413 414 C 4 ..Ta III2 1 2 0 1 3 | |
280 chrM 414 415 C 4 TTTt III7 0 0 0 4 4 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
281 |
0 | 282 where:: |
283 | |
284 Column Definition | |
285 ------- ---------------------------- | |
286 1 Chromosome | |
287 2 Start position (0-based) | |
288 3 End position (1-based) | |
289 4 Reference base at that position | |
290 5 Coverage (# reads aligning over that position) | |
291 6 Bases within reads | |
292 7 Quality values (phred33 scale, see Galaxy wiki for more) | |
293 8 Number of A variants | |
294 9 Number of C variants | |
295 10 Number of G variants | |
296 11 Number of T variants | |
297 12 Quality adjusted coverage | |
298 13 Total number of deviants (if Print total number of differences? is set to Yes) | |
299 | |
300 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
301 Note that in this case the coordinates of SNPs were converted to intervals, where the start coordinate is 0-based and the end coordinate is 1-based, following the UCSC Table Browser convention. |
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
302 |
0 | 303 Although three positions have variants in the original file (413, 414, and 415), only 413 and 415 are reported because the quality values associated with these two SNPs are above the threshold of 20. In the case of 414 the **a** allele has a quality value of 17 ( ord("2")-33 ), and is therefore not reported. Note that five columns have been added to each of the reported lines:: |
304 | |
305 chrM 413 G 4 ..t, IIIH 0 0 2 1 3 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
306 |
0 | 307 Here, there is one variant, **t**. Because the fourth column represents **T** counts, it is incremented by 1. The last column shows that at this position, three reads have bases above the quality threshold of 20. |
308 | |
309 ----- | |
310 | |
311 **Example 1**: Just variants | |
312 | |
313 In this mode, the tool only outputs the lines from the input datasets where at least one read contains a sequence variant with quality above the threshold set by the **Do not consider read bases with quality lower than** option. For example, suppose one has a pileup dataset like the following:: | |
314 | |
315 chrM 412 A 2 ., II | |
316 chrM 413 G 4 ..t, III2 | |
317 chrM 414 C 4 ..Ta III2 | |
318 chrM 415 C 4 TTTt III7 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
319 |
0 | 320 To call all variants (with no restriction by coverage) with quality above phred value of 20, we will need to set the parameters as follows: |
321 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
322 .. image:: pileup_parser_help1.png |
0 | 323 |
324 Running the tool with these parameters will return:: | |
325 | |
326 chrM 413 G 4 ..t, IIIH 0 0 0 1 3 | |
327 chrM 414 C 4 ..Ta III2 0 2 0 1 3 | |
328 chrM 415 C 4 TTTt III7 0 0 0 4 4 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
329 |
0 | 330 **Note** that the *a* variant at position 414 is not counted because it has an associated quality value of 17 (because ord('2')-33 = 17), which is below the phred threshold of 20 set by the **Do not consider read bases with quality lower than** parameter. |
331 | |
332 ----- | |
333 | |
334 **Example 2**: Report everything | |
335 | |
336 In addition to calling variants, it is often useful to know the quality adjusted coverage. Running the tool with these parameters: | |
337 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
338 .. image:: pileup_parser_help2.png |
0 | 339 |
340 will report everything from the original file:: | |
341 | |
342 chrM 412 A 2 ., II 2 0 0 0 2 | |
343 chrM 413 G 4 ..t, III2 0 0 2 1 3 | |
344 chrM 414 C 4 ..Ta III2 0 2 0 1 3 | |
345 chrM 415 C 4 TTTt III7 0 0 0 4 4 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
346 |
0 | 347 Here, you can see that although the total coverage at position 414 is 4 (column 4), the quality adjusted coverage is 3 (last column). This is because only three out of four reads have bases with quality above the set threshold of 20 (the actual qualities are III2 or, after conversion, 40, 40, 40, 17). |
348 | |
349 One can use the last column of this dataset to filter out (using Galaxy's **Filter** tool) positions where quality adjusted coverage (last column) is below a set threshold. | |
350 | |
351 ------ | |
352 | |
353 **Example 3**: Report everything and print total number of differences | |
354 | |
355 If you set the **Print total number of differences?** to **Yes** the tool will print an additional column with the total number of reads where a deviant base is above the quality threshold. So, setting parameters like this: | |
356 | |
1 | 357 .. image:: pileup_parser_help3.png |
0 | 358 |
359 will produce this:: | |
360 | |
361 chrM 412 A 2 ., II 2 0 0 0 2 0 | |
362 chrM 413 G 4 ..t, III2 0 0 2 1 3 1 | |
363 chrM 414 C 4 ..Ta III2 0 2 0 1 3 1 | |
364 chrM 415 C 4 TTTt III7 0 0 0 4 4 0 | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
365 |
0 | 366 ----- |
367 | |
368 **Example 4**: Report everything, print total number of differences, and ignore qualities and read bases | |
369 | |
370 Setting **Print quality and base string?** to **No** as shown here: | |
371 | |
1 | 372 .. image:: pileup_parser_help4.png |
0 | 373 |
374 will produce this:: | |
375 | |
376 chrM 412 A 2 2 0 0 0 2 0 | |
377 chrM 413 G 4 0 0 2 1 3 1 | |
378 chrM 414 C 4 0 2 0 1 3 1 | |
379 chrM 415 C 4 0 0 0 4 4 0 | |
380 </help> | |
2
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
381 <citations> |
85bedbea8a12
planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_parser commit ab627176cd4f6efe6d1fe4b85baa679aaa651eb1
devteam
parents:
1
diff
changeset
|
382 </citations> |
0 | 383 </tool> |