annotate bismark_wrapper/bismark_methylation_extractor.xml @ 1:183de9d00131 draft

add indices.loc files
author bjoern-gruening
date Tue, 25 Dec 2012 05:52:28 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
1 <tool id="bismark_methylation_extractor" name="Bismark" version="0.7.7.2">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
2 <!-- Wrapper compatible with Bismark version 0.7.7 -->
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
3 <description>methylation extractor</description>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
4 <!--<version_command>bismark_methylation_extractor version</version_command>-->
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
5 <requirements>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
6 <requirement type="set_environment">SCRIPT_PATH</requirement>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
7 <requirement type="package" version="0.12.8">bowtie</requirement>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
8 <requirement type="package" version="2.0.0-beta7">bowtie2</requirement>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
9 </requirements>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
10 <parallelism method="basic"></parallelism>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
11 <command interpreter="python">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
12 bismark_methylation_extractor.py
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
13
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
14 --infile $input
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
15
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
16 --bismark_path \$SCRIPT_PATH
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
17
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
18 #if $singlePaired.sPaired == "single":
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
19 --single-end
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
20 #else:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
21 --paired-end
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
22 $singlePaired.no_overlap
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
23 #end if
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
24
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
25 #if str($ignore_bps) != "0":
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
26 --ignore $ignore_bps
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
27 #end if
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
28
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
29 #if $report:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
30 --report-file $o_report
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
31 #end if
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
32
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
33 #if $comprehensive:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
34 --comprehensive
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
35 #end if
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
36
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
37 #if $merge_non_cpg:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
38 --merge-non-cpg
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
39 #end if
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
40
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
41 #if $compress:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
42 --compress $compressed_output
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
43 #else:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
44 #if not $comprehensive and not $merge_non_cpg:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
45 ## twelve files
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
46 --cpg_ot $cpg_ot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
47 --chg_ot $chg_ot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
48 --chh_ot $chh_ot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
49 --cpg_ctot $cpg_ctot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
50 --chg_ctot $chg_ctot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
51 --chh_ctot $chh_ctot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
52 --cpg_ob $cpg_ob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
53 --chg_ob $chg_ob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
54 --chh_ob $chh_ob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
55 --cpg_ctob $cpg_ctob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
56 --chg_ctob $chg_ctob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
57 --chh_ctob $chh_ctob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
58 #elif $merge_non_cpg and $comprehensive:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
59 ## two files
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
60 --non_cpg_context $non_cpg_context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
61 --cpg_context $cpg_context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
62 #elif $comprehensive:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
63 ## three files
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
64 --cpg_context $cpg_context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
65 --chg_context $chg_context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
66 --chh_context $chh_context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
67 #elif $merge_non_cpg:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
68 ## eight files
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
69 --non_cpg_context_ctot $non_cpg_context_ctot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
70 --non_cpg_context_ot $non_cpg_context_ot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
71 --non_cpg_context_ob $non_cpg_context_ob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
72 --non_cpg_context_ctob $non_cpg_context_ctob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
73 --cpg_ot $cpg_ot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
74 --cpg_ctot $cpg_ctot
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
75 --cpg_ob $cpg_ob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
76 --cpg_ctob $cpg_ctob
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
77 #end if
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
78 ## end compress
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
79 #end if
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
80
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
81 </command>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
82 <inputs>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
83 <!-- Input Parameters -->
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
84 <param name="input" type="data" format="sam" label="SAM file from Bismark bisulfite mapper" />
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
85 <conditional name="singlePaired">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
86 <param name="sPaired" type="select" label="Is this library mate-paired?">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
87 <option value="single">Single-end</option>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
88 <option value="paired">Paired-end</option>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
89 </param>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
90 <when value="single" />
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
91 <when value="paired">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
92 <param name="no_overlap" type="boolean" truevalue="--no-overlap" falsevalue="" checked="False" label="This option avoids scoring overlapping methylation calls twice, in case of overlapping read one and read two" help="" />
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
93 </when>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
94 </conditional>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
95
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
96 <param name="ignore_bps" type="integer" value="0" label="Ignore the first N bp when processing the methylation call string" />
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
97 <param name="comprehensive" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Merge all four possible strand-specific methylation info
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
98 into context-dependent output files" help="" />
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
99 <param name="merge_non_cpg" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Merge all non-CpG contexts into one file" help="This will produce eight strand-specific output files, or two output files in comprehensive mode." />
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
100 <param name="report" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Short methylation summary output" />
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
101 <param name="compress" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Compress all result files and output one single file" />
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
102
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
103 </inputs>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
104 <outputs>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
105 <!--
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
106 OT – original top strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
107 CTOT – complementary to original top strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
108 OB – original bottom strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
109 CTOB – complementary to original bottom strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
110 -->
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
111 <data format="tabular" name="o_report" label="${tool.name} on ${on_string}: Report file">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
112 <filter> ( report is True ) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
113 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
114
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
115 <!-- default output 12 files -->
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
116 <data format="tabular" name="cpg_ot" label="${tool.name} on ${on_string}: CpG original top strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
117 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
118 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
119 <data format="tabular" name="chg_ot" label="${tool.name} on ${on_string}: CHG original top strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
120 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
121 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
122 <data format="tabular" name="chh_ot" label="${tool.name} on ${on_string}: CHH original top strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
123 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
124 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
125 <data format="tabular" name="cpg_ctot" label="${tool.name} on ${on_string}: CpG complementary to top strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
126 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
127 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
128 <data format="tabular" name="chg_ctot" label="${tool.name} on ${on_string}: CHG complementary to top strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
129 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
130 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
131 <data format="tabular" name="chh_ctot" label="${tool.name} on ${on_string}: CHH complementary to top strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
132 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
133 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
134
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
135 <data format="tabular" name="cpg_ob" label="${tool.name} on ${on_string}: CpG original bottom strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
136 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
137 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
138 <data format="tabular" name="chg_ob" label="${tool.name} on ${on_string}: CHG original bottom strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
139 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
140 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
141 <data format="tabular" name="chh_ob" label="${tool.name} on ${on_string}: CHH original bottom strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
142 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
143 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
144 <data format="tabular" name="cpg_ctob" label="${tool.name} on ${on_string}: CpG complementary to bottom strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
145 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
146 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
147 <data format="tabular" name="chg_ctob" label="${tool.name} on ${on_string}: CHG complementary to bottom strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
148 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
149 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
150 <data format="tabular" name="chh_ctob" label="${tool.name} on ${on_string}: CHH complementary to bottom strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
151 <filter> ( compress == False and comprehensive == False and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
152 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
153
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
154 <!-- Context-dependent methylation output files (comprehensive option) -->
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
155 <data format="tabular" name="cpg_context" label="${tool.name} on ${on_string}: CpG context dependent">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
156 <filter> ( compress == False and comprehensive) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
157 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
158 <data format="tabular" name="chg_context" label="${tool.name} on ${on_string}: CHG context dependent">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
159 <filter> ( compress == False and comprehensive and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
160 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
161 <data format="tabular" name="chh_context" label="${tool.name} on ${on_string}: CHH context dependent">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
162 <filter> ( compress == False and comprehensive and merge_non_cpg == False) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
163 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
164
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
165 <data format="tabular" name="non_cpg_context" label="${tool.name} on ${on_string}: Non CpG context dependent">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
166 <filter> ( compress == False and comprehensive and merge_non_cpg) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
167 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
168
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
169 <data format="tabular" name="non_cpg_context_ot" label="${tool.name} on ${on_string}: Non CpG context dependent on original top strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
170 <filter> ( compress == False and comprehensive == False and merge_non_cpg) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
171 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
172 <data format="tabular" name="non_cpg_context_ctot" label="${tool.name} on ${on_string}: Non CpG context dependent on complementary to top strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
173 <filter> ( compress == False and comprehensive == False and merge_non_cpg) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
174 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
175 <data format="tabular" name="non_cpg_context_ob" label="${tool.name} on ${on_string}: Non CpG context dependent on original bottom strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
176 <filter> ( compress == False and comprehensive == False and merge_non_cpg) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
177 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
178 <data format="tabular" name="non_cpg_context_ctob" label="${tool.name} on ${on_string}: Non CpG context dependent on complementary to bottom strand">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
179 <filter> ( compress == False and comprehensive == False and merge_non_cpg) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
180 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
181
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
182 <data format="gzipped" name="compressed_output" label="${tool.name} on ${on_string}: Result archive.">
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
183 <filter> ( compress ) </filter>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
184 </data>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
185 </outputs>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
186
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
187 <tests>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
188 </tests>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
189
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
190 <help>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
191
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
192 **What it does**
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
193
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
194 The following is a brief description of all options to control the Bismark_
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
195 methylation extractor. The script reads in a bisulfite read alignment results file
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
196 produced by the Bismark bisulfite mapper and extracts the methylation information
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
197 for individual cytosines. This information is found in the methylation call field
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
198 which can contain the following characters:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
199
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
200
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
201 - X = for methylated C in CHG context (was protected)
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
202 - x = for not methylated C in CHG context (was converted)
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
203 - H = for methylated C in CHH context (was protected)
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
204 - h = for not methylated C in CHH context (was converted)
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
205 - Z = for methylated C in CpG context (was protected)
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
206 - z = for not methylated C in CpG context (was converted)
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
207 - . = for any bases not involving cytosines
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
208
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
209
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
210 The methylation extractor outputs result files for cytosines in CpG, CHG and CHH
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
211 context (this distinction is actually already made in Bismark itself). As the methylation
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
212 information for every C analysed can produce files which easily have tens or even hundreds of
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
213 millions of lines, file sizes can become very large and more difficult to handle. The C
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
214 methylation info additionally splits cytosine methylation calls up into one of the four possible
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
215 strands a given bisulfite read aligned against:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
216
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
217 - OT = original top strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
218 - CTOT = complementary to original top strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
219
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
220 - OB = original bottom strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
221 - CTOB = complementary to original bottom strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
222
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
223 Thus, by default twelve individual output files are being generated per input file (unless
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
224 --comprehensive is specified, see below). The output files can be imported into a genome
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
225 viewer, such as SeqMonk, and re-combined into a single data group if desired (in fact
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
226 unless the bisulfite reads were generated preserving directionality it doesn't make any
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
227 sense to look at the data in a strand-specific manner). Strand-specific output files can
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
228 optionally be skipped, in which case only three output files for CpG, CHG or CHH context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
229 will be generated. For both the strand-specific and comprehensive outputs there is also
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
230 the option to merge both non-CpG contexts (CHG and CHH) into one single non-CpG context.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
231
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
232
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
233 .. _Bismark: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
234
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
235
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
236 It is developed by Krueger F and Andrews SR. at the Babraham Institute. Krueger F, Andrews SR. (2011) Bismark: a flexible aligner and methylation caller for Bisulfite-Seq applications. Bioinformatics, 27, 1571-2.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
237
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
238 -------
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
239
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
240 **Bismark settings**
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
241
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
242 All of the options have a default value. You can change any of them. If any Bismark function is missing please contact the tool author or your Galaxy admin.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
243
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
244 ------
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
245
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
246 **Outputs**
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
247
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
248 The output files are in the following format (tab delimited)::
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
249
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
250
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
251 Column Description
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
252 -------- --------------------------------------------------------
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
253 1 seq-ID
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
254 2 strand
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
255 3 chromosome
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
256 4 position
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
257 5 methylation call
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
258
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
259
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
260 * Methylated cytosines receive a '+' orientation,
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
261 * Unmethylated cytosines receive a '-' orientation.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
262
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
263 ------
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
264
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
265 **OPTIONS**
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
266
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
267 Input::
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
268
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
269 -s/--single-end Input file(s) are Bismark result file(s) generated from single-end
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
270 read data. Specifying either --single-end or --paired-end is
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
271 mandatory.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
272
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
273 -p/--paired-end Input file(s) are Bismark result file(s) generated from paired-end
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
274 read data. Specifying either --paired-end or --single-end is
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
275 mandatory.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
276
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
277 --no_overlap For paired-end reads it is theoretically possible that read_1 and
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
278 read_2 overlap. This option avoids scoring overlapping methylation
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
279 calls twice. Whilst this removes a bias towards more methylation calls
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
280 towards the center of sequenced fragments, it can de facto remove
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
281 a good proportion of the data.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
282
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
283 --ignore INT Ignore the first INT bp at the 5' end of each read when processing the
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
284 methylation call string. This can remove e.g. a restriction enzyme site
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
285 at the start of each read.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
286
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
287 Output::
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
288
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
289 --comprehensive Specifying this option will merge all four possible strand-specific
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
290 methylation info into context-dependent output files. The default
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
291 contexts are:
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
292 - CpG context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
293 - CHG context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
294 - CHH context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
295
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
296 --merge_non_CpG This will produce two output files (in --comprehensive mode) or eight
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
297 strand-specific output files (default) for Cs in
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
298 - CpG context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
299 - non-CpG context
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
300
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
301 --report Prints out a short methylation summary as well as the parameters used to run
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
302 this script.
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
303
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
304
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
305 </help>
183de9d00131 add indices.loc files
bjoern-gruening
parents:
diff changeset
306 </tool>