annotate mergeBed.xml @ 1:82aac94b06c3 draft

Uploaded
author iuc
date Thu, 08 Jan 2015 14:25:51 -0500
parents b8348686a0b9
children 457b09031d57
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
1 <tool id="bedtools_mergebed" name="Merge BED files" version="@WRAPPER_VERSION@.0">
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
2 <description>(mergeBed)</description>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
3 <macros>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
4 <import>macros.xml</import>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
5 </macros>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
6 <expand macro="requirements" />
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
7 <expand macro="stdio" />
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
8 <command>
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
9 <![CDATA[
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
10 mergeBed
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
11 -i "${input}"
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
12 $strand
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
13 -d $distance
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
14 $header
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
15 > "${output}"
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
16 ]]>
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
17 </command>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
18 <inputs>
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
19 <param name="input" format="bam,bed,gff,vcf" type="data" label="Merge the following BAM/BED/VCF/GFF file"/>
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
20 <param name="strand" type="select" label="Calculation based on strandedness?">
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
21 <option value="" selected="True">Overlaps on either strand</option>
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
22 <option value="-s">Force strandedness. That is, only merge features that are on the same strand.</option>
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
23 <option value="-S +">Force merge for forward strand only.</option>
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
24 <option value="-S -">Force merge for reverse strand only.</option>
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
25 </param>
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
26 <param name="distance" type="integer" value="0"
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
27 label="Maximum distance between features allowed for features to be merged"
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
28 help="With the default of 0, only overlapping and/or book-ended features are merged. (-d)"/>
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
29 <expand macro="print_header" />
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
30 <expand macro="choose_columns" />
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
31 <expand macro="choose_operations">
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
32 <expand macro="math_options" />
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
33 <expand macro="additional_math_options" />
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
34 </expand>
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
35 </inputs>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
36 <outputs>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
37 <data format="bed" name="output" metadata_source="input" label="Merged ${input.name}"/>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
38 </outputs>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
39 <tests>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
40 <test>
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
41 <param name="input" value="mergedBed1.bed" ftype="bed" />
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
42 <output name="output" file="mergedBed_result1.bed" ftype="bed" />
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
43 </test>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
44 <test>
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
45 <param name="input" value="mergedBed2.bed" ftype="bed" />
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
46 <param name="strand" value="-s" />
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
47 <output name="output" file="mergedBed_result2.bed" ftype="bed" />
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
48 </test>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
49 <test>
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
50 <param name="input" value="mergedBed3.bed" ftype="bed" />
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
51 <param name="report_number" value="-n" />
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
52 <output name="output" file="mergedBed_result3.bed" ftype="bed" />
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
53 </test>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
54 <test>
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
55 <param name="input" value="mergedBed4.bed" ftype="bed" />
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
56 <param name="distance" value="1000" />
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
57 <output name="output" file="mergedBed_result4.bed" ftype="bed" />
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
58 </test>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
59 </tests>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
60 <help>
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
61 <![CDATA[
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
62 **What it does**
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
63
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
64 bedtools merge combines overlapping or "book-ended" features in an interval file into a single feature which spans all of the combined features.
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
65
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
66
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
67 .. image:: $PATH_TO_IMAGES/merge-glyph.png
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
68
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
69
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
70 .. class:: warningmark
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
71
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
72 bedtools merge requires that you presort your data by chromosome and then by start position.
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
73
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
74
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
75 ==========================================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
76 Default behavior
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
77 ==========================================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
78 By default, ``bedtools merge`` combines overlapping (by at least 1 bp) and/or
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
79 bookended intervals into a single, "flattened" or "merged" interval.
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
80
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
81 ::
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
82
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
83 $ cat A.bed
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
84 chr1 100 200
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
85 chr1 180 250
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
86 chr1 250 500
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
87 chr1 501 1000
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
88
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
89 $ bedtools merge -i A.bed
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
90 chr1 100 500
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
91 chr1 501 1000
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
92
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
93
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
94 ==========================================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
95 *-s* Enforcing "strandedness"
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
96 ==========================================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
97 The ``-s`` option will only merge intervals that are overlapping/bookended
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
98 *and* are on the same strand.
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
99
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
100 ::
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
101
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
102 $ cat A.bed
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
103 chr1 100 200 a1 1 +
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
104 chr1 180 250 a2 2 +
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
105 chr1 250 500 a3 3 -
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
106 chr1 501 1000 a4 4 +
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
107
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
108 $ bedtools merge -i A.bed -s
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
109 chr1 100 250 +
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
110 chr1 501 1000 +
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
111 chr1 250 500 -
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
112
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
113
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
114 ==========================================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
115 *-n* Reporting the number of features that were merged
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
116 ==========================================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
117 The ``-n`` option will report the number of features that were combined from the
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
118 original file in order to make the newly merged feature. If a feature in the
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
119 original file was not merged with any other features, a "1" is reported.
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
120
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
121 ::
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
122
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
123 $ cat A.bed
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
124 chr1 100 200
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
125 chr1 180 250
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
126 chr1 250 500
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
127 chr1 501 1000
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
128
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
129 $ bedtools merge -i A.bed -n
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
130 chr1 100 500 3
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
131 chr1 501 1000 1
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
132
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
133
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
134 ==========================================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
135 *-d* Controlling how close two features must be in order to merge
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
136 ==========================================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
137 By default, only overlapping or book-ended features are combined into a new
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
138 feature. However, one can force ``merge`` to combine more distant features
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
139 with the ``-d`` option. For example, were one to set ``-d`` to 1000, any
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
140 features that overlap or are within 1000 base pairs of one another will be
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
141 combined.
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
142
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
143 ::
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
144
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
145 $ cat A.bed
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
146 chr1 100 200
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
147 chr1 501 1000
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
148
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
149 $ bedtools merge -i A.bed
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
150 chr1 100 200
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
151 chr1 501 1000
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
152
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
153 $ bedtools merge -i A.bed -d 1000
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
154 chr1 100 1000
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
155
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
156
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
157 =============================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
158 *-nms* Reporting the names of the features that were merged
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
159 =============================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
160 Occasionally, one might like to know the names of the features that were
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
161 merged into a new feature. The ``-nms`` option will add an extra column to the
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
162 ``merge`` output which lists (separated by semicolons) the names of the
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
163 merged features.
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
164
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
165 ::
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
166
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
167 $ cat A.bed
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
168 chr1 100 200 A1
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
169 chr1 150 300 A2
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
170 chr1 250 500 A3
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
171
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
172 $ bedtools merge -i A.bed -nms
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
173 chr1 100 500 A1;A2;A3
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
174
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
175
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
176 ===============================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
177 *-scores* Reporting the scores of the features that were merged
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
178 ===============================================================
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
179 Similarly, we might like to know the scores of the features that were
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
180 merged into a new feature. Enter the ``-scores`` option. One can specify
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
181 how the scores from each overlapping interval should be reported.
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
182
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
183 ::
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
184
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
185 $ cat A.bed
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
186 chr1 100 200 A1 1
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
187 chr1 150 300 A2 2
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
188 chr1 250 500 A3 3
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
189
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
190 $ bedtools merge -i A.bed -scores mean
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
191 chr1 100 500 2
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
192
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
193 $ bedtools merge -i A.bed -scores max
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
194 chr1 100 500 3
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
195
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
196 $ bedtools merge -i A.bed -scores collapse
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
197 chr1 100 500 1,2,3
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
198
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
199 @REFERENCES@
1
82aac94b06c3 Uploaded
iuc
parents: 0
diff changeset
200 ]]>
0
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
201 </help>
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
202 <expand macro="citations" />
b8348686a0b9 Imported from capsule None
iuc
parents:
diff changeset
203 </tool>