comparison macs2_callpeak.xml @ 8:e8a060164e11 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/macs2 commit 4e2bb09986aebf442f2981e8d77aa512d4c86b90
author iuc
date Wed, 27 Dec 2017 10:18:03 -0500
parents f5d67c722d67
children acbd3fb47f90
comparison
equal deleted inserted replaced
7:f5d67c722d67 8:e8a060164e11
1 <tool id="macs2_callpeak" name="MACS2 callpeak" version="@VERSION_STRING@.0"> 1 <tool id="macs2_callpeak" name="MACS2 callpeak" version="@VERSION_STRING@.1">
2 <description>Call peaks from alignment results</description> 2 <description>Call peaks from alignment results</description>
3 <macros> 3 <macros>
4 <import>macs2_macros.xml</import> 4 <import>macs2_macros.xml</import>
5 </macros> 5 </macros>
6 <expand macro="requirements"> 6 <expand macro="requirements">
7 </expand> 7 </expand>
8 <expand macro="stdio" /> 8 <expand macro="stdio" />
9 <expand macro="version_command" /> 9 <expand macro="version_command" />
10 <command> 10 <command><![CDATA[
11 <![CDATA[
12 #set $temp_stderr = 'macs2_stderr' 11 #set $temp_stderr = 'macs2_stderr'
13 (macs2 callpeak 12 (macs2 callpeak
14 13
15 --name 'MACS2' 14 --name 'MACS2'
16 -t ${ ' '.join( map( lambda x:'"%s"' % ( x ), $input_treatment_file ) ) } 15
17 16 ## Treatment File(s)
18 #if str( $input_control_file ) != 'None': 17
19 -c ${ ' '.join( map( lambda x:'"%s"' % ( x ), $input_control_file ) ) } 18 #if str($treatment.t_multi_select) == "Yes":
19 -t ${ ' '.join( map( lambda x:'"%s"' % ( x ), '$treatment.input_treatment_file' ) ) }
20
21 #if '$treatment.input_treatment_file[0].ext.upper()' == "BAM" and $bampe:
22 --format BAMPE
23 #else
24 --format='$treatment.input_treatment_file[0].ext.upper()'
25 #end if
26
27 #else
28 -t '$treatment.input_treatment_file'
29
30 #if '$treatment.input_treatment_file.ext.upper()' == "BAM" and $bampe:
31 --format BAMPE
32 #else
33 --format='$treatment.input_treatment_file.ext.upper()'
34 #end if
20 #end if 35 #end if
21 36
22 #for $ifile in $input_treatment_file: 37 ## Control File(s)
23 #if $ifile.ext.upper() == "BAM" and $bampe: 38
24 --format BAMPE 39 #if str($control.c_select) == "Yes":
25 #else 40 #if str($control.c_multiple.c_multi_select) == "Yes":
26 --format='$ifile.ext.upper()' 41 -c ${ ' '.join( map( lambda x:'"%s"' % ( x ), '$control.c_multiple.input_control_file' ) ) }
42 #else
43 -c '$control.c_multiple.input_control_file'
44 #end if
27 #end if 45 #end if
28 #end for
29 46
30 @effective_genome_size@ 47 @effective_genome_size@
31 48
32 --bw '${band_width}' 49 --bw '${band_width}'
33 @mfold_command@ 50 @mfold_command@
40 --slocal $advanced_options.slocal 57 --slocal $advanced_options.slocal
41 --llocal $advanced_options.llocal 58 --llocal $advanced_options.llocal
42 #if $advanced_options.broad_options.broad_options_selector == "broad": 59 #if $advanced_options.broad_options.broad_options_selector == "broad":
43 --broad 60 --broad
44 --broad-cutoff='${ advanced_options.broad_options.broad_cutoff }' 61 --broad-cutoff='${ advanced_options.broad_options.broad_cutoff }'
45 #else: 62 #else
46 $advanced_options.broad_options.call_summits 63 $advanced_options.broad_options.call_summits
47 #end if 64 #end if
48 65
49 #if str( $advanced_options.keep_dup_options.keep_dup_options_selector ) == "user": 66 #if str( $advanced_options.keep_dup_options.keep_dup_options_selector ) == "user":
50 --keep-dup '${ advanced_options.keep_dup_options.user_keepdup }' 67 --keep-dup '${ advanced_options.keep_dup_options.user_keepdup }'
102 #end if 119 #end if
103 && 120 &&
104 exit_code_for_galaxy=\$? && 121 exit_code_for_galaxy=\$? &&
105 cat $temp_stderr 2>&1 && 122 cat $temp_stderr 2>&1 &&
106 (exit \$exit_code_for_galaxy) 123 (exit \$exit_code_for_galaxy)
107 ]]> 124 ]]></command>
108 </command>
109 <inputs> 125 <inputs>
110 <param name="input_treatment_file" type="data" format="bam,sam,bed" multiple="true" 126 <conditional name="treatment">
111 label="ChIP-Seq Treatment File" /> 127 <param name="t_multi_select" type="select" label="Are you pooling Treatment Files?" help="For more information, see Help section below" >
112 <param name="input_control_file" type="data" format="bam,sam,bed" multiple="true" optional="True" 128 <option value="No" selected="True">No</option>
113 label="ChIP-Seq Control File" /> 129 <option value="Yes">Yes</option>
130 </param>
131 <when value="No" >
132 <param name="input_treatment_file" argument="-t" type="data" format="bam,sam,bed" label="ChIP-Seq Treatment File" />
133 </when>
134 <when value="Yes">
135 <param name="input_treatment_file" argument="-t" type="data" format="bam,sam,bed" multiple="true" label="ChIP-Seq Treatment File" />
136 </when>
137 </conditional>
138
139 <conditional name="control">
140 <param name="c_select" type="select" label="Do you have a Control File?" >
141 <option value="Yes" selected="True">Yes</option>
142 <option value="No">No</option>
143 </param>
144 <when value="Yes">
145 <conditional name="c_multiple">
146 <param name="c_multi_select" type="select" label="Are you pooling Control Files?" help="For more information, see Help section below" >
147 <option value="No" selected="True">No</option>
148 <option value="Yes">Yes</option>
149 </param>
150 <when value="No" >
151 <param name="input_control_file" argument="-c" type="data" format="bam,sam,bed" label="ChIP-Seq Control File" />
152 </when>
153 <when value="Yes">
154 <param name="input_control_file" argument="-c" type="data" format="bam,sam,bed" multiple="true" label="ChIP-Seq Control File" />
155 </when>
156 </conditional>
157 </when>
158 <when value="No" />
159 </conditional>
114 160
115 <param name="bampe" type="boolean" truevalue="--format BAMPE" falsevalue="" checked="False" 161 <param name="bampe" type="boolean" truevalue="--format BAMPE" falsevalue="" checked="False"
116 label="Are your inputs Paired-end BAM files?" 162 label="Are your inputs Paired-end BAM files?"
117 help="The 'Build model step' will be ignored and the real fragments will be used for each template defined by leftmost and rightmost mapping positions. (--format BAMPE)"/> 163 help="The 'Build model step' will be ignored and the real fragments will be used for each template defined by leftmost and rightmost mapping positions. (--format BAMPE)"/>
118 164
139 <option value="create_model" selected="true">Build the shifting model</option> 185 <option value="create_model" selected="true">Build the shifting model</option>
140 </param> 186 </param>
141 <when value="create_model"/> 187 <when value="create_model"/>
142 <when value="nomodel"> 188 <when value="nomodel">
143 <param name="extsize" type="integer" value="200" label="Set extension size" help="The arbitrary extension size in bp. When nomodel is true, MACS will use this value as fragment size to extend each read towards 3-prime; end, then pile them up. It is exactly twice the number of obsolete SHIFTSIZE. In previous language, each read is moved 5-prime-to-3-prime direction to middle of fragment by 0.5 d, then extended to both direction with 0.5 d. This is equivalent to say each read is extended towards 5-prime-to-3-prime into a d size fragment. --extsize (this option) and --shift (the option below) can be combined when necessary. See --shift option below. Default = 200 (--extsize)."/> 189 <param name="extsize" type="integer" value="200" label="Set extension size" help="The arbitrary extension size in bp. When nomodel is true, MACS will use this value as fragment size to extend each read towards 3-prime; end, then pile them up. It is exactly twice the number of obsolete SHIFTSIZE. In previous language, each read is moved 5-prime-to-3-prime direction to middle of fragment by 0.5 d, then extended to both direction with 0.5 d. This is equivalent to say each read is extended towards 5-prime-to-3-prime into a d size fragment. --extsize (this option) and --shift (the option below) can be combined when necessary. See --shift option below. Default = 200 (--extsize)."/>
144 <param name="shift" type="integer" value="0" label="Set shift size" help="(NOT the legacy --shiftsize option!) The arbitrary shift in bp. Use discretion while setting it other than default value. When NOMODEL is set, MACS will use this value to move cutting ends (5-prime) towards 5-prime-to-3-prime direction then apply EXTSIZE to extend them to fragments. When this value is negative, ends will be moved toward 3-prime-to-5-prime direction. Recommended to keep it as default 0 for ChIP-Seq datasets, or -1 * 0.5 of --extsize (option above) together with --extsize option for detecting enriched cutting loci such as certain DNAseI-Seq datasets. Note, you can't set values other than 0 if format is BAMPE for paired-end data. Default = 0 (--shift)."/> 190 <param name="shift" type="integer" value="0" label="Set shift size" help="(NOT the legacy --shiftsize option!) The arbitrary shift in bp. Use discretion while setting it other than default value. When NOMODEL is set, MACS will use this value to move cutting ends (5-prime) towards 5-prime-to-3-prime direction then apply EXTSIZE to extend them to fragments. When this value is negative, ends will be moved toward 3-prime-to-5-prime direction. Recommended to keep it as default 0 for ChIP-Seq datasets, or -1 * 0.5 of --extsize (option above) together with --extsize option for detecting enriched cutting loci such as certain DNAseI-Seq datasets. Note, you can't set values other than 0 if format is paired-end data (BAMPE). Default = 0 (--shift)."/>
145 </when> 191 </when>
146 </conditional> 192 </conditional>
147 193
148 <param name="outputs" type="select" display="checkboxes" multiple="True" optional="false" label="Outputs" help="PDF only created when model is build"> 194 <param name="outputs" type="select" display="checkboxes" multiple="True" optional="True" label="Additional Outputs" help="PDF is only created when the model is built">
149 <option value="peaks_tabular" selected="True">Peaks as tabular file</option> 195 <option value="peaks_tabular">Peaks as tabular file</option>
150 <option value="summits" selected="true">Peak summits</option> 196 <option value="summits">Peak summits</option>
151 <option value="bdg" selected="true">Scores in bedGraph files (--bdg)</option> 197 <option value="bdg" >Scores in bedGraph files (--bdg)</option>
152 <option value="html">Summary page (html)</option> 198 <option value="html">Summary page (html)</option>
153 <option value="pdf">Plot in PDF</option> 199 <option value="pdf">Plot in PDF</option>
154 </param> 200 </param>
155 201
156 <conditional name="advanced_options"> 202 <conditional name="advanced_options">
157 <param name="advanced_options_selector" type="select" label="Advanced options"> 203 <param name="advanced_options_selector" type="select" label="Advanced Options">
158 <option value="off" selected="true">Hide advanced options</option> 204 <option value="off" selected="true">Hide advanced options</option>
159 <option value="on">Display advanced options</option> 205 <option value="on">Display advanced options</option>
160 </param> 206 </param>
161 <when value="on"> 207 <when value="on">
162 <param name="to_large" type="boolean" truevalue="--to-large" falsevalue="" checked="False" 208 <param name="to_large" type="boolean" truevalue="--to-large" falsevalue="" checked="False"
193 </conditional> 239 </conditional>
194 </inputs> 240 </inputs>
195 <outputs> 241 <outputs>
196 <!--callpeaks output--> 242 <!--callpeaks output-->
197 <data name="output_tabular" format="tabular" label="${tool.name} on ${on_string} (Peaks in tabular format)"> 243 <data name="output_tabular" format="tabular" label="${tool.name} on ${on_string} (Peaks in tabular format)">
198 <filter>'peaks_tabular' in outputs</filter> 244 <filter> outputs and 'peaks_tabular' in outputs</filter>
199 </data> 245 </data>
200 <data name="output_broadpeaks" format="bed" from_work_dir="MACS2_peaks.broadPeak" label="${tool.name} on ${on_string} (broad Peaks)"> 246 <data name="output_broadpeaks" format="bed" from_work_dir="MACS2_peaks.broadPeak" label="${tool.name} on ${on_string} (broad Peaks)">
201 <filter> 247 <filter>
202 (( 248 ((
203 advanced_options['advanced_options_selector'] == "on" and 249 advanced_options['advanced_options_selector'] == "on" and
222 advanced_options['broad_options']['broad_options_selector'] == "nobroad" 268 advanced_options['broad_options']['broad_options_selector'] == "nobroad"
223 )) 269 ))
224 </filter> 270 </filter>
225 </data> 271 </data>
226 <data name="output_summits" format="bed" from_work_dir="MACS2_summits.bed" label="${tool.name} on ${on_string} (summits in BED)"> 272 <data name="output_summits" format="bed" from_work_dir="MACS2_summits.bed" label="${tool.name} on ${on_string} (summits in BED)">
227 <filter>'summits' in outputs</filter> 273 <filter>outputs and 'summits' in outputs</filter>
228 </data> 274 </data>
229 <data name="output_plot" format="pdf" from_work_dir="MACS2_model.pdf" label="${tool.name} on ${on_string} (plot)"> 275 <data name="output_plot" format="pdf" from_work_dir="MACS2_model.pdf" label="${tool.name} on ${on_string} (plot)">
230 <filter> 276 <filter>
231 (( 277 ((
232 'pdf' in outputs and 278 outputs and 'pdf' in outputs and
233 nomodel_type['nomodel_type_selector'] == "create_model" 279 nomodel_type['nomodel_type_selector'] == "create_model"
234 )) 280 ))
235 </filter> 281 </filter>
236 </data> 282 </data>
237 <data name="output_treat_pileup" format="bedgraph" from_work_dir="MACS2_treat_pileup.bdg" label="${tool.name} on ${on_string} (Bedgraph Treatment)"> 283 <data name="output_treat_pileup" format="bedgraph" from_work_dir="MACS2_treat_pileup.bdg" label="${tool.name} on ${on_string} (Bedgraph Treatment)">
238 <filter>'bdg' in outputs</filter> 284 <filter>outputs and 'bdg' in outputs</filter>
239 </data> 285 </data>
240 <data name="output_control_lambda" format="bedgraph" from_work_dir="MACS2_control_lambda.bdg" label="${tool.name} on ${on_string} (Bedgraph Control)"> 286 <data name="output_control_lambda" format="bedgraph" from_work_dir="MACS2_control_lambda.bdg" label="${tool.name} on ${on_string} (Bedgraph Control)">
241 <filter>'bdg' in outputs</filter> 287 <filter>outputs and 'bdg' in outputs</filter>
242 </data> 288 </data>
243 <data name="output_extra_files" format="html" label="${tool.name} on ${on_string} (html report)"> 289 <data name="output_extra_files" format="html" label="${tool.name} on ${on_string} (html report)">
244 <filter>'html' in outputs</filter> 290 <filter>outputs and 'html' in outputs</filter>
245 </data> 291 </data>
246 </outputs> 292 </outputs>
247 <tests> 293 <tests>
248 <test> 294 <test expect_num_outputs="5">
295 <param name="input_treatment_file" value="ChIP_200K.bed" ftype="bed"/>
296 <param name="c_select" value="Yes"/>
249 <param name="input_control_file" value="Control_200K.bed" ftype="bed"/> 297 <param name="input_control_file" value="Control_200K.bed" ftype="bed"/>
250 <param name="input_treatment_file" value="ChIP_200K.bed" ftype="bed"/>
251 <param name="cutoff_options_selector" value="qvalue"/> 298 <param name="cutoff_options_selector" value="qvalue"/>
252 <param name="qvalue" value="0.05"/> 299 <param name="qvalue" value="0.05"/>
253 <param name="band_width" value="300"/> 300 <param name="band_width" value="300"/>
254 <param name="outputs" value="peaks_tabular,bdg,html"/> 301 <param name="outputs" value="peaks_tabular,bdg,html"/>
255 <param name="effective_genome_size_options_selector" value="user_defined" /> 302 <param name="effective_genome_size_options_selector" value="user_defined" />
264 <has_text text="Additional output created by MACS2" /> 311 <has_text text="Additional output created by MACS2" />
265 </assert_contents> 312 </assert_contents>
266 </output> 313 </output>
267 314
268 </test> 315 </test>
269 <test> 316 <!-- Ensure pdf can be output -->
317 <test expect_num_outputs="2">
318 <param name="input_treatment_file" value="ChIP_200K.bed" ftype="bed"/>
319 <param name="c_select" value="Yes"/>
270 <param name="input_control_file" value="Control_200K.bed" ftype="bed"/> 320 <param name="input_control_file" value="Control_200K.bed" ftype="bed"/>
271 <param name="input_treatment_file" value="ChIP_200K.bed" ftype="bed"/>
272 <param name="cutoff_options_selector" value="qvalue"/> 321 <param name="cutoff_options_selector" value="qvalue"/>
273 <param name="qvalue" value="0.05"/> 322 <param name="qvalue" value="0.05"/>
274 <param name="band_width" value="300"/> 323 <param name="band_width" value="300"/>
275 <param name="outputs" value="pdf"/> 324 <param name="outputs" value="pdf"/>
276 <param name="effective_genome_size_options_selector" value="user_defined" /> 325 <param name="effective_genome_size_options_selector" value="user_defined" />
278 <param name="lower" value="5" /> 327 <param name="lower" value="5" />
279 <param name="upper" value="50" /> 328 <param name="upper" value="50" />
280 <output name="output_plot" file="magic.pdf" ftype="pdf" compare="contains" /> 329 <output name="output_plot" file="magic.pdf" ftype="pdf" compare="contains" />
281 </test> 330 </test>
282 </tests> 331 </tests>
283 <help> 332 <help><![CDATA[
284 <![CDATA[ 333
334 .. class:: infomark
335
285 **What it does** 336 **What it does**
286 337
287 **callpeak** is the main function of the MACS2_ package. MACS identifies enriched binding sites in ChIP-seq experiments. 338 **callpeak** is the main function of the MACS2_ package. MACS identifies enriched binding sites in ChIP-seq experiments. It captures the influence of genome complexity to evaluate the significance of enriched ChIP regions, and improves the spatial resolution of binding sites through combining the information of both sequencing tag position and orientation.
288 It captures the influence of genome complexity to evaluate the significance of enriched ChIP regions,
289 and improves the spatial resolution of binding sites through combining the information of both sequencing
290 tag position and orientation. MACS can be used for ChIP-Seq data alone, or with control sample with the
291 increase of specificity (recommended).
292 339
293 .. _MACS2: https://github.com/taoliu/MACS 340 .. _MACS2: https://github.com/taoliu/MACS
294 341
342 -----
343
344 **Inputs**
345
346 MACS can be used for ChIP-Seq data (Treatment) alone, or with a Control sample with the increase of specificity (recommended).
347
348 A Treatment File is the only REQUIRED parameter for MACS. The file can be in BAM or BED format and this tool will autodetect the format using the first treatment file provided as input. If you have more than one alignment file per sample, you can select to pool them above. MACS can pool files together e.g. as `-t A B C` for treatment or `-c A B C` for control.
349
350 Both single-end and paired-end mapping results can be input and you can specify if the data is from paired-end reads above. Paired-end mapping results can be input to MACS as a single BAM file, and just the left mate (5' end) tag will be automatically kept. However, when paired-end format (BAMPE) is specified, MACS will use the real fragments inferred from alignment results for reads pileup.
351
352 -----
353
354 **Outputs**
355
356 This tool produces a BED file of narrowPeaks as default output. It can also produce additional outputs, which can be selected under the **Additional Outputs** option above.
357
358 * **a BED file of peaks** (default)
359 * a tabular file of peaks
360 * a BED file of peak summits
361 * two bedGraph files of scores, for treatment pileup and control lambda
362 * a HTML summary page
363 * a PDF plot (if model is built)
364 * a BED file of broad peaks (if **Composite broad regions** is selected under Advanced Options)
365 * a BED file of gapped peaks (if **Composite broad regions** is selected under Advanced Options)
366
367 **Peaks BED File**
368
369 The default output is the narrowPeak BED file (BED6+4 format). This contains the peak locations, together with peak summit, pvalue and qvalue. You can load it to UCSC genome browser.
370
371 Example:
372
373 ======= ========= ======= ============ ==== === ======= ======== ======= =======
374 1 2 3 4 5 6 7 8 9 **10**
375 ======= ========= ======= ============ ==== === ======= ======== ======= =======
376 chr1 840081 840400 MACS2_peak_1 69 . 4.89872 10.50944 6.91052 158
377 chr1 919419 919785 MACS2_peak_2 87 . 5.85158 12.44148 8.70936 130
378 chr1 937220 937483 MACS2_peak_3 66 . 4.87632 10.06728 6.61759 154
379 ======= ========= ======= ============ ==== === ======= ======== ======= =======
380
381 Columns contain the following data:
382
383 * **1st**: chromosome name
384 * **2nd**: start position of peak
385 * **3rd**: end position of peak
386 * **4th**: name of peak
387 * **5th**: integer score for display in genome browser (e.g. UCSC)
388 * **6th**: strand, either "." (=no strand) or "+" or "-"
389 * **7th**: fold-change
390 * **8th**: -log10pvalue
391 * **9th**: -log10qvalue
392 * **10th**: relative summit position to peak start
393
394
395 **Peaks tabular File**
396
397 A tabular file which contains information about called peaks. You can open it in Excel and sort/filter using Excel functions.
398
399 Example:
400
401 ======= ========= ======= ========== ============== ========== ================== =================== ================== =============
402 **chr** **start** **end** **length** **abs_summit** **pileup** **-log10(pvalue)** **fold_enrichment** **-log10(qvalue)** **name**
403 ======= ========= ======= ========== ============== ========== ================== =================== ================== =============
404 chr1 840082 840400 319 840240 4.00 10.50944 4.89872 6.91052 MACS2_peak_1
405 chr1 919420 919785 366 919550 5.00 12.44148 5.85158 8.70936 MACS2_peak_2
406 chr1 937221 937483 263 937375 4.00 10.06728 4.87632 6.61759 MACS2_peak_3
407 ======= ========= ======= ========== ============== ========== ================== =================== ================== =============
408
409 Columns contain the following data:
410
411 * **chr**: chromosome name
412 * **start**: start position of peak
413 * **end**: end position of peak
414 * **length**: length of peak region
415 * **abs_summit**: absolute peak summit position
416 * **pileup**: pileup height at peak summit
417 * **-log10(pvalue)**: -log10(pvalue) for the peak summit (e.g. pvalue =1e-10, then this value should be 10)
418 * **fold_enrichment**: fold enrichment for this peak summit against random Poisson distribution with local lambda
419 * **-log10(qvalue)**: -log10(qvalue) at peak summit
420 * **name**: name of peak
421
422 *Note that these tabular file coordinates are 1-based which is different than the 0-based BED format (compare the start values in the BED and tabular Example above)*
423
424
425 **Summits BED File**
426
427 A BED file which contains the peak summits locations for every peaks. The 5th column in this file is -log10qvalue, the same as in the Peaks BED file. If you want to find the motifs at the binding sites, this file is recommended. The file can be loaded directly to UCSC genome browser. Remove the beginning track line if you want to analyze it by other tools.
428
429 Example:
430
431 ======= ========= ======= ============ =======
432 1 2 3 4 **5**
433 ======= ========= ======= ============ =======
434 chr1 840239 840240 MACS2_peak_1 6.91052
435 chr1 919549 919550 MACS2_peak_2 8.70936
436 chr1 937374 937375 MACS2_peak_3 6.61759
437 ======= ========= ======= ============ =======
438
439 Columns contain the following data:
440
441 * **1st**: chromosome name
442 * **2nd**: start position of peak
443 * **3rd**: end position of peak
444 * **4th**: name of peak
445 * **5th**: -log10qvalue
446
447
448 **BedGraph Files**
449
450 MACS2 will output two kinds of bedGraph files if the --bdg option is selected under the Additional Outputs option above, which contain the scores for the treatment fragment pileup and control local lambda, respectively. BedGraph files can be imported into genome browsers, such as UCSC genome browser, or be converted into even smaller bigWig files. For more information on bedGraphs, see the `UCSC website here`_.
451
452
453 Example:
454
455 **Treatment pileup file**
456
457 ======= ========= ======= =======
458 1 2 3 **4**
459 ======= ========= ======= =======
460 chr1 840146 840147 3.00000
461 chr1 840147 840332 4.00000
462 chr1 840332 840335 3.00000
463 ======= ========= ======= =======
464
465
466 **Control lambda file**
467
468 ======= ========= ======= =======
469 1 2 3 **4**
470 ======= ========= ======= =======
471 chr1 800953 801258 0.02536
472 chr1 801258 801631 0.25364
473 chr1 801631 801885 0.99858
474 ======= ========= ======= =======
475
476 Columns contain the following data:
477
478 * **1st**: chromosome name
479 * **2nd**: start position of peak
480 * **3rd**: end position of peak
481 * **4th**: treatment pileup score or control local lambda score
482
483
484 **Broad peaks File**
485
486 If the broad option (--broad) is selected unded Advanced Options above, MACS2 will output a broadPeaks file. When this flag is on, MACS will try to composite broad regions in BED12 ( a gene-model-like format ) by putting nearby highly enriched regions into a broad region with loose cutoff. The broad region is controlled by another cutoff through --broad-cutoff. The maximum length of broad region length is 4 times of d from MACS. The broad peaks file is in BED6+3 format which is similar to the narrowPeak file, except for missing the 10th column for annotating peak summits.
487
488 Example:
489
490 ======= ========= ======= ============ ==== === ======= ======= =======
491 1 2 3 4 5 6 7 8 9
492 ======= ========= ======= ============ ==== === ======= ======= =======
493 chr1 840081 840400 MACS2_peak_1 52 . 4.08790 8.57605 5.21506
494 chr1 919419 919785 MACS2_peak_2 56 . 4.37270 8.90436 5.60462
495 chr1 937220 937483 MACS2_peak_3 48 . 4.02343 8.06676 4.86861
496 ======= ========= ======= ============ ==== === ======= ======= =======
497
498
499 Columns contain the following data:
500
501 * **1st**: chromosome name
502 * **2nd**: start position of peak
503 * **3rd**: end position of peak
504 * **4th**: name of peak
505 * **5th**: integer score for display in genome browser (e.g. UCSC)
506 * **6th**: strand, either "." (=no strand) or "+" or "-"
507 * **7th**: fold-change
508 * **8th**: -log10pvalue
509 * **9th**: -log10qvalue
510
511
512 **Gapped peaks File**
513
514 If the broad option (--broad) is selected unded Advanced Options above, MACS2 will also output a gappedPeaks file. The gappedPeak file is in BED12+3 format and contains both the broad region and narrow peaks. The file can be loaded directly to UCSC genome browser.
515
516 Example:
517
518 ======= ========= ======= ============ ==== === ======= ======= === === === === ======= ======= =======
519 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
520 ======= ========= ======= ============ ==== === ======= ======= === === === === ======= ======= =======
521 chr1 840081 840400 MACS2_peak_1 52 . 840081 840400 0 1 319 0 4.08790 8.57605 5.21506
522 chr1 919419 919785 MACS2_peak_2 56 . 919419 919785 0 1 366 0 4.37270 8.90436 5.60462
523 chr1 937220 937483 MACS2_peak_3 48 . 937220 937483 0 1 263 0 4.02343 8.06676 4.86861
524 ======= ========= ======= ============ ==== === ======= ======= === === === === ======= ======= =======
525
526 Columns contain the following data:
527
528 * **1st**: chromosome name
529 * **2nd**: start position of peak
530 * **3rd**: end position of peak
531 * **4th**: name of peak
532 * **5th**: 10*-log10qvalue, to be more compatible to show grey levels on UCSC browser
533 * **6th**: strand, either "." (=no strand) or "+" or "-"
534 * **7th**: start of the first narrow peak in the region
535 * **8th**: end of the peak
536 * **9th**: RGB color key, default colour is 0
537 * **10th**: number of blocks, including the starting 1bp and ending 1bp of broad regions
538 * **11th**: length of each block, comma-separated values if multiple
539 * **12th**: start of each block, comma-separated values if multiple
540 * **13th**: fold-change
541 * **14th**: -log10pvalue
542 * **15th**: -log10qvalue
543
544 -----
545
546 **More Information**
547
295 MACS2 performs the following analysis steps: 548 MACS2 performs the following analysis steps:
296 549
297 * Artificially extend reads to expected fragment length, and generate coverage map along genome. 550 * Artificially extends reads to expected fragment length, and generates coverage map along genome.
298 * Assume background reads are Poisson distributed. Mean of the Poisson is locally variable and is estimated from control experiment (if available) in 5Kbp or 10Kbp around examined location. 551 * Assumes background reads are Poisson distributed. Mean of the Poisson is locally variable and is estimated from control experiment (if available) in 5Kbp or 10Kbp around examined location.
299 * For a given location, do we see more reads than we would have expected from the Poisson (p < 0.00005)? If Yes, MACS2 calls a peak. 552 * For a given location, asks do we see more reads than we would have expected from the Poisson (p < 0.00005)? If Yes, MACS2 calls a peak.
300 553
554
555 **Tips of fine-tuning peak calling**
556
557 Check out these other MACS2 tools:
558
559 * **MACS2 bdgcmp** can be used on the callpeak bedGraph files or bedGraph files from other resources to calculate score track.
560 * **MACS2 bdgpeakcall** can be used on the file generated from bdgcmp or bedGraph file from other resources to call peaks with given cutoff, maximum-gap between nearby mergable peaks and minimum length of peak. bdgbroadcall works similarly to bdgpeakcall, however it will output a broad peaks file in BED12 format.
561 * Differential calling tool **MACS2 bdgdiff**, can be used on 4 bedGraph files which are scores between treatment 1 and control 1, treatment 2 and control 2, treatment 1 and treatment 2, treatment 2 and treatment 1. It will output the consistent and unique sites according to parameter settings for minimum length, maximum gap and cutoff.
301 562
302 .. class:: warningmark 563 .. class:: warningmark
303 564
304 If MACS2 fails, it is usually because it cannot build the model for peaks. You may want to extend **mfold** range by increasing the upper bound or play with **Build model** options. 565 If MACS2 fails, it is usually because it cannot build the model for peaks. You may want to extend **mfold** range by increasing the upper bound or play with **Build model** options. For more information, see the MACS2_ website.
305 566
567 .. _`UCSC website here`: https://genome.ucsc.edu/goldenPath/help/bedgraph.html
306 568
307 @citation@ 569 @citation@
308 ]]> 570 ]]></help>
309 </help>
310 <expand macro="citations" /> 571 <expand macro="citations" />
311 </tool> 572 </tool>