comparison macs2_callpeak.xml @ 16:495a4173006f draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/macs2 commit 77a41905b31b6e93ff95b2c36bae865b60ab62d6
author iuc
date Tue, 16 Oct 2018 10:31:14 -0400
parents c33686854b19
children 424aefbd7777
comparison
equal deleted inserted replaced
15:c33686854b19 16:495a4173006f
165 </conditional> 165 </conditional>
166 </when> 166 </when>
167 <when value="No" /> 167 <when value="No" />
168 </conditional> 168 </conditional>
169 169
170 <param name="format" type="select" label="Format of Input Files" help="For Paired-end BAM (BAMPE) the 'Build model step' will be ignored and the real fragments will be used for each template defined by leftmost and rightmost mapping positions (--format). Default: Single-end BAM"> 170 <param argument="--format" type="select" label="Format of Input Files" help="For Paired-end BAM (BAMPE) the 'Build model step' will be ignored and the real fragments will be used for each template defined by leftmost and rightmost mapping positions. Default: Single-end BAM">
171 <option value="BAM" selected="True">Single-end BAM</option> 171 <option value="BAM" selected="True">Single-end BAM</option>
172 <option value="BAMPE">Paired-end BAM</option> 172 <option value="BAMPE">Paired-end BAM</option>
173 <option value="BED">Single-end BED</option> 173 <option value="BED">Single-end BED</option>
174 </param> 174 </param>
175 175
181 <option value="create_model" selected="true">Build the shifting model</option> 181 <option value="create_model" selected="true">Build the shifting model</option>
182 </param> 182 </param>
183 <when value="create_model"> 183 <when value="create_model">
184 <param name="mfold_lower" type="integer" value="5" label="Set lower mfold bound" help="Select the lower region within MFOLD range of high confidence enrichment ratio against background to build model. Fold-enrichment in regions must be higher than lower limit (--mfold). Default: 5" /> 184 <param name="mfold_lower" type="integer" value="5" label="Set lower mfold bound" help="Select the lower region within MFOLD range of high confidence enrichment ratio against background to build model. Fold-enrichment in regions must be higher than lower limit (--mfold). Default: 5" />
185 <param name="mfold_upper" type="integer" value="50" label="Set upper mfold bound" help="Select the upper region within MFOLD range of high confidence enrichment ratio against background to build model. Fold-enrichment in regions must be lower than the upper limit (--mfold). Default: 50"/> 185 <param name="mfold_upper" type="integer" value="50" label="Set upper mfold bound" help="Select the upper region within MFOLD range of high confidence enrichment ratio against background to build model. Fold-enrichment in regions must be lower than the upper limit (--mfold). Default: 50"/>
186 <param name="band_width" type="integer" value="300" 186 <param name="band_width" argument="--bw" type="integer" value="300"
187 label="Band width for picking regions to compute fragment size" 187 label="Band width for picking regions to compute fragment size"
188 help=" You can set this parameter as the medium fragment size expected from sonication or size selection (--bw). Default: 300" /> 188 help=" You can set this parameter as the medium fragment size expected from sonication or size selection. Default: 300" />
189 </when> 189 </when>
190 <when value="nomodel"> 190 <when value="nomodel">
191 <param name="extsize" type="integer" value="200" label="Set extension size" help="The arbitrary extension size in bp. When nomodel is true, MACS will use this value as fragment size to extend each read towards 3-prime; end, then pile them up. It is exactly twice the number of obsolete SHIFTSIZE. In previous language, each read is moved 5-prime-to-3-prime direction to middle of fragment by 0.5 d, then extended to both direction with 0.5 d. This is equivalent to say each read is extended towards 5-prime-to-3-prime into a d size fragment. --extsize (this option) and --shift (the option below) can be combined when necessary. See --shift option below. Default: 200 (--extsize)."/> 191 <param argument="--extsize" type="integer" value="200" label="Set extension size" help="The arbitrary extension size in bp. When nomodel is true, MACS will use this value as fragment size to extend each read towards 3-prime; end, then pile them up. It is exactly twice the number of obsolete SHIFTSIZE. In previous language, each read is moved 5-prime-to-3-prime direction to middle of fragment by 0.5 d, then extended to both direction with 0.5 d. This is equivalent to say each read is extended towards 5-prime-to-3-prime into a d size fragment. --extsize (this option) and --shift (the option below) can be combined when necessary. See --shift option below. Default: 200."/>
192 <param name="shift" type="integer" value="0" label="Set shift size" help="(NOT the legacy --shiftsize option!) The arbitrary shift in bp. Use discretion while setting it other than default value. When NOMODEL is set, MACS will use this value to move cutting ends (5-prime) towards 5-prime-to-3-prime direction then apply EXTSIZE to extend them to fragments. When this value is negative, ends will be moved toward 3-prime-to-5-prime direction. Recommended to keep it as default 0 for ChIP-Seq datasets, or -1 * 0.5 of --extsize (option above) together with --extsize option for detecting enriched cutting loci such as certain DNAseI-Seq datasets. Note, you can't set values other than 0 if format is paired-end data (BAMPE). Default: 0 (--shift)."/> 192 <param argument="--shift" type="integer" value="0" label="Set shift size" help="(NOT the legacy --shiftsize option!) The arbitrary shift in bp. Use discretion while setting it other than default value. When NOMODEL is set, MACS will use this value to move cutting ends (5-prime) towards 5-prime-to-3-prime direction then apply EXTSIZE to extend them to fragments. When this value is negative, ends will be moved toward 3-prime-to-5-prime direction. Recommended to keep it as default 0 for ChIP-Seq datasets, or -1 * 0.5 of --extsize (option above) together with --extsize option for detecting enriched cutting loci such as certain DNAseI-Seq datasets. Note, you can't set values other than 0 if format is paired-end data (BAMPE). Default: 0"/>
193 </when> 193 </when>
194 </conditional> 194 </conditional>
195 195
196 <conditional name="cutoff_options"> 196 <conditional name="cutoff_options">
197 <param name="cutoff_options_selector" type="select" label="Peak detection based on" help="default uses q-value"> 197 <param name="cutoff_options_selector" type="select" label="Peak detection based on" help="default uses q-value">
198 <option value="qvalue" selected="true">q-value</option> 198 <option value="qvalue" selected="true">q-value</option>
199 <option value="pvalue">p-value</option> 199 <option value="pvalue">p-value</option>
200 </param> 200 </param>
201 <when value="pvalue"> 201 <when value="pvalue">
202 <param name="pvalue" type="float" value="" label="p-value cutoff for peak detection" help="default: not set (--pvalue)"/> 202 <param argument="--pvalue" type="float" value="" label="p-value cutoff for peak detection" help="Default: not set"/>
203 </when> 203 </when>
204 <when value="qvalue"> 204 <when value="qvalue">
205 <param name="qvalue" type="float" value="0.05" label="Minimum FDR (q-value) cutoff for peak detection" help="The q-value (minimum FDR) cutoff to call significant regions. Default is 0.05. For broad marks, you can try 0.05 as cutoff. Q-values are calculated from p-values using Benjamini-Hochberg procedure. (--qvalue)"/> 205 <param argument="--qvalue" type="float" value="0.05" label="Minimum FDR (q-value) cutoff for peak detection" help="The q-value (minimum FDR) cutoff to call significant regions. Default is 0.05. For broad marks, you can try 0.05 as cutoff. Q-values are calculated from p-values using Benjamini-Hochberg procedure"/>
206 </when> 206 </when>
207 </conditional> 207 </conditional>
208 208
209 <param name="outputs" type="select" display="checkboxes" multiple="True" optional="True" label="Additional Outputs" help="PDF is only created when the model is built"> 209 <param name="outputs" type="select" display="checkboxes" multiple="True" optional="True" label="Additional Outputs" help="PDF is only created when the model is built">
210 <option value="peaks_tabular">Peaks as tabular file (compatible wih MultiQC)</option> 210 <option value="peaks_tabular">Peaks as tabular file (compatible wih MultiQC)</option>
213 <option value="html">Summary page (html)</option> 213 <option value="html">Summary page (html)</option>
214 <option value="pdf">Plot in PDF (only available if a model is created and if BAMPE is not used)</option> 214 <option value="pdf">Plot in PDF (only available if a model is created and if BAMPE is not used)</option>
215 </param> 215 </param>
216 216
217 <section name="advanced_options" title="Advanced Options"> 217 <section name="advanced_options" title="Advanced Options">
218 <param name="to_large" type="boolean" truevalue="--to-large" falsevalue="" checked="False" optional="True" 218 <param name="to_large" argument="--to-large" type="boolean" truevalue="--to-large" falsevalue="" checked="false"
219 label="When set, scale the small sample up to the bigger sample" 219 label="When set, scale the small sample up to the bigger sample"
220 help="By default, the bigger dataset will be scaled down towards the smaller dataset, which will lead to smaller p/qvalues and more specific results. Keep in mind that scaling down will bring down background noise more. (--to-large). Default: No"/> 220 help="By default, the bigger dataset will be scaled down towards the smaller dataset, which will lead to smaller p/qvalues and more specific results. Keep in mind that scaling down will bring down background noise more. Default: No"/>
221 <param name="nolambda" type="boolean" truevalue="--nolambda" falsevalue="" checked="False" optional="True" 221 <param argument="--nolambda" type="boolean" truevalue="--nolambda" falsevalue="" checked="false"
222 label="Use fixed background lambda as local lambda for every peak region" help="up to 9X more time consuming (--nolambda). Default: No"/> 222 label="Use fixed background lambda as local lambda for every peak region" help="up to 9X more time consuming. Default: No"/>
223 <param name="spmr" type="boolean" truevalue="--SPMR" falsevalue="" checked="False" optional="True" 223 <param name="spmr" argument="--SPMR" type="boolean" truevalue="--SPMR" falsevalue="" checked="false"
224 label="Save signal per million reads for fragment pileup profiles" 224 label="Save signal per million reads for fragment pileup profiles"
225 help="Requires 'Scores in bedGraph files (--bdg)' output to be selected. (--SPMR). Default: No"/> 225 help="Requires 'Scores in bedGraph files (--bdg)' output to be selected. Default: No"/>
226 <param name="ratio" type="float" optional="True" 226 <param argument="--ratio" type="float" optional="true"
227 label="When set, use a custom scaling ratio of ChIP/control (e.g. calculated using NCIS) for linear scaling" 227 label="When set, use a custom scaling ratio of ChIP/control (e.g. calculated using NCIS) for linear scaling"
228 help="(--ratio) Default: ignore"/> 228 help="Default: ignore"/>
229 <param name="slocal" type="integer" optional="True" label="The small nearby region in basepairs to calculate dynamic lambda" 229 <param name="slocal" type="integer" optional="True" label="The small nearby region in basepairs to calculate dynamic lambda"
230 help="This is used to capture the bias near the peak summit region. Invalid if there is no control data. If you set this to 0, MACS will skip slocal lambda calculation. *Note* that MACS will always perform a d-size local lambda calculation. The final local bias should be the maximum of the lambda value from d, slocal, and llocal size windows. (--slocal). Default: 1000"/> 230 help="This is used to capture the bias near the peak summit region. Invalid if there is no control data. If you set this to 0, MACS will skip slocal lambda calculation. *Note* that MACS will always perform a d-size local lambda calculation. The final local bias should be the maximum of the lambda value from d, slocal, and llocal size windows. (--slocal). Default: 1000"/>
231 <param name="llocal" type="integer" optional="True" label="The large nearby region in basepairs to calculate dynamic lambda" 231 <param argument="--llocal" type="integer" optional="True" label="The large nearby region in basepairs to calculate dynamic lambda"
232 help="This is used to capture the surround bias. If you set this to 0, MACS will skip llocal lambda calculation. *Note* that MACS will always perform a d-size local lambda calculation. The final local bias should be the maximum of the lambda value from d, slocal, and llocal size windows. (--llocal) Default: 10000"/> 232 help="This is used to capture the surround bias. If you set this to 0, MACS will skip llocal lambda calculation. *Note* that MACS will always perform a d-size local lambda calculation. The final local bias should be the maximum of the lambda value from d, slocal, and llocal size windows. Default: 10000"/>
233 <conditional name="broad_options"> 233 <conditional name="broad_options">
234 <param name="broad_options_selector" type="select" 234 <param name="broad_options_selector" argument="--broad" type="select"
235 label="Composite broad regions" help="by putting nearby highly enriched regions into a broad region with loose cutoff (--broad)"> 235 label="Composite broad regions" help="by putting nearby highly enriched regions into a broad region with loose cutoff">
236 <option value="nobroad" selected="true">No broad regions</option> 236 <option value="nobroad" selected="true">No broad regions</option>
237 <option value="broad">broad regions</option> 237 <option value="broad">broad regions</option>
238 </param> 238 </param>
239 <when value="broad"> 239 <when value="broad">
240 <param name="broad_cutoff" type="float" label="Cutoff for broad region" value="0.1" 240 <param name="broad_cutoff" type="float" label="Cutoff for broad region" value="0.1"
241 help="value is either p-value or q-value as specified above (--broad-cutoff)"/> 241 help="value is either p-value or q-value as specified above (--broad-cutoff)"/>
242 </when> 242 </when>
243 <when value="nobroad"> 243 <when value="nobroad">
244 <param name="call_summits" type="boolean" truevalue="--call-summits" falsevalue="" checked="False" 244 <param name="call_summits" argument="--call-summits" type="boolean" truevalue="--call-summits" falsevalue="" checked="false"
245 label="Use a more sophisticated signal processing approach to find subpeak summits in each enriched peak region" 245 label="Use a more sophisticated signal processing approach to find subpeak summits in each enriched peak region"/>
246 help="(--call-summits)"/>
247 </when> 246 </when>
248 </conditional> 247 </conditional>
249 <expand macro="keep_duplicates" /> 248 <expand macro="keep_duplicates" />
250 </section> 249 </section>
251 </inputs> 250 </inputs>
348 <param name="outputs" value="pdf"/> 347 <param name="outputs" value="pdf"/>
349 <output name="output_narrowpeaks" file="callpeak_bampe_narrow.bed"/> 348 <output name="output_narrowpeaks" file="callpeak_bampe_narrow.bed"/>
350 </test> 349 </test>
351 </tests> 350 </tests>
352 <help><![CDATA[ 351 <help><![CDATA[
353
354 .. class:: infomark 352 .. class:: infomark
355 353
356 **What it does** 354 **What it does**
357 355
358 **callpeak** is the main function of the MACS2_ package. MACS identifies enriched binding sites in ChIP-seq experiments. It captures the influence of genome complexity to evaluate the significance of enriched ChIP regions, and improves the spatial resolution of binding sites through combining the information of both sequencing tag position and orientation. 356 **callpeak** is the main function of the MACS2_ package. MACS identifies enriched binding sites in ChIP-seq experiments. It captures the influence of genome complexity to evaluate the significance of enriched ChIP regions, and improves the spatial resolution of binding sites through combining the information of both sequencing tag position and orientation.
399 397
400 The default output is the narrowPeak BED file (BED6+4 format). This contains the peak locations, together with peak summit, pvalue and qvalue. You can load it to UCSC genome browser. 398 The default output is the narrowPeak BED file (BED6+4 format). This contains the peak locations, together with peak summit, pvalue and qvalue. You can load it to UCSC genome browser.
401 399
402 Example: 400 Example:
403 401
404 ======= ========= ======= ============ ==== === ======= ======== ======= ======= 402 ======= ========= ======= ============= ==== === ======= ======== ======= =======
405 1 2 3 4 5 6 7 8 9 **10** 403 1 2 3 4 5 6 7 8 9 **10**
406 ======= ========= ======= ============ ==== === ======= ======== ======= ======= 404 ======= ========= ======= ============= ==== === ======= ======== ======= =======
407 chr1 840081 840400 treat1_peak_1 69 . 4.89872 10.50944 6.91052 158 405 chr1 840081 840400 treat1_peak_1 69 . 4.89872 10.50944 6.91052 158
408 chr1 919419 919785 treat1_peak_2 87 . 5.85158 12.44148 8.70936 130 406 chr1 919419 919785 treat1_peak_2 87 . 5.85158 12.44148 8.70936 130
409 chr1 937220 937483 treat1_peak_3 66 . 4.87632 10.06728 6.61759 154 407 chr1 937220 937483 treat1_peak_3 66 . 4.87632 10.06728 6.61759 154
410 ======= ========= ======= ============ ==== === ======= ======== ======= ======= 408 ======= ========= ======= ============= ==== === ======= ======== ======= =======
411 409
412 Columns contain the following data: 410 Columns contain the following data:
413 411
414 * **1st**: chromosome name 412 * **1st**: chromosome name
415 * **2nd**: start position of peak 413 * **2nd**: start position of peak
457 455
458 A BED file which contains the peak summits locations for every peaks. The 5th column in this file is -log10qvalue, the same as in the Peaks BED file. If you want to find the motifs at the binding sites, this file is recommended. The file can be loaded directly to UCSC genome browser. Remove the beginning track line if you want to analyze it by other tools. 456 A BED file which contains the peak summits locations for every peaks. The 5th column in this file is -log10qvalue, the same as in the Peaks BED file. If you want to find the motifs at the binding sites, this file is recommended. The file can be loaded directly to UCSC genome browser. Remove the beginning track line if you want to analyze it by other tools.
459 457
460 Example: 458 Example:
461 459
462 ======= ========= ======= ============ ======= 460 ======= ========= ======= ============= =======
463 1 2 3 4 **5** 461 1 2 3 4 **5**
464 ======= ========= ======= ============ ======= 462 ======= ========= ======= ============= =======
465 chr1 840239 840240 treat1_peak_1 6.91052 463 chr1 840239 840240 treat1_peak_1 6.91052
466 chr1 919549 919550 treat1_peak_2 8.70936 464 chr1 919549 919550 treat1_peak_2 8.70936
467 chr1 937374 937375 treat1_peak_3 6.61759 465 chr1 937374 937375 treat1_peak_3 6.61759
468 ======= ========= ======= ============ ======= 466 ======= ========= ======= ============= =======
469 467
470 Columns contain the following data: 468 Columns contain the following data:
471 469
472 * **1st**: chromosome name 470 * **1st**: chromosome name
473 * **2nd**: start position of peak 471 * **2nd**: start position of peak
516 514
517 If the broad option (--broad) is selected unded Advanced Options above, MACS2 will output a broadPeaks file. When this flag is on, MACS will try to composite broad regions in BED12 ( a gene-model-like format ) by putting nearby highly enriched regions into a broad region with loose cutoff. The broad region is controlled by another cutoff through --broad-cutoff. The maximum length of broad region length is 4 times of d from MACS. The broad peaks file is in BED6+3 format which is similar to the narrowPeak file, except for missing the 10th column for annotating peak summits. 515 If the broad option (--broad) is selected unded Advanced Options above, MACS2 will output a broadPeaks file. When this flag is on, MACS will try to composite broad regions in BED12 ( a gene-model-like format ) by putting nearby highly enriched regions into a broad region with loose cutoff. The broad region is controlled by another cutoff through --broad-cutoff. The maximum length of broad region length is 4 times of d from MACS. The broad peaks file is in BED6+3 format which is similar to the narrowPeak file, except for missing the 10th column for annotating peak summits.
518 516
519 Example: 517 Example:
520 518
521 ======= ========= ======= ============ ==== === ======= ======= ======= 519 ======= ====== ====== ============= ==== === ======= ======= =======
522 1 2 3 4 5 6 7 8 9 520 1 2 3 4 5 6 7 8 9
523 ======= ========= ======= ============ ==== === ======= ======= ======= 521 ======= ====== ====== ============= ==== === ======= ======= =======
524 chr1 840081 840400 treat1_peak_1 52 . 4.08790 8.57605 5.21506 522 chr1 840081 840400 treat1_peak_1 52 . 4.08790 8.57605 5.21506
525 chr1 919419 919785 treat1_peak_2 56 . 4.37270 8.90436 5.60462 523 chr1 919419 919785 treat1_peak_2 56 . 4.37270 8.90436 5.60462
526 chr1 937220 937483 treat1_peak_3 48 . 4.02343 8.06676 4.86861 524 chr1 937220 937483 treat1_peak_3 48 . 4.02343 8.06676 4.86861
527 ======= ========= ======= ============ ==== === ======= ======= ======= 525 ======= ====== ====== ============= ==== === ======= ======= =======
528
529 526
530 Columns contain the following data: 527 Columns contain the following data:
531 528
532 * **1st**: chromosome name 529 * **1st**: chromosome name
533 * **2nd**: start position of peak 530 * **2nd**: start position of peak
544 541
545 If the broad option (--broad) is selected unded Advanced Options above, MACS2 will also output a gappedPeaks file. The gappedPeak file is in BED12+3 format and contains both the broad region and narrow peaks. The file can be loaded directly to UCSC genome browser. 542 If the broad option (--broad) is selected unded Advanced Options above, MACS2 will also output a gappedPeaks file. The gappedPeak file is in BED12+3 format and contains both the broad region and narrow peaks. The file can be loaded directly to UCSC genome browser.
546 543
547 Example: 544 Example:
548 545
549 ======= ========= ======= ============ ==== === ======= ======= === === === === ======= ======= ======= 546 ======= ========= ======= ============= === === ======= ======= === === === === ======= ======= =======
550 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 547 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
551 ======= ========= ======= ============ ==== === ======= ======= === === === === ======= ======= ======= 548 ======= ========= ======= ============= === === ======= ======= === === === === ======= ======= =======
552 chr1 840081 840400 treat1_peak_1 52 . 840081 840400 0 1 319 0 4.08790 8.57605 5.21506 549 chr1 840081 840400 treat1_peak_1 52 . 840081 840400 0 1 319 0 4.08790 8.57605 5.21506
553 chr1 919419 919785 treat1_peak_2 56 . 919419 919785 0 1 366 0 4.37270 8.90436 5.60462 550 chr1 919419 919785 treat1_peak_2 56 . 919419 919785 0 1 366 0 4.37270 8.90436 5.60462
554 chr1 937220 937483 treat1_peak_3 48 . 937220 937483 0 1 263 0 4.02343 8.06676 4.86861 551 chr1 937220 937483 treat1_peak_3 48 . 937220 937483 0 1 263 0 4.02343 8.06676 4.86861
555 ======= ========= ======= ============ ==== === ======= ======= === === === === ======= ======= ======= 552 ======= ========= ======= ============= === === ======= ======= === === === === ======= ======= =======
556 553
557 Columns contain the following data: 554 Columns contain the following data:
558 555
559 * **1st**: chromosome name 556 * **1st**: chromosome name
560 * **2nd**: start position of peak 557 * **2nd**: start position of peak