annotate lumpy_preprocessing.xml @ 1:80adce82354c draft default tip

"planemo upload for repository https://github.com/arq5x/lumpy-sv commit 41cb10683d89fa20e122f4c60b8f5bf0e3c390d8"
author iuc
date Sat, 10 Jul 2021 07:40:25 +0000
parents 21f2361c32c9
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
80adce82354c "planemo upload for repository https://github.com/arq5x/lumpy-sv commit 41cb10683d89fa20e122f4c60b8f5bf0e3c390d8"
iuc
parents: 0
diff changeset
1 <tool id="lumpy_prep" name="LUMPY preprocessing" version="@WRAPPER_VERSION@" profile="20.05">
0
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
2 <description>extracts discordant read pairs and split-read alignments from a BAM dataset</description>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
3 <macros>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
4 <import>macros.xml</import>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
5 </macros>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
6 <requirements>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
7 <requirement type="package" version="@TOOL_VERSION@">lumpy-sv</requirement>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
8 </requirements>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
9 <command detect_errors="exit_code"><![CDATA[
1
80adce82354c "planemo upload for repository https://github.com/arq5x/lumpy-sv commit 41cb10683d89fa20e122f4c60b8f5bf0e3c390d8"
iuc
parents: 0
diff changeset
10 set -o pipefail;
80adce82354c "planemo upload for repository https://github.com/arq5x/lumpy-sv commit 41cb10683d89fa20e122f4c60b8f5bf0e3c390d8"
iuc
parents: 0
diff changeset
11
0
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
12 samtools collate -O --output-fmt sam '$bam_in' | samblaster $dup_handling --addMateTags | samtools view -bS - > blasted.bam &&
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
13
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
14 samtools view -b -F 1294 blasted.bam > discordants.unsorted.bam &&
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
15 samtools view -h blasted.bam | extractSplitReads_BwaMem -i stdin | samtools view -Sb - > splitters.unsorted.bam &&
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
16
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
17 samtools sort discordants.unsorted.bam > discordants.bam &&
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
18 samtools sort splitters.unsorted.bam > splitters.bam
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
19 ]]></command>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
20 <inputs>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
21 <param name="bam_in" type="data" format="bam" label="BAM input dataset" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
22 <param name="dup_handling" type="select"
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
23 label="Duplicate detection and removal"
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
24 help="Duplicate reads can be detected and removed with the help of samblaster. If you have already marked duplicates in the input dataset with another tool, you can choose to skip duplicate detection and remove only pre-marked duplicates. Not handling duplicates is only recommended if you have already deduplicated your input with other tools.">
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
25 <option value="--removeDups">Detect and remove duplicates (samblaster -r)</option>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
26 <option value="--acceptDupMarks --removeDups">Remove duplicates marked in input data (samblaster -a -r)</option>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
27 <option value="">Don't handle duplicates</option>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
28 </param>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
29 </inputs>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
30 <outputs>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
31 <data name="blasted_bam" format="qname_sorted.bam" from_work_dir="blasted.bam" label="${tool.name}: Collated and groomed on ${on_string}" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
32 <data name="discordants_bam" format="bam" from_work_dir="discordants.bam" label="${tool.name}: Discordant read pairs on ${on_string}" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
33 <data name="splitters_bam" format="bam" from_work_dir="splitters.bam" label="${tool.name}: Split-read alignments on ${on_string}" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
34 </outputs>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
35 <tests>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
36 <test>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
37 <param name="bam_in" ftype="bam" value="sample.bam" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
38 <param name="dup_handling" value="" />
1
80adce82354c "planemo upload for repository https://github.com/arq5x/lumpy-sv commit 41cb10683d89fa20e122f4c60b8f5bf0e3c390d8"
iuc
parents: 0
diff changeset
39 <output name="blasted_bam" ftype="qname_sorted.bam" file="blasted.bam" lines_diff="2"/>
80adce82354c "planemo upload for repository https://github.com/arq5x/lumpy-sv commit 41cb10683d89fa20e122f4c60b8f5bf0e3c390d8"
iuc
parents: 0
diff changeset
40 <output name="discordants_bam" ftype="bam" file="discordants.bam" lines_diff="2"/>
80adce82354c "planemo upload for repository https://github.com/arq5x/lumpy-sv commit 41cb10683d89fa20e122f4c60b8f5bf0e3c390d8"
iuc
parents: 0
diff changeset
41 <output name="splitters_bam" ftype="bam" file="splitters.bam" lines_diff="2"/>
0
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
42 </test>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
43 </tests>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
44 <help><![CDATA[
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
45 **What it does**
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
46
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
47 This tool implements the preprocessing of mapped reads `suggested for LUMPY <https://github.com/arq5x/lumpy-sv#pre-processing>`__. It uses samblaster_, samtools, and LUMPY's extractSplitReads_BwaMem script to collate and groom an input BAM dataset (preferably produced with bwa-mem) and to extract discordant read pairs and split-read alignments from it. The three output datasets can serve as the three inputs to LUMPY.
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
48
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
49 .. _samblaster: https://github.com/GregoryFaust/samblaster
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
50 ]]></help>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
51 <expand macro="citations">
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
52 <citation type="doi">10.1093/bioinformatics/btu314</citation>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
53 <citation type="bibtex">
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
54 @misc{SamTools_github,
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
55 title={SAMTools GitHub page},
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
56 url = {https://github.com/samtools/samtools},}
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
57 </citation>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
58 </expand>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
59 </tool>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
60