annotate lumpy_preprocessing.xml @ 0:21f2361c32c9 draft

"planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
author iuc
date Thu, 12 Nov 2020 16:48:34 +0000
parents
children 80adce82354c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
1 <tool id="lumpy_prep" name="LUMPY preprocessing" version="@WRAPPER_VERSION@">
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
2 <description>extracts discordant read pairs and split-read alignments from a BAM dataset</description>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
<!-- Imports shared definitions from macros.xml. NOTE(review): macros.xml is not visible here; presumably it defines the @WRAPPER_VERSION@ and @TOOL_VERSION@ tokens and the "citations" macro that this wrapper uses (confirm). -->
3 <macros>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
4 <import>macros.xml</import>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
5 </macros>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
<!-- Only the lumpy-sv package is declared, although the command section also calls samtools and samblaster. NOTE(review): presumably both are pulled in as dependencies of the lumpy-sv package; confirm, or declare them explicitly. -->
6 <requirements>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
7 <requirement type="package" version="@TOOL_VERSION@">lumpy-sv</requirement>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
8 </requirements>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
<!-- Preprocessing pipeline; all intermediate files are written to the job working directory:
     1. collate the input BAM, pipe it as SAM through samblaster (user-selected duplicate
        handling plus mate tags) and store the result as blasted.bam;
     2. extract discordant pairs: -F 1294 drops reads that are properly paired, unmapped,
        mate-unmapped, secondary or flagged as duplicate;
     3. extract split-read alignments with extractSplitReads_BwaMem;
     4. sort both extracts with samtools sort.
     "set -o pipefail" is required because detect_errors="exit_code" only sees the exit
     status of the last command of each pipeline; without it a failing samtools collate,
     samblaster or extractSplitReads_BwaMem would go unnoticed and the job would succeed
     with incomplete outputs. -->
9 <command detect_errors="exit_code"><![CDATA[
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
10 set -o pipefail; samtools collate -O --output-fmt sam '$bam_in' | samblaster $dup_handling --addMateTags | samtools view -bS - > blasted.bam &&
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
11
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
12 samtools view -b -F 1294 blasted.bam > discordants.unsorted.bam &&
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
13 samtools view -h blasted.bam | extractSplitReads_BwaMem -i stdin | samtools view -Sb - > splitters.unsorted.bam &&
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
14
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
15 samtools sort discordants.unsorted.bam > discordants.bam &&
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
16 samtools sort splitters.unsorted.bam > splitters.bam
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
17 ]]></command>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
<!-- Two inputs: the BAM dataset to preprocess, and a select whose option values are samblaster command-line flags that the command section inserts unquoted into the samblaster call. The last option has an empty value, i.e. no duplicate-handling flags are passed. -->
18 <inputs>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
19 <param name="bam_in" type="data" format="bam" label="BAM input dataset" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
20 <param name="dup_handling" type="select"
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
21 label="Duplicate detection and removal"
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
22 help="Duplicate reads can be detected and removed with the help of samblaster. If you have already marked duplicates in the input dataset with another tool, you can choose to skip duplicate detection and remove only pre-marked duplicates. Not handling duplicates is only recommended if you have already deduplicated your input with other tools.">
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
23 <option value="--removeDups">Detect and remove duplicates (samblaster -r)</option>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
24 <option value="--acceptDupMarks --removeDups">Remove duplicates marked in input data (samblaster -a -r)</option>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
25 <option value="">Don't handle duplicates</option>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
26 </param>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
27 </inputs>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
<!-- All three outputs are picked up via from_work_dir from fixed file names that the command section writes into the job working directory: blasted.bam (typed qname_sorted.bam) and the two sorted extracts discordants.bam and splitters.bam (typed bam). -->
28 <outputs>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
29 <data name="blasted_bam" format="qname_sorted.bam" from_work_dir="blasted.bam" label="${tool.name}: Collated and groomed on ${on_string}" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
30 <data name="discordants_bam" format="bam" from_work_dir="discordants.bam" label="${tool.name}: Discordant read pairs on ${on_string}" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
31 <data name="splitters_bam" format="bam" from_work_dir="splitters.bam" label="${tool.name}: Split-read alignments on ${on_string}" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
32 </outputs>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
<!-- Single test case: runs sample.bam with the empty dup_handling value (no duplicate-handling flags) and checks each of the three outputs against a reference file of the same name. The other two dup_handling options are not exercised here. -->
33 <tests>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
34 <test>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
35 <param name="bam_in" ftype="bam" value="sample.bam" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
36 <param name="dup_handling" value="" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
37 <output name="blasted_bam" ftype="qname_sorted.bam" file="blasted.bam" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
38 <output name="discordants_bam" ftype="bam" file="discordants.bam" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
39 <output name="splitters_bam" ftype="bam" file="splitters.bam" />
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
40 </test>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
41 </tests>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
42 <help><![CDATA[
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
43 **What it does**
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
44
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
45 This tool implements the preprocessing of mapped reads `suggested for LUMPY <https://github.com/arq5x/lumpy-sv#pre-processing>`__. It uses samblaster_, samtools and LUMPY's extractSplitReads_BwaMem script to collate and groom an input BAM dataset (preferably produced with bwa-mem) and to extract discordant read pairs and split-read alignments from it. The three output datasets can serve as the three inputs to LUMPY.
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
46
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
47 .. _samblaster: https://github.com/GregoryFaust/samblaster
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
48 ]]></help>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
<!-- Expands the "citations" macro and hands it two additional citations as content: one DOI and one BibTeX entry pointing to the samtools GitHub page. NOTE(review): the macro definition is not visible here; presumably it lives in macros.xml and yields this content alongside its own citations (confirm). -->
49 <expand macro="citations">
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
50 <citation type="doi">10.1093/bioinformatics/btu314</citation>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
51 <citation type="bibtex">
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
52 @misc{SamTools_github,
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
53 title={SAMTools GitHub page},
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
54 url = {https://github.com/samtools/samtools},}
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
55 </citation>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
56 </expand>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
57 </tool>
21f2361c32c9 "planemo upload for repository https://github.com/arq5x/lumpy-sv commit cce17262b21b0964c31eb983bac5e89ae92b8ee9"
iuc
parents:
diff changeset
58