Mercurial > repos > iuc > basil
annotate basil.xml @ 0:e6ef29001647 draft default tip
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
author | iuc |
---|---|
date | Thu, 30 May 2019 21:14:58 -0400 |
parents | |
children |
rev | line source |
---|---|
0
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
1 <tool id="basil" name="basil" version="1.2.0"> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
2 <description>Breakpoint detection, including large insertions</description> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
3 <requirements> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
4 <requirement type="package" version="1.2.0">anise_basil</requirement> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
5 </requirements> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
6 <version_command>basil --version 2>&1 | grep 'basil version' | cut -f 3 -d ' '</version_command> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
7 <command detect_errors="aggressive"><![CDATA[ |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
8 ln -s '$ref' 'ref.fa' && |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
9 ln -s '$bam' 'in.bam' && |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
10 ln -s '$vcf' 'out.vcf' && |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
11 basil |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
12 --input-reference 'ref.fa' |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
13 --input-mapping 'in.bam' |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
14 --out-vcf 'out.vcf' |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
15 --oea-min-support-each-side '$min_oea_each_side' |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
16 ]]></command> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
17 <inputs> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
18 <param name="ref" argument="--input-reference" type="data" format="Fasta" label="Reference Sequence File" help="FASTA file with the reference."/> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
19 <param name="bam" argument="--input-mapping" type="data" format="sam,bam" label="Alignment File" help="SAM/BAM file to use as the input."/> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
20 <param name="min_oea_each_side" argument="--oea-min-support-each-side" type="integer" value="2" label="Minimum supporting reads, each side" help="Smallest number of OEA (one-end-anchor) reads on each side to support an insertion. In range [1..inf]. This is the minimum number of supporting reads (without mapped partners) on each side of an insertion breakpoint required to not be filtered." /> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
21 </inputs> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
22 <outputs> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
23 <data name="vcf" format="vcf" /> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
24 </outputs> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
25 <tests> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
26 <test> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
27 <param name="ref" value="ref.fa"/> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
28 <param name="bam" value="simulated.bam"/> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
29 <param name="min_oea_each_side" value="2"/> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
30 <output name="vcf" file="basil.vcf"/> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
31 </test> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
32 </tests> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
33 <help><![CDATA[ |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
34 BASIL is a method to detect breakpoints for structural variants (including insertion breakpoints) from aligned paired HTS reads in BAM format. Use BASIL to analyze BAM files for tentative insertion sites. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
35 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
36 Note that BASIL will in general detect all kinds of breakpoints, e.g. for inversions on real-world data. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
37 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
38 BASIL VCF fields |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
39 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
40 A typical record in the VCF file written by BASIL might look as follows. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
41 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
42 1 5001 site_0 T <INS> . PASS IMPRECISE;SVTYPE=INS GSCORE:CLEFT:CRIGHT:OEALEFT:OEARIGHT 46.4256:10:12:35:32 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
43 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
44 The first eight columns are as usual in VCF files (ref name, 1-based position, site ID, reference base, abbreviation for long insertion, no assigned quality, passing all filters, imprecise insertion SV). |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
45 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
46 The ninth column contains the names of the score values given in the tenth column: |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
47 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
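48 GSCORE Sum of the geometric means of "1 + $score" over the clipping pair (CLEFT, CRIGHT) and over the OEA pair (OEALEFT, OEARIGHT); in the example above, sqrt(11*13) + sqrt(36*33) = 46.4256. |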
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
49 CLEFT Number of clipping signatures supporting the site from the left side. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
50 CRIGHT Number of clipping signatures supporting the site from the right side. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
51 OEALEFT Number of OEA alignments supporting the site from the left. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
52 OEARIGHT Number of OEA alignments supporting the site from the right. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
53 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
54 Generally, one should filter for a minimum support of OEA records on each side, e.g. a value of 10 makes sense for a 30x coverage and showed good results on simulated data. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
55 |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
56 For a ranking, GSCORE is a suitable measure but we did not develop any statistical model for BASIL matches and it is a mean of pseudocounts only. It carries no statistically precise meaning. |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
57 ]]></help> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
58 <citations> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
59 <citation type="doi">10.1093/bioinformatics/btv051</citation> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
60 </citations> |
e6ef29001647
planemo upload commit b89c8017aeef91f940543a1cc7dadb4a85290865
iuc
parents:
diff
changeset
|
61 </tool> |