annotate DC_Genotyper.xml @ 7:8cfdb91bfc14 draft

Uploaded
author geert-vandeweyer
date Fri, 26 Sep 2014 03:57:06 -0400
parents 5c72a91ce518
children 7cbbf8aaa46c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
fa8566bd4a51 Corrected tool_id, name and version in wrapper
geert-vandeweyer
parents: 0
diff changeset
1 <tool id="DC_Genotyper" name="DC Genotyper" version='0.0.1'>
0
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
2 <description></description>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
3 <requirements>
5
5c72a91ce518 Uploaded
geert-vandeweyer
parents: 4
diff changeset
4 <requirement type='package' version='3.0.2'>R_3_0_2</requirement>
0
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
5 <requirement type='package' version='0.1.18'>samtools</requirement>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
6 <requirement type='package' version='0.2.6'>tabix</requirement>
5
5c72a91ce518 Uploaded
geert-vandeweyer
parents: 4
diff changeset
7 <requirement type='package' version='latest'>blat_server</requirement>
0
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
8 <requirement type='package' version='1.92'>perl_module_threads</requirement>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
9 <requirement type='package' version='1.46'>perl_module_threads_shared</requirement>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
10 <requirement type='package' version='3.02'>perl_module_Thread_Queue</requirement>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
11 <requirement type='package' version='2.3.32'>igvtools</requirement>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
12 </requirements>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
13 <command interpreter="perl">DC_Genotyper.pl
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
14 -t "$targets"
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
15 -b "$bamfile"
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
16 -R "${ref.fields.path}"
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
17 -p "\${GALAXY_SLOTS:-4}"
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
18 #if $dbsnp.source == "history":
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
19 -s "${dbsnp.ownFile}"
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
20 #else
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
21 -s "${dbsnp.indices.fields.path}"
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
22 #end if
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
23 -m $mincov
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
24 -P $ploidy
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
25
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
26 -a $output1
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
27 -v $output2
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
28 </command>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
29
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
30 <inputs>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
31 <param name="bamfile" type="data" format="bam" label="Sample BAM file" />
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
32 <param name="targets" type="data" format="bed" label="Enrichment BED file" />
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
33 <param name="ref" type="select" label="Select a reference genome">
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
34 <options from_data_table="DC_Genotyper_indexes">
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
35 <filter type="sort_by" column="2" />
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
36 <validator type="no_options" message="No indexes are available" />
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
37 </options>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
38 </param>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
39 <conditional name="dbsnp">
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
40 <param name="source" type="select" label="Will you select a dbSNP file from your history, or use a built in version (which is faster)">
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
41 <option value="indexed">Use a built-in version</option>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
42 <option value="history">Use one from the history</option>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
43 </param>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
44 <when value="indexed">
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
45 <param name="indices" type="select" label="Select a reference genome">
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
46 <options from_data_table="dbsnp_indexes">
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
47 <filter type="sort_by" column="2" />
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
48 <validator type="no_options" message="No indexes are available" />
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
49 </options>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
50 </param>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
51 </when>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
52 <when value="history">
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
53 <param name="ownFile" type="data" format="vcf,bcf" label="Select a dbSNP file from history"/>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
54 </when>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
55 </conditional>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
56 <param name="mincov" value="400" type="integer" label="Minimal Coverage Depth" />
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
57 <param name="ploidy" type="integer" value='10' label="Expected Sample Ploidy" />
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
58 </inputs>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
59
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
60 <outputs>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
61 <data format='txt' name="output1" label="${tool.name} on ${on_string}: Allele Fraction Distributions"/>
4
92207f2ec144 Various Fixes and added tool_data_conf
geert-vandeweyer
parents: 2
diff changeset
62 <data format='vcf' name='output2' label="${tool.name} on ${on_string}: VCF file" />
0
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
63 </outputs>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
64 <help>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
65
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
66 **What it does**
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
67
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
68 1. Get allele counts on all positions in the specified targets (BED) using igvtools. Only SNPs are considered!
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
69 2. Remove known dbSNP positions (BCF file).
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
70 3. Get distribution of background noise (pcr/sequencing errors), by modelling allele fractions as normal distributions.
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
71 4. Based on these distributions, check each position for significant change from the reference allele (based on allele fraction)
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
72 5. For aberrant positions, check each alternate allele to see if it passes the background signal.
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
73 6. Generate VCF file.
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
74
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
75
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
76 **Information**
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
77
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
78 This tool was created by Geert Vandeweyer. It is a very early version with several limitations. Current limitations are: no support for indels, no plotting of the noise models, and incorrect syntax for multi-allelic sites in the VCF file.
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
79
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
80 Any feedback is welcome.
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
81
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
82 </help>
e8a32d824f39 Uploaded
geert-vandeweyer
parents:
diff changeset
83 </tool>