Mercurial > repos > geert-vandeweyer > dc_genotyper
annotate DC_Genotyper.xml @ 18:93f4d7524823 draft
Uploaded
author | geert-vandeweyer |
---|---|
date | Mon, 29 Sep 2014 04:00:18 -0400 |
parents | 36cc147395ad |
children | 8938f339ed37 |
rev | line source |
---|---|
15 | 1 <tool id="DC_Genotyper" name="DC Genotyper" version='0.0.2'> |
11 | 2 <description></description> |
3 <requirements> | |
4 <requirement type='package' version='3.0.2'>R_3_0_2</requirement> | |
13
08c4fb95c3a9
changed dep to samtools .19 to include bcftools
geert-vandeweyer
parents:
11
diff
changeset
|
5 <requirement type='package' version='0.1.19'>samtools</requirement> |
11 | 6 <requirement type='package' version='0.2.6'>tabix</requirement> |
7 <requirement type='package' version='latest'>blat_server</requirement> | |
8 <requirement type='package' version='1.92'>perl_module_threads</requirement> | |
9 <requirement type='package' version='1.46'>perl_module_threads_shared</requirement> | |
10 <requirement type='package' version='3.02'>perl_module_Thread_Queue</requirement> | |
11 <requirement type='package' version='2.3.32'>igvtools</requirement> | |
12 </requirements> | |
13 <command interpreter="perl">DC_Genotyper.pl | |
14 -t "$targets" | |
15 -b "$bamfile" | |
16 -R "${ref.fields.path}" | |
17 -p "\${GALAXY_SLOTS:-4}" | |
18 #if $dbsnp.source == "history": | |
19 -s "${dbsnp.ownFile}" | |
20 #else | |
21 -s "${dbsnp.indices.fields.path}" | |
22 #end if | |
23 -m $mincov | |
24 -P $ploidy | |
25 | |
26 -a $output1 | |
18 | 27 -v $output2 |
28 -d $output3 | |
11 | 29 </command> |
30 | |
31 <inputs> | |
32 <param name="bamfile" type="data" format="bam" label="Sample BAM file" /> | |
33 <param name="targets" type="data" format="bed" label="Enrichment BED file" /> | |
34 <param name="ref" type="select" label="Select a reference genome"> | |
35 <options from_data_table="DC_Genotyper_indexes"> | |
36 <filter type="sort_by" column="2" /> | |
37 <validator type="no_options" message="No indexes are available" /> | |
38 </options> | |
39 </param> | |
40 <conditional name="dbsnp"> | |
41 <param name="source" type="select" label="Will you select a dbSNP file from your history, or use a built in version (which is faster)"> | |
42 <option value="indexed">Use a built-in version</option> | |
43 <option value="history">Use one from the history</option> | |
44 </param> | |
45 <when value="indexed"> | |
46 <param name="indices" type="select" label="Select a dbSNP version"> | |
47 <options from_data_table="dbsnp_indexes"> | |
48 <filter type="sort_by" column="2" /> | |
49 <validator type="no_options" message="No indexes are available" /> | |
50 </options> | |
51 </param> | |
52 </when> | |
53 <when value="history"> | |
54 <param name="ownFile" type="data" format="vcf,bcf" label="Select a dbSNP file from history"/> | |
55 </when> | |
56 </conditional> | |
57 <param name="mincov" value="400" type="integer" label="Minimal Coverage Depth" /> | |
58 <param name="ploidy" type="integer" value='10' label="Expected Sample Ploidy" /> | |
59 </inputs> | |
60 | |
61 <outputs> | |
18 | 62 <data format='txt' name="output1" label="${tool.name} on ${on_string}: Allele Fraction Distributions (TXT)"/> |
63 <data format='pdf' name="output3" lable="${tool.name} on ${on_string}: Allele Fraction Distributions (PDF)"/> | |
11 | 64 <data format='vcf' name='output2' label="${tool.name} on ${on_string}: VCF file" /> |
65 </outputs> | |
66 <help> | |
67 | |
68 **What it does** | |
69 | |
70 1. get allele counts on all positions in specified targets (bed) using igvtools. Only SNPs !! | |
71 2. remove known dbsnp positions (bcf file) | |
72 3. Get distribution of background noise (pcr/sequencing errors), by modelling allele fractions as normal distributions. | |
73 4. Based on these distributions, check each position for significant change from the reference allele (based on allele fraction) | |
74 5. For abberant positions, check each alternate allele to see if it passes the background signal. | |
75 6. Generate VCF file. | |
76 | |
77 | |
78 **Information** | |
79 | |
80 This tools is created by Geert Vandeweyer. It is a very early version with several limitations. Current limitations are : no support for indels, no plotting of the noise-models, incorrect syntax in for multi-allelic sites in the VCF file. | |
81 | |
82 Any feedback is welcome. | |
83 | |
84 </help> | |
85 </tool> |