# HG changeset patch # User iuc # Date 1485884491 18000 # Node ID 6d2a5f0859cff59fb4577dadc90d71a99e8b98f3 # Parent 5337db17a5f77ffdcc87a1a05e31fc0e178cbf23 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bcftools commit 9df9b52baf62b70fbcfc3fbe965d7197d4e8738e diff -r 5337db17a5f7 -r 6d2a5f0859cf bcftools_call.xml --- a/bcftools_call.xml Mon Oct 03 12:19:38 2016 -0400 +++ b/bcftools_call.xml Tue Jan 31 12:41:31 2017 -0500 @@ -1,9 +1,32 @@ - + SNP/indel variant calling from VCF/BCF call macros.xml + + + + + + + #set $novel_rate = [] + #if str($section.genotypes.novel_rate_snp): + #silent $novel_rate.append(str($section.genotypes.novel_rate_snp)) + #end if + #if str($section.genotypes.novel_rate_del): + #silent $novel_rate.append(str($section.genotypes.novel_rate_del)) + #end if + #if str($section.genotypes.novel_rate_ins): + #silent $novel_rate.append(str($section.genotypes.novel_rate_ins)) + #end if + #if len($novel_rate) > 0: + --novel-rate '#echo ','.join($novel_rate)#' + #end if + @@ -34,9 +57,7 @@ #else #if $section.genotypes.constrain == 'trio': --constrain trio - #if $section.genotypes.novel_rate: - --novel-rate '$section.genotypes.novel_rate' - #end if + @NOVEL_RATE@ #end if #set $section = $sec_consensus_variant_calling.variant_calling.genotypes @TARGETS@ @@ -114,7 +135,7 @@ - + @@ -128,7 +149,7 @@ - + @@ -227,6 +248,8 @@ - Some of the original functionality has been temporarily lost in the process of transition to htslib, but will be added back on popular demand. - The original calling model can be invoked with the -c option. +The novel-rate option can be set to modify the likelihood of novel mutation for constrained -C trio calling. The trio genotype calling maximizes likelihood of a particular combination of genotypes for father, mother and the child P(F=i,M=j,C=k) = P(unconstrained) * Pn + P(constrained) * (1-Pn). By providing three values, the mutation rate Pn is set explicitly for SNPs, deletions and insertions, respectively. If two values are given, the first is interpreted as the mutation rate of SNPs and the second is used to calculate the mutation rate of indels according to their length as Pn=float*exp(-a-b*len), where a=22.8689, b=0.2994 for insertions and a=21.9313, b=0.2856 for deletions [pubmed:23975140]. If only one value is given, the same mutation rate Pn is used for SNPs and indels. + @REGIONS_HELP@ @TARGETS_HELP@ diff -r 5337db17a5f7 -r 6d2a5f0859cf macros.xml --- a/macros.xml Mon Oct 03 12:19:38 2016 -0400 +++ b/macros.xml Tue Jan 31 12:41:31 2017 -0500 @@ -14,14 +14,16 @@ bcftools htslib + samtools bcftools 2>&1 | grep 'Version:' - + 10.1093/bioinformatics/btp352 @@ -45,20 +47,20 @@ $input_vcf && bcftools index $input_vcf && -#elif $input_file.datatype.file_ext == 'vcf_bgzip' +#elif $input_file.is_of_type('vcf_bgzip') ln -s "$input_file" $input_vcf -#elif $input_file.datatype.file_ext == 'bcf' +#elif $input_file.is_of_type('bcf') #set $input_vcf = 'input.bcf' - ln -s "$input_file" $input_vcf && + ln -s "$input_file" $input_vcf && #if $input_file.metadata.bcf_index: ln -s $input_file.metadata.bcf_index ${input_vcf}.csi && - #else + #else bcftools index $input_vcf && #end if -#elif $input_file.datatype.file_ext == 'bcf_bgzip' +#elif $input_file.is_of_type('bcf_bgzip') ln -s "$input_file" $input_vcf #end if ]]> @@ -77,21 +79,21 @@ #set $vcfs_list_file = 'vcfs_list' #for (i,input_file) in enumerate($input_files): #set $input_vcf = 'input' + str($i) + '.vcf.gz' - #if $input_file.datatype.file_ext == 'vcf' + #if $input_file.is_of_type('vcf') bgzip -c "$input_file" > $input_vcf && bcftools index $input_vcf && - #elif $input_file.datatype.file_ext == 'vcf_bgz' + #elif $input_file.is_of_type('vcf_bgz') ln -s "$input_file" $input_vcf - #elif $input_file.datatype.file_ext == 'bcf' + #elif $input_file.is_of_type('bcf') #set $input_vcf = 'input' + str($i) + '.bcf.gz' ## bgzip -c "$input_file" > $input_vcf && ln -s "$input_file" $input_vcf && #if $input_file.metadata.bcf_index: ln -s $input_file.metadata.bcf_index ${input_vcf}.csi && - #else + #else bcftools index $input_vcf && #end if - #elif $input_file.datatype.file_ext == 'bcfvcf_bgz' + #elif $input_file.is_of_type('bcfvcf_bgz') ln -s "$input_file" $input_vcf && #end if echo '$input_vcf' >> $vcfs_list_file && @@ -225,7 +227,7 @@ - ^([^ \t\n\r\f\v,]+(,[^ \t\n\r\f\v,]+)*)?$ @@ -272,7 +274,7 @@ - ^(\w+(:\d+(-\d+)?)?(,\w+(:\d+(-\d+)?)?)*)?$ @@ -299,7 +301,7 @@ $targets_path && @@ -331,7 +333,7 @@ - ^(\w+(:\d+(-\d+)?)?(,\w+(:\d+(-\d+)?)?)*)?$ @@ -358,15 +360,15 @@ - ^(\w+(,\w+)*)?$ - - - @@ -416,7 +418,7 @@ - ^([^,]+(,[^,]+)*)?$ @@ -443,7 +445,7 @@ Output Type ----------- -Output compressed BCF (b), or uncompressed VCF (v). +Output compressed BCF (b), or uncompressed VCF (v). Use the BCF option when piping between bcftools subcommands to speed up performance by removing unecessary compression/decompression and VCF<->BCF conversion.