Repository 'bcftools_call'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/bcftools_call

Changeset 0:a531317a3527 (2016-05-02)
Next changeset 1:8959eda17fca (2016-07-06)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bcftools commit bbfd77c34b609b86ef3a24525dae1127d8b3d99b
added:
README.md
bcftools_call.xml
macros.xml
test-data/mpileup.1.out
test-data/mpileup.2.out
test-data/mpileup.vcf
tool_dependencies.xml
b
diff -r 000000000000 -r a531317a3527 README.md
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/README.md Mon May 02 17:27:10 2016 -0400
b
@@ -0,0 +1,21 @@
+# bcftools (v1.2)
+
+This aims to be a "faithful" rendering of the bcftool suite. I.e. options are
+presented essentially as closely to the command line version as is useful. 
+
+This may not appeal to all, if you'd like to see smaller and more dedicated
+tools (e.g. "intersect", "union" and "complement" being separate tools instead
+of all of them included in the "isec" tool,) please feel free to file an issue.
+
+## TODO:
+
+- Galaxy needs datatypes for bcf and vcf files, block-gzipped and uncompressed.
+- Galaxy needs to automatically index those files with tabix
+
+## "Complete" Wrappers
+
+The wrappers were automatically generated in bulk. That doesn't get them 100%
+of the way there (e.g. meaningful test cases), so the rest of the process is a
+bit slower.
+
+- bcftools call
b
diff -r 000000000000 -r a531317a3527 bcftools_call.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/bcftools_call.xml Mon May 02 17:27:10 2016 -0400
[
b'@@ -0,0 +1,159 @@\n+<?xml version=\'1.0\' encoding=\'utf-8\'?>\n+<tool name="bcftools @EXECUTABLE@" id="bcftools_@EXECUTABLE@" version="@VERSION@.0">\n+  <description>SNP/indel variant calling from VCF/BCF</description>\n+  <macros>\n+    <token name="@EXECUTABLE@">call</token>\n+    <import>macros.xml</import>\n+  </macros>\n+  <expand macro="requirements" />\n+  <expand macro="version_command" />\n+  <command detect_errors="aggressive"><![CDATA[\n+bcftools @EXECUTABLE@\n+\n+## Consensus/variant calling section\n+#if $sec_consensus_variant_calling.select_caller == "consensus":\n+    --consensus-caller\n+#else:\n+    --multiallelic-caller\n+#end if\n+\n+#if $sec_consensus_variant_calling.constraints.constrain_select == "alleles":\n+  --constrain alleles\n+#elif $sec_consensus_variant_calling.constraints.constrain_select == "trio":\n+  --constrain trio\n+  --novel-rate ${sec_consensus_variant_calling.constraints.novel_snp},${sec_consensus_variant_calling.constraints.novel_ins},${sec_consensus_variant_calling.constraints.novel_del}\n+  --pval-threshold "${sec_consensus_variant_calling.constraints.pval_threshold}"\n+#end if\n+\n+#if $sec_consensus_variant_calling.prior:\n+  --prior "${sec_consensus_variant_calling.prior}"\n+#end if\n+${sec_consensus_variant_calling.chromosome_X}\n+${sec_consensus_variant_calling.chromosome_Y}\n+\n+\n+## File format section\n+#if str($sec_default.select_output_type) != "__none__":\n+  --output-type "${sec_default.select_output_type}"\n+#end if\n+@SEC_DEF_REGIONS@\n+@SEC_DEF_SAMPLES@\n+@SEC_DEF_TARGETS@\n+\n+\n+## Input/output section\n+${sec_input_output.keep_alts}\n+#set values_sec_input_output_format_fields = \'","\'.join([str($value) for $value in $sec_input_output.format_fields_repeat])\n+#if $values_sec_input_output_format_fields:\n+  --format-fields "${values_sec_input_output_format_fields}"\n+#end if\n+\n+#if str($sec_input_output.gvcf) != "":\n+  --gvcf "${sec_input_output.gvcf}"\n+#end if\n+\n+${sec_input_output.insert_missed}\n+${sec_input_output.keep_masked_ref}\n+\n+#if str($sec_input_output.skip_variants) != "__none__":\n+  --skip-variants "${sec_input_output.skip_variants}"\n+#end if\n+\n+${sec_input_output.variants_only}\n+\n+## Primary Input/Outputs\n+\n+$input_file\n+>\n+$output_file\n+]]>\n+</command>\n+  <inputs>\n+    <param name="input_file" label="VCF/BCF Data" type="data" format="vcf,bcf,vcf_bgz,bcf_bgz" />\n+    <section name="sec_consensus_variant_calling" expanded="true" title="Consensus/variant calling Options">\n+      <param name="select_caller" label="Calling Method" type="select">\n+        <option value="consensus">the original calling method (-c, --consensus-caller)</option>\n+        <option value="multiallelic">alternative model for multiallelic and rare-variant calling (-m, --multiallelic-caller)</option>\n+      </param>\n+      <conditional name="constraints" label="Constraints">\n+        <param name="constrain_select" label="Constraints" type="select" argument="-C">\n+          <option value="__none__" selected="True">No constraints</option>\n+          <option value="alleles">call genotypes given alleles (alleles)</option>\n+          <option value="trio">call genotypes given the father-mother-child constraint (trio)</option>\n+        </param>\n+        <when value="__none__" />\n+        <when value="alleles" />\n+        <when value="trio">\n+          <param name="novel_snp" label="Novel Rate: SNPs" type="float" default="1e-8" optional="True" help="mutation rate of SNPs" argument="--novel-rate"/>\n+          <param name="novel_ins" label="Novel Rate: Insertions" type="float" default="1e-9" optional="True" help="mutation rate of insertions according to their length" argument="--novel-rate" />\n+          <param name="novel_del" label="Novel Rate: Deletions" type="float" default="1e-9" optional="True" help="mutation rate of deletions according to their length" argument="--novel-rate" />\n+          <param name="pval_threshold" label="Pval Threshold" type="float" default="0.5" optional="True" help="variant if P(ref|D)&lt;FLOAT with -c" argument="--p'..b'e="" help="haploid output for males and skips females (requires PED file with -s)" argument="--chromosome-Y"/>\n+    </section>\n+    <section name="sec_default" expanded="true" title="Default Options">\n+      <expand macro="macro_select_output_type" />\n+      <expand macro="macro_regions" />\n+      <expand macro="macro_samples" />\n+      <expand macro="macro_targets" />\n+    </section>\n+    <section name="sec_input_output" expanded="true" title="Input/output Options">\n+      <param name="keep_alts" label="Keep Alts" type="boolean" truevalue="--keep-alts" falsevalue="" help="keep all possible alternate alleles at variant sites" argument="--keep-alts"/>\n+      <repeat name="format_fields_repeat" title="Format Fields">\n+        <param name="format_fields" type="text" label="Format Fields" help="output format fields: e.g. GQ, GP (lowercase allowed)" argument="--format-fields" />\n+      </repeat>\n+      <param name="gvcf" label="Gvcf" type="integer" optional="True" help="output gVCF blocks of homozygous REF calls. The parameter is the minimum per-sample depth required to include a site in the non-variant block." argument="--gvcf"/>\n+      <param name="insert_missed" label="Insert Missed" type="boolean" truevalue="--insert-missed" falsevalue="" help="output also sites missed by mpileup but present in -T" argument="--insert-missed"/>\n+      <param name="keep_masked_ref" label="Keep Masked Ref" type="boolean" truevalue="--keep-masked-ref" falsevalue="" help="keep sites with masked reference allele (REF=N)" argument="--keep-masked-ref"/>\n+      <param name="skip_variants" label="Skip Variants" type="select" help="Skip indels/SNP sites" argument="--skip-variants">\n+        <option value="__none__" selected="True">Don\'t skip any</option>\n+        <option value="indels">Skip indels</option>\n+        <option value="snps">Skip snps</option>\n+      </param>\n+      <param name="variants_only" label="Variants Only" type="boolean" truevalue="--variants-only" falsevalue="" help="output variant sites only" argument="--variants-only"/>\n+    </section>\n+  </inputs>\n+  <outputs>\n+    <data name="output_file" format="vcf">\n+      <change_format>\n+        <when input="sec_file_format|select_output_type" value="b" format="bcf_bgz" />\n+        <when input="sec_file_format|select_output_type" value="u" format="bcf" />\n+        <when input="sec_file_format|select_output_type" value="z" format="vcf_bgz" />\n+        <when input="sec_file_format|select_output_type" value="v" format="vcf" />\n+      </change_format>\n+    </data>\n+  </outputs>\n+  <tests>\n+      <test>\n+          <param name="input_file" value="mpileup.vcf" />\n+          <param name="sec_consensus_variant_calling|select_caller" value="multiallelic" />\n+          <param name="sec_input_output|variants_only" value="--variants-only" />\n+          <param name="sec_file_format|select_output_type" value="v" />\n+          <output name="output_file" file="mpileup.1.out" lines_diff="2" ftype="vcf" />\n+      </test>\n+      <test>\n+          <param name="input_file" value="mpileup.vcf" />\n+          <param name="sec_consensus_variant_calling|select_caller" value="multiallelic" />\n+          <param name="sec_input_output|variants_only" value="--variants-only" />\n+          <param name="sec_input_output|gvcf" value="0" />\n+          <param name="sec_file_format|select_output_type" value="v" />\n+          <output name="output_file" file="mpileup.2.out" lines_diff="2" ftype="vcf" />\n+      </test>\n+  </tests>\n+  <help>\n+      <![CDATA[\n+      **bcftools call**\n+\n+      SNP/indel variant calling from VCF/BCF. To be used in conjunction with\n+      samtools mpileup. This command replaces the former "bcftools view"\n+      caller. Some of the original functionality has been temporarily lost in\n+      the process of transition to htslib, but will be added back on popular\n+      demand. The original calling model can be invoked with the -c\n+      option.\n+      ]]>\n+  </help>\n+  <expand macro="citations" />\n+</tool>\n'
b
diff -r 000000000000 -r a531317a3527 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Mon May 02 17:27:10 2016 -0400
[
@@ -0,0 +1,74 @@
+<?xml version='1.0' encoding='utf-8'?>
+<macros>
+  <token name="@VERSION@">1.2</token>
+  <xml name="requirements">
+    <requirements>
+      <!-- This requirement handles also bcftools from BioConda channel => https://github.com/bioconda/bioconda-recipes/tree/60d2ea750430dbe0191f6f8d5639f90fc1223bd9/recipes/bcftools/1.2 -->
+      <requirement type="package" version="1.2">bcftools</requirement>
+    </requirements>
+  </xml>
+  <xml name="version_command">
+      <version_command><![CDATA[bcftools 2>&1 | grep 'Version:']]></version_command>
+  </xml>
+  <xml name="citations">
+    <citations>
+      <citation type="doi">10.1093/bioinformatics/btp352</citation>
+      <yield />
+    </citations>
+  </xml>
+  <xml name="macro_exclude">
+    <param name="exclude" label="Exclude" help="exclude sites for which the expression is true (see man page for details)" />
+  </xml>
+  <xml name="macro_collapse">
+      <param name="collapse" label="Collapse" type="select" optional="True" help="Controls how to treat records with duplicate positions and defines compatible records across multiple input files">
+        <option value="snps">snps</option>
+        <option value="indels">indels</option>
+        <option value="both">both</option>
+        <option value="all">all</option>
+        <option value="some">some</option>
+        <option value="none" selected="True">None</option>
+    </param>
+  </xml>
+  <xml name="macro_apply_filters_repeat">
+    <repeat name="apply_filters_repeat" title="Apply Filters">
+      <param name="apply_filters" label="Apply Filters" help="require at least one of the listed FILTER strings (e.g. &quot;PASS,.&quot;)" />
+    </repeat>
+  </xml>
+
+  <token name="@SEC_DEF_REGIONS@">
+#if $sec_default.regions_file:
+  --regions-file "${sec_default.regions_file}"
+#end if
+  </token>
+  <token name="@SEC_DEF_TARGETS@">
+#if $sec_default.targets_file:
+  --targets-file "${sec_default.targets_file}"
+#end if
+  </token>
+  <token name="@SEC_DEF_SAMPLES@">
+#if $sec_default.samples_file:
+  --samples-file "${sec_default.samples_file}"
+#end if
+  </token>
+
+  <xml name="macro_samples">
+    <param name="samples_file" label="Samples File" type="data" format="data" optional="True" help="file of samples to include" />
+    <param name="invert_samples_file" label="Invert Samples" type="boolean" truevalue="^" falsevalue="" help="inverts the query/filtering applied by the sample file selection" />
+  </xml>
+  <xml name="macro_targets">
+    <param name="targets_file" label="Targets File" type="data" format="data" optional="True" help="similar to -R but streams rather than index-jumps" />
+    <param name="invert_targets_file" label="Invert Targets" type="boolean" truevalue="^" falsevalue="" help="inverts the query/filtering applied by the target file selection" />
+  </xml>
+  <xml name="macro_regions">
+    <param name="regions_file" label="Regions File" type="data" format="data" optional="True" help="restrict to regions listed in a file" />
+    <param name="invert_regions_file" label="Invert Regions" type="boolean" truevalue="^" falsevalue="" help="inverts the query/filtering applied by region file selection" />
+  </xml>
+  <xml name="macro_select_output_type">
+    <param name="select_output_type" type="select">
+      <option value="v" selected="True">uncompressed VCF</option>
+      <option value="z">compressed VCF</option>
+      <option value="u">uncompressed BCF</option>
+      <option value="b">compressed BCF</option>
+    </param>
+  </xml>
+</macros>
b
diff -r 000000000000 -r a531317a3527 test-data/mpileup.1.out
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mpileup.1.out Mon May 02 17:27:10 2016 -0400
b
@@ -0,0 +1,40 @@
+##fileformat=VCFv4.2
+##FILTER=<ID=PASS,Description="All filters passed">
+##samtoolsVersion=1.1-19-g6b249e2+htslib-1.1-74-g845c515
+##samtoolsCommand=samtools mpileup -uvDV -b xxx//mpileup.bam.list -f xxx//mpileup.ref.fa.gz
+##reference=file://xxx//mpileup.ref.fa.gz
+##contig=<ID=17,length=81195210>
+##ALT=<ID=X,Description="Represents allele(s) other than observed.">
+##INFO=<ID=INDEL,Number=0,Type=Flag,Description="Indicates that the variant is an INDEL.">
+##INFO=<ID=IDV,Number=1,Type=Integer,Description="Maximum number of reads supporting an indel">
+##INFO=<ID=IMF,Number=1,Type=Float,Description="Maximum fraction of reads supporting an indel">
+##INFO=<ID=DP,Number=1,Type=Integer,Description="Raw read depth">
+##INFO=<ID=VDB,Number=1,Type=Float,Description="Variant Distance Bias for filtering splice-site artefacts in RNA-seq data (bigger is better)",Version="3">
+##INFO=<ID=RPB,Number=1,Type=Float,Description="Mann-Whitney U test of Read Position Bias (bigger is better)">
+##INFO=<ID=MQB,Number=1,Type=Float,Description="Mann-Whitney U test of Mapping Quality Bias (bigger is better)">
+##INFO=<ID=BQB,Number=1,Type=Float,Description="Mann-Whitney U test of Base Quality Bias (bigger is better)">
+##INFO=<ID=MQSB,Number=1,Type=Float,Description="Mann-Whitney U test of Mapping Quality vs Strand Bias (bigger is better)">
+##INFO=<ID=SGB,Number=1,Type=Float,Description="Segregation based metric.">
+##INFO=<ID=MQ0F,Number=1,Type=Float,Description="Fraction of MQ0 reads (smaller is better)">
+##FORMAT=<ID=PL,Number=G,Type=Integer,Description="List of Phred-scaled genotype likelihoods">
+##FORMAT=<ID=DP,Number=1,Type=Integer,Description="Number of high-quality bases">
+##FORMAT=<ID=DV,Number=1,Type=Integer,Description="Number of high-quality non-reference bases">
+##FORMAT=<ID=GT,Number=1,Type=String,Description="Genotype">
+##INFO=<ID=ICB,Number=1,Type=Float,Description="Inbreeding Coefficient Binomial test (bigger is better)">
+##INFO=<ID=HOB,Number=1,Type=Float,Description="Bias in the number of HOMs number (smaller is better)">
+##INFO=<ID=AC,Number=A,Type=Integer,Description="Allele count in genotypes for each ALT allele, in the same order as listed">
+##INFO=<ID=AN,Number=1,Type=Integer,Description="Total number of alleles in called genotypes">
+##INFO=<ID=DP4,Number=4,Type=Integer,Description="Number of high-quality ref-forward , ref-reverse, alt-forward and alt-reverse bases">
+##INFO=<ID=MQ,Number=1,Type=Integer,Description="Average mapping quality">
+#CHROM POS ID REF ALT QUAL FILTER INFO FORMAT HG00100 HG00101 HG00102
+17 302 . T TA 488 . INDEL;IDV=7;IMF=1;DP=25;VDB=0.27613;SGB=-4.22417;MQSB=0.0443614;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=2,4,8,11;MQ=49 GT:PL:DP:DV 0/1:167,0,96:11:6 0/1:157,0,9:7:6 1/1:201,21,0:7:7
+17 828 . T C 409 . DP=25;VDB=0.842082;SGB=-4.20907;RPB=0.950652;MQB=1;MQSB=1;BQB=0.929717;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=2,4,8,11;MQ=60 GT:PL:DP:DV 0/1:211,0,35:12:10 0/1:116,0,91:9:5 1/1:120,12,0:4:4
+17 834 . G A 364 . DP=25;VDB=0.788006;SGB=-4.01214;RPB=0.999233;MQB=1;MQSB=1;BQB=0.821668;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=2,3,7,10;MQ=60 GT:PL:DP:DV 0/1:185,0,46:11:9 0/1:128,0,59:8:5 1/1:89,9,0:3:3
+17 1665 . T C 3.10665 . DP=20;VDB=0.1;SGB=0.346553;RPB=0.222222;MQB=0.611111;MQSB=0.988166;BQB=0.944444;MQ0F=0;ICB=0.128205;HOB=0.0555556;AC=1;AN=6;DP4=7,11,1,1;MQ=55 GT:PL:DP:DV 0/0:0,21,185:7:0 0/0:0,27,222:9:0 0/1:35,0,51:4:2
+17 1869 . A T 138 . DP=24;VDB=0.928022;SGB=-11.9537;RPB=0.984127;MQB=0.96464;MQSB=0.931547;BQB=0.359155;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=6,9,5,4;MQ=58 GT:PL:DP:DV 0/1:115,0,224:18:7 0/1:16,0,104:5:1 1/1:42,3,0:1:1
+17 2041 . G A 447 . DP=31;VDB=0.816435;SGB=-4.18892;RPB=0.88473;MQB=0.972375;MQSB=0.968257;BQB=0.311275;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=6,5,12,7;MQ=58 GT:PL:DP:DV 0/1:229,0,212:21:11 0/1:32,0,24:2:1 1/1:223,21,0:7:7
+17 2220 . G A 303 . DP=21;VDB=0.532753;SGB=-3.51597;RPB=0.964198;MQB=0.898397;MQSB=0.875769;BQB=0.0354359;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=6,2,1,11;MQ=58 GT:PL:DP:DV 0/1:139,0,130:12:6 0/1:69,0,46:4:2 1/1:131,12,0:4:4
+17 2564 . A G 233 . DP=15;VDB=0.690812;SGB=-3.20711;RPB=0.197899;MQB=1;MQSB=1;BQB=0.965069;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=1,4,4,5;MQ=60 GT:PL:DP:DV 0/1:88,0,78:6:3 0/1:57,0,56:4:2 1/1:124,12,0:4:4
+17 3104 . C T 24.2837 . DP=25;VDB=0.8;SGB=0.346553;RPB=0.717391;MQB=0.956522;MQSB=0.962269;BQB=0.978261;MQ0F=0;ICB=0.128205;HOB=0.0555556;AC=1;AN=6;DP4=8,15,2,0;MQ=58 GT:PL:DP:DV 0/0:0,48,255:16:0 0/0:0,12,144:4:0 0/1:59,0,93:5:2
+17 3587 . G A 358 . DP=29;VDB=0.902044;SGB=-3.91326;RPB=0.800999;MQB=1;MQSB=1;BQB=0.156944;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=4,7,10,6;MQ=60 GT:PL:DP:DV 0/1:161,0,184:14:7 0/1:22,0,118:5:1 1/1:212,24,0:8:8
+17 3936 . A G 469 . DP=37;VDB=0.0574114;SGB=-4.60123;RPB=0.741697;MQB=0.812605;MQSB=0.143788;BQB=0.883831;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=5,6,6,17;MQ=56 GT:PL:DP:DV 0/1:233,0,206:20:11 0/1:77,0,58:6:4 1/1:196,24,0:8:8
b
diff -r 000000000000 -r a531317a3527 test-data/mpileup.2.out
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mpileup.2.out Mon May 02 17:27:10 2016 -0400
b
@@ -0,0 +1,53 @@
+##fileformat=VCFv4.2
+##FILTER=<ID=PASS,Description="All filters passed">
+##samtoolsVersion=1.1-19-g6b249e2+htslib-1.1-74-g845c515
+##samtoolsCommand=samtools mpileup -uvDV -b xxx//mpileup.bam.list -f xxx//mpileup.ref.fa.gz
+##reference=file://xxx//mpileup.ref.fa.gz
+##contig=<ID=17,length=81195210>
+##ALT=<ID=X,Description="Represents allele(s) other than observed.">
+##INFO=<ID=INDEL,Number=0,Type=Flag,Description="Indicates that the variant is an INDEL.">
+##INFO=<ID=IDV,Number=1,Type=Integer,Description="Maximum number of reads supporting an indel">
+##INFO=<ID=IMF,Number=1,Type=Float,Description="Maximum fraction of reads supporting an indel">
+##INFO=<ID=DP,Number=1,Type=Integer,Description="Raw read depth">
+##INFO=<ID=VDB,Number=1,Type=Float,Description="Variant Distance Bias for filtering splice-site artefacts in RNA-seq data (bigger is better)",Version="3">
+##INFO=<ID=RPB,Number=1,Type=Float,Description="Mann-Whitney U test of Read Position Bias (bigger is better)">
+##INFO=<ID=MQB,Number=1,Type=Float,Description="Mann-Whitney U test of Mapping Quality Bias (bigger is better)">
+##INFO=<ID=BQB,Number=1,Type=Float,Description="Mann-Whitney U test of Base Quality Bias (bigger is better)">
+##INFO=<ID=MQSB,Number=1,Type=Float,Description="Mann-Whitney U test of Mapping Quality vs Strand Bias (bigger is better)">
+##INFO=<ID=SGB,Number=1,Type=Float,Description="Segregation based metric.">
+##INFO=<ID=MQ0F,Number=1,Type=Float,Description="Fraction of MQ0 reads (smaller is better)">
+##FORMAT=<ID=PL,Number=G,Type=Integer,Description="List of Phred-scaled genotype likelihoods">
+##FORMAT=<ID=DP,Number=1,Type=Integer,Description="Number of high-quality bases">
+##FORMAT=<ID=DV,Number=1,Type=Integer,Description="Number of high-quality non-reference bases">
+##FORMAT=<ID=GT,Number=1,Type=String,Description="Genotype">
+##INFO=<ID=ICB,Number=1,Type=Float,Description="Inbreeding Coefficient Binomial test (bigger is better)">
+##INFO=<ID=HOB,Number=1,Type=Float,Description="Bias in the number of HOMs number (smaller is better)">
+##INFO=<ID=AC,Number=A,Type=Integer,Description="Allele count in genotypes for each ALT allele, in the same order as listed">
+##INFO=<ID=AN,Number=1,Type=Integer,Description="Total number of alleles in called genotypes">
+##INFO=<ID=DP4,Number=4,Type=Integer,Description="Number of high-quality ref-forward , ref-reverse, alt-forward and alt-reverse bases">
+##INFO=<ID=MQ,Number=1,Type=Integer,Description="Average mapping quality">
+##INFO=<ID=END,Number=1,Type=Integer,Description="End position of the variant described in this record">
+#CHROM POS ID REF ALT QUAL FILTER INFO FORMAT HG00100 HG00101 HG00102
+17 1 . A . . . END=301 GT 0/0 0/0 0/0
+17 302 . T TA 488 . INDEL;IDV=7;IMF=1;DP=25;VDB=0.27613;SGB=-4.22417;MQSB=0.0443614;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=2,4,8,11;MQ=49 GT:PL:DP:DV 0/1:167,0,96:11:6 0/1:157,0,9:7:6 1/1:201,21,0:7:7
+17 303 . G . . . END=827 GT 0/0 0/0 0/0
+17 828 . T C 409 . DP=25;VDB=0.842082;SGB=-4.20907;RPB=0.950652;MQB=1;MQSB=1;BQB=0.929717;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=2,4,8,11;MQ=60 GT:PL:DP:DV 0/1:211,0,35:12:10 0/1:116,0,91:9:5 1/1:120,12,0:4:4
+17 829 . T . . . END=833 GT 0/0 0/0 0/0
+17 834 . G A 364 . DP=25;VDB=0.788006;SGB=-4.01214;RPB=0.999233;MQB=1;MQSB=1;BQB=0.821668;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=2,3,7,10;MQ=60 GT:PL:DP:DV 0/1:185,0,46:11:9 0/1:128,0,59:8:5 1/1:89,9,0:3:3
+17 835 . T . . . END=1664 GT 0/0 0/0 0/0
+17 1665 . T C 3.10665 . DP=20;VDB=0.1;SGB=0.346553;RPB=0.222222;MQB=0.611111;MQSB=0.988166;BQB=0.944444;MQ0F=0;ICB=0.128205;HOB=0.0555556;AC=1;AN=6;DP4=7,11,1,1;MQ=55 GT:PL:DP:DV 0/0:0,21,185:7:0 0/0:0,27,222:9:0 0/1:35,0,51:4:2
+17 1666 . G . . . END=1868 GT 0/0 0/0 0/0
+17 1869 . A T 138 . DP=24;VDB=0.928022;SGB=-11.9537;RPB=0.984127;MQB=0.96464;MQSB=0.931547;BQB=0.359155;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=6,9,5,4;MQ=58 GT:PL:DP:DV 0/1:115,0,224:18:7 0/1:16,0,104:5:1 1/1:42,3,0:1:1
+17 1870 . C . . . END=2040 GT 0/0 0/0 0/0
+17 2041 . G A 447 . DP=31;VDB=0.816435;SGB=-4.18892;RPB=0.88473;MQB=0.972375;MQSB=0.968257;BQB=0.311275;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=6,5,12,7;MQ=58 GT:PL:DP:DV 0/1:229,0,212:21:11 0/1:32,0,24:2:1 1/1:223,21,0:7:7
+17 2042 . G . . . END=2219 GT 0/0 0/0 0/0
+17 2220 . G A 303 . DP=21;VDB=0.532753;SGB=-3.51597;RPB=0.964198;MQB=0.898397;MQSB=0.875769;BQB=0.0354359;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=6,2,1,11;MQ=58 GT:PL:DP:DV 0/1:139,0,130:12:6 0/1:69,0,46:4:2 1/1:131,12,0:4:4
+17 2221 . G . . . END=2563 GT 0/0 0/0 0/0
+17 2564 . A G 233 . DP=15;VDB=0.690812;SGB=-3.20711;RPB=0.197899;MQB=1;MQSB=1;BQB=0.965069;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=1,4,4,5;MQ=60 GT:PL:DP:DV 0/1:88,0,78:6:3 0/1:57,0,56:4:2 1/1:124,12,0:4:4
+17 2565 . A . . . END=3103 GT 0/0 0/0 0/0
+17 3104 . C T 24.2837 . DP=25;VDB=0.8;SGB=0.346553;RPB=0.717391;MQB=0.956522;MQSB=0.962269;BQB=0.978261;MQ0F=0;ICB=0.128205;HOB=0.0555556;AC=1;AN=6;DP4=8,15,2,0;MQ=58 GT:PL:DP:DV 0/0:0,48,255:16:0 0/0:0,12,144:4:0 0/1:59,0,93:5:2
+17 3105 . T . . . END=3586 GT 0/0 0/0 0/0
+17 3587 . G A 358 . DP=29;VDB=0.902044;SGB=-3.91326;RPB=0.800999;MQB=1;MQSB=1;BQB=0.156944;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=4,7,10,6;MQ=60 GT:PL:DP:DV 0/1:161,0,184:14:7 0/1:22,0,118:5:1 1/1:212,24,0:8:8
+17 3588 . A . . . END=3935 GT 0/0 0/0 0/0
+17 3936 . A G 469 . DP=37;VDB=0.0574114;SGB=-4.60123;RPB=0.741697;MQB=0.812605;MQSB=0.143788;BQB=0.883831;MQ0F=0;ICB=0.8;HOB=0.222222;AC=4;AN=6;DP4=5,6,6,17;MQ=56 GT:PL:DP:DV 0/1:233,0,206:20:11 0/1:77,0,58:6:4 1/1:196,24,0:8:8
+17 3937 . C . . . END=4101 GT 0/0 0/0 0/0
b
diff -r 000000000000 -r a531317a3527 test-data/mpileup.vcf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mpileup.vcf Mon May 02 17:27:10 2016 -0400
b
b'@@ -0,0 +1,4127 @@\n+##fileformat=VCFv4.2\n+##FILTER=<ID=PASS,Description="All filters passed">\n+##samtoolsVersion=1.1-19-g6b249e2+htslib-1.1-74-g845c515\n+##samtoolsCommand=samtools mpileup -uvDV -b xxx//mpileup.bam.list -f xxx//mpileup.ref.fa.gz\n+##reference=file://xxx//mpileup.ref.fa.gz\n+##contig=<ID=17,length=81195210>\n+##ALT=<ID=X,Description="Represents allele(s) other than observed.">\n+##INFO=<ID=INDEL,Number=0,Type=Flag,Description="Indicates that the variant is an INDEL.">\n+##INFO=<ID=IDV,Number=1,Type=Integer,Description="Maximum number of reads supporting an indel">\n+##INFO=<ID=IMF,Number=1,Type=Float,Description="Maximum fraction of reads supporting an indel">\n+##INFO=<ID=DP,Number=1,Type=Integer,Description="Raw read depth">\n+##INFO=<ID=VDB,Number=1,Type=Float,Description="Variant Distance Bias for filtering splice-site artefacts in RNA-seq data (bigger is better)",Version="3">\n+##INFO=<ID=RPB,Number=1,Type=Float,Description="Mann-Whitney U test of Read Position Bias (bigger is better)">\n+##INFO=<ID=MQB,Number=1,Type=Float,Description="Mann-Whitney U test of Mapping Quality Bias (bigger is better)">\n+##INFO=<ID=BQB,Number=1,Type=Float,Description="Mann-Whitney U test of Base Quality Bias (bigger is better)">\n+##INFO=<ID=MQSB,Number=1,Type=Float,Description="Mann-Whitney U test of Mapping Quality vs Strand Bias (bigger is better)">\n+##INFO=<ID=SGB,Number=1,Type=Float,Description="Segregation based metric.">\n+##INFO=<ID=MQ0F,Number=1,Type=Float,Description="Fraction of MQ0 reads (smaller is better)">\n+##INFO=<ID=I16,Number=16,Type=Float,Description="Auxiliary tag used for calling, see description of bcf_callret1_t in bam2bcf.h">\n+##INFO=<ID=QS,Number=R,Type=Float,Description="Auxiliary tag used for calling">\n+##FORMAT=<ID=PL,Number=G,Type=Integer,Description="List of Phred-scaled genotype likelihoods">\n+##FORMAT=<ID=DP,Number=1,Type=Integer,Description="Number of high-quality bases">\n+##FORMAT=<ID=DV,Number=1,Type=Integer,Description="Number of high-quality non-reference bases">\n+#CHROM\tPOS\tID\tREF\tALT\tQUAL\tFILTER\tINFO\tFORMAT\tHG00100\tHG00101\tHG00102\n+17\t1\t.\tA\t<X>\t0\t.\tDP=11;I16=11,0,0,0,452,18594,0,0,319,9251,0,0,223,4959,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t2\t.\tA\t<X>\t0\t.\tDP=11;I16=11,0,0,0,439,17587,0,0,319,9251,0,0,226,5030,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t3\t.\tG\t<X>\t0\t.\tDP=11;I16=11,0,0,0,431,16971,0,0,319,9251,0,0,229,5111,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t4\t.\tC\t<X>\t0\t.\tDP=11;I16=11,0,0,0,423,16417,0,0,319,9251,0,0,232,5202,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,71:3:0\n+17\t5\t.\tT\t<X>\t0\t.\tDP=11;I16=11,0,0,0,450,18520,0,0,319,9251,0,0,234,5252,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t6\t.\tT\t<X>\t0\t.\tDP=11;I16=11,0,0,0,403,14847,0,0,319,9251,0,0,236,5310,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t7\t.\tC\t<X>\t0\t.\tDP=11;I16=11,0,0,0,446,18114,0,0,319,9251,0,0,237,5327,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t8\t.\tT\t<X>\t0\t.\tDP=11;I16=11,0,0,0,465,19677,0,0,319,9251,0,0,238,5354,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t9\t.\tC\t<X>\t0\t.\tDP=11;I16=11,0,0,0,447,18205,0,0,319,9251,0,0,239,5391,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t10\t.\tA\t<X>\t0\t.\tDP=11;I16=11,0,0,0,426,16756,0,0,319,9251,0,0,240,5438,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,69:3:0\n+17\t11\t.\tC\t<X>\t0\t.\tDP=11;I16=11,0,0,0,413,15603,0,0,319,9251,0,0,241,5495,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t12\t.\tC\t<X>\t0\t.\tDP=11;I16=11,0,0,0,438,17506,0,0,319,9251,0,0,242,5562,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t13\t.\tC\t<X>\t0\t.\tDP=11;I16=11,0,0,0,437,17463,0,0,319,9251,0,0,243,5639,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t14\t.\tT\t<X>\t0\t.\tDP=11;I16=11,0,0,0,453,18715,0,0,319,9251,0,0,242,5628,0,0;QS=3,0;MQ0F=0\tPL:DP:DV\t0,15,100:5:0\t0,9,72:3:0\t0,9,72:3:0\n+17\t15\t.\tG\t'..b':DV\t0,15,142:5:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4072\t.\tG\t<X>\t0\t.\tDP=5;I16=2,2,0,0,138,4974,0,0,194,9938,0,0,55,987,0,0;QS=1,0;MQSB=0;MQ0F=0\tPL:DP:DV\t0,12,122:4:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4073\t.\tG\t<X>\t0\t.\tDP=5;I16=3,2,0,0,156,5082,0,0,254,13538,0,0,60,994,0,0;QS=1,0;MQSB=0.333333;MQ0F=0\tPL:DP:DV\t0,15,136:5:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4074\t.\tC\t<X>\t0\t.\tDP=5;I16=3,2,0,0,160,5602,0,0,254,13538,0,0,56,928,0,0;QS=1,0;MQSB=0.333333;MQ0F=0\tPL:DP:DV\t0,15,142:5:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4075\t.\tT\t<X>\t0\t.\tDP=5;I16=3,2,0,0,187,7069,0,0,254,13538,0,0,52,870,0,0;QS=1,0;MQSB=0.333333;MQ0F=0\tPL:DP:DV\t0,15,155:5:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4076\t.\tG\t<X>\t0\t.\tDP=5;I16=3,2,0,0,174,6298,0,0,254,13538,0,0,48,820,0,0;QS=1,0;MQSB=0.333333;MQ0F=0\tPL:DP:DV\t0,15,149:5:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4077\t.\tA\t<X>\t0\t.\tDP=4;I16=3,1,0,0,138,4810,0,0,194,9938,0,0,44,728,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,12,121:4:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4078\t.\tT\t<X>\t0\t.\tDP=4;I16=3,1,0,0,143,5173,0,0,194,9938,0,0,40,644,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,12,124:4:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4079\t.\tA\t<X>\t0\t.\tDP=4;I16=3,1,0,0,121,3847,0,0,194,9938,0,0,36,568,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,12,107:4:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4080\t.\tT\t<X>\t0\t.\tDP=4;I16=3,0,0,0,106,3778,0,0,134,6338,0,0,25,451,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,9,87:3:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4081\t.\tT\t<X>\t0\t.\tDP=4;I16=3,1,0,0,106,2934,0,0,194,9938,0,0,28,440,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,12,94:4:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4082\t.\tC\t<X>\t0\t.\tDP=3;I16=2,1,0,0,110,4042,0,0,134,6338,0,0,25,387,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,9,103:3:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4083\t.\tC\t<X>\t0\t.\tDP=3;I16=2,1,0,0,104,3648,0,0,134,6338,0,0,22,340,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,9,98:3:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4084\t.\tA\t<X>\t0\t.\tDP=2;I16=1,1,0,0,78,3050,0,0,97,4969,0,0,20,298,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,6,74:2:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4085\t.\tC\t<X>\t0\t.\tDP=2;I16=1,1,0,0,62,1940,0,0,97,4969,0,0,18,260,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,6,62:2:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4086\t.\tG\t<X>\t0\t.\tDP=2;I16=1,1,0,0,56,1640,0,0,97,4969,0,0,16,226,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,6,56:2:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4087\t.\tC\t<X>\t0\t.\tDP=2;I16=1,1,0,0,69,2405,0,0,97,4969,0,0,14,196,0,0;QS=1,0;MQSB=1;MQ0F=0\tPL:DP:DV\t0,6,68:2:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4088\t.\tA\t<X>\t0\t.\tDP=1;I16=1,0,0,0,39,1521,0,0,37,1369,0,0,13,169,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,37:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4089\t.\tC\t<X>\t0\t.\tDP=1;I16=1,0,0,0,36,1296,0,0,37,1369,0,0,12,144,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,36:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4090\t.\tC\t<X>\t0\t.\tDP=1;I16=1,0,0,0,33,1089,0,0,37,1369,0,0,11,121,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,33:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4091\t.\tT\t<X>\t0\t.\tDP=1;I16=1,0,0,0,36,1296,0,0,37,1369,0,0,10,100,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,36:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4092\t.\tG\t<X>\t0\t.\tDP=1;I16=1,0,0,0,37,1369,0,0,37,1369,0,0,9,81,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,37:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4093\t.\tC\t<X>\t0\t.\tDP=1;I16=1,0,0,0,35,1225,0,0,37,1369,0,0,8,64,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,35:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4094\t.\tT\t<X>\t0\t.\tDP=1;I16=1,0,0,0,40,1600,0,0,37,1369,0,0,7,49,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,37:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4095\t.\tA\t<X>\t0\t.\tDP=1;I16=1,0,0,0,35,1225,0,0,37,1369,0,0,6,36,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,35:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4096\t.\tC\t<X>\t0\t.\tDP=1;I16=1,0,0,0,32,1024,0,0,37,1369,0,0,5,25,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,32:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4097\t.\tA\t<X>\t0\t.\tDP=1;I16=1,0,0,0,35,1225,0,0,37,1369,0,0,4,16,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,35:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4098\t.\tC\t<X>\t0\t.\tDP=1;I16=1,0,0,0,31,961,0,0,37,1369,0,0,3,9,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,31:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4099\t.\tT\t<X>\t0\t.\tDP=1;I16=1,0,0,0,32,1024,0,0,37,1369,0,0,2,4,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,32:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4100\t.\tC\t<X>\t0\t.\tDP=1;I16=1,0,0,0,27,729,0,0,37,1369,0,0,1,1,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,27:1:0\t0,0,0:0:0\t0,0,0:0:0\n+17\t4101\t.\tC\t<X>\t0\t.\tDP=1;I16=1,0,0,0,26,676,0,0,37,1369,0,0,0,0,0,0;QS=1,0;MQ0F=0\tPL:DP:DV\t0,3,26:1:0\t0,0,0:0:0\t0,0,0:0:0\n'
b
diff -r 000000000000 -r a531317a3527 tool_dependencies.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml Mon May 02 17:27:10 2016 -0400
b
@@ -0,0 +1,6 @@
+<?xml version="1.0"?>
+<tool_dependency>
+  <package name="samtools" version="0.1.19">
+    <repository changeset_revision="95d2c4aefb5f" name="package_samtools_0_1_19" owner="devteam" toolshed="https://toolshed.g2.bx.psu.edu" />
+  </package>
+</tool_dependency>