changeset 38:e698621cca1f draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/freebayes commit cdd582adf568e80558740ec7ff51c9447948cf77
author iuc
date Wed, 07 May 2025 05:35:17 +0000
parents 1e1291983bc7
children
files freebayes.xml leftalign.xml test-data/freebayes-phix174-input-sites-test3.vcf.bgzip test-data/freebayes-phix174-test3.vcf
diffstat 4 files changed, 20 insertions(+), 92 deletions(-) [+]
line wrap: on
line diff
--- a/freebayes.xml	Mon Mar 10 11:15:42 2025 +0000
+++ b/freebayes.xml	Wed May 07 05:35:17 2025 +0000
@@ -1,4 +1,4 @@
-<tool id="freebayes" name="FreeBayes" version="@TOOL_VERSION@+galaxy0">
+<tool id="freebayes" name="FreeBayes" version="@TOOL_VERSION@+galaxy1">
     <description>bayesian genetic variant detector</description>
     <xrefs>
         <xref type="bio.tools">freebayes</xref>
@@ -39,10 +39,10 @@
         #end if
     #end for
 
-    ## Tabixize optional input_variant_vcf file (for --variant-input option)
+    ## For --variant-input option, create symlinks to vcf.bgzip input and its accompanying tabix index
     #if ( str( $options_type.options_type_selector ) == 'cline' or str( $options_type.options_type_selector ) == 'full' ) and str( $options_type.optional_inputs.optional_inputs_selector ) == 'set' and str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf":
         ln -s -f '${options_type.optional_inputs.input_variant_type.input_variant_vcf}' input_variant_vcf.vcf.gz &&
-        ln -s -f '${Tabixized_input}' input_variant_vcf.vcf.gz.tbi &&
+        ln -s '$options_type.optional_inputs.input_variant_type.input_variant_vcf.metadata.tabix_index' input_variant_vcf.vcf.gz.tbi &&
     #end if
 
     ##if the user has specified a region or target file, just use that instead of calculating a set of unique regions
@@ -129,7 +129,7 @@
                     --cnv-map '${options_type.optional_inputs.A}'
                 #end if
                 #if str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf":
-                    --variant-input 'input_variant_vcf.vcf.gz'  ## input_variant_vcf.vcf.gz is symlinked to a galaxy-generated dataset in "Tabixize optional input_variant_vcf file" section of the command line above
+                    --variant-input 'input_variant_vcf.vcf.gz'
                     ${options_type.optional_inputs.input_variant_type.only_use_input_alleles}
                 #end if
                 #if $options_type.optional_inputs.haplotype_basis_alleles:
@@ -365,9 +365,7 @@
                             <when value="do_not_provide" />
                             <when value="provide_vcf">
                                 <param name="input_variant_vcf" argument="--variant-input" type="data" format="vcf_bgzip"
-                                       label="Use variants reported in this VCF dataset as input to the algorithm">
-                                    <conversion name="Tabixized_input" type="tabix" />
-                                </param>
+                                       label="Use variants reported in this VCF dataset as input to the algorithm"/>
                                 <param name="only_use_input_alleles" argument="--only-use-input-alleles" type="boolean" truevalue="--only-use-input-alleles" falsevalue="" checked="false"
                                        label="Only provide variant calls and genotype likelihoods for sites in VCF" />
                             </when>
@@ -640,15 +638,25 @@
             <param name="min_coverage" value="14"/>
             <output name="output_vcf" file="freebayes-phix174-test2.vcf" lines_diff="4" />
         </test>
+        <!-- Test that user-provided (variant-input option) sites are included in output -->
         <test>
             <param name="reference_source_selector" value="history" />
             <param name="processmode" value="individual" />
             <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
             <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
-            <param name="options_type_selector" value="naive_w_filters"/>
-            <param name="coverage_options_selector" value="set" />
-            <param name="min_coverage" value="14"/>
-            <output name="output_vcf" file="freebayes-phix174-test3.vcf" lines_diff="4" />
+            <param name="options_type_selector" value="full"/>
+            <conditional name="optional_inputs">
+                <param name="optional_inputs_selector" value="set" />
+                <conditional name="input_variant_type">
+                    <param name="input_variant_type_selector" value="provide_vcf" />
+                    <param name="input_variant_vcf" value="freebayes-phix174-input-sites-test3.vcf.bgzip" />
+                </conditional>
+            </conditional>
+            <output name="output_vcf">
+                <assert_contents>
+                    <has_line_matching expression="phiX174&#009;1134&#009;\.&#009;A&#009;\.&#009;.+"/>
+                </assert_contents>
+            </output>
         </test>
         <test>
             <param name="reference_source_selector" value="history" />
--- a/leftalign.xml	Mon Mar 10 11:15:42 2025 +0000
+++ b/leftalign.xml	Wed May 07 05:35:17 2025 +0000
@@ -1,5 +1,5 @@
 <?xml version="1.0"?>
-<tool id="bamleftalign" name="BamLeftAlign" version="@TOOL_VERSION@">
+<tool id="bamleftalign" name="BamLeftAlign" version="@TOOL_VERSION@+galaxy1">
     <description> indels in BAM datasets</description>
     <xrefs>
         <xref type="bio.tools">freebayes</xref>
Binary file test-data/freebayes-phix174-input-sites-test3.vcf.bgzip has changed
--- a/test-data/freebayes-phix174-test3.vcf	Mon Mar 10 11:15:42 2025 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,80 +0,0 @@
-##fileformat=VCFv4.2
-##fileDate=20191031
-##source=freeBayes v1.3.5
-##reference=localref.fa
-##contig=<ID=phiX174,length=5386>
-##phasing=none
-##commandline="freebayes --region phiX174:0..5386 --bam b_0.bam --fasta-reference localref.fa --vcf ./vcf_output/part_phiX174:0..5386.vcf --min-coverage 14 --skip-coverage 0 --limit-coverage 0 --haplotype-length 0 --min-alternate-count 1 --min-alternate-fraction 0.05 --pooled-continuous --report-monomorphic --standard-filters"
-##INFO=<ID=NS,Number=1,Type=Integer,Description="Number of samples with data">
-##INFO=<ID=DP,Number=1,Type=Integer,Description="Total read depth at the locus">
-##INFO=<ID=DPB,Number=1,Type=Float,Description="Total read depth per bp at the locus; bases in reads overlapping / bases in haplotype">
-##INFO=<ID=AC,Number=A,Type=Integer,Description="Total number of alternate alleles in called genotypes">
-##INFO=<ID=AN,Number=1,Type=Integer,Description="Total number of alleles in called genotypes">
-##INFO=<ID=AF,Number=A,Type=Float,Description="Estimated allele frequency in the range (0,1]">
-##INFO=<ID=RO,Number=1,Type=Integer,Description="Count of full observations of the reference haplotype.">
-##INFO=<ID=AO,Number=A,Type=Integer,Description="Count of full observations of this alternate haplotype.">
-##INFO=<ID=PRO,Number=1,Type=Float,Description="Reference allele observation count, with partial observations recorded fractionally">
-##INFO=<ID=PAO,Number=A,Type=Float,Description="Alternate allele observations, with partial observations recorded fractionally">
-##INFO=<ID=QR,Number=1,Type=Integer,Description="Reference allele quality sum in phred">
-##INFO=<ID=QA,Number=A,Type=Integer,Description="Alternate allele quality sum in phred">
-##INFO=<ID=PQR,Number=1,Type=Float,Description="Reference allele quality sum in phred for partial observations">
-##INFO=<ID=PQA,Number=A,Type=Float,Description="Alternate allele quality sum in phred for partial observations">
-##INFO=<ID=SRF,Number=1,Type=Integer,Description="Number of reference observations on the forward strand">
-##INFO=<ID=SRR,Number=1,Type=Integer,Description="Number of reference observations on the reverse strand">
-##INFO=<ID=SAF,Number=A,Type=Integer,Description="Number of alternate observations on the forward strand">
-##INFO=<ID=SAR,Number=A,Type=Integer,Description="Number of alternate observations on the reverse strand">
-##INFO=<ID=SRP,Number=1,Type=Float,Description="Strand balance probability for the reference allele: Phred-scaled upper-bounds estimate of the probability of observing the deviation between SRF and SRR given E(SRF/SRR) ~ 0.5, derived using Hoeffding's inequality">
-##INFO=<ID=SAP,Number=A,Type=Float,Description="Strand balance probability for the alternate allele: Phred-scaled upper-bounds estimate of the probability of observing the deviation between SAF and SAR given E(SAF/SAR) ~ 0.5, derived using Hoeffding's inequality">
-##INFO=<ID=AB,Number=A,Type=Float,Description="Allele balance at heterozygous sites: a number between 0 and 1 representing the ratio of reads showing the reference allele to all reads, considering only reads from individuals called as heterozygous">
-##INFO=<ID=ABP,Number=A,Type=Float,Description="Allele balance probability at heterozygous sites: Phred-scaled upper-bounds estimate of the probability of observing the deviation between ABR and ABA given E(ABR/ABA) ~ 0.5, derived using Hoeffding's inequality">
-##INFO=<ID=RUN,Number=A,Type=Integer,Description="Run length: the number of consecutive repeats of the alternate allele in the reference genome">
-##INFO=<ID=RPP,Number=A,Type=Float,Description="Read Placement Probability: Phred-scaled upper-bounds estimate of the probability of observing the deviation between RPL and RPR given E(RPL/RPR) ~ 0.5, derived using Hoeffding's inequality">
-##INFO=<ID=RPPR,Number=1,Type=Float,Description="Read Placement Probability for reference observations: Phred-scaled upper-bounds estimate of the probability of observing the deviation between RPL and RPR given E(RPL/RPR) ~ 0.5, derived using Hoeffding's inequality">
-##INFO=<ID=RPL,Number=A,Type=Float,Description="Reads Placed Left: number of reads supporting the alternate balanced to the left (5') of the alternate allele">
-##INFO=<ID=RPR,Number=A,Type=Float,Description="Reads Placed Right: number of reads supporting the alternate balanced to the right (3') of the alternate allele">
-##INFO=<ID=EPP,Number=A,Type=Float,Description="End Placement Probability: Phred-scaled upper-bounds estimate of the probability of observing the deviation between EL and ER given E(EL/ER) ~ 0.5, derived using Hoeffding's inequality">
-##INFO=<ID=EPPR,Number=1,Type=Float,Description="End Placement Probability for reference observations: Phred-scaled upper-bounds estimate of the probability of observing the deviation between EL and ER given E(EL/ER) ~ 0.5, derived using Hoeffding's inequality">
-##INFO=<ID=DPRA,Number=A,Type=Float,Description="Alternate allele depth ratio.  Ratio between depth in samples with each called alternate allele and those without.">
-##INFO=<ID=ODDS,Number=1,Type=Float,Description="The log odds ratio of the best genotype combination to the second-best.">
-##INFO=<ID=GTI,Number=1,Type=Integer,Description="Number of genotyping iterations required to reach convergence or bailout.">
-##INFO=<ID=TYPE,Number=A,Type=String,Description="The type of allele, either snp, mnp, ins, del, or complex.">
-##INFO=<ID=CIGAR,Number=A,Type=String,Description="The extended CIGAR representation of each alternate allele, with the exception that '=' is replaced by 'M' to ease VCF parsing.  Note that INDEL alleles do not have the first matched base (which is provided by default, per the spec) referred to by the CIGAR.">
-##INFO=<ID=NUMALT,Number=1,Type=Integer,Description="Number of unique non-reference alleles in called genotypes at this position.">
-##INFO=<ID=MEANALT,Number=A,Type=Float,Description="Mean number of unique non-reference allele observations per sample with the corresponding alternate alleles.">
-##INFO=<ID=LEN,Number=A,Type=Integer,Description="allele length">
-##INFO=<ID=MQM,Number=A,Type=Float,Description="Mean mapping quality of observed alternate alleles">
-##INFO=<ID=MQMR,Number=1,Type=Float,Description="Mean mapping quality of observed reference alleles">
-##INFO=<ID=PAIRED,Number=A,Type=Float,Description="Proportion of observed alternate alleles which are supported by properly paired read fragments">
-##INFO=<ID=PAIREDR,Number=1,Type=Float,Description="Proportion of observed reference alleles which are supported by properly paired read fragments">
-##INFO=<ID=MIN_DP,Number=1,Type=Integer,Description="Minimum depth in gVCF output block.">
-##INFO=<ID=END,Number=1,Type=Integer,Description="Last position (inclusive) in gVCF output record.">
-##FORMAT=<ID=GT,Number=1,Type=String,Description="Genotype">
-##FORMAT=<ID=GQ,Number=1,Type=Float,Description="Genotype Quality, the Phred-scaled marginal (or unconditional) probability of the called genotype">
-##FORMAT=<ID=GL,Number=G,Type=Float,Description="Genotype Likelihood, log10-scaled likelihoods of the data given the called genotype for each possible genotype generated from the reference and alternate alleles given the sample ploidy">
-##FORMAT=<ID=DP,Number=1,Type=Integer,Description="Read Depth">
-##FORMAT=<ID=AD,Number=R,Type=Integer,Description="Number of observation for each allele">
-##FORMAT=<ID=RO,Number=1,Type=Integer,Description="Reference allele observation count">
-##FORMAT=<ID=QR,Number=1,Type=Integer,Description="Sum of quality of the reference observations">
-##FORMAT=<ID=AO,Number=A,Type=Integer,Description="Alternate allele observation count">
-##FORMAT=<ID=QA,Number=A,Type=Integer,Description="Sum of quality of the alternate observations">
-##FORMAT=<ID=MIN_DP,Number=1,Type=Integer,Description="Minimum depth in gVCF output block.">
-#CHROM	POS	ID	REF	ALT	QUAL	FILTER	INFO	FORMAT	unknown
-phiX174	1134	.	A	.	0	.	DP=14;DPB=14;EPPR=3.0103;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=916;RO=14;RPPR=8.59409	GT:DP:AD:RO:QR:AO:QA:GL	0/0:14:14:14:916:.:.:0
-phiX174	1135	.	C	.	0	.	DP=14;DPB=14;EPPR=3.63072;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=957;RO=14;RPPR=5.49198	GT:DP:AD:RO:QR:AO:QA:GL	0/0:14:14:14:957:.:.:0
-phiX174	1136	.	G	.	0	.	DP=14;DPB=14;EPPR=8.59409;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=919;RO=14;RPPR=3.0103	GT:DP:AD:RO:QR:AO:QA:GL	0/0:14:14:14:919:.:.:0
-phiX174	1137	.	C	.	0	.	DP=14;DPB=14;EPPR=5.49198;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=927;RO=14;RPPR=3.63072	GT:DP:AD:RO:QR:AO:QA:GL	0/0:14:14:14:927:.:.:0
-phiX174	1138	.	C	.	0	.	DP=14;DPB=14;EPPR=3.63072;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=876;RO=14;RPPR=5.49198	GT:DP:AD:RO:QR:AO:QA:GL	0/0:14:14:14:876:.:.:0
-phiX174	1139	.	G	.	0	.	DP=14;DPB=14;EPPR=3.63072;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=946;RO=14;RPPR=5.49198	GT:DP:AD:RO:QR:AO:QA:GL	0/0:14:14:14:946:.:.:0
-phiX174	1140	.	T	.	0	.	DP=15;DPB=15;EPPR=4.31318;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=927;RO=15;RPPR=4.31318	GT:DP:AD:RO:QR:AO:QA:GL	0/0:15:15:15:927:.:.:0
-phiX174	1141	.	T	G	3.61953e-07	.	AB=0;ABP=0;AC=0;AF=0;AN=2;AO=1;CIGAR=1X;DP=15;DPB=15;DPRA=0;EPP=5.18177;EPPR=3.63072;GTI=0;LEN=1;MEANALT=1;MQM=37;MQMR=37;NS=1;NUMALT=1;ODDS=16.3003;PAIRED=0;PAIREDR=0;PAO=0;PQA=0;PQR=0;PRO=0;QA=50;QR=880;RO=14;RPL=0;RPP=5.18177;RPPR=5.49198;RPR=1;RUN=1;SAF=0;SAP=5.18177;SAR=1;SRF=5;SRP=5.49198;SRR=9;TYPE=snp	GT:DP:AD:RO:QR:AO:QA:GL	0/0:15:14,1:14:880:1:50:0,-0.836684,-42.5367
-phiX174	1142	.	G	.	0	.	DP=16;DPB=16;EPPR=5.18177;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=1082;RO=16;RPPR=3.55317	GT:DP:AD:RO:QR:AO:QA:GL	0/0:16:16:16:1082:.:.:0
-phiX174	1143	.	G	.	0	.	DP=16;DPB=16;EPPR=5.18177;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=1029;RO=16;RPPR=3.55317	GT:DP:AD:RO:QR:AO:QA:GL	0/0:16:16:16:1029:.:.:0
-phiX174	1144	.	C	.	0	.	DP=16;DPB=16;EPPR=5.18177;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=1114;RO=16;RPPR=3.55317	GT:DP:AD:RO:QR:AO:QA:GL	0/0:16:16:16:1114:.:.:0
-phiX174	1145	.	G	.	0	.	DP=15;DPB=15;EPPR=6.62942;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=1042;RO=15;RPPR=3.15506	GT:DP:AD:RO:QR:AO:QA:GL	0/0:15:15:15:1042:.:.:0
-phiX174	1146	.	C	.	0	.	DP=15;DPB=15;EPPR=6.62942;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=1058;RO=15;RPPR=3.15506	GT:DP:AD:RO:QR:AO:QA:GL	0/0:15:15:15:1058:.:.:0
-phiX174	1147	.	T	.	0	.	DP=15;DPB=15;EPPR=4.31318;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=999;RO=15;RPPR=4.31318	GT:DP:AD:RO:QR:AO:QA:GL	0/0:15:15:15:999:.:.:0
-phiX174	1148	.	C	.	0	.	DP=15;DPB=15;EPPR=4.31318;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=1003;RO=15;RPPR=4.31318	GT:DP:AD:RO:QR:AO:QA:GL	0/0:15:15:15:1003:.:.:0
-phiX174	1149	.	T	C	4.04114e-07	.	AB=0;ABP=0;AC=0;AF=0;AN=2;AO=1;CIGAR=1X;DP=14;DPB=14;DPRA=0;EPP=5.18177;EPPR=3.17734;GTI=0;LEN=1;MEANALT=1;MQM=37;MQMR=37;NS=1;NUMALT=1;ODDS=16.1901;PAIRED=0;PAIREDR=0;PAO=0;PQA=0;PQR=0;PRO=0;QA=33;QR=830;RO=13;RPL=0;RPP=5.18177;RPPR=7.18621;RPR=1;RUN=1;SAF=0;SAP=5.18177;SAR=1;SRF=5;SRP=4.51363;SRR=8;TYPE=snp	GT:DP:AD:RO:QR:AO:QA:GL	0/0:14:13,1:13:830:1:33:0,-1.0599,-39.8344
-phiX174	1151	.	C	T	3.45599e-08	.	AB=0;ABP=0;AC=0;AF=0;AN=2;AO=1;CIGAR=1X;DP=15;DPB=15;DPRA=0;EPP=5.18177;EPPR=8.59409;GTI=0;LEN=1;MEANALT=1;MQM=37;MQMR=37;NS=1;NUMALT=1;ODDS=18.6491;PAIRED=0;PAIREDR=0;PAO=0;PQA=0;PQR=0;PRO=0;QA=27;QR=946;RO=14;RPL=1;RPP=5.18177;RPPR=3.0103;RPR=0;RUN=1;SAF=1;SAP=5.18177;SAR=0;SRF=3;SRP=12.937;SRR=11;TYPE=snp	GT:DP:AD:RO:QR:AO:QA:GL	0/0:15:14,1:14:946:1:27:0,-1.85676,-43.833
-phiX174	1152	.	G	.	0	.	DP=16;DPB=16;EPPR=5.18177;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=993;RO=16;RPPR=5.18177	GT:DP:AD:RO:QR:AO:QA:GL	0/0:16:16:16:993:.:.:0
-phiX174	1153	.	T	.	3.38668e-15	.	DP=15;DPB=15;EPPR=4.31318;GTI=0;MQMR=37;NS=1;NUMALT=0;ODDS=0;PAIREDR=0;PQR=0;PRO=0;QR=880;RO=15;RPPR=4.31318	GT:DP:AD:RO:QR:AO:QA:GL	0/0:15:15:15:880:.:.:0