Repository 'lofreq_filter'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/lofreq_filter

Changeset 0:6f9ffff040ce (2019-12-17)
Next changeset 1:fdba1586551d (2020-01-31)
Commit message:
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/lofreq commit 9efcb813ab17041c7f5aad834dfff45bd7046c60"
added:
lofreq_filter.xml
macros.xml
test-data/alnqual-out1.bam
test-data/alnqual-out2.bam
test-data/alnqual-out3.bam
test-data/alnqual-out4.bam
test-data/alnqual-out5.bam
test-data/call-out1.vcf
test-data/call-out2.vcf
test-data/indelqual-out1.bam
test-data/indelqual-out2.bam
test-data/indelqual-out3.bam
test-data/lofreq-in1.bam
test-data/pBR322.fa
test-data/viterbi-out1.bam
test-data/viterbi-out2.bam
tool-data/fasta_indexes.loc.sample
tool_data_table_conf.xml.sample
b
diff -r 000000000000 -r 6f9ffff040ce lofreq_filter.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/lofreq_filter.xml Tue Dec 17 17:26:32 2019 -0500
[
b'@@ -0,0 +1,300 @@\n+<tool id="lofreq_filter" name="Lofreq filter" version="@TOOL_VERSION@">\n+    <description>called variants posteriorly</description>\n+    <macros>\n+        <import>macros.xml</import>\n+        <xml name="snvqual_filter_config">\n+            <conditional name="snvqual_filter">\n+                <param name="snvqual" type="select"\n+                label="Filter SNVs based on call quality?">\n+                    <option value="no">No, don\'t apply call quality filter</option>\n+                    <option value="min-phred">Yes, filter on explicit QUAL threshold</option>\n+                    <option value="mtc">Yes, filter on multiple testing corrected p-value</option>\n+                </param>\n+                <when value="no">\n+                </when>\n+                <when value="min-phred">\n+                    <param argument="-Q" name="snvqual_thresh" type="integer" min="0" value="0"\n+                    label="Minimum QUAL value"\n+                    help="Specify the minimum value of the QUAL field required to retain a variant" />\n+                </when>\n+                <when value="mtc">\n+                    <param argument="-r" name="snvqual_alpha" type="float" min="0" max="1" value="1"\n+                    label="Multiple-testing corrected p-value threshold" />\n+                    <param argument="-q" name="snvqual_mtc" type="select"\n+                    label="Multiple testing correction method">\n+                        <option value="bonf">Bonferroni</option>\n+                        <option value="holm">Holm-Sidak</option>\n+                        <option value="fdr">False-discovery rate</option>\n+                    </param>\n+                    <param argument="-s" name="snvqual_ntests" type="integer" min="1" value="1"\n+                    label="Estimate of number of tests performed"\n+                    help="Ideally, this would be the number of SNVs considered during variant calling. The lofreq variant caller emits this number as part of its output. For other variant callers, all you will typically have is a lower bound estimate given by the number of SNV records in your VCF input." />\n+                </when>\n+            </conditional>\n+        </xml>\n+        <xml name="indelqual_filter_config">\n+            <conditional name="indelqual_filter">\n+                <param name="indelqual" type="select"\n+                label="Filter indels based on call quality?">\n+                    <option value="no">No, don\'t apply call quality filter</option>\n+                    <option value="min-phred">Yes, filter on explicit QUAL threshold</option>\n+                    <option value="mtc">Yes, filter on multiple testing corrected p-value</option>\n+                </param>\n+                <when value="no">\n+                </when>\n+                <when value="min-phred">\n+                    <param argument="-K" name="indelqual_thresh" type="integer" min="0" value="0"\n+                    label="Minimum QUAL value"\n+                    help="Specify the minimum value of the QUAL field required to retain a variant" />\n+                </when>\n+                <when value="mtc">\n+                    <param argument="-l" name="indelqual_alpha" type="float" min="0" max="1" value="1"\n+                    label="Multiple-testing corrected p-value threshold" />\n+                    <param argument="-k" name="indelqual_mtc" type="select"\n+                    label="Multiple testing correction method">\n+                        <option value="bonf">Bonferroni</option>\n+                        <option value="holm">Holm-Sidak</option>\n+                        <option value="fdr">False-discovery rate</option>\n+                    </param>\n+                    <param argument="-m" name="indelqual_ntests" type="integer" min="1" value="1"\n+                    label="Estimate of number of tests performed"\n+                    help="Ideally, this would be the number of indels considered during variant calling. The lo'..b'ter behaves correctly. => two additional diff lines -->\n+            <output name="outvcf" file="call-out1.vcf" lines_diff="6" />\n+        </test>\n+        <test>\n+            <!-- Express lofreq call default filtering as a\n+            multiple testing correction filter -->\n+            <param name="invcf" ftype="vcf" value="call-out2.vcf" />\n+            <conditional name="filter_by_type">\n+                <param name="keep_only" value="--only-snvs" />\n+                <section name="qual">\n+                    <conditional name="snvqual_filter">\n+                        <param name="snvqual" value="mtc" />\n+                        <param name="snvqual_alpha" value="0.01" />\n+                        <param name="snvqual_mtc" value="bonf" />\n+                        <param name="snvqual_ntests" value="66" />\n+                    </conditional>\n+                </section>\n+            </conditional>\n+            <!-- expect additional diff lines because of different\n+            ##FILTER declarations -->\n+            <output name="outvcf" file="call-out1.vcf" lines_diff="9" />\n+        </test>\n+        <test>\n+            <!-- Test print-all option -->\n+            <param name="invcf" ftype="vcf" value="call-out2.vcf" />\n+            <conditional name="filter_by_type">\n+                <section name="qual">\n+                    <conditional name="snvqual_filter">\n+                        <param name="snvqual" value="min-phred" />\n+                        <param name="snvqual_thresh" value="38" />\n+                    </conditional>\n+                    <conditional name="indelqual_filter">\n+                        <param name="indelqual" value="min-phred" />\n+                        <param name="indelqual_thresh" value="20" />\n+                    </conditional>\n+                </section>\n+            </conditional>\n+            <param name="flag_or_drop" value="--print-all" />\n+            <!-- All variants should be retained with print-all,\n+            but variants failing filters should be flagged with the names\n+            of those filters -->\n+            <output name="outvcf">\n+                <assert_contents>\n+                    <has_line_matching expression="pBR322&#009;1134&#009;.&#009;C&#009;T&#009;49314&#009;PASS&#009;.+" />\n+                    <has_line_matching expression="pBR322&#009;1193&#009;.&#009;G&#009;A&#009;0&#009;min_snvqual_38&#009;.+" />\n+                </assert_contents>\n+            </output>\n+        </test>\n+    </tests>\n+    <help><![CDATA[\n+**What it does**\n+\n+**Lofreq filter** tries to eliminate false-positive calls from a list of\n+variants in VCF format.\n+\n+To this end, it applies a variety of user-configurable filters to the input\n+variants, which all operate on variant attributes expected to be embedded in\n+the VCF input.\n+\n+Specifically, certain filters expect:\n+\n+- the `QUAL` field of the variant records to be set\n+- any of the following subfields of a variant\'s `INFO` field:\n+\n+  * `DP` (required for coverage-based filtering)\n+  * `AF` (required for filtering based on variant allele frequency)\n+  * `SB` (required for filtering on strand bias)\n+  * `DP4` (required for the compound strand bias filter)\n+\n+------\n+\n+**Note**:\n+\n+.. class:: Warning mark\n+\n+   This tool is optimized for posterior filtering of variants called with\n+   `Lofreq call`, which outputs all variant attributes required by the various\n+   configurable filters.\n+\n+If you are using `Lofreq filter` to filter VCF variant lists produced with\n+other tools, be prepared for surprises.\n+\n+In general, if any piece of variant information required for applying a\n+given filter is missing from the input data, the tool will try to disable\n+that filter. Watch out for corresponding warnings in the tool\'s standard\n+output.\n+\n+In addition, any p-value based filtering on variant qualities may behave\n+incorrectly since different variant callers might use different QUAL scales.\n+    ]]></help>\n+    <expand macro="citations" />\n+</tool>\n'
b
diff -r 000000000000 -r 6f9ffff040ce macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Tue Dec 17 17:26:32 2019 -0500
[
@@ -0,0 +1,88 @@
+<macros>
+    <token name="@WRAPPER_VERSION@">@TOOL_VERSION@+galaxy</token>
+    <token name="@TOOL_VERSION@">2.1.3.1</token>
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="@TOOL_VERSION@">lofreq</requirement>
+            <yield/>
+        </requirements>
+    </xml>
+    <xml name="citations">
+        <citations>
+            <citation type="doi">10.1093/nar/gks918</citation>
+            <yield />
+        </citations>
+    </xml>
+    <token name="@PREPARE_REF@"><![CDATA[
+        #if str($reference_source.ref_selector) == 'history':
+            #set $reference_fasta_fn = 'reference.fa'
+            ln -s '$reference_source.ref' $reference_fasta_fn &&
+            lofreq faidx $reference_fasta_fn 2>&1 || echo "Error running samtools faidx for indexing fasta reference for lofreq" >&2 &&
+        #else
+            #set $reference_fasta_fn = str($reference_source.ref.fields.path)
+        #end if
+    ]]></token>
+    <xml name="reference_interface">
+        <conditional name="reference_source">
+            <param name="ref_selector" type="select"
+            label="Choose the source for the reference genome">
+                <option value="cached">Locally cached</option>
+                <option value="history">History</option>
+            </param>
+            <when value="cached">
+                <param argument="--ref" type="select"
+                label="Reference genome">
+                    <options from_data_table="fasta_indexes">
+                        <filter type="data_meta" column="dbkey" key="dbkey" ref="reads" />
+                        <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file" />
+                    </options>
+                </param>
+            </when>
+            <when value="history">
+                <param argument="--ref" type="data" format="fasta" label="Reference" help="Reference sequence" />
+            </when>
+        </conditional>
+    </xml>
+    <xml name="handle_existing_alnqual">
+        <conditional name="alnqual_choice">
+            <param name="alnquals_to_use" type="select"
+            label="Use the following alignment quality scores">
+                <option value="">Base and indel alignment qualities (BAQ and IDAQ)</option>
+                <option value="-A">Only base alignment qualities (BAQ)</option>
+                <option value="-B">Only indel alignment qualities (IDAQ)</option>
+            </param>
+            <when value="-B">
+                <param name="extended_baq" type="hidden" value="" />
+            </when>
+            <when value="">
+                <param argument="-e" name="extended_baq" type="boolean" checked="true" truevalue="" falsevalue="-e"
+                label="If BAQ needs to be computed, calculate extended BAQ?" />
+            </when>
+            <when value="-A">
+                <param argument="-e" name="extended_baq" type="boolean" checked="true" truevalue="" falsevalue="-e"
+                label="If BAQ needs to be computed, calculate extended BAQ?" />
+            </when>
+        </conditional>
+    </xml>
+    <xml name="handle_alnqual" token_mode="Use">
+        <conditional name="alnqual_choice">
+            <param name="alnquals_to_use" type="select"
+            label="@MODE@ the following alignment quality scores">
+                <option value="">Base and indel alignment qualities (BAQ and IDAQ)</option>
+                <option value="-A">Only base alignment qualities (BAQ)</option>
+                <option value="-B">Only indel alignment qualities (IDAQ)</option>
+            </param>
+            <when value="-B">
+                <param name="extended_baq" type="hidden" value="" />
+            </when>
+            <when value="">
+                <param argument="-e" name="extended_baq" type="boolean" checked="true" truevalue="" falsevalue="-e"
+                label="Use extended BAQ?" />
+            </when>
+            <when value="-A">
+                <param argument="-e" name="extended_baq" type="boolean" checked="true" truevalue="" falsevalue="-e"
+                label="Use extended BAQ?" />
+            </when>
+        </conditional>
+    </xml>
+</macros>
b
diff -r 000000000000 -r 6f9ffff040ce test-data/alnqual-out1.bam
b
Binary file test-data/alnqual-out1.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/alnqual-out2.bam
b
Binary file test-data/alnqual-out2.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/alnqual-out3.bam
b
Binary file test-data/alnqual-out3.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/alnqual-out4.bam
b
Binary file test-data/alnqual-out4.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/alnqual-out5.bam
b
Binary file test-data/alnqual-out5.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/call-out1.vcf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/call-out1.vcf Tue Dec 17 17:26:32 2019 -0500
b
@@ -0,0 +1,19 @@
+##fileformat=VCFv4.0
+##fileDate=20191125
+##source=lofreq call --verbose --ref reference.fa --sig 0.01 --bonf dynamic --no-default-filter -r pBR322:1-2180 -o /tmp/lofreq2_call_parallel3mrmthi_/0.vcf.gz alignments.bam
+##reference=reference.fa
+##INFO=<ID=DP,Number=1,Type=Integer,Description="Raw Depth">
+##INFO=<ID=AF,Number=1,Type=Float,Description="Allele Frequency">
+##INFO=<ID=SB,Number=1,Type=Integer,Description="Phred-scaled strand bias at this position">
+##INFO=<ID=DP4,Number=4,Type=Integer,Description="Counts for ref-forward bases, ref-reverse, alt-forward and alt-reverse bases">
+##INFO=<ID=INDEL,Number=0,Type=Flag,Description="Indicates that the variant is an INDEL.">
+##INFO=<ID=CONSVAR,Number=0,Type=Flag,Description="Indicates that the variant is a consensus variant (as opposed to a low frequency variant).">
+##INFO=<ID=HRUN,Number=1,Type=Integer,Description="Homopolymer length to the right of report indel position">
+##FILTER=<ID=min_snvqual_38,Description="Minimum SNV Quality (Phred) 38">
+##FILTER=<ID=min_indelqual_20,Description="Minimum Indel Quality (Phred) 20">
+##FILTER=<ID=min_dp_10,Description="Minimum Coverage 10">
+##FILTER=<ID=sb_fdr,Description="Strand-Bias Multiple Testing Correction: fdr corr. pvalue > 0.001000">
+##FILTER=<ID=min_snvqual_38,Description="Minimum SNV Quality (Phred) 38">
+##FILTER=<ID=min_indelqual_20,Description="Minimum Indel Quality (Phred) 20">
+#CHROM POS ID REF ALT QUAL FILTER INFO
+pBR322 1134 . C T 49314 PASS DP=1767;AF=1.000000;SB=0;DP4=0,0,910,857
b
diff -r 000000000000 -r 6f9ffff040ce test-data/call-out2.vcf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/call-out2.vcf Tue Dec 17 17:26:32 2019 -0500
b
@@ -0,0 +1,27 @@
+##fileformat=VCFv4.0
+##fileDate=20191204
+##source=lofreq call --verbose --ref reference.fa --sig 1 --bonf 1 --no-default-filter --no-default-filter -r pBR322:1-2180 -o /tmp/tmpjsbggC/job_working_directory/000/8/working/pp-tmp/lofreq2_call_parallelj9yxuugx/0.vcf.gz reads.bam 
+##reference=reference.fa
+##INFO=<ID=DP,Number=1,Type=Integer,Description="Raw Depth">
+##INFO=<ID=AF,Number=1,Type=Float,Description="Allele Frequency">
+##INFO=<ID=SB,Number=1,Type=Integer,Description="Phred-scaled strand bias at this position">
+##INFO=<ID=DP4,Number=4,Type=Integer,Description="Counts for ref-forward bases, ref-reverse, alt-forward and alt-reverse bases">
+##INFO=<ID=INDEL,Number=0,Type=Flag,Description="Indicates that the variant is an INDEL.">
+##INFO=<ID=CONSVAR,Number=0,Type=Flag,Description="Indicates that the variant is a consensus variant (as opposed to a low frequency variant).">
+##INFO=<ID=HRUN,Number=1,Type=Integer,Description="Homopolymer length to the right of report indel position">
+#CHROM POS ID REF ALT QUAL FILTER INFO
+pBR322 815 . A G 0 . DP=665;AF=0.003008;SB=6;DP4=333,311,0,2
+pBR322 861 . A C 0 . DP=946;AF=0.002114;SB=3;DP4=447,497,0,2
+pBR322 1001 . A C 0 . DP=1797;AF=0.000556;SB=3;DP4=877,918,1,0
+pBR322 1013 . C G 0 . DP=1773;AF=0.000564;SB=0;DP4=875,897,0,1
+pBR322 1068 . T G 0 . DP=1774;AF=0.000564;SB=3;DP4=853,920,1,0
+pBR322 1084 . G T 0 . DP=1789;AF=0.000559;SB=3;DP4=875,913,1,0
+pBR322 1113 . T A 0 . DP=1784;AF=0.000561;SB=0;DP4=885,898,0,1
+pBR322 1134 . C T 49314 . DP=1767;AF=1.000000;SB=0;DP4=0,0,910,857
+pBR322 1193 . G A 0 . DP=1698;AF=0.000589;SB=3;DP4=865,832,0,1
+pBR322 1218 . A C 0 . DP=1708;AF=0.000585;SB=3;DP4=875,831,0,1
+pBR322 1230 . T C 0 . DP=1759;AF=0.000569;SB=3;DP4=907,850,0,1
+pBR322 1256 . A G 0 . DP=1746;AF=0.000573;SB=0;DP4=902,842,1,0
+pBR322 1498 . C G 0 . DP=1195;AF=0.000837;SB=3;DP4=588,606,1,0
+pBR322 1503 . T G 0 . DP=1156;AF=0.000865;SB=3;DP4=563,592,1,0
+pBR322 1505 . G A 0 . DP=1137;AF=0.000880;SB=0;DP4=560,576,0,1
b
diff -r 000000000000 -r 6f9ffff040ce test-data/indelqual-out1.bam
b
Binary file test-data/indelqual-out1.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/indelqual-out2.bam
b
Binary file test-data/indelqual-out2.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/indelqual-out3.bam
b
Binary file test-data/indelqual-out3.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/lofreq-in1.bam
b
Binary file test-data/lofreq-in1.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/pBR322.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/pBR322.fa Tue Dec 17 17:26:32 2019 -0500
b
@@ -0,0 +1,74 @@
+>pBR322
+TTCTCATGTTTGACAGCTTATCATCGATAAGCTTTAATGCGGTAGTTTATCACAGTTAAA
+TTGCTAACGCAGTCAGGCACCGTGTATGAAATCTAACAATGCGCTCATCGTCATCCTCGG
+CACCGTCACCCTGGATGCTGTAGGCATAGGCTTGGTTATGCCGGTACTGCCGGGCCTCTT
+GCGGGATATCGTCCATTCCGACAGCATCGCCAGTCACTATGGCGTGCTGCTAGCGCTATA
+TGCGTTGATGCAATTTCTATGCGCACCCGTTCTCGGAGCACTGTCCGACCGCTTTGGCCG
+CCGCCCAGTCCTGCTCGCTTCGCTACTTGGAGCCACTATCGACTACGCGATCATGGCGAC
+CACACCCGTCCTGTGGATCCTCTACGCCGGACGCATCGTGGCCGGCATCACCGGCGCCAC
+AGGTGCGGTTGCTGGCGCCTATATCGCCGACATCACCGATGGGGAAGATCGGGCTCGCCA
+CTTCGGGCTCATGAGCGCTTGTTTCGGCGTGGGTATGGTGGCAGGCCCCGTGGCCGGGGG
+ACTGTTGGGCGCCATCTCCTTGCATGCACCATTCCTTGCGGCGGCGGTGCTCAACGGCCT
+CAACCTACTACTGGGCTGCTTCCTAATGCAGGAGTCGCATAAGGGAGAGCGTCGACCGAT
+GCCCTTGAGAGCCTTCAACCCAGTCAGCTCCTTCCGGTGGGCGCGGGGCATGACTATCGT
+CGCCGCACTTATGACTGTCTTCTTTATCATGCAACTCGTAGGACAGGTGCCGGCAGCGCT
+CTGGGTCATTTTCGGCGAGGACCGCTTTCGCTGGAGCGCGACGATGATCGGCCTGTCGCT
+TGCGGTATTCGGAATCTTGCACGCCCTCGCTCAAGCCTTCGTCACTGGTCCCGCCACCAA
+ACGTTTCGGCGAGAAGCAGGCCATTATCGCCGGCATGGCGGCCGACGCGCTGGGCTACGT
+CTTGCTGGCGTTCGCGACGCGAGGCTGGATGGCCTTCCCCATTATGATTCTTCTCGCTTC
+CGGCGGCATCGGGATGCCCGCGTTGCAGGCCATGCTGTCCAGGCAGGTAGATGACGACCA
+TCAGGGACAGCTTCAAGGATCGCTCGCGGCTCTTACCAGCCTAACTTCGATCACTGGACC
+GCTGATCGTCACGGCGATTTATGCCGCCTCGGCGAGCACATGGAACGGGTTGGCATGGAT
+TGTAGGCGCCGCCCTATACCTTGTCTGCCTCCCCGCGTTGCGTCGCGGTGCATGGAGCCG
+GGCCACCTCGACCTGAATGGAAGCCGGCGGCACCTCGCTAACGGATTCACCACTCCAAGA
+ATTGGAGCCAATCAATTCTTGCGGAGAACTGTGAATGCGCAAACCAACCCTTGGCAGAAC
+ATATCCATCGCGTCCGCCATCTCCAGCAGCCGCACGCGGCGCATCTCGGGCAGCGTTGGG
+TCCTGGCCACGGGTGCGCATGATCGTGCTCCTGTCGTTGAGGACCCGGCTAGGCTGGCGG
+GGTTGCCTTACTGGTTAGCAGAATGAATCACCGATACGCGAGCGAACGTGAAGCGACTGC
+TGCTGCAAAACGTCTGCGACCTGAGCAACAACATGAATGGTCTTCGGTTTCCGTGTTTCG
+TAAAGTCTGGAAACGCGGAAGTCAGCGCCCTGCACCATTATGTTCCGGATCTGCATCGCA
+GGATGCTGCTGGCTACCCTGTGGAACACCTACATCTGTATTAACGAAGCGCTGGCATTGA
+CCCTGAGTGATTTTTCTCTGGTCCCGCCGCATCCATACCGCCAGTTGTTTACCCTCACAA
+CGTTCCAGTAACCGGGCATGTTCATCATCAGTAACCCGTATCGTGAGCATCCTCTCTCGT
+TTCATCGGTATCATTACCCCCATGAACAGAAATCCCCCTTACACGGAGGCATCAGTGACC
+AAACAGGAAAAAACCGCCCTTAACATGGCCCGCTTTATCAGAAGCCAGACATTAACGCTT
+CTGGAGAAACTCAACGAGCTGGACGCGGATGAACAGGCAGACATCTGTGAATCGCTTCAC
+GACCACGCTGATGAGCTTTACCGCAGCTGCCTCGCGCGTTTCGGTGATGACGGTGAAAAC
+CTCTGACACATGCAGCTCCCGGAGACGGTCACAGCTTGTCTGTAAGCGGATGCCGGGAGC
+AGACAAGCCCGTCAGGGCGCGTCAGCGGGTGTTGGCGGGTGTCGGGGCGCAGCCATGACC
+CAGTCACGTAGCGATAGCGGAGTGTATACTGGCTTAACTATGCGGCATCAGAGCAGATTG
+TACTGAGAGTGCACCATATGCGGTGTGAAATACCGCACAGATGCGTAAGGAGAAAATACC
+GCATCAGGCGCTCTTCCGCTTCCTCGCTCACTGACTCGCTGCGCTCGGTCGTTCGGCTGC
+GGCGAGCGGTATCAGCTCACTCAAAGGCGGTAATACGGTTATCCACAGAATCAGGGGATA
+ACGCAGGAAAGAACATGTGAGCAAAAGGCCAGCAAAAGGCCAGGAACCGTAAAAAGGCCG
+CGTTGCTGGCGTTTTTCCATAGGCTCCGCCCCCCTGACGAGCATCACAAAAATCGACGCT
+CAAGTCAGAGGTGGCGAAACCCGACAGGACTATAAAGATACCAGGCGTTTCCCCCTGGAA
+GCTCCCTCGTGCGCTCTCCTGTTCCGACCCTGCCGCTTACCGGATACCTGTCCGCCTTTC
+TCCCTTCGGGAAGCGTGGCGCTTTCTCATAGCTCACGCTGTAGGTATCTCAGTTCGGTGT
+AGGTCGTTCGCTCCAAGCTGGGCTGTGTGCACGAACCCCCCGTTCAGCCCGACCGCTGCG
+CCTTATCCGGTAACTATCGTCTTGAGTCCAACCCGGTAAGACACGACTTATCGCCACTGG
+CAGCAGCCACTGGTAACAGGATTAGCAGAGCGAGGTATGTAGGCGGTGCTACAGAGTTCT
+TGAAGTGGTGGCCTAACTACGGCTACACTAGAAGGACAGTATTTGGTATCTGCGCTCTGC
+TGAAGCCAGTTACCTTCGGAAAAAGAGTTGGTAGCTCTTGATCCGGCAAACAAACCACCG
+CTGGTAGCGGTGGTTTTTTTGTTTGCAAGCAGCAGATTACGCGCAGAAAAAAAGGATCTC
+AAGAAGATCCTTTGATCTTTTCTACGGGGTCTGACGCTCAGTGGAACGAAAACTCACGTT
+AAGGGATTTTGGTCATGAGATTATCAAAAAGGATCTTCACCTAGATCCTTTTAAATTAAA
+AATGAAGTTTTAAATCAATCTAAAGTATATATGAGTAAACTTGGTCTGACAGTTACCAAT
+GCTTAATCAGTGAGGCACCTATCTCAGCGATCTGTCTATTTCGTTCATCCATAGTTGCCT
+GACTCCCCGTCGTGTAGATAACTACGATACGGGAGGGCTTACCATCTGGCCCCAGTGCTG
+CAATGATACCGCGAGACCCACGCTCACCGGCTCCAGATTTATCAGCAATAAACCAGCCAG
+CCGGAAGGGCCGAGCGCAGAAGTGGTCCTGCAACTTTATCCGCCTCCATCCAGTCTATTA
+ATTGTTGCCGGGAAGCTAGAGTAAGTAGTTCGCCAGTTAATAGTTTGCGCAACGTTGTTG
+CCATTGCTGCAGGCATCGTGGTGTCACGCTCGTCGTTTGGTATGGCTTCATTCAGCTCCG
+GTTCCCAACGATCAAGGCGAGTTACATGATCCCCCATGTTGTGCAAAAAAGCGGTTAGCT
+CCTTCGGTCCTCCGATCGTTGTCAGAAGTAAGTTGGCCGCAGTGTTATCACTCATGGTTA
+TGGCAGCACTGCATAATTCTCTTACTGTCATGCCATCCGTAAGATGCTTTTCTGTGACTG
+GTGAGTACTCAACCAAGTCATTCTGAGAATAGTGTATGCGGCGACCGAGTTGCTCTTGCC
+CGGCGTCAACACGGGATAATACCGCGCCACATAGCAGAACTTTAAAAGTGCTCATCATTG
+GAAAACGTTCTTCGGGGCGAAAACTCTCAAGGATCTTACCGCTGTTGAGATCCAGTTCGA
+TGTAACCCACTCGTGCACCCAACTGATCTTCAGCATCTTTTACTTTCACCAGCGTTTCTG
+GGTGAGCAAAAACAGGAAGGCAAAATGCCGCAAAAAAGGGAATAAGGGCGACACGGAAAT
+GTTGAATACTCATACTCTTCCTTTTTCAATATTATTGAAGCATTTATCAGGGTTATTGTC
+TCATGAGCGGATACATATTTGAATGTATTTAGAAAAATAAACAAATAGGGGTTCCGCGCA
+CATTTCCCCGAAAAGTGCCACCTGACGTCTAAGAAACCATTATTATCATGACATTAACCT
+ATAAAAATAGGCGTATCACGAGGCCCTTTCGTCTTCAAGAA
\ No newline at end of file
b
diff -r 000000000000 -r 6f9ffff040ce test-data/viterbi-out1.bam
b
Binary file test-data/viterbi-out1.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce test-data/viterbi-out2.bam
b
Binary file test-data/viterbi-out2.bam has changed
b
diff -r 000000000000 -r 6f9ffff040ce tool-data/fasta_indexes.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/fasta_indexes.loc.sample Tue Dec 17 17:26:32 2019 -0500
b
@@ -0,0 +1,29 @@
+#This is a sample file distributed with Galaxy that enables tools
+#to use a directory of Samtools indexed sequences data files.  You will need
+#to create these data files and then create a fasta_indexes.loc file
+#similar to this one (store it in this directory) that points to
+#the directories in which those files are stored. The fasta_indexes.loc
+#file has this format (white space characters are TAB characters):
+#
+# <unique_build_id> <dbkey> <display_name> <file_base_path>
+#
+#So, for example, if you had hg19 Canonical indexed stored in
+#
+# /depot/data2/galaxy/hg19/sam/,
+#
+#then the fasta_indexes.loc entry would look like this:
+#
+#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /depot/data2/galaxy/hg19/sam/hg19canon.fa
+#
+#and your /depot/data2/galaxy/hg19/sam/ directory
+#would contain hg19canon.fa and hg19canon.fa.fai files.
+#
+#Your fasta_indexes.loc file should include an entry per line for
+#each index set you have stored.  The file in the path does actually
+#exist, but it should never be directly used. Instead, the name serves
+#as a prefix for the index file.  For example:
+#
+#hg18canon hg18 Human (Homo sapiens): hg18 Canonical /depot/data2/galaxy/hg18/sam/hg18canon.fa
+#hg18full hg18 Human (Homo sapiens): hg18 Full /depot/data2/galaxy/hg18/sam/hg18full.fa
+#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /depot/data2/galaxy/hg19/sam/hg19canon.fa
+#hg19full hg19 Human (Homo sapiens): hg19 Full /depot/data2/galaxy/hg19/sam/hg19full.fa
b
diff -r 000000000000 -r 6f9ffff040ce tool_data_table_conf.xml.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.sample Tue Dec 17 17:26:32 2019 -0500
b
@@ -0,0 +1,7 @@
+<tables>
+    <!-- Location of SAMTools indexes for FASTA files -->
+    <table name="fasta_indexes" comment_char="#">
+        <columns>value, dbkey, name, path</columns>
+        <file path="tool-data/fasta_indexes.loc" />
+    </table>
+</tables>