Repository 'gubbins'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/gubbins

Changeset 0:637ec5d5368c (2017-06-23)
Next changeset 1:96e6283e4745 (2022-08-24)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gubbins commit 98be6edc2544513347149b50e0cfb530811f890a
added:
gubbins.xml
test-data/multiple_recombinations.aln
b
diff -r 000000000000 -r 637ec5d5368c gubbins.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/gubbins.xml Fri Jun 23 08:29:43 2017 -0400
[
b'@@ -0,0 +1,298 @@\n+<tool id="gubbins" name="Gubbins" version="0.1.0">\n+    <description>Recombination detection in Bacteria</description>\n+    <requirements>\n+        <requirement type="package" version="2.2.1">gubbins</requirement>\n+    </requirements>\n+    \n+    <version_command>run_gubbins.py --version</version_command>\n+    \n+    <command detect_errors="exit_code"><![CDATA[\n+        \n+        ln -s \'$alignment_file\' foo.aln &&\n+      \n+        run_gubbins.py\n+        \n+        --threads \\${GALAXY_SLOTS:-1}\n+        \n+        #if $adv.iters\n+            -i \'$adv.iters\'\n+        #end if\n+        \n+        #if $adv.conv_meth\n+            -z \'$adv.conv_meth\'\n+        #end if\n+        \n+        #if $adv.outgroup\n+            -o \'$adv.outgroup\'\n+        #end if\n+        \n+        #if $really_adv.tree_builder\n+            -t \'$really_adv.tree_builder\'\n+        #end if\n+        \n+        #if $really_adv.min_snps\n+            -m \'$really_adv.min_snps\'\n+        #end if\n+        \n+        #if $really_adv.filter_percentage\n+            -f \'$really_adv.filter_percentage\'\n+        #end if\n+        \n+        #if $really_adv.min_window_size\n+            -a \'$really_adv.min_window_size\'\n+        #end if\n+        \n+        #if $really_adv.max_window_size\n+            -b \'$really_adv.max_window_size\'\n+        #end if\n+        \n+        $really_adv.remove_duplicates\n+        \n+        foo.aln\n+        \n+    ]]></command>\n+    <inputs>\n+        <!-- Just the data set.. -->\n+        <param type="data" name="alignment_file" format="fasta" label="Whole genome alignment file" help="Whole genome alignment file in fasta format"/>\n+      \n+        <!-- output file picker -->\n+        <param type="select" name="outfiles" multiple="true" display="checkboxes" label="Select the required output files" help="Default selections are the Final Tree in Newick format, the Recombination Predictions in gff3 format and the Summary of SNP Distribution">\n+            <option value="ftree" selected="true">Final Tree in newick format</option>\n+            <option value="gff" selected="true">Recombination Predictions in gff3 format</option>\n+            <option value="vcf" selected="true">Summary of SNP Distribution in vcf format</option>\n+            <option value="recomb_embl">Recombination Predictions in embl format</option>\n+            <option value="fpoly">Filtered Polymorphic Sites in fasta format</option>\n+            <option value="ppoly">Filtered Polymorphic Sites in phylip format</option>\n+            <option value="stats">Per Branch Statistics in csv format</option>\n+            <option value="baseb">Base Branch Reconstruction in embl format</option>\n+        </param>\n+      \n+        <!-- A semi advanced section, really shouldn\'t have to change anything. -->\n+        <section name="adv" title="Advanced options" expanded="True">\n+            <param name="iters" type="integer" label="Iterations" value="5" help="Maximum No. of iterations, default is 5" />\n+            <param name="conv_meth" type="select" label="Model Conversion Options" help="Criteria to use to know when to halt iterations">\n+                <option value="weighted_robinson_foulds" selected="True">Weighted Robinson Foulds</option>\n+                <option value="robinson_foulds">Robinson Foulds</option>\n+                <option value="recombination">Recombination</option>\n+            </param>\n+            <param name="outgroup" type="text" label="Outgroup" value="" help="Outgroup name for rerooting. A list of comma separated names can be used if they form a clade."/>\n+        </section>\n+      \n+        <!-- a really advanced section, play with this at your peril! -->\n+        <section name="really_adv" title="Really advanced options - change these if you really know what you are doing." expanded="false">\n+            <param name="tree_builder" type="select" label="Tree builder" help="Application to use for tree building, default RAxML">\n+                <option value="raxml" selected="tru'..b'               <has_text text="FT" />\n+                </assert_contents>\n+            </output>\n+            <output name="filt_polymorph_phy">\n+                <assert_contents>\n+                    <has_text text="sequence_1" />\n+                </assert_contents>\n+            </output>\n+            <output name="per_b_stat_csv">\n+                <assert_contents>\n+                    <has_text text="Node" />\n+                </assert_contents>\n+            </output>\n+            <output name="base_branch_embl">\n+                <assert_contents>\n+                    <has_text text="FT" />\n+                </assert_contents>\n+            </output>\n+            <output name="final_tree">\n+                <assert_contents>\n+                    <has_text text="((sequence_" />\n+                </assert_contents>\n+            </output>\n+        </test>\n+    </tests>\n+    \n+    \n+    <help><![CDATA[\n+**Gubbins**\n+\n+Since the introduction of high-throughput, second-generation DNA sequencing technologies, there has been an enormous increase in the size of datasets being used for estimating bacterial population phylodynamics. Although many phylogenetic techniques are scalable to hundreds of bacterial genomes, methods which have been used for mitigating the effect of mechanisms of horizontal sequence transfer on phylogenetic reconstructions cannot cope with these new datasets. Gubbins (Genealogies Unbiased By recomBinations In Nucleotide Sequences) is an algorithm that iteratively identifies loci containing elevated densities of base substitutions while concurrently constructing a phylogeny based on the putative point mutations outside of these regions. Simulations demonstrate the algorithm generates highly accurate reconstructions under realistic models of short-term bacterial evolution, and can be run in only a few hours on alignments of hundreds of bacterial genome sequences.\n+\n+**Running Gubbins**\n+\n+To run Gubbins with default settings:\n+\n+Supply a "fasta" genome alignment file and press execute.\n+\n+**Other options** \n+\n+**Advanced**\n+\n+*Iterations*, (-i)\t\n+\n+The maximum number of iterations to perform; the algorithm will stop earlier than this if it converges on the same tree in two successive iterations. Default is 5.\n+\n+*Converge_method* (-z)\n+\n+Criteria to use to know when to halt iterations [weighted_robinson_foulds|robinson_foulds|recombination]. Default is weighted_robinson_foulds.\n+\n+*Outgroup*, (-o)\t\n+\n+The name of a sequence in the alignment on which to root the tree\n+\n+**Really Advanced**\n+\n+These options are here for completeness and you shouldn\'t need to change them from their defaults. You really need to know what you are doing before you use these.\n+\n+*Tree builder*, (-t)\n+\n+The algorithm to use in the construction of phylogenies in the analysis; can be \xe2\x80\x98raxml\xe2\x80\x99, to use RAxML, \xe2\x80\x98fasttree\xe2\x80\x99, to use Fasttree, or \xe2\x80\x98hybrid\xe2\x80\x99, to use Fasttree for the first iteration and RAxML in all subsequent iterations. Default is raxml\n+\n+Filter Percentage, (-f)\t\n+\n+Filter out taxa with more than this percentage of missing data. Default is 25%\n+\n+*Minimum snps*, (-m)\t\n+\n+The minimum number of base substitutions required to identify a recombination. Default is 3.\n+\n+\n+And others...\n+\n+\n+\n+**Output files**\n+\n+* Recombination predictions in EMBL tab file format.\n+\n+\n+* Recombination predictions in GFF3 format\n+\n+\n+* Base substitution reconstruction in EMBL tab format.\n+\n+\n+* VCF file summarising the distribution of SNPs\n+\n+\n+* Per branch reporting of the base substitutions inside and outside recombinations events.\n+\n+\n+* FASTA format alignment of filtered polymorphic sites used to generate the phylogeny in the final iteration.\n+\n+\n+* Phylip format alignment of filtered polymorphic sites used to generate the phylogeny in the final iteration.\n+\n+\n+* Final phylogenetic tree in newick format.\n+\n+    ]]></help>\n+    \n+    \n+    <citations>\n+        <citation type="doi">doi:10.1093/nar/gku1196</citation>\n+    </citations>\n+\n+</tool>\n'
b
diff -r 000000000000 -r 637ec5d5368c test-data/multiple_recombinations.aln
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/multiple_recombinations.aln Fri Jun 23 08:29:43 2017 -0400
b
@@ -0,0 +1,20 @@
+>sequence_1
+AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_2
+AAAAAAAAAAAAAAAAAAAAACAAAAAAAAAAAAAAAAAAAAAAAAAAAACACCCCCCCCCCCCCCCACCCACCCCCCCCCCACAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_3
+AAAAAAAAAAAAAAAAAAAAACAAAAAAAAAAAATAAAAAAAAAAAAAAACACCCCCCCCCCCCCCCACCCACCCCCCCCCCACAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_4
+AAAAAAAAAAAAAAAAAAAAACAAAAAAAAAAAATAAAAAGAAAAAAAAACACCCCCCCCCCCCCCCACCCACCCCCCCCCCACAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_5
+AAAAAAAAAAAAAAAGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAACACCCCCCCCCCCCCCCACCCACCCCCCCCCCACAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_6
+AAAAAAAAAAAAAAAGAAAAAAAAAAACAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_7
+AAAAAAAAAAAAAAAGAAAAAAAGAAACGGGGGGGGGGGGGGGGGGGGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_8
+AAAAAAAAAAAAAAAGAAAAAAAGAAACGGGGGGGGGGGGGGGGGGGGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_9
+---------------GAAAAAAAGAAAAGGGGGGGGGGGGGGGGGGGGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
+>sequence_10
+NNNNNNNNNNNNNNNGAAAAAAAAAAAAGGGGGGGGGGGGGGGGGGGGGAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAATTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTTT
\ No newline at end of file