Mercurial > repos > thanhlv > fastani
view fastani.xml @ 0:93549392d20d draft default tip
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/fastani commit 6410237f37dfd76382f9780e73a14cf48aba3695-dirty
author | thanhlv |
---|---|
date | Fri, 19 Jul 2019 06:49:02 -0400 |
parents | |
children |
line wrap: on
line source
<tool id="fastani" name="FastANI" version="1.1"> <description> fast alignment-free computation of whole-genome Average Nucleotide Identity</description> <macros> <import>macros.xml</import> </macros> <expand macro="requirements" /> <version_command>fastANI --version</version_command> <command detect_errors="exit_code"> <![CDATA[ #for $counter_q, $input_q in enumerate($query): ln -fs '$input_q' ${input_q.element_identifier}_query && echo ${input_q.element_identifier}_query >> query.lst && #end for #for $counter_r, $input_r in enumerate($reference): ln -fs '$input_r' ${input_r.element_identifier}_ref && echo ${input_r.element_identifier}_query >> ref.lst && #end for fastANI #if len($query) == 1 and len($reference) == 1: -q ${input_q.element_identifier}_query -r ${input_r.element_identifier}_ref -o output #elif len($query) == 1 and len($reference) > 1: -q ${input_q.element_identifier}_query --rl ref.lst -o output #elif len($query) > 1 and len($reference) > 1: --ql query.lst --rl ref.lst -o output #end if 2>&1 ]]></command> <inputs> <param name="query" type="data" format="fasta" multiple="true" label="Query sequences" /> <param name="reference" type="data" format="fasta" multiple="true" label="Reference sequence" /> </inputs> <outputs> <data name="output" format="txt" from_work_dir="output" label="${tool.name} on ${on_string} Output"/> </outputs> <tests> <test> <param name="query" value="Shigella_flexneri_2a_01.fna" /> <param name="reference" value="Escherichia_coli_str_K12_MG1655.fna" /> <output name="output" file="fastani.out" compare="sim_size" /> </test> </tests> <help><![CDATA[ FastANI is developed for fast alignment-free computation of whole-genome Average Nucleotide Identity (ANI). ANI is defined as mean nucleotide identity of orthologous gene pairs shared between two microbial genomes. FastANI supports pairwise comparison of both complete and draft genome assemblies. Its underlying procedure follows a similar workflow as described by Goris et al. 2007. However, it avoids expensive sequence alignments and uses Mashmap as its MinHash based sequence mapping engine to compute the orthologous mappings and alignment identity estimates. Based on our experiments with complete and draft genomes, its accuracy is on par with BLAST-based ANI solver and it achieves two to three orders of magnitude speedup. Therefore, it is useful for pairwise ANI computation of large number of genome pairs. More details about its speed, accuracy and potential applications are described here: "High Throughput ANI Analysis of 90K Prokaryotic Genomes Reveals Clear Species Boundaries". ]]></help> <expand macro="citations" /> </tool>