Mercurial > repos > dannon > metaphlan
changeset 0:4f3fe44edb3f
Initial upload. Still needs tests.
author | dannon |
---|---|
date | Thu, 29 Mar 2012 03:32:11 -0400 |
parents | |
children | 016f6375aadc |
files | metaphlan.xml |
diffstat | 1 files changed, 121 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/metaphlan.xml Thu Mar 29 03:32:11 2012 -0400 @@ -0,0 +1,121 @@ +<tool id="metaphlan" name="MetaPhlAn" version="1.0"> +<requirements> +<requirement type="package">metaphlan</requirement> +<requirement type="package" version="2.2.25+">blast</requirement> +</requirements> + <description>Metagenomic Phylogenetic Analysis</description> + <command> + metaphlan.py + #if str($source.type) == "fasta": + ${source.fasta_input} + #else: + ${source.blast_input} + #end if + ${metaphlan_out} + --nproc 4 + #if str($source.type) == "fasta": + --blastout metagenome.outfmt6.txt + --evalue ${source.evalue} + #end if + --lib_dir ${GALAXY_DATA_INDEX_DIR}/shared/metaphlan + --min_cu_len ${min_cu_len} + --min_nreads ${min_nreads} + </command> + <inputs> + + <conditional name="source"> + <param name="type" type="select" label="Input Type"> + <option value="fasta">multi-fasta file containing metagenomic reads</option> + <option value="blast">NCBI BLAST output file</option> + </param> + <when value="fasta"> + <param format="fasta" name="fasta_input" type="data" label="from"/> + <param name="evalue" type="float" size="15" value="0.00001" label="evalue threshold for the blasting" /> + </when> + <when value="blast"> + <param format="tabular" name="blast_input" type="data" label="from"/> + </when> + </conditional> + + <param name="tax_lev" type="select" label="Taxonomic Level" help="The taxonomic level for the relative abundance output"> + <option value="a">All taxonomic levels</option> + <option value="k">Kingdoms (Bacteria and Archaea) only</option> + <option value="p">Phyla only</option> + <option value="c">Classes only</option> + <option value="o">Orders only</option> + <option value="f">Families only</option> + <option value="g">Genera only</option> + <option value="s">Species only</option> + </param> + <param name="min_cu_len" type="integer" value="10000" help="min_cu_len" label="Minimum total nucleotide length for the unique markers for estimating the abundance without considering children clade abundances" /> + <param name="min_nreads" type="integer" value="5" help="min_nreads" label="minimum total reads assigned to a clade for estimating the abundance without considering children clade abundances" /> + </inputs> + <outputs> + <data format="tabular" name="metaphlan_out" label="MetaPhlAn on ${on_string}" /> + <data format="tabular" name="blast_out" from_work_dir="metagenome.outfmt6.txt" label="MetaPhlAn BLAST on ${on_string}"> + <filter>source['type'] == "fasta"</filter> + </data> + </outputs> + <tests> + </tests> + <help> + +**What it does** +MetaPhlAn is a computational tool for profiling the composition of microbial communities from metagenomic shotgun sequencing data. MetaPhlAn relies on unique clade-specific marker genes identified from reference genomes, allowing orders of magnitude speedups and unambiguous taxonomic assignments. + +MetaPhlAn main features are: + +More than 100x computational speedup compared to Blast-based approaches or other available methods with species level resolution +Higher accuracy in estimating the true composition of microbial communities in terms of organismal relative abundance +Unambiguous read-to-taxa assignments as conserved inter-clade sequences are removed from the reference sequence data + +--------- + +**Inputs** + +The input file can be a multi-fasta file containing metagenomic reads OR a NCBI BLAST output file (-outfmt 6 format) of the metagenomic read fasta file against the metaflan database. + +**outputs** + +The output is a tab-separated output file of the predicted taxon relative abundances. +If the input is a multi-fasta file then the output from the BLAST operation is also provided as an additional output. + +--------- + +**Settings**:: + + --tax_lev TAXONOMIC_LEVEL + The taxonomic level for the relative abundance + output: + 'a' : all taxonomic levels + 'k' : kingdoms (Bacteria and Archaea) only + 'p' : phyla only + 'c' : classes only + 'o' : orders only + 'f' : families only + 'g' : genera only + 's' : species only + [default 'a'] + --evalue evalue threshold for the blasting + [default 1e-6] + --min_cu_len minimum total nucleotide lenght for the unique + markers for estimating the abundance without + considering children clade abundances + [default 10000] + --min_nreads minimum total reads assigned to a clade for + estimating the abundance without considering + children clade abundances + [default 5] + +----- + +**Citation** + +If you find MetaPhlAn useful in your research, please cite our paper: +Nicola Segata, Levi Waldron, Annalisa Ballarini, Vagheesh Narasimhan, Olivier Jousson, Curtis Huttenhower. +"Fast and accurate metagenomic profiling of microbial community composition using unique clade-specific marker genes" +***in review*** + + </help> +</tool> +