Mercurial > repos > iuc > dram_distill
diff dram_distill.xml @ 0:f9a3ea1c618c draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/dram commit df10ba86507266a6a6f83c9bbefb7191a41b46f5
author | iuc |
---|---|
date | Sat, 10 Dec 2022 21:15:05 +0000 |
parents | |
children | 9471e3d97837 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/dram_distill.xml Sat Dec 10 21:15:05 2022 +0000 @@ -0,0 +1,93 @@ +<tool id="dram_distill" name="DRAM distill" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@"> + <description>metagenome-assembled-genomes (MAGs)</description> + <macros> + <import>macros.xml</import> + </macros> + <expand macro="requirements"/> + <expand macro="stdio"/> + <command detect_errors="exit_code"><![CDATA[ +DRAM.py distill +--input_file '$input_file' +--output_dir 'output_dir' +#if $rrna_path: + --rrna_path '$rrna_path' +#end if +#if $trna_path: + --trna_path '$trna_path' +#end if +--groupby_column '$groupby_column' +#if $custom_distillate: + --custom_distillate '$custom_distillate' +#end if +$distillate_gene_names +--genomes_per_product $genomes_per_product +&& test -f 'output_dir/genome_stats.tsv' && mv 'output_dir/genome_stats.tsv' '$output_genome_stats' || echo 'No genome_stats.tsv output produced' +&& test -f 'output_dir/metabolism_summary.xlsx' && mv 'output_dir/metabolism_summary.xlsx' '$output_metabolism_summary' || echo 'No metabolism_summary.xlsx output produced' +&& test -f 'output_dir/product.html' && mv 'output_dir/product.html' '$output_product_html' || echo 'No product.html output produced' +&& test -f 'output_dir/product.tsv' && mv 'output_dir/product.tsv' '$output_product_tsv' || echo 'No product.tsv output produced' + ]]></command> + <inputs> + <expand macro="input_file_param"/> + <param argument="--rrna_path" type="data" format="tabular" optional="true" label="rRNA file" help="Produced by the DRAM annotate tool (optional, leave blank to ignore)"/> + <param argument="--trna_path" type="data" format="tabular" optional="true" label="tRNA file" help="Produced by the DRAM annotate tool (optional, leave blank to ignore)"/> + <param argument="--groupby_column" type="text" value="fasta" label="Column from annotations to group as organism units"> + <expand macro="sanitizer"/> + </param> + <expand macro="custom_distillate_param"/> + <param argument="--distillate_gene_names" type="boolean" truevalue="--distillate_gene_names" falsevalue="" checked="false" label="Give names of genes instead of counts in genome metabolism summary?"/> + <param argument="--genomes_per_product" type="integer" value="1000" min="0" label="Number of genomes per product.html output"/> + </inputs> + <outputs> + <data name="output_genome_stats" format="tabular" label="${tool.name} on ${on_string}: genome stats"/> + <data name="output_metabolism_summary" format="xlsx" label="${tool.name} on ${on_string}: metabolism summary"/> + <data name="output_product_html" format="html" label="${tool.name} on ${on_string}: product html"/> + <data name="output_product_tsv" format="tabular" label="${tool.name} on ${on_string}: product_tsv"/> + </outputs> + <tests> + <!-- + These tests succeed, but the outputs are empty because the DRAM + database is not available in the test environment. This warning + is displayed in the log... + warnings.warn('Database does not exist at path %s' % self.description_loc) + ...and this exception is raised: + ValueError: Invalid file path or buffer object type: <class 'NoneType' + --> + <test expect_failure="true"> + <param name="input_file" ftype="tabular" value="annotated1.tabular"/> + <param name="rrna_path" ftype="tabular" value="input_distill_rrna1.tabular"/> + <param name="trna_path" ftype="tabular" value="input_distill_trna1.tabular"/> + <param name="custom_distillate" ftype="tabular" value="distill_custom.tabular"/> + <assert_stderr> + <has_text text="Traceback"/> + </assert_stderr> + </test> + </tests> + <help> +**What it does** + +@WHATITDOESHEADER@ + +This tool accepts a tabular file with all gene annotations from Pfam, UniProt, dbCAN and MEROPS databases produced by the +DRAM annotate tool and curates them into useful functional categories, creating genome statistics and metabolism summary +files. The genome statistics provides most genome quality information required for MIMAG standards, including GTDB-tk +and checkM information if provided by the user. The summarised metabolism table includes the number of genes with specific +metabolic function identifiers (KO, CAZY ID, etc) for each genome with information obtained from multiple databases. + +@CUSTOMDISTILLATEFILES@ + +This tool produces the following outputs. + +* **Distillate** + + * **genome stats** - a tabular file with genome statistics for all input genomes including all statistics required by recently defined MIMAG standards + * **metabolism summary** - an Excel file with metabolism summary of all input genomes which gives gene counts of functional and structural genes across a wide variety of metabolisms + +* **Liquor** + + * **product html** - an html file containing an interactive heatmap showing coverage of pathways, the coverage of electron transport chain components and the presence of selected metabolic functions + * **product tsv** - a tabular file with corresponding genes for the html heatmap + +@WHATITDOESFOOTER@ + </help> + <expand macro="citations"/> +</tool>