Mercurial > repos > brinkmanlab > parsnp
diff ParSNP.xml @ 0:932410434dd1 draft
"planemo upload for repository https://github.com/brinkmanlab/galaxy-tools/tree/master/parsnp commit 33b02e08cbc8f76fb4b8537f8c968393f85a1b5e"
author | brinkmanlab |
---|---|
date | Fri, 24 Jan 2020 17:45:42 -0500 |
parents | |
children | 2e855db9b19b |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/ParSNP.xml Fri Jan 24 17:45:42 2020 -0500 @@ -0,0 +1,198 @@ +<tool id="parsnp" name="ParSNP" version="1.2" profile="16.04"> + <description>Efficient microbial core genome alignment and SNP detection</description> + <edam_topics> + <edam_topic>topic_3293</edam_topic> + <edam_topic>topic_0194</edam_topic> + <edam_topic>topic_0091</edam_topic> + </edam_topics> + <edam_operations> + <edam_operation>operation_2451</edam_operation> + <edam_operation>operation_0323</edam_operation> + </edam_operations> + <requirements> + <requirement type="package" version="1.2">parsnp</requirement> + </requirements> + <version_command><![CDATA[parsnp -V |& tail -n1]]></version_command> + <command detect_errors="aggressive"><![CDATA[ + export GENOME_DIR=\$(mktemp -d -p `pwd`) + #for $genome in $genomes + && ln -sf '$genome' + #if $adv.use_ids + \$GENOME_DIR/'$genome.element_identifier' + #else + \$GENOME_DIR/\$(basename '$genome') + #end if + #end for + && parsnp -v -o `pwd` -p \${GALAXY_SLOTS:-1} -P \${GALAXY_MEMORY_MB:-15000000} -d "\$GENOME_DIR" + #if $ref_or_gbk.ref_type == "fasta" + #if $ref_or_gbk.ref_genome.random_ref + -r '!' + #else + -r '$ref_or_gbk.ref_genome.reference' + #end if + #else + -g ' + #for $gbk_file in $ref_or_gbk.genbank_files + #if $gbk_file + $gbk_file, + #end if + #end for + ' + #end if + $adv.MUMi_or_curated.curated $adv.extend_lcb $adv.output_unaligned + #if $adv.query_genome + -q '$adv.query_genome' + #end if + #unless $adv.MUMi_or_curated.curated + $adv.MUMi_or_curated.MUMi.MUMi_only + #unless $adv.MUMi_or_curated.MUMi.max_mumi_distribution.max_distribution_default + -U '$adv.MUMi_or_curated.MUMi.max_mumi_distribution.max_distribution' + #end unless + #unless $adv.MUMi_or_curated.MUMi.max_mumi_distance.max_distance_default + -i '$adv.MUMi_or_curated.MUMi.max_mumi_distance.max_distance' + #end unless + #end unless + #unless $adv.min_anchor_len.anchor_default + -a '$adv.min_anchor_len.anchor' + #end unless + -C '$adv.d_value' + -z '$adv.lcb_size' + #if $adv.max_diag_diff.diag_diff_unit + -D '$adv.max_diag_diff.diag_diff_bp$adv.max_diag_diff.diag_diff_unit' + #else + -D '$adv.max_diag_diff.diag_diff' + #end if + #unless $adv.aligner == "muscle" + -n '$adv.aligner' + #end unless + + ]]></command> + <inputs> + <!-- Inputs --> + <param name="genomes" type="data" multiple="true" argument="-d" format="fasta" label="Genomes/Contigs/Scaffolds" /> + <conditional name="ref_or_gbk"> + <param name="ref_type" type="select" label="Reference type"> + <option value="fasta">Single fasta</option> + <option value="gbk">Multiple genbank files</option> + </param> + <when value="fasta"> + <conditional name="ref_genome" label="Reference genome"> + <param name="random_ref" type="boolean" checked="false" label="Use random genome from above" /> + <when value="false"> + <param name="reference" type="data" format="fasta" label="Reference"/> + </when> + </conditional> + </when> + <when value="gbk"> + <param name="genbank_files" type="data" format="genbank" argument="-g" multiple="true" label="Reference genbank files" /> + </when> + </conditional> + + <section name="adv" title="Advanced options" expanded="false"> + <param name="query_genome" type="data" format="fasta" optional="true" label="Specify additional (assembled) query genome to use" /> + <param name="use_ids" type="boolean" checked="true" label="Use dataset name or collection id's instead of file name in output" help="IDs must be valid POSIX file names" /> + + <!-- Recombination filtration --> + <param name="filter_snp" type="boolean" checked="false" truevalue="-x" falsevalue="" label="Enable filtering of SNPs located in PhiPack identified regions of recombination" /> + + <!-- MUM --> + <conditional name="min_anchor_len"> + <param name="anchor_default" type="boolean" checked="true" label="Minimum ANCHOR length default" /> + <when value="false"> + <param name="anchor" type="float" min="0" value="1.1" label="Minimum ANCHOR length"/> + </when> + </conditional> + <param name="d_value" type="integer" min="0" value="100" argument="-C" label="Maximal cluster D value"/> + <param name="lcb_size" type="integer" min="0" value="25" argument="-z" label="Min LCB size" /> + + <!-- MUMi --> + <conditional name="MUMi_or_curated"> + <param name="curated" type="boolean" checked="false" truevalue="-c" falsevalue="" label="Curated genome directory, use all genomes and ignore MUMi" /> + <when value=""> + <conditional name="MUMi"> + <param name="MUMi_only" type="boolean" checked="false" truevalue="-M" falsevalue="" argument="-M" label="Only calculate MUMi and exit" /> + <when value=""> + <conditional name="max_mumi_distribution" label="Max MUMi distance value for MUMi distribution"> + <param name="max_distribution_default" type="boolean" checked="true" label="Default" /> + <when value="false"> + <param name="max_distribution" type="float" value="1" /> + </when> + </conditional> + <conditional name="max_mumi_distance" label="Max MUMi distance"> + <param name="max_distance_default" type="boolean" checked="true" label="Autocutoff based on distribution of MUMi values" /> + <when value="false"> + <param name="max_distance" type="float" value="1" /> + </when> + </conditional> + </when> + </conditional> + </when> + </conditional> + + <!--LCB --> + <conditional name="max_diag_diff" label="Maximal diagonal difference"> + <param name="diag_diff_unit" type="select" label="Unit"> + <option value="" selected="true">%</option> + <option value="bp">Base pairs</option> + </param> + <when value=""> + <param name="diag_diff" type="float" min="0" max="1" value="0.12" /> + </when> + <when value="bp"> + <param name="diag_diff_bp" type="integer" min="0" value="100" /> + </when> + </conditional> + <param name="extend_lcb" type="boolean" checked="false" truevalue="-e" falsevalue="" argument="-e" label="Greedily extend LCBs" /> + <param name="aligner" type="select" argument="-n" label="Alignment program"> + <option value="muscle" selected="true">muscle</option> + <option value="mafft">mafft</option> + <option value="fsa">fsa</option> + <option value="prank">prank</option> + </param> + <param name="output_unaligned" type="boolean" checked="false" truevalue="-u" falsevalue="" argument="-u" label="Output unaligned regions" /> + </section> + </inputs> + <outputs> + <data name="tree" format="newick" from_work_dir="parsnp.tree" label="${tool.name} on ${on_string}: Newick formatted core genome SNP tree" /> + <data name="vcf" format="vcf" from_work_dir="parsnp.vcf" label="${tool.name} on ${on_string}: SNPs used to infer phylogeny" /> + <data name="ggr" format="ggr" from_work_dir="parsnp.ggr" label="${tool.name} on ${on_string}: Gingr formatted binary archive" /> + <data name="xfma" format="xfma" from_work_dir="parsnp.xmfa" label="${tool.name} on ${on_string}: XMFA formatted multiple alignment" /> + <data name="unaligned" format="txt" from_work_dir="parsnp.unaligned" label="${tool.name} on ${on_string}: Unaligned regions" > + <filter>adv['output_unaligned']</filter> + </data> + </outputs> + <tests> + <test expect_num_outputs="4"> + <param name="genomes" > + <collection type="list"> + <element name="test1" value="test-data/15596_genome.fasta" ftype="fasta" /> + <element name="test2" value="test-data/15602_genome.fasta" ftype="fasta" /> + <element name="test3" value="test-data/15599_genome.fasta" ftype="fasta" /> + </collection> + </param> + <conditional name="ref_or_gbk"> + <param name="ref_type" value="fasta" /> + <conditional name="ref_genome"> + <param name="random_ref" value="false" /> + <param name="reference" value="test-data/15600_genome.fasta" ftype="fasta" /> + </conditional> + </conditional> + <section name="adv"> + <conditional name="MUMi_or_curated"> + <param name="curated" value="-c" /> + </conditional> + </section> + <output name="tree" checksum="sha256:66a2cc47666452fae008b546ab2bd5f9a06c7c7daca88e34e2be7a5cdd371137" ftype="newick" /> + <output name="vcf" checksum="sha256:e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855" ftype="vcf" /> + <output name="ggr" checksum="sha256:9e91807a25a9549070cfde5cc60844991db5cbee55d9181c61e75220b67f35c5" ftype="txt" /> + <output name="xfma" checksum="sha256:1774759cc4c34b53e117406a9055f933620960be852ab77501eab1d34badbbfa" ftype="txt" /> + </test> + </tests> + <help><![CDATA[ + https://harvest.readthedocs.io/en/latest/content/parsnp.html + ]]></help> + <citations> + <citation type="doi">10.5281/zenodo.3364789</citation> + <citation type="doi">10.1101/007351</citation> + </citations> +</tool>