comparison mash_screen.xml @ 0:bac720dc1948 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/mash commit 500478e8adcabf5249941012f78fe2140ecc7264
author iuc
date Mon, 07 Jan 2019 15:09:58 -0500
parents
children 402b67d1af7d
comparison
equal deleted inserted replaced
-1:000000000000 0:bac720dc1948
1 <tool id="mash_screen" name="mash screen" version="@TOOL_VERSION@+galaxy0" profile="19.01">
2 <description>determines how well query sequences are contained within a pool of sequences.</description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <requirements>
7 <requirement type="package" version="@TOOL_VERSION@">mash</requirement>
8 </requirements>
9 <version_command>mash --version</version_command>
10 <command detect_errors="exit_code"><![CDATA[
11 ln -s '$queries' queries.msh &&
12 mash screen
13 $winner_takes_all
14 -i $minimum_identity_to_report
15 -v $maximum_p_value_to_report
16 queries.msh
17 '${ str($pool).replace(',', '\' \'') }'
18 > '$output'
19 ]]></command>
20 <inputs>
21 <param name="queries" type="data" format="msh" />
22 <param type="data" multiple="true" name="pool" format="@INTYPES@" />
23 <param type="boolean" name="winner_takes_all" argument="-w" truevalue="-w" falsevalue=""/>
24 <param type="float" name="minimum_identity_to_report" argument="-i" value="0." min="-1." max="1." />
25 <param type="float" name="maximum_p_value_to_report" argument="-v" value="1." min="0." max="1."/>
26 </inputs>
27 <outputs>
28 <data name="output" format="tabular" />
29 </outputs>
30 <tests>
31 <test>
32 <param name="queries" value="NZ_MYON01000010.1.msh"/>
33 <param name="pool" value="ERR024951_seqtk_sample_1000_1.fastq"/>
34 <output name="output" file="mash_screen_NZ_MYON01000010.1_ERR024951_seqtk_sample_1000_1.tsv"/>
35 </test>
36 <test>
37 <param name="queries" value="NZ_MYON01000010.1.msh"/>
38 <param name="pool" value="ERR024951_seqtk_sample_1000_2.fastq"/>
39 <output name="output" file="mash_screen_NZ_MYON01000010.1_ERR024951_seqtk_sample_1000_2.tsv"/>
40 </test>
41 <test>
42 <param name="queries" value="NZ_MYON01000010.1.msh"/>
43 <param name="pool" value="ERR024951_seqtk_sample_1000_1.fastq,ERR024951_seqtk_sample_1000_2.fastq"/>
44 <output name="output" file="mash_screen_NZ_MYON01000010.1_ERR024951_seqtk_sample_1000_1and2.tsv"/>
45 </test>
46 </tests>
47 <help><![CDATA[
48 Description:
49
50 Determine how well query sequences are contained within a pool of sequences.
51 The queries must be formatted as a single Mash sketch file (.msh), created
52 with the `mash sketch` command. The <pool> files can be contigs or reads, in
53 fasta or fastq, gzipped or not, and "-" can be given for <pool> to read from
54 standard input. The <pool> sequences are assumed to be nucleotides, and will
55 be 6-frame translated if the <queries> are amino acids. The output fields are
56 [identity, shared-hashes, median-multiplicity, p-value, query-ID,
57 query-comment], where median-multiplicity is computed for shared hashes, based
58 on the number of observations of those hashes within the pool.
59 ]]></help>
60 <citations>
61 <citation type="bibtex">
62 @article{ondov2016mash,
63 title={Mash: fast genome and metagenome distance estimation using MinHash},
64 author={Ondov, Brian D and Treangen, Todd J and Melsted, P{\'a}ll and Mallonee, Adam B and Bergman, Nicholas H and Koren, Sergey and Phillippy, Adam M},
65 journal={Genome biology},
66 volume={17},
67 number={1},
68 pages={132},
69 year={2016},
70 publisher={BioMed Central}
71 }
72 </citation>
73 </citations>
74 </tool>