0
|
1 <tool id="mlst" name="MLST" version="2.11">
|
|
2 <requirements>
|
|
3 <requirement type="package" version="2.11">mlst</requirement>
|
|
4 </requirements>
|
|
5
|
|
6 <version_command>mlst --version</version_command>
|
|
7
|
|
8 <command detect_errors="exit_code"><![CDATA[
|
|
9 mlst "$input_file" --nopath
|
|
10 #if $settings.advanced == "advanced"
|
|
11 #if $settings.min_dna_id
|
|
12 --minid=$settings.min_dna_id
|
|
13 #end if
|
|
14 #if $settings.min_dna_cov
|
|
15 --mincov=$settings.min_dna_cov
|
|
16 #end if
|
|
17 #if $settings.scheme
|
|
18 --scheme=$settings.scheme
|
|
19 #end if
|
|
20 #end if
|
|
21 > "$report"
|
|
22 ]]></command>
|
|
23
|
|
24 <inputs>
|
|
25 <param type="data" name="input_file" format="fasta,genbank" />
|
|
26 <conditional name="settings">
|
|
27 <param name="advanced" type="select" label="Specify advanced parameters">
|
|
28 <option value="simple" selected="true">No, use program defaults.</option>
|
|
29 <option value="advanced">Yes, see full parameter list.</option>
|
|
30 </param>
|
|
31 <when value="simple">
|
|
32 </when>
|
|
33 <when value="advanced">
|
|
34 <param name="min_dna_id" type="integer" label="Minimum DNA identity" value="95" min="0" max="100" help="Minimum DNA identity of full allelle to consider 'similar' (default 95, must be between 0-100)" optional="true" />
|
|
35 <param name="min_dna_cov" type="integer" label="Minimum DNA coverage" value="10" help="Minimum DNA coverage to report partial allele at all (default 10)" optional="true" />
|
|
36 <param name="scheme" type="text" area="false" label="PubMLST Scheme" help="Turn off auto-detection and only use this scheme" optional="true" />
|
|
37 </when>
|
|
38 </conditional>
|
|
39 </inputs>
|
|
40
|
|
41 <outputs>
|
|
42 <data name="report" format="tabular" />
|
|
43 </outputs>
|
|
44
|
|
45 <tests>
|
|
46 <!-- Basic test - will produce no results. -->
|
|
47 <test>
|
|
48 <param name="input_file" value="Acetobacter.fna"/>
|
|
49 <param name="advanced" value="simple"/>
|
|
50 <output name="report" ftype="tabular" file="output_noresults.txt" compare="contains"/>
|
|
51 </test>
|
|
52
|
|
53 <!-- Basic test - will produce results. -->
|
|
54 <test>
|
|
55 <param name="input_file" value="MRSA0252_trimmed.fna"/>
|
|
56 <param name="advanced" value="simple"/>
|
|
57 <output name="report" ftype="tabular" file="output_mrsa.txt" compare="contains"/>
|
|
58 </test>
|
|
59
|
|
60 <!-- Advanced test - Min DNA Coverage 100 -->
|
|
61 <test>
|
|
62 <param name="input_file" value="MRSA0252_trimmed.fna"/>
|
|
63 <param name="advanced" value="advanced"/>
|
|
64 <param name="min_dna_cov" value="100"/>
|
|
65 <output name="report" ftype="tabular" file="output_mincov100.txt" compare="contains"/>
|
|
66 </test>
|
|
67
|
|
68 <!-- Advanced test - Min DNA ID 100 -->
|
|
69 <test>
|
|
70 <param name="input_file" value="MRSA0252_trimmed.fna"/>
|
|
71 <param name="advanced" value="advanced"/>
|
|
72 <param name="min_dna_id" value="100"/>
|
|
73 <output name="report" ftype="tabular" file="output_minid100.txt" compare="contains"/>
|
|
74 </test>
|
|
75 </tests>
|
|
76
|
|
77 <help><![CDATA[
|
|
78 **What it does**
|
|
79
|
|
80 Given a genome file in FASTA or Genbank format, MLST will scan the file against PubMLST typing schemes.
|
|
81
|
|
82 **Output**
|
|
83
|
|
84 MLST will produce a tab-seperated output file which contains:
|
|
85 - the filename
|
|
86 - the closest PubMLST scheme name
|
|
87 - the ST (sequence type)
|
|
88 - the allele IDs
|
|
89
|
|
90 **Example Output**
|
|
91
|
|
92 ::
|
|
93
|
|
94 genomes/6008.fna saureus 239 arcc(2) aroe(3) glpf(1) gmk_(1) pta_(4) tpi_(4) yqil(3)
|
|
95
|
|
96 **Without auto-detection**
|
|
97
|
|
98 If you provide the 'scheme' parameter, it will print a fixed tabular output with a heading containing allele names specific to that scheme. To view a list of schemes, use the MLST List tool.
|
|
99
|
|
100 ::
|
|
101
|
|
102 FILE SCHEME ST abcZ adk aroE fumC gdh pdhC pgm
|
|
103 NM003.fa neisseria 11 2 3 4 3 8 4 6
|
|
104
|
|
105 **Missing data**
|
|
106 MLST does not just look for exact matches to full length alleles. It attempts to tell you as much as possible about what it found using the notation below:
|
|
107
|
|
108 +--------+---------------------------+
|
|
109 | Symbol | Meaning |
|
|
110 +========+===========================+
|
|
111 | n | Exact intact allele |
|
|
112 +--------+---------------------------+
|
|
113 | ~n | Novel allele similar to n |
|
|
114 +--------+---------------------------+
|
|
115 | n,m | Multiple alleles |
|
|
116 +--------+---------------------------+
|
|
117 | *-* | Allele missing |
|
|
118 +--------+---------------------------+
|
|
119
|
|
120 Galaxy wrapper maintained by Simon Gladman.
|
|
121 ]]></help>
|
|
122
|
|
123 <citations>
|
|
124 <citation type="bibtex">
|
|
125 @UNPUBLISHED{Seemann2016,
|
|
126 author = "Seemann T",
|
|
127 title = "MLST: Scan contig files against PubMLST typing schemes",
|
|
128 year = "2016",
|
|
129 note = "https://github.com/tseemann/mlst"}
|
|
130 </citation>
|
|
131 </citations>
|
|
132 </tool>
|