annotate ITSx.xml @ 0:57e76d405a97 draft default tip

Uploaded
author aafc-mbb
date Mon, 14 Mar 2016 16:15:08 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
1 <tool id="ITSx" name="ITSx Extractor" version="1.0.11">
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
2
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
3 <description>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
4 ITSx -- Identifies ITS sequences and extracts the ITS region
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
5 </description>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
6
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
7 <requirements>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
8 <requirement type="package" version="3.1b2">hmmer</requirement>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
9 </requirements>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
10
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
11 <stdio>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
12 <regex match="ITSx" source="both" level="log"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
13 <regex match="analysis" source="both" level="log"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
14 <regex match="ERROR" source="both" level="fatal"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
15 <regex match="error" source="both" level="fatal"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
16 </stdio>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
17
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
18 <command interpreter="perl">
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
19 ITSx -i $input
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
20 --detailed_results T
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
21 -E $domain_eval
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
22 -S $domain_score
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
23 -N $domain_num
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
24 --cpu=\${GALAXY_SLOTS:-1}
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
25 $allow_reorder
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
26 $complement
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
27 $heuristics
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
28 $preserve
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
29 $reset
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
30 $truncate
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
31 #if $hmmer_search.search == "eval"
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
32 --search_eval $hmmer_search.eval_cutoff
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
33 #else
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
34 --search_score $hmmer_search.score_cutoff
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
35 #end if
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
36 </command>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
37
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
38 <inputs>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
39 <param name="input" type="data" format="fasta" label="Input Fasta"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
40
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
41 <param name="domain_eval" type="float" value="0.00001" label="Domain E-value Cutoff"
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
42 help="Domain E-value cutoff a sequence must obtain in the HMMER-based step to be included in the output."/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
43
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
44 <param name="domain_score" type="integer" value="0" label="Domain Score Cutoff"
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
45 help="Domain score cutoff that a sequence must obtain in the HMMER-based step to be included in the output."/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
46
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
47 <param name="domain_num" type="integer" value="2" label="Minimum Number of Domains"
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
48 help="The minimum number of domains (different HMM gene profiles) that must match a sequence for it to be included in the output (detected as an ITS sequence). Setting the value lower than two will increase the number of false positives, while increasing it above two will decrease ITSx detection abilities on fragmentary data. "/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
49
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
50 <conditional name="hmmer_search">
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
51 <param name="search" type="select" label="HMMER Search Type">
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
52 <option value="eval">Search E-value</option>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
53 <option value="score">Search Score</option>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
54 </param>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
55 <when value="eval">
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
56 <param name="eval_cutoff" type="float" value="0.01" label="Search E-value"
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
57 help="The actual E-value cutoff used in the HMMER search. High numbers may slow down the process. Should never be set to a lower value than the Domain E-value Cutoff option. Cannot be used in combination with the Search Score option."/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
58 </when>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
59 <when value="score">
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
60 <param name="score_cutoff" type="integer" value="0" label="Search Score"
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
61 help="The score cutoff used in the HMMER search. Low numbers may slow down the process. Should never be set to a higher number than the Domain Score Cutoff. Cannot be used in combination with the Search E-value option."/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
62 </when>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
63 </conditional>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
64
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
65 <param name="reset" type="boolean" checked="true" truevalue="--reset T" falsevalue="--reset F" label="Re-creates the HMM-database before ITSx is run"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
66
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
67 <!-- <param name="cpu" type="integer" value="1" label="cpu"/> -->
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
68
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
69 <param name="allow_reorder" type="boolean" checked="false" truevalue="--allow_reorder T" falsevalue="--allow_reorder F" label="Allow profiles not to be in the expected order on the extracted sequences"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
70
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
71 <param name="complement" type="boolean" checked="true" truevalue="--complement T" falsevalue="--complement F" label="Check both DNA strands against the database"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
72
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
73 <param name="heuristics" type="boolean" checked="false" truevalue="--heuristics T" falsevalue="--heuristics F" label="Use HMMER's heuristic filtering"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
74
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
75 <param name="preserve" type="boolean" checked="false" truevalue="--preserve T" falsevalue="--preserve F" label="Preserve sequence headers instead of printing out ITSx headers"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
76
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
77 <param name="truncate" type="boolean" checked="true" truevalue="--truncate T" falsevalue="--truncate F" label="Remove ends of ITS sequences if they are outside of the ITS region"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
78 </inputs>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
79
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
80 <outputs>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
81 <data name="ITS1" format="fasta" label="Extracted ITS1 Fasta File" from_work_dir="ITSx_out.ITS1.fasta"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
82 <data name="ITS2" format="fasta" label="Extracted ITS2 Fasta File" from_work_dir="ITSx_out.ITS2.fasta"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
83 <data name="fullfasta" format="fasta" label="Full Fasta of ITS extracted" from_work_dir="ITSx_out.full.fasta"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
84 <data name="graph" format="txt" label="Graph of ITS regions" from_work_dir="ITSx_out.graph"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
85 <data name="nodetect" format="fasta" label="No ITS region" from_work_dir="ITSx_out_no_detections.fasta"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
86 <data name="positions" format="tabular" label="ITSx feature positions" from_work_dir="ITSx_out.positions.txt"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
87 <data name="problematic" format="tabular" label="Problematic sequences" from_work_dir="ITSx_out.problematic.txt"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
88 <data name="summary" format="txt" label="ITSx summary" from_work_dir="ITSx_out.summary.txt"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
89 <data name="extractions" format="tabular" label="ITSx extraction results" from_work_dir="ITSx_out.extraction.results"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
90 </outputs>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
91
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
92 <tests>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
93 <test>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
94 <param name="input" value="testITSsequences.fasta"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
95 <param name="domain_eval" value="0.00001" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
96 <param name="domain_score" value="0" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
97 <param name="domain_num" value="2" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
98 <param name="search" value="eval" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
99 <param name="eval_cutoff" value="0.01" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
100 <param name="reset" value="--reset T" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
101 <param name="allow_reorder" value="--allow_reorder F" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
102 <param name="complement" value="--complement T"/>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
103 <param name="heuristics" value="--heuristics F" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
104 <param name="preserve" value="--preserve F" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
105 <param name="truncate" value="--truncate T" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
106 <output name="ITS1" file="expectedOutput.ITS1.fasta" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
107 <output name="ITS2" file="expectedOutput.ITS2.fasta" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
108 <output name="fullfasta" file="expectedOutput.full.fasta" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
109 <output name="graph" file="expectedOutput.graph" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
110 <!-- This output is commented out because it is empty -->
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
111 <!--<output name="nodetect" file="expectedOutput_no_detections.fasta" />-->
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
112 <output name="positions" file="expectedOutput.positions.txt" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
113 <!-- This output is commented out because it causes the test to fail (due to the difference in time that gets printed out in the expected output and the output of the test) -->
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
114 <!--<output name="summary" file="expectedOutput.summary.txt" />-->
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
115 <output name="problematic" file="expectedOutput.problematic.txt" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
116 <output name="extractions" file="expectedOutput.extractions.txt" />
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
117 </test>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
118 </tests>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
119
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
120 <help>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
121 **Description**
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
122
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
123 Identifies ITS sequences and extracts the ITS regions.
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
124
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
125 ITSx is an open source software utility to extract the highly variable ITS1 and ITS2 subregions from ITS sequences, which are commonly used as a molecular barcode for e.g. fungi. As the inclusion of parts of the neighbouring, very conserved, ribosomal genes (SSU, 5S and LSU rRNA sequences) in the sequence identification process can lead to severely misleading results, ITSx identifies and extracts only the ITS regions themselves.
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
126 For more information regarding the settings of the tool, please visit the ITSx Users Guide on http://microbiology.se/publ/itsx_users_guide.pdf
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
127
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
128 -----
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
129
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
130 **Inputs and Outputs**
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
131
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
132 - Inputs:
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
133 + Accepts input in the FASTA format. It is possible to input both aligned and unaligned FASTA files, containing both DNA and RNA sequences
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
134
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
135 - Outputs:
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
136 + Summary file of the entire run
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
137 + One or more detailed tables containing the positions in the respective sequences where the ITS subregions were found
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
138 + Semi-graphical representation of hits
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
139 + FASTA file of all identified sequences
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
140 + FASTA file for ITS1 regions
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
141 + FASTA file for ITS2 regions
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
142 + A list of sequence IDs representing the entries (if they exist) that did not contain any ITS region
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
143 + A file containing chimeric sequences (if they are found)
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
144 + A file for problematic sequences
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
145
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
146 -----
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
147
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
148 **Tool Information**
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
149
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
150 - ITSx tool v1.0.11:
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
151 + Release Date: December 2014
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
152 + URL: http://microbiology.se/software/itsx/
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
153 + Source URL: http://microbiology.se/sw/ITSx_1.0.11.tar.gz
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
154 + Copyright (C) 2012-2013 Johan Bengtsson-Palme et al.
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
155
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
156 -----
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
157
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
158 **Contact Information**
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
159
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
160 - For more information, contact:
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
161 + AAFC-MBB Team
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
162 + E-mail: mbb@agr.gc.ca
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
163 + Agriculture and Agri-Food Canada, Ottawa, ON, Canada
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
164 </help>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
165
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
166 <citations>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
167 <citation type="bibtex">@ARTICLE{a1,
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
168 author = {Bengtsson-Palme, Johan},
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
169 title = {ITSx: Improved software detection and extraction of ITS1 and ITS2 from ribosomal ITS sequences of fungi and other eukaryotes for use in environmental sequencing},
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
170 year = {2013}
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
171 }</citation>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
172 </citations>
57e76d405a97 Uploaded
aafc-mbb
parents:
diff changeset
173 </tool>