annotate ITSx.xml @ 0:f82c70f54bd7 draft

Uploaded
author okorol
date Tue, 24 Mar 2015 12:02:48 -0400
parents
children b433586432d7
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
1 <tool id="ITSx" name="ITSx Extractor" version="1.0.6">
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
2
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
3 <description>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
4 ITSx -- Identifies ITS sequences and extracts the ITS region
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
5 </description>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
6
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
7 <command interpreter="perl">
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
8 ITSx -i $input --detailed_results T --cpu $cpu $complement $heuristics $preserve $reset
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
9 </command>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
10 <requirements>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
11 <requirement type="package" version="3.1b1">hmmer</requirement>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
12 </requirements>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
13 <inputs>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
14 <param name="input" type="data" format="fasta" label="Input Fasta"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
15 <param name="cpu" type="integer" value="1" label="cpu"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
16 <param name="complement" type="boolean" checked="true" truevalue="--complement T" falsevalue="--complement F" label="Checks both DNA strands against the database"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
17 <param name="heuristics" type="boolean" checked="false" truevalue="--heuristics T" falsevalue="--heuristics F" label="Use HMMER's heuristic filtering"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
18 <param name="reset" type="boolean" checked="false" truevalue="--reset T" falsevalue="--reset F" label="Re-creates the HMM-database before ITSx is run"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
19 <param name="preserve" type="boolean" checked="false" truevalue="--preserve T" falsevalue="--preserve F" label="Preserve sequence headers instead of printing out ITSx headers"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
20 </inputs>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
21
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
22 <outputs>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
23 <data name="ITS1" format="fasta" label="Extracted ITS1 Fasta File" from_work_dir="ITSx_out.ITS1.fasta"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
24 <data name="ITS2" format="fasta" label="Extracted ITS2 Fasta File" from_work_dir="ITSx_out.ITS2.fasta"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
25 <data name="fullfasta" format="fasta" label="Full Fasta of ITS extracted" from_work_dir="ITSx_out.full.fasta"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
26 <data name="graph" format="txt" label="Graph of ITS regions" from_work_dir="ITSx_out.graph"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
27 <data name="nodetect" format="fasta" label="No ITS region" from_work_dir="ITSx_out_no_detections.fasta"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
28 <data name="positions" format="tabular" label="ITSx feature positions" from_work_dir="ITSx_out.positions.txt"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
29 <data name="problematic" format="tabular" label="Problematic sequences" from_work_dir="ITSx_out.problematic.txt"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
30 <data name="summary" format="txt" label="ITSx summary" from_work_dir="ITSx_out.summary.txt"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
31 <data name="extractions" format="tabular" label="ITSx extraction results" from_work_dir="ITSx_out.extraction.results"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
32 </outputs>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
33
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
34 <stdio>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
35 <regex match="ITSx" source="both" level="log"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
36 <regex match="analysis" source="both" level="log"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
37 <regex match="ERROR" source="both" level="fatal"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
38 <regex match="error" source="both" level="fatal"/>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
39 </stdio>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
40
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
41 <test></test>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
42 <help>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
43 ITSx -- Identifies ITS sequences and extracts the ITS region
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
44
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
45 Source code available at:
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
46 http://microbiology.se/software/itsx
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
47
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
48 Version: 1.0.6
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
49 ITSx -- Identifies ITS sequences and extracts the ITS region
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
50 Copyright (C) 2012-2013 Johan Bengtsson-Palme et al.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
51 Contact: Johan Bengtsson-Palme, johan[at]microbiology.se
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
52 Programmer: Johan Bengtsson-Palme
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
53
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
54 Full installation instructions can be found in the User's Guide.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
55 A quick installation guide follows below.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
56
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
57 ITSx requires Perl and HMMER3.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
58
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
59 1) Perl is usually installed on Unix-like systems by default. If not, it can be retrieved from http://www.perl.org/
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
60
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
61 2) HMMER3 can be found at http://hmmer.janelia.org/software
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
62 Download it and follow the on site instructions for installation.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
63
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
64 3) Obtain the ITSx package from http://microbiology.se/software/itsx
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
65 Unpack the tarball and move into the newly created "ITSx" directory.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
66
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
67 4) Copy the ITSx file and the ITSx_db directory to your preferred bin directory.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
68
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
69 5) To test if ITSx was successfully installed type "ITSx --help" on the command-line. You should now see the ITSx help message.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
70
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
71 To run ITSx, you need a FASTA-formatted input file. You can e.g. use the test.fasta file supplied with the package. To check for ITS sequences in the test file, type "ITSx -i test.fasta -o test" on the command line. If you are on a multicore machine, you might want to use the "--cpu 2" option to speed up the processes by using two (or more) cores.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
72
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
73 New features in this version:
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
74 - Fixed a bug causing over-reporting of chimeras
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
75
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
76
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
77 If you encounter a bug or some other strange behaviour, please report it to:
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
78 johan[at]microbiology.se
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
79
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
80 This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program, in a file called 'license.txt'. If not, see: http://www.gnu.org/licenses/.
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
81
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
82 ----
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
83
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
84 Usage: ITSx -i [input file] -o [output file]
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
85
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
86 Options:
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
87
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
88 -i {file} : DNA FASTA input file to investigate
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
89
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
90 -o {file} : Base for the names of output file(s)
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
91
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
92 -p {directory} : A path to a directory of HMM-profile collections representing ITS conserved regions, default is in the same directory as ITSx itself
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
93
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
94 --date {T or F} : Adds a date and time stamp to the output directory, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
95
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
96 --reset {T or F} : Re-creates the HMM-database before ITSx is run, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
97
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
98 Sequence selection options:
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
99
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
100 -t {character code} : Profile set to use for the search, see the User's Guide (comma-separated), default is all
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
101
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
102 -E {value} : Domain E-value cutoff for a sequence to be included in the output, default = 1e-5
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
103
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
104 -S {value} : Domain score cutoff for a sequence to be included in the output, default = 0
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
105
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
106 -N {value} : The minimal number of domains that must match a sequence before it is included, default = 2
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
107
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
108 --selection_priority {sum, domains, eval, score} : Selects what will be of highest priority when determining the origin of the sequence, default is sum
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
109
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
110 --search_eval {value} : The E-value cutoff used in the HMMER search, high numbers may slow down the process, cannot be used with the --search_score option, default is 0.01
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
111
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
112 --search_score {value} : The score cutoff used in the HMMER search, low numbers may slow down the process, cannot be used with the --search_eval option, default is to use the E-value cutoff, not score
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
113
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
114 --allow_single_domain {e-value,score or F} : Allow inclusion of sequences that only find a single domain, given that they meet the given E-value and score thresholds, on with parameters 1e-9,0 by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
115
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
116 --allow_reorder {T or F} : Allows profiles to be in the wrong order on extracted sequences, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
117
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
118 --complement {T or F} : Checks both DNA strands against the database, creating reverse complements, on (T) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
119
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
120 --cpu {value} : the number of CPU threads to use, default is 1
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
121
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
122 --multi_thread {T or F} : Multi-thread the HMMER-search, on (T) if number of CPUs (--cpu option > 1), else off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
123
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
124 --heuristics {T or F} : Selects whether to use HMMER's heuristic filtering, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
125
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
126 Output options:
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
127
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
128 --summary {T or F} : Summary of results output, on (T) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
129
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
130 --graphical {T or F} : 'Graphical' output, on (T) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
131
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
132 --fasta {T or F} : FASTA-format output of extracted ITS sequences, on (T) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
133
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
134 --preserve {T or F} : Preserve sequence headers in input file instead of printing out ITSx headers, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
135
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
136 --save_regions {SSU,ITS1,5.8S,ITS2,LSU,all,none} : A comma separated list of regions to output separate FASTA files for, 'ITS1,ITS2' by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
137
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
138 --anchor {integer or HMM} : Saves an additional number of bases before and after each extracted region. If set to 'HMM' all bases matching the corresponding HMM will be output, default = 0
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
139
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
140 --partial {integer} : Saves additional FASTA-files for full and partial ITS sequences longer than the specified cutoff, default = 0 (off)
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
141
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
142 --concat {T or F} : Saves a FASTA-file with concatenated ITS sequences (with 5.8S removed), off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
143
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
144 --minlen {integer} : Minimum length the ITS regions must be to be outputted in the concatenated file (see above), default = 0
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
145
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
146 --positions {T or F} : Table format output containing the positions ITS sequences were found in, on (T) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
147
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
148 --table {T or F} : Table format output of sequences containing probable ITS sequences, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
149
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
150 --not_found {T or F} : Saves a list of non-found entries, on (T) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
151
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
152 --detailed_results {T or F} : Saves a tab-separated list of all results, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
153
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
154 --truncate {T or F} : Truncates the FASTA output to only contain the actual ITS sequences found, on (T) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
155
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
156 --silent {T or F} : Suppresses printing progress info to stderr, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
157
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
158 --graph_scale {value} : Sets the scale of the graph output, if value is zero, a percentage view is shown, default = 0
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
159
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
160 --save_raw {T or F} : Saves all raw data for searches etc. instead of removing it on finish, off (F) by default
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
161
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
162 -h : displays this help message
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
163
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
164 --help : displays this help message
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
165
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
166 --bugs : displays the bug fixes and known bugs in this version of ITSx
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
167
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
168 --license : displays licensing information
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
169
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
170 </help>
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
171
f82c70f54bd7 Uploaded
okorol
parents:
diff changeset
172 </tool>