annotate long-orfs_wrapper.xml @ 0:9c8ffce71f7c draft default tip

Uploaded
author crs4
date Mon, 09 Sep 2013 12:16:17 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
1 <tool id="long_orfs_wrapper" name="Long-ORFs" version="0.2">
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
2 <description></description>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
3 <requirements>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
4 <requirement type="package" version="3.02">glimmer</requirement>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
5 </requirements>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
6 <command interpreter="python">
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
7 long-orfs_wrapper.py --loSequence $loSequence
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
8 #if $loStartCodons
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
9 --loStartCodons="$loStartCodons"
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
10 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
11 #if $loEntropy
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
12 --loEntropy=$loEntropy
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
13 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
14 #if $loFixed
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
15 --loFixed
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
16 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
17 #if str($loMinLen)
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
18 --loMinLen=$loMinLen
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
19 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
20 #if $loLinear
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
21 --loLinear
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
22 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
23 #if $loLengthOpt
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
24 --loLengthOpt
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
25 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
26 #if $loNoHeader
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
27 --loNoHeader
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
28 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
29 #if str($loMaxOverlap)
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
30 --loMaxOverlap=$loMaxOverlap
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
31 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
32 #if str($loCutoff)
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
33 --loCutoff=$loCutoff
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
34 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
35 #if $loWithoutStops
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
36 --loWithoutStops
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
37 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
38 #if str($loTransTable)
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
39 --loTransTable=$loTransTable
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
40 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
41 #if $loStopCodons
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
42 --loStopCodons="$loStopCodons"
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
43 #end if
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
44 --loOutput $loOutput --logfile $logfile
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
45 </command>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
46
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
47 <inputs>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
48 <param name="loSequence" type="data" format="fasta" label="DNA sequence to be analyzed" help="FASTA format" />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
49
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
50 <param name="loStartCodons" type="text" value="" optional="true" label="Specify allowable start codons as a comma-separated list (-A, --start_codons)" help="Sample format: 'atg,gtg'. The default start codons are atg, gtg and ttg." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
51
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
52 <param name="loEntropy" type="data" format="glimmer_entropy_profiles" optional="true" label="Entropy profiles (-E, --entropy)" help="The entropy profiles are used only if the cutoff option is specified." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
53
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
54 <param name="loFixed" type="boolean" checked="false" label="Fixed minimum gene length (-f, --fixed)" help="Do NOT automatically calculate the minimum gene length that maximizes the number or length of output regions, but instead use either the value specified by the 'minimum gene length' option or else the default, which is 90." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
55
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
56 <param name="loMinLen" type="integer" value="" optional="true" label="Minimum gene length in number of nucleotides (-g, --min_len)" help="It does not include the bases in the stop codon." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
57
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
58 <param name="loLinear" type="boolean" checked="false" label="Assuming a linear genome (-l, --linear)" help="No 'wrap-around' genes with part at the beginning of the sequence and the rest at the end of the sequence." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
59
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
60 <param name="loLengthOpt" type="boolean" checked="false" label="Optimize minimum gene length (-L, --length_opt)" help="Find and use as the minimum gene length the value that maximizes the total length of non-overlapping genes, instead of the default behaviour, which is to maximize the total number of non-overlapping genes." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
61
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
62 <param name="loNoHeader" type="boolean" checked="true" label="Do not include the program-settings header information in the output file (-n, --no_header)" help="The output file will contain only the coordinates of the selected ORFs." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
63
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
64 <param name="loMaxOverlap" type="integer" value="" optional="true" label="Maximum overlap length (-o, --max_olap)" help="Overlaps of this many or fewer bases between genes are not regarded as overlaps." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
65
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
66 <param name="loCutoff" type="float" value="" optional="true" label="Only genes with an entropy distance score less than this value will be considered (-t, --cutoff)" help=" This cutoff is made before any subsequent steps in the algorithm." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
67
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
68 <param name="loWithoutStops" type="boolean" checked="false" label="Do NOT include the stop codon in the region described by the output coordinates (-w, --without_stops)" help="By default it is included." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
69
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
70 <param name="loTransTable" type="integer" value="" optional="true" label="Use GenBank translation table number n to specify stop codons (-z, --trans_table)" help="" />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
71
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
72 <param name="loStopCodons" type="text" value="" optional="true" label="Specify allowable stop codons as a comma-separated list (-Z, --stop_codons)" help="Sample format: 'tag,tga'. The default stop codons are tag, tga and taa." />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
73 </inputs>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
74
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
75 <outputs>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
76 <data name="logfile" format="txt" label="${tool.name} on ${on_string}: log" />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
77 <data name="loOutput" format="glimmer_coords" label="${tool.name} on ${on_string}: output" />
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
78 </outputs>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
79
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
80 <tests>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
81
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
82 </tests>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
83 <help>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
84 **What it does**
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
85
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
86 This program identifies long, non-overlapping open reading frames (ORFs) in a DNA sequence file. These ORFs are very likely to contain genes, and can be used as a set of training sequences for Build-ICM. More specifically, among all ORFs longer than a minimum length, those that do not overlap any others are output. The start codon used for each ORF is the first possible one. The program, by default, automatically determines the value that maximizes the number of ORFs that are output. With the -t option, the initial set of candidate ORFs also can be filtered using entropy distance, which generally produces a larger, more accurate training set, particularly for high-GC-content genomes.
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
87
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
88
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
89 **License and citation**
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
90
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
91 This Galaxy tool is Copyright © 2013 `CRS4 Srl.`_ and is released under the `MIT license`_.
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
92
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
93 .. _CRS4 Srl.: http://www.crs4.it/
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
94 .. _MIT license: http://opensource.org/licenses/MIT
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
95
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
96 If you use this tool in Galaxy, please cite |Cuccuru2013|_.
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
97
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
98 .. |Cuccuru2013| replace:: Cuccuru, G., Orsini, M., Pinna, A., Sbardellati, A., Soranzo, N., Travaglione, A., Uva, P., Zanetti, G., Fotia, G. (2013) Orione, a web-based framework for NGS analysis in microbiology. *Submitted*
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
99 .. _Cuccuru2013: http://orione.crs4.it/
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
100
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
101 This tool uses `Glimmer`_, which is licensed separately. Please cite |Delcher2007|_.
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
102
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
103 .. _Glimmer: http://ccb.jhu.edu/software/glimmer/index.shtml
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
104 .. |Delcher2007| replace:: Delcher, A. L., Bratke, K. A., Powers, E. C., Salzberg, S. L. (2007) Identifying bacterial genes and endosymbiont DNA with Glimmer. *Bioinformatics* 23(6), 673-679
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
105 .. _Delcher2007: http://bioinformatics.oxfordjournals.org/content/23/6/673
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
106 </help>
9c8ffce71f7c Uploaded
crs4
parents:
diff changeset
107 </tool>