annotate glimmer_build-icm.xml @ 2:b1ad88bbc5fa draft default tip

Uploaded
author bgruening
date Mon, 12 Aug 2013 11:55:07 -0400
parents 841357e0acbf
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
841357e0acbf Uploaded
bgruening
parents:
diff changeset
1 <tool id="glimmer_build-icm" name="Glimmer ICM builder" version="0.2">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
2 <description></description>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
3 <requirements>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
4 <requirement type="package" version="3.02b">glimmer</requirement>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
5 </requirements>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
6 <command>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
7 build-icm
841357e0acbf Uploaded
bgruening
parents:
diff changeset
8 --depth $depth
841357e0acbf Uploaded
bgruening
parents:
diff changeset
9 #if $no_stops:
841357e0acbf Uploaded
bgruening
parents:
diff changeset
10 --no_stops
841357e0acbf Uploaded
bgruening
parents:
diff changeset
11 #end if
841357e0acbf Uploaded
bgruening
parents:
diff changeset
12 --period $period
841357e0acbf Uploaded
bgruening
parents:
diff changeset
13 --width $width
841357e0acbf Uploaded
bgruening
parents:
diff changeset
14
841357e0acbf Uploaded
bgruening
parents:
diff changeset
15 #if $stop_codon_opts.stop_codon_opts_selector == "gb":
841357e0acbf Uploaded
bgruening
parents:
diff changeset
16 --trans_table "${stop_codon_opts.genbank_gencode}"
841357e0acbf Uploaded
bgruening
parents:
diff changeset
17 #else:
841357e0acbf Uploaded
bgruening
parents:
diff changeset
18 --stop_codons "${stop_codon_opts.stop_codons}"
841357e0acbf Uploaded
bgruening
parents:
diff changeset
19 #end if
841357e0acbf Uploaded
bgruening
parents:
diff changeset
20
841357e0acbf Uploaded
bgruening
parents:
diff changeset
21 $outfile &lt; $infile 2>&#38;1;
841357e0acbf Uploaded
bgruening
parents:
diff changeset
22 </command>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
23 <inputs>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
24 <param name="infile" type="data" format="fasta" label="Trainings Dataset" help="A set of known genes in FASTA format." />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
25 <param name="depth" type="integer" value="7" label="Set the depth of the ICM" help="The depth is the maximum number of positions in the context window that will be used to determine the probability of the predicted position." />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
26 <param name="period" type="integer" value="3" label="Set the period of the ICM" help="The period is the number of different submodels for different positions in the text in a cyclic pattern. E.g., if the period is 3, the first submodel will determine positions 1, 4, 7, ..." />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
27 <param name="width" type="integer" value="12" label="Set the width of the ICM" help="The width includes the predicted position." />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
28 <param name="no_stops" type="boolean" truevalue="--no_stops" falsevalue="" checked="false" label="Do not use any input strings with in-frame stop codons" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
29
841357e0acbf Uploaded
bgruening
parents:
diff changeset
30 <conditional name="stop_codon_opts">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
31 <param name="stop_codon_opts_selector" type="select" label="Specify start codons as">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
32 <option value="gb" selected="True">Genbank translation table entry</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
33 <option value="free_form">Comma-separated list</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
34 </param>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
35 <when value="gb">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
36 <param name="genbank_gencode" type="select" label="Use Genbank translation table to specify stop codons">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
37 <option value="1" select="True">1. Standard</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
38 <option value="2">2. Vertebrate Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
39 <option value="3">3. Yeast Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
40 <option value="4">4. Mold, Protozoan, and Coelenterate Mitochondrial Code and the Mycoplasma/Spiroplasma Code</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
41 <option value="5">5. Invertebrate Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
42 <option value="6">6. Ciliate, Dasycladacean and Hexamita Nuclear Code</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
43 <option value="9">9. Echinoderm Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
44 <option value="10">10. Euplotid Nuclear</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
45 <option value="11">11. Bacteria and Archaea</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
46 <option value="12">12. Alternative Yeast Nuclear</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
47 <option value="13">13. Ascidian Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
48 <option value="14">14. Flatworm Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
49 <option value="15">15. Blepharisma Macronuclear</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
50 <option value="16">16. Chlorophycean Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
51 <option value="21">21. Trematode Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
52 <option value="22">22. Scenedesmus obliquus mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
53 <option value="23">23. Thraustochytrium Mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
54 <option value="24">24. Pterobranchia mitochondrial</option>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
55 </param>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
56 </when>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
57 <when value="free_form">
841357e0acbf Uploaded
bgruening
parents:
diff changeset
58 <param name="stop_codons" type="text" value="tag,tga,taa" label="Specify stop codons as a comma-separated list" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
59 </when>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
60 </conditional>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
61 </inputs>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
62 <outputs>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
63 <data format="data" name="outfile" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
64 </outputs>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
65 <tests>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
66 <test>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
67 <param name="infile" value='streptomyces_Tu6071_plasmid_genes.fasta' />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
68 <param name="depth" value="7" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
69 <param name="period" value="3" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
70 <param name="width" value="12" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
71 <param name="no_stops" value="" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
72 <param name="genbank_gencode" value="11" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
73 <!-- compare files sizes, because the output is a binary -->
841357e0acbf Uploaded
bgruening
parents:
diff changeset
74 <output name="outfile" file='streptomyces_Tu6071_plasmid_genes.icm' compare="sim_size" delta="1000" ftype="data" />
841357e0acbf Uploaded
bgruening
parents:
diff changeset
75 </test>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
76 </tests>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
77
841357e0acbf Uploaded
bgruening
parents:
diff changeset
78 <help>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
79
841357e0acbf Uploaded
bgruening
parents:
diff changeset
80 **What it does**
841357e0acbf Uploaded
bgruening
parents:
diff changeset
81
841357e0acbf Uploaded
bgruening
parents:
diff changeset
82 This program constructs an interpolated context model (ICM) from an input set of sequences.
841357e0acbf Uploaded
bgruening
parents:
diff changeset
83
841357e0acbf Uploaded
bgruening
parents:
diff changeset
84 This model can be used by Glimmer3 to predict genes.
841357e0acbf Uploaded
bgruening
parents:
diff changeset
85
841357e0acbf Uploaded
bgruening
parents:
diff changeset
86 **TIP** To extract CDS from a GenBank file use the tool *Extract ORF from a GenBank file*.
841357e0acbf Uploaded
bgruening
parents:
diff changeset
87
841357e0acbf Uploaded
bgruening
parents:
diff changeset
88 -----
841357e0acbf Uploaded
bgruening
parents:
diff changeset
89
841357e0acbf Uploaded
bgruening
parents:
diff changeset
90 **Example**
841357e0acbf Uploaded
bgruening
parents:
diff changeset
91
841357e0acbf Uploaded
bgruening
parents:
diff changeset
92 *Input*::
841357e0acbf Uploaded
bgruening
parents:
diff changeset
93
841357e0acbf Uploaded
bgruening
parents:
diff changeset
94 - Genome Sequence
841357e0acbf Uploaded
bgruening
parents:
diff changeset
95
841357e0acbf Uploaded
bgruening
parents:
diff changeset
96 >CELF22B7 C.aenorhabditis elegans (Bristol N2) cosmid F22B7
841357e0acbf Uploaded
bgruening
parents:
diff changeset
97 GATCCTTGTAGATTTTGAATTTGAAGTTTTTTCTCATTCCAAAACTCTGT
841357e0acbf Uploaded
bgruening
parents:
diff changeset
98 GATCTGAAATAAAATGTCTCAAAAAAATAGAAGAAAACATTGCTTTATAT
841357e0acbf Uploaded
bgruening
parents:
diff changeset
99 TTATCAGTTATGGTTTTCAAAATTTTCTGACATACCGTTTTGCTTCTTTT
841357e0acbf Uploaded
bgruening
parents:
diff changeset
100 TTTCTCATCTTCTTCAAATATCAATTGTGATAATCTGACTCCTAACAATC
841357e0acbf Uploaded
bgruening
parents:
diff changeset
101 GAATTTCTTTTCCTTTTTCTTTTTCCAACAACTCCAGTGAGAACTTTTGA
841357e0acbf Uploaded
bgruening
parents:
diff changeset
102 ATATCTTCAAGTGACTTCACCACATCAGAAGGTGTCAACGATCTTGTGAG
841357e0acbf Uploaded
bgruening
parents:
diff changeset
103 AACATCGAATGAAGATAATTTTAATTTTAGAGTTACAGTTTTTCCTCCGA
841357e0acbf Uploaded
bgruening
parents:
diff changeset
104 CAATTCCTGATTTACGAACATCTTCTTCAAGCATTCTACAGATTTCTTGA
841357e0acbf Uploaded
bgruening
parents:
diff changeset
105 TGCTCTTCTAGGAGGATGTTGAAATCCGAAGTTGGAGAAAAAGTTCTCTC
841357e0acbf Uploaded
bgruening
parents:
diff changeset
106 AACTGAAATGCTTTTTCTTCGTGGATCCGATTCAGATGGACGACCTGGCA
841357e0acbf Uploaded
bgruening
parents:
diff changeset
107 GTCCGAGAGCCGTTCGAAGGAAAGATTCTTGTGAGAGAGGCGTGAAACAC
841357e0acbf Uploaded
bgruening
parents:
diff changeset
108 AAAGGGTATAGGTTCTTCTTCAGATTCATATCACCAACAGTTTGAATATC
841357e0acbf Uploaded
bgruening
parents:
diff changeset
109 CATTGCTTTCAGTTGAGCTTCGCATACACGACCAATTCCTCCAACCTAAA
841357e0acbf Uploaded
bgruening
parents:
diff changeset
110 AAATTATCTAGGTAAAACTAGAAGGTTATGCTTTAATAGTCTCACCTTAC
841357e0acbf Uploaded
bgruening
parents:
diff changeset
111 GAATCGGTAAATCCTTCAAAAACTCCATAATCGCGTTTTTATCATTTTCT
841357e0acbf Uploaded
bgruening
parents:
diff changeset
112 .....
841357e0acbf Uploaded
bgruening
parents:
diff changeset
113
841357e0acbf Uploaded
bgruening
parents:
diff changeset
114 *Output*::
841357e0acbf Uploaded
bgruening
parents:
diff changeset
115 interpolated context model (ICM)
841357e0acbf Uploaded
bgruening
parents:
diff changeset
116
841357e0acbf Uploaded
bgruening
parents:
diff changeset
117 -------
841357e0acbf Uploaded
bgruening
parents:
diff changeset
118
841357e0acbf Uploaded
bgruening
parents:
diff changeset
119 **References**
841357e0acbf Uploaded
bgruening
parents:
diff changeset
120
841357e0acbf Uploaded
bgruening
parents:
diff changeset
121 A.L. Delcher, K.A. Bratke, E.C. Powers, and S.L. Salzberg. Identifying bacterial genes and endosymbiont DNA with Glimmer. Bioinformatics (Advance online version) (2007).
841357e0acbf Uploaded
bgruening
parents:
diff changeset
122
841357e0acbf Uploaded
bgruening
parents:
diff changeset
123
841357e0acbf Uploaded
bgruening
parents:
diff changeset
124 </help>
841357e0acbf Uploaded
bgruening
parents:
diff changeset
125 </tool>