comparison hmmemit.xml @ 0:f48f9bbfcfd8 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/hmmer3 commit 4261b86af790a3535c0b9a8122f92225f8f67b47
author iuc
date Sat, 25 Jun 2016 15:05:37 -0400
parents
children 7b7ff4d209f7
comparison
equal deleted inserted replaced
-1:000000000000 0:f48f9bbfcfd8
1 <?xml version="1.0"?>
2 <tool id="hmmer_hmmemit" name="hmmemit" version="@WRAPPER_VERSION@.0">
3 <description>sample sequence(s) from a profile HMM</description>
4 <macros>
5 <import>macros.xml</import>
6 </macros>
7 <expand macro="requirements"/>
8 <expand macro="stdio"/>
9 <command><![CDATA[
10 hmmemit
11
12 #if $oformat.oformat_select == "fasta":
13 -N $oformat.N_fa
14 #elif $oformat.oformat_select == "aln":
15 -N $oformat.N_aln
16 -a
17 #elif $oformat.oformat_select == "mrcs":
18 -c
19 #elif $oformat.oformat_select == "mrcsf":
20 --minl $oformat.minl
21 --minu $oformat.minu
22 -C
23 #else:
24 -N $oformat.N_smp
25 -p
26 #if $oformat.L:
27 -L $oformat.L
28 #end if
29 $oformat.emission_profiles
30 #end if
31
32
33 @SEED@
34
35 $hmmfile
36 > $output
37 ]]></command>
38 <inputs>
39 <expand macro="input_hmm" />
40
41 <conditional name="oformat">
42 <param name="oformat_select" type="select" label="Output Format">
43 <option value="fasta" selected="true">Fasta</option>
44 <option value="aln">Alignment</option>
45 <option value="mrcs">Majority-Rule Concensus Sequence</option>
46 <option value="mrcsf">Fancier Concensus Sequence</option>
47 <option value="sample">Sample sequences from profile, not core model</option>
48 </param>
49 <when value="fasta">
50 <param name="N_fa" type="integer" value="1" min="1" help="(-N)"
51 label="Number of sequences to generate"/>
52 </when>
53 <when value="aln">
54 <param name="N_aln" type="integer" value="1" min="1" help="(-N)"
55 label="Number of sequences to generate"/>
56 </when>
57 <when value="mrcs">
58 </when>
59 <when value="mrcsf">
60 <param name="minl" type="float" value="0.7" help="(--minl)"
61 label="show consensus as 'any' (X/N) unless >= this fraction"/>
62 <param name="minu" type="float" value="0.2" help="(--minu)"
63 label="show consensus as upper case if >= this fraction"/>
64 </when>
65 <when value="sample">
66 <param name="N_smp" type="integer" value="1" min="1" help="(-N)"
67 label="Number of sequences to generate"/>
68 <param name="L" type="integer" optional="True" help="(-L)"
69 label="Expected length of profile"/>
70
71 <param name="emission_profiles" type="select" label="Emission profile options">
72 <option value="--local" selected="true">configure profile in multihit local mode</option>
73 <option value="--unilocal">configure profile in unilocal mode</option>
74 <option value="--glocal">configure profile in multihit glocal mode</option>
75 <option value="--uniglocal">configure profile in unihit glocal mode</option>
76 </param>
77 </when>
78 </conditional>
79
80
81 <expand macro="seed"/>
82 </inputs>
83 <outputs>
84 <data format="fasta" name="output" label="Sequences generated from $hmmfile.name">
85 <change_format>
86 <when input="oformat_select" value="aln" format="stockholm"/>
87 <!-- the rest are fasta -->
88 </change_format>
89 </data>
90 </outputs>
91 <tests>
92 <test>
93 <param name="hmmfile" value="globins4.hmm"/>
94 <param name="oformat_select" value="aln"/>
95 <param name="N_aln" value="10"/>
96 <expand macro="seed_test" />
97 <output name="output" file="globins4-emit.sto" lines_diff="4"/>
98 </test>
99 <test>
100 <param name="hmmfile" value="globins4.hmm"/>
101 <param name="oformat_select" value="fasta"/>
102 <param name="N_aln" value="10"/>
103 <expand macro="seed_test" />
104 <output name="output" file="globins4-emit-1.sto" lines_diff="4"/>
105 </test>
106 </tests>
107 <help><![CDATA[
108 @HELP_PRE@
109
110 The hmmemit program samples (emits) sequences from the profile HMM(s) in
111 hmmfile, and writes them to output. Sampling sequences may be useful for a
112 variety of purposes, including creating synthetic true positives for benchmarks
113 or tests.
114
115 The default is to sample one unaligned sequence from the core probability
116 model, which means that each sequence consists of one full-length domain.
117 Alternatively, with the -c option, you can emit a simple majority-rule
118 consensus sequence; or with the -a option, you can emit an alignment (in which
119 case, you probably also want to set -N to something other than its default of 1
120 sequence per model).
121
122 As another option, with the -p option you can sample a sequence from a fully
123 configured HMMER search profile. This means sampling a ‘homologous sequence’ by
124 HMMER’s definition, including nonhomologous flanking sequences, local
125 alignments, and multiple domains per sequence, depending on the length model
126 and alignment mode chosen for the profile.
127
128 The hmmfile may contain a library of HMMs, in which case each HMM will be used
129 in turn.
130
131 @HELP_PRE_OTH@
132
133 Output Formats
134 --------------
135
136 Several output formats are available, each with different options.
137
138 **Fasta**
139
140 Fasta option is the easiest to understand, given an input model, it will produce N sequences in fasta format from that model.
141
142 **Alignment**
143
144 Produces a stockholm alignment, of what the Fasta output would have produced.
145
146 **Majority-Rule Concensus Sequence**
147
148 Emit a plurality-rule consensus sequence, instead of sampling a sequence from
149 the profile HMM’s probability distribution. The consensus sequence is formed by
150 selecting the maximum probability residue at each match state.
151
152 **Fancier Concensus Sequence**
153
154 Emit a fancier plurality-rule consensus sequence than the -c option. If the
155 maximum probability residue has p < minl show it as a lower case ’any’ residue
156 (n or x); if p >= minl and < minu show it as a lower case residue; and if p >=
157 minu show it as an upper case residue. The default settings of minu and minl
158 are both 0.0, which means -C gives the same output as -c unless you also set
159 minu and minl to what you want.
160
161 **Sample**
162
163 Sample unaligned sequences from the implicit search profile, not from the core
164 model. The core model consists only of the homologous states (between the begin
165 and end states of a HMMER Plan7 model). The profile includes the nonhomologous
166 N, C, and J states, local/glocal and uni/multihit algorithm configuration, and
167 the target length model. Therefore sequences sampled from a profile may in-
168 clude nonhomologous as well as homologous sequences, and may contain more than
169 one homologous sequence segment. By default, the profile is in multihit local
170 mode, and the target sequence length is configured for L=400.
171
172 @ATTRIBUTION@
173 ]]></help>
174 <expand macro="citation"/>
175 </tool>