comparison progressivemauve.xml @ 1:bd1901839519 draft

planemo upload commit 94b0cd1fff0826c6db3e7dc0c91c0c5a8be8bb0c
author cpt
date Mon, 05 Jun 2023 02:46:06 +0000
parents
children faa752f96ab9
comparison
equal deleted inserted replaced
0:69795939c29b 1:bd1901839519
1 <tool id="progressivemauve" name="progressiveMauve" version="19.1.0.0" profile="16.04">
2 <description>constructs multiple genome alignments</description>
3 <macros>
4 <import>macros.xml</import>
5 <import>cpt-macros.xml</import>
6 </macros>
7 <requirements>
8 <requirement type="package">progressivemauve</requirement>
9 </requirements>
10 <command detect_errors="aggressive"><![CDATA[
11 ## Symlink files in with correct extensions
12 #for $file in '$sequences':
13 ln -s '$file' `basename '$file'`;
14 #end for
15
16 progressiveMauve
17 ## Input Options
18
19 #if $apply_backbone:
20 --apply-backbone='$apply_backbone'
21 #end if
22 --island-gap-size='$island_gap_size'
23 '$mums'
24
25 #if $seed_weight:
26 --seed-weight='$seed_weight'
27 #end if
28
29 #if $max_gapped_aligner_length:
30 --max-gapped-aligner-length='$max_gapped_aligner_length'
31 #end if
32
33 #if $match_input:
34 --match-input='$match_input'
35 #end if
36
37 '$collinear'
38 --scoring-scheme='$scoring_scheme'
39 '$no_weight_scaling'
40
41 --max-breakpoint-distance-scale='$max_breakpoint_distance_scale'
42 --conservation-distance-scale='$conservation_distance_scale'
43 '$skip_refinement'
44 '$skip_gapped_alignment'
45
46 #if $bp_dist_estimate_min_score:
47 --bp-dist-estimate-min-score='$bp_dist_estimate_min_score'
48 #end if
49
50 #if $gap_open:
51 --gap-open='$gap_open'
52 #end if
53
54 #if $gap_extend:
55 --gap-extend='$gap_extend'
56 #end if
57
58 #if $weight:
59 --weight='$weight'
60 #end if
61
62 #if $min_scaled_penalty:
63 --min-scaled-penalty='$min_scaled_penalty'
64 #end if
65
66 --hmm-p-go-homologous='$hmm_p_go_homologous'
67 --hmm-p-go-unrelated='$hmm_p_go_unrelated'
68 --hmm-identity='$hmm_identity'
69
70 '$seed_family'
71 '$solid_seeds'
72 '$coding_seeds'
73 '$no_recursion'
74 '$disable_backbone'
75
76 ## Outputs
77 --output='$output'
78 #if $output_guide_tree:
79 --output-guide-tree='$output_guide_tree_file'
80 #end if
81
82 #if $output_backbone:
83 --backbone-output='$output_backbone_file'
84 #end if
85
86 ## Sequences
87 #for file in $sequences:
88 `basename "${file}"`
89 #end for
90
91 ]]></command>
92 <inputs>
93 <param type="data" format="fasta" name="sequences" multiple="True" label="Select sequences to align" help="in fasta format"/>
94 <param type="data" format="xmfa" label="Apply Backbone" name="apply_backbone" optional="True" help="Read an existing sequence alignment in XMFA format and apply backbone statistics to it (--apply-backbone)"/>
95 <param type="integer" label="Island gap size" value="20" name="island_gap_size" help="Alignment gaps above this size in nucleotides are considered to be islands (--island-gap-size)"/>
96 <param type="boolean" truevalue="--disable-backbone" falsevalue="" name="disable_backbone" label="Disable backbone" help="Disable backbone detection (--disable-backbone)"/>
97 <param type="boolean" truevalue="True" falsevalue="" name="output_guide_tree" label="Output Guide Tree" help="Write out the guide tree used for alignment to a file (--output-guide-tree)"/>
98 <param type="boolean" truevalue="True" falsevalue="" name="output_backbone" label="Output Backbone" help="Write out the backbone to a file (--backbone-output)"/>
99 <param type="boolean" truevalue="--mums" falsevalue="" label="MUMs" name="mums" help="Find MUMs only, do not attempt to determine locally collinear blocks (LCBs) (--mums)"/>
100 <param type="integer" label="Seed weight" name="seed_weight" value="0" optional="True" help="Use the specified seed weight for calculating initial anchors (--seed-weight)"/>
101 <param type="data" format="tabular" label="Match Input" name="match_input" optional="True" help="Use specified match file instead of searching for matches (--match-input)"/>
102 <!--<param type="file" label="input-id-matrix" help="An identity matrix describing similarity among all pairs of input sequences/alignments (- -input-id-matrix)" />-->
103 <param type="integer" label="Max gapped aligner length" value="0" optional="True" name="max_gapped_aligner_length" help="Maximum number of base pairs to attempt aligning with the gapped aligner (--max-gapped-aligner-length)"/>
104 <param type="data" format="nhx" label="input-guide-tree" optional="True" name="input_guide_tree" help="A phylogenetic guide tree in Newick format that describes the order in which sequences will be aligned (--input-guide-tree)"/>
105 <param type="boolean" truevalue="--collinear" falsevalue="" label="Collinear inputs" name="collinear" help="Assume that input sequences are collinear--they have no rearrangements (--collinear)"/>
106 <param type="select" label="Scoring scheme" name="scoring_scheme" help="Selects the anchoring score function. (--scoring-scheme)">
107 <option value="sp" selected="True">Extant sum-of-pairs (sp)</option>
108 <option value="ancestral_sp">Sum-of-pairs + Ancestral (ancestral_sp)</option>
109 <option value="ancestral">Ancestral (ancestral)</option>
110 </param>
111 <param type="boolean" truevalue="--no-weight-scaling" falsevalue="" label="No weight scaling" name="no_weight_scaling" help="Don't scale LCB weights by conservation distance and breakpoint distance (--no-weight-scaling)"/>
112 <param type="float" min="0" max="1" label="max-breakpoint-distance-scale" value="0.5" name="max_breakpoint_distance_scale" help="Set the maximum weight scaling by breakpoint distance. (--max-breakpoint-distance-scale)"/>
113 <param type="float" min="0" max="1" label="conservation-distance-scale" value="0.5" name="conservation_distance_scale" help="Scale conservation distances by this amount. (--conservation-distance-scale)"/>
114 <param type="boolean" truevalue="--skip-refinement" falsevalue="" label="Skip refinement" name="skip_refinement" help="Do not perform iterative refinement (--skip-refinement)"/>
115 <param type="boolean" truevalue="--skip-gapped-alignment" falsevalue="" label="Skip gapped alignment" name="skip_gapped_alignment" help="Do not perform gapped alignment (--skip-gapped-alignment)"/>
116 <param type="integer" label="BP dist estimate min score" name="bp_dist_estimate_min_score" value="0" optional="True" help="Minimum LCB score for estimating pairwise breakpoint distance (--bp-dist-estimate-min-score)"/>
117 <param type="integer" label="Gap open" name="gap_open" value="0" optional="True" help="Gap open penalty (--gap-open)"/>
118 <param type="select" label="Repeat penalty" name="repeat_penalty" help="Sets whether the repeat scores go negative or go to zero for highly repetitive sequences. (--repeat-penalty)">
119 <option value="negative" selected="True">Negative</option>
120 <option value="zero">Zero</option>
121 </param>
122 <param type="integer" label="Gap extend" name="gap_extend" value="0" optional="True" help="Gap extend penalty (--gap-extend)"/>
123 <!--<param type="data" label="Substitution matrix" -->
124 <!--help="Nucleotide substitution matrix in NCBI format (- -substitution-matrix)" />-->
125 <param type="integer" label="Weight" name="weight" value="0" optional="True" help="Minimum pairwise LCB score (--weight)"/>
126 <param type="integer" label="Min scaled penalty" name="min_scaled_penalty" value="0" optional="True" help="Minimum breakpoint penalty after scaling the penalty by expected divergence (--min-scaled-penalty)"/>
127 <param type="float" label="HMM p go homologous" name="hmm_p_go_homologous" min="0" max="1" value="0.00001" help="Probability of transitioning from the unrelated to the homologous state (--hmm-p-go-homologous)"/>
128 <param type="float" label="HMM p go unrelated" name="hmm_p_go_unrelated" min="0" max="1" value="0.000000001" help="Probability of transitioning from the homologous to the unrelated state (--hmm-p-go-unrelated)"/>
129 <param type="float" label="HMM identity" name="hmm_identity" min="0" max="1" value="0.7" help="Expected level of sequence identity among pairs of sequences(--hmm-identity)"/>
130 <param type="boolean" truevalue="--seed-family" falsevalue="" label="Seed family" name="seed_family" help="Use a family of spaced seeds to improve sensitivity (--seed-family)"/>
131 <param type="boolean" truevalue="--solid-seeds" falsevalue="" label="Solid seeds" name="solid_seeds" help="Use solid seeds. Do not permit substitutions in anchor matches. (--solid-seeds)"/>
132 <param type="boolean" truevalue="--coding-seeds" falsevalue="" label="Coding seeds" name="coding_seeds" help="Use coding pattern seeds. Useful to generate matches coding regions with 3rd codon position degeneracy. (--coding-seeds)"/>
133 <param type="boolean" truevalue="--no-recursion" falsevalue="" label="No recursion" name="no_recursion" help="Disable recursive anchor search (--no-recursion)"/>
134 </inputs>
135 <outputs>
136 <data format="xmfa" name="output" label="${tool.name} alignment of ${on_string}">
137 <change_format>
138 <when input="mums" value="--mums" format="tabular"/>
139 </change_format>
140 </data>
141 <data format="nhx" name="output_guide_tree_file" label="${tool.name} alignment of ${on_string}: Guide tree">
142 <filter>output_guide_tree</filter>
143 </data>
144 <data format="tabular" name="output_backbone_file" label="${tool.name} alignment of ${on_string}: Backbone">
145 <filter>output_backbone</filter>
146 </data>
147 </outputs>
148 <tests>
149 <test>
150 <param name="sequences" value="phagey.fa,karma.fa"/>
151 <output name="output" file="1.xmfa" lines_diff="20"/>
152 </test>
153 <test>
154 <param name="sequences" value="merged.fa"/>
155 <output name="output" file="2.xmfa" lines_diff="20"/>
156 </test>
157 <test>
158 <param name="sequences" value="merged.fa"/>
159 <param name="output_guide_tree" value="True"/>
160 <output name="output" file="3.xmfa" lines_diff="20"/>
161 <output name="output_guide_tree_file" file="3.nhx"/>
162 </test>
163 <test>
164 <param name="sequences" value="merged.fa"/>
165 <param name="mums" value="True"/>
166 <output name="output" file="4.mums" compare="sim_size" delta="1000"/>
167 </test>
168 <test>
169 <param name="sequences" value="merged.fa"/>
170 <param name="match_input" value="4.mums"/>
171 <output name="output" file="5.xmfa" lines_diff="24"/>
172 </test>
173 </tests>
174 <help><![CDATA[
175 What it does
176 ============
177
178 Mauve is a system for efficiently constructing multiple genome alignments in
179 the presence of large-scale evolutionary events such as rearrangement and
180 inversion. Multiple genome alignment provides a basis for research into
181 comparative genomics and the study of evolutionary dynamics. Aligning whole
182 genomes is a fundamentally different problem than aligning short sequences.
183
184 Mauve has been developed with the idea that a multiple genome aligner should
185 require only modest computational resources. It employs algorithmic techniques
186 that scale well in the amount of sequence being aligned. For example, a pair of
187 Y. pestis genomes can be aligned in under a minute, while a group of 9
188 divergent Enterobacterial genomes can be aligned in a few hours.
189
190
191 Example Usage
192 =============
193
194 +-----------------------------------+-------------+
195 | Usage | Notes |
196 +===================================+=============+
197 | Align genomes |Simply |
198 | |select as |
199 | |many fasta |
200 | |files with |
201 | |one or more |
202 | |sequences as |
203 | |necessary |
204 +-----------------------------------+-------------+
205 | Align genomes but also save |Use the |
206 | the guide tree and produce a |**Output |
207 | backbone file |Guide Tree** |
208 | |and **Output |
209 | |Backbone** |
210 | |options |
211 +-----------------------------------+-------------+
212 | Align genomes, but do not |Use the |
213 | detect forced alignment of |**Disable |
214 | unrelated sequences |backbone** |
215 | |option |
216 +-----------------------------------+-------------+
217 | Detect forced alignment of |Use the |
218 | unrelated sequence in the |**Apply |
219 | alignment produced |Backbone** |
220 | in previous example, use |option and |
221 | custom Homology HMM transition |specify the |
222 | parameters. |XMFA file |
223 | |produced |
224 | |in the |
225 | |previous |
226 | |example |
227 +-----------------------------------+-------------+
228 | Compute ungapped |Use the |
229 | local-multiple alignments among |**MUMs** |
230 | the input sequences |option |
231 +-----------------------------------+-------------+
232 | Compute an alignment of the |Set the |
233 | same genomes, using previously |**Match |
234 | computed local-multiple |Input** to |
235 | alignments |the tabular |
236 | |MUMs file |
237 | |produced in |
238 | |the previous |
239 | |example |
240 +-----------------------------------+-------------+
241 | Set a minimum scaled |Use the |
242 | breakpoint penalty to cope with |**Min Scaled |
243 | the case where most genomes |Penalty** and|
244 | are aligned correctly, but manual |set to a |
245 | inspection reveals that |value like |
246 | a divergent genome has too |5000 |
247 | many predicted rearrangements. | |
248 +-----------------------------------+-------------+
249 | Globally align a set of |Use the |
250 | collinear virus |**Colinear**,|
251 | genomes, using seed families |**Seed |
252 | to improve anchoring sensitivity |Family** |
253 | in regions below 70% sequence |options |
254 | identity. | |
255 +-----------------------------------+-------------+
256
257 ]]></help>
258 <citations>
259 <expand macro="citation/progressive_mauve"/>
260 <expand macro="citation/mijalisrasche"/>
261 </citations>
262 </tool>