annotate lastz_wrapper.xml @ 1:a36c081e0043 draft

Updated functional test definition to reference data copied to the test data repository.
author devteam
date Wed, 20 Mar 2013 15:16:31 -0400
parents 0801f8207d30
children 12d4359b7e2f
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
1 <tool id="lastz_wrapper_2" name="Lastz" version="1.2.2">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
2 <requirements>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
3 <requirement type="package" version="1.02.00">lastz</requirement>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
4 </requirements>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
5 <description> map short reads against reference sequence</description>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
6 <command interpreter="python">lastz_wrapper.py
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
7 #if $seq_name.how_to_name=="yes":
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
8 --ref_name=$seq_name.ref_name
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
9 #end if
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
10 --ref_source=$source.ref_source
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
11 --source_select=$params.source_select
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
12 --out_format=$out_format
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
13 --input2=$input2
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
14 #if $source.ref_source=="history":
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
15 --input1=$source.input1
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
16 --ref_sequences=$input1.metadata.sequences
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
17 #else:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
18 --input1="${source.input1_2bit.fields.path}"
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
19 --ref_sequences="None"
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
20 #end if
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
21 #if $params.source_select=="pre_set":
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
22 --pre_set_options=${params.pre_set_options}
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
23 #else:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
24 --strand=$params.strand
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
25 --seed=$params.seed
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
26 --gfextend=$params.gfextend
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
27 --chain=$params.chain
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
28 --transition="$params.transition"
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
29 --O=$params.O
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
30 --E=$params.E
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
31 --X=$params.X
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
32 --Y=$params.Y
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
33 --K=$params.K
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
34 --L=$params.L
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
35 --entropy=$params.entropy
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
36 #end if
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
37 --identity_min=$min_ident
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
38 --identity_max=$max_ident
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
39 --coverage=$min_cvrg
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
40 --output=$output1
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
41 --unmask=$unmask
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
42 --lastzSeqsFileDir=${GALAXY_DATA_INDEX_DIR}
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
43 </command>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
44 <inputs>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
45 <param name="input2" format="fasta" type="data" label="Align sequencing reads in" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
46 <conditional name="source">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
47 <param name="ref_source" type="select" label="Against reference sequences that are">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
48 <option value="cached">locally cached</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
49 <option value="history">in your history</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
50 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
51 <when value="cached">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
52 <param name="input1_2bit" type="select" label="Using reference genome" help="If your genome of interest is not listed, contact the Galaxy team">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
53 <options from_data_table="lastz_seqs" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
54 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
55 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
56 <when value="history">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
57 <param name="input1" type="data" format="fasta" label="Select a reference dataset" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
58 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
59 </conditional>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
60 <param name="out_format" type="select" label="Output format">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
61 <option value="sam">SAM</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
62 <option value="diffs">Polymorphisms</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
63 <option value="tabular">Tabular</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
64 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
65 <conditional name="params">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
66 <param name="source_select" type="select" label="Lastz settings to use" help="For most mapping needs use Commonly used settings. If you want full control use Full List">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
67 <option value="pre_set">Commonly used</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
68 <option value="full">Full Parameter List</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
69 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
70 <when value="pre_set">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
71 <param name="pre_set_options" type="select" label="Select mapping mode">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
72 <option value="yasra98">Roche-454 98% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
73 <option value="yasra95">Roche-454 95% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
74 <option value="yasra90">Roche-454 90% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
75 <option value="yasra85">Roche-454 85% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
76 <option value="yasra75">Roche-454 75% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
77 <option value="yasra95short">Illumina 95% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
78 <option value="yasra85short">Illumina 85% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
79 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
80 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
81 <when value="full">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
82 <param name="strand" type="select" label="Which strand to search?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
83 <option value="both">Both</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
84 <option value="plus">Search forward strand only (the one in the reference)</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
85 <option value="minus">Search the reverse complement strand only (opposite of the reference)</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
86 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
87 <param name="seed" type="select" label="Select seeding settings" help="allows you to set word size and number of mismatches">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
88 <option value="12of19">Seed hits require a 19 bp word with matches in 12 specific positions</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
89 <option value="14of22">Seed hits require a 22 bp word with matches in 14 specific positions</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
90 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
91 <param name="transition" type="select" label="Select transition settings" help="affects the number of allowed transition substitutions">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
92 <option value="transition">Allow one transition in each seed hit</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
93 <option value="transition=2">Allow two transitions in a seed hit </option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
94 <option value="notransition">Don't allow any transitions in seed hits</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
95 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
96 <param name="gfextend" type="select" label="Perform gap-free extension of seed hits to HSPs (high scoring segment pairs)?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
97 <option value="nogfextend">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
98 <option value="gfextend">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
99 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
100 <param name="chain" type="select" label="Perform chaining of HSPs?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
101 <option value="nochain">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
102 <option value="chain">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
103 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
104 <param name="O" type="integer" size="5" value="400" label="Gap opening penalty"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
105 <param name="E" type="integer" size="5" value="30" label="Gap extension penalty"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
106 <param name="X" type="integer" size="5" value="910" label="X-drop threshold"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
107 <param name="Y" type="integer" size="5" value="9370" label="Y-drop threshold"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
108 <param name="K" type="integer" size="5" value="3000" label="Set the threshold for HSPs (ungapped extensions scoring lower are discarded)"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
109 <param name="L" type="integer" size="5" value="3000" label="Set the threshold for gapped alignments (gapped extensions scoring lower are discarded)"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
110 <param name="entropy" type="select" label="Involve entropy when filtering HSPs?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
111 <option value="noentropy">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
112 <option value="entropy">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
113 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
114 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
115 </conditional>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
116 <conditional name="seq_name">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
117 <param name="how_to_name" type="select" label="Do you want to modify the reference name?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
118 <option value="no">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
119 <option value="yes">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
120 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
121 <when value="yes">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
122 <param name="ref_name" type="text" size="25" value="Type sequence name here" label="Enter name for the Reference sequence"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
123 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
124 <when value="no" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
125 </conditional>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
126 <param name="min_ident" type="integer" size="3" value="0" label="Do not report matches below this identity (%)"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
127 <param name="max_ident" type="integer" size="3" value="100" label="Do not report matches above this identity (%)"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
128 <param name="min_cvrg" type="integer" size="3" value="0" label="Do not report matches that cover less than this percentage of each read"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
129 <param name="unmask" type="select" label="Convert lowercase bases to uppercase">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
130 <option value="yes">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
131 <option value="no">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
132 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
133 </inputs>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
134 <outputs>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
135 <data format="tabular" name="output1" label="${tool.name} on ${on_string}: mapped reads">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
136 <change_format>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
137 <when input="out_format" value="sam" format="sam" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
138 </change_format>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
139 </data>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
140 </outputs>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
141 <tests>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
142 <test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
143 <!--
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
144 Lastz command:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
145 lastz phiX.2bit/phiX174[nickname=Ref] test-data/b1.fasta +nogfextend +nochain +gapped +strand=both +seed=12of19 +transition O=400 E=30 X=910 Y=9370 K=3000 L=3000 +noentropy +ambiguousn +nolaj +identity=0..100 +coverage=0 +format=sam- > lastz_wrapper_out2.sam
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
146 You need to point to phiX.2bit somewhere on your system. b1.fasta is located in galaxy's test-data. You will have to replace all the pluses before the
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
147 commands with 2 dashes, as double-dash can't appear in an XML comment.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
148 -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
149 <param name="input2" value="b1.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
150 <param name="ref_source" value="cached" />
1
a36c081e0043 Updated functional test definition to reference data copied to the test data repository.
devteam
parents: 0
diff changeset
151 <param name="input1_2bit" value="phiX174" />
0
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
152 <param name="out_format" value="sam" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
153 <param name="source_select" value="full" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
154 <param name="strand" value="both" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
155 <param name="seed" value="12of19" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
156 <param name="transition" value="transition" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
157 <param name="gfextend" value="nogfextend" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
158 <param name="chain" value="nochain" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
159 <param name="O" value="400" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
160 <param name="E" value="30" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
161 <param name="X" value="910" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
162 <param name="Y" value="9370" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
163 <param name="K" value="3000" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
164 <param name="L" value="3000" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
165 <param name="entropy" value="noentropy" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
166 <!--
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
167 how_to_name is not the default. It is changed to modify
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
168 input1_2bit by adding the ref_name as a nickname
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
169 -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
170 <param name="how_to_name" value="yes" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
171 <param name="ref_name" value="Ref" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
172 <param name="min_ident" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
173 <param name="max_ident" value="100" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
174 <param name="min_cvrg" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
175 <param name="unmask" value="yes" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
176 <output name="output1" file="lastz_wrapper_out2.sam" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
177 </test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
178 <test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
179 <!--
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
180 Lastz command:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
181 lastz test-data/phiX.fasta test-data/b1.fasta[fullnames] +yasra95short +ambiguousn +nolaj +identity=0..100 +coverage=0 +format=diffs > lastz_wrapper_out3.tabular
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
182 phiX.fasta and b1.fasta are located in galaxy's test-data. You will have to replace all the pluses before the commands with 2 dashes,
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
183 as double-dash can't appear in an XML comment.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
184 -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
185 <param name="input2" value="b1.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
186 <param name="ref_source" value="history" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
187 <param name="input1" value="phiX.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
188 <param name="out_format" value="diffs" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
189 <param name="source_select" value="pre_set" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
190 <param name="pre_set_options" value="yasra95short" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
191 <param name="how_to_name" value="no" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
192 <param name="min_ident" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
193 <param name="max_ident" value="100" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
194 <param name="min_cvrg" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
195 <param name="unmask" value="yes" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
196 <output name="output1" file="lastz_wrapper_out3.tabular" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
197 </test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
198 <test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
199 <!--
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
200 Lastz command: first you will need to split the file phiX_split.fasta into two files,
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
201 phiX1.fasta and phiX2.fasta, each with 1 sequence (phiX1 and phiX2, respectively). Then:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
202 lastz phiX1.fasta test-data/b1.fasta *yasra95short *ambiguousn *nolaj *identity=0..100 *coverage=0 *format=general-:score,name1,strand1,size1,start1,zstart1,end1,length1,text1,name2,strand2,size2,start2,zstart2,end2,start2+,zstart2+,end2+,length2,text2,diff,cigar,identity,coverage,gaprate,diagonal,shingle > lastz_wrapper_out4.tabular
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
203 lastz phiX2.fasta test-data/b1.fasta *yasra95short *ambiguousn *nolaj *identity=0..100 *coverage=0 *format=general-:score,name1,strand1,size1,start1,zstart1,end1,length1,text1,name2,strand2,size2,start2,zstart2,end2,start2+,zstart2+,end2+,length2,text2,diff,cigar,identity,coverage,gaprate,diagonal,shingle >> lastz_wrapper_out4.tabular
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
204 You need to point to phiX1.fasta and phiX2.fasta somewhere on your system.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
205 phiX_split.fasta and b1.fasta are located in galaxy's test-data
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
206 You will have to replace all the asterisks before the commands with 2 dashes,
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
207 as double-dash can't appear in an XML comment
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
208
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
209 NOTE: since the input file includes more than 1 sequence, the output must be sorted in
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
210 order for the functional test to pass. This is done using the sort="True" attribute on the output.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
211 -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
212 <param name="input2" value="b1.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
213 <param name="ref_source" value="history" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
214 <param name="input1" value="phiX_split.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
215 <param name="out_format" value="tabular" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
216 <param name="source_select" value="pre_set" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
217 <param name="pre_set_options" value="yasra95short" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
218 <param name="how_to_name" value="no" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
219 <param name="min_ident" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
220 <param name="max_ident" value="100" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
221 <param name="min_cvrg" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
222 <param name="unmask" value="yes" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
223 <output name="output1" file="lastz_wrapper_out4.tabular" sort="True" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
224 </test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
225 </tests>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
226 <help>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
227
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
228 **What it does**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
229
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
230 **LASTZ** is a high performance pairwise sequence aligner derived from BLASTZ. It is written by Bob Harris in Webb Miller's laboratory at Penn State University. Special scoring sets were derived to improve runtime performance and quality. This Galaxy version of LASTZ is geared towards aligning short (Illumina/Solexa, AB/SOLiD) and medium (Roche/454) reads against a reference sequence. There is excellent, extensive documentation on LASTZ available here_.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
231
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
232 .. _here: http://www.bx.psu.edu/miller_lab/dist/README.lastz-1.02.00/README.lastz-1.02.00.html
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
233
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
234 ------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
235
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
236 **Input formats**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
237
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
238 LASTZ accepts the reference and reads in FASTA format. However, because Galaxy supports implicit format conversion, the tool will recognize fastq and other method-specific formats.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
239
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
240 ------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
241
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
242 **Outputs**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
243
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
244 LASTZ generates one output. Depending on the choice you make in the *Output format* drop-down, LASTZ will produce a SAM file showing sequence alignments, a list of differences between the reads and reference (Polymorphisms), or a general table with one line per alignment block (Tabular). Examples of these outputs are shown below.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
245
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
246 **SAM output**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
247
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
248 SAM has 12 columns::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
249
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
250 1 2 3 4 5 6 7 8 9 10 11 12
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
251 ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
252 HWI-EAS91_1_30788AAXX:1:2:1670:915 99 chr9 58119878 60 36M = 58120234 392 GACCCCTACCCCACCGTGCTCTGGATCTCAGTGTTT IIIIIIIIIIIIIIIIEIIIIIII7IIIIIIIIIII XT:A:U NM:i:0 SM:i:37 AM:i:37 X0:i:1 X1:i:0 XM:i:0 XO:i:0 XG:i:0 MD:Z:36
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
253 HWI-EAS91_1_30788AAXX:1:2:1670:915 147 chr9 58120234 60 36M = 58119878 -392 ATGAGTCGAATTCTATTTTCCAAACTGTTAACAAAA IFIIDI;IIICIIIIIIIIIIIIIIIIIIIIIIIII XT:A:U NM:i:0 SM:i:37 AM:i:37 X0:i:1 X1:i:0 XM:i:0 XO:i:0 XG:i:0 MD:Z:36
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
254
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
255
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
256 where::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
257
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
258 Column Description
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
259 --------- ---------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
260 1. QNAME Query (pair) NAME
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
261 2. FLAG bitwise FLAG
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
262 3. RNAME Reference sequence NAME
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
263 4. POS 1-based leftmost POSition/coordinate of clipped sequence
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
264 5. MAPQ MAPping Quality (Phred-scaled)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
265 6. CIGAR extended CIGAR string
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
266 7. MRNM Mate Reference sequence NaMe ('=' if same as RNAME)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
267 8. MPOS 1-based Mate POSition
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
268 9. ISIZE Inferred insert SIZE
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
269 10. SEQ query SEQuence on the same strand as the reference
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
270 11. QUAL query QUALity (ASCII-33 gives the Phred base quality)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
271 12. OPT variable OPTional fields in the format TAG:VTYPE:VALUE, tab-separated
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
272
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
273 The flags are as follows::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
274
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
275 Flag Description
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
276 ------ -------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
277 0x0001 the read is paired in sequencing
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
278 0x0002 the read is mapped in a proper pair
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
279 0x0004 the query sequence itself is unmapped
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
280 0x0008 the mate is unmapped
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
281 0x0010 strand of the query (1 for reverse)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
282 0x0020 strand of the mate
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
283 0x0040 the read is the first read in a pair
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
284 0x0080 the read is the second read in a pair
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
285 0x0100 the alignment is not primary
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
286
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
287 **Polymorphism (SNP or differences) output**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
288
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
289 Polymorphism output contains 14 columns::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
290
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
291 1 2 3 4 5 6 7 8 9 10 11 12 13 14
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
292 --------------------------------------------------------------------------------------------------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
293 chrM 2490 2491 + 5386 HWI-EAS91_1_306UPAAXX:6:1:486:822 10 11 - 36 C A ACCTGTTTTACAGACACCTAAAGCTACATCGTCAAC ACCTGTTTTAAAGACACCTAAAGCTACATCGTCAAC
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
294 chrM 2173 2174 + 5386 HWI-EAS91_1_306UPAAXX:6:1:259:1389 26 27 + 36 G T GCGTACTTATTCGCCACCATGATTATGACCAGTGTT GCGTACTTATTCGCCACCATGATTATTACCAGTGTT
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
295
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
296 where::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
297
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
298 1. (chrM) - Reference sequence id
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
299 2. (2490) - Start position of the difference in the reference
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
300 3. (2491) - End position of the difference in the reference
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
301 4. (+) - Strand of the reference (always plus)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
302 5. (5386) - Length of the reference sequence
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
303 6. (HWI...) - read id
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
304 7. (10) - Start position of the difference in the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
305 8. (11) - End position of the difference in the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
306 9. (-) - Strand of the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
307 10. (36) - Length of the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
308 11. (C) - Nucleotide in the reference
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
309 12. (A) - Nucleotide in the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
310 13. (ACC...) - Reference side of the alignment
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
311 14. (ACC...) - Read side of the alignment
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
312
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
313 **Tabular output**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
314
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
315 Tabular output is a tab-separated format with 30 columns::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
316
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
317 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
318 -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
319 14 PHIX174 + 5386 4648 4647 4661 14 ATTTTCGTGATATT EYKX4VC01BV8HS + 204 154 153 167 154 153 167 14 ATTTTCGTGATATT .............. 14M 14/14 100.0% 14/204 6.9% 0/14 0.0% 4494 NA
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
320 16 PHIX174 + 5386 3363 3362 3378 16 GACGCCGGATTTGAGA EYKX4VC01AWJ88 - 259 36 35 51 209 208 224 16 GACGCCGGATTTGAGA ................ 16M 16/16 100.0% 16/259 6.2% 0/16 0.0% 3327 NA
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
321
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
322 The following columns are present::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
323
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
324 Field Meaning
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
325 ---------------- -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
326 1. score Score of the alignment block. The scale and meaning of this number will vary, depending on the final stage performed and other command-line options.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
327 2. name1 Name of the target sequence.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
328 3. strand1 Target sequence strand, either "+" or "−".
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
329 4. size1 Size of the entire target sequence.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
330 5. start1 Starting position of the alignment block in the target, origin-one.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
331 6. zstart1 Starting position of the alignment block in the target, origin-zero.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
332 7. end1 Ending position of the alignment block in the target, expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
333 8. length1 Length of the alignment block in the target (excluding gaps).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
334 9. text1 Aligned characters in the target, including gap characters.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
335 10. name2 Name of the query sequence.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
336 11. strand2 Query sequence strand, either "+" or "−".
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
337 12. size2 Size of the entire query sequence.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
338 13. start2 Starting position of the alignment block in the query, origin-one.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
339 14. zstart2 Starting position of the alignment block in the query, origin-zero.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
340 15. end2 Ending position of the alignment block in the query, expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
341 16. start2+ Starting position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), origin-one. Note that if strand2 is "−", then this is the other end of the block from start2.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
342 17. zstart2+ Starting position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), origin-zero. Note that if strand2 is "−", then this is the other end of the block from zstart2.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
343 18. end2+ Ending position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems). Note that if strand2 is "−", then this is the other end of the block from end2.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
344 19. length2 Length of the alignment block in the query (excluding gaps).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
345 20. text2 Aligned characters in the query, including gap characters.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
346 21. diff Differences between what would be written for text1 and text2. Matches are written as . (period), transitions as : (colon), transversions as X, and gaps as - (hyphen).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
347 22. cigar A CIGAR-like representation of the alignment's path through the Dynamic Programming matrix. This is the short representation, without spaces, described in the Ensembl CIGAR specification.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
348 23./24. identity Fraction of aligned bases in the block that are matches (see Identity). This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;. The second field contains the same value, computed as a percentage.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
349 25./26. coverage Fraction of the entire input sequence (target or query, whichever is shorter) that is covered by the alignment block (see Coverage). This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;. The second field contains the same value, computed as a percentage.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
350 27./28. gaprate Rate of gaps (also called indels) in the alignment block. This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;, with the numerator being the number of alignment columns containing gaps and the denominator being the number without gaps. The second field contains the same value, computed as a percentage.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
351 29. diagonal The diagonal of the start of the alignment block in the dynamic programming matrix, expressed as an identifying number start1-start2.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
352 30. shingle A measurement of the shingle overlap between the target and the query. This is intended for the case where both the target and query are relatively short, and their ends are expected to overlap.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
353
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
354 -------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
355
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
356 **LASTZ Settings**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
357
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
358 There are two setting modes: (1) **Commonly used settings** and (2) **Full Parameter List**.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
359
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
360 **Commonly used settings**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
361
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
362 There are seven modes::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
363
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
364 Illumina-Solexa/AB-SOLiD 95% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
365 Illumina-Solexa/AB-SOLiD 85% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
366 Roche-454 98% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
367 Roche-454 95% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
368 Roche-454 90% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
369 Roche-454 85% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
370 Roche-454 75% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
371
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
372 When deciding which one to use, consider the following: a 36 bp read with two differences will be 34/36 = 94% identical to the reference.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
373
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
374 **Full Parameter List**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
375
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
376 This mode gives you fuller control over lastz. The description of these and other parameters is found at the end of this page. Note that not all parameters are included in this interface. If you would like to make additional options available through Galaxy, e-mail us at galaxy-bugs@bx.psu.edu.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
377
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
378 ------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
379
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
380 **Do you want to modify the reference name?**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
381
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
382 This option allows you to set the name of the reference sequence manually. This is helpful when, for example, you would like to make the reference name compatible with the UCSC naming conventions to be able to display your lastz results as a custom track at the UCSC Genome Browser.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
383
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
384 ------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
385
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
386 **LASTZ parameter list**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
387
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
388 This is an exhaustive list of LASTZ options. Once again, please note that not all options are included in this interface. If you would like to make additional options available through Galaxy, e-mail us at galaxy-bugs@bx.psu.edu::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
389
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
390 target[[s..e]][-] spec/file containing target sequence (fasta or nib)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
391 [s..e] defines a subrange of the file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
392 - indicates reverse-complement
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
393 (use --help=files for more details)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
394 query[[s..e]][-] spec/file containing query sequences (fasta or nib)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
395 if absent, queries come from stdin (unless they
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
396 aren't needed, as for --self or --tableonly)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
397 (use --help=files for more details)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
398 --self the target sequence is also the query
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
399 --quantum the query sequence contains quantum DNA
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
400 --seed=match&lt;length&gt; use a word with no gaps instead of a seed pattern
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
401 --seed=half&lt;length&gt; use space-free half-weight word instead of seed pattern
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
402 --match=&lt;reward&gt;[,&lt;penalty&gt;] set the score values for a match (+&lt;reward&gt;)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
403 and mismatch (-&lt;penalty&gt;)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
404 --[no]trans[ition][=2] allow one or two transitions in a seed hit
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
405 (by default a transition is allowed)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
406 --word=&lt;bits&gt; set max bits for word hash; use this to trade time for
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
407 memory, eliminating thrashing for heavy seeds
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
408 (default is 28 bits)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
409 --[no]filter=[&lt;T&gt;:]&lt;M&gt; filter half-weight seed hits, requiring at least M
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
410 matches and allowing no more than T transversions
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
411 (default is no filtering)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
412 --notwins require just one seed hit
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
413 --twins=[&lt;min&gt;:]&lt;maxgap&gt; require two nearby seed hits on the same diagonal
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
414 (default is twins aren't required)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
415 --notwins allow single, isolated seeds
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
416 --[no]recoverseeds avoid losing seeds in hash collisions. Cannot be used with --twins
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
417 --seedqueue=&lt;entries&gt; set number of entries in seed hit queue
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
418 (default is 262144)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
419 --anchors=&lt;file&gt; read anchors from a file, instead of discovering anchors
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
420 via seeding
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
421 --recoverhits recover hash-collision seed hits
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
422 (default is not to recover seed hits)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
423 --step=&lt;length&gt; set step length (default is 1)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
424 --maxwordcount=&lt;limit&gt; words occurring more often than &lt;limit&gt; in the target
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
425 are not eligible for seeds
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
426 --strand=both search both strands
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
427 --strand=plus search + strand only (matching strand of query spec)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
428 --strand=minus search - strand only (opposite strand of query spec)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
429 (by default both strands are searched)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
430 --ambiguousn treat N as an ambiguous nucleotide
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
431 (by default N is treated as a sequence splicing character)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
432 --[no]gfextend perform gap-free extension of seed hits to HSPs
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
433 (by default no extension is performed)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
434 --[no]chain perform chaining
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
435 --chain=&lt;diag,anti&gt; perform chaining with given penalties for diagonal and
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
436 anti-diagonal
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
437 (by default no chaining is performed)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
438 --[no]gapped perform gapped alignment (instead of gap-free)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
439 (by default gapped alignment is performed)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
440 --score[s]=&lt;file&gt; read substitution scores from a file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
441 (default is HOXD70)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
442 --unitscore[s] scores are +1/-1 for match/mismatch
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
443 --gap=&lt;[open,]extend&gt; set gap open and extend penalties (default is 400,30)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
444 --xdrop=&lt;score&gt; set x-drop threshold (default is 10*sub[A][A])
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
445 --ydrop=&lt;score&gt; set y-drop threshold (default is open+300extend)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
446 --infer[=&lt;control&gt;] infer scores from the sequences, then use them
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
447 --inferonly[=&lt;control&gt;] infer scores, but don't use them (requires --infscores)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
448 all inference options are read from the control file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
449 --infscores[=&lt;file&gt;] write inferred scores to a file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
450 --hspthresh=&lt;score&gt; set threshold for high scoring pairs (default is 3000)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
451 ungapped extensions scoring lower are discarded
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
452 &lt;score&gt; can also be a percentage or base count
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
453 --entropy adjust for entropy when qualifying HSPs in the x-drop extension
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
454 method
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
455 --noentropy don't adjust for entropy when qualifying HSPs
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
456 --exact=&lt;length&gt; set threshold for exact matches
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
457 if specified, exact matches are found rather than high
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
458 scoring pairs (replaces --hspthresh)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
459 --inner=&lt;score&gt; set threshold for HSPs during interpolation
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
460 (default is no interpolation)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
461 --gappedthresh=&lt;score&gt; set threshold for gapped alignments
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
462 gapped extensions scoring lower are discarded
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
463 &lt;score&gt; can also be a percentage or base count
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
464 (default is to use same value as --hspthresh)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
465 --ball=&lt;score&gt; set minimum score required of words 'in' a quantum ball
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
466 --[no]entropy involve entropy in filtering high scoring pairs
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
467 (default is "entropy")
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
468 --[no]mirror report/use mirror image of all gap-free alignments
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
469 (default is "mirror" for self-alignments only)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
470 --traceback=&lt;bytes&gt; space for trace-back information
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
471 (default is 80.0M)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
472 --masking=&lt;count&gt; mask any position in target hit this many times
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
473 zero indicates no masking
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
474 (default is no masking)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
475 --targetcapsule=&lt;capsule_file&gt; the target seed word position table and seed
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
476 (as well as the target sequence) are read from specified file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
477 --segments=&lt;segment_file&gt; read segments from a file, instead of discovering
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
478 them via seeding. Replaces other seeding or gap-free extension
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
479 options
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
480 --[no]census[=&lt;file&gt;] count/report how many times each target base aligns
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
481 (default is to not report census)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
482 --identity=&lt;min&gt;[..&lt;max&gt;] filter alignments by percent identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
483 0&lt;=min&lt;=max&lt;=100; blocks (or HSPs) outside min..max
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
484 are discarded
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
485 (default is no identity filtering)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
486 --coverage=&lt;min&gt;[..&lt;max&gt;] filter alignments by percentage of query covered
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
487 0&lt;=min&lt;=max&lt;=100; blocks (or HSPs) outside min..max
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
488 are discarded
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
489 (default is no query coverage filtering)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
490 --notrivial do not output trivial self-alignment block if the target and query
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
491 sequences are identical. Using --self enables this option automatically
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
492 --output=&lt;output_file&gt; write the alignments to the specified file name instead of stdout
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
493 --code=&lt;file&gt; give quantum code for query sequence (only for display)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
494 --format=&lt;type&gt; specify output format; one of lav, axt, maf, maf+, maf-, text,
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
495 lav+text, cigar, text, rdotplot, general, or general:&lt;fields&gt;
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
496 (by default output is LAV)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
497 --rdotplot=&lt;file&gt; create an additional output file suitable for plotting the alignments
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
498 with the R statistical package.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
499 --markend Just before normal completion, write "# lastz end-of-file" to output file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
500 --census[=&lt;output_file&gt;] count and report how many times each target base aligns, up
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
501 to 255. Ns are included in the count
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
502 --census16[=&lt;output_file&gt;] count and report how many times each target base aligns, up
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
503 to 65 thousand
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
504 --census32[=&lt;output_file&gt;] count and report how many times each target base aligns, up
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
505 to 4 billion
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
506 --writecapsule=&lt;capsule_file&gt; just write out a target capsule file and quit; don't
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
507 search for seeds or perform subsequent stages
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
508 --verbosity=&lt;level&gt; set info level (0 is minimum, 10 is everything)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
509 (default is 0)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
510 --[no]runtime report runtime in the output file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
511 (default is to not report runtime)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
512 --tableonly[=count] just produce the target position table, don't
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
513 search for seeds
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
514 --[no]stats[=&lt;file&gt;] show search statistics (or don't)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
515 (not available in this build)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
516 --version report the program version and quit
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
517 --help list all options
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
518 --help=files list information about file specifiers
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
519 --help=short[cuts] list blastz-compatible shortcuts
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
520 --help=yasra list yasra-specific shortcuts
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
521
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
522 </help>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
523 </tool>