annotate lastz_wrapper.xml @ 0:0801f8207d30 draft

Uploaded tarball
author devteam
date Mon, 26 Nov 2012 09:47:51 -0500
parents
children a36c081e0043
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
1 <tool id="lastz_wrapper_2" name="Lastz" version="1.2.2">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
2 <requirements>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
3 <requirement type="package" version="1.02.00">lastz</requirement>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
4 </requirements>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
5 <description> map short reads against reference sequence</description>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
6 <command interpreter="python">lastz_wrapper.py
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
7 #if $seq_name.how_to_name=="yes":
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
8 --ref_name=$seq_name.ref_name
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
9 #end if
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
10 --ref_source=$source.ref_source
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
11 --source_select=$params.source_select
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
12 --out_format=$out_format
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
13 --input2=$input2
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
14 #if $source.ref_source=="history":
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
15 --input1=$source.input1
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
16 --ref_sequences=$input1.metadata.sequences
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
17 #else:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
18 --input1="${source.input1_2bit.fields.path}"
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
19 --ref_sequences="None"
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
20 #end if
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
21 #if $params.source_select=="pre_set":
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
22 --pre_set_options=${params.pre_set_options}
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
23 #else:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
24 --strand=$params.strand
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
25 --seed=$params.seed
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
26 --gfextend=$params.gfextend
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
27 --chain=$params.chain
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
28 --transition="$params.transition"
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
29 --O=$params.O
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
30 --E=$params.E
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
31 --X=$params.X
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
32 --Y=$params.Y
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
33 --K=$params.K
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
34 --L=$params.L
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
35 --entropy=$params.entropy
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
36 #end if
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
37 --identity_min=$min_ident
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
38 --identity_max=$max_ident
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
39 --coverage=$min_cvrg
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
40 --output=$output1
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
41 --unmask=$unmask
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
42 --lastzSeqsFileDir=${GALAXY_DATA_INDEX_DIR}
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
43 </command>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
44 <inputs>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
45 <param name="input2" format="fasta" type="data" label="Align sequencing reads in" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
46 <conditional name="source">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
47 <param name="ref_source" type="select" label="Against reference sequences that are">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
48 <option value="cached">locally cached</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
49 <option value="history">in your history</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
50 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
51 <when value="cached">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
52 <param name="input1_2bit" type="select" label="Using reference genome" help="If your genome of interest is not listed, contact the Galaxy team">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
53 <options from_data_table="lastz_seqs" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
54 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
55 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
56 <when value="history">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
57 <param name="input1" type="data" format="fasta" label="Select a reference dataset" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
58 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
59 </conditional>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
60 <param name="out_format" type="select" label="Output format">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
61 <option value="sam">SAM</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
62 <option value="diffs">Polymorphisms</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
63 <option value="tabular">Tabular</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
64 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
65 <conditional name="params">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
66 <param name="source_select" type="select" label="Lastz settings to use" help="For most mapping needs use Commonly used settings. If you want full control use Full List">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
67 <option value="pre_set">Commonly used</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
68 <option value="full">Full Parameter List</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
69 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
70 <when value="pre_set">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
71 <param name="pre_set_options" type="select" label="Select mapping mode">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
72 <option value="yasra98">Roche-454 98% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
73 <option value="yasra95">Roche-454 95% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
74 <option value="yasra90">Roche-454 90% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
75 <option value="yasra85">Roche-454 85% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
76 <option value="yasra75">Roche-454 75% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
77 <option value="yasra95short">Illumina 95% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
78 <option value="yasra85short">Illumina 85% identity</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
79 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
80 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
81 <when value="full">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
82 <param name="strand" type="select" label="Which strand to search?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
83 <option value="both">Both</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
84 <option value="plus">Search forward strand only (the one in the reference)</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
85 <option value="minus">Search the reverse complement strand only (opposite of the reference)</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
86 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
87 <param name="seed" type="select" label="Select seeding settings" help="allows you set word size and number of mismatches">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
88 <option value="12of19">Seed hits require a 19 bp word with matches in 12 specific positions</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
89 <option value="14of22">Seed hits require a 22 bp word with matches in 14 specific positions</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
90 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
91 <param name="transition" type="select" label="Select transition settings" help="affects the number of allowed transition substitutions">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
92 <option value="transition">Allow one transition in each seed hit</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
93 <option value="transition=2">Allow two transitions in a seed hit </option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
94 <option value="notransition">Don't allow any transitions in seed hits</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
95 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
96 <param name="gfextend" type="select" label="Perform gap-free extension of seed hits to HSPs (high scoring segment pairs)?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
97 <option value="nogfextend">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
98 <option value="gfextend">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
99 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
100 <param name="chain" type="select" label="Perform chaining of HSPs?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
101 <option value="nochain">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
102 <option value="chain">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
103 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
104 <param name="O" type="integer" size="5" value="400" label="Gap opening penalty"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
105 <param name="E" type="integer" size="5" value="30" label="Gap extension penalty"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
106 <param name="X" type="integer" size="5" value="910" label="X-drop threshold"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
107 <param name="Y" type="integer" size="5" value="9370" label="Y-drop threshold"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
108 <param name="K" type="integer" size="5" value="3000" label="Set the threshold for HSPs (ungapped extensions scoring lower are discarded)"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
109 <param name="L" type="integer" size="5" value="3000" label="Set the threshold for gapped alignments (gapped extensions scoring lower are discarded)"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
110 <param name="entropy" type="select" label="Involve entropy when filtering HSPs?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
111 <option value="noentropy">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
112 <option value="entropy">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
113 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
114 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
115 </conditional>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
116 <conditional name="seq_name">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
117 <param name="how_to_name" type="select" label="Do you want to modify the reference name?">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
118 <option value="no">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
119 <option value="yes">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
120 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
121 <when value="yes">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
122 <param name="ref_name" type="text" size="25" value="Type sequence name here" label="Enter name for the Reference sequence"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
123 </when>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
124 <when value="no" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
125 </conditional>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
126 <param name="min_ident" type="integer" size="3" value="0" label="Do not report matches below this identity (%)"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
127 <param name="max_ident" type="integer" size="3" value="100" label="Do not report matches above this identity (%)"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
128 <param name="min_cvrg" type="integer" size="3" value="0" label="Do not report matches that cover less than this percentage of each read"/>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
129 <param name="unmask" type="select" label="Convert lowercase bases to uppercase">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
130 <option value="yes">Yes</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
131 <option value="no">No</option>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
132 </param>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
133 </inputs>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
134 <outputs>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
135 <data format="tabular" name="output1" label="${tool.name} on ${on_string}: mapped reads">
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
136 <change_format>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
137 <when input="out_format" value="sam" format="sam" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
138 </change_format>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
139 </data>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
140 </outputs>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
141 <tests>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
142 <test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
143 <!--
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
144 Lastz command:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
145 lastz phiX.2bit/phiX174[nickname=Ref] test-data/b1.fasta +nogfextend +nochain +gapped +strand=both +seed=12of19 +transition O=400 E=30 X=910 Y=9370 K=3000 L=3000 +noentropy +ambiguousn +nolaj +identity=0..100 +coverage=0 +format=sam- > lastz_wrapper_out2.sam
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
146 You need to point to phiX.2bit somewhere on your system. b1.fasta is located in galaxy's test-data. You will have to replace all the pluses before the
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
147 commands with 2 dashes, as double-dash can't appear in an XML comment.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
148 -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
149 <param name="input2" value="b1.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
150 <param name="ref_source" value="cached" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
151 <!-- this is the backwards-compatible "unique value" for this file, not an actual path -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
152 <param name="input1_2bit" value="/galaxy/data/phiX/seq/phiX.2bit" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
153 <param name="out_format" value="sam" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
154 <param name="source_select" value="full" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
155 <param name="strand" value="both" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
156 <param name="seed" value="12of19" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
157 <param name="transition" value="transition" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
158 <param name="gfextend" value="nogfextend" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
159 <param name="chain" value="nochain" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
160 <param name="O" value="400" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
161 <param name="E" value="30" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
162 <param name="X" value="910" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
163 <param name="Y" value="9370" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
164 <param name="K" value="3000" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
165 <param name="L" value="3000" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
166 <param name="entropy" value="noentropy" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
167 <!--
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
168 how_to_name is not the default. It is changed to modify
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
169 input1_2bit by adding the ref_name as a nickname
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
170 -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
171 <param name="how_to_name" value="yes" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
172 <param name="ref_name" value="Ref" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
173 <param name="min_ident" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
174 <param name="max_ident" value="100" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
175 <param name="min_cvrg" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
176 <param name="unmask" value="yes" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
177 <output name="output1" file="lastz_wrapper_out2.sam" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
178 </test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
179 <test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
180 <!--
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
181 Lastz command:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
182 lastz test-data/phiX.fasta test-data/b1.fasta[fullnames] +yasra95short +ambiguousn +nolaj +identity=0..100 +coverage=0 +format=diffs > lastz_wrapper_out3.tabular
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
183 phiX.fasta and b1.fasta are located in galaxy's test-data. You will have to replace all the pluses before the commands with 2 dashes,
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
184 as double-dash can't appear in an XML comment.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
185 -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
186 <param name="input2" value="b1.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
187 <param name="ref_source" value="history" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
188 <param name="input1" value="phiX.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
189 <param name="out_format" value="diffs" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
190 <param name="source_select" value="pre_set" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
191 <param name="pre_set_options" value="yasra95short" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
192 <param name="how_to_name" value="no" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
193 <param name="min_ident" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
194 <param name="max_ident" value="100" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
195 <param name="min_cvrg" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
196 <param name="unmask" value="yes" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
197 <output name="output1" file="lastz_wrapper_out3.tabular" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
198 </test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
199 <test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
200 <!--
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
201 Lastz command: first you will need to split the file phiX_split.fasta into two files,
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
202 phiX1.fasta and phiX2.fasta, each with 1 sequence (phiX1 and phiX2, respectively). Then:
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
203 lastz phiX1.fasta test-data/b1.fasta *yasra95short *ambiguousn *nolaj *identity=0..100 *coverage=0 *format=general-:score,name1,strand1,size1,start1,zstart1,end1,length1,text1,name2,strand2,size2,start2,zstart2,end2,start2+,zstart2+,end2+,length2,text2,diff,cigar,identity,coverage,gaprate,diagonal,shingle > lastz_wrapper_out4.tabular
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
204 lastz phiX2.fasta test-data/b1.fasta *yasra95short *ambiguousn *nolaj *identity=0..100 *coverage=0 *format=general-:score,name1,strand1,size1,start1,zstart1,end1,length1,text1,name2,strand2,size2,start2,zstart2,end2,start2+,zstart2+,end2+,length2,text2,diff,cigar,identity,coverage,gaprate,diagonal,shingle >> lastz_wrapper_out4.tabular
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
205 You need to point to phiX1.fasta and phiX2.fasta somewhere on your system.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
206 phiX_split.fasta and b1.fasta are located in galaxy's test-data
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
207 You will have to replace all the asterisks before the commands with 2 dashes,
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
208 as double-dash can't appear in an XML comment
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
209
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
210 NOTE: since the input file includes more than 1 sequence, the output must be sorted in
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
211 order for functional test to pass. This is done using the sort="True" attribute on the output.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
212 -->
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
213 <param name="input2" value="b1.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
214 <param name="ref_source" value="history" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
215 <param name="input1" value="phiX_split.fasta" ftype="fasta" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
216 <param name="out_format" value="tabular" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
217 <param name="source_select" value="pre_set" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
218 <param name="pre_set_options" value="yasra95short" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
219 <param name="how_to_name" value="no" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
220 <param name="min_ident" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
221 <param name="max_ident" value="100" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
222 <param name="min_cvrg" value="0" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
223 <param name="unmask" value="yes" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
224 <output name="output1" file="lastz_wrapper_out4.tabular" sort="True" />
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
225 </test>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
226 </tests>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
227 <help>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
228
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
229 **What it does**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
230
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
231 **LASTZ** is a high-performance pairwise sequence aligner derived from BLASTZ. It was written by Bob Harris in Webb Miller's laboratory at Penn State University. Special scoring sets were derived to improve runtime performance and quality. This Galaxy version of LASTZ is geared towards aligning short (Illumina/Solexa, AB/SOLiD) and medium (Roche/454) reads against a reference sequence. There is excellent, extensive documentation on LASTZ available here_.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
232
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
233 .. _here: http://www.bx.psu.edu/miller_lab/dist/README.lastz-1.02.00/README.lastz-1.02.00.html
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
234
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
235 ------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
236
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
237 **Input formats**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
238
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
239 LASTZ accepts reference and reads in FASTA format. However, because Galaxy supports implicit format conversion, the tool will recognize fastq and other method-specific formats.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
240
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
241 ------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
242
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
243 **Outputs**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
244
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
245 LASTZ generates one output. Depending on the choice you make in the *Output format* drop-down, LASTZ will produce a SAM file showing sequence alignments, a list of differences between the reads and reference (Polymorphisms), or a general table with one line per alignment block (Tabular). Examples of these outputs are shown below.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
246
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
247 **SAM output**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
248
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
249 SAM has 12 columns::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
250
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
251 1 2 3 4 5 6 7 8 9 10 11 12
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
252 ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
253 HWI-EAS91_1_30788AAXX:1:2:1670:915 99 chr9 58119878 60 36M = 58120234 392 GACCCCTACCCCACCGTGCTCTGGATCTCAGTGTTT IIIIIIIIIIIIIIIIEIIIIIII7IIIIIIIIIII XT:A:U NM:i:0 SM:i:37 AM:i:37 X0:i:1 X1:i:0 XM:i:0 XO:i:0 XG:i:0 MD:Z:36
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
254 HWI-EAS91_1_30788AAXX:1:2:1670:915 147 chr9 58120234 60 36M = 58119878 -392 ATGAGTCGAATTCTATTTTCCAAACTGTTAACAAAA IFIIDI;IIICIIIIIIIIIIIIIIIIIIIIIIIII XT:A:U NM:i:0 SM:i:37 AM:i:37 X0:i:1 X1:i:0 XM:i:0 XO:i:0 XG:i:0 MD:Z:36
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
255
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
256
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
257 where::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
258
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
259 Column Description
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
260 --------- ---------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
261 1. QNAME Query (pair) NAME
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
262 2. FLAG bitwise FLAG
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
263 3. RNAME Reference sequence NAME
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
264 4. POS 1-based leftmost POSition/coordinate of clipped sequence
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
265 5. MAPQ MAPping Quality (Phred-scaled)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
266 6. CIGAR extended CIGAR string
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
267 7. MRNM Mate Reference sequence NaMe ('=' if same as RNAME)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
268 8. MPOS 1-based Mate POSition
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
269 9. ISIZE Inferred insert SIZE
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
270 10. SEQ query SEQuence on the same strand as the reference
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
271 11. QUAL query QUALity (ASCII-33 gives the Phred base quality)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
272 12. OPT variable OPTional fields in the format TAG:VTYPE:VALUE, tab-separated
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
273
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
274 The flags are as follows::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
275
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
276 Flag Description
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
277 ------ -------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
278 0x0001 the read is paired in sequencing
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
279 0x0002 the read is mapped in a proper pair
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
280 0x0004 the query sequence itself is unmapped
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
281 0x0008 the mate is unmapped
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
282 0x0010 strand of the query (1 for reverse)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
283 0x0020 strand of the mate
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
284 0x0040 the read is the first read in a pair
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
285 0x0080 the read is the second read in a pair
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
286 0x0100 the alignment is not primary
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
287
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
288 **Polymorphism (SNP or differences) output**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
289
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
290 Polymorphism output contains 14 columns::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
291
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
292 1 2 3 4 5 6 7 8 9 10 11 12 13 14
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
293 --------------------------------------------------------------------------------------------------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
294 chrM 2490 2491 + 5386 HWI-EAS91_1_306UPAAXX:6:1:486:822 10 11 - 36 C A ACCTGTTTTACAGACACCTAAAGCTACATCGTCAAC ACCTGTTTTAAAGACACCTAAAGCTACATCGTCAAC
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
295 chrM 2173 2174 + 5386 HWI-EAS91_1_306UPAAXX:6:1:259:1389 26 27 + 36 G T GCGTACTTATTCGCCACCATGATTATGACCAGTGTT GCGTACTTATTCGCCACCATGATTATTACCAGTGTT
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
296
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
297 where::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
298
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
299 1. (chrM) - Reference sequence id
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
300 2. (2490) - Start position of the difference in the reference
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
301 3. (2491) - End position of the difference in the reference
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
302 4. (+) - Strand of the reference (always plus)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
303 5. (5386) - Length of the reference sequence
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
304 6. (HWI...) - read id
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
305 7. (10) - Start position of the difference in the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
306 8. (11) - End position of the difference in the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
307 9. (-) - Strand of the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
308 10. (36) - Length of the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
309 11. (C) - Nucleotide in the reference
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
310 12. (A) - Nucleotide in the read
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
311 13. (ACC...) - Reference side of the alignment
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
312 14. (ACC...) - Read side of the alignment
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
313
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
314 **Tabular output**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
315
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
316 Tabular output is a tab-separated format with 30 columns::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
317
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
318 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
319 -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
320 14 PHIX174 + 5386 4648 4647 4661 14 ATTTTCGTGATATT EYKX4VC01BV8HS + 204 154 153 167 154 153 167 14 ATTTTCGTGATATT .............. 14M 14/14 100.0% 14/204 6.9% 0/14 0.0% 4494 NA
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
321 16 PHIX174 + 5386 3363 3362 3378 16 GACGCCGGATTTGAGA EYKX4VC01AWJ88 - 259 36 35 51 209 208 224 16 GACGCCGGATTTGAGA ................ 16M 16/16 100.0% 16/259 6.2% 0/16 0.0% 3327 NA
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
322
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
323 The following columns are present::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
324
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
325 Field Meaning
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
326 ---------------- -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
327 1. score Score of the alignment block. The scale and meaning of this number will vary, depending on the final stage performed and other command-line options.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
328 2. name1 Name of the target sequence.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
329 3. strand1 Target sequence strand, either "+" or "−".
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
330 4. size1 Size of the entire target sequence.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
331 5. start1 Starting position of the alignment block in the target, origin-one.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
332 6. zstart1 Starting position of the alignment block in the target, origin-zero.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
333 7. end1 Ending position of the alignment block in the target, expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
334 8. length1 Length of the alignment block in the target (excluding gaps).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
335 9. text1 Aligned characters in the target, including gap characters.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
336 10. name2 Name of the query sequence.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
337 11. strand2 Query sequence strand, either "+" or "−".
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
338 12. size2 Size of the entire query sequence.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
339 13. start2 Starting position of the alignment block in the query, origin-one.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
340 14. zstart2 Starting position of the alignment block in the query, origin-zero.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
341 15. end2 Ending position of the alignment block in the query, expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
342 16. start2+ Starting position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), origin-one. Note that if strand2 is "−", then this is the other end of the block from start2.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
343 17. zstart2+ Starting position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), origin-zero. Note that if strand2 is "−", then this is the other end of the block from zstart2.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
344 18. end2+ Ending position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems). Note that if strand2 is "−", then this is the other end of the block from end2.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
345 19. length2 Length of the alignment block in the query (excluding gaps).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
346 20. text2 Aligned characters in the query, including gap characters.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
347 21. diff Differences between what would be written for text1 and text2. Matches are written as . (period), transitions as : (colon), transversions as X, and gaps as - (hyphen).
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
348 22. cigar A CIGAR-like representation of the alignment's path through the Dynamic Programming matrix. This is the short representation, without spaces, described in the Ensembl CIGAR specification.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
349 23./24. identity Fraction of aligned bases in the block that are matches (see Identity). This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;. The second field contains the same value, computed as a percentage.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
350 25./26. coverage Fraction of the entire input sequence (target or query, whichever is shorter) that is covered by the alignment block (see Coverage). This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;. The second field contains the same value, computed as a percentage.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
351 27./28. gaprate Rate of gaps (also called indels) in the alignment block. This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;, with the numerator being the number of alignment columns containing gaps and the denominator being the number without gaps. The second field contains the same value, computed as a percentage.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
352 29. diagonal The diagonal of the start of the alignment block in the dynamic programming matrix, expressed as an identifying number start1-start2.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
353 30. shingle A measurement of the shingle overlap between the target and the query. This is intended for the case where both the target and query are relatively short, and their ends are expected to overlap.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
354
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
355 -------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
356
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
357 **LASTZ Settings**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
358
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
359 There are two setting modes: (1) **Commonly used settings** and (2) **Full Parameter List**.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
360
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
361 **Commonly used settings**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
362
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
363 There are seven modes::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
364
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
365 Illumina-Solexa/AB-SOLiD 95% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
366 Illumina-Solexa/AB-SOLiD 85% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
367 Roche-454 98% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
368 Roche-454 95% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
369 Roche-454 90% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
370 Roche-454 85% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
371 Roche-454 75% identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
372
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
373 When deciding which one to use, consider the following: a 36 bp read with two differences will be 34/36 = 94% identical to the reference.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
374
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
375 **Full Parameter List**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
376
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
377 This mode gives you fuller control over lastz. The description of these and other parameters is found at the end of this page. Note that not all parameters are included in this interface. If you would like to make additional options available through Galaxy, e-mail us at galaxy-bugs@bx.psu.edu.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
378
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
379 ------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
380
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
381 **Do you want to modify the reference name?**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
382
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
383 This option allows you to set the name of the reference sequence manually. This is helpful when, for example, you would like to make the reference name compatible with the UCSC naming conventions to be able to display your lastz results as a custom track at the UCSC Genome Browser.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
384
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
385 ------
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
386
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
387 **LASTZ parameter list**
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
388
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
389 This is an exhaustive list of LASTZ options. Once again, please note that not all options are included in this interface. If you would like to make additional options available through Galaxy, e-mail us at galaxy-bugs@bx.psu.edu::
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
390
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
391 target[[s..e]][-] spec/file containing target sequence (fasta or nib)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
392 [s..e] defines a subrange of the file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
393 - indicates reverse-complement
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
394 (use --help=files for more details)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
395 query[[s..e]][-] spec/file containing query sequences (fasta or nib)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
396 if absent, queries come from stdin (unless they
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
397 aren't needed, as for --self or --tableonly)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
398 (use --help=files for more details)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
399 --self the target sequence is also the query
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
400 --quantum the query sequence contains quantum DNA
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
401 --seed=match&lt;length&gt; use a word with no gaps instead of a seed pattern
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
402 --seed=half&lt;length&gt; use space-free half-weight word instead of seed pattern
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
403 --match=&lt;reward&gt;[,&lt;penalty&gt;] set the score values for a match (+&lt;reward&gt;)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
404 and mismatch (-&lt;penalty&gt;)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
405 --[no]trans[ition][=2] allow one or two transitions in a seed hit
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
406 (by default a transition is allowed)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
407 --word=&lt;bits&gt; set max bits for word hash; use this to trade time for
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
408 memory, eliminating thrashing for heavy seeds
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
409 (default is 28 bits)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
410 --[no]filter=[&lt;T&gt;:]&lt;M&gt; filter half-weight seed hits, requiring at least M
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
411 matches and allowing no more than T transversions
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
412 (default is no filtering)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
413 --notwins require just one seed hit
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
414 --twins=[&lt;min&gt;:]&lt;maxgap&gt; require two nearby seed hits on the same diagonal
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
415 (default is twins aren't required)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
416 --notwins allow single, isolated seeds
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
417 --[no]recoverseeds avoid losing seeds in hash collisions. Cannot be used with --twins
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
418 --seedqueue=&lt;entries&gt; set number of entries in seed hit queue
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
419 (default is 262144)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
420 --anchors=&lt;file&gt; read anchors from a file, instead of discovering anchors
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
421 via seeding
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
422 --recoverhits recover hash-collision seed hits
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
423 (default is not to recover seed hits)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
424 --step=&lt;length&gt; set step length (default is 1)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
425 --maxwordcount=&lt;limit&gt; words occurring more often than &lt;limit&gt; in the target
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
426 are not eligible for seeds
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
427 --strand=both search both strands
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
428 --strand=plus search + strand only (matching strand of query spec)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
429 --strand=minus search - strand only (opposite strand of query spec)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
430 (by default both strands are searched)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
431 --ambiguousn treat N as an ambiguous nucleotide
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
432 (by default N is treated as a sequence splicing character)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
433 --[no]gfextend perform gap-free extension of seed hits to HSPs
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
434 (by default no extension is performed)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
435 --[no]chain perform chaining
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
436 --chain=&lt;diag,anti&gt; perform chaining with given penalties for diagonal and
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
437 anti-diagonal
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
438 (by default no chaining is performed)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
439 --[no]gapped perform gapped alignment (instead of gap-free)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
440 (by default gapped alignment is performed)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
441 --score[s]=&lt;file&gt; read substitution scores from a file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
442 (default is HOXD70)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
443 --unitscore[s] scores are +1/-1 for match/mismatch
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
444 --gap=&lt;[open,]extend&gt; set gap open and extend penalties (default is 400,30)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
445 --xdrop=&lt;score&gt; set x-drop threshold (default is 10*sub[A][A])
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
446 --ydrop=&lt;score&gt; set y-drop threshold (default is open+300extend)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
447 --infer[=&lt;control&gt;] infer scores from the sequences, then use them
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
448 --inferonly[=&lt;control&gt;] infer scores, but don't use them (requires --infscores)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
449 all inference options are read from the control file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
450 --infscores[=&lt;file&gt;] write inferred scores to a file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
451 --hspthresh=&lt;score&gt; set threshold for high scoring pairs (default is 3000)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
452 ungapped extensions scoring lower are discarded
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
453 &lt;score&gt; can also be a percentage or base count
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
454 --entropy adjust for entropy when qualifying HSPs in the x-drop extension
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
455 method
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
456 --noentropy don't adjust for entropy when qualifying HSPs
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
457 --exact=&lt;length&gt; set threshold for exact matches
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
458 if specified, exact matches are found rather than high
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
459 scoring pairs (replaces --hspthresh)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
460 --inner=&lt;score&gt; set threshold for HSPs during interpolation
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
461 (default is no interpolation)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
462 --gappedthresh=&lt;score&gt; set threshold for gapped alignments
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
463 gapped extensions scoring lower are discarded
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
464 &lt;score&gt; can also be a percentage or base count
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
465 (default is to use same value as --hspthresh)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
466 --ball=&lt;score&gt; set minimum score required of words 'in' a quantum ball
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
467 --[no]entropy involve entropy in filtering high scoring pairs
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
468 (default is "entropy")
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
469 --[no]mirror report/use mirror image of all gap-free alignments
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
470 (default is "mirror" for self-alignments only)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
471 --traceback=&lt;bytes&gt; space for trace-back information
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
472 (default is 80.0M)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
473 --masking=&lt;count&gt; mask any position in target hit this many times
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
474 zero indicates no masking
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
475 (default is no masking)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
476 --targetcapsule=&lt;capsule_file&gt; the target seed word position table and seed
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
477 (as well as the target sequence) are read from specified file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
478 --segments=&lt;segment_file&gt; read segments from a file, instead of discovering
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
479 them via seeding. Replaces other seeding or gap-free extension
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
480 options
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
481 --[no]census[=&lt;file&gt;] count/report how many times each target base aligns
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
482 (default is to not report census)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
483 --identity=&lt;min&gt;[..&lt;max&gt;] filter alignments by percent identity
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
484 0&lt;=min&lt;=max&lt;=100; blocks (or HSPs) outside min..max
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
485 are discarded
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
486 (default is no identity filtering)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
487 --coverage=&lt;min&gt;[..&lt;max&gt;] filter alignments by percentage of query covered
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
488 0&lt;=min&lt;=max&lt;=100; blocks (or HSPs) outside min..max
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
489 are discarded
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
490 (default is no query coverage filtering)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
491 --notrivial do not output trivial self-alignment block if the target and query
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
492 sequences are identical. Using --self enables this option automatically
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
493 --output=&lt;output_file&gt; write the alignments to the specified file name instead of stdout
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
494 --code=&lt;file&gt; give quantum code for query sequence (only for display)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
495 --format=&lt;type&gt; specify output format; one of lav, axt, maf, maf+, maf-, text,
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
496 lav+text, cigar, text, rdotplot, general, or general:&lt;fields&gt;
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
497 (by default output is LAV)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
498 --rdotplot=&lt;file&gt; create an additional output file suitable for plotting the alignments
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
499 with the R statistical package.
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
500 --markend Just before normal completion, write "# lastz end-of-file" to output file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
501 --census[=&lt;output_file&gt;] count and report how many times each target base aligns, up
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
502 to 255. Ns are included in the count
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
503 --census16[=&lt;output_file&gt;] count and report how many times each target base aligns, up
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
504 to 65 thousand
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
505 --census32[=&lt;output_file&gt;] count and report how many times each target base aligns, up
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
506 to 4 billion
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
507 --writecapsule=&lt;capsule_file&gt; just write out a target capsule file and quit; don't
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
508 search for seeds or perform subsequent stages
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
509 --verbosity=&lt;level&gt; set info level (0 is minimum, 10 is everything)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
510 (default is 0)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
511 --[no]runtime report runtime in the output file
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
512 (default is to not report runtime)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
513 --tableonly[=count] just produce the target position table, don't
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
514 search for seeds
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
515 --[no]stats[=&lt;file&gt;] show search statistics (or don't)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
516 (not available in this build)
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
517 --version report the program version and quit
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
518 --help list all options
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
519 --help=files list information about file specifiers
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
520 --help=short[cuts] list blastz-compatible shortcuts
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
521 --help=yasra list yasra-specific shortcuts
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
522
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
523 </help>
0801f8207d30 Uploaded tarball
devteam
parents:
diff changeset
524 </tool>