annotate tools/metag_tools/shrimp_color_wrapper.xml @ 1:cdcb0ce84a1b

Uploaded
author xuebing
date Fri, 09 Mar 2012 19:45:15 -0500
parents 9071e359b9a3
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
1 <tool id="shrimp_color_wrapper" name="SHRiMP for Color-space" version="1.0.0">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
2 <description>reads mapping against reference sequence </description>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
3 <command interpreter="python">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
4 #if $param.skip_or_full=="skip" #shrimp_color_wrapper.py $input_target $input_query $output1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
5 #else #shrimp_color_wrapper.py $input_target $input_query $output1 $param.spaced_seed $param.seed_matches_per_window $param.seed_hit_taboo_length $param.seed_generation_taboo_length $param.seed_window_length $param.max_hits_per_read $param.max_read_length $param.kmer $param.sw_match_value $param.sw_mismatch_value $param.sw_gap_open_ref $param.sw_gap_open_query $param.sw_gap_ext_ref $param.sw_gap_ext_query $param.sw_crossover_penalty $param.sw_full_hit_threshold $param.sw_vector_hit_threshold
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
6 #end if#
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
7 </command>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
8 <inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
9 <page>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
10 <param name="input_query" type="data" format="csfasta" label="Align sequencing reads" help="No dataset? Read tip below"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
11 <param name="input_target" type="data" format="fasta" label="against reference" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
12 <conditional name="param">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
13 <param name="skip_or_full" type="select" label="SHRiMP settings to use" help="For most mapping needs use Commonly used settings. If you want full control use Full List">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
14 <option value="skip">Commonly used</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
15 <option value="full">Full Parameter List</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
16 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
17 <when value="skip" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
18 <when value="full">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
19 <param name="spaced_seed" type="text" size="30" value="1111001111" label="Spaced Seed" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
20 <param name="seed_matches_per_window" type="integer" size="5" value="2" label="Seed Matches per Window" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
21 <param name="seed_hit_taboo_length" type="integer" size="5" value="4" label="Seed Hit Taboo Length" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
22 <param name="seed_generation_taboo_length" type="integer" size="5" value="0" label="Seed Generation Taboo Length" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
23 <param name="seed_window_length" type="float" size="10" value="115.0" label="Seed Window Length" help="in percentage"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
24 <param name="max_hits_per_read" type="integer" size="10" value="100" label="Maximum Hits per Read" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
25 <param name="max_read_length" type="integer" size="10" value="1000" label="Maximum Read Length" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
26 <param name="kmer" type="integer" size="10" value="-1" label="Kmer Std. Deviation Limit" help="-1 as None"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
27 <param name="sw_match_value" type="integer" size="10" value="100" label="S-W Match Value" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
28 <param name="sw_mismatch_value" type="integer" size="10" value="-150" label="S-W Mismatch Value" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
29 <param name="sw_gap_open_ref" type="integer" size="10" value="-400" label="S-W Gap Open Penalty (Reference)" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
30 <param name="sw_gap_open_query" type="integer" size="10" value="-400" label="S-W Gap Open Penalty (Query)" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
31 <param name="sw_gap_ext_ref" type="integer" size="10" value="-70" label="S-W Gap Extend Penalty (Reference)" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
32 <param name="sw_gap_ext_query" type="integer" size="10" value="-70" label="S-W Gap Extend Penalty (Query)" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
33 <param name="sw_crossover_penalty" type="integer" size="10" value="-140" label="S-W Crossover Penalty" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
34 <param name="sw_full_hit_threshold" type="float" size="10" value="68.0" label="S-W Full Hit Threshold" help="in percentage"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
35 <param name="sw_vector_hit_threshold" type="float" size="10" value="60.0" label="S-W Vector Hit Threshold" help="in percentage"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
36 </when>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
37 </conditional>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
38 </page>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
39 </inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
40 <outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
41 <data name="output1" format="tabular"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
42 </outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
43 <requirements>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
44 <requirement type="binary">rmapper-cs</requirement>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
45 </requirements>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
46 <tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
47 <test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
48 <param name="skip_or_full" value="skip" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
49 <param name="input_target" value="Ssuis.fasta" ftype="fasta" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
50 <param name="input_query" value="shrimp_cs_test1.csfasta" ftype="csfasta"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
51 <output name="output1" file="shrimp_cs_test1.out" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
52 </test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
53 </tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
54 <help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
55
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
56 .. class:: warningmark
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
57
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
58 To use this tool your dataset needs to be in the *csfasta* (as ABI SOLiD color-space sequences) format. Click pencil icon next to your dataset to set the datatype to *csfasta*.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
59
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
60
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
61 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
62
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
63 **What it does**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
64
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
65 SHRiMP (SHort Read Mapping Package) is a software package for aligning genomic reads against a target genome.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
66
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
67
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
68 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
69
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
70 **Input formats**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
71
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
72 A multiple color-space file, for example::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
73
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
74 >2_263_779_F3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
75 T132032030200202202003211302222202230022110222
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
76
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
77
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
78 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
79
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
80 **Outputs**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
81
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
82 The tool returns the default SHRiMP output::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
83
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
84
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
85 1 2 3 4 5 6 7 8 9 10
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
86 --------------------------------------------------------------------------------------------------------------------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
87 >2_263_779_F3 Streptococcus_suis + 814344 814388 1 45 45 3660 8x19x3x2x6x4x3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
88
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
89 where::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
90
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
91 1. (>2_263_779_F3) - Read id
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
92 2. (Streptococcus_suis) - Reference sequence id
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
93 3. (+) - Strand of the read
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
94 4. (814344) - Start position of the alignment in the reference
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
95 5. (814388) - End position of the alignment in the reference
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
96 6. (1) - Start position of the alignment in the read
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
97 7. (45) - End position of the alignment in the read
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
98 8. (45) - Length of the read
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
99 9. (3660) - Score
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
100 10. (8x19x3x2x6x4x3) - Edit string
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
101
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
102
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
103 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
104
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
105 **SHRiMP parameter list**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
106
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
107 The commonly used parameters with default value setting::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
108
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
109 -s Spaced Seed (default: 111111011111)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
110 The spaced seed is a single contiguous string of 0's and 1's.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
111 0's represent wildcards, or positions which will always be
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
112 considered as matching, whereas 1's dictate positions that
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
113 must match. A string of all 1's will result in a simple kmer scan.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
114 -n Seed Matches per Window (default: 2)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
115 The number of seed matches per window dictates how many seeds
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
116 must match within some window length of the genome before that
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
117 region is considered for Smith-Waterman alignment. A lower
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
118 value will increase sensitivity while drastically increasing
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
119 running time. Higher values will have the opposite effect.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
120 -t Seed Hit Taboo Length (default: 4)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
121 The seed taboo length specifies how many target genome bases
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
122 or colours must exist prior to a previous seed match in order
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
123 to count another seed match as a hit.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
124 -9 Seed Generation Taboo Length (default: 0)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
125
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
126 -w Seed Window Length (default: 115.00%)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
127 This parameter specifies the genomic span in bases (or colours)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
128 in which *seed_matches_per_window* must exist before the read
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
129 is given consideration by the Simth-Waterman alignment machinery.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
130 -o Maximum Hits per Read (default: 100)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
131 This parameter specifies how many hits to remember for each read.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
132 If more hits are encountered, ones with lower scores are dropped
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
133 to make room.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
134 -r Maximum Read Length (default: 1000)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
135 This parameter specifies the maximum length of reads that will
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
136 be encountered in the dataset. If larger reads than the default
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
137 are used, an appropriate value must be passed to *rmapper*.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
138 -d Kmer Std. Deviation Limit (default: -1 [None])
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
139 This option permits pruning read kmers, which occur with
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
140 frequencies greater than *kmer_std_dev_limit* standard
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
141 deviations above the average. This can shorten running
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
142 time at the cost of some sensitivity.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
143 *Note*: A negative value disables this option.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
144 -m S-W Match Value (default: 100)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
145 The value applied to matches during the Smith-Waterman score calculation.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
146 -i S-W Mismatch Value (default: -150)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
147 The value applied to mismatches during the Smith-Waterman
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
148 score calculation.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
149 -g S-W Gap Open Penalty (Reference) (default: -400)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
150 The value applied to gap opens along the reference sequence
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
151 during the Smith-Waterman score calculation.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
152 *Note*: Note that for backward compatibility, if -g is set
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
153 and -q is not set, the gap open penalty for the query will
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
154 be set to the same value as specified for the reference.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
155 -q S-W Gap Open Penalty (Query) (default: -400)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
156 The value applied to gap opens along the query sequence during
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
157 the Smith-Waterman score calculation.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
158 -e S-W Gap Extend Penalty (Reference) (default: -70)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
159 The value applied to gap extends during the Smith-Waterman score calculation.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
160 *Note*: Note that for backward compatibility, if -e is set
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
161 and -f is not set, the gap exten penalty for the query will
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
162 be set to the same value as specified for the reference.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
163 -f S-W Gap Extend Penalty (Query) (default: -70)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
164 The value applied to gap extends during the Smith-Waterman score calculation.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
165 -x
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
166 -h S-W Full Hit Threshold (default: 68.00%)
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
167 In letter-space, this parameter determines the threshold
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
168 score for both vectored and full Smith-Waterman alignments.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
169 Any values less than this quantity will be thrown away.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
170 *Note* This option differs slightly in meaning between letter-space and color-space.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
171 -v
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
172
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
173
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
174 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
175
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
176 **Reference**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
177
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
178 **SHRiMP**: Stephen M. Rumble, Michael Brudno, Phil Lacroute, Vladimir Yanovsky, Marc Fiume, Adrian Dalca. shrimp at cs dot toronto dot edu.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
179
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
180 </help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
181 </tool>