comparison SMART/galaxy/compareOverlapping.xml @ 36:44d5973c188c

Uploaded
author m-zytnicki
date Tue, 30 Apr 2013 15:02:29 -0400
parents
children
comparison
equal deleted inserted replaced
35:d94018ca4ada 36:44d5973c188c
1 <tool id="CompareOverlapping" name="compare Overlapping">
2 <description>Print all the transcripts from a first file which overlap with the transcripts from a second file.</description>
3 <command interpreter="python">
4 ../Java/Python/CompareOverlapping.py -i $formatType.inputFileName1
5 #if $formatType.FormatInputFileName1 == 'bed':
6 -f bed
7 #elif $formatType.FormatInputFileName1 == 'gff':
8 -f gff
9 #elif $formatType.FormatInputFileName1 == 'gff2':
10 -f gff2
11 #elif $formatType.FormatInputFileName1 == 'gff3':
12 -f gff3
13 #elif $formatType.FormatInputFileName1 == 'sam':
14 -f sam
15 #elif $formatType.FormatInputFileName1 == 'gtf':
16 -f gtf
17 #end if
18
19 -j $formatType2.inputFileName2
20 #if $formatType2.FormatInputFileName2 == 'bed':
21 -g bed
22 #elif $formatType2.FormatInputFileName2 == 'gff':
23 -g gff
24 #elif $formatType2.FormatInputFileName2 == 'gff2':
25 -g gff2
26 #elif $formatType2.FormatInputFileName2 == 'gff3':
27 -g gff3
28 #elif $formatType2.FormatInputFileName2 == 'sam':
29 -g sam
30 #elif $formatType2.FormatInputFileName2 == 'gtf':
31 -g gtf
32 #end if
33
34 -o $outputFileGff
35
36 #if $optionNFirstFile1.NFirstForFile1 == 'Yes':
37 -S $optionNFirstFile1.firstNtFile1
38 #end if
39 #if $optionNFirstFile2.NFirstForFile2 == 'Yes':
40 -s $optionNFirstFile2.firstNtFile2
41 #end if
42 #if $optionNLastFile1.NLastForFile1 == 'Yes':
43 -U $optionNLastFile1.lastNtFile1
44 #end if
45 #if $optionNLastFile2.NLastForFile2 == 'Yes':
46 -u $optionNLastFile2.lastNtFile2
47 #end if
48
49 #if $optionExtentionCinqFile1.extentionFile1 == 'Yes':
50 -E $optionExtentionCinqFile1.extention51
51 #end if
52 #if $optionExtentionCinqFile2.extentionFile2 == 'Yes':
53 -e $optionExtentionCinqFile2.extention52
54 #end if
55
56 #if $optionExtentionTroisFile1.extentionFile1 == 'Yes':
57 -N $optionExtentionTroisFile1.extention31
58 #end if
59 #if $optionExtentionTroisFile2.extentionFile2 == 'Yes':
60 -n $optionExtentionTroisFile2.extention32
61 #end if
62
63 #if $OptionColinearOrAntiSens.OptionCA == 'Colinear':
64 -c
65 #elif $OptionColinearOrAntiSens.OptionCA == 'AntiSens':
66 -a
67 #end if
68
69 #if $OptionDistance.Dist == 'Yes':
70 -d $OptionDistance.distance
71 #end if
72
73 #if $OptionMinOverlap.MO == 'Yes':
74 -m $OptionMinOverlap.minOverlap
75 #end if
76
77 $InvertMatch
78 $ReportIntron
79 $NotOverlapping
80
81 </command>
82
83 <inputs>
84 <conditional name="formatType">
85 <param name="FormatInputFileName1" type="select" label="Input File Format 1">
86 <option value="bed">bed</option>
87 <option value="gff">gff</option>
88 <option value="gff2">gff2</option>
89 <option value="gff3">gff3</option>
90 <option value="sam">sam</option>
91 <option value="gtf">gtf</option>
92 </param>
93 <when value="bed">
94 <param name="inputFileName1" format="bed" type="data" label="Input File 1"/>
95 </when>
96 <when value="gff">
97 <param name="inputFileName1" format="gff" type="data" label="Input File 1"/>
98 </when>
99 <when value="gff2">
100 <param name="inputFileName1" format="gff2" type="data" label="Input File 1"/>
101 </when>
102 <when value="gff3">
103 <param name="inputFileName1" format="gff3" type="data" label="Input File 1"/>
104 </when>
105 <when value="sam">
106 <param name="inputFileName1" format="sam" type="data" label="Input File 1"/>
107 </when>
108 <when value="gtf">
109 <param name="inputFileName1" format="gtf" type="data" label="Input File 1"/>
110 </when>
111 </conditional>
112
113 <conditional name="formatType2">
114 <param name="FormatInputFileName2" type="select" label="Input File Format 2">
115 <option value="bed">bed</option>
116 <option value="gff">gff</option>
117 <option value="gff2">gff2</option>
118 <option value="gff3">gff3</option>
119 <option value="sam">sam</option>
120 <option value="gtf">gtf</option>
121 </param>
122 <when value="bed">
123 <param name="inputFileName2" format="bed" type="data" label="Input File 2"/>
124 </when>
125 <when value="gff">
126 <param name="inputFileName2" format="gff" type="data" label="Input File 2"/>
127 </when>
128 <when value="gff2">
129 <param name="inputFileName2" format="gff2" type="data" label="Input File 2"/>
130 </when>
131 <when value="gff3">
132 <param name="inputFileName2" format="gff3" type="data" label="Input File 2"/>
133 </when>
134 <when value="sam">
135 <param name="inputFileName2" format="sam" type="data" label="Input File 2"/>
136 </when>
137 <when value="gtf">
138 <param name="inputFileName2" format="gtf" type="data" label="Input File 2"/>
139 </when>
140 </conditional>
141
142 <conditional name="optionNFirstFile1">
143 <param name="NFirstForFile1" type="select" label="Shrink the queries to their first N nt.">
144 <option value="Yes">Yes</option>
145 <option value="No" selected="true">No</option>
146 </param>
147 <when value="Yes">
148 <param name="firstNtFile1" type="integer" value="1" label="size" />
149 </when>
150 <when value="No">
151 </when>
152 </conditional>
153 <conditional name="optionNFirstFile2">
154 <param name="NFirstForFile2" type="select" label="Shrink the references to their first N nt.">
155 <option value="Yes">Yes</option>
156 <option value="No" selected="true">No</option>
157 </param>
158 <when value="Yes">
159 <param name="firstNtFile2" type="integer" value="1" label="size" />
160 </when>
161 <when value="No">
162 </when>
163 </conditional>
164
165 <conditional name="optionNLastFile1">
166 <param name="NLastForFile1" type="select" label="Shrink the queries to their last N nt.">
167 <option value="Yes">Yes</option>
168 <option value="No" selected="true">No</option>
169 </param>
170 <when value="Yes">
171 <param name="lastNtFile1" type="integer" value="1" label="size"/>
172 </when>
173 <when value="No">
174 </when>
175 </conditional>
176 <conditional name="optionNLastFile2">
177 <param name="NLastForFile2" type="select" label="Shrink the references to their last N nt.">
178 <option value="Yes">Yes</option>
179 <option value="No" selected="true">No</option>
180 </param>
181 <when value="Yes">
182 <param name="lastNtFile2" type="integer" value="1" label="size"/>
183 </when>
184 <when value="No">
185 </when>
186 </conditional>
187
188 <conditional name="optionExtentionCinqFile1">
189 <param name="extentionFile1" type="select" label="Extend the query features towards the 5' end">
190 <option value="Yes">Yes</option>
191 <option value="No" selected="true">No</option>
192 </param>
193 <when value="Yes">
194 <param name="extention51" type="integer" value="1" label="in file 1" />
195 </when>
196 <when value="No">
197 </when>
198 </conditional>
199
200 <conditional name="optionExtentionCinqFile2">
201 <param name="extentionFile2" type="select" label="Extend the reference features towards 5' end">
202 <option value="Yes">Yes</option>
203 <option value="No" selected="true">No</option>
204 </param>
205 <when value="Yes">
206 <param name="extention52" type="integer" value="1" label="in file 2"/>
207 </when>
208 <when value="No">
209 </when>
210 </conditional>
211
212 <conditional name="optionExtentionTroisFile1">
213 <param name="extentionFile1" type="select" label="Extend the query features towards 3' end">
214 <option value="Yes">Yes</option>
215 <option value="No" selected="true">No</option>
216 </param>
217 <when value="Yes">
218 <param name="extention31" type="integer" value="1" label="in file 1" />
219 </when>
220 <when value="No">
221 </when>
222 </conditional>
223
224 <conditional name="optionExtentionTroisFile2">
225 <param name="extentionFile2" type="select" label="Extend the reference features towards 3' end">
226 <option value="Yes">Yes</option>
227 <option value="No" selected="true">No</option>
228 </param>
229 <when value="Yes">
230 <param name="extention32" type="integer" value="1" label="in file 2" />
231 </when>
232 <when value="No">
233 </when>
234 </conditional>
235
236 <conditional name="OptionColinearOrAntiSens">
237 <param name="OptionCA" type="select" label="Report queries which are collinear/antisens w.r.t. a reference">
238 <option value="Colinear">Colinear</option>
239 <option value="AntiSens">AntiSens</option>
240 <option value="NONE" selected="true">NONE</option>
241 </param>
242 <when value="Colinear">
243 </when>
244 <when value="AntiSens">
245 </when>
246 <when value="NONE">
247 </when>
248 </conditional>
249
250 <conditional name="OptionDistance">
251 <param name="Dist" type="select" label="Maximum Distance between two reads">
252 <option value="Yes">Yes</option>
253 <option value="No" selected="true">No</option>
254 </param>
255 <when value="Yes">
256 <param name="distance" type="integer" value="0"/>
257 </when>
258 <when value="No">
259 </when>
260 </conditional>
261
262 <conditional name="OptionMinOverlap">
263 <param name="MO" type="select" label="Minimum number of overlapping between two reads">
264 <option value="Yes">Yes</option>
265 <option value="No" selected="true">No</option>
266 </param>
267 <when value="Yes">
268 <param name="minOverlap" type="integer" value="1"/>
269 </when>
270 <when value="No">
271 </when>
272 </conditional>
273 <param name="ReportIntron" type="boolean" truevalue="-t" falsevalue="" checked="false" label="Also report queries which overlap with the introns of references, or queries such that a reference is in one of its intron"/>
274 <param name="InvertMatch" type="boolean" truevalue="-x" falsevalue="" checked="false" label="Invert match: the output file will contain all query elements which do NOT overlap"/>
275 <param name="NotOverlapping" type="boolean" truevalue="-O" falsevalue="" checked="false" label="Also report the query data which do not overlap, with the nbOverlaps tag set to 0."/>
276 </inputs>
277
278 <outputs>
279 <data name="outputFileGff" format="gff3"/>
280 </outputs>
281
282 <help>
283 This script may be the most important one. It basically compares two sets of transcripts and keeps those from the first set which overlap with the second one. The first set is considered as the query set (basically, your data) and the second one is the reference set (RefSeq data, for example).
284
285 It is vital to understand that it will output the elements of the first file which overlap with the elements of the second one.
286
287 Various modifiers are also available:
288
289 -Restrict query / reference set to the first nucleotide. Useful to check if the TSS of one set overlap with the other one.
290
291 -Extend query / reference set on the 5' / 3' direction. Useful to check if one set is located upstream / downstream the other one.
292
293 -Include introns in the comparison.
294
295 -Invert selection (report those which do not overlap).
296
297 -Restrict to colinear / anti-sense overlapping data.
298
299 -Keep the query data even if they do not strictly overlap with the reference data, but are located not further away than *n* nucleotide from some reference data.
300
301 -Keep the query data with are strictly included into reference data, meaning that a query transcript such that at least 1 nucleotide does not overlap with reference data will not be presented as a solution.
302
303 The mechanism of shrinking and extending is also useful to make a fine grain comparison. For example, if you want to keep those such that the TSS is overlapping the reference set, you just shrink the query set to 1 nucleotide. Now, if you want to keep those which are overlapping you data or located 2kb downstream of it, just extend the query data in the downstream direction, and you will have what you want. You can also extend in the opposite direction to get the possible transcript factor sites which are upstream.
304
305 Some option reverses the selection. Put in other words, it performs the comparison as usual, and outputs all those query data which do not overlap.
306 </help>
307 </tool>