comparison SMART/galaxy/Clusterize.xml @ 31:0ab839023fe4

Uploaded
author m-zytnicki
date Tue, 30 Apr 2013 14:33:21 -0400
parents 94ab73e8a190
children
comparison
equal deleted inserted replaced
30:5677346472b5 31:0ab839023fe4
1 <tool id="MergingDataClusterize" name="clusterize"> 1 <tool id="MergingDataClusterize" name="Clusterize">
2 <description>Clusterize features when their genomic intervals overlap.</description> 2 <description>Clusterizes the reads when their genomic intervals overlap.</description>
3 <requirements>
4 <requirement type="set_environment">PYTHONPATH</requirement>
5 </requirements>
6 <command interpreter="python"> 3 <command interpreter="python">
7 ../Java/Python/clusterize.py -i $formatType.inputFileName 4 ../Java/Python/clusterize.py -i $formatType.inputFileName
8 #if $formatType.FormatInputFileName == 'bed': 5 #if $formatType.FormatInputFileName == 'bed':
9 -f bed 6 -f bed
10 #elif $formatType.FormatInputFileName == 'gff': 7 #elif $formatType.FormatInputFileName == 'gff':
11 -f gff 8 -f gff
12 #elif $formatType.FormatInputFileName == 'gff2': 9 #elif $formatType.FormatInputFileName == 'gff2':
13 -f gff2 10 -f gff2
14 #elif $formatType.FormatInputFileName == 'gff3': 11 #elif $formatType.FormatInputFileName == 'gff3':
15 -f gff3 12 -f gff3
13 #elif $formatType.FormatInputFileName == 'csv':
14 -f csv
16 #elif $formatType.FormatInputFileName == 'sam': 15 #elif $formatType.FormatInputFileName == 'sam':
17 -f sam 16 -f sam
18 #elif $formatType.FormatInputFileName == 'gtf': 17 #elif $formatType.FormatInputFileName == 'gtf':
19 -f gtf 18 -f gtf
20 #end if 19 #end if
21 -o $outputFileGff 20 -o $outputFileGff
22 $colinear 21 $colinear
23 $normalize 22 $normalize
24 -d $distance 23 -d $distance
24 $log $outputFileLog
25 </command> 25 </command>
26 26
27 <inputs> 27 <inputs>
28 <conditional name="formatType"> 28 <conditional name="formatType">
29 <param name="FormatInputFileName" type="select" label="Input File Format"> 29 <param name="FormatInputFileName" type="select" label="Input File Format">
30 <option value="bed">bed</option> 30 <option value="bed">bed</option>
31 <option value="gff">gff</option> 31 <option value="gff">gff</option>
32 <option value="gff2">gff2</option> 32 <option value="gff2">gff2</option>
33 <option value="gff3">gff3</option> 33 <option value="gff3">gff3</option>
34 <option value="csv">csv</option>
34 <option value="sam">sam</option> 35 <option value="sam">sam</option>
35 <option value="gtf">gtf</option> 36 <option value="gtf">gtf</option>
36 </param> 37 </param>
37 <when value="bed"> 38 <when value="bed">
38 <param name="inputFileName" format="bed" type="data" label="Input File"/> 39 <param name="inputFileName" format="bed" type="data" label="Input File"/>
44 <param name="inputFileName" format="gff2" type="data" label="Input File"/> 45 <param name="inputFileName" format="gff2" type="data" label="Input File"/>
45 </when> 46 </when>
46 <when value="gff3"> 47 <when value="gff3">
47 <param name="inputFileName" format="gff3" type="data" label="Input File"/> 48 <param name="inputFileName" format="gff3" type="data" label="Input File"/>
48 </when> 49 </when>
50 <when value="csv">
51 <param name="inputFileName" format="csv" type="data" label="Input File"/>
52 </when>
49 <when value="sam"> 53 <when value="sam">
50 <param name="inputFileName" format="sam" type="data" label="Input File"/> 54 <param name="inputFileName" format="sam" type="data" label="Input File"/>
51 </when> 55 </when>
52 <when value="gtf"> 56 <when value="gtf">
53 <param name="inputFileName" format="gtf" type="data" label="Input File"/> 57 <param name="inputFileName" format="gtf" type="data" label="Input File"/>
54 </when> 58 </when>
55 </conditional> 59 </conditional>
56 60
57 <param name="colinear" type="boolean" truevalue="-c" falsevalue="" checked="false" label="Only merge collinear features"/> 61 <param name="colinear" type="boolean" truevalue="-c" falsevalue="" checked="false" label="colinear option" help="This option clusterizes only the same strand reads"/>
58 <param name="normalize" type="boolean" truevalue="-n" falsevalue="" checked="false" label="Normalize counts" help="Only works if the nbOccurrences tag is set."/> 62 <param name="normalize" type="boolean" truevalue="-n" falsevalue="" checked="false" label="normalize option for only GFF3 file format" help="This option normalize (attention!! Only for GFF3 file!!!!!)"/>
59 <param name="distance" type="text" value="0" label="merge features if their relative distance is within N nt"/> 63 <param name="log" type="boolean" truevalue="-l" falsevalue="" checked="false" label="log option" help="This option create a log file"/>
64 <param name="distance" type="text" value="0" label="distance option" help="Limit the maximum distance between two reads"/>
60 </inputs> 65 </inputs>
61 66
62 <outputs> 67 <outputs>
63 <data name="outputFileGff" format="gff3"/> 68 <data name="outputFileGff" format="gff3"/>
69 <data name="outputFileLog" format="txt">
70 <filter>log</filter>
71 </data>
64 </outputs> 72 </outputs>
65
66 <help>
67 The script clusterizes the input genomic data. Two features are clusterized when their genomic intervals overlap. The output is a GFF3 file, where each element is a cluster. The number of elements in the cluster is given by the tag **nbElements**. The name of a cluster is the concatation of the names of its reads (like **read1--read2--read3**). Note that if the size of the name of the cluster exceeds 100 characters, it is truncated to the first 100 characters.
68
69 Some options may clusterize the features which are closer than a given distance.
70
71 By default, the tool clusterizes all features which overlap (or nearly overlap), even if they are on different strands. If you want to clusterize the features which are on the same strand only, you can specify it.
72 </help>
73 </tool> 73 </tool>