annotate tools/annotation_profiler/annotation_profiler.xml @ 1:cdcb0ce84a1b

Uploaded
author xuebing
date Fri, 09 Mar 2012 19:45:15 -0500
parents 9071e359b9a3
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
1 <tool id="Annotation_Profiler_0" name="Profile Annotations" version="1.0.0">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
2 <description>for a set of genomic intervals</description>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
3 <command interpreter="python">annotation_profiler_for_interval.py -i $input1 -c ${input1.metadata.chromCol} -s ${input1.metadata.startCol} -e ${input1.metadata.endCol} -o $out_file1 $keep_empty -p ${GALAXY_DATA_INDEX_DIR}/annotation_profiler/$dbkey $summary -b 3 -t $table_names</command>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
4 <inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
5 <param format="interval" name="input1" type="data" label="Choose Intervals">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
6 <validator type="dataset_metadata_in_file" filename="annotation_profiler_valid_builds.txt" metadata_name="dbkey" metadata_column="0" message="Profiling is not currently available for this species."/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
7 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
8 <param name="keep_empty" type="select" label="Keep Region/Table Pairs with 0 Coverage">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
9 <option value="-k">Keep</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
10 <option value="" selected="true">Discard</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
11 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
12 <param name="summary" type="select" label="Output per Region/Summary">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
13 <option value="-S">Summary</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
14 <option value="" selected="true">Per Region</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
15 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
16 <param name="table_names" type="drill_down" display="checkbox" hierarchy="recurse" multiple="true" label="Choose Tables to Use" help="Selecting no tables will result in using all tables." from_file="annotation_profiler_options.xml"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
17 </inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
18 <outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
19 <data format="input" name="out_file1">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
20 <change_format>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
21 <when input="summary" value="-S" format="tabular" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
22 </change_format>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
23 </data>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
24 </outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
25 <tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
26 <test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
27 <param name="input1" value="4.bed" dbkey="hg18"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
28 <param name="keep_empty" value=""/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
29 <param name="summary" value=""/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
30 <param name="table_names" value="acembly,affyGnf1h,knownAlt,knownGene,mrna,multiz17way,multiz28way,refGene,snp126"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
31 <output name="out_file1" file="annotation_profiler_1.out" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
32 </test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
33 <test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
34 <param name="input1" value="3.bed" dbkey="hg18"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
35 <param name="keep_empty" value=""/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
36 <param name="summary" value="-S"/> <!-- select by option value (-S is the Summary option), not by its display label -->
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
37 <param name="table_names" value="acembly,affyGnf1h,knownAlt,knownGene,mrna,multiz17way,multiz28way,refGene,snp126"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
38 <output name="out_file1" file="annotation_profiler_2.out" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
39 </test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
40 </tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
41 <help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
42 **What it does**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
43
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
44 Takes an input set of intervals and for each interval determines the base coverage of the interval by a set of features (tables) available from UCSC. Genomic regions from the input feature data have been merged by overlap / direct adjacency (e.g. a table having ranges of: 1-10, 6-12, 12-20 and 25-28 results in two merged ranges of: 1-20 and 25-28).
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
45
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
46 By default, this tool will check the coverage of your intervals against all available features; you may, however, choose to select only those tables that you want to include. Selecting a section heading will effectively cause all of its children to be selected.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
47
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
48 You may alternatively choose to receive a summary across all of the intervals that you provide.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
49
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
50 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
51
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
52 **Example**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
53
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
54 Using the interval below and selecting several tables::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
55
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
56 chr1 4558 14764 uc001aab.1 0 -
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
57
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
58 results in::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
59
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
60 chr1 4558 14764 uc001aab.1 0 - snp126Exceptions 151 142
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
61 chr1 4558 14764 uc001aab.1 0 - genomicSuperDups 10206 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
62 chr1 4558 14764 uc001aab.1 0 - chainOryLat1 3718 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
63 chr1 4558 14764 uc001aab.1 0 - multiz28way 10206 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
64 chr1 4558 14764 uc001aab.1 0 - affyHuEx1 3553 32
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
65 chr1 4558 14764 uc001aab.1 0 - netXenTro2 3050 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
66 chr1 4558 14764 uc001aab.1 0 - intronEst 10206 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
67 chr1 4558 14764 uc001aab.1 0 - xenoMrna 10203 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
68 chr1 4558 14764 uc001aab.1 0 - ctgPos 10206 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
69 chr1 4558 14764 uc001aab.1 0 - clonePos 10206 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
70 chr1 4558 14764 uc001aab.1 0 - chainStrPur2Link 1323 29
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
71 chr1 4558 14764 uc001aab.1 0 - affyTxnPhase3HeLaNuclear 9011 8
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
72 chr1 4558 14764 uc001aab.1 0 - snp126orthoPanTro2RheMac2 61 58
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
73 chr1 4558 14764 uc001aab.1 0 - snp126 205 192
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
74 chr1 4558 14764 uc001aab.1 0 - chainEquCab1 10206 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
75 chr1 4558 14764 uc001aab.1 0 - netGalGal3 3686 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
76 chr1 4558 14764 uc001aab.1 0 - phastCons28wayPlacMammal 10172 3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
77
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
78 Where::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
79
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
80 The first added column is the table name.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
81 The second added column is the number of bases covered by the table.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
82 The third added column is the number of regions from the table that are covered by the interval.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
83
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
84 Alternatively, requesting a summary, using the intervals below and selecting several tables::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
85
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
86 chr1 4558 14764 uc001aab.1 0 -
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
87 chr1 4558 19346 uc001aac.1 0 -
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
88
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
89 results in::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
90
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
91 #tableName tableSize tableRegionCount allIntervalCount allIntervalSize allCoverage allTableRegionsOverlaped allIntervalsOverlapingTable nrIntervalCount nrIntervalSize nrCoverage nrTableRegionsOverlaped nrIntervalsOverlapingTable
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
92 snp126Exceptions 133601 92469 2 24994 388 359 2 1 14788 237 217 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
93 genomicSuperDups 12268847 657 2 24994 24994 2 2 1 14788 14788 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
94 chainOryLat1 70337730 2542 2 24994 7436 2 2 1 14788 3718 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
95 affyHuEx1 15703901 112274 2 24994 7846 70 2 1 14788 4293 38 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
96 netXenTro2 111440392 1877 2 24994 6100 2 2 1 14788 3050 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
97 snp126orthoPanTro2RheMac2 700436 690674 2 24994 124 118 2 1 14788 63 60 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
98 intronEst 135796064 2332 2 24994 24994 2 2 1 14788 14788 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
99 xenoMrna 129031327 1586 2 24994 20406 2 2 1 14788 10203 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
100 snp126 956976 838091 2 24994 498 461 2 1 14788 293 269 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
101 clonePos 224999719 39 2 24994 24994 2 2 1 14788 14788 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
102 chainStrPur2Link 7948016 119841 2 24994 2646 58 2 1 14788 1323 29 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
103 affyTxnPhase3HeLaNuclear 136797870 140244 2 24994 22601 17 2 1 14788 13590 9 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
104 multiz28way 225928588 38 2 24994 24994 2 2 1 14788 14788 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
105 ctgPos 224999719 39 2 24994 24994 2 2 1 14788 14788 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
106 chainEquCab1 246306414 141 2 24994 24994 2 2 1 14788 14788 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
107 netGalGal3 203351973 461 2 24994 7372 2 2 1 14788 3686 1 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
108 phastCons28wayPlacMammal 221017670 22803 2 24994 24926 6 2 1 14788 14754 3 1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
109
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
110 Where::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
111
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
112 tableName is the name of the table
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
113 tableChromosomeCoverage is the number of positions existing in the table for only the chromosomes that were referenced by the interval file
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
114 tableChromosomeCount is the number of regions existing in the table for only the chromosomes that were referenced by the interval file
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
115 tableRegionCoverage is the number of positions existing in the table between the minimal and maximal bounding regions that were referenced by the interval file
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
116 tableRegionCount is the number of regions existing in the table between the minimal and maximal bounding regions that were referenced by the interval file
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
117
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
118 allIntervalCount is the number of provided intervals
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
119 allIntervalSize is the sum of the lengths of the provided intervals
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
120 allCoverage is the sum of the coverage for each provided interval
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
121 allTableRegionsOverlapped is the sum of the number of regions of the table (non-unique) that were overlapped for each interval
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
122 allIntervalsOverlappingTable is the number of provided intervals which overlap the table
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
123
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
124 nrIntervalCount is the number of non-redundant intervals
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
125 nrIntervalSize is the sum of the lengths of non-redundant intervals
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
126 nrCoverage is the sum of the coverage of non-redundant intervals
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
127 nrTableRegionsOverlapped is the number of regions of the table (unique) that were overlapped by the non-redundant intervals
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
128 nrIntervalsOverlappingTable is the number of non-redundant intervals which overlap the table
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
129
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
130
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
131 .. class:: infomark
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
132
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
133 **TIP:** non-redundant (nr) refers to the set of intervals that remains after the intervals provided have been merged to resolve overlaps.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
134
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
135 </help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
136 </tool>