annotate mytools/binaverage.xml @ 9:87eb5c5ddfe9

Uploaded
author xuebing
date Fri, 09 Mar 2012 20:01:43 -0500
parents f0dc65e7f6c0
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
7
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
1 <tool id="binaverage" name="bin and average">
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
2 <description>of numeric columns</description>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
3 <command>cat $script_file | R --vanilla --slave > $out_log </command>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
4 <inputs>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
5 <param name="input" type="data" format="tabular" label="Data file"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
6 <param name="data_avg" type="integer" value="1" label="Column number of the data to average"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
7 <param name="label_avg" type="text" value="label-avg" size="30" label="data label"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
8 <param name="log_avg" label="log2 transform the data" type="boolean" truevalue="logavg" falsevalue="none" checked="False"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
9 <param name="data_bin" type="integer" value="2" label="Column number of the data used to make bins"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
10 <param name="label_bin" type="text" value="label-bin" size="30" label="data label"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
11 <param name="log_bin" label="log2 transform the data" type="boolean" truevalue="logbin" falsevalue="none" checked="False"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
12 <param name="nbin" type="integer" value="3" label="number of bins"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
13 <param name="bintype" type="select" label="Bin by rank or by value" >
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
14 <option value="rank" selected="true">by rank: bins have the same number of data points</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
15 <option value="value">by value: bins may have different number of data points</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
16 </param>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
17 <param name="legendloc" type="select" label="legend location on CDF plot" >
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
18 <option value="bottomright" selected="true">bottomright</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
19 <option value="bottomleft">bottomleft</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
20 <option value="bottom">bottom</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
21 <option value="left">left</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
22 <option value="topleft">topleft</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
23 <option value="top">top</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
24 <option value="topright">topright</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
25 <option value="right">right</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
26 <option value="center">center</option>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
27 </param>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
28
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
29 <param name="title" type="text" value="bin-average" size="50" label="title of this analysis"/>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
30
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
31 </inputs>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
32
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
33 <configfiles>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
34 <configfile name="script_file">
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
35 ## Suppress R warning messages (a negative 'warn' value makes R ignore all warnings)
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
36 options(warn=-1)
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
37 source("/Users/xuebing/galaxy-dist/tools/mytools/cdf.r")
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
38 x = read.table("${input}",sep='\t')
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
39 x = x[,c($data_bin,$data_avg)]
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
40 label_avg = "${label_avg}"
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
41 label_bin = "${label_bin}"
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
42 if ("${log_bin}" == "logbin"){
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
43 x[,1] = log2(1+x[,1])
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
44 label_bin = paste('log2',label_bin)
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
45 }
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
46 if ("${log_avg}" == "logavg"){
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
47 x[,2] = log2(1+x[,2])
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
48 label_avg = paste('log2',label_avg)
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
49 }
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
50 res = binaverage(x,$nbin,"${bintype}")
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
51 attach(res)
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
52 for (i in 1:${nbin}){
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
53 print(paste(label_bin,labels[i],sep=':'))
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
54 print(summary(binned[[i]]))
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
55 }
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
56 pdf("${out_file}")
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
57 mycdf(binned,"${title}",labels,"$legendloc",label_avg,label_bin)
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
58 dev.off()
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
59 </configfile>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
60 </configfiles>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
61
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
62 <outputs>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
63 <data format="txt" name="out_log" label="${title}: (log)" />
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
64 <data format="pdf" name="out_file" label="${title}: (plot)" />
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
65 </outputs>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
66
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
67 <help>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
68
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
69 .. class:: infomark
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
70
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
71 This tool generates a barplot and a CDF plot comparing the values in one numeric column after the rows have been binned by a second numeric column. The input should have at least two numeric columns. One of the columns is used to group rows into bins, and the values in the other column are then compared across bins using a barplot, a CDF plot, and a KS test.
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
72
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
73 </help>
f0dc65e7f6c0 Uploaded
xuebing
parents:
diff changeset
74 </tool>