annotate Dotplot_Release/Step1_data_reformating.R @ 17:296e40bfe2d7 draft

Uploaded
author bornea
date Wed, 16 Mar 2016 12:11:39 -0400
parents bc752a05f16d
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
bc752a05f16d Uploaded
bornea
parents:
diff changeset
1 #!/usr/bin/env Rscript
bc752a05f16d Uploaded
bornea
parents:
diff changeset
2
bc752a05f16d Uploaded
bornea
parents:
diff changeset
3 args <- commandArgs(trailingOnly = TRUE)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
4
bc752a05f16d Uploaded
bornea
parents:
diff changeset
5 d = read.delim(args[1], header=T, sep="\t", as.is=T)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
6
bc752a05f16d Uploaded
bornea
parents:
diff changeset
7 ### Select Prey interactions where at least one Bait has BFDR <= the threshold (second argument)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
8
bc752a05f16d Uploaded
bornea
parents:
diff changeset
9 preylist=unique(c(d$PreyGene[d$BFDR <= as.numeric(args[2])]))
bc752a05f16d Uploaded
bornea
parents:
diff changeset
10 pid = d$PreyGene %in% preylist
bc752a05f16d Uploaded
bornea
parents:
diff changeset
11 d = d[pid,]
bc752a05f16d Uploaded
bornea
parents:
diff changeset
12
bc752a05f16d Uploaded
bornea
parents:
diff changeset
13 bb = unique(d$Bait)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
14 pp = unique(d$PreyGene)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
15
bc752a05f16d Uploaded
bornea
parents:
diff changeset
16 nbait = length(bb)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
17 nprey = length(pp)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
18
bc752a05f16d Uploaded
bornea
parents:
diff changeset
19 ### Reformat the SAINT output data into a prey-by-bait matrix (rows = preys, columns = baits)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
20 mat = matrix(0, nprey, nbait)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
21
bc752a05f16d Uploaded
bornea
parents:
diff changeset
22 n = nrow(d)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
23 mb = match(d$Bait, bb)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
24 mp = match(d$PreyGene, pp)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
25
bc752a05f16d Uploaded
bornea
parents:
diff changeset
26 ### Using the AvgSpec for the spectral counts
bc752a05f16d Uploaded
bornea
parents:
diff changeset
27 for(i in 1:n) {
bc752a05f16d Uploaded
bornea
parents:
diff changeset
28 mat[mp[i],mb[i]] = d$AvgSpec[i]
bc752a05f16d Uploaded
bornea
parents:
diff changeset
29 }
bc752a05f16d Uploaded
bornea
parents:
diff changeset
30
bc752a05f16d Uploaded
bornea
parents:
diff changeset
31 rownames(mat) = pp
bc752a05f16d Uploaded
bornea
parents:
diff changeset
32 colnames(mat) = bb
bc752a05f16d Uploaded
bornea
parents:
diff changeset
33
bc752a05f16d Uploaded
bornea
parents:
diff changeset
34 outfile <- paste(c(args[3]), "matrix.txt", sep="_")
bc752a05f16d Uploaded
bornea
parents:
diff changeset
35 ### The following file is the outcome of running this step.
bc752a05f16d Uploaded
bornea
parents:
diff changeset
36 write.table(mat, outfile, sep="\t", quote=F)
bc752a05f16d Uploaded
bornea
parents:
diff changeset
37
bc752a05f16d Uploaded
bornea
parents:
diff changeset
38
bc752a05f16d Uploaded
bornea
parents:
diff changeset
39
bc752a05f16d Uploaded
bornea
parents:
diff changeset
40
bc752a05f16d Uploaded
bornea
parents:
diff changeset
41