Mercurial > repos > jfb > kinatest_r_7_7testing
comparison kinatestid_r/Kinatest-R_part2.R @ 4:2f3df9b1c05b draft
Uploaded
author | jfb |
---|---|
date | Tue, 06 Feb 2018 17:16:05 -0500 |
parents | |
children | f80306fc5d69 |
comparison
equal
deleted
inserted
replaced
3:65f235b5fe14 | 4:2f3df9b1c05b |
---|---|
1 #test myself: this script should take in amino acids for each of the 9 positions and give out every single combination of those AAs | |
2 | |
3 #need to do following: fix it so that the accession numbers stay with the substrates, | |
4 #also the neg false constant is totaly unphos'd Ys found by FASTA-2-CSV system# uniprot | |
5 | |
6 #HOW MANY: IF THERE'S two aas in each position you get 2^9, so I assume the numbers are: | |
7 #(number in position-4)*(number in position -3)*(number in position -2)...=total | |
8 # require(rJava) | |
9 # require(xlsxjars) | |
10 # require(xlsx) | |
11 # # require(readxl) | |
12 | |
13 View(SDtable) | |
14 bareSDs<-SDtable[2:21,2:16] | |
15 goodones<-bareSDs>2 | |
16 | |
17 Positionm7<-which(goodones[,1] %in% TRUE) | |
18 if (length(Positionm7)<1){Positionm7<-which(bareSDs[,1]==max(bareSDs[,1]))} | |
19 Positionm6<-which(goodones[,2] %in% TRUE) | |
20 if (length(Positionm6)<1){Positionm6<-which(bareSDs[,2]==max(bareSDs[,2]))} | |
21 Positionm5<-which(goodones[,3] %in% TRUE) | |
22 if (length(Positionm5)<1){Positionm5<-which(bareSDs[,3]==max(bareSDs[,3]))} | |
23 Positionm4<-which(goodones[,4] %in% TRUE) | |
24 if (length(Positionm4)<1){Positionm4<-which(bareSDs[,4]==max(bareSDs[,4]))} | |
25 Positionm3<-which(goodones[,5] %in% TRUE) | |
26 if (length(Positionm3)<1){Positionm3<-which(bareSDs[,5]==max(bareSDs[,5]))} | |
27 Positionm2<-which(goodones[,6] %in% TRUE) | |
28 if (length(Positionm2)<1){Positionm2<-which(bareSDs[,6]==max(bareSDs[,6]))} | |
29 Positionm1<-which(goodones[,7] %in% TRUE) | |
30 if (length(Positionm1)<1){Positionm1<-which(bareSDs[,7]==max(bareSDs[,7]))} | |
31 | |
32 Positiond0<-which(goodones[,8] %in% TRUE) | |
33 if (length(Positiond0)<1){Positiond0<-which(bareSDs[,8]==max(bareSDs[,8]))} | |
34 | |
35 Positionp1<-which(goodones[,9] %in% TRUE) | |
36 if (length(Positionp1)<1){Positionp1<-which(bareSDs[,9]==max(bareSDs[,9]))} | |
37 Positionp2<-which(goodones[,10] %in% TRUE) | |
38 if (length(Positionp2)<1){Positionp2<-which(bareSDs[,10]==max(bareSDs[,10]))} | |
39 Positionp3<-which(goodones[,11] %in% TRUE) | |
40 if (length(Positionp3)<1){Positionp3<-which(bareSDs[,11]==max(bareSDs[,11]))} | |
41 Positionp4<-which(goodones[,12] %in% TRUE) | |
42 if (length(Positionp4)<1){Positionp4<-which(bareSDs[,12]==max(bareSDs[,12]))} | |
43 Positionp5<-which(goodones[,13] %in% TRUE) | |
44 if (length(Positionp5)<1){Positionp5<-which(bareSDs[,13]==max(bareSDs[,13]))} | |
45 Positionp6<-which(goodones[,14] %in% TRUE) | |
46 if (length(Positionp6)<1){Positionp6<-which(bareSDs[,14]==max(bareSDs[,14]))} | |
47 Positionp7<-which(goodones[,15] %in% TRUE) | |
48 if (length(Positionp7)<1){Positionp7<-which(bareSDs[,15]==max(bareSDs[,15]))} | |
49 | |
50 aa_props2 <- c("1"="A", "2"="C", "3"="D", "4"="E", "5"="F", "6"="G", "7"="H", "8"="I", "9"="K", "10"="L", "11"="M", "12"="N", | |
51 "13"="P", "14"="Q", "15"="R", "16"="S", "17"="T", "18"="V", "19"="W", "20"="Y") | |
52 aa_props2<-c(1="A") | |
53 | |
54 Positionm7<-sapply(Positionm7, function (x) aa_props2[x]) | |
55 Positionm6<-sapply(Positionm6, function (x) aa_props2[x]) | |
56 Positionm5<-sapply(Positionm5, function (x) aa_props2[x]) | |
57 Positionm4<-sapply(Positionm4, function (x) aa_props2[x]) | |
58 Positionm3<-sapply(Positionm3, function (x) aa_props2[x]) | |
59 Positionm2<-sapply(Positionm2, function (x) aa_props2[x]) | |
60 Positionm1<-sapply(Positionm1, function (x) aa_props2[x]) | |
61 Positiond0<-sapply(Positiond0, function (x) aa_props2[x]) | |
62 Positionp1<-sapply(Positionp1, function (x) aa_props2[x]) | |
63 Positionp2<-sapply(Positionp2, function (x) aa_props2[x]) | |
64 Positionp3<-sapply(Positionp3, function (x) aa_props2[x]) | |
65 Positionp4<-sapply(Positionp4, function (x) aa_props2[x]) | |
66 Positionp5<-sapply(Positionp5, function (x) aa_props2[x]) | |
67 Positionp6<-sapply(Positionp6, function (x) aa_props2[x]) | |
68 Positionp7<-sapply(Positionp7, function (x) aa_props2[x]) | |
69 | |
70 | |
71 # Positionm7<-c("D","H","N","V") | |
72 # Positionm6<-c("E","V") | |
73 # Positionm5<-c("D","H") | |
74 # Positionm4<-c("D","N") | |
75 # Positionm3<-c("D","E","F","Q") | |
76 # Positionm2<-c("D","N","Q","S") | |
77 # Positionm1<-c("F","I","L") | |
78 # Positiond0<-c("Y") | |
79 # Positionp1<-c("A","E") | |
80 # Positionp2<-c("T","S","Q","E") | |
81 # Positionp3<-c("V") | |
82 # Positionp4<-c("K") | |
83 # Positionp5<-c("K") | |
84 # Positionp6<-c("K") | |
85 # Positionp7<-c("R") | |
86 #this is where the amino acids for each position are given. m means minus, p mean plus | |
87 ######################################## | |
88 # ScreenerFilename<-"C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls" | |
89 | |
90 | |
91 | |
92 | |
93 | |
94 | |
95 | |
96 | |
97 | |
98 | |
99 | |
100 screaner<-read.csv(ScreenerFilename, header = FALSE, stringsAsFactors = FALSE) | |
101 | |
102 | |
103 Abl<-screaner[2:25,] | |
104 Arg<-screaner[27:50,] | |
105 Btk<-screaner[52:75,] | |
106 Csk<-screaner[77:100,] | |
107 Fyn<-screaner[102:125,] | |
108 Hck<-screaner[127:150,] | |
109 JAK2<-screaner[152:175,] | |
110 Lck<-screaner[177:200,] | |
111 Lyn<-screaner[202:225,] | |
112 Pyk2<-screaner[227:250,] | |
113 Src<-screaner[252:275,] | |
114 Syk<-screaner[277:300,] | |
115 Yes<-screaner[302:325,] | |
116 | |
117 #two questions: why are we doing BTK when we already have a bioninformatics page about it? | |
118 #two I reran everything and only get 96 positions of interest in the SD table | |
119 | |
120 | |
121 | |
122 | |
123 | |
124 | |
125 | |
126 | |
127 | |
128 #Do_You_want_An_Excel_Output_Questionmark<-"NO" | |
129 GeneratedPeptidesFile<-"GeneratedPeptidesFile.csv" | |
130 | |
131 | |
132 # Abl<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 4) | |
133 # Arg<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 5) | |
134 # Btk<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 6) | |
135 # Csk<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 7) | |
136 # Fyn<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 8) | |
137 # Hck<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 9) | |
138 # JAK2<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 10) | |
139 # Lck<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 11) | |
140 # Lyn<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 12) | |
141 # Pyk2<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 13) | |
142 # Src<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 14) | |
143 # Syk<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 15) | |
144 # Yes<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 16) | |
145 # | |
146 | |
147 | |
148 "A"=1 | |
149 "C"=2 | |
150 "D"=3 | |
151 "E"=4 | |
152 "F"=5 | |
153 "G"=6 | |
154 "H"=7 | |
155 "I"=8 | |
156 "K"=9 | |
157 "L"=10 | |
158 "M"=11 | |
159 "N"=12 | |
160 "P"=13 | |
161 "Q"=14 | |
162 "R"=15 | |
163 "S"=16 | |
164 "T"=17 | |
165 "V"=18 | |
166 "W"=19 | |
167 "Y"=20 | |
168 | |
169 aa_props <- c("A"=A, "C"=C, "D"=D, "E"=E, "F"=F,"G"=G,"H"=H,"I"=I,"K"=K,"L"=L,"M"=M,"N"=N,"P"=P,"Q"=Q,"R"=R, | |
170 "S"=S,"T"=T,"V"=V,"W"=W,"Y"=Y,"xY"=Y,"O"=21) | |
171 | |
172 number15<-sapply(Positionm7, function (x) aa_props[x]) | |
173 number14<-sapply(Positionm6, function (x) aa_props[x]) | |
174 number13<-sapply(Positionm5, function (x) aa_props[x]) | |
175 number1 <- sapply(Positionm4, function (x) aa_props[x]) | |
176 number2 <- sapply(Positionm3, function (x) aa_props[x]) | |
177 number3 <- sapply(Positionm2, function (x) aa_props[x]) | |
178 number4 <- sapply(Positionm1, function (x) aa_props[x]) | |
179 number5 <- sapply(Positiond0, function (x) aa_props[x]) | |
180 number6 <- sapply(Positionp1, function (x) aa_props[x]) | |
181 number7 <- sapply(Positionp2, function (x) aa_props[x]) | |
182 number8 <- sapply(Positionp3, function (x) aa_props[x]) | |
183 number9 <- sapply(Positionp4, function (x) aa_props[x]) | |
184 number10<-sapply(Positionp5, function (x) aa_props[x]) | |
185 number11<-sapply(Positionp6, function (x) aa_props[x]) | |
186 number12<-sapply(Positionp7, function (x) aa_props[x]) | |
187 | |
188 # number1<-Positionm4 | |
189 # number2<-Positionm3 | |
190 # number3<-Positionm2 | |
191 # number4<-Positionm1 | |
192 # number5<-Positiond0 | |
193 # number6<-Positionp1 | |
194 # number7<-Positionp2 | |
195 # number8<-Positionp3 | |
196 # number9<-Positionp4 | |
197 | |
198 ############################# | |
199 #here I create the Abl seqs with proper value for each number | |
200 if (1==0){ | |
201 Ablnumber1<- gsub("A",A,Ablnumber1,perl = TRUE) | |
202 Ablnumber1<- gsub("C",C,Ablnumber1,perl = TRUE) | |
203 Ablnumber1<- gsub("D",D,Ablnumber1,perl = TRUE) | |
204 Ablnumber1<- gsub("E",E,Ablnumber1,perl = TRUE) | |
205 Ablnumber1<- gsub("F",F,Ablnumber1,perl = TRUE) | |
206 Ablnumber1<- gsub("G",G,Ablnumber1,perl = TRUE) | |
207 Ablnumber1<- gsub("H",H,Ablnumber1,perl = TRUE) | |
208 Ablnumber1<- gsub("I",I,Ablnumber1,perl = TRUE) | |
209 Ablnumber1<- gsub("K",K,Ablnumber1,perl = TRUE) | |
210 Ablnumber1<- gsub("L",L,Ablnumber1,perl = TRUE) | |
211 Ablnumber1<- gsub("M",M,Ablnumber1,perl = TRUE) | |
212 Ablnumber1<- gsub("N",N,Ablnumber1,perl = TRUE) | |
213 Ablnumber1<- gsub("P",P,Ablnumber1,perl = TRUE) | |
214 Ablnumber1<- gsub("Q",Q,Ablnumber1,perl = TRUE) | |
215 Ablnumber1<- gsub("R",R,Ablnumber1,perl = TRUE) | |
216 Ablnumber1<- gsub("S",S,Ablnumber1,perl = TRUE) | |
217 Ablnumber1<- gsub("T",T,Ablnumber1,perl = TRUE) | |
218 Ablnumber1<- gsub("V",V,Ablnumber1,perl = TRUE) | |
219 Ablnumber1<- gsub("W",W,Ablnumber1,perl = TRUE) | |
220 Ablnumber1<- gsub("Y",Y,Ablnumber1,perl = TRUE) | |
221 | |
222 Ablnumber2<- gsub("A",A,Ablnumber2,perl = TRUE) | |
223 Ablnumber2<- gsub("C",C,Ablnumber2,perl = TRUE) | |
224 Ablnumber2<- gsub("D",D,Ablnumber2,perl = TRUE) | |
225 Ablnumber2<- gsub("E",E,Ablnumber2,perl = TRUE) | |
226 Ablnumber2<- gsub("F",F,Ablnumber2,perl = TRUE) | |
227 Ablnumber2<- gsub("G",G,Ablnumber2,perl = TRUE) | |
228 Ablnumber2<- gsub("H",H,Ablnumber2,perl = TRUE) | |
229 Ablnumber2<- gsub("I",I,Ablnumber2,perl = TRUE) | |
230 Ablnumber2<- gsub("K",K,Ablnumber2,perl = TRUE) | |
231 Ablnumber2<- gsub("L",L,Ablnumber2,perl = TRUE) | |
232 Ablnumber2<- gsub("M",M,Ablnumber2,perl = TRUE) | |
233 Ablnumber2<- gsub("N",N,Ablnumber2,perl = TRUE) | |
234 Ablnumber2<- gsub("P",P,Ablnumber2,perl = TRUE) | |
235 Ablnumber2<- gsub("Q",Q,Ablnumber2,perl = TRUE) | |
236 Ablnumber2<- gsub("R",R,Ablnumber2,perl = TRUE) | |
237 Ablnumber2<- gsub("S",S,Ablnumber2,perl = TRUE) | |
238 Ablnumber2<- gsub("T",T,Ablnumber2,perl = TRUE) | |
239 Ablnumber2<- gsub("V",V,Ablnumber2,perl = TRUE) | |
240 Ablnumber2<- gsub("W",W,Ablnumber2,perl = TRUE) | |
241 Ablnumber2<- gsub("Y",Y,Ablnumber2,perl = TRUE) | |
242 | |
243 Ablnumber3<- gsub("A",A,Ablnumber3,perl = TRUE) | |
244 Ablnumber3<- gsub("C",C,Ablnumber3,perl = TRUE) | |
245 Ablnumber3<- gsub("D",D,Ablnumber3,perl = TRUE) | |
246 Ablnumber3<- gsub("E",E,Ablnumber3,perl = TRUE) | |
247 Ablnumber3<- gsub("F",F,Ablnumber3,perl = TRUE) | |
248 Ablnumber3<- gsub("G",G,Ablnumber3,perl = TRUE) | |
249 Ablnumber3<- gsub("H",H,Ablnumber3,perl = TRUE) | |
250 Ablnumber3<- gsub("I",I,Ablnumber3,perl = TRUE) | |
251 Ablnumber3<- gsub("K",K,Ablnumber3,perl = TRUE) | |
252 Ablnumber3<- gsub("L",L,Ablnumber3,perl = TRUE) | |
253 Ablnumber3<- gsub("M",M,Ablnumber3,perl = TRUE) | |
254 Ablnumber3<- gsub("N",N,Ablnumber3,perl = TRUE) | |
255 Ablnumber3<- gsub("P",P,Ablnumber3,perl = TRUE) | |
256 Ablnumber3<- gsub("Q",Q,Ablnumber3,perl = TRUE) | |
257 Ablnumber3<- gsub("R",R,Ablnumber3,perl = TRUE) | |
258 Ablnumber3<- gsub("S",S,Ablnumber3,perl = TRUE) | |
259 Ablnumber3<- gsub("T",T,Ablnumber3,perl = TRUE) | |
260 Ablnumber3<- gsub("V",V,Ablnumber3,perl = TRUE) | |
261 Ablnumber3<- gsub("W",W,Ablnumber3,perl = TRUE) | |
262 Ablnumber3<- gsub("Y",Y,Ablnumber3,perl = TRUE) | |
263 | |
264 Ablnumber4<- gsub("A",A,Ablnumber4,perl = TRUE) | |
265 Ablnumber4<- gsub("C",C,Ablnumber4,perl = TRUE) | |
266 Ablnumber4<- gsub("D",D,Ablnumber4,perl = TRUE) | |
267 Ablnumber4<- gsub("E",E,Ablnumber4,perl = TRUE) | |
268 Ablnumber4<- gsub("F",F,Ablnumber4,perl = TRUE) | |
269 Ablnumber4<- gsub("G",G,Ablnumber4,perl = TRUE) | |
270 Ablnumber4<- gsub("H",H,Ablnumber4,perl = TRUE) | |
271 Ablnumber4<- gsub("I",I,Ablnumber4,perl = TRUE) | |
272 Ablnumber4<- gsub("K",K,Ablnumber4,perl = TRUE) | |
273 Ablnumber4<- gsub("L",L,Ablnumber4,perl = TRUE) | |
274 Ablnumber4<- gsub("M",M,Ablnumber4,perl = TRUE) | |
275 Ablnumber4<- gsub("N",N,Ablnumber4,perl = TRUE) | |
276 Ablnumber4<- gsub("P",P,Ablnumber4,perl = TRUE) | |
277 Ablnumber4<- gsub("Q",Q,Ablnumber4,perl = TRUE) | |
278 Ablnumber4<- gsub("R",R,Ablnumber4,perl = TRUE) | |
279 Ablnumber4<- gsub("S",S,Ablnumber4,perl = TRUE) | |
280 Ablnumber4<- gsub("T",T,Ablnumber4,perl = TRUE) | |
281 Ablnumber4<- gsub("V",V,Ablnumber4,perl = TRUE) | |
282 Ablnumber4<- gsub("W",W,Ablnumber4,perl = TRUE) | |
283 Ablnumber4<- gsub("Y",Y,Ablnumber4,perl = TRUE) | |
284 | |
285 Ablnumber5<- gsub("A",A,Ablnumber5,perl = TRUE) | |
286 Ablnumber5<- gsub("C",C,Ablnumber5,perl = TRUE) | |
287 Ablnumber5<- gsub("D",D,Ablnumber5,perl = TRUE) | |
288 Ablnumber5<- gsub("E",E,Ablnumber5,perl = TRUE) | |
289 Ablnumber5<- gsub("F",F,Ablnumber5,perl = TRUE) | |
290 Ablnumber5<- gsub("G",G,Ablnumber5,perl = TRUE) | |
291 Ablnumber5<- gsub("H",H,Ablnumber5,perl = TRUE) | |
292 Ablnumber5<- gsub("I",I,Ablnumber5,perl = TRUE) | |
293 Ablnumber5<- gsub("K",K,Ablnumber5,perl = TRUE) | |
294 Ablnumber5<- gsub("L",L,Ablnumber5,perl = TRUE) | |
295 Ablnumber5<- gsub("M",M,Ablnumber5,perl = TRUE) | |
296 Ablnumber5<- gsub("N",N,Ablnumber5,perl = TRUE) | |
297 Ablnumber5<- gsub("P",P,Ablnumber5,perl = TRUE) | |
298 Ablnumber5<- gsub("Q",Q,Ablnumber5,perl = TRUE) | |
299 Ablnumber5<- gsub("R",R,Ablnumber5,perl = TRUE) | |
300 Ablnumber5<- gsub("S",S,Ablnumber5,perl = TRUE) | |
301 Ablnumber5<- gsub("T",T,Ablnumber5,perl = TRUE) | |
302 Ablnumber5<- gsub("V",V,Ablnumber5,perl = TRUE) | |
303 Ablnumber5<- gsub("W",W,Ablnumber5,perl = TRUE) | |
304 Ablnumber5<- gsub("Y",Y,Ablnumber5,perl = TRUE) | |
305 | |
306 Ablnumber6<- gsub("A",A,Ablnumber6,perl = TRUE) | |
307 Ablnumber6<- gsub("C",C,Ablnumber6,perl = TRUE) | |
308 Ablnumber6<- gsub("D",D,Ablnumber6,perl = TRUE) | |
309 Ablnumber6<- gsub("E",E,Ablnumber6,perl = TRUE) | |
310 Ablnumber6<- gsub("F",F,Ablnumber6,perl = TRUE) | |
311 Ablnumber6<- gsub("G",G,Ablnumber6,perl = TRUE) | |
312 Ablnumber6<- gsub("H",H,Ablnumber6,perl = TRUE) | |
313 Ablnumber6<- gsub("I",I,Ablnumber6,perl = TRUE) | |
314 Ablnumber6<- gsub("K",K,Ablnumber6,perl = TRUE) | |
315 Ablnumber6<- gsub("L",L,Ablnumber6,perl = TRUE) | |
316 Ablnumber6<- gsub("M",M,Ablnumber6,perl = TRUE) | |
317 Ablnumber6<- gsub("N",N,Ablnumber6,perl = TRUE) | |
318 Ablnumber6<- gsub("P",P,Ablnumber6,perl = TRUE) | |
319 Ablnumber6<- gsub("Q",Q,Ablnumber6,perl = TRUE) | |
320 Ablnumber6<- gsub("R",R,Ablnumber6,perl = TRUE) | |
321 Ablnumber6<- gsub("S",S,Ablnumber6,perl = TRUE) | |
322 Ablnumber6<- gsub("T",T,Ablnumber6,perl = TRUE) | |
323 Ablnumber6<- gsub("V",V,Ablnumber6,perl = TRUE) | |
324 Ablnumber6<- gsub("W",W,Ablnumber6,perl = TRUE) | |
325 Ablnumber6<- gsub("Y",Y,Ablnumber6,perl = TRUE) | |
326 | |
327 Ablnumber7<- gsub("A",A,Ablnumber7,perl = TRUE) | |
328 Ablnumber7<- gsub("C",C,Ablnumber7,perl = TRUE) | |
329 Ablnumber7<- gsub("D",D,Ablnumber7,perl = TRUE) | |
330 Ablnumber7<- gsub("E",E,Ablnumber7,perl = TRUE) | |
331 Ablnumber7<- gsub("F",F,Ablnumber7,perl = TRUE) | |
332 Ablnumber7<- gsub("G",G,Ablnumber7,perl = TRUE) | |
333 Ablnumber7<- gsub("H",H,Ablnumber7,perl = TRUE) | |
334 Ablnumber7<- gsub("I",I,Ablnumber7,perl = TRUE) | |
335 Ablnumber7<- gsub("K",K,Ablnumber7,perl = TRUE) | |
336 Ablnumber7<- gsub("L",L,Ablnumber7,perl = TRUE) | |
337 Ablnumber7<- gsub("M",M,Ablnumber7,perl = TRUE) | |
338 Ablnumber7<- gsub("N",N,Ablnumber7,perl = TRUE) | |
339 Ablnumber7<- gsub("P",P,Ablnumber7,perl = TRUE) | |
340 Ablnumber7<- gsub("Q",Q,Ablnumber7,perl = TRUE) | |
341 Ablnumber7<- gsub("R",R,Ablnumber7,perl = TRUE) | |
342 Ablnumber7<- gsub("S",S,Ablnumber7,perl = TRUE) | |
343 Ablnumber7<- gsub("T",T,Ablnumber7,perl = TRUE) | |
344 Ablnumber7<- gsub("V",V,Ablnumber7,perl = TRUE) | |
345 Ablnumber7<- gsub("W",W,Ablnumber7,perl = TRUE) | |
346 Ablnumber7<- gsub("Y",Y,Ablnumber7,perl = TRUE) | |
347 | |
348 Ablnumber8<- gsub("A",A,Ablnumber8,perl = TRUE) | |
349 Ablnumber8<- gsub("C",C,Ablnumber8,perl = TRUE) | |
350 Ablnumber8<- gsub("D",D,Ablnumber8,perl = TRUE) | |
351 Ablnumber8<- gsub("E",E,Ablnumber8,perl = TRUE) | |
352 Ablnumber8<- gsub("F",F,Ablnumber8,perl = TRUE) | |
353 Ablnumber8<- gsub("G",G,Ablnumber8,perl = TRUE) | |
354 Ablnumber8<- gsub("H",H,Ablnumber8,perl = TRUE) | |
355 Ablnumber8<- gsub("I",I,Ablnumber8,perl = TRUE) | |
356 Ablnumber8<- gsub("K",K,Ablnumber8,perl = TRUE) | |
357 Ablnumber8<- gsub("L",L,Ablnumber8,perl = TRUE) | |
358 Ablnumber8<- gsub("M",M,Ablnumber8,perl = TRUE) | |
359 Ablnumber8<- gsub("N",N,Ablnumber8,perl = TRUE) | |
360 Ablnumber8<- gsub("P",P,Ablnumber8,perl = TRUE) | |
361 Ablnumber8<- gsub("Q",Q,Ablnumber8,perl = TRUE) | |
362 Ablnumber8<- gsub("R",R,Ablnumber8,perl = TRUE) | |
363 Ablnumber8<- gsub("S",S,Ablnumber8,perl = TRUE) | |
364 Ablnumber8<- gsub("T",T,Ablnumber8,perl = TRUE) | |
365 Ablnumber8<- gsub("V",V,Ablnumber8,perl = TRUE) | |
366 Ablnumber8<- gsub("W",W,Ablnumber8,perl = TRUE) | |
367 Ablnumber8<- gsub("Y",Y,Ablnumber8,perl = TRUE) | |
368 | |
369 Ablnumber9<- gsub("A",A,Ablnumber9,perl = TRUE) | |
370 Ablnumber9<- gsub("C",C,Ablnumber9,perl = TRUE) | |
371 Ablnumber9<- gsub("D",D,Ablnumber9,perl = TRUE) | |
372 Ablnumber9<- gsub("E",E,Ablnumber9,perl = TRUE) | |
373 Ablnumber9<- gsub("F",F,Ablnumber9,perl = TRUE) | |
374 Ablnumber9<- gsub("G",G,Ablnumber9,perl = TRUE) | |
375 Ablnumber9<- gsub("H",H,Ablnumber9,perl = TRUE) | |
376 Ablnumber9<- gsub("I",I,Ablnumber9,perl = TRUE) | |
377 Ablnumber9<- gsub("K",K,Ablnumber9,perl = TRUE) | |
378 Ablnumber9<- gsub("L",L,Ablnumber9,perl = TRUE) | |
379 Ablnumber9<- gsub("M",M,Ablnumber9,perl = TRUE) | |
380 Ablnumber9<- gsub("N",N,Ablnumber9,perl = TRUE) | |
381 Ablnumber9<- gsub("P",P,Ablnumber9,perl = TRUE) | |
382 Ablnumber9<- gsub("Q",Q,Ablnumber9,perl = TRUE) | |
383 Ablnumber9<- gsub("R",R,Ablnumber9,perl = TRUE) | |
384 Ablnumber9<- gsub("S",S,Ablnumber9,perl = TRUE) | |
385 Ablnumber9<- gsub("T",T,Ablnumber9,perl = TRUE) | |
386 Ablnumber9<- gsub("V",V,Ablnumber9,perl = TRUE) | |
387 Ablnumber9<- gsub("W",W,Ablnumber9,perl = TRUE) | |
388 Ablnumber9<- gsub("Y",Y,Ablnumber9,perl = TRUE) | |
389 } | |
390 ######################################## | |
391 | |
392 | |
393 total=length(Positionp7)*length(Positionp6)*length(Positionp5)*length(Positionp4)*length(Positionp3)*(length(Positionp2))*length(Positionp1)* | |
394 length(Positiond0)*length(Positionm1)*length(Positionm2)*length(Positionm3)*length(Positionm4)*length(Positionm5)*length(Positionm6)*length(Positionm7) | |
395 #this is just a way to doublecheck that the length of the generated peptides vector is correct | |
396 | |
397 GeneratedPeptides<-rep(NA, times=total*15) | |
398 GeneratedPeptides<-matrix(data = GeneratedPeptides,ncol = 15) | |
399 | |
400 NumeratedPeptides<-GeneratedPeptides | |
401 #create an empty vector of correct length by finding the number of each AAs per position and multiplying them | |
402 count<-0 | |
403 for (t in 1:length(Positionm7)) { | |
404 for (s in 1:length(Positionm6)) { | |
405 for (r in 1:length(Positionm5)) { | |
406 for (i in 1:length(Positionm4)) { | |
407 for (j in 1:length(Positionm3)) { | |
408 for (k in 1:length(Positionm2)) { | |
409 for (l in 1:length(Positionm1)) { | |
410 for (m in 1:length(Positiond0)) { | |
411 for (n in 1:length(Positionp1)) { | |
412 for (o in 1:length(Positionp2)) { | |
413 for (p in 1:length(Positionp3)) { | |
414 for (q in 1:length(Positionp4)) { | |
415 for (u in 1:length(Positionp5)) { | |
416 for (v in 1:length(Positionp6)) { | |
417 for (w in 1:length(Positionp7)) { | |
418 # i=1 | |
419 # j=1 | |
420 # k=1 | |
421 # l=1 | |
422 # m=1 | |
423 # n=1 | |
424 # o=1 | |
425 # p=1 | |
426 # q=1 | |
427 # | |
428 #for every single position, increment the count number, create a peptide using the AAs at that position | |
429 #then put them together into the generated peptides sequencex | |
430 count<-count+1 | |
431 tabulation<-c(Positionm7[t],Positionm6[s],Positionm5[r],Positionm4[i],Positionm3[j],Positionm2[k],Positionm1[l],Positiond0[m],Positionp1[n], | |
432 Positionp2[o],Positionp3[p],Positionp4[q],Positionp5[u],Positionp6[v],Positionp7[w]) | |
433 numeration<-c(number15[t],number14[s],number13[r],number1[i],number2[j],number3[k],number4[l],number5[m],number6[n],number7[o],number8[p],number9[q],number10[u],number11[v], | |
434 number12[w]) | |
435 #tabulation<-paste(tabulation, sep="", collapse="") | |
436 GeneratedPeptides[count,1:15]<-tabulation | |
437 NumeratedPeptides[count,1:15]<-numeration | |
438 } | |
439 } | |
440 } | |
441 } | |
442 } | |
443 } | |
444 } | |
445 } | |
446 } | |
447 } | |
448 } | |
449 } | |
450 } | |
451 } | |
452 } | |
453 #################################################################### | |
454 #now here I use the Endogenous Probabilty matrix from the previous script, which is called EMPtable | |
455 #to score the created peptides | |
456 ThisKinTable<-EPMtableu#[1:nrow(SDtable),] | |
457 TKTcolumn<-c(data=rep(1,times=21)) | |
458 TKTcolumn<-as.matrix(TKTcolumn,ncol=1) | |
459 ThisKinTable<-cbind(TKTcolumn,ThisKinTable) | |
460 | |
461 ThisKinGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
462 ThisKinGenWeirdScore<-rep(NA,times=nrow(GeneratedPeptides)) | |
463 | |
464 for (x in 1:nrow(GeneratedPeptides)){ | |
465 Scoringpeptide<-NumeratedPeptides[x,1:15] | |
466 Scoringpeptide<-Scoringpeptide+1 | |
467 ThisKinTableScore<-as.numeric(ThisKinTable[Scoringpeptide[1],3])*ThisKinTable[as.numeric(Scoringpeptide[2]),4]*ThisKinTable[as.numeric(Scoringpeptide[3]),5]* | |
468 ThisKinTable[as.numeric(Scoringpeptide[4]),6]*ThisKinTable[as.numeric(Scoringpeptide[5]),7]*ThisKinTable[as.numeric(Scoringpeptide[6]),8]*ThisKinTable[as.numeric(Scoringpeptide[7]),9]* | |
469 #ThisKinTable[as.numeric(Scoringpeptide[8]),10]* | |
470 ThisKinTable[as.numeric(Scoringpeptide[9]),11]*ThisKinTable[as.numeric(Scoringpeptide[10]),12]*ThisKinTable[as.numeric(Scoringpeptide[11]),13]* | |
471 ThisKinTable[as.numeric(Scoringpeptide[12]),14]*ThisKinTable[as.numeric(Scoringpeptide[13]),15]*ThisKinTable[as.numeric(Scoringpeptide[14]),16]*ThisKinTable[as.numeric(Scoringpeptide[15]),17] | |
472 ThisKinGeneratedScores[x]<-ThisKinTableScore | |
473 ThisKinTableScore<-(ThisKinTableScore/(ThisKinTableScore+1/as.numeric(NormalizationScore[2]))) | |
474 ThisKinGenWeirdScore[x]<-ThisKinTableScore | |
475 } | |
476 | |
477 AblGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
478 ArgGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
479 BtkGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
480 CskGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
481 FynGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
482 HckGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
483 JAK2GeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
484 LckGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
485 LynGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
486 Pyk2GeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
487 SrcGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
488 SykGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
489 YesGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
490 | |
491 | |
492 for (x in 1:nrow(GeneratedPeptides)){ | |
493 Scoringpeptide<-NumeratedPeptides[x,1:15] | |
494 AblScore<-Abl[Scoringpeptide[1],2]*Abl[Scoringpeptide[2],3]*Abl[Scoringpeptide[3],4]*Abl[Scoringpeptide[4],5]*Abl[Scoringpeptide[5],6]*Abl[Scoringpeptide[6],7]* | |
495 Abl[Scoringpeptide[7],8]*Abl[Scoringpeptide[9],10]*Abl[Scoringpeptide[10],11]*Abl[Scoringpeptide[11],12]*Abl[Scoringpeptide[12],13]* | |
496 Abl[Scoringpeptide[13],14]*Abl[Scoringpeptide[14],15]*Abl[Scoringpeptide[15],16] | |
497 AblGeneratedScores[x]<-AblScore | |
498 | |
499 ArgScore<-Arg[Scoringpeptide[1],2]*Arg[Scoringpeptide[2],3]*Arg[Scoringpeptide[3],4]*Arg[Scoringpeptide[4],5]*Arg[Scoringpeptide[5],6]*Arg[Scoringpeptide[6],7]* | |
500 Arg[Scoringpeptide[7],8]*Arg[Scoringpeptide[9],10]*Arg[Scoringpeptide[10],11]*Arg[Scoringpeptide[11],12]*Arg[Scoringpeptide[12],13]* | |
501 Arg[Scoringpeptide[13],14]*Arg[Scoringpeptide[14],15]*Arg[Scoringpeptide[15],16] | |
502 ArgGeneratedScores[x]<-ArgScore | |
503 | |
504 BtkScore<-Btk[Scoringpeptide[1],2]*Btk[Scoringpeptide[2],3]*Btk[Scoringpeptide[3],4]*Btk[Scoringpeptide[4],5]*Btk[Scoringpeptide[5],6]*Btk[Scoringpeptide[6],7]* | |
505 Btk[Scoringpeptide[7],8]*Btk[Scoringpeptide[9],10]*Btk[Scoringpeptide[10],11]*Btk[Scoringpeptide[11],12]*Btk[Scoringpeptide[12],13]* | |
506 Btk[Scoringpeptide[13],14]*Btk[Scoringpeptide[14],15]*Btk[Scoringpeptide[15],16] | |
507 BtkGeneratedScores[x]<-BtkScore | |
508 | |
509 CskScore<-Csk[Scoringpeptide[1],2]*Csk[Scoringpeptide[2],3]*Csk[Scoringpeptide[3],4]*Csk[Scoringpeptide[4],5]*Csk[Scoringpeptide[5],6]*Csk[Scoringpeptide[6],7]* | |
510 Csk[Scoringpeptide[7],8]*Csk[Scoringpeptide[9],10]*Csk[Scoringpeptide[10],11]*Csk[Scoringpeptide[11],12]*Csk[Scoringpeptide[12],13]* | |
511 Csk[Scoringpeptide[13],14]*Csk[Scoringpeptide[14],15]*Csk[Scoringpeptide[15],16] | |
512 CskGeneratedScores[x]<-CskScore | |
513 | |
514 FynScore<-Fyn[Scoringpeptide[1],2]*Fyn[Scoringpeptide[2],3]*Fyn[Scoringpeptide[3],4]*Fyn[Scoringpeptide[4],5]*Fyn[Scoringpeptide[5],6]*Fyn[Scoringpeptide[6],7]* | |
515 Fyn[Scoringpeptide[7],8]*Fyn[Scoringpeptide[9],10]*Fyn[Scoringpeptide[10],11]*Fyn[Scoringpeptide[11],12]*Fyn[Scoringpeptide[12],13]* | |
516 Fyn[Scoringpeptide[13],14]*Fyn[Scoringpeptide[14],15]*Fyn[Scoringpeptide[15],16] | |
517 FynGeneratedScores[x]<-FynScore | |
518 | |
519 HckScore<-Hck[Scoringpeptide[1],2]*Hck[Scoringpeptide[2],3]*Hck[Scoringpeptide[3],4]*Hck[Scoringpeptide[4],5]*Hck[Scoringpeptide[5],6]*Hck[Scoringpeptide[6],7]* | |
520 Hck[Scoringpeptide[7],8]*Hck[Scoringpeptide[9],10]*Hck[Scoringpeptide[10],11]*Hck[Scoringpeptide[11],12]*Hck[Scoringpeptide[12],13]* | |
521 Hck[Scoringpeptide[13],14]*Hck[Scoringpeptide[14],15]*Hck[Scoringpeptide[15],16] | |
522 HckGeneratedScores[x]<-HckScore | |
523 | |
524 JAK2Score<-JAK2[Scoringpeptide[1],2]*JAK2[Scoringpeptide[2],3]*JAK2[Scoringpeptide[3],4]*JAK2[Scoringpeptide[4],5]*JAK2[Scoringpeptide[5],6]*JAK2[Scoringpeptide[6],7]* | |
525 JAK2[Scoringpeptide[7],8]*JAK2[Scoringpeptide[9],10]*JAK2[Scoringpeptide[10],11]*JAK2[Scoringpeptide[11],12]*JAK2[Scoringpeptide[12],13]* | |
526 JAK2[Scoringpeptide[13],14]*JAK2[Scoringpeptide[14],15]*JAK2[Scoringpeptide[15],16] | |
527 JAK2GeneratedScores[x]<-JAK2Score | |
528 | |
529 LckScore<-Lck[Scoringpeptide[1],2]*Lck[Scoringpeptide[2],3]*Lck[Scoringpeptide[3],4]*Lck[Scoringpeptide[4],5]*Lck[Scoringpeptide[5],6]*Lck[Scoringpeptide[6],7]* | |
530 Lck[Scoringpeptide[7],8]*Lck[Scoringpeptide[9],10]*Lck[Scoringpeptide[10],11]*Lck[Scoringpeptide[11],12]*Lck[Scoringpeptide[12],13]* | |
531 Lck[Scoringpeptide[13],14]*Lck[Scoringpeptide[14],15]*Lck[Scoringpeptide[15],16] | |
532 LckGeneratedScores[x]<-LckScore | |
533 | |
534 LynScore<-Lyn[Scoringpeptide[1],2]*Lyn[Scoringpeptide[2],3]*Lyn[Scoringpeptide[3],4]*Lyn[Scoringpeptide[4],5]*Lyn[Scoringpeptide[5],6]*Lyn[Scoringpeptide[6],7]* | |
535 Lyn[Scoringpeptide[7],8]*Lyn[Scoringpeptide[9],10]*Lyn[Scoringpeptide[10],11]*Lyn[Scoringpeptide[11],12]*Lyn[Scoringpeptide[12],13]* | |
536 Lyn[Scoringpeptide[13],14]*Lyn[Scoringpeptide[14],15]*Lyn[Scoringpeptide[15],16] | |
537 LynGeneratedScores[x]<-LynScore | |
538 | |
539 Pyk2Score<-Pyk2[Scoringpeptide[1],2]*Pyk2[Scoringpeptide[2],3]*Pyk2[Scoringpeptide[3],4]*Pyk2[Scoringpeptide[4],5]*Pyk2[Scoringpeptide[5],6]*Pyk2[Scoringpeptide[6],7]* | |
540 Pyk2[Scoringpeptide[7],8]*Pyk2[Scoringpeptide[9],10]*Pyk2[Scoringpeptide[10],11]*Pyk2[Scoringpeptide[11],12]*Pyk2[Scoringpeptide[12],13]* | |
541 Pyk2[Scoringpeptide[13],14]*Pyk2[Scoringpeptide[14],15]*Pyk2[Scoringpeptide[15],16] | |
542 Pyk2GeneratedScores[x]<-Pyk2Score | |
543 | |
544 SrcScore<-Src[Scoringpeptide[1],2]*Src[Scoringpeptide[2],3]*Src[Scoringpeptide[3],4]*Src[Scoringpeptide[4],5]*Src[Scoringpeptide[5],6]*Src[Scoringpeptide[6],7]* | |
545 Src[Scoringpeptide[7],8]*Src[Scoringpeptide[9],10]*Src[Scoringpeptide[10],11]*Src[Scoringpeptide[11],12]*Src[Scoringpeptide[12],13]* | |
546 Src[Scoringpeptide[13],14]*Src[Scoringpeptide[14],15]*Src[Scoringpeptide[15],16] | |
547 SrcGeneratedScores[x]<-SrcScore | |
548 | |
549 SykScore<-Syk[Scoringpeptide[1],2]*Syk[Scoringpeptide[2],3]*Syk[Scoringpeptide[3],4]*Syk[Scoringpeptide[4],5]*Syk[Scoringpeptide[5],6]*Syk[Scoringpeptide[6],7]* | |
550 Syk[Scoringpeptide[7],8]*Syk[Scoringpeptide[9],10]*Syk[Scoringpeptide[10],11]*Syk[Scoringpeptide[11],12]*Syk[Scoringpeptide[12],13]* | |
551 Syk[Scoringpeptide[13],14]*Syk[Scoringpeptide[14],15]*Syk[Scoringpeptide[15],16] | |
552 SykGeneratedScores[x]<-SykScore | |
553 | |
554 YesScore<-Yes[Scoringpeptide[1],2]*Yes[Scoringpeptide[2],3]*Yes[Scoringpeptide[3],4]*Yes[Scoringpeptide[4],5]*Yes[Scoringpeptide[5],6]*Yes[Scoringpeptide[6],7]* | |
555 Yes[Scoringpeptide[7],8]*Yes[Scoringpeptide[9],10]*Yes[Scoringpeptide[10],11]*Yes[Scoringpeptide[11],12]*Yes[Scoringpeptide[12],13]* | |
556 Yes[Scoringpeptide[13],14]*Yes[Scoringpeptide[14],15]*Yes[Scoringpeptide[15],16] | |
557 YesGeneratedScores[x]<-YesScore | |
558 | |
559 # ThisKinTableScore<-ThisKinTable[as.numeric(Scoringpeptide[1]),3]*ThisKinTable[as.numeric(Scoringpeptide[2]),4]*ThisKinTable[as.numeric(Scoringpeptide[3]),5]* | |
560 # ThisKinTable[as.numeric(Scoringpeptide[4]),6]*ThisKinTable[as.numeric(Scoringpeptide[6]),8]* | |
561 # ThisKinTable[as.numeric(Scoringpeptide[7]),9]*ThisKinTable[as.numeric(Scoringpeptide[8]),10]*ThisKinTable[as.numeric(Scoringpeptide[9]),11] | |
562 # ThisKinGeneratedScores[x]<-ThisKinTableScore | |
563 } | |
564 | |
565 | |
566 | |
567 AblNorm<-1/as.numeric(Abl[22,1]) | |
568 AblThresh<-as.numeric(Abl[24,1]) | |
569 AblTrueThresh<-((AblThresh*AblNorm)/(100-AblThresh)) | |
570 AblActive<-unlist(AblGeneratedScores)>AblTrueThresh | |
571 | |
572 ArgNorm<-1/as.numeric(Arg[22,1]) | |
573 ArgThresh<-as.numeric(Arg[24,1]) | |
574 ArgTrueThresh<-((ArgThresh*ArgNorm)/(100-ArgThresh)) | |
575 ArgActive<-unlist(ArgGeneratedScores)>ArgTrueThresh | |
576 | |
577 BtkNorm<-1/as.numeric(Btk[22,1]) | |
578 BtkThresh<-as.numeric(Btk[24,1]) | |
579 BtkTrueThresh<-((BtkThresh*BtkNorm)/(100-BtkThresh)) | |
580 BtkActive<-unlist(BtkGeneratedScores)>BtkTrueThresh | |
581 | |
582 CskNorm<-1/as.numeric(Csk[22,1]) | |
583 CskThresh<-as.numeric(Csk[24,1]) | |
584 CskTrueThresh<-((CskThresh*CskNorm)/(100-CskThresh)) | |
585 CskActive<-(CskGeneratedScores)>CskTrueThresh | |
586 | |
587 FynNorm<-1/as.numeric(Fyn[22,1]) | |
588 FynThresh<-as.numeric(Fyn[24,1]) | |
589 FynTrueThresh<-((FynThresh*FynNorm)/(100-FynThresh)) | |
590 FynActive<-unlist(FynGeneratedScores)>FynTrueThresh | |
591 | |
592 HckNorm<-1/as.numeric(Hck[22,1]) | |
593 HckThresh<-as.numeric(Hck[24,1]) | |
594 HckTrueThresh<-((HckThresh*HckNorm)/(100-HckThresh)) | |
595 HckActive<-unlist(HckGeneratedScores)>HckTrueThresh | |
596 | |
597 JAK2Norm<-1/as.numeric(JAK2[22,1]) | |
598 JAK2Thresh<-as.numeric(JAK2[24,1]) | |
599 JAK2TrueThresh<-((JAK2Thresh*JAK2Norm)/(100-JAK2Thresh)) | |
600 JAk2Active<-unlist(JAK2GeneratedScores)>JAK2TrueThresh | |
601 | |
602 LckNorm<-1/as.numeric(Lck[22,1]) | |
603 LckThresh<-as.numeric(Lck[24,1]) | |
604 LckTrueThresh<-((LckThresh*LckNorm)/(100-LckThresh)) | |
605 LckActive<-unlist(LckGeneratedScores)>LckTrueThresh | |
606 | |
607 LynNorm<-1/as.numeric(Lyn[22,1]) | |
608 LynThresh<-as.numeric(Lyn[24,1]) | |
609 LynTrueThresh<-((LynThresh*LynNorm)/(100-LynThresh)) | |
610 LynActive<-unlist(LynGeneratedScores)>LynTrueThresh | |
611 | |
612 Pyk2Norm<-1/as.numeric(Pyk2[22,1]) | |
613 Pyk2Thresh<-as.numeric(Pyk2[24,1]) | |
614 Pyk2TrueThresh<-((Pyk2Thresh*Pyk2Norm)/(100-Pyk2Thresh)) | |
615 Pyk2Active<-unlist(Pyk2GeneratedScores)>Pyk2TrueThresh | |
616 | |
617 SrcNorm<-1/as.numeric(Src[22,1]) | |
618 SrcThresh<-as.numeric(Src[24,1]) | |
619 SrcTrueThresh<-((SrcThresh*SrcNorm)/(100-SrcThresh)) | |
620 SrcActive<-unlist(SrcGeneratedScores)>SrcTrueThresh | |
621 | |
622 SykNorm<-1/as.numeric(Syk[22,1]) | |
623 SykThresh<-as.numeric(Syk[24,1]) | |
624 SykTrueThresh<-((SykThresh*SykNorm)/(100-SykThresh)) | |
625 SykActive<-unlist(SykGeneratedScores)>SykTrueThresh | |
626 | |
627 YesNorm<-1/as.numeric(Yes[22,1]) | |
628 YesThresh<-as.numeric(Yes[24,1]) | |
629 YesTrueThresh<-((YesThresh*YesNorm)/(100-YesThresh)) | |
630 YesActive<-unlist(YesGeneratedScores)>YesTrueThresh | |
631 | |
632 AllActive<-AblActive+ArgActive+BtkActive+CskActive+FynActive+HckActive+JAk2Active+LckActive+LynActive+Pyk2Active+SrcActive+SykActive+YesActive | |
633 #Btkactive+ | |
634 | |
635 Scores<-ThisKinGeneratedScores | |
636 ThresholdValues<-ThisKinGenWeirdScore | |
637 | |
638 FullMotifs<-rep("Z",times=nrow(GeneratedPeptides)) | |
639 for (i in 1:nrow(GeneratedPeptides)) { | |
640 motif<-GeneratedPeptides[i,1:15] | |
641 motif<-paste(motif,sep = "", collapse = "") | |
642 FullMotifs[i]<-motif | |
643 } | |
644 | |
645 PeptidesWithRanks<-cbind.data.frame(FullMotifs,GeneratedPeptides,Scores,ThresholdValues) | |
646 PeptidesWithRanks<-cbind.data.frame(PeptidesWithRanks,AllActive,AblActive,ArgActive,BtkActive,CskActive,FynActive,HckActive,JAk2Active,LckActive,LynActive,Pyk2Active,SrcActive,SykActive,YesActive) | |
647 RanksPeptides<-PeptidesWithRanks[order(PeptidesWithRanks$AllActive,decreasing = FALSE),] | |
648 # PepRankHead<-c(1:9,"Sequence","RPMS","PMS") | |
649 # RanksPeptides<-rbind.data.frame(PepRankHead,PeptidesWithRanks) | |
650 head(RanksPeptides) | |
651 | |
652 | |
653 #now I have to score the negative sequences... for some reason | |
654 #write up how we transfect with lipofectamine | |
655 #3,4,5 questions | |
656 | |
657 #PAUSED EHRE AT 4:50, HOPING THAT FIXING MINERVOTHING SO THAT LEFT SPACES WORKS FIXES A THING. OTHERWISE | |
658 #I FUCKED WITH THE MCC TABLE AND NEED TO FINISH IT | |
659 | |
660 ThisKinBlanks<-rep(1,times=17) | |
661 ThisKinTable<-rbind(ThisKinTable,ThisKinBlanks) | |
662 | |
663 NegativeScores<-rep(NA,times=nrow(NegativeSubstrateList)) | |
664 NegativeWeirdScores<-rep(NA,times=nrow(NegativeSubstrateList)) | |
665 for (v in 1:nrow(NegativeSubstrateList)) { | |
666 motif<-NegativeSubstrateList[v,2] | |
667 motif<-unlist(strsplit(motif,"")) | |
668 #if (length(motif)<9){print(v)}} | |
669 # motif[1] <- sapply(motif[1], function (x) aa_props[x]) | |
670 # motif[2] <- sapply(motif[2], function (x) aa_props[x]) | |
671 # motif[3] <- sapply(motif[3], function (x) aa_props[x]) | |
672 # motif[4] <- sapply(motif[4], function (x) aa_props[x]) | |
673 # motif[5] <- sapply(motif[5], function (x) aa_props[x]) | |
674 # motif[6] <- sapply(motif[6], function (x) aa_props[x]) | |
675 # motif[7] <- sapply(motif[7], function (x) aa_props[x]) | |
676 # motif[8] <- sapply(motif[8], function (x) aa_props[x]) | |
677 # motif[9] <- sapply(motif[9], function (x) aa_props[x]) | |
678 motif<- gsub(" ","O",motif) | |
679 motif <- sapply(motif, function (x) aa_props[x]) | |
680 Scoringpeptide<-motif | |
681 Scoringpeptide<-Scoringpeptide+1 | |
682 ThisKinTableScore<-as.numeric(ThisKinTable[Scoringpeptide[1],3])*ThisKinTable[as.numeric(Scoringpeptide[2]),4]*ThisKinTable[as.numeric(Scoringpeptide[3]),5]* | |
683 ThisKinTable[as.numeric(Scoringpeptide[4]),6]*ThisKinTable[as.numeric(Scoringpeptide[5]),7]*ThisKinTable[as.numeric(Scoringpeptide[6]),8]*ThisKinTable[as.numeric(Scoringpeptide[7]),9]* | |
684 #ThisKinTable[as.numeric(Scoringpeptide[8]),10]* | |
685 ThisKinTable[as.numeric(Scoringpeptide[9]),11]*ThisKinTable[as.numeric(Scoringpeptide[10]),12]*ThisKinTable[as.numeric(Scoringpeptide[11]),13]* | |
686 ThisKinTable[as.numeric(Scoringpeptide[12]),14]*ThisKinTable[as.numeric(Scoringpeptide[13]),15]*ThisKinTable[as.numeric(Scoringpeptide[14]),16]*ThisKinTable[as.numeric(Scoringpeptide[15]),17] | |
687 NegativeScores[v]<-ThisKinTableScore | |
688 ThisKinTableScore<-(ThisKinTableScore/(ThisKinTableScore+1/as.numeric(NormalizationScore[2]))) | |
689 NegativeWeirdScores[v]<-ThisKinTableScore*100 | |
690 } | |
691 | |
692 negativesubstrates<-NegativeSubstrateList[,2] | |
693 NegativeWithScores<-cbind(negativesubstrates,as.character(NegativeScores),as.character(NegativeWeirdScores)) | |
694 | |
695 | |
696 #NEED TO HAVE THE NEGATIVE SUBSTRATES BE OUTPUTTED | |
697 | |
698 PositiveScores<-rep(NA,times=nrow(ImportedSubstrateList)) | |
699 PositiveWeirdScores<-rep(NA,times=nrow(ImportedSubstrateList)) | |
700 | |
701 for (v in 1:nrow(ImportedSubstrateList)) { | |
702 motif<-ImportedSubstrateList[v,4:18] | |
703 motif<-unlist(motif) | |
704 motif<- gsub("^$","O",motif) | |
705 motif <- sapply(motif, function (x) aa_props[x]) | |
706 Scoringpeptide<-motif | |
707 Scoringpeptide<-Scoringpeptide+1 | |
708 ThisKinTableScore<-as.numeric(ThisKinTable[Scoringpeptide[1],3])*ThisKinTable[as.numeric(Scoringpeptide[2]),4]*ThisKinTable[as.numeric(Scoringpeptide[3]),5]* | |
709 ThisKinTable[as.numeric(Scoringpeptide[4]),6]*ThisKinTable[as.numeric(Scoringpeptide[5]),7]*ThisKinTable[as.numeric(Scoringpeptide[6]),8]*ThisKinTable[as.numeric(Scoringpeptide[7]),9]* | |
710 #ThisKinTable[as.numeric(Scoringpeptide[8]),10]* | |
711 ThisKinTable[as.numeric(Scoringpeptide[9]),11]*ThisKinTable[as.numeric(Scoringpeptide[10]),12]*ThisKinTable[as.numeric(Scoringpeptide[11]),13]* | |
712 ThisKinTable[as.numeric(Scoringpeptide[12]),14]*ThisKinTable[as.numeric(Scoringpeptide[13]),15]*ThisKinTable[as.numeric(Scoringpeptide[14]),16]*ThisKinTable[as.numeric(Scoringpeptide[15]),17] | |
713 | |
714 PositiveScores[v]<-ThisKinTableScore | |
715 ThisKinTableScore<-(ThisKinTableScore/(ThisKinTableScore+1/as.numeric(NormalizationScore[2]))) | |
716 PositiveWeirdScores[v]<-ThisKinTableScore*100 | |
717 } | |
718 | |
719 positivesubstrates<-ImportedSubstrateList[,4:18] | |
720 positivewithscores<-cbind.data.frame(positivesubstrates,PositiveScores,PositiveWeirdScores) | |
721 | |
722 | |
723 #write down the transient transfection SOP and what we will be doing with them | |
724 #write down the vector names I will be using | |
725 #write down something about transforming bacteria and with what | |
726 | |
727 #90% whatevernness | |
728 # TPninetyone<-length(PositiveWeirdScores[PositiveWeirdScores>=0.91]) | |
729 # Senseninetyone<-TPninetyone/nrow(positivesubstrates) | |
730 # | |
731 # TNninetyone<-length(NegativeWeirdScores[NegativeWeirdScores<91]) | |
732 # Specninetyone<-TNninetyone/100 | |
733 | |
734 #create the MCC table | |
735 | |
736 threshold<-c(1:100) | |
737 threshold<-order(threshold,decreasing = TRUE) | |
738 | |
739 Truepositives<-c(1:100) | |
740 Falsenegatives<-c(1:100) | |
741 Sensitivity<-c(1:100) | |
742 TrueNegatives<-c(1:100) | |
743 FalsePositives<-c(1:100) | |
744 Specificity<-c(1:100) | |
745 Accuracy<-c(1:100) | |
746 MCC<-c(1:100) | |
747 EER<-c(1:100) | |
748 | |
749 #MAKE DAMN SURE THAT THE ACCESSION NUMBERS FOLLOW THE MOTIFS | |
750 | |
751 for (z in 1:100) { | |
752 thres<-101-z | |
753 Truepositives[z]<-length(PositiveWeirdScores[PositiveWeirdScores>=(thres)]) | |
754 Falsenegatives[z]<-nrow(positivesubstrates)-Truepositives[z] | |
755 Sensitivity[z]<-Truepositives[z]/(Falsenegatives[z]+Truepositives[z]) | |
756 TrueNegatives[z]<-length(NegativeWeirdScores[NegativeWeirdScores<(thres)]) | |
757 # at thresh 100 this should be 0, because it is total minus true negatives | |
758 FalsePositives[z]<-nrow(NegativeSubstrateList)-TrueNegatives[z] | |
759 Specificity[z]<-1-(TrueNegatives[z]/(FalsePositives[z]+TrueNegatives[z])) | |
760 Accuracy[z]<-100*(Truepositives[z]+TrueNegatives[z])/(Falsenegatives[z]+FalsePositives[z]+TrueNegatives[z]+Truepositives[z]) | |
761 MCC[z]<-((Truepositives[z]+TrueNegatives[z])-(Falsenegatives[z]+FalsePositives[z]))/sqrt(round(round(Truepositives[z]+Falsenegatives[z])*round(TrueNegatives[z]+FalsePositives[z])*round(Truepositives[z]+FalsePositives[z])*round(TrueNegatives[z]+Falsenegatives[z]))) | |
762 EER[z]<-.01*(((1-(Sensitivity[z]))*(Truepositives[z]+Falsenegatives[z]))+(Specificity[z]*(1-(Truepositives[z]+Falsenegatives[z])))) | |
763 } | |
764 Characterization<-cbind.data.frame(threshold,Truepositives,Falsenegatives,Sensitivity,TrueNegatives,FalsePositives,Specificity,Accuracy,MCC,EER) | |
765 | |
766 positiveheader<-c(1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,"RPMS","PMS") | |
767 positivewithscores<-rbind.data.frame(positiveheader,positivewithscores) | |
768 | |
769 negativeheader<-c("Substrate","RPMS","PMS") | |
770 colnames(NegativeWithScores)<-negativeheader | |
771 | |
772 # write.xlsx(NegativeWithScores,file = FILENAME, sheetName = "Negative Sequences Scored",col.names = TRUE,row.names = FALSE,append = TRUE) | |
773 # write.xlsx(Characterization,file = FILENAME,sheetName = "Characterization Table",col.names = TRUE,row.names = FALSE,append = TRUE) | |
774 # write.xlsx(RanksPeptides,file = FILENAME,sheetName = "Ranked Generated Peptides",col.names = FALSE,row.names = FALSE,append = TRUE) | |
775 # write.xlsx(positivewithscores,file = FILENAME, sheetName = "Positive Sequences Scored",col.names = FALSE,row.names = FALSE,append = TRUE) | |
776 write.table(x=c("Characterzation Table"),file = FILENAME2, col.names = FALSE,row.names = FALSE, append = TRUE,sep = ",") | |
777 write.table(Characterization,file = FILENAME2, col.names = TRUE,row.names = FALSE, append = TRUE,sep = ",") | |
778 | |
779 | |
780 write.table(RanksPeptides,file = FILENAME3,append = TRUE,row.names = FALSE,col.names = TRUE,sep = ",") | |
781 | |
782 |