Mercurial > repos > jfb > kinatest_r_7_7testing
comparison kinatestid_r/Kinatest-R_part2.R @ 4:2f3df9b1c05b draft
Uploaded
| author | jfb |
|---|---|
| date | Tue, 06 Feb 2018 17:16:05 -0500 |
| parents | |
| children | f80306fc5d69 |
comparison
equal
deleted
inserted
replaced
| 3:65f235b5fe14 | 4:2f3df9b1c05b |
|---|---|
| 1 #test myself: this script should take in amino acids for each of the 9 positions and give out every single combination of those AAs | |
| 2 | |
| 3 #need to do following: fix it so that the accession numbers stay with the substrates, | |
| 4 #also the neg false constant is totaly unphos'd Ys found by FASTA-2-CSV system# uniprot | |
| 5 | |
| 6 #HOW MANY: IF THERE'S two aas in each position you get 2^9, so I assume the numbers are: | |
| 7 #(number in position-4)*(number in position -3)*(number in position -2)...=total | |
| 8 # require(rJava) | |
| 9 # require(xlsxjars) | |
| 10 # require(xlsx) | |
| 11 # # require(readxl) | |
| 12 | |
| 13 View(SDtable) | |
| 14 bareSDs<-SDtable[2:21,2:16] | |
| 15 goodones<-bareSDs>2 | |
| 16 | |
| 17 Positionm7<-which(goodones[,1] %in% TRUE) | |
| 18 if (length(Positionm7)<1){Positionm7<-which(bareSDs[,1]==max(bareSDs[,1]))} | |
| 19 Positionm6<-which(goodones[,2] %in% TRUE) | |
| 20 if (length(Positionm6)<1){Positionm6<-which(bareSDs[,2]==max(bareSDs[,2]))} | |
| 21 Positionm5<-which(goodones[,3] %in% TRUE) | |
| 22 if (length(Positionm5)<1){Positionm5<-which(bareSDs[,3]==max(bareSDs[,3]))} | |
| 23 Positionm4<-which(goodones[,4] %in% TRUE) | |
| 24 if (length(Positionm4)<1){Positionm4<-which(bareSDs[,4]==max(bareSDs[,4]))} | |
| 25 Positionm3<-which(goodones[,5] %in% TRUE) | |
| 26 if (length(Positionm3)<1){Positionm3<-which(bareSDs[,5]==max(bareSDs[,5]))} | |
| 27 Positionm2<-which(goodones[,6] %in% TRUE) | |
| 28 if (length(Positionm2)<1){Positionm2<-which(bareSDs[,6]==max(bareSDs[,6]))} | |
| 29 Positionm1<-which(goodones[,7] %in% TRUE) | |
| 30 if (length(Positionm1)<1){Positionm1<-which(bareSDs[,7]==max(bareSDs[,7]))} | |
| 31 | |
| 32 Positiond0<-which(goodones[,8] %in% TRUE) | |
| 33 if (length(Positiond0)<1){Positiond0<-which(bareSDs[,8]==max(bareSDs[,8]))} | |
| 34 | |
| 35 Positionp1<-which(goodones[,9] %in% TRUE) | |
| 36 if (length(Positionp1)<1){Positionp1<-which(bareSDs[,9]==max(bareSDs[,9]))} | |
| 37 Positionp2<-which(goodones[,10] %in% TRUE) | |
| 38 if (length(Positionp2)<1){Positionp2<-which(bareSDs[,10]==max(bareSDs[,10]))} | |
| 39 Positionp3<-which(goodones[,11] %in% TRUE) | |
| 40 if (length(Positionp3)<1){Positionp3<-which(bareSDs[,11]==max(bareSDs[,11]))} | |
| 41 Positionp4<-which(goodones[,12] %in% TRUE) | |
| 42 if (length(Positionp4)<1){Positionp4<-which(bareSDs[,12]==max(bareSDs[,12]))} | |
| 43 Positionp5<-which(goodones[,13] %in% TRUE) | |
| 44 if (length(Positionp5)<1){Positionp5<-which(bareSDs[,13]==max(bareSDs[,13]))} | |
| 45 Positionp6<-which(goodones[,14] %in% TRUE) | |
| 46 if (length(Positionp6)<1){Positionp6<-which(bareSDs[,14]==max(bareSDs[,14]))} | |
| 47 Positionp7<-which(goodones[,15] %in% TRUE) | |
| 48 if (length(Positionp7)<1){Positionp7<-which(bareSDs[,15]==max(bareSDs[,15]))} | |
| 49 | |
| 50 aa_props2 <- c("1"="A", "2"="C", "3"="D", "4"="E", "5"="F", "6"="G", "7"="H", "8"="I", "9"="K", "10"="L", "11"="M", "12"="N", | |
| 51 "13"="P", "14"="Q", "15"="R", "16"="S", "17"="T", "18"="V", "19"="W", "20"="Y") | |
| 52 aa_props2<-c(1="A") | |
| 53 | |
| 54 Positionm7<-sapply(Positionm7, function (x) aa_props2[x]) | |
| 55 Positionm6<-sapply(Positionm6, function (x) aa_props2[x]) | |
| 56 Positionm5<-sapply(Positionm5, function (x) aa_props2[x]) | |
| 57 Positionm4<-sapply(Positionm4, function (x) aa_props2[x]) | |
| 58 Positionm3<-sapply(Positionm3, function (x) aa_props2[x]) | |
| 59 Positionm2<-sapply(Positionm2, function (x) aa_props2[x]) | |
| 60 Positionm1<-sapply(Positionm1, function (x) aa_props2[x]) | |
| 61 Positiond0<-sapply(Positiond0, function (x) aa_props2[x]) | |
| 62 Positionp1<-sapply(Positionp1, function (x) aa_props2[x]) | |
| 63 Positionp2<-sapply(Positionp2, function (x) aa_props2[x]) | |
| 64 Positionp3<-sapply(Positionp3, function (x) aa_props2[x]) | |
| 65 Positionp4<-sapply(Positionp4, function (x) aa_props2[x]) | |
| 66 Positionp5<-sapply(Positionp5, function (x) aa_props2[x]) | |
| 67 Positionp6<-sapply(Positionp6, function (x) aa_props2[x]) | |
| 68 Positionp7<-sapply(Positionp7, function (x) aa_props2[x]) | |
| 69 | |
| 70 | |
| 71 # Positionm7<-c("D","H","N","V") | |
| 72 # Positionm6<-c("E","V") | |
| 73 # Positionm5<-c("D","H") | |
| 74 # Positionm4<-c("D","N") | |
| 75 # Positionm3<-c("D","E","F","Q") | |
| 76 # Positionm2<-c("D","N","Q","S") | |
| 77 # Positionm1<-c("F","I","L") | |
| 78 # Positiond0<-c("Y") | |
| 79 # Positionp1<-c("A","E") | |
| 80 # Positionp2<-c("T","S","Q","E") | |
| 81 # Positionp3<-c("V") | |
| 82 # Positionp4<-c("K") | |
| 83 # Positionp5<-c("K") | |
| 84 # Positionp6<-c("K") | |
| 85 # Positionp7<-c("R") | |
| 86 #this is where the amino acids for each position are given. m means minus, p mean plus | |
| 87 ######################################## | |
| 88 # ScreenerFilename<-"C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls" | |
| 89 | |
| 90 | |
| 91 | |
| 92 | |
| 93 | |
| 94 | |
| 95 | |
| 96 | |
| 97 | |
| 98 | |
| 99 | |
| 100 screaner<-read.csv(ScreenerFilename, header = FALSE, stringsAsFactors = FALSE) | |
| 101 | |
| 102 | |
| 103 Abl<-screaner[2:25,] | |
| 104 Arg<-screaner[27:50,] | |
| 105 Btk<-screaner[52:75,] | |
| 106 Csk<-screaner[77:100,] | |
| 107 Fyn<-screaner[102:125,] | |
| 108 Hck<-screaner[127:150,] | |
| 109 JAK2<-screaner[152:175,] | |
| 110 Lck<-screaner[177:200,] | |
| 111 Lyn<-screaner[202:225,] | |
| 112 Pyk2<-screaner[227:250,] | |
| 113 Src<-screaner[252:275,] | |
| 114 Syk<-screaner[277:300,] | |
| 115 Yes<-screaner[302:325,] | |
| 116 | |
| 117 #two questions: why are we doing BTK when we already have a bioninformatics page about it? | |
| 118 #two I reran everything and only get 96 positions of interest in the SD table | |
| 119 | |
| 120 | |
| 121 | |
| 122 | |
| 123 | |
| 124 | |
| 125 | |
| 126 | |
| 127 | |
| 128 #Do_You_want_An_Excel_Output_Questionmark<-"NO" | |
| 129 GeneratedPeptidesFile<-"GeneratedPeptidesFile.csv" | |
| 130 | |
| 131 | |
| 132 # Abl<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 4) | |
| 133 # Arg<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 5) | |
| 134 # Btk<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 6) | |
| 135 # Csk<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 7) | |
| 136 # Fyn<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 8) | |
| 137 # Hck<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 9) | |
| 138 # JAK2<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 10) | |
| 139 # Lck<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 11) | |
| 140 # Lyn<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 12) | |
| 141 # Pyk2<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 13) | |
| 142 # Src<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 14) | |
| 143 # Syk<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 15) | |
| 144 # Yes<-read.xlsx("C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/Kinatest ID/Screener.xls", sheetIndex = 16) | |
| 145 # | |
| 146 | |
| 147 | |
| 148 "A"=1 | |
| 149 "C"=2 | |
| 150 "D"=3 | |
| 151 "E"=4 | |
| 152 "F"=5 | |
| 153 "G"=6 | |
| 154 "H"=7 | |
| 155 "I"=8 | |
| 156 "K"=9 | |
| 157 "L"=10 | |
| 158 "M"=11 | |
| 159 "N"=12 | |
| 160 "P"=13 | |
| 161 "Q"=14 | |
| 162 "R"=15 | |
| 163 "S"=16 | |
| 164 "T"=17 | |
| 165 "V"=18 | |
| 166 "W"=19 | |
| 167 "Y"=20 | |
| 168 | |
| 169 aa_props <- c("A"=A, "C"=C, "D"=D, "E"=E, "F"=F,"G"=G,"H"=H,"I"=I,"K"=K,"L"=L,"M"=M,"N"=N,"P"=P,"Q"=Q,"R"=R, | |
| 170 "S"=S,"T"=T,"V"=V,"W"=W,"Y"=Y,"xY"=Y,"O"=21) | |
| 171 | |
| 172 number15<-sapply(Positionm7, function (x) aa_props[x]) | |
| 173 number14<-sapply(Positionm6, function (x) aa_props[x]) | |
| 174 number13<-sapply(Positionm5, function (x) aa_props[x]) | |
| 175 number1 <- sapply(Positionm4, function (x) aa_props[x]) | |
| 176 number2 <- sapply(Positionm3, function (x) aa_props[x]) | |
| 177 number3 <- sapply(Positionm2, function (x) aa_props[x]) | |
| 178 number4 <- sapply(Positionm1, function (x) aa_props[x]) | |
| 179 number5 <- sapply(Positiond0, function (x) aa_props[x]) | |
| 180 number6 <- sapply(Positionp1, function (x) aa_props[x]) | |
| 181 number7 <- sapply(Positionp2, function (x) aa_props[x]) | |
| 182 number8 <- sapply(Positionp3, function (x) aa_props[x]) | |
| 183 number9 <- sapply(Positionp4, function (x) aa_props[x]) | |
| 184 number10<-sapply(Positionp5, function (x) aa_props[x]) | |
| 185 number11<-sapply(Positionp6, function (x) aa_props[x]) | |
| 186 number12<-sapply(Positionp7, function (x) aa_props[x]) | |
| 187 | |
| 188 # number1<-Positionm4 | |
| 189 # number2<-Positionm3 | |
| 190 # number3<-Positionm2 | |
| 191 # number4<-Positionm1 | |
| 192 # number5<-Positiond0 | |
| 193 # number6<-Positionp1 | |
| 194 # number7<-Positionp2 | |
| 195 # number8<-Positionp3 | |
| 196 # number9<-Positionp4 | |
| 197 | |
| 198 ############################# | |
| 199 #here I create the Abl seqs with proper value for each number | |
| 200 if (1==0){ | |
| 201 Ablnumber1<- gsub("A",A,Ablnumber1,perl = TRUE) | |
| 202 Ablnumber1<- gsub("C",C,Ablnumber1,perl = TRUE) | |
| 203 Ablnumber1<- gsub("D",D,Ablnumber1,perl = TRUE) | |
| 204 Ablnumber1<- gsub("E",E,Ablnumber1,perl = TRUE) | |
| 205 Ablnumber1<- gsub("F",F,Ablnumber1,perl = TRUE) | |
| 206 Ablnumber1<- gsub("G",G,Ablnumber1,perl = TRUE) | |
| 207 Ablnumber1<- gsub("H",H,Ablnumber1,perl = TRUE) | |
| 208 Ablnumber1<- gsub("I",I,Ablnumber1,perl = TRUE) | |
| 209 Ablnumber1<- gsub("K",K,Ablnumber1,perl = TRUE) | |
| 210 Ablnumber1<- gsub("L",L,Ablnumber1,perl = TRUE) | |
| 211 Ablnumber1<- gsub("M",M,Ablnumber1,perl = TRUE) | |
| 212 Ablnumber1<- gsub("N",N,Ablnumber1,perl = TRUE) | |
| 213 Ablnumber1<- gsub("P",P,Ablnumber1,perl = TRUE) | |
| 214 Ablnumber1<- gsub("Q",Q,Ablnumber1,perl = TRUE) | |
| 215 Ablnumber1<- gsub("R",R,Ablnumber1,perl = TRUE) | |
| 216 Ablnumber1<- gsub("S",S,Ablnumber1,perl = TRUE) | |
| 217 Ablnumber1<- gsub("T",T,Ablnumber1,perl = TRUE) | |
| 218 Ablnumber1<- gsub("V",V,Ablnumber1,perl = TRUE) | |
| 219 Ablnumber1<- gsub("W",W,Ablnumber1,perl = TRUE) | |
| 220 Ablnumber1<- gsub("Y",Y,Ablnumber1,perl = TRUE) | |
| 221 | |
| 222 Ablnumber2<- gsub("A",A,Ablnumber2,perl = TRUE) | |
| 223 Ablnumber2<- gsub("C",C,Ablnumber2,perl = TRUE) | |
| 224 Ablnumber2<- gsub("D",D,Ablnumber2,perl = TRUE) | |
| 225 Ablnumber2<- gsub("E",E,Ablnumber2,perl = TRUE) | |
| 226 Ablnumber2<- gsub("F",F,Ablnumber2,perl = TRUE) | |
| 227 Ablnumber2<- gsub("G",G,Ablnumber2,perl = TRUE) | |
| 228 Ablnumber2<- gsub("H",H,Ablnumber2,perl = TRUE) | |
| 229 Ablnumber2<- gsub("I",I,Ablnumber2,perl = TRUE) | |
| 230 Ablnumber2<- gsub("K",K,Ablnumber2,perl = TRUE) | |
| 231 Ablnumber2<- gsub("L",L,Ablnumber2,perl = TRUE) | |
| 232 Ablnumber2<- gsub("M",M,Ablnumber2,perl = TRUE) | |
| 233 Ablnumber2<- gsub("N",N,Ablnumber2,perl = TRUE) | |
| 234 Ablnumber2<- gsub("P",P,Ablnumber2,perl = TRUE) | |
| 235 Ablnumber2<- gsub("Q",Q,Ablnumber2,perl = TRUE) | |
| 236 Ablnumber2<- gsub("R",R,Ablnumber2,perl = TRUE) | |
| 237 Ablnumber2<- gsub("S",S,Ablnumber2,perl = TRUE) | |
| 238 Ablnumber2<- gsub("T",T,Ablnumber2,perl = TRUE) | |
| 239 Ablnumber2<- gsub("V",V,Ablnumber2,perl = TRUE) | |
| 240 Ablnumber2<- gsub("W",W,Ablnumber2,perl = TRUE) | |
| 241 Ablnumber2<- gsub("Y",Y,Ablnumber2,perl = TRUE) | |
| 242 | |
| 243 Ablnumber3<- gsub("A",A,Ablnumber3,perl = TRUE) | |
| 244 Ablnumber3<- gsub("C",C,Ablnumber3,perl = TRUE) | |
| 245 Ablnumber3<- gsub("D",D,Ablnumber3,perl = TRUE) | |
| 246 Ablnumber3<- gsub("E",E,Ablnumber3,perl = TRUE) | |
| 247 Ablnumber3<- gsub("F",F,Ablnumber3,perl = TRUE) | |
| 248 Ablnumber3<- gsub("G",G,Ablnumber3,perl = TRUE) | |
| 249 Ablnumber3<- gsub("H",H,Ablnumber3,perl = TRUE) | |
| 250 Ablnumber3<- gsub("I",I,Ablnumber3,perl = TRUE) | |
| 251 Ablnumber3<- gsub("K",K,Ablnumber3,perl = TRUE) | |
| 252 Ablnumber3<- gsub("L",L,Ablnumber3,perl = TRUE) | |
| 253 Ablnumber3<- gsub("M",M,Ablnumber3,perl = TRUE) | |
| 254 Ablnumber3<- gsub("N",N,Ablnumber3,perl = TRUE) | |
| 255 Ablnumber3<- gsub("P",P,Ablnumber3,perl = TRUE) | |
| 256 Ablnumber3<- gsub("Q",Q,Ablnumber3,perl = TRUE) | |
| 257 Ablnumber3<- gsub("R",R,Ablnumber3,perl = TRUE) | |
| 258 Ablnumber3<- gsub("S",S,Ablnumber3,perl = TRUE) | |
| 259 Ablnumber3<- gsub("T",T,Ablnumber3,perl = TRUE) | |
| 260 Ablnumber3<- gsub("V",V,Ablnumber3,perl = TRUE) | |
| 261 Ablnumber3<- gsub("W",W,Ablnumber3,perl = TRUE) | |
| 262 Ablnumber3<- gsub("Y",Y,Ablnumber3,perl = TRUE) | |
| 263 | |
| 264 Ablnumber4<- gsub("A",A,Ablnumber4,perl = TRUE) | |
| 265 Ablnumber4<- gsub("C",C,Ablnumber4,perl = TRUE) | |
| 266 Ablnumber4<- gsub("D",D,Ablnumber4,perl = TRUE) | |
| 267 Ablnumber4<- gsub("E",E,Ablnumber4,perl = TRUE) | |
| 268 Ablnumber4<- gsub("F",F,Ablnumber4,perl = TRUE) | |
| 269 Ablnumber4<- gsub("G",G,Ablnumber4,perl = TRUE) | |
| 270 Ablnumber4<- gsub("H",H,Ablnumber4,perl = TRUE) | |
| 271 Ablnumber4<- gsub("I",I,Ablnumber4,perl = TRUE) | |
| 272 Ablnumber4<- gsub("K",K,Ablnumber4,perl = TRUE) | |
| 273 Ablnumber4<- gsub("L",L,Ablnumber4,perl = TRUE) | |
| 274 Ablnumber4<- gsub("M",M,Ablnumber4,perl = TRUE) | |
| 275 Ablnumber4<- gsub("N",N,Ablnumber4,perl = TRUE) | |
| 276 Ablnumber4<- gsub("P",P,Ablnumber4,perl = TRUE) | |
| 277 Ablnumber4<- gsub("Q",Q,Ablnumber4,perl = TRUE) | |
| 278 Ablnumber4<- gsub("R",R,Ablnumber4,perl = TRUE) | |
| 279 Ablnumber4<- gsub("S",S,Ablnumber4,perl = TRUE) | |
| 280 Ablnumber4<- gsub("T",T,Ablnumber4,perl = TRUE) | |
| 281 Ablnumber4<- gsub("V",V,Ablnumber4,perl = TRUE) | |
| 282 Ablnumber4<- gsub("W",W,Ablnumber4,perl = TRUE) | |
| 283 Ablnumber4<- gsub("Y",Y,Ablnumber4,perl = TRUE) | |
| 284 | |
| 285 Ablnumber5<- gsub("A",A,Ablnumber5,perl = TRUE) | |
| 286 Ablnumber5<- gsub("C",C,Ablnumber5,perl = TRUE) | |
| 287 Ablnumber5<- gsub("D",D,Ablnumber5,perl = TRUE) | |
| 288 Ablnumber5<- gsub("E",E,Ablnumber5,perl = TRUE) | |
| 289 Ablnumber5<- gsub("F",F,Ablnumber5,perl = TRUE) | |
| 290 Ablnumber5<- gsub("G",G,Ablnumber5,perl = TRUE) | |
| 291 Ablnumber5<- gsub("H",H,Ablnumber5,perl = TRUE) | |
| 292 Ablnumber5<- gsub("I",I,Ablnumber5,perl = TRUE) | |
| 293 Ablnumber5<- gsub("K",K,Ablnumber5,perl = TRUE) | |
| 294 Ablnumber5<- gsub("L",L,Ablnumber5,perl = TRUE) | |
| 295 Ablnumber5<- gsub("M",M,Ablnumber5,perl = TRUE) | |
| 296 Ablnumber5<- gsub("N",N,Ablnumber5,perl = TRUE) | |
| 297 Ablnumber5<- gsub("P",P,Ablnumber5,perl = TRUE) | |
| 298 Ablnumber5<- gsub("Q",Q,Ablnumber5,perl = TRUE) | |
| 299 Ablnumber5<- gsub("R",R,Ablnumber5,perl = TRUE) | |
| 300 Ablnumber5<- gsub("S",S,Ablnumber5,perl = TRUE) | |
| 301 Ablnumber5<- gsub("T",T,Ablnumber5,perl = TRUE) | |
| 302 Ablnumber5<- gsub("V",V,Ablnumber5,perl = TRUE) | |
| 303 Ablnumber5<- gsub("W",W,Ablnumber5,perl = TRUE) | |
| 304 Ablnumber5<- gsub("Y",Y,Ablnumber5,perl = TRUE) | |
| 305 | |
| 306 Ablnumber6<- gsub("A",A,Ablnumber6,perl = TRUE) | |
| 307 Ablnumber6<- gsub("C",C,Ablnumber6,perl = TRUE) | |
| 308 Ablnumber6<- gsub("D",D,Ablnumber6,perl = TRUE) | |
| 309 Ablnumber6<- gsub("E",E,Ablnumber6,perl = TRUE) | |
| 310 Ablnumber6<- gsub("F",F,Ablnumber6,perl = TRUE) | |
| 311 Ablnumber6<- gsub("G",G,Ablnumber6,perl = TRUE) | |
| 312 Ablnumber6<- gsub("H",H,Ablnumber6,perl = TRUE) | |
| 313 Ablnumber6<- gsub("I",I,Ablnumber6,perl = TRUE) | |
| 314 Ablnumber6<- gsub("K",K,Ablnumber6,perl = TRUE) | |
| 315 Ablnumber6<- gsub("L",L,Ablnumber6,perl = TRUE) | |
| 316 Ablnumber6<- gsub("M",M,Ablnumber6,perl = TRUE) | |
| 317 Ablnumber6<- gsub("N",N,Ablnumber6,perl = TRUE) | |
| 318 Ablnumber6<- gsub("P",P,Ablnumber6,perl = TRUE) | |
| 319 Ablnumber6<- gsub("Q",Q,Ablnumber6,perl = TRUE) | |
| 320 Ablnumber6<- gsub("R",R,Ablnumber6,perl = TRUE) | |
| 321 Ablnumber6<- gsub("S",S,Ablnumber6,perl = TRUE) | |
| 322 Ablnumber6<- gsub("T",T,Ablnumber6,perl = TRUE) | |
| 323 Ablnumber6<- gsub("V",V,Ablnumber6,perl = TRUE) | |
| 324 Ablnumber6<- gsub("W",W,Ablnumber6,perl = TRUE) | |
| 325 Ablnumber6<- gsub("Y",Y,Ablnumber6,perl = TRUE) | |
| 326 | |
| 327 Ablnumber7<- gsub("A",A,Ablnumber7,perl = TRUE) | |
| 328 Ablnumber7<- gsub("C",C,Ablnumber7,perl = TRUE) | |
| 329 Ablnumber7<- gsub("D",D,Ablnumber7,perl = TRUE) | |
| 330 Ablnumber7<- gsub("E",E,Ablnumber7,perl = TRUE) | |
| 331 Ablnumber7<- gsub("F",F,Ablnumber7,perl = TRUE) | |
| 332 Ablnumber7<- gsub("G",G,Ablnumber7,perl = TRUE) | |
| 333 Ablnumber7<- gsub("H",H,Ablnumber7,perl = TRUE) | |
| 334 Ablnumber7<- gsub("I",I,Ablnumber7,perl = TRUE) | |
| 335 Ablnumber7<- gsub("K",K,Ablnumber7,perl = TRUE) | |
| 336 Ablnumber7<- gsub("L",L,Ablnumber7,perl = TRUE) | |
| 337 Ablnumber7<- gsub("M",M,Ablnumber7,perl = TRUE) | |
| 338 Ablnumber7<- gsub("N",N,Ablnumber7,perl = TRUE) | |
| 339 Ablnumber7<- gsub("P",P,Ablnumber7,perl = TRUE) | |
| 340 Ablnumber7<- gsub("Q",Q,Ablnumber7,perl = TRUE) | |
| 341 Ablnumber7<- gsub("R",R,Ablnumber7,perl = TRUE) | |
| 342 Ablnumber7<- gsub("S",S,Ablnumber7,perl = TRUE) | |
| 343 Ablnumber7<- gsub("T",T,Ablnumber7,perl = TRUE) | |
| 344 Ablnumber7<- gsub("V",V,Ablnumber7,perl = TRUE) | |
| 345 Ablnumber7<- gsub("W",W,Ablnumber7,perl = TRUE) | |
| 346 Ablnumber7<- gsub("Y",Y,Ablnumber7,perl = TRUE) | |
| 347 | |
| 348 Ablnumber8<- gsub("A",A,Ablnumber8,perl = TRUE) | |
| 349 Ablnumber8<- gsub("C",C,Ablnumber8,perl = TRUE) | |
| 350 Ablnumber8<- gsub("D",D,Ablnumber8,perl = TRUE) | |
| 351 Ablnumber8<- gsub("E",E,Ablnumber8,perl = TRUE) | |
| 352 Ablnumber8<- gsub("F",F,Ablnumber8,perl = TRUE) | |
| 353 Ablnumber8<- gsub("G",G,Ablnumber8,perl = TRUE) | |
| 354 Ablnumber8<- gsub("H",H,Ablnumber8,perl = TRUE) | |
| 355 Ablnumber8<- gsub("I",I,Ablnumber8,perl = TRUE) | |
| 356 Ablnumber8<- gsub("K",K,Ablnumber8,perl = TRUE) | |
| 357 Ablnumber8<- gsub("L",L,Ablnumber8,perl = TRUE) | |
| 358 Ablnumber8<- gsub("M",M,Ablnumber8,perl = TRUE) | |
| 359 Ablnumber8<- gsub("N",N,Ablnumber8,perl = TRUE) | |
| 360 Ablnumber8<- gsub("P",P,Ablnumber8,perl = TRUE) | |
| 361 Ablnumber8<- gsub("Q",Q,Ablnumber8,perl = TRUE) | |
| 362 Ablnumber8<- gsub("R",R,Ablnumber8,perl = TRUE) | |
| 363 Ablnumber8<- gsub("S",S,Ablnumber8,perl = TRUE) | |
| 364 Ablnumber8<- gsub("T",T,Ablnumber8,perl = TRUE) | |
| 365 Ablnumber8<- gsub("V",V,Ablnumber8,perl = TRUE) | |
| 366 Ablnumber8<- gsub("W",W,Ablnumber8,perl = TRUE) | |
| 367 Ablnumber8<- gsub("Y",Y,Ablnumber8,perl = TRUE) | |
| 368 | |
| 369 Ablnumber9<- gsub("A",A,Ablnumber9,perl = TRUE) | |
| 370 Ablnumber9<- gsub("C",C,Ablnumber9,perl = TRUE) | |
| 371 Ablnumber9<- gsub("D",D,Ablnumber9,perl = TRUE) | |
| 372 Ablnumber9<- gsub("E",E,Ablnumber9,perl = TRUE) | |
| 373 Ablnumber9<- gsub("F",F,Ablnumber9,perl = TRUE) | |
| 374 Ablnumber9<- gsub("G",G,Ablnumber9,perl = TRUE) | |
| 375 Ablnumber9<- gsub("H",H,Ablnumber9,perl = TRUE) | |
| 376 Ablnumber9<- gsub("I",I,Ablnumber9,perl = TRUE) | |
| 377 Ablnumber9<- gsub("K",K,Ablnumber9,perl = TRUE) | |
| 378 Ablnumber9<- gsub("L",L,Ablnumber9,perl = TRUE) | |
| 379 Ablnumber9<- gsub("M",M,Ablnumber9,perl = TRUE) | |
| 380 Ablnumber9<- gsub("N",N,Ablnumber9,perl = TRUE) | |
| 381 Ablnumber9<- gsub("P",P,Ablnumber9,perl = TRUE) | |
| 382 Ablnumber9<- gsub("Q",Q,Ablnumber9,perl = TRUE) | |
| 383 Ablnumber9<- gsub("R",R,Ablnumber9,perl = TRUE) | |
| 384 Ablnumber9<- gsub("S",S,Ablnumber9,perl = TRUE) | |
| 385 Ablnumber9<- gsub("T",T,Ablnumber9,perl = TRUE) | |
| 386 Ablnumber9<- gsub("V",V,Ablnumber9,perl = TRUE) | |
| 387 Ablnumber9<- gsub("W",W,Ablnumber9,perl = TRUE) | |
| 388 Ablnumber9<- gsub("Y",Y,Ablnumber9,perl = TRUE) | |
| 389 } | |
| 390 ######################################## | |
| 391 | |
| 392 | |
| 393 total=length(Positionp7)*length(Positionp6)*length(Positionp5)*length(Positionp4)*length(Positionp3)*(length(Positionp2))*length(Positionp1)* | |
| 394 length(Positiond0)*length(Positionm1)*length(Positionm2)*length(Positionm3)*length(Positionm4)*length(Positionm5)*length(Positionm6)*length(Positionm7) | |
| 395 #this is just a way to doublecheck that the length of the generated peptides vector is correct | |
| 396 | |
| 397 GeneratedPeptides<-rep(NA, times=total*15) | |
| 398 GeneratedPeptides<-matrix(data = GeneratedPeptides,ncol = 15) | |
| 399 | |
| 400 NumeratedPeptides<-GeneratedPeptides | |
| 401 #create an empty vector of correct length by finding the number of each AAs per position and multiplying them | |
| 402 count<-0 | |
| 403 for (t in 1:length(Positionm7)) { | |
| 404 for (s in 1:length(Positionm6)) { | |
| 405 for (r in 1:length(Positionm5)) { | |
| 406 for (i in 1:length(Positionm4)) { | |
| 407 for (j in 1:length(Positionm3)) { | |
| 408 for (k in 1:length(Positionm2)) { | |
| 409 for (l in 1:length(Positionm1)) { | |
| 410 for (m in 1:length(Positiond0)) { | |
| 411 for (n in 1:length(Positionp1)) { | |
| 412 for (o in 1:length(Positionp2)) { | |
| 413 for (p in 1:length(Positionp3)) { | |
| 414 for (q in 1:length(Positionp4)) { | |
| 415 for (u in 1:length(Positionp5)) { | |
| 416 for (v in 1:length(Positionp6)) { | |
| 417 for (w in 1:length(Positionp7)) { | |
| 418 # i=1 | |
| 419 # j=1 | |
| 420 # k=1 | |
| 421 # l=1 | |
| 422 # m=1 | |
| 423 # n=1 | |
| 424 # o=1 | |
| 425 # p=1 | |
| 426 # q=1 | |
| 427 # | |
| 428 #for every single position, increment the count number, create a peptide using the AAs at that position | |
| 429 #then put them together into the generated peptides sequencex | |
| 430 count<-count+1 | |
| 431 tabulation<-c(Positionm7[t],Positionm6[s],Positionm5[r],Positionm4[i],Positionm3[j],Positionm2[k],Positionm1[l],Positiond0[m],Positionp1[n], | |
| 432 Positionp2[o],Positionp3[p],Positionp4[q],Positionp5[u],Positionp6[v],Positionp7[w]) | |
| 433 numeration<-c(number15[t],number14[s],number13[r],number1[i],number2[j],number3[k],number4[l],number5[m],number6[n],number7[o],number8[p],number9[q],number10[u],number11[v], | |
| 434 number12[w]) | |
| 435 #tabulation<-paste(tabulation, sep="", collapse="") | |
| 436 GeneratedPeptides[count,1:15]<-tabulation | |
| 437 NumeratedPeptides[count,1:15]<-numeration | |
| 438 } | |
| 439 } | |
| 440 } | |
| 441 } | |
| 442 } | |
| 443 } | |
| 444 } | |
| 445 } | |
| 446 } | |
| 447 } | |
| 448 } | |
| 449 } | |
| 450 } | |
| 451 } | |
| 452 } | |
| 453 #################################################################### | |
| 454 #now here I use the Endogenous Probabilty matrix from the previous script, which is called EMPtable | |
| 455 #to score the created peptides | |
| 456 ThisKinTable<-EPMtableu#[1:nrow(SDtable),] | |
| 457 TKTcolumn<-c(data=rep(1,times=21)) | |
| 458 TKTcolumn<-as.matrix(TKTcolumn,ncol=1) | |
| 459 ThisKinTable<-cbind(TKTcolumn,ThisKinTable) | |
| 460 | |
| 461 ThisKinGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 462 ThisKinGenWeirdScore<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 463 | |
| 464 for (x in 1:nrow(GeneratedPeptides)){ | |
| 465 Scoringpeptide<-NumeratedPeptides[x,1:15] | |
| 466 Scoringpeptide<-Scoringpeptide+1 | |
| 467 ThisKinTableScore<-as.numeric(ThisKinTable[Scoringpeptide[1],3])*ThisKinTable[as.numeric(Scoringpeptide[2]),4]*ThisKinTable[as.numeric(Scoringpeptide[3]),5]* | |
| 468 ThisKinTable[as.numeric(Scoringpeptide[4]),6]*ThisKinTable[as.numeric(Scoringpeptide[5]),7]*ThisKinTable[as.numeric(Scoringpeptide[6]),8]*ThisKinTable[as.numeric(Scoringpeptide[7]),9]* | |
| 469 #ThisKinTable[as.numeric(Scoringpeptide[8]),10]* | |
| 470 ThisKinTable[as.numeric(Scoringpeptide[9]),11]*ThisKinTable[as.numeric(Scoringpeptide[10]),12]*ThisKinTable[as.numeric(Scoringpeptide[11]),13]* | |
| 471 ThisKinTable[as.numeric(Scoringpeptide[12]),14]*ThisKinTable[as.numeric(Scoringpeptide[13]),15]*ThisKinTable[as.numeric(Scoringpeptide[14]),16]*ThisKinTable[as.numeric(Scoringpeptide[15]),17] | |
| 472 ThisKinGeneratedScores[x]<-ThisKinTableScore | |
| 473 ThisKinTableScore<-(ThisKinTableScore/(ThisKinTableScore+1/as.numeric(NormalizationScore[2]))) | |
| 474 ThisKinGenWeirdScore[x]<-ThisKinTableScore | |
| 475 } | |
| 476 | |
| 477 AblGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 478 ArgGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 479 BtkGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 480 CskGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 481 FynGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 482 HckGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 483 JAK2GeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 484 LckGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 485 LynGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 486 Pyk2GeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 487 SrcGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 488 SykGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 489 YesGeneratedScores<-rep(NA,times=nrow(GeneratedPeptides)) | |
| 490 | |
| 491 | |
| 492 for (x in 1:nrow(GeneratedPeptides)){ | |
| 493 Scoringpeptide<-NumeratedPeptides[x,1:15] | |
| 494 AblScore<-Abl[Scoringpeptide[1],2]*Abl[Scoringpeptide[2],3]*Abl[Scoringpeptide[3],4]*Abl[Scoringpeptide[4],5]*Abl[Scoringpeptide[5],6]*Abl[Scoringpeptide[6],7]* | |
| 495 Abl[Scoringpeptide[7],8]*Abl[Scoringpeptide[9],10]*Abl[Scoringpeptide[10],11]*Abl[Scoringpeptide[11],12]*Abl[Scoringpeptide[12],13]* | |
| 496 Abl[Scoringpeptide[13],14]*Abl[Scoringpeptide[14],15]*Abl[Scoringpeptide[15],16] | |
| 497 AblGeneratedScores[x]<-AblScore | |
| 498 | |
| 499 ArgScore<-Arg[Scoringpeptide[1],2]*Arg[Scoringpeptide[2],3]*Arg[Scoringpeptide[3],4]*Arg[Scoringpeptide[4],5]*Arg[Scoringpeptide[5],6]*Arg[Scoringpeptide[6],7]* | |
| 500 Arg[Scoringpeptide[7],8]*Arg[Scoringpeptide[9],10]*Arg[Scoringpeptide[10],11]*Arg[Scoringpeptide[11],12]*Arg[Scoringpeptide[12],13]* | |
| 501 Arg[Scoringpeptide[13],14]*Arg[Scoringpeptide[14],15]*Arg[Scoringpeptide[15],16] | |
| 502 ArgGeneratedScores[x]<-ArgScore | |
| 503 | |
| 504 BtkScore<-Btk[Scoringpeptide[1],2]*Btk[Scoringpeptide[2],3]*Btk[Scoringpeptide[3],4]*Btk[Scoringpeptide[4],5]*Btk[Scoringpeptide[5],6]*Btk[Scoringpeptide[6],7]* | |
| 505 Btk[Scoringpeptide[7],8]*Btk[Scoringpeptide[9],10]*Btk[Scoringpeptide[10],11]*Btk[Scoringpeptide[11],12]*Btk[Scoringpeptide[12],13]* | |
| 506 Btk[Scoringpeptide[13],14]*Btk[Scoringpeptide[14],15]*Btk[Scoringpeptide[15],16] | |
| 507 BtkGeneratedScores[x]<-BtkScore | |
| 508 | |
| 509 CskScore<-Csk[Scoringpeptide[1],2]*Csk[Scoringpeptide[2],3]*Csk[Scoringpeptide[3],4]*Csk[Scoringpeptide[4],5]*Csk[Scoringpeptide[5],6]*Csk[Scoringpeptide[6],7]* | |
| 510 Csk[Scoringpeptide[7],8]*Csk[Scoringpeptide[9],10]*Csk[Scoringpeptide[10],11]*Csk[Scoringpeptide[11],12]*Csk[Scoringpeptide[12],13]* | |
| 511 Csk[Scoringpeptide[13],14]*Csk[Scoringpeptide[14],15]*Csk[Scoringpeptide[15],16] | |
| 512 CskGeneratedScores[x]<-CskScore | |
| 513 | |
| 514 FynScore<-Fyn[Scoringpeptide[1],2]*Fyn[Scoringpeptide[2],3]*Fyn[Scoringpeptide[3],4]*Fyn[Scoringpeptide[4],5]*Fyn[Scoringpeptide[5],6]*Fyn[Scoringpeptide[6],7]* | |
| 515 Fyn[Scoringpeptide[7],8]*Fyn[Scoringpeptide[9],10]*Fyn[Scoringpeptide[10],11]*Fyn[Scoringpeptide[11],12]*Fyn[Scoringpeptide[12],13]* | |
| 516 Fyn[Scoringpeptide[13],14]*Fyn[Scoringpeptide[14],15]*Fyn[Scoringpeptide[15],16] | |
| 517 FynGeneratedScores[x]<-FynScore | |
| 518 | |
| 519 HckScore<-Hck[Scoringpeptide[1],2]*Hck[Scoringpeptide[2],3]*Hck[Scoringpeptide[3],4]*Hck[Scoringpeptide[4],5]*Hck[Scoringpeptide[5],6]*Hck[Scoringpeptide[6],7]* | |
| 520 Hck[Scoringpeptide[7],8]*Hck[Scoringpeptide[9],10]*Hck[Scoringpeptide[10],11]*Hck[Scoringpeptide[11],12]*Hck[Scoringpeptide[12],13]* | |
| 521 Hck[Scoringpeptide[13],14]*Hck[Scoringpeptide[14],15]*Hck[Scoringpeptide[15],16] | |
| 522 HckGeneratedScores[x]<-HckScore | |
| 523 | |
| 524 JAK2Score<-JAK2[Scoringpeptide[1],2]*JAK2[Scoringpeptide[2],3]*JAK2[Scoringpeptide[3],4]*JAK2[Scoringpeptide[4],5]*JAK2[Scoringpeptide[5],6]*JAK2[Scoringpeptide[6],7]* | |
| 525 JAK2[Scoringpeptide[7],8]*JAK2[Scoringpeptide[9],10]*JAK2[Scoringpeptide[10],11]*JAK2[Scoringpeptide[11],12]*JAK2[Scoringpeptide[12],13]* | |
| 526 JAK2[Scoringpeptide[13],14]*JAK2[Scoringpeptide[14],15]*JAK2[Scoringpeptide[15],16] | |
| 527 JAK2GeneratedScores[x]<-JAK2Score | |
| 528 | |
| 529 LckScore<-Lck[Scoringpeptide[1],2]*Lck[Scoringpeptide[2],3]*Lck[Scoringpeptide[3],4]*Lck[Scoringpeptide[4],5]*Lck[Scoringpeptide[5],6]*Lck[Scoringpeptide[6],7]* | |
| 530 Lck[Scoringpeptide[7],8]*Lck[Scoringpeptide[9],10]*Lck[Scoringpeptide[10],11]*Lck[Scoringpeptide[11],12]*Lck[Scoringpeptide[12],13]* | |
| 531 Lck[Scoringpeptide[13],14]*Lck[Scoringpeptide[14],15]*Lck[Scoringpeptide[15],16] | |
| 532 LckGeneratedScores[x]<-LckScore | |
| 533 | |
| 534 LynScore<-Lyn[Scoringpeptide[1],2]*Lyn[Scoringpeptide[2],3]*Lyn[Scoringpeptide[3],4]*Lyn[Scoringpeptide[4],5]*Lyn[Scoringpeptide[5],6]*Lyn[Scoringpeptide[6],7]* | |
| 535 Lyn[Scoringpeptide[7],8]*Lyn[Scoringpeptide[9],10]*Lyn[Scoringpeptide[10],11]*Lyn[Scoringpeptide[11],12]*Lyn[Scoringpeptide[12],13]* | |
| 536 Lyn[Scoringpeptide[13],14]*Lyn[Scoringpeptide[14],15]*Lyn[Scoringpeptide[15],16] | |
| 537 LynGeneratedScores[x]<-LynScore | |
| 538 | |
| 539 Pyk2Score<-Pyk2[Scoringpeptide[1],2]*Pyk2[Scoringpeptide[2],3]*Pyk2[Scoringpeptide[3],4]*Pyk2[Scoringpeptide[4],5]*Pyk2[Scoringpeptide[5],6]*Pyk2[Scoringpeptide[6],7]* | |
| 540 Pyk2[Scoringpeptide[7],8]*Pyk2[Scoringpeptide[9],10]*Pyk2[Scoringpeptide[10],11]*Pyk2[Scoringpeptide[11],12]*Pyk2[Scoringpeptide[12],13]* | |
| 541 Pyk2[Scoringpeptide[13],14]*Pyk2[Scoringpeptide[14],15]*Pyk2[Scoringpeptide[15],16] | |
| 542 Pyk2GeneratedScores[x]<-Pyk2Score | |
| 543 | |
| 544 SrcScore<-Src[Scoringpeptide[1],2]*Src[Scoringpeptide[2],3]*Src[Scoringpeptide[3],4]*Src[Scoringpeptide[4],5]*Src[Scoringpeptide[5],6]*Src[Scoringpeptide[6],7]* | |
| 545 Src[Scoringpeptide[7],8]*Src[Scoringpeptide[9],10]*Src[Scoringpeptide[10],11]*Src[Scoringpeptide[11],12]*Src[Scoringpeptide[12],13]* | |
| 546 Src[Scoringpeptide[13],14]*Src[Scoringpeptide[14],15]*Src[Scoringpeptide[15],16] | |
| 547 SrcGeneratedScores[x]<-SrcScore | |
| 548 | |
| 549 SykScore<-Syk[Scoringpeptide[1],2]*Syk[Scoringpeptide[2],3]*Syk[Scoringpeptide[3],4]*Syk[Scoringpeptide[4],5]*Syk[Scoringpeptide[5],6]*Syk[Scoringpeptide[6],7]* | |
| 550 Syk[Scoringpeptide[7],8]*Syk[Scoringpeptide[9],10]*Syk[Scoringpeptide[10],11]*Syk[Scoringpeptide[11],12]*Syk[Scoringpeptide[12],13]* | |
| 551 Syk[Scoringpeptide[13],14]*Syk[Scoringpeptide[14],15]*Syk[Scoringpeptide[15],16] | |
| 552 SykGeneratedScores[x]<-SykScore | |
| 553 | |
| 554 YesScore<-Yes[Scoringpeptide[1],2]*Yes[Scoringpeptide[2],3]*Yes[Scoringpeptide[3],4]*Yes[Scoringpeptide[4],5]*Yes[Scoringpeptide[5],6]*Yes[Scoringpeptide[6],7]* | |
| 555 Yes[Scoringpeptide[7],8]*Yes[Scoringpeptide[9],10]*Yes[Scoringpeptide[10],11]*Yes[Scoringpeptide[11],12]*Yes[Scoringpeptide[12],13]* | |
| 556 Yes[Scoringpeptide[13],14]*Yes[Scoringpeptide[14],15]*Yes[Scoringpeptide[15],16] | |
| 557 YesGeneratedScores[x]<-YesScore | |
| 558 | |
| 559 # ThisKinTableScore<-ThisKinTable[as.numeric(Scoringpeptide[1]),3]*ThisKinTable[as.numeric(Scoringpeptide[2]),4]*ThisKinTable[as.numeric(Scoringpeptide[3]),5]* | |
| 560 # ThisKinTable[as.numeric(Scoringpeptide[4]),6]*ThisKinTable[as.numeric(Scoringpeptide[6]),8]* | |
| 561 # ThisKinTable[as.numeric(Scoringpeptide[7]),9]*ThisKinTable[as.numeric(Scoringpeptide[8]),10]*ThisKinTable[as.numeric(Scoringpeptide[9]),11] | |
| 562 # ThisKinGeneratedScores[x]<-ThisKinTableScore | |
| 563 } | |
| 564 | |
| 565 | |
| 566 | |
| 567 AblNorm<-1/as.numeric(Abl[22,1]) | |
| 568 AblThresh<-as.numeric(Abl[24,1]) | |
| 569 AblTrueThresh<-((AblThresh*AblNorm)/(100-AblThresh)) | |
| 570 AblActive<-unlist(AblGeneratedScores)>AblTrueThresh | |
| 571 | |
| 572 ArgNorm<-1/as.numeric(Arg[22,1]) | |
| 573 ArgThresh<-as.numeric(Arg[24,1]) | |
| 574 ArgTrueThresh<-((ArgThresh*ArgNorm)/(100-ArgThresh)) | |
| 575 ArgActive<-unlist(ArgGeneratedScores)>ArgTrueThresh | |
| 576 | |
| 577 BtkNorm<-1/as.numeric(Btk[22,1]) | |
| 578 BtkThresh<-as.numeric(Btk[24,1]) | |
| 579 BtkTrueThresh<-((BtkThresh*BtkNorm)/(100-BtkThresh)) | |
| 580 BtkActive<-unlist(BtkGeneratedScores)>BtkTrueThresh | |
| 581 | |
| 582 CskNorm<-1/as.numeric(Csk[22,1]) | |
| 583 CskThresh<-as.numeric(Csk[24,1]) | |
| 584 CskTrueThresh<-((CskThresh*CskNorm)/(100-CskThresh)) | |
| 585 CskActive<-(CskGeneratedScores)>CskTrueThresh | |
| 586 | |
| 587 FynNorm<-1/as.numeric(Fyn[22,1]) | |
| 588 FynThresh<-as.numeric(Fyn[24,1]) | |
| 589 FynTrueThresh<-((FynThresh*FynNorm)/(100-FynThresh)) | |
| 590 FynActive<-unlist(FynGeneratedScores)>FynTrueThresh | |
| 591 | |
| 592 HckNorm<-1/as.numeric(Hck[22,1]) | |
| 593 HckThresh<-as.numeric(Hck[24,1]) | |
| 594 HckTrueThresh<-((HckThresh*HckNorm)/(100-HckThresh)) | |
| 595 HckActive<-unlist(HckGeneratedScores)>HckTrueThresh | |
| 596 | |
| 597 JAK2Norm<-1/as.numeric(JAK2[22,1]) | |
| 598 JAK2Thresh<-as.numeric(JAK2[24,1]) | |
| 599 JAK2TrueThresh<-((JAK2Thresh*JAK2Norm)/(100-JAK2Thresh)) | |
| 600 JAk2Active<-unlist(JAK2GeneratedScores)>JAK2TrueThresh | |
| 601 | |
| 602 LckNorm<-1/as.numeric(Lck[22,1]) | |
| 603 LckThresh<-as.numeric(Lck[24,1]) | |
| 604 LckTrueThresh<-((LckThresh*LckNorm)/(100-LckThresh)) | |
| 605 LckActive<-unlist(LckGeneratedScores)>LckTrueThresh | |
| 606 | |
| 607 LynNorm<-1/as.numeric(Lyn[22,1]) | |
| 608 LynThresh<-as.numeric(Lyn[24,1]) | |
| 609 LynTrueThresh<-((LynThresh*LynNorm)/(100-LynThresh)) | |
| 610 LynActive<-unlist(LynGeneratedScores)>LynTrueThresh | |
| 611 | |
| 612 Pyk2Norm<-1/as.numeric(Pyk2[22,1]) | |
| 613 Pyk2Thresh<-as.numeric(Pyk2[24,1]) | |
| 614 Pyk2TrueThresh<-((Pyk2Thresh*Pyk2Norm)/(100-Pyk2Thresh)) | |
| 615 Pyk2Active<-unlist(Pyk2GeneratedScores)>Pyk2TrueThresh | |
| 616 | |
| 617 SrcNorm<-1/as.numeric(Src[22,1]) | |
| 618 SrcThresh<-as.numeric(Src[24,1]) | |
| 619 SrcTrueThresh<-((SrcThresh*SrcNorm)/(100-SrcThresh)) | |
| 620 SrcActive<-unlist(SrcGeneratedScores)>SrcTrueThresh | |
| 621 | |
| 622 SykNorm<-1/as.numeric(Syk[22,1]) | |
| 623 SykThresh<-as.numeric(Syk[24,1]) | |
| 624 SykTrueThresh<-((SykThresh*SykNorm)/(100-SykThresh)) | |
| 625 SykActive<-unlist(SykGeneratedScores)>SykTrueThresh | |
| 626 | |
| 627 YesNorm<-1/as.numeric(Yes[22,1]) | |
| 628 YesThresh<-as.numeric(Yes[24,1]) | |
| 629 YesTrueThresh<-((YesThresh*YesNorm)/(100-YesThresh)) | |
| 630 YesActive<-unlist(YesGeneratedScores)>YesTrueThresh | |
| 631 | |
| 632 AllActive<-AblActive+ArgActive+BtkActive+CskActive+FynActive+HckActive+JAk2Active+LckActive+LynActive+Pyk2Active+SrcActive+SykActive+YesActive | |
| 633 #Btkactive+ | |
| 634 | |
| 635 Scores<-ThisKinGeneratedScores | |
| 636 ThresholdValues<-ThisKinGenWeirdScore | |
| 637 | |
| 638 FullMotifs<-rep("Z",times=nrow(GeneratedPeptides)) | |
| 639 for (i in 1:nrow(GeneratedPeptides)) { | |
| 640 motif<-GeneratedPeptides[i,1:15] | |
| 641 motif<-paste(motif,sep = "", collapse = "") | |
| 642 FullMotifs[i]<-motif | |
| 643 } | |
| 644 | |
| 645 PeptidesWithRanks<-cbind.data.frame(FullMotifs,GeneratedPeptides,Scores,ThresholdValues) | |
| 646 PeptidesWithRanks<-cbind.data.frame(PeptidesWithRanks,AllActive,AblActive,ArgActive,BtkActive,CskActive,FynActive,HckActive,JAk2Active,LckActive,LynActive,Pyk2Active,SrcActive,SykActive,YesActive) | |
| 647 RanksPeptides<-PeptidesWithRanks[order(PeptidesWithRanks$AllActive,decreasing = FALSE),] | |
| 648 # PepRankHead<-c(1:9,"Sequence","RPMS","PMS") | |
| 649 # RanksPeptides<-rbind.data.frame(PepRankHead,PeptidesWithRanks) | |
| 650 head(RanksPeptides) | |
| 651 | |
| 652 | |
| 653 #now I have to score the negative sequences... for some reason | |
| 654 #write up how we transfect with lipofectamine | |
| 655 #3,4,5 questions | |
| 656 | |
| 657 #PAUSED EHRE AT 4:50, HOPING THAT FIXING MINERVOTHING SO THAT LEFT SPACES WORKS FIXES A THING. OTHERWISE | |
| 658 #I FUCKED WITH THE MCC TABLE AND NEED TO FINISH IT | |
| 659 | |
| 660 ThisKinBlanks<-rep(1,times=17) | |
| 661 ThisKinTable<-rbind(ThisKinTable,ThisKinBlanks) | |
| 662 | |
| 663 NegativeScores<-rep(NA,times=nrow(NegativeSubstrateList)) | |
| 664 NegativeWeirdScores<-rep(NA,times=nrow(NegativeSubstrateList)) | |
| 665 for (v in 1:nrow(NegativeSubstrateList)) { | |
| 666 motif<-NegativeSubstrateList[v,2] | |
| 667 motif<-unlist(strsplit(motif,"")) | |
| 668 #if (length(motif)<9){print(v)}} | |
| 669 # motif[1] <- sapply(motif[1], function (x) aa_props[x]) | |
| 670 # motif[2] <- sapply(motif[2], function (x) aa_props[x]) | |
| 671 # motif[3] <- sapply(motif[3], function (x) aa_props[x]) | |
| 672 # motif[4] <- sapply(motif[4], function (x) aa_props[x]) | |
| 673 # motif[5] <- sapply(motif[5], function (x) aa_props[x]) | |
| 674 # motif[6] <- sapply(motif[6], function (x) aa_props[x]) | |
| 675 # motif[7] <- sapply(motif[7], function (x) aa_props[x]) | |
| 676 # motif[8] <- sapply(motif[8], function (x) aa_props[x]) | |
| 677 # motif[9] <- sapply(motif[9], function (x) aa_props[x]) | |
| 678 motif<- gsub(" ","O",motif) | |
| 679 motif <- sapply(motif, function (x) aa_props[x]) | |
| 680 Scoringpeptide<-motif | |
| 681 Scoringpeptide<-Scoringpeptide+1 | |
| 682 ThisKinTableScore<-as.numeric(ThisKinTable[Scoringpeptide[1],3])*ThisKinTable[as.numeric(Scoringpeptide[2]),4]*ThisKinTable[as.numeric(Scoringpeptide[3]),5]* | |
| 683 ThisKinTable[as.numeric(Scoringpeptide[4]),6]*ThisKinTable[as.numeric(Scoringpeptide[5]),7]*ThisKinTable[as.numeric(Scoringpeptide[6]),8]*ThisKinTable[as.numeric(Scoringpeptide[7]),9]* | |
| 684 #ThisKinTable[as.numeric(Scoringpeptide[8]),10]* | |
| 685 ThisKinTable[as.numeric(Scoringpeptide[9]),11]*ThisKinTable[as.numeric(Scoringpeptide[10]),12]*ThisKinTable[as.numeric(Scoringpeptide[11]),13]* | |
| 686 ThisKinTable[as.numeric(Scoringpeptide[12]),14]*ThisKinTable[as.numeric(Scoringpeptide[13]),15]*ThisKinTable[as.numeric(Scoringpeptide[14]),16]*ThisKinTable[as.numeric(Scoringpeptide[15]),17] | |
| 687 NegativeScores[v]<-ThisKinTableScore | |
| 688 ThisKinTableScore<-(ThisKinTableScore/(ThisKinTableScore+1/as.numeric(NormalizationScore[2]))) | |
| 689 NegativeWeirdScores[v]<-ThisKinTableScore*100 | |
| 690 } | |
| 691 | |
| 692 negativesubstrates<-NegativeSubstrateList[,2] | |
| 693 NegativeWithScores<-cbind(negativesubstrates,as.character(NegativeScores),as.character(NegativeWeirdScores)) | |
| 694 | |
| 695 | |
| 696 #NEED TO HAVE THE NEGATIVE SUBSTRATES BE OUTPUTTED | |
| 697 | |
| 698 PositiveScores<-rep(NA,times=nrow(ImportedSubstrateList)) | |
| 699 PositiveWeirdScores<-rep(NA,times=nrow(ImportedSubstrateList)) | |
| 700 | |
| 701 for (v in 1:nrow(ImportedSubstrateList)) { | |
| 702 motif<-ImportedSubstrateList[v,4:18] | |
| 703 motif<-unlist(motif) | |
| 704 motif<- gsub("^$","O",motif) | |
| 705 motif <- sapply(motif, function (x) aa_props[x]) | |
| 706 Scoringpeptide<-motif | |
| 707 Scoringpeptide<-Scoringpeptide+1 | |
| 708 ThisKinTableScore<-as.numeric(ThisKinTable[Scoringpeptide[1],3])*ThisKinTable[as.numeric(Scoringpeptide[2]),4]*ThisKinTable[as.numeric(Scoringpeptide[3]),5]* | |
| 709 ThisKinTable[as.numeric(Scoringpeptide[4]),6]*ThisKinTable[as.numeric(Scoringpeptide[5]),7]*ThisKinTable[as.numeric(Scoringpeptide[6]),8]*ThisKinTable[as.numeric(Scoringpeptide[7]),9]* | |
| 710 #ThisKinTable[as.numeric(Scoringpeptide[8]),10]* | |
| 711 ThisKinTable[as.numeric(Scoringpeptide[9]),11]*ThisKinTable[as.numeric(Scoringpeptide[10]),12]*ThisKinTable[as.numeric(Scoringpeptide[11]),13]* | |
| 712 ThisKinTable[as.numeric(Scoringpeptide[12]),14]*ThisKinTable[as.numeric(Scoringpeptide[13]),15]*ThisKinTable[as.numeric(Scoringpeptide[14]),16]*ThisKinTable[as.numeric(Scoringpeptide[15]),17] | |
| 713 | |
| 714 PositiveScores[v]<-ThisKinTableScore | |
| 715 ThisKinTableScore<-(ThisKinTableScore/(ThisKinTableScore+1/as.numeric(NormalizationScore[2]))) | |
| 716 PositiveWeirdScores[v]<-ThisKinTableScore*100 | |
| 717 } | |
| 718 | |
| 719 positivesubstrates<-ImportedSubstrateList[,4:18] | |
| 720 positivewithscores<-cbind.data.frame(positivesubstrates,PositiveScores,PositiveWeirdScores) | |
| 721 | |
| 722 | |
| 723 #write down the transient transfection SOP and what we will be doing with them | |
| 724 #write down the vector names I will be using | |
| 725 #write down something about transforming bacteria and with what | |
| 726 | |
| 727 #90% whatevernness | |
| 728 # TPninetyone<-length(PositiveWeirdScores[PositiveWeirdScores>=0.91]) | |
| 729 # Senseninetyone<-TPninetyone/nrow(positivesubstrates) | |
| 730 # | |
| 731 # TNninetyone<-length(NegativeWeirdScores[NegativeWeirdScores<91]) | |
| 732 # Specninetyone<-TNninetyone/100 | |
| 733 | |
| 734 #create the MCC table | |
| 735 | |
| 736 threshold<-c(1:100) | |
| 737 threshold<-order(threshold,decreasing = TRUE) | |
| 738 | |
| 739 Truepositives<-c(1:100) | |
| 740 Falsenegatives<-c(1:100) | |
| 741 Sensitivity<-c(1:100) | |
| 742 TrueNegatives<-c(1:100) | |
| 743 FalsePositives<-c(1:100) | |
| 744 Specificity<-c(1:100) | |
| 745 Accuracy<-c(1:100) | |
| 746 MCC<-c(1:100) | |
| 747 EER<-c(1:100) | |
| 748 | |
| 749 #MAKE DAMN SURE THAT THE ACCESSION NUMBERS FOLLOW THE MOTIFS | |
| 750 | |
| 751 for (z in 1:100) { | |
| 752 thres<-101-z | |
| 753 Truepositives[z]<-length(PositiveWeirdScores[PositiveWeirdScores>=(thres)]) | |
| 754 Falsenegatives[z]<-nrow(positivesubstrates)-Truepositives[z] | |
| 755 Sensitivity[z]<-Truepositives[z]/(Falsenegatives[z]+Truepositives[z]) | |
| 756 TrueNegatives[z]<-length(NegativeWeirdScores[NegativeWeirdScores<(thres)]) | |
| 757 # at thresh 100 this should be 0, because it is total minus true negatives | |
| 758 FalsePositives[z]<-nrow(NegativeSubstrateList)-TrueNegatives[z] | |
| 759 Specificity[z]<-1-(TrueNegatives[z]/(FalsePositives[z]+TrueNegatives[z])) | |
| 760 Accuracy[z]<-100*(Truepositives[z]+TrueNegatives[z])/(Falsenegatives[z]+FalsePositives[z]+TrueNegatives[z]+Truepositives[z]) | |
| 761 MCC[z]<-((Truepositives[z]+TrueNegatives[z])-(Falsenegatives[z]+FalsePositives[z]))/sqrt(round(round(Truepositives[z]+Falsenegatives[z])*round(TrueNegatives[z]+FalsePositives[z])*round(Truepositives[z]+FalsePositives[z])*round(TrueNegatives[z]+Falsenegatives[z]))) | |
| 762 EER[z]<-.01*(((1-(Sensitivity[z]))*(Truepositives[z]+Falsenegatives[z]))+(Specificity[z]*(1-(Truepositives[z]+Falsenegatives[z])))) | |
| 763 } | |
| 764 Characterization<-cbind.data.frame(threshold,Truepositives,Falsenegatives,Sensitivity,TrueNegatives,FalsePositives,Specificity,Accuracy,MCC,EER) | |
| 765 | |
| 766 positiveheader<-c(1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,"RPMS","PMS") | |
| 767 positivewithscores<-rbind.data.frame(positiveheader,positivewithscores) | |
| 768 | |
| 769 negativeheader<-c("Substrate","RPMS","PMS") | |
| 770 colnames(NegativeWithScores)<-negativeheader | |
| 771 | |
| 772 # write.xlsx(NegativeWithScores,file = FILENAME, sheetName = "Negative Sequences Scored",col.names = TRUE,row.names = FALSE,append = TRUE) | |
| 773 # write.xlsx(Characterization,file = FILENAME,sheetName = "Characterization Table",col.names = TRUE,row.names = FALSE,append = TRUE) | |
| 774 # write.xlsx(RanksPeptides,file = FILENAME,sheetName = "Ranked Generated Peptides",col.names = FALSE,row.names = FALSE,append = TRUE) | |
| 775 # write.xlsx(positivewithscores,file = FILENAME, sheetName = "Positive Sequences Scored",col.names = FALSE,row.names = FALSE,append = TRUE) | |
| 776 write.table(x=c("Characterzation Table"),file = FILENAME2, col.names = FALSE,row.names = FALSE, append = TRUE,sep = ",") | |
| 777 write.table(Characterization,file = FILENAME2, col.names = TRUE,row.names = FALSE, append = TRUE,sep = ",") | |
| 778 | |
| 779 | |
| 780 write.table(RanksPeptides,file = FILENAME3,append = TRUE,row.names = FALSE,col.names = TRUE,sep = ",") | |
| 781 | |
| 782 |
