18
|
# ---- Inputs and output names ------------------------------------------------
# Background frequency table, read with header = FALSE so that every cell of
# the CSV (including any label row/column) arrives as data.
SubstrateBackgroundFrequency <- read.csv(
  "7to7PositiveSubBAckFreq_11-7-17.csv",
  stringsAsFactors = FALSE,
  header = FALSE
)

ScreenerFilename <- "screener7-7.csv"
FILENAME <- "output1.csv"
FILENAME2 <- "output2.csv"
FILENAME3 <- "output3.csv"

# t() on a data frame returns a matrix: CSV rows become columns.
SubstrateBackgroundFrequency <- t(SubstrateBackgroundFrequency)
# number<-nrow(SubstrateBackgroundFrequency)-1

# Discard the first row of the transposed table (presumably the label column
# of the CSV -- TODO confirm against the input file).
# `-1` with drop = FALSE replaces `2:nrow(x)`: the old form collapsed the
# matrix to a plain vector when a single data row was left, and failed with a
# subscript error when none were.
if (nrow(SubstrateBackgroundFrequency) < 2L) {
  stop("Background frequency table has no data rows after transposing",
       call. = FALSE)
}
SubstrateBackgroundFrequency <-
  SubstrateBackgroundFrequency[-1, , drop = FALSE]

# Keep only rows without any NA; `Sub` is retained as a separate global.
Sub <- na.omit(SubstrateBackgroundFrequency)
SubstrateBackgroundFrequency <- Sub
#
# args = commandArgs(trailingOnly=TRUE)
# TodaysKinase<-as.character(args[1])

# Names of the result tables.
# NOTE(review): `SDtable` is reassigned to a numeric matrix later in this
# script, so the name stored here is lost by then -- confirm nothing needs it.
OutputMatrix <- "KinaseMatrix.csv"
CharacterizationTable <- "CharacterizationTableForThisKinase.csv"
SDtable <- "SDtableforthisKinase"
SiteSelectivityTable <- "SiteSelectivityForThisKinase"
|
|
# ---- Substrate motif matrix -------------------------------------------------
# Builds `substrates`: one row per entry of ImportedSubstrateList after its
# first row, one column per motif position (input columns 4 to 18).
# ImportedSubstrateList is not created in this part of the script; it must
# already exist as a two-dimensional object (data frame or matrix).
stopifnot(length(dim(ImportedSubstrateList)) == 2L)

# seq_len() instead of 2:nrow(...): with only the first row present the old
# range counted down (2, 1) and indexed outside the preallocated matrix.
substrate_count <- max(nrow(ImportedSubstrateList) - 1L, 0L)
substrates <- matrix("A", nrow = substrate_count, ncol = 15)
#SeqsToBeScored<-"asdasd"
for (j in seq_len(substrate_count)) {
  # Row 1 of the input is skipped, so output row j comes from input row j + 1.
  i <- j + 1L
  substratemotif <- ImportedSubstrateList[i, 4:18]
  # The centre of the 15-wide window is always forced to "Y".
  substratemotif[8] <- "Y"
  #substratemotif<-paste(substratemotif,sep = "",collapse = "")
  substratemotif <- unlist(substratemotif)
  substrates[j, 1:15] <- substratemotif
}
# SpacesToOs<-c(""="O",)
# substrates<-SpacesToOs[substrates]
|
|
# ---- Background mean / SD per amino acid ------------------------------------
# Inspection leftover: shows the last row of column 2 when run interactively.
SubstrateBackgroundFrequency[nrow(SubstrateBackgroundFrequency), 2]

# Columns 2 to 21 of the background table are read as the amino acids below,
# in this order (column 1 is not used here).
amino_acid_codes <- c("A", "C", "D", "E", "F", "G", "H", "I", "K", "L",
                      "M", "N", "P", "Q", "R", "S", "T", "V", "W", "Y")
background_columns <- seq_along(amino_acid_codes) + 1L

# Applies `stat` (mean or sd) to every amino-acid column, ignoring NAs.
# The columns are converted with as.numeric() because the table may be stored
# as character.
background_stat <- function(stat) {
  vapply(
    background_columns,
    function(column) {
      stat(as.numeric(SubstrateBackgroundFrequency[, column]), na.rm = TRUE)
    },
    numeric(1)
  )
}

AllMeans <- background_stat(mean)
AllSDs <- background_stat(sd)

# Later code reads the per-letter globals (Amean, Asd, ..., Ymean, Ysd), so
# they are still created, one pair per amino acid.
for (k in seq_along(amino_acid_codes)) {
  assign(paste0(amino_acid_codes[k], "mean"), AllMeans[k])
  assign(paste0(amino_acid_codes[k], "sd"), AllSDs[k])
}

#this is subbackfreq SDs
SBF_statisticalvalues <- cbind(AllMeans, AllSDs)
|
|
#create the percent table
# PercentTable[a, p] = percentage of the non-blank entries in column p of
# `substrates` that equal amino acid a. Blank cells ("") are excluded from the
# denominator; a column that is entirely blank yields NaN (0 / 0).
#
# This replaces one hand-written statement per amino acid and position. The
# per-cell scratch variables (Column1, spaces1, A1 ... Y15, AllAs ... YllYs)
# are no longer created; only PercentTable is produced.

#this is substrate percents
# Row order: A C D E F G H I K L M N P Q R S T V W Y
percent_row_codes <- c("A", "C", "D", "E", "F", "G", "H", "I", "K", "L",
                       "M", "N", "P", "Q", "R", "S", "T", "V", "W", "Y")
motif_width <- 15L
motif_cells <- substrates[, seq_len(motif_width), drop = FALSE]

# Number of cells per column equal to `code`. %in% is used (not ==) so that an
# NA cell counts as "no match" instead of turning the whole sum into NA.
matches_per_position <- function(code) {
  colSums(array(motif_cells %in% code, dim = dim(motif_cells)))
}

residues_per_position <- nrow(motif_cells) - matches_per_position("")

# vapply returns positions x amino acids; transpose to amino acids x positions.
PercentTable <- t(vapply(
  percent_row_codes,
  function(code) matches_per_position(code) / residues_per_position,
  numeric(motif_width),
  USE.NAMES = FALSE
))

# Same dimnames as the rbind()/cbind() construction this replaces: columns
# named after the first row's cells (A1 ... A15), no row names.
dimnames(PercentTable) <- list(NULL, paste0("A", seq_len(motif_width)))
PercentTable <- PercentTable * 100
|
|
#create the SD table
# Each cell is (percentage - background mean) / background SD for the amino
# acid of that row. AllMeans and AllSDs hold one value per row, in row order,
# and recycle down each column of PercentTable, so every row is shifted and
# scaled by its own amino acid's statistics.
# unname() drops the dimnames inherited from PercentTable; the resulting
# matrix carries none.
# NOTE(review): this overwrites the character value assigned to `SDtable`
# near the top of the script.
SDtable <- unname((PercentTable - AllMeans) / AllSDs)
|
|
# Label vector: a "Letter" header followed by the 20 amino-acid codes in the
# same order as the rows of SDtable.
SetOfAAs <- c("Letter", "A", "C", "D", "E", "F", "G", "H", "I", "K", "L",
              "M", "N", "P", "Q", "R", "S", "T", "V", "W", "Y")

# Codes aligned with SDtable rows. The leading "Letter" entry has to be
# skipped: indexing SetOfAAs directly with the row number counted the wrong
# residue for every row (row 1 matched "Letter", row 2 matched "A", ...).
sd_row_codes <- SetOfAAs[-1]

# For each of the 15 positions: how many substrates carry, at that position,
# an amino acid whose SDtable value there exceeds 2.
SumOfSigmaAAs <- vapply(
  seq_len(15),
  function(position) {
    # which() ignores NA/NaN entries, so an undefined score counts as
    # "not above 2" instead of aborting the script.
    above_cutoff <- which(SDtable[seq_along(sd_row_codes), position] > 2)
    sum(substrates[, position] %in% sd_row_codes[above_cutoff])
  },
  numeric(1)
)
|
|
473 # AAs1<-length(substrates[,1])-sum(substrates[,1]=="")
|
|
474 # AAs2<-length(substrates[,2])-sum(substrates[,2]=="")
|
|
475 # AAs3<-length(substrates[,3])-sum(substrates[,3]=="")
|
|
476 # AAs4<-length(substrates[,4])-sum(substrates[,4]=="")
|
|
477 # AAs5<-length(substrates[,5])-sum(substrates[,5]=="")
|
|
478 # AAs6<-length(substrates[,6])-sum(substrates[,6]=="")
|
|
479 # AAs7<-length(substrates[,7])-sum(substrates[,7]=="")
|
|
480 # AAs8<-length(substrates[,8])-sum(substrates[,8]=="")
|
|
481 # AAs9<-length(substrates[,9])-sum(substrates[,9]=="")
|
|
482 #
|
|
483 #
|
|
484 #
|
|
485 # #AAsAtPositions<-c(AAs1,AAs2,AAs3,AAs4,AAs5,AAs6,AAs7,AAs8,AAs9)
|
|
486 # AAsAtPositions<-c(length(substrates[,1]),length(substrates[,2]),length(substrates[,3]),length(substrates[,4]),
|
|
487 # length(substrates[,5]),length(substrates[,6]),length(substrates[,7]),length(substrates[,8]),
|
|
488 # length(substrates[,9]))
|
|
# Expected number of "above cutoff" residues per position: the summed
# background means (in percent) of every amino acid whose SDtable value at
# that position exceeds 2, applied to the number of non-blank residues there.
SumOfExpectedSigmaAAs <- c(1:15)
for (position in 1:15) {
  background_percent <- 0
  for (aa_row in 1:20) {
    if (SDtable[aa_row, position] > 2) {
      background_percent <- background_percent + AllMeans[aa_row]
    }
  }
  residues_here <- sum(!(substrates[, position] %in% ""))
  SumOfExpectedSigmaAAs[position] <- background_percent * residues_here / 100
}

# Observed / expected ratio per position; a position with no amino acid above
# the cutoff gives 0 / 0 = NaN.
SelectivityRow <- SumOfSigmaAAs / SumOfExpectedSigmaAAs

# Three rows, named after the variables bound: observed, expected, ratio.
SelectivitySheet <- rbind(SumOfSigmaAAs, SumOfExpectedSigmaAAs, SelectivityRow)

# Reshape the label vector into a single-column matrix.
SetOfAAs <- matrix(SetOfAAs, ncol = 1)
|
|
# Bare expressions: these only print when the script is run interactively.
SDtable
Amean
Cmean
Wsd
Amean
head(SubstrateBackgroundFrequency)

# Runs the same external script three times in a row, as before.
# NOTE(review): the path is absolute and machine-specific, and the triple
# invocation looks like pasted console history -- confirm it is intended.
invisible(lapply(
  rep('C:/Users/User Name/Desktop/UMN 2017 Spring/Parker Lab/KinatestSwitcheroo.R', 3),
  source
))
|