annotate CorrTable/Corr_Script_samples_row.R @ 2:2173ad5e7750 draft default tip

Uploaded
author melpetera
date Wed, 16 Oct 2019 03:12:55 -0400
parents 29ec7e3afdd4
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
1 #################################################################################################
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
2 # CORRELATION TABLE #
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
3 # #
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
4 # #
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
5 # Input : 2 tables with shared samples #
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
6 # Output : Correlation table ; Heatmap (pdf) #
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
7 # #
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
8 # Dependencies : Libraries "ggplot2" and "reshape2" #
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
9 # #
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
10 #################################################################################################
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
11
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
12
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
13 # Parameters (for dev)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
14 if(FALSE){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
15
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
16 tab1.name <- "test/ressources/inputs/CT/CT2_DM.tabular"
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
17 tab2.name <- "test/ressources/inputs/CT/CT2_base_Diapason_14ClinCES_PRIN.txt"
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
18 param1.samples <- "column"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
19 param2.samples <- "row"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
20 corr.method <- "pearson"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
21 test.corr <- "yes"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
22 alpha <- 0.05
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
23 multi.name <- "none"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
24 filter <- "yes"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
25 filters.choice <- "filters_0_thr"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
26 threshold <- 0.2
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
27 reorder.var <- "yes"
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
28 plot.choice <- "auto"
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
29 color.heatmap <- "yes"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
30 type.classes <-"irregular"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
31 reg.value <- 1/3
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
32 irreg.vect <- c(-0.3, -0.2, -0.1, 0, 0.3, 0.4)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
33 output1 <- "Correlation_table.txt"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
34 output2 <- "Heatmap.pdf"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
35
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
36 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
37
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
38
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
39
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
40 correlation.tab <- function(tab1.name, tab2.name, param1.samples, param2.samples, corr.method, test.corr, alpha,
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
41 multi.name, filter, filters.choice, threshold, reorder.var, plot.choice, color.heatmap,
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
42 type.classes, reg.value, irreg.vect, output1, output2){
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
43
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
44 # This function allows to visualize the correlation between two tables
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
45 #
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
46 # Parameters:
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
47 # - tab1.name: table 1 file's access
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
48 # - tab2.name: table 2 file's access
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
49 # - param1.samples ("row" or "column"): where the samples are in tab1
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
50 # - param2.samples ("row" or "column"): where the samples are in tab2
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
51 # - corr.method ("pearson", "spearman", "kendall"):
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
52 # - test.corr ("yes" or "no"): test the significance of a correlation coefficient
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
53 # - alpha (value between 0 and 1): risk for the correlation significance test
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
54 # - multi.name ("holm", "hochberg", "hommel", "bonferroni", "BH", "BY", "fdr", "none"): correction of multiple tests
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
55 # - filter ("yes", "no"): use filter.0 or/and filter.threshold
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
56 # - filters.choice ("filter_0" or "filters_0_thr"): zero filter removes variables with all their correlation coefficients = 0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
57 # and threshold filter remove variables with all their correlation coefficients in abs < threshold
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
58 # - threshold (value between 0 and 1): threshold for filter threshold
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
59 # - reorder.var ("yes" or "no"): reorder variables in the correlation table thanks to the HCA
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
60 # - plot.choice ("auto", "forced" or "none"): determine whether a heatmap is plotted
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
61 # - color.heatmap ("yes" or "no"): color the heatmap with classes defined by the user
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
62 # - type.classes ("regular" or "irregular"): choose to color the heatmap with regular or irregular classes
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
63 # - reg.value (value between 0 and 1): value for regular classes
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
64 # - irreg.vect (vector with values between -1 and 1): vector which indicates values for intervals (irregular classes)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
65 # - output1: correlation table file's access
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
66 # - output2: heatmap (colored correlation table) file's access
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
67
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
68
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
69 # Input ----------------------------------------------------------------------------------------------
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
70
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
71 tab1 <- read.table(tab1.name, sep = "\t", header = TRUE, check.names = FALSE, row.names = 1)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
72 tab2 <- read.table(tab2.name, sep = "\t", header = TRUE, check.names = FALSE, row.names = 1)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
73
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
74 # Transpose tables according to the samples
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
75 if(param1.samples == "column"){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
76 tab1 <- t(tab1)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
77 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
78
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
79 if(param2.samples == "column"){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
80 tab2 <- t(tab2)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
81 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
82
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
83 # Sorting tables in alphabetical order of the samples
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
84 tab1 <- tab1[order(rownames(tab1)),]
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
85 tab2 <- tab2[order(rownames(tab2)),]
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
86
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
87
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
88 # Checks ---------------------------------------------------------------------------------------------
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
89
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
90 # Check if the 2 datasets match regarding samples identifiers
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
91 # Adapt from functions "check.err" and "match2", RcheckLibrary.R
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
92
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
93 err.stock <- NULL
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
94
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
95 id1 <- rownames(tab1)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
96 id2 <- rownames(tab2)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
97
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
98 if(sum(id1 != id2) > 0){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
99 err.stock <- c("\nThe two tables do not match regarding sample identifiers.\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
100
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
101 if(length(which(id1%in%id2)) != length(id1)){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
102 identif <- id1[which(!(id1%in%id2))]
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
103 if (length(identif) < 4){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
104 err.stock <- c(err.stock, "\nThe following identifier(s) found in the first table do not appear in the second table:\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
105 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
106 else {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
107 err.stock <- c(err.stock, "\nFor example, the following identifiers found in the first table do not appear in the second table:\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
108 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
109 identif <- identif[1:min(3,length(which(!(id1%in%id2))))]
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
110 err.stock <- c(err.stock," ",paste(identif,collapse="\n "),"\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
111 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
112
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
113 if(length(which(id2%in%id1)) != length(id2)){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
114 identif <- id2[which(!(id2%in%id1))]
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
115 if (length(identif) < 4){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
116 err.stock <- c(err.stock, "\nThe following identifier(s) found in the second table do not appear in the first table:\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
117 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
118 else{
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
119 err.stock <- c(err.stock, "\nFor example, the following identifiers found in the second table do not appear in the first table:\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
120 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
121 identif <- identif[1:min(3,length(which(!(id2%in%id1))))]
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
122 err.stock <- c(err.stock," ",paste(identif,collapse="\n "),"\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
123 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
124 err.stock <- c(err.stock,"\nPlease check your data.\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
125 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
126
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
127 if(length(err.stock)!=0){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
128 stop("\n- - - - - - - - -\n",err.stock,"\n- - - - - - - - -\n\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
129 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
130
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
131
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
132 # Check whether tab1=tab2
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
133
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
134 err.msg <- NULL
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
135
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
136 if((ncol(tab1)==ncol(tab2))&&(sum(tab1!=tab2,na.rm=TRUE)==0)){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
137 autocor <- TRUE
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
138 err.msg <- c(err.msg, "\nYou chose the same table for the two dataset inputs. \nTo allow filtering options,",
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
139 "we will turn the diagonal to 0 in the correlation matrix during the filtering process.\n")
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
140 }else{
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
141 autocor <- FALSE
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
142 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
143
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
144
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
145 # Check qualitative variables in each input tables
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
146
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
147 var1.quali <- vector()
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
148 var2.quali <- vector()
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
149
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
150 for (i in 1:dim(tab1)[2]){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
151 if(class(tab1[,i]) != "numeric" & class(tab1[,i]) != "integer"){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
152 var1.quali <- c(var1.quali,i)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
153 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
154 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
155
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
156 for (j in 1:dim(tab2)[2]){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
157 if(class(tab2[,j]) != "numeric" & class(tab2[,j]) != "integer"){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
158 var2.quali <- c(var2.quali, j)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
159 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
160 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
161
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
162 if (length(var1.quali) != 0 | length(var2.quali) != 0){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
163 err.msg <- c(err.msg, "\nThere are qualitative variables in your input tables which have been removed to compute the correlation table.\n\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
164
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
165 if(length(var1.quali) != 0 && length(var1.quali) < 4){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
166 err.msg <- c(err.msg, "In table 1, the following qualitative variables have been removed:\n",
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
167 " ",paste(colnames(tab1)[var1.quali],collapse="\n "),"\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
168 } else if(length(var1.quali) != 0 && length(var1.quali) > 3){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
169 err.msg <- c(err.msg, "For example, in table 1, the following qualitative variables have been removed:\n",
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
170 " ",paste(colnames(tab1)[var1.quali[1:3]],collapse="\n "),"\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
171 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
172
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
173 if(length(var2.quali) != 0 && length(var2.quali) < 4){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
174 err.msg <- c(err.msg, "In table 2, the following qualitative variables have been removed:\n",
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
175 " ",paste(colnames(tab2)[var2.quali],collapse="\n "),"\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
176 } else if(length(var2.quali) != 0 && length(var2.quali) > 3){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
177 err.msg <- c(err.msg, "For example, in table 2, the following qualitative variables have been removed:\n",
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
178 " ",paste(colnames(tab2)[var2.quali[1:3]],collapse="\n "),"\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
179 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
180 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
181
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
182 if(length(var1.quali) != 0){
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
183 tab1 <- tab1[,-var1.quali,drop=FALSE]
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
184 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
185 if(length(var2.quali) != 0){
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
186 tab2 <- tab2[,-var2.quali,drop=FALSE]
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
187 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
188
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
189
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
190 # Check whether there are constant variables
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
191
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
192 var1.cons <- vector()
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
193 var2.cons <- vector()
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
194
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
195 for (i in 1:dim(tab1)[2]){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
196 if(length(levels(as.factor(tab1[,i])))==1){ var1.cons <- c(var1.cons,i) }
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
197 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
198
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
199 for (j in 1:dim(tab2)[2]){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
200 if(length(levels(as.factor(tab2[,j])))==1){ var2.cons <- c(var2.cons, j) }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
201 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
202
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
203 if (length(var1.cons) != 0 | length(var2.cons) != 0){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
204 err.msg <- c(err.msg, "\nThere are constant variables in your input tables which have been removed to compute the correlation table.\n\n")
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
205
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
206 if(length(var1.cons) != 0 && length(var1.cons) < 4){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
207 err.msg <- c(err.msg, "In table 1, the following constant variables have been removed:\n",
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
208 " ",paste(colnames(tab1)[var1.cons],collapse="\n "),"\n")
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
209 } else if(length(var1.cons) != 0 && length(var1.cons) > 3){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
210 err.msg <- c(err.msg, "For example, in table 1, the following constant variables have been removed:\n",
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
211 " ",paste(colnames(tab1)[var1.cons[1:3]],collapse="\n "),"\n")
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
212 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
213
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
214 if(length(var2.cons) != 0 && length(var2.cons) < 4){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
215 err.msg <- c(err.msg, "In table 2, the following constant variables have been removed:\n",
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
216 " ",paste(colnames(tab2)[var2.cons],collapse="\n "),"\n")
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
217 } else if(length(var2.cons) != 0 && length(var2.cons) > 3){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
218 err.msg <- c(err.msg, "For example, in table 2, the following constant variables have been removed:\n",
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
219 " ",paste(colnames(tab2)[var2.cons[1:3]],collapse="\n "),"\n")
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
220 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
221 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
222
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
223 if(length(var1.cons) != 0){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
224 tab1 <- tab1[,-var1.cons,drop=FALSE]
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
225 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
226 if(length(var2.cons) != 0){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
227 tab2 <- tab2[,-var2.cons,drop=FALSE]
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
228 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
229
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
230
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
231 # Print info message
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
232
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
233 if(length(err.msg) != 0){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
234 cat("\n- - - - - - - - -\n",err.msg,"\n- - - - - - - - -\n\n")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
235 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
236
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
237 rm(err.stock,var1.quali,var2.quali,var1.cons,var2.cons,err.msg)
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
238
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
239
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
240 # Correlation table ---------------------------------------------------------------------------------
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
241
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
242 tab.corr <- matrix(nrow = dim(tab2)[2], ncol = dim(tab1)[2])
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
243 for (i in 1:dim(tab2)[2]){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
244 for (j in 1:dim(tab1)[2]){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
245 tab.corr[i,j] <- cor(tab2[,i], tab1[,j], method = corr.method, use = "pairwise.complete.obs")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
246 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
247 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
248
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
249 colnames(tab.corr) <- colnames(tab1)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
250 rownames(tab.corr) <- colnames(tab2)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
251
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
252
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
253 # Significance of correlation test ------------------------------------------------------------------
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
254
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
255 if (test.corr == "yes"){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
256
2
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
257 repcorrtest1 <- function(vari1,vari2,corrmeth){
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
258 suppressWarnings(corrtest <- cor.test(vari2, vari1, method = corrmeth))
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
259 return(corrtest$p.value)
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
260 }
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
261 repcorrtest2 <- function(stab,ftab,cormeth){
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
262 listp <- apply(X=ftab,2,repcorrtest1,vari2=stab,corrmeth=cormeth)
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
263 return(listp)
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
264 }
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
265 pvalue <- apply(X=tab1,2,repcorrtest2,ftab=tab2,cormeth=corr.method)
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
266
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
267
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
268 if(multi.name != "none"){
2
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
269 pvalue <- matrix(p.adjust(pvalue, method = multi.name), nrow = dim(tab.corr)[1], ncol = dim(tab.corr)[2])
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
270 }
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
271
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
272 tab.corr[pvalue > alpha] <- 0
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
273
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
274 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
275
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
276
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
277 # Filter settings ------------------------------------------------------------------------------------
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
278
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
279 if (filter == "yes"){
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
280
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
281 # Turn diagonal from 1 to 0 if autocorrelation
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
282 if(autocor){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
283 for(i in 1:(ncol(tab.corr))){ tab.corr[i,i] <- 0 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
284 }
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
285
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
286 # Remove variables with all their correlation coefficients = 0 :
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
287 if (filters.choice == "filter_0"){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
288 threshold <- 0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
289 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
290
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
291 var2.thres <- vector()
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
292 for (i in 1:dim(tab.corr)[1]){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
293 if (length(which(abs(tab.corr[i,]) <= threshold)) == dim(tab.corr)[2]){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
294 var2.thres <- c(var2.thres, i)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
295 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
296 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
297
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
298 if (length(var2.thres) != 0){
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
299 tab.corr <- tab.corr[-var2.thres,,drop=FALSE]
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
300 tab2 <- tab2[, -var2.thres,drop=FALSE]
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
301 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
302
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
303 var1.thres <- vector()
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
304 for (i in 1:dim(tab.corr)[2]){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
305 if (length(which(abs(tab.corr[,i]) <= threshold)) == dim(tab.corr)[1]){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
306 var1.thres <- c(var1.thres, i)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
307 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
308 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
309
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
310 if (length(var1.thres) != 0){
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
311 tab.corr <- tab.corr[,-var1.thres,drop=FALSE]
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
312 tab1 <- tab1[,-var1.thres,drop=FALSE]
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
313 }
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
314
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
315 # Turn diagonal from 0 back to 1 if autocorrelation
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
316 if(autocor){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
317 for(i in 1:(ncol(tab.corr))){ tab.corr[i,i] <- 1 }
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
318 }
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
319
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
320 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
321
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
322
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
323 # Reorder variables in the correlation table (with the HCA) ------------------------------------------
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
324 if (reorder.var == "yes"){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
325
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
326 cormat.tab2 <- cor(tab2, method = corr.method, use = "pairwise.complete.obs")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
327 dist.tab2 <- as.dist(1 - cormat.tab2)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
328 hc.tab2 <- hclust(dist.tab2, method = "ward.D2")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
329 tab.corr <- tab.corr[hc.tab2$order,]
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
330 rm(cormat.tab2)
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
331
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
332 cormat.tab1 <- cor(tab1, method = corr.method, use = "pairwise.complete.obs")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
333 dist.tab1 <- as.dist(1 - cormat.tab1)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
334 hc.tab1 <- hclust(dist.tab1, method = "ward.D2")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
335 tab.corr <- tab.corr[,hc.tab1$order]
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
336 rm(cormat.tab1)
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
337
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
338 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
339
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
340
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
341 # Output 1 : Correlation table -----------------------------------------------------------------------
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
342
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
343
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
344 # Export correlation table
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
345 write.table(x = data.frame(name = rownames(tab.corr), tab.corr), file = output1, sep = "\t", quote = FALSE, row.names = FALSE)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
346
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
347
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
348
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
349 # Create the heatmap ---------------------------------------------------------------------------------
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
350
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
351 if(plot.choice != "none"){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
352
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
353 # A message if no variable kept
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
354 if(length(tab.corr)==0){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
355 pdf(output2)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
356 plot.new()
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
357 legend("center","Filtering leads to no remaining correlation coefficient.")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
358 dev.off()
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
359 } else {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
360
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
361 # A message if more than 1000 variable in auto mode
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
362 if((plot.choice=="auto")&&(max(dim(tab.corr))>1000)){
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
363 pdf(output2)
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
364 war.msg <- paste0("In 'default' mode, the colored table is not provided when\none of the tables contains more than ",
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
365 "a thousand\nvariables after the filter step.\n\nOne of your table still contains ",max(dim(tab.corr))," variables.\n",
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
366 "Please consider more filtering, or use the 'Always plot a\ncolored table' mode to obtain your colored table.")
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
367 plot.new()
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
368 legend("center",war.msg,adj=c(0.05,0.075))
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
369 dev.off()
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
370 } else {
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
371
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
372
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
373 library(ggplot2)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
374 library(reshape2)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
375
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
376 # Melt the correlation table :
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
377 melted.tab.corr <- melt(tab.corr)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
378
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
379 if (color.heatmap == "yes") {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
380
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
381 # Add a column for the classes of each correlation coefficient
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
382 classe <- rep(0, dim(melted.tab.corr)[1])
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
383 melted <- cbind(melted.tab.corr, classe)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
384
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
385 if (type.classes == "regular"){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
386
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
387 vect <- vector()
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
388 if (seq(-1,0,reg.value)[length(seq(-1,0,reg.value))] == 0){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
389 vect <- c(seq(-1,0,reg.value)[-length(seq(-1,0,reg.value))],
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
390 rev(seq(1,0,-reg.value)))
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
391 } else {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
392 vect <- c(seq(-1,0,reg.value), 0, rev(seq(1,0,-reg.value)))
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
393 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
394
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
395 } else if (type.classes == "irregular") {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
396
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
397 irreg.vect <- c(-1, irreg.vect, 1)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
398 vect <- irreg.vect
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
399
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
400 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
401
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
402 # Color palette :
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
403 myPal <- colorRampPalette(c("#00CC00", "white", "red"), space = "Lab", interpolate = "spline")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
404
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
405 # Create vector intervals
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
406 cl <- vector()
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
407 cl <- paste("[", vect[1], ";", round(vect[2],3), "]", sep = "")
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
408
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
409 for (x in 2:(length(vect)-1)) {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
410 if (vect[x+1] == 0) {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
411 cl <- c(cl, paste("]", round(vect[x],3), ";", round(vect[x+1],3), "[", sep = ""))
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
412 } else {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
413 cl <- c(cl, paste("]", round(vect[x],3), ";",
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
414 round(vect[x+1],3), "]", sep = ""))
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
415 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
416 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
417
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
418 # Assign an interval to each correlation coefficient
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
419 for (j in 1:(length(cl))){
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
420 if (vect[j] == -1){
2
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
421 melted$classe[melted$value >= vect[j] & melted$value <= vect[j+1]] <- cl[j]
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
422 } else {
2
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
423 melted$classe[melted$value > vect[j] & melted$value <= vect[j+1]] <- cl[j]
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
424 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
425 }
2
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
426
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
427
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
428 # Find the 0 and assign it the white as name
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
429 if (length(which(vect == 0)) == 1) {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
430 melted$classe[melted$value == 0] <- "0"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
431 indic <- which(vect == 0)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
432 cl <- c(cl[1:(indic-1)], 0, cl[indic:length(cl)])
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
433 names(cl)[indic] <- "#FFFFFF"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
434 } else if (length(which(vect == 0)) == 0) {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
435 indic <- 0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
436 for (x in 1:(length(vect)-1)) {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
437 if (0 > vect[x] && 0 <= vect[x+1]) {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
438 names(cl)[x] <- "#FFFFFF"
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
439 indic <- x
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
440 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
441 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
442 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
443
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
444 indic <- length(cl) - indic + 1
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
445 cl <- rev(cl)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
446
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
447 # Assign the colors of each intervals as their name
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
448 names(cl)[1:(indic-1)] <- myPal(length(cl[1:indic])*2-1)[1:indic-1]
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
449 names(cl)[(indic+1):length(cl)] <- myPal(length(cl[indic:length(cl)])*2-1)[(ceiling(length(myPal(length(cl[indic:length(cl)])*2-1))/2)+1):length(myPal(length(cl[indic:length(cl)])*2-1))]
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
450
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
451
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
452 melted$classe <- factor(melted$classe)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
453 melted$classe <- factor(melted$classe, levels = cl[cl%in%levels(melted$classe)])
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
454
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
455 # Heatmap if color.heatmap = yes :
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
456 ggplot(melted, aes(Var2, Var1, fill = classe)) +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
457 ggtitle("Colored correlation table" ) + xlab("Table 1") + ylab("Table 2") +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
458 geom_tile(color ="ghostwhite") +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
459 scale_fill_manual( breaks = levels(melted$classe),
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
460 values = names(cl)[cl%in%levels(melted$classe)],
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
461 name = paste(corr.method, "correlation", sep = "\n")) +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
462 theme_classic() +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
463 theme(axis.text.x = element_text(angle = 90, vjust = 0.5),
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
464 plot.title = element_text(hjust = 0.5))
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
465
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
466 } else {
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
467
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
468 # Heatmap if color.heatmap = no :
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
469 ggplot(melted.tab.corr, aes(Var2, Var1, fill = value)) +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
470 ggtitle("Colored correlation table" ) + xlab("Table 1") + ylab("Table 2") +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
471 geom_tile(color ="ghostwhite") +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
472 scale_fill_gradient2(low = "red", high = "#00CC00", mid = "white", midpoint = 0, limit = c(-1,1),
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
473 name = paste(corr.method, "correlation", sep = "\n")) +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
474 theme_classic() +
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
475 theme(axis.text.x = element_text(angle = 90, vjust = 0.5),
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
476 plot.title = element_text(hjust = 0.5))
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
477 }
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
478
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
479
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
480 ggsave(output2, device = "pdf", width = 10+0.075*dim(tab.corr)[2], height = 5+0.075*dim(tab.corr)[1], limitsize = FALSE)
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
481
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
482
1
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
483 } # End of if((plot.choice=="auto")&&(max(dim(tab.corr))>1000))else
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
484 } # End of if(length(tab.corr)==0)else
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
485 } # End of if(plot.choice != "auto")
29ec7e3afdd4 Uploaded
melpetera
parents: 0
diff changeset
486
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
487
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
488 } # End of correlation.tab
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
489
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
490
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
491 # Function call
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
492 # correlation.tab(tab1.name, tab2.name, param1.samples, param2.samples, corr.method, test.corr, alpha, multi.name, filter,
2
2173ad5e7750 Uploaded
melpetera
parents: 1
diff changeset
493 # filters.choice, threshold, reorder.var, plot.choice, color.heatmap, type.classes,
0
b22c453e4cf4 Uploaded
melpetera
parents:
diff changeset
494 # reg.value, irreg.vect, output1, output2)