Mercurial > repos > testtool > geo_data
changeset 35:694382fd220a draft
Uploaded
author | testtool |
---|---|
date | Fri, 14 Apr 2017 14:16:46 -0400 |
parents | 59a5237b72a3 |
children | b3761b109ca9 |
files | GRsetFromGEO/GRsetFromGEO.R |
diffstat | 1 files changed, 54 insertions(+), 3 deletions(-) [+] |
line wrap: on
line diff
--- a/GRsetFromGEO/GRsetFromGEO.R Fri Apr 14 09:25:08 2017 -0400 +++ b/GRsetFromGEO/GRsetFromGEO.R Fri Apr 14 14:16:46 2017 -0400 @@ -4,6 +4,57 @@ GSE = args[1] output = args[2] -GRset <- getGenomicRatioSetFromGEO(GSE) - -save(GRset,output) \ No newline at end of file +function (GSE = NULL, path = NULL, array = "IlluminaHumanMethylation450k", + annotation = .default.450k.annotation, what = c("Beta", "M"), + mergeManifest = FALSE, i = 1) +{ + what <- match.arg(what) + if (is.null(GSE) && is.null(path)) + stop("Either GSE or path must be supplied.") + if (!is.null(GSE)) + gset <- GEOquery::getGEO(GSE) + else gset <- GEOquery::getGEO(filename = file.path(path, + list.files(path, pattern = ".soft"))) + if (length(gset) == 0) + stop("Empty list retrieved from GEO.") + if (length(gset) > 1) { + warning("More than one ExpressionSet found:\n", names(gset), + "\nUsing entry ", i) + gset <- gset[[i]] + } + else gset <- gset[[1]] + platform <- annotation(gset) + if (platform != "GPL13534") + warning(sprintf("%s is not the platform ID associated with IlluminaHumanMethylation450k. Should be GPL13534.", + platform)) + if (what == "Beta" & (min(exprs(gset)[, 1], na.rm = TRUE) < + 0 | max(exprs(gset)[, 1], na.rm = TRUE) > 1)) + warning("Values outside [0,1] detected. 'what' argument should not be Beta.") + ann <- .getAnnotationString(c(array = array, annotation = annotation)) + if (!require(ann, character.only = TRUE)) + stop(sprintf("cannot load annotation package %s", ann)) + object <- get(ann) + gr <- getLocations(object, mergeManifest = mergeManifest, + orderByLocation = TRUE) + locusNames <- names(gr) + sampleNames(gset) <- gset$title + common <- intersect(locusNames, fData(gset)$Name) + if (length(common) == 0) + stop("No rowname matches. 'rownames' need to match IlluminaHumanMethylation450k probe names.") + ind1 <- match(common, fData(gset)$Name) + ind2 <- match(common, locusNames) + preprocessing <- c(rg.norm = paste0("See GEO ", GSE, " for details")) + if (what == "Beta") { + out <- GenomicRatioSet(gr = gr[ind2, ], Beta = exprs(gset)[ind1, + , drop = FALSE], M = NULL, CN = NULL, pData = pData(gset), + annotation = c(array = array, annotation = annotation), + preprocessMethod = preprocessing) + } + else { + out <- GenomicRatioSet(gr = gr[ind2, ], Beta = NULL, + M = exprs(gset)[ind1, , drop = FALSE], CN = NULL, + pData = pData(gset), annotation = c(array = array, + annotation = annotation), preprocessMethod = preprocessing) + } + save(out,output) +}