datasetMerging: x
In bhklab/MetaGx: R package for meta-analysis of breast cancer gene expressions

1	datasetMerging(esets, method = c("union", "intersect"), standardization = c("quantile", "robust.scaling", "scaling", "none"), nthread = 1)

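`esets`: list of ExpressionSet objects to merge; the list names are used to strip the dataset prefix from merged row names, and each featureData must contain an "ENTREZID" column.
`method`: how features are combined across datasets: "union" keeps every feature with a non-missing ENTREZID, "intersect" keeps only features whose ENTREZID is present in all datasets.
`standardization`: per-sample standardization applied to the merged expression matrix: "quantile", "robust.scaling", "scaling" or "none".
`nthread`: number of cores used for the standardization step (default 1).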

##---- Should be DIRECTLY executable !! ----
##-- ==>  Define data, use random,
##--	or do  help(data=index)  for the standard data sets.

## The function is currently defined as
## Merge a list of ExpressionSet objects into a single ExpressionSet.
##
## Arguments:
##   esets            List of ExpressionSet objects (normally named; the names
##                    are the prefixes rbind() adds to row names and are
##                    stripped again below). The featureData of every element
##                    must contain an "ENTREZID" column.
##   method           "union": keep one feature row per distinct, non-missing
##                    ENTREZID (first occurrence across datasets).
##                    "intersect": keep only the ENTREZIDs found in every
##                    dataset.
##   standardization  "quantile": column-wise genefu::rescale() based
##                    transform followed by limma quantile normalization.
##                    "robust.scaling": the column-wise rescale transform only.
##                    "scaling": column-wise base::scale().
##                    "none": expression values are left untouched.
##   nthread          Number of cores passed to parallel::mclapply().
##
## Value:
##   An ExpressionSet whose expression matrix has one row per merged feature
##   and the samples of all datasets as columns (NA where a dataset lacks a
##   feature), whose phenoData holds the clinical columns common to all
##   datasets, and whose annotation is set to "mixed".
function(esets, method = c("union", "intersect"),
         standardization = c("quantile", "robust.scaling", "scaling", "none"),
         nthread = 1) {
  # require() is kept (instead of requireNamespace()) so the packages are still
  # attached for the caller exactly as before, but a missing package now fails
  # immediately instead of surfacing later as an obscure error.
  attach_or_stop <- function(pkg) {
    if (!require(pkg, character.only = TRUE)) {
      stop(sprintf("Package '%s' is required but could not be loaded", pkg),
           call. = FALSE)
    }
  }
  attach_or_stop("Biobase")
  attach_or_stop("genefu")

  if (!is.list(esets) || length(esets) == 0) {
    stop("'esets' must be a non-empty list of ExpressionSet objects")
  }
  if (!is.numeric(nthread) || length(nthread) != 1 || is.na(nthread) ||
      nthread < 1) {
    stop("'nthread' must be a single number >= 1")
  }
  if (nthread > 1) {
    attach_or_stop("parallel")
  }
  method <- match.arg(method)
  standardization <- match.arg(standardization)

  # Remove the "<dataset name>." prefix that rbind() puts in front of row
  # names when binding a named list. The pattern is anchored and the dot is
  # literal so only a leading prefix is removed; unnamed lists are left alone
  # (an empty alternation would otherwise eat characters of every id).
  strip_dataset_prefix <- function(ids) {
    ds <- names(esets)
    ds <- ds[!is.na(ds) & nzchar(ds)]
    if (length(ds) == 0) {
      return(ids)
    }
    sub(sprintf("^(%s)[.]", paste(ds, collapse = "|")), "", ids)
  }

  # Apply `fun` to every column of `mat`, spreading column chunks over
  # `nthread` cores. Each chunk is reshaped explicitly and the original
  # dimnames are restored, because apply() can drop them (e.g. with scale())
  # and the result must still line up with the feature and sample names.
  map_columns <- function(mat, fun) {
    if (nrow(mat) == 0 || ncol(mat) == 0) {
      return(mat)
    }
    chunks <- parallel::splitIndices(nx = ncol(mat), ncl = nthread)
    chunks <- chunks[lengths(chunks) > 0]
    pieces <- parallel::mclapply(chunks, function(ix, data) {
      vals <- apply(data[, ix, drop = FALSE], 2, fun)
      matrix(vals, nrow = nrow(data), ncol = length(ix))
    }, data = mat, mc.cores = nthread)
    out <- do.call(cbind, pieces)
    dimnames(out) <- dimnames(mat)
    out
  }

  # Transform shared by the "quantile" and "robust.scaling" options.
  rescale_column <- function(dx) {
    (genefu::rescale(dx, q = 0.05, na.rm = TRUE) - 0.5) * 2
  }

  ## ---- feature annotation -------------------------------------------------
  ugid <- lapply(esets, function(x) {
    Biobase::featureData(x)@data
  })
  ugid <- do.call(rbind, ugid)
  # one row per ENTREZID; rows without an ENTREZID are discarded
  ugid <- ugid[!is.na(ugid[, "ENTREZID"]) &
    !duplicated(as.character(ugid[, "ENTREZID"])), , drop = FALSE]
  rownames(ugid) <- strip_dataset_prefix(rownames(ugid))

  switch(method,
    union = {
      feature.merged <- ugid
    },
    intersect = {
      # unique() per dataset: an id repeated inside one dataset must count
      # once, otherwise the comparison with length(esets) is wrong.
      ids <- lapply(esets, function(x) {
        unique(as.character(Biobase::featureData(x)@data[, "ENTREZID"]))
      })
      counts <- table(unlist(ids))
      shared <- names(counts)[counts == length(esets)]
      feature.merged <- ugid[match(shared, as.character(ugid[, "ENTREZID"])), ,
        drop = FALSE]
    },
    stop("Unknown method")
  )

  ## ---- expression data ----------------------------------------------------
  exprs.merged <- lapply(esets, function(x, y) {
    ee <- Biobase::exprs(x)
    eem <- matrix(NA, nrow = length(y), ncol = ncol(ee),
      dimnames = list(y, colnames(ee)))
    # Only copy features that made it into the merged feature table; indexing
    # with all of rownames(ee) fails with "subscript out of bounds" as soon
    # as a dataset has a feature that was filtered out (always the case for
    # method = "intersect" with non-identical feature sets).
    keep <- intersect(rownames(ee), y)
    eem[keep, ] <- ee[keep, , drop = FALSE]
    eem
  }, y = rownames(feature.merged))
  exprs.merged <- do.call(cbind, exprs.merged)

  ## ---- clinical information -----------------------------------------------
  # keep the phenoData columns that are present in every dataset
  ucid <- lapply(esets, function(x) {
    colnames(phenoData(x)@data)
  })
  ucid <- table(unlist(ucid))
  ucid <- names(ucid)[ucid == length(esets)]
  clinicinfo.merged <- lapply(esets, function(x, y) {
    Biobase::pData(x)[, y, drop = FALSE]
  }, y = ucid)
  clinicinfo.merged <- do.call(rbind, clinicinfo.merged)
  rownames(clinicinfo.merged) <- strip_dataset_prefix(
    rownames(clinicinfo.merged)
  )

  ## ---- merged ExpressionSet -----------------------------------------------
  eset.merged <- ExpressionSet(
    assayData = exprs.merged,
    phenoData = AnnotatedDataFrame(data = clinicinfo.merged),
    featureData = AnnotatedDataFrame(data = feature.merged)
  )
  experimentData(eset.merged)@preprocessing <- list(normalization = "mixed",
    package = "unspecified", version = "0")
  annotation(eset.merged) <- "mixed"

  ## ---- standardization ----------------------------------------------------
  switch(standardization,
    none = {
      # nothing to do
    },
    quantile = {
      attach_or_stop("limma")
      ee <- map_columns(exprs(eset.merged), rescale_column)
      ee <- limma::normalizeBetweenArrays(object = ee, method = "quantile")
      exprs(eset.merged) <- ee
    },
    # The label was misspelled "robust.scling", so choosing "robust.scaling"
    # always ended in the "Unknown data standardization method" error.
    robust.scaling = {
      exprs(eset.merged) <- map_columns(exprs(eset.merged), rescale_column)
    },
    scaling = {
      exprs(eset.merged) <- map_columns(exprs(eset.merged), function(dx) {
        as.vector(scale(dx))
      })
    },
    stop("Unknown data standardization method")
  )
  return(eset.merged)
}