R/estimateScore.R
In estimate: Estimate of Stromal and Immune Cells in Malignant Tumor Tissues from Expression Data

###
### $Id: estimateScore.R 13 2016-09-28 19:32:16Z proebuck $
###


##-----------------------------------------------------------------------------
estimateScore <- function(input.ds,
                          output.ds,
                          platform=c("affymetrix", "agilent", "illumina")) {

    ## Check arguments
    stopifnot(is.character(input.ds) && length(input.ds) == 1 && nzchar(input.ds))
    stopifnot(is.character(output.ds) && length(output.ds) == 1 && nzchar(output.ds))
    platform <- match.arg(platform)   
   
    ## Read input dataset(GCT format)
    ds <- read.delim(input.ds,
                     header=TRUE,
                     sep="\t",
                     skip=2,
                     row.names=1,
                     blank.lines.skip=TRUE,
                     as.is=TRUE,
                     na.strings="")
    descs <- ds[, 1]
    ds <- ds[-1]
    row.names <- row.names(ds)
    names <- names(ds)
    dataset <- list(ds=ds,
                    row.names=row.names,
                    descs=descs,
                    names=names)

    m <- data.matrix(dataset$ds)
    gene.names <- dataset$row.names
    sample.names <- dataset$names
    Ns <- length(m[1, ]) # Number of genes
    Ng <- length(m[, 1]) # Number of samples
    temp <- strsplit(input.ds, split="/")
    s <- length(temp[[1]])
    input.file.name <- temp[[1]][s]
    temp <- strsplit(input.file.name, split=".gct")
    input.file.prefix <-  temp[[1]][1]

    ## Sample rank normalization
    for (j in 1:Ns) {
        m[, j] <- rank(m[, j], ties.method="average")
    }
    m <- 10000*m/Ng

    ## SI_geneset
    gs <- as.matrix(SI_geneset[, -1],dimnames=NULL) 
    N.gs <- 2
    gs.names <- row.names(SI_geneset) 
   
    ## Loop over gene sets
    score.matrix <- matrix(0, nrow=N.gs, ncol=Ns)
    for (gs.i in 1:N.gs) {
        gene.set <- gs[gs.i,]
        gene.overlap <- intersect(gene.set, gene.names)
        print(paste(gs.i, "gene set:", gs.names[gs.i], " overlap=", length(gene.overlap)))
        if (length(gene.overlap) == 0) { 
           score.matrix[gs.i, ] <- rep(NA, Ns)
           next
        } else {
            ES.vector <- vector(length=Ns)
         
            ## Enrichment score
            for (S.index in 1:Ns) {
                gene.list <- order(m[, S.index], decreasing=TRUE)            
                gene.set2 <- match(gene.overlap, gene.names)
                correl.vector <- m[gene.list, S.index]
          
                TAG <- sign(match(gene.list, gene.set2, nomatch=0))    # 1 (TAG) & 0 (no.TAG)
                no.TAG <- 1 - TAG 
                N <- length(gene.list) 
                Nh <- length(gene.set2) 
                Nm <-  N - Nh 
                correl.vector <- abs(correl.vector)^0.25
                sum.correl  <- sum(correl.vector[TAG == 1])
                P0 <- no.TAG / Nm
                F0 <- cumsum(P0)
                Pn <- TAG * correl.vector / sum.correl
                Fn <- cumsum(Pn)
                RES <- Fn - F0
                max.ES <- max(RES)
                min.ES <- min(RES)
                if (max.ES > - min.ES) {
                    arg.ES <- which.max(RES)
                } else {
                    arg.ES <- which.min(RES)
                }
                ES <- sum(RES)
                EnrichmentScore <- list(ES=ES,
                                        arg.ES=arg.ES,
                                        RES=RES,
                                        indicator=TAG)
                ES.vector[S.index] <- EnrichmentScore$ES
            }
            score.matrix[gs.i, ] <- ES.vector
        }
    }

    score.data <- data.frame(score.matrix)
    names(score.data) <- sample.names
    row.names(score.data) <- gs.names
    estimate.score <- apply(score.data, 2, sum)
   
    if (platform != "affymetrix"){
        score.data <- rbind(score.data, estimate.score)
        rownames(score.data) <- c("StromalScore",
                                  "ImmuneScore",
                                  "ESTIMATEScore")
    } else {
        ##---------------------------------------------------------------------
        ## Calculate ESTIMATE-based tumor purity (Affymetrix-specific)
        convert_row_estimate_score_to_tumor_purity <- function(x) {
            stopifnot(is.numeric(x))
            cos(0.6049872018 + 0.0001467884*x)
        }
        
        est.new <- NULL
        for (i in 1:length(estimate.score)) {
            est_i <- convert_row_estimate_score_to_tumor_purity(estimate.score[i])
            est.new <- rbind(est.new, est_i)
            if (est_i >= 0) {
                next
            } else {
                message(paste(sample.names[i],": out of bounds", sep=""))
            }
        }
        colnames(est.new) <- c("TumorPurity")
        estimate.t1 <- cbind(estimate.score, est.new)
        x.bad.tumor.purities <- estimate.t1[, "TumorPurity"] < 0
        estimate.t1[x.bad.tumor.purities, "TumorPurity"] <- NA
        score.data <- rbind(score.data, t(estimate.t1))
        rownames(score.data) <- c("StromalScore",
                                  "ImmuneScore",
                                  "ESTIMATEScore",
                                  "TumorPurity")
    }
    outputGCT(score.data, output.ds)
}

Any scripts or data that you put into this service are public.

estimate documentation built on May 2, 2019, 4:38 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

estimate
Estimate of Stromal and Immune Cells in Malignant Tumor Tissues from Expression Data

R/estimateScore.R
In estimate: Estimate of Stromal and Immune Cells in Malignant Tumor Tissues from Expression Data

Try the estimate package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

estimate Estimate of Stromal and Immune Cells in Malignant Tumor Tissues from Expression Data

R/estimateScore.R In estimate: Estimate of Stromal and Immune Cells in Malignant Tumor Tissues from Expression Data

Try the estimate package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

estimate
Estimate of Stromal and Immune Cells in Malignant Tumor Tissues from Expression Data

R/estimateScore.R
In estimate: Estimate of Stromal and Immune Cells in Malignant Tumor Tissues from Expression Data