R/edger.R

Defines functions edger_confects

Documented in edger_confects

#' Confident log2 fold change based on the edgeR Quasi-Likelihood method
#'
#' For all possible absolute log2 fold changes (LFC), which genes have at least
#' this fold change at a specified False Discovery Rate?
#'
#' Results are presented in a table such that for any given LFC, if the reader
#' chooses the genes with abs(confect) less than this they are assured that this
#' set of genes has at least this LFC (with the specified FDR). The confect
#' column may also be viewed as a confidence bound on the LFC of each gene, with
#' a dynamic correction for multiple testing.
#'
#' @param fit An edgeR DGEGLM object produced using \code{glmQLFit}.
#'
#' @param coef Coefficient to test, as per \code{glmTreat}. Use either coef or
#'   contrast or effect.
#'
#' @param contrast Contrast to test, as per \code{glmTreat}. Use either coef or
#'   contrast or effect.
#'
#' @param fdr False Discovery Rate to control for.
#'
#' @param step Granularity of log2 fold changes to test.
#'
#' @param null "null" parameter passed through to edger::glmTreat (if coef or
#'   contrast given). Choices are "worst.case" or "interval". Note that the
#'   default here is "worst.case", to be consistent with other functions in
#'   topconfects. This differs from the default for glmTreat.
#'
#' @return
#'
#' See \code{\link{nest_confects}} for details of how to interpret the result.
#'
#' @examples
#'
#' # Generate some random data
#' n <- 100
#' folds <- seq(-4,4,length.out=n)
#' row_means <- runif(n, min=0, max=5)
#' lib_scale <- c(1,2,3,4)
#' means <- 2^(outer(folds, c(-0.5,-0.5,0.5,0.5))) *
#'     row_means * rep(lib_scale,each=n)
#' counts <- rnbinom(length(means), mu=means, size=1/0.1)
#' dim(counts) <- dim(means)
#'
#' design <- cbind(c(1,1,0,0), c(0,0,1,1))
#'
#' # Fit data using edgeR quasi-likelihood
#' library(edgeR)
#' y <- DGEList(counts)
#' y <- calcNormFactors(y)
#' y <- estimateDisp(y, design)
#' fit <- glmQLFit(y, design)
#'
#' # Find top confident effect sizes
#' edger_confects(fit, contrast=c(-1,1))
#'
#' @export
edger_confects <- function(
        fit, coef=NULL, contrast=NULL,
        fdr=0.05, step=0.01, null=c("worst.case","interval")) {
    assert_that(requireNamespace("edgeR", quietly=TRUE), msg=
        "edger_confects requires installing the Bioconductor package 'edgeR'")
    assert_that(is(fit, "DGEGLM"))
    assert_that((!is.null(coef)) + (!is.null(contrast)) == 1)

    null <- match.arg(null)

    n <- nrow(fit)

    tested <- edgeR::glmQLFTest(fit,coef=coef,contrast=contrast)
    top_tags <- edgeR::topTags(tested, n=n,sort.by="none")

    pfunc <- function(i, mag) {
        if (mag == 0.0)
            top_treats <- top_tags
        else {
            treat_tested <- edgeR::glmTreat(
                fit, coef=coef, contrast=contrast, lfc=mag, null=null)
            top_treats <- edgeR::topTags(treat_tested, n=n, sort.by="none")
        }

        top_treats$table$PValue[i]
    }

    confects <- nest_confects(n, pfunc, fdr=fdr, step=step)
    confects$effect_desc <- "log2 fold change"
    logFC <- top_tags$table$logFC[confects$table$index]
    confects$table$confect <- sign(logFC) * confects$table$confect
    confects$table$effect <- logFC
    confects$table$logCPM <- top_tags$table$logCPM[confects$table$index]
    confects$table$name <- rownames(top_tags$table)[confects$table$index]

    confects$edger_fit <- fit

    if (!is.null(fit$genes)) {
        confects$table <- cbind(
            confects$table,
            fit$genes[confects$table$index,,drop=FALSE])
    }

    confects
}
pfh/topconfects documentation built on Nov. 18, 2023, 9:49 p.m.