R/evaluate.R
In cases: Stratified Evaluation of Subgroup Classification Accuracy

Documented in evaluate

#' Evaluate the accuracy of multiple (candidate) classifiers in several subgroups
#'
#' Assess classification accuracy of multiple classifcation rules stratified
#' by subgroups, e.g. in diseased (sensitivity) and healthy (specificity)
#' individuals.
#'
#' @param data (list) \cr of n_g x m binary matrix or data.frame (n_g observations of m binary decisions),
#' g is the index of subgroups/classes, usually created via \code{\link{compare}}.
#' @param contrast (\code{cases_contrast}) \cr specified via \code{\link{define_contrast}}
#' @param benchmark (numeric) \cr value to compare against (RHS), should have same length as data.
#' @param alpha (numeric) \cr significance level (default: 0.05)
#' @param alternative (character) \cr specification of alternative hypothesis
#' @param adjustment (character) \cr specification of statistical adjustment taken to address multiplicity.
#' The default 'none' does not perform any adjustment for multiplicity.
#' @param transformation (character) \cr define transformation to ensure results
#' (e.g. point estimates, confidence limits) lie in unit interval ("none" (default), "logit", or "arcsin" (sqrt))
#' @param analysis (character) \cr "co-primary" or "full"
#' @param regu (numeric | logical) \cr vector of length 3, specify type of shrinkage.
#' Alternatively, logical of length one (TRUE := c(1, 1/2, 1/4), FALSE := c(0, 0, 0))
#' @param pars (list) \cr further parameters given as named list list(type="pairs", nboot=2000)
#' @param ... (any) \cr additional named parameters, can be used instead of (in in conjunction with) \code{pars}
#'
#' @return (\code{cases_results}) \cr
#' list of analysis results including (adjusted) confidence intervals and p-values
#' @details
#' Adjustment methods (\code{adjustment}) and additional parameters (\code{pars} or \code{...}):\cr
#'
#' \strong{"none"} (default): no adjustment for multiplicity\cr
#'
#' \strong{"bonferroni"}: Bonferroni adjustment\cr
#'
#' \strong{"maxt"}: maxT adjustment, based on a multivariate normal approximation of the vector of test statistics\cr
#'
#' \strong{"bootstrap"}: Bootstrap approach
#' - nboot: number of bootstrap draws (default: 2000)
#' - type: type of bootstrap, "pairs" (default) or "wild"
#' - dist: residual distribution for wild bootstrap, "Normal" (default) or "Rademacher"
#' - proj_est: should bootstrapped estimates for wild bootstrap be projected into unit interval? (default: TRUE)
#' - res_tra: type of residual transformation for wild boostrap, 0,1,2 or 3 (default: 0 = no transformation)
#' (for details on res_tra options, see this presentation by
#' \href{https://www.math.kth.se/matstat/gru/sf2930/papers/wild.bootstrap.pdf}{James G. MacKinnon (2012)} and references therein)
#'
#' \strong{"mbeta"}: A heuristic Bayesian approach which is based on a multivariate beta-binomial model.
#' - nrep: number of posterior draws (default: 5000)
#' - lfc_pr: prior probability of 'least-favorable parameter configuration' (default: 1 if analysis == "co-primary", 0 if analysis == "full").


#' @export
#'
#' @examples#
#' data <- draw_data_roc()
#' evaluate(data)
evaluate <- function(data,
                     contrast = define_contrast("raw"),
                     benchmark = 0.5,
                     alpha = 0.05,
                     alternative = c("two.sided", "greater", "less"),
                     adjustment = c("none", "bonferroni", "maxt", "bootstrap", "mbeta"),
                     transformation = c("none", "logit", "arcsin"),
                     analysis = c("co-primary", "full"),
                     regu = FALSE,
                     pars = list(),
                     ...) {
  ## check 'data' argument:
  stopifnot(is.list(data))
  stopifnot(all(sapply(data, function(x) {
    any(class(x) %in% c("data.frame", "matrix"))
  })))
  if (any(sapply(data, function(x) any(class(x) == "data.frame")))) {
    data <- lapply(data, as.matrix)
  }
  stopifnot(all(diff(sapply(data, ncol)) == 0))
  if (!all(apply(
    sapply(data, colnames) %>% matrix(nrow = ncol(data[[1]])), 1,
    function(x) length(unique(x)) == 1
  ))) {
    stop("Expecting identical column names!")
  }

  ## check 'contrast' argument:
  stopifnot("cases_contrast" %in% class(contrast))

  ## check 'benchmark' argument:
  if (!(length(benchmark) %in% c(1, length(data)))) {
    stop("benchmark argument needs to be numeric of length one or of same length as data argument!")
  }
  if (length(benchmark) == 1) {
    benchmark <- rep(benchmark, length(data))
  }
  stopifnot(all(abs(benchmark) < 1))

  ## check 'alpha' argument:
  stopifnot(is.numeric(alpha))
  stopifnot(length(alpha) == 1)
  stopifnot(alpha > 0 & alpha < 1)

  ## check 'pars' argument:
  stopifnot(is.list(pars))

  ## prepare arguments for specific evaluate_xyz function:
  args <-
    list(
      data = data,
      contrast = contrast,
      benchmark = benchmark,
      alpha = alpha,
      alternative = match.arg(alternative),
      analysis = match.arg(analysis),
      transformation = match.arg(transformation),
      regu = preproc_regu(regu),
      pars = c(list(...), pars)
    )

  ## derive attributes which will be added later to result:
  args$attrs <- derive_attrs(args)

  ## calculate & return results:
  do.call(paste0("evaluate_", match.arg(adjustment)), args)
}