R/friedmanTestBMR.R

#' @title Perform overall Friedman test for a BenchmarkResult.
#'
#' @description Performs a \code{\link[stats]{friedman.test}} for a selected measure.
#' The null hypothesis is that apart from an effect of the different
#' [\code{\link{Task}}], the location parameter (aggregated performance measure)
#' is the same for each \code{\link{Learner}}.
#' Note that benchmark results for at least two learners on at least two tasks
#' are required.
#'
#' @template arg_bmr
#' @template arg_measure
#' @template arg_aggregation_method
#' @return [\code{htest}]: See \code{\link[stats]{friedman.test}} for details.
#' @family benchmark
#' @export
#' @examples
#' # see benchmark
friedmanTestBMR = function(bmr, measure = NULL, aggregation = "default") {

  assertClass(bmr, "BenchmarkResult")
  measure = checkBMRMeasure(measure, bmr)
  assertChoice(aggregation, c("default", "mean"))
  n.learners = length(bmr$learners)
  if (n.learners < 2)
    stop("Benchmark results for at least two learners are required")
  n.tasks = length(bmr$results)
  if (n.tasks < 2)
    stop("Benchmark results for at least two tasks are required")

  # aggregate mean or default over iterations
  if (aggregation == "mean") {
    df = as.data.frame(bmr)
    df = aggregate(df[[measure$id]],
      by = list(task.id = df$task.id, learner.id = df$learner.id),
      FUN = mean)
    aggr.meas = "x"
  } else {
    aggr.meas = measureAggrName(measure)
    df = getBMRAggrPerformances(bmr, as.df = TRUE)
  }
  friedman.test(as.formula(stri_paste(aggr.meas, " ~ learner.id | task.id", sep = "")), data = df)
}
Najah-lshanableh/R-data-mining2 documentation built on May 6, 2019, 10:11 a.m.