R/FDistribution.R

Defines functions get_tau_ANOVA ANOVA NestedModels

Documented in ANOVA get_tau_ANOVA NestedModels

#' F-Distribution
#'
#' Implements the F-distribution used for an ANOVA or for the comparison of the fit of two
#' nested regression models. In both cases, the test statistic follows a F-distribution.
#' \code{NestedModel} is used to compare the fit of two regression models, where one model contains
#' the independent variables of the smaller model as a subset. Then, one can use ANOVA to determine
#' whether more variance can be explained by adding more independent variables.
#' In the class \code{ANOVA}, the number of independent variables of the smaller model is set to \eqn{1}
#' in order to match the degrees of freedom and we obtain a one-way ANOVA.
#'
#' @slot p_inner number of parameters in smaller model
#' @slot p_outer number of parameters in bigger model
#'
#' @template DataDistributionTemplate
#'
#' @include DataDistribution.R
#'
#' @rdname NestedModels-class
#' @exportClass NestedModels
setClass("NestedModels", representation(
  p_inner  = "numeric",
  p_outer  =  "numeric"),
  contains = "DataDistribution")


#' @include DataDistribution.R
#'
#' @rdname ANOVA-class
#' @exportClass ANOVA
setClass("ANOVA", contains = "NestedModels")



#' @param p_inner number of independent variables in smaller model
#' @param p_outer number of independent variables in bigger model
#'
#' @examples
#' model <- NestedModels(2, 4)
#'
#' @seealso See \code{\link{probability_density_function}} and
#'    \code{\link{cumulative_distribution_function}} to evaluate the pdf
#'    and the cdf, respectively. Use \code{\link{ANOVA}} for detailed information
#'    of ANOVA.
#'
#' @rdname NestedModels-class
#' @export
NestedModels <- function(p_inner, p_outer) {
  if (any(p_inner < 0 || abs(p_inner - round(p_inner)) > sqrt(.Machine$double.eps),
          p_outer < 0 || abs(p_outer - round(p_outer)) > sqrt(.Machine$double.eps))){
    stop("The numbers of groups must be natural numbers.")
  }
  
  new("NestedModels", p_inner = p_inner, p_outer = p_outer)
}


#' Analysis of Variance
#'
#' ANOVA is used to test whether there is a significant difference between the means of groups.
#' The sample size which \code{adoptr} returns is the group wise sample size.
#' The function \code{get_tau_ANOVA} is used to obtain a parameter \eqn{\tau},
#' which is used in the same way as \eqn{\theta} to describe the difference of
#' means between the groups.
#'
#' @param n_groups number of groups to be compared
#'
#' @examples
#' model <- ANOVA(3L)
#'
#' @seealso see \code{\link{probability_density_function}} and
#'    \code{\link{cumulative_distribution_function}} to evaluate the pdf
#'    and the cdf, respectively. Use \code{\link{NestedModels}} to get insights
#'    in the implementation of \code{ANOVA}.
#'
#' @rdname ANOVA-class
#' @export
ANOVA <- function(n_groups) {
  if (n_groups < 0 || abs(n_groups - round(n_groups)) > sqrt(.Machine$double.eps))
    stop("The number of groups must be a natural number.")
  new("ANOVA", p_outer = n_groups, p_inner = 1L)
}

#' @param means vector denoting the mean per group
#' @param common_sd standard deviation of the groups
#'
#' @examples
#' H1 <- PointMassPrior(get_tau_ANOVA(c(0.4, 0.8, 0.5)), 1)
#'
#' @rdname ANOVA-class
#'
#' @export
get_tau_ANOVA <- function(means, common_sd = 1) {
  mean((means - mean(means))^2) / common_sd^2
}


#' @examples
#' probability_density_function(ANOVA(3), 1, 30, get_tau_ANOVA(c(0.3, 0.4, 0.7, 0.2)))
#'
#' @rdname probability_density_function
#' @export
setMethod("probability_density_function", signature("NestedModels", "numeric", "numeric", "numeric"),
          function(dist, x, n, theta, ...) {
            n <- n * (dist@p_outer - dist@p_inner + 1)
            ret <- x
            ret[x == Inf] <- 0
            ret[x == -Inf] <- 0
            ret[!is.infinite(x)] <- stats::df(x[!is.infinite(x)],
                                              df1 = dist@p_outer - dist@p_inner,
                                              df2 = max(1, n - dist@p_outer),
                                              ncp = n * theta)
            return(ret)
          })


#' @examples
#' cumulative_distribution_function(ANOVA(3), 1, 30, get_tau_ANOVA(c(0.3, 0.4, 0.7, 0.2)))
#'
#' @rdname cumulative_distribution_function
#' @export
setMethod("cumulative_distribution_function", signature("NestedModels", "numeric", "numeric", "numeric"),
          function(dist, x, n, theta, ...) {
            n <- n * (dist@p_outer - dist@p_inner + 1)
            ret <- x
            ret[x == Inf] <- 1
            ret[x == -Inf] <- 0
            ret[!is.infinite(x)] <- stats::pf(x[!is.infinite(x)],
                                              df1 = dist@p_outer - dist@p_inner,
                                              df2 = max(1, n - dist@p_outer),
                                              ncp = n * theta)
            return(ret)
          })


#' @param probs vector of probabilities
#'
#' @rdname NestedModels-class
#' @export
setMethod("quantile", signature("NestedModels"),
          function(x, probs, n, theta, ...) { # must be x to conform with generic
            n <- n * (x@p_outer - x@p_inner + 1)
            return(stats::qf(probs, df1 = x@p_outer - x@p_inner, 
                             df2 = max(1, n - x@p_outer), ncp = n * theta))
          })



#' @rdname NestedModels-class
#'
#' @param object object of class \code{NestedModels}
#' @param nsim number of simulation runs
#' @param seed random seed
#'
#' @export
setMethod("simulate", signature("NestedModels", "numeric"),
          function(object, nsim, n, theta, seed = NULL, ...) {
            if (!is.null(seed)) set.seed(seed)
            n <- n * (object@p_outer - object@p_inner + 1)
            return(stats::rf(nsim, df1 = object@p_outer - object@p_inner, 
                             df2 = max(1, n - object@p_outer),  ncp = n * theta))
          })

setMethod("print", signature('NestedModels'), function(x, ...) {
  glue::glue(
    "{class(x)[1]}<p_inner={x@p_inner},p_outer={x@p_outer}>"
  )
})

setMethod("print", signature('ANOVA'), function(x, ...) {
  glue::glue(
    "{class(x)[1]}<n_groups={x@p_outer}>"
  )
})

Try the adoptr package in your browser

Any scripts or data that you put into this service are public.

adoptr documentation built on Oct. 3, 2024, 1:08 a.m.