R/totalCorMat.R

Defines functions totalCorMat

Documented in totalCorMat

#' @title Total Correlation Matrix
#'
#' @description Computes the pairwise total correlation
#' (\code{\link[EGAnet]{totalCor}}) for a dataset
#'
#' @param data Matrix or data frame.
#' Should consist only of variables to be used in the analysis
#'
#' @param base Numeric (length = 1).
#' Base to use for entropy.
#' Defaults to \code{exp(1)} or \code{2.718282}
#'
#' @param normalized Boolean (length = 1).
#' Should the normalized total correlation be computed?
#' Defaults to \code{FALSE}
#'
#' @return Returns a symmetric matrix with pairwise total correlations
#'
#' @author Hudson F. Golino <hfg9s at virginia.edu>
#'
#' @examples
#' # Compute total correlation matrix
#' totalCorMat(wmt2[,7:24])
#'
#' @references
#' \strong{Formalization of total correlation} \cr
#' Watanabe, S. (1960).
#' Information theoretical analysis of multivariate correlation.
#' \emph{IBM Journal of Research and Development} \emph{4}, 66-82.
#'
#' \strong{Applied implementation} \cr
#' Felix, L. M., Mansur-Alves, M., Teles, M., Jamison, L., & Golino, H. (2021).
#' Longitudinal impact and effects of booster sessions in a cognitive training program for healthy older adults.
#' \emph{Archives of Gerontology and Geriatrics}, \emph{94}, 104337.
#'
#' @export
#'
# Total Correlation Matrix ----
# Updated 03.08.2024
totalCorMat <- function(data, base = 2.718282, normalized = FALSE)
{

  # 'data' errors
  object_error(data, c("matrix", "data.frame", "tibble"), "totalCorMat")

  # 'base' errors
  typeof_error(base, "numeric", "totalCorMat")
  length_error(base, 1, "totalCorMat")

  # 'normalized' errors
  typeof_error(normalized, "logical", "totalCorMat")
  length_error(normalized, 1, "totalCorMat")

  # Ensure data is matrix
  data <- as.matrix(usable_data(data, verbose = TRUE))

  # Get dimensions of data
  dimensions <- dim(data)

  # Ensure variable names
  data <- ensure_dimension_names(data)

  # Get variable names
  variable_names <- dimnames(data)[[2]]

  # Initialize total correlation matrix
  total_correlation <- matrix(
    nrow = dimensions[2], ncol = dimensions[2],
    dimnames = list(variable_names, variable_names)
  )

  # Set output
  output <- swiftelse(normalized, "Normalized", "Total.Cor")

  # Fill matrix
  for(i in seq_len(dimensions[2])){

    # Loop over other variables
    for(j in i:dimensions[2]){

      # Fill both sides of the matrix
      total_correlation[i,j] <-
      total_correlation[j,i] <-
      totalCor(data[,c(i, j)])[[output]]

    }

  }

  # Return total correlation matrix
  return(total_correlation)
}

# Bug Checking ----
# ## Basic input
# data <- wmt2[,7:24]
hfgolino/EGA documentation built on Nov. 11, 2024, 9:28 p.m.