R/cor-tbl.R

Defines functions check_dimension check_extra_mat_name gcor_tbl cor_tbl

Documented in cor_tbl gcor_tbl

#' Create a cor_tbl object
#' @title Create a cor_tbl object
#' @description Functions to create cor_tbl object from correlation matrix.
#' @param corr correlation matrix.
#' @param p.value significance value matrix of correaltion.
#' @param extra.mat any other matrix-like data with same dimmsion as \code{x}.
#' @param type a string, "full" (default), "upper" or "lower", display full,
#'     lower triangular or upper triangular matrix.
#' @param show.diag a logical value indicating whether keep the diagonal.
#' @param row.names,col.names row/column names of correlation matrix.
#' @param row.order,col.order row/column order of correlation matrix.
#' @param cluster one of "all", "row", "col" or "none". If is logical value,
#' TRUE value means "all", and FALSE means "none".
#' @param ... extra params passing to \code{\link{matrix_order}}.
#' @return a cor_tbl object.
#' @importFrom utils modifyList
#' @importFrom stats setNames
#' @rdname cor_tbl
#' @examples
#' cor_tbl(cor(mtcars))
#' corr <- correlate(mtcars, cor.test = TRUE)
#'
#' ## with p value
#' cor_tbl(corr$r, corr$p.value)
#'
#' ## reorder correlation matrix
#' cor_tbl(corr$r, corr$p.value, cluster = TRUE)
#'
#' ## exclude upper or lower
#' ### exclude lower
#' cor_tbl(corr$r, corr$p.value, type = "upper")
#' ### exclude upper
#' cor_tbl(corr$r, corr$p.value, type = "lower", show.diag = FALSE)
#'
#' ## add extra matrix data
#' m <- matrix(rnorm(11*11), nrow = 11)
#' cor_tbl(corr$r, corr$p.value, extra.mat = list(m = m))
#' @author Houyun Huang, Lei Zhou, Jian Chen, Taiyun Wei
#' @export
cor_tbl <- function(corr,
                    p.value = NULL,
                    extra.mat = list(),
                    type = "full",
                    show.diag = TRUE,
                    row.names = NULL,
                    col.names = NULL,
                    row.order = NULL,
                    col.order = NULL,
                    cluster = "none",
                    ...)
{
  type <- match.arg(type, c("full", "upper", "lower"))
  if(isTRUE(cluster)) {
    cluster <- "all"
  } else {
    if(!cluster %in% c("all", "row", "col", "none")) {
      cluster <- "none"
    }
  }

  check_extra_mat_name(extra.mat)
  ## exclude NULL
  missing.corr <- missing(corr)
  if(missing.corr && is.null(p.value) && length(extra.mat) == 0) {
    stop("No matrix data input.", call. = FALSE)
  }

  first <- if(missing.corr) {
    if(length(extra.mat) == 0) p.value else extra.mat[[1]]
  } else corr
  if(!is.matrix(first))
    first <- as.matrix(first)

  if(missing.corr) {
    corr <- if(is.null(p.value)) list() else list(p.value = p.value)
  } else {
    corr <- if(is.null(p.value)) list(r = corr) else list(r = corr, p.value = p.value)
  }

  corr <- modifyList(corr, extra.mat)

  corr <- lapply(corr, function(.x) {
    if(!is.matrix(.x)) as.matrix(.x) else .x
  })
  name <- names(corr)

  if(length(corr) > 1) {
    lapply(names(corr), function(name) {
      check_dimension(first, corr[[name]])
    })
  }
  row.names <- row.names %||% rownames(first) %||% paste0("row", 1:nrow(first))
  col.names <- col.names %||% colnames(first) %||% paste0("col", 1:ncol(first))
  if(length(row.names) != nrow(first))
    stop("'row.names' must have same length as rows of matrix.", call. = FALSE)
  if(length(col.names) != ncol(first))
    stop("'col.names' must have same length as columns of matrix.", call. = FALSE)

  ## check cluster and row/col.order
  row.ord <- seq_along(row.names)
  col.ord <- seq_along(col.names)
  row.hc <- col.hc <- NULL
  if(!is.null(row.order)) {
    if(cluster %in% c("row", "all")) {
      warning("'row.order' has been specified, ",
              "cluster = ", cluster, " will not be used to clustering rows.", call. = FALSE)
      cluster <- if(cluster == "all") "col" else "none"
    }

    row.ord <- get_order(row.order, index = "row", name = row.names)
    if(inherits(row.order, "hclust") || inherits(row.order, "dendrogram") ||
       inherits(row.order, "ggtree")) {
      row.hc <- row.order
    }
    if(inherits(row.order, "dist")) {
      row.hc <- hclust(row.order)
    }
  }

  if(!is.null(col.order)) {
    if(cluster %in% c("col", "all")) {
      warning("'col.order' has been specified, ",
              "cluster = ", cluster, " will not be used to clustering cols.", call. = FALSE)
      cluster <- if(cluster == "all") {
        if(!is.null(row.order)) "none" else "row"
        } else "none"
    }

    col.ord <- get_order(col.order, index = "col", name = col.names)
    if(inherits(col.order, "hclust") || inherits(col.order, "dendrogram") ||
       inherits(col.order, "ggtree")) {
      col.hc <- col.order
    }
    if(inherits(col.order, "dist")) {
      col.hc <- hclust(col.order)
    }
  }

  if(cluster == "all") {
    hc <- matrix_order(first, is.cor = !missing.corr, ...)
    row.hc <- hc$row.hc
    col.hc <- hc$col.hc
    row.ord <- row.hc$order
    col.ord <- col.hc$order
  } else if(cluster == "row") {
    hc <- matrix_order(first, is.cor = !missing.corr, ...)
    row.hc <- hc$row.hc
    row.ord <- row.hc$order
  } else if(cluster == "col") {
    hc <- matrix_order(first, is.cor = !missing.corr, ...)
    col.hc <- hc$col.hc
    col.ord <- col.hc$order
  }

  ## Todo: check the cluster and row/col.order
  corr <- lapply(corr, function(.x) {
    .x[row.ord, col.ord]
  })
  row.names <- row.names[row.ord]
  col.names <- col.names[col.ord]

  ## check type
  first <- first[row.ord, col.ord]
  symmet <- isSymmetric(first) && identical(colnames(first), rownames(first))
  if(!symmet) {
    if(type != "full") {
      warning("'type = ", type, "' just supports for symmetric matrix.", call. = FALSE)
      type <- "full"
      if(type == "full") show.diag <- TRUE
    }
  }

  id <- list(
    .row.names = rep(row.names, ncol(first)),
    .col.names = rep(col.names, each = nrow(first)),
    .row.id = rep(nrow(first):1, ncol(first)),
    .col.id = rep(1:ncol(first), each = nrow(first))
  )
  data <- modifyList(id, setNames(lapply(corr, as.vector), name))
  new.order <- intersect(c(".row.names", ".col.names", name, ".row.id", ".col.id"),
                         names(data))
  cls <- if(missing.corr) {
    c("gcor_tbl", "cor_tbl", "tbl_df", "tbl", "data.frame")
  } else {
    c("cor_tbl", "tbl_df", "tbl", "data.frame")
  }
  data <- structure(.Data = new_data_frame(data[new.order]),
                    .row.names = row.names,
                    .col.names = col.names,
                    type = type,
                    show.diag = show.diag,
                    hclust = list(row.hc = row.hc, col.hc = col.hc),
                    grouped = FALSE,
                    class = cls)
  switch (type,
          full = if(isTRUE(show.diag)) data else get_diag_tri(data),
          upper = get_upper_data(data, show.diag = show.diag),
          lower = get_lower_data(data, show.diag = show.diag)
  )
}

#' Create a general cor_tbl object
#' @title Create a general cor_tbl object
#' @param x a matrix-like object.
#' @param name variable name.
#' @param extra.mat extra matrix data.
#' @param ... parameters passing to \code{cor_tbl}.
#' @return a general_cor_tbl object.
#' @rdname gcor_tbl
#' @examples
#' gcor_tbl(mtcars)
#' gcor_tbl(mtcars, "var")
#' @author Houyun Huang, Lei Zhou, Jian Chen, Taiyun Wei
#' @export
gcor_tbl <- function(x,
                     name = "value",
                     extra.mat = list(),
                     ...)
{
  if("corr" %in% names(list(...))) {
    stop("please use `cor_tbl()` to tidy correlation matrix.", call. = FALSE)
  }
  nm <- name %||% deparse(substitute(x))
  extra.mat[[nm]] <- x
  cor_tbl(extra.mat = extra.mat, ...)
}

#' @noRd
check_extra_mat_name <- function(l)
{
  n <- length(l)
  if(n > 0) {
    name <- names(l)
    if(is.null(name) || length(unique(name)) != n) {
      stop(
        "Names of extra.mat check:", "\n",
        "The elements of 'extra.mat' must have unique name.",
        call. = FALSE)
    }
    if(any(name %in% c("r", "p.value"))) {
      stop(
        "Names of extra.mat check:", "\n",
        "'r' and 'p.value' are preserved.",
        call. = FALSE)
    }
  }
}

#' @noRd
check_dimension <- function(x, y) {
  x_nm <- as.character(match.call()[["x"]])
  y_nm <- as.character(match.call()[["y"]])
  if(any(dim(x) != dim(y))) {
    msg <- paste0(" Dimension error: ", y_nm, " must have same dimension as ", x_nm)
    stop(msg, call. = FALSE)
  }
}
houyunhuang/ggcor documentation built on July 22, 2020, 8:31 p.m.