R/gghm.R
In ggcorrheatmap: Make Flexible 'ggplot2' Correlation Heatmaps

Documented in gghm prepare_mixed_param scale_mat

#' Make a heatmap with ggplot2.
#'
#' @param x Matrix or data frame in wide format to make a heatmap of. If rownames are present they are used for the y axis labels, otherwise the row number is used.
#' If a column named `.names` (containing unique row identifiers) is present it will be used as rownames.
#' @param layout String specifying the layout of the output heatmap. Possible layouts include
#' 'topleft', 'topright', 'bottomleft', 'bottomright', or the 'whole'/'full' heatmap (default and only possible option if the matrix is asymmetric).
#' A combination of the first letters of each word also works (i.e. f, w, tl, tr, bl, br).
#' If layout is of length two with two opposing triangles, a mixed layout will be used. For mixed layouts,
#' `mode` needs a vector of length two (applied in the same order as layout). See details for more information.
#' @param mode A string specifying plotting mode. Possible values are `heatmap`/`hm` for a normal heatmap, a number from 1 to 25 to draw the corresponding shape,
#' `text` to write the cell values instead of filling cells (colour scaling with value), and `none` for blank cells.
#' @param scale_data Character string specifying scaling of the matrix. NULL or "none" for no scaling, "rows" for rows, and "columns" for
#' columns. Can also be a substring of the beginning of the words.
#' @param col_scale Colour scale to use for cells. If NULL, the default ggplot2 scale is used. If a string, the corresponding Brewer or Viridis scale is used.
#' A string with a scale name with "rev_" in the beginning or "_rev" at the end will result in the reversed scale. Can also be a ggplot2 scale object to overwrite the scale.
#' In mixed layouts, a list of two scales can be provided.
#' @param col_name String to use for the colour scale legend title. Can be two values in mixed layouts for dual scales.
#' @param limits Numeric vector of length two for the limits of the colour scale. NULL uses the default.
#' @param bins Number of bins to divide the scale into (if continuous values). A 'double' class value uses 'nice.breaks' to put the breaks at nice numbers which may not result
#' in the specified number of bins. If an integer the number of bins will be prioritised.
#' @param size_scale `ggplot2::scale_size_*` call to use for size scaling if `mode` is a number from 1 to 25 (R pch). In mixed layouts, can also be a list
#' of length two containing the two scales to use.
#' @param size_name String to use for the size scale legend title. Can be two values in mixed layouts for dual scales.
#' @param legend_order Integer vector specifying the order of legends (first value is for the first legend, second for the second, etc). The default (NULL) shows all legends.
#' NAs hide the corresponding legends, a single NA hides all. Ignored for `ggplot2` scale objects in `col_scale` and `size_scale`.
#' @param include_diag Logical indicating if the diagonal cells (of a symmetric matrix) should be plotted.
#' Mostly only useful for getting a cleaner look with symmetric correlation matrices with triangular layouts, where the diagonal is known to be 1.
#' @param na_col Colour to use for cells with NA (both main heatmap and annotation).
#' @param na_remove Logical indicating if NA values in the heatmap should be omitted (meaning no cell border is drawn).
#' If NAs are kept, the fill colour can be set in the `ggplot2` scale.
#' @param return_data Logical indicating if the data used for plotting and clustering results should be returned.
#' @param cell_labels Logical specifying if the cells should be labelled with the values. Alternatively, a matrix or data frame with the same shape and dimnames as `x`
#' containing values to write in the cells. If mode is `text`, the cell label colours will scale with the cell values and `cell_label_col` is ignored.
#' @param cell_label_col Colour to use for cell labels, passed to `ggplot2::geom_text()`.
#' @param cell_label_size Size of cell labels, used as the `size` argument in `ggplot2::geom_text()`.
#' @param cell_label_digits Number of digits to display when cells are labelled (if numeric values). Default is 2, passed to `base::round()`. NULL for no rounding.
#' @param border_col Colour of cell borders. If `mode` is not a number, `border_col` can be set to NA to remove borders completely.
#' @param border_lwd Size of cell borders. If `mode` is a number, `border_lwd` can be set to 0 to remove borders.
#' @param border_lty Line type of cell borders. Either a number or its corresponding name, or a string of length 2, 4, 6, or 8. See 'lty' of `graphics::par()` for details.
#' Not supported for numeric `mode`.
#' @param cell_bg_col Colour to use for cell backgrounds in modes 'text' and 'none'.
#' @param cell_bg_alpha Alpha for cell colours in modes 'text' and 'none'.
#' @param show_names_diag Logical indicating if names should be written in the diagonal cells (for symmetric input).
#' @param names_diag_params List with named parameters (such as size, angle, etc) passed on to geom_text when writing the column names in the diagonal.
#' @param show_names_x,show_names_y Logical indicating if names should be written on the x and y axes. Labels can be customised using `ggplot2::theme()` on the output plot.
#' @param names_x_side String specifying position of the x axis names ("top" or "bottom").
#' @param names_y_side String specifying position of the y axis names ("left" or "right").
#' @param annot_rows_df,annot_cols_df Data frame for row and column annotations. The names of the columns in the data must be included,
#' either as row names or in a column named `.names`. Each other column specifies an annotation where the column name
#' will be used as the annotation name (in the legend and next to the annotation). Numeric columns will use a continuous
#' colour scale while factor or character columns use discrete scales.
#' @param annot_rows_col,annot_cols_col Named list for row and column annotation colour scales. The names should specify which annotation each scale applies to.
#' Elements can be strings or ggplot2 "Scale" class objects. If a string, it is used as the brewer palette or viridis option.
#' If a scale object it is used as is, allowing more flexibility. This may change the order that legends are drawn in,
#' specify order using the `guide` argument in the `ggplot2` scale function.
#' @param annot_rows_side String specifying which side row annotation should be drawn ('left' or 'right', defaults to 'right').
#' @param annot_cols_side String specifying which side column annotation should be drawn ('bottom' or 'top', defaults to 'bottom').
#' @param annot_dist Distance between heatmap and first annotation cell where 1 is the size of one heatmap cell. Used for both row and column annotation.
#' @param annot_gap Distance between each annotation where 1 is the size of one heatmap cell. Used for both row and column annotation.
#' @param annot_size Size (width for row annotation, height for column annotation) of annotation cells compared to a heatmap cell. Used for both row and column annotation.
#' @param annot_border_col Colour of cell borders in annotation. By default it is the same as `border_col` of the main heatmap if it is of length 1, otherwise uses default (grey).
#' @param annot_border_lwd Line width of cell borders in annotation. By default it is the same as `border_lwd` of the main heatmap if it is of length 1, otherwise uses default (0.5).
#' @param annot_border_lty Line type of cell borders in annotation. By default it is the same as `border_lty` of the main heatmap if it is of length 1, otherwise uses default (solid).
#' @param annot_na_col Colour to use for NA values in annotations. Annotation-specific colour can be set in the ggplot2 scales in
#' the `annot_*_col` arguments.
#' @param annot_na_remove Logical indicating if NAs in the annotations should be removed (producing empty spaces).
#' @param annot_rows_params,annot_cols_params Named list with parameters for row and column annotations to overwrite the defaults set by the `annot_*` arguments, each name corresponding to the `*` part
#' (see details for more information).
#' @param show_annot_names Logical controlling if names of annotations should be shown in the drawing area.
#' @param annot_names_size Size of annotation names.
#' @param annot_rows_names_side String specifying which side the row annotation names should be on. Either "top" or "bottom".
#' @param annot_cols_names_side String specifying which side the column annotation names should be on. Either "left" or "right".
#' @param annot_rows_names_params,annot_cols_names_params Named list of parameters for row and column annotation names. Given to `ggplot2::geom_text()`.
#' @param annot_rows_name_params,annot_cols_name_params Deprecated and kept for backward compatibility. Named list of parameters given to `grid::textGrob()` for annotation names.
#' Does not work well with heatmap splits.
#' @param cluster_rows,cluster_cols Logical indicating if rows or columns should be clustered. Can also be `hclust` or `dendrogram` objects.
#' @param cluster_distance String with the distance metric to use for clustering, given to `stats::dist()`.
#' @param cluster_method String with the clustering method to use, given to `stats::hclust()`.
#' @param show_dend_rows,show_dend_cols Logical indicating if a dendrogram should be drawn for the rows or columns.
#' @param dend_rows_side Which side to draw the row dendrogram on ('left' or 'right', defaults to 'right').
#' @param dend_cols_side Which side to draw the column dendrogram on ('bottom' or 'top', defaults to 'bottom').
#' @param dend_col Colour to use for dendrogram lines, applied to both row and column dendrograms.
#' @param dend_dist Distance from heatmap (or annotation) to leaves of dendrogram, measured in heatmap cells (1 is the size of one cell).
#' @param dend_height Number by which to scale dendrogram height, applied to both row and column dendrograms.
#' @param dend_lwd Linewidth of dendrogram lines, applied to both row and column dendrograms.
#' @param dend_lty Dendrogram line type, applied to both row and column dendrograms.
#' @param dend_rows_params,dend_cols_params Named list for row or column dendrogram parameters to overwrite common parameter values. See details for more information.
#' @param dend_rows_extend,dend_cols_extend Named list or functional sequence for specifying `dendextend` functions to apply to the row or column dendrogram. See details for usage.
#' @param split_rows,split_cols Vectors for splitting the rows and columns into facets. Can be a numeric vector shorter than the number of rows/columns to split the heatmap after those indices,
#' or a vector of the same length as the number of rows/columns containing the facet memberships. In the latter case names can be used to match with rows/columns.
#' Alternatively, if clustering is applied a single numeric value is accepted for the number of clusters to divide the plot into.
#' @param split_rows_side,split_cols_side Which side the row/column facet strips should be drawn on ('left'/'right', 'top'/'bottom').
#'
#' @return The heatmap as a `ggplot` object.
#' If `return_data` is TRUE the output is a list containing the plot (named 'plot'),
#' the plotting data ('plot_data', with factor columns 'row' and 'col' and a column 'value' containing the cell values),
#' and the result of the clustering ('row_clustering' and/or 'col_clustering').
#' If the layout is mixed, an extra factor column named 'layout' is included in 'plot_data', showing which triangle each cell belongs to.
#'
#' @export
#'
#' @details
#'
#' When using mixed layouts (`layout` is length two), `mode` needs to be length two as well, specifying the mode to use in each triangle.
#' The `cell_label_*` and `border_*` arguments can all be length one to apply to the whole heatmap, length two vectors to apply to each triangle,
#' or lists of length two, each element containing one value (apply to whole triangle) or a value per cell (apply cell-wise in triangle).
#' `cell_labels` can also be specified per triangle, either as a logical vector of length two, or a list of length two containing a mix of
#' logicals and matrices/data frames.
#'
#' It is also possible to provide two scales for filling or colouring the triangles differently.
#' In this case the `col_scale` must be one character value (scale used for both triangles) or NULL or a list of length two
#' containing the scales to use (character or scale object, or NULL for default). `size_scale` works in the same way (but takes no character values).
#' In addition, the scale-modifying arguments `bins`, `na_col` and `limits` can also be specified per triangle. `limits` must be a list of length two (or one) where each
#' element is a numeric vector of length two.
#'
#' The annotation parameter arguments `annot_rows_params` and `annot_cols_params` should be named lists, where the possible options correspond to
#' the different `annot_*` arguments. The possible options are "dist" (distance between heatmap and annotation), "gap" (distance between annotations),
#' "size" (cell size), "show_names" (logical, if the annotation names should be displayed), "border_col" (colour of border), "border_lwd" (border line width) and "border_lty" (border line type).
#' Any unused options will use the defaults set by the `annot_*` arguments.
#'
#' The dendrogram parameter arguments `dend_rows_params` and `dend_cols_params` should be named lists, analogous to the annotation parameter arguments. Possible options are
#' "col" (line colour), "dist" (distance from heatmap to dendrogram), "height" (height scaling), "lwd" (line width), and "lty" (line type).
#'
#' The `dend_rows_extend` and `dend_cols_extend` arguments make it possible to customise the dendrograms using the `dendextend` package.
#' The argument should be a named list, each element named after the `dendextend` function to use (consecutive usage of the `set` function
#' is supported due to duplicate list names being possible). Each element should contain any arguments given to the `dendextend` function,
#' such as the `what` argument used in the `set` function. Alternatively, `dendextend` functions can be provided in a functional sequence ("fseq" object)
#' by piping together functions using the `%>%` pipe. Functions modifying the labels do not work as the dendrogram labels are not displayed (they are in the axis text).
#' As dendextend::as.ggdend() is used for conversion of the dendrogram, anything not supported by as.ggdend() will not work (such as "nodes_bg" or "rect.dendrogram").
#' See examples and the clustering article for example usage.
#'
#' @examples
#' library(ggplot2)
#'
#' # Use part of the mtcars data (for visibility)
#' hm_in <- mtcars[1:15, ]
#'
#' # Basic usage
#' gghm(hm_in)
#'
#' # Different layout (using a symmetric matrix)
#' gghm(cor(mtcars), layout = "tl")
#'
#' # Mixed layouts
#' gghm(cor(mtcars), layout = c("tr", "bl"),
#'      # Hide one of the legends
#'      legend_order = c(1, NA))
#'
#' # With clustering
#' gghm(scale(hm_in), cluster_rows = TRUE, cluster_cols = TRUE)
#'
#' # Adjusting cluster dendrograms using common and specific options
#' gghm(scale(hm_in), cluster_rows = TRUE, cluster_cols = TRUE,
#'      # Common options
#'      dend_lwd = 0.7, dend_col = "magenta",
#'      # Specific options
#'      dend_rows_params = list(height = 1), dend_cols_params = list(lty = 2))
#'
#' # With annotation and specifying colour scales
#' set.seed(123)
#' annot_rows <- data.frame(.names = rownames(hm_in),
#'                          annot1 = rnorm(nrow(hm_in)),
#'                          annot2 = sample(letters[1:3], nrow(hm_in), TRUE))
#' # Specify colour scale for one of the annotations (viridis mako)
#' annot_fill <- list(annot1 = "G")
#'
#' gghm(scale(hm_in),
#'      # Change colours of heatmap (Brewer Purples)
#'      col_scale = "Purples",
#'      annot_rows_df = annot_rows, annot_rows_col = annot_fill) +
#'      # Use ggplot2::theme to adjust margins to fit the annotation names
#'      theme(plot.margin = margin(30, 10, 60, 20))
#'
#' # Using the dend_*_extend arguments
#' gghm(scale(hm_in), cluster_rows = TRUE, dend_rows_extend =
#'   list("set" = list("branches_lty", c(1, 2, 3)),
#'        # Empty list element (or NULL) if no arguments to be given
#'        "highlight_branches_col" = list()))
gghm <- function(x,
                 layout = "full",
                 mode = if (length(layout) == 1) "heatmap" else c("heatmap", "text"),
                 scale_data = NULL,
                 col_scale = NULL, col_name = "value",
                 limits = NULL, bins = NULL,
                 size_scale = NULL, size_name = "value",
                 legend_order = NULL,
                 include_diag = TRUE, show_names_diag = FALSE, names_diag_params = NULL,
                 show_names_x = TRUE, names_x_side = "top", show_names_y = TRUE, names_y_side = "left",
                 na_col = "grey50", na_remove = FALSE, return_data = FALSE,
                 cell_labels = FALSE, cell_label_col = "black", cell_label_size = 3, cell_label_digits = 2,
                 border_col = "grey", border_lwd = 0.1, border_lty = 1,
                 cell_bg_col = "white", cell_bg_alpha = 0,
                 annot_rows_df = NULL, annot_cols_df = NULL,
                 annot_rows_col = NULL, annot_cols_col = NULL,
                 annot_rows_side = "right", annot_cols_side = "bottom",
                 annot_dist = 0.2, annot_gap = 0, annot_size = 0.5,
                 annot_border_col = if (length(border_col) == 1) border_col else "grey",
                 annot_border_lwd = if (length(border_lwd) == 1) border_lwd else 0.5,
                 annot_border_lty = if (length(border_lty) == 1) border_lty else 1,
                 annot_na_col = na_col, annot_na_remove = na_remove,
                 annot_rows_params = NULL, annot_cols_params = NULL,
                 show_annot_names = TRUE, annot_names_size = 3,
                 annot_rows_names_side = "bottom", annot_cols_names_side = "left",
                 annot_rows_names_params = NULL, annot_cols_names_params = NULL,
                 annot_rows_name_params = NULL, annot_cols_name_params = NULL,
                 cluster_rows = FALSE, cluster_cols = FALSE,
                 cluster_distance = "euclidean", cluster_method = "complete",
                 show_dend_rows = TRUE, show_dend_cols = TRUE, dend_rows_side = "right", dend_cols_side = "bottom",
                 dend_col = "black", dend_dist = 0, dend_height = 0.3, dend_lwd = 0.3, dend_lty = 1,
                 dend_rows_params = NULL, dend_cols_params = NULL,
                 dend_rows_extend = NULL, dend_cols_extend = NULL,
                 split_rows = NULL, split_cols = NULL,
                 split_rows_side = "right", split_cols_side = "bottom") {

  if (!is.matrix(x) & !is.data.frame(x)) cli::cli_abort("{.var x} must be a matrix or data frame.", class = "input_class_error")

  # Check return_data so you don't get an error after everything is done
  check_logical(return_data = return_data)

  # Convert a tibble to a data frame to support row names
  if (inherits(x, "tbl_df")) {x <- as.data.frame(x)}

  # Check that there are colnames
  if (is.null(colnames(x))) {colnames(x) <- 1:ncol(x)}

  if (".names" %in% colnames(x)) {
    rownames(x) <- x[[".names"]]
    x <- dplyr::select(x, -".names")
  }
  # Explicitly define the rownames to prevent ggplot2 error if x is a data frame without explicit rownames
  rownames(x) <- rownames(x)

  # Check that there are rownames
  if (is.null(rownames(x))) {rownames(x) <- 1:nrow(x)}

  # Scale data if specified
  x <- scale_mat(x, scale_data)

  # Check if matrix becomes asymmetric after clustering to throw a warning
  x_sym <- isSymmetric(as.matrix(x))

  # Check layout and mode
  layout_check <- check_layout(layout, mode)

  # Check annotation data frames
  if (!is.null(annot_rows_df)) {
    annot_rows_df <- check_annot_df(annot_rows_df, rownames(x), "annot_rows_df")
  }
  if (!is.null(annot_cols_df)) {
    annot_cols_df <- check_annot_df(annot_cols_df, colnames(x), "annot_cols_df")
  }

  # Logical for full plot layout or not (mixed layout treated as full and triangular)
  full_plt <- if (length(layout) == 1) {layout %in% c("full", "f", "whole", "w")} else {TRUE}

  # If the matrix is asymmetric, triangular layouts break! Throw a warning
  if (!x_sym & (!full_plt | length(layout) == 2)) {
    cli::cli_warn("Triangular layouts are not supported for asymmetric matrices, plotting the full matrix instead.",
                  class = "force_full_warn")
    full_plt <- TRUE
    layout <- "f"
    mode <- mode[1]
  }

  # Overwrite show_names_diag if the input is non-symmetric as it would cause
  # new ghost columns to be added to draw the names where row == col
  # This does not prevent diag names in initially symmetric matrices that become asymmetric as a result
  # of unequal clustering of rows and columns, the result will look a bit strange but no new columns are created
  if (!x_sym) {
    show_names_diag <- FALSE
  }

  # If clustering a symmetric matrix with a triangular layout, both rows and columns must be clustered. Automatically cluster both and throw a warning
  if (x_sym & (!full_plt | length(layout) == 2)) {

    if (((!isFALSE(cluster_rows) & isFALSE(cluster_cols)) | (isFALSE(cluster_rows) & !isFALSE(cluster_cols)))) {
      cli::cli_warn("Cannot cluster only one dimension for triangular layouts, clustering both rows and columns instead.",
                    class = "force_clust_warn")
      if (isFALSE(cluster_rows)) {cluster_rows <- cluster_cols}
      else if (isFALSE(cluster_cols)) {cluster_cols <- cluster_rows}
    }
  }

  # Make dendrograms
  # To allow for providing a hclust or dendrogram object when clustering, make a separate logical clustering variable
  lclust_rows <- FALSE
  row_clustering <- NULL
  if (!isFALSE(cluster_rows)) {
    row_clustering <- cluster_data(cluster_rows, x, cluster_distance, cluster_method, dend_rows_extend)

    # Reorder matrix to fit clustering
    x <- x[row_clustering$dendro$labels$label, ]
    lclust_rows <- TRUE
  }

  lclust_cols <- FALSE
  col_clustering <- NULL
  if (!isFALSE(cluster_cols)) {
    col_clustering <- cluster_data(cluster_cols, t(x), cluster_distance, cluster_method, dend_cols_extend)

    # Reorder matrix to fit clustering
    x <- x[, col_clustering$dendro$labels$label]
    lclust_cols <- TRUE
  }

  # Throw a warning if clustering caused a symmetric input to become asymmetric. Plot the full matrix if not already the case
  if (x_sym & !isSymmetric(as.matrix(x))) {
    cli::cli_warn(paste0("The clustering has ordered rows and columns differently and caused the matrix to become asymmetric.",
                         ifelse(length(layout) == 2 | !full_plt, " Plotting the full matrix.", ""),
                         " The diagonal may be scrambled due to the unequal row and column orders."),
                  class = "unequal_clust_warn")
    layout <- "f"
    full_plt <- TRUE
    mode <- mode[1]
  }

  # Evaluate annot_border_col, annot_border_lwd, annot_border_lty so they get values based on border_col etc
  # Otherwise they may be influenced by border_col etc becoming lists in the next step
  annot_border_col <- annot_border_col
  annot_border_lwd <- annot_border_lwd
  annot_border_lty <- annot_border_lty

  # Prepare parameters for mixed layouts
  if (length(layout) == 2) {
    # Allow for triangle-specific customisation in mixed layouts
    border_col <- prepare_mixed_param(border_col, "border_col")
    border_lwd <- prepare_mixed_param(border_lwd, "border_lwd")
    border_lty <- prepare_mixed_param(border_lty, "border_lty")
    cell_bg_col <- prepare_mixed_param(cell_bg_col, "cell_bg_col")
    cell_labels <- prepare_mixed_param(cell_labels, "cell_labels")
    cell_bg_alpha <- prepare_mixed_param(cell_bg_alpha, "cell_bg_alpha")
    cell_label_col <- prepare_mixed_param(cell_label_col, "cell_label_col")
    cell_label_size <- prepare_mixed_param(cell_label_size, "cell_label_size")
    cell_label_digits <- prepare_mixed_param(cell_label_digits, "cell_label_digits")
  }

  if (!full_plt) {
    # Move annotation and dendrograms to non-empty sides if not full plot
    annot_rows_side <- dend_rows_side <- ifelse(layout %in% c("topleft", "tl", "bottomleft", "bl"), "left", "right")
    annot_cols_side <- dend_cols_side <- ifelse(layout %in% c("bottomleft", "bl", "bottomright", "br"), "bottom", "top")
  }

  # Make long format data, ordering columns to fit layout
  if (length(layout) == 1) {
    x_long <- layout_hm(x, layout = layout, na_remove = na_remove)

    # Reorder data to ensure it is in the drawing order
    x_long <- if (any(c("topleft", "tl", "bottomright", "br") %in% layout)) {
      dplyr::arrange(x_long, col, row)
    } else {
      dplyr::arrange(x_long, col, dplyr::desc(row))
    }

  } else if (length(layout) == 2) {
    # Mixed layout, generate one per half and mark by layout. The first one gets the diagonal
    x_long <- dplyr::bind_rows(
      dplyr::mutate(layout_hm(x, layout = layout[1], na_remove = na_remove), layout = layout[1]),
      dplyr::filter(
        dplyr::mutate(layout_hm(x, layout = layout[2], na_remove = na_remove), layout = layout[2]),
        as.character(row) != as.character(col)
        )
    )
    # Convert layout to a factor vector
    x_long[["layout"]] <- factor(x_long[["layout"]], levels = layout)

    x_long <- if (any(c("topleft", "tl", "bottomright", "br") %in% layout)) {
      dplyr::arrange(x_long, layout, col, row)
    } else {
      dplyr::arrange(x_long, layout, col, dplyr::desc(row))
    }
  }

  # If clustering and facetting the same dimension, cannot show dendrogram
  facet_already_warned <- FALSE
  if (!isFALSE(cluster_rows) && !is.null(split_rows)) {
    show_dend_rows <- FALSE
  }
  if (!isFALSE(cluster_cols) && !is.null(split_cols)) {
    show_dend_cols <- FALSE
  }

  # Introduce facetting
  split_rows_names <- split_cols_names <- FALSE
  if (!is.null(split_rows)) {
    x_long <- prepare_facets(x_long, x, facet_in = split_rows, layout = layout,
                             context = "row", dendro = row_clustering)
    # Hide facet names if facet input is shorter than number of rows, unless data is clustered
    split_rows_names <- ifelse(length(split_rows) < nrow(x) && isFALSE(cluster_rows), FALSE, TRUE)
  }
  if (!is.null(split_cols)) {
    x_long <- prepare_facets(x_long, x, facet_in = split_cols, layout = layout,
                             context = "col", dendro = col_clustering)
    split_cols_names <- ifelse(length(split_cols) < ncol(x) && isFALSE(cluster_cols), FALSE, TRUE)
  }

  # Annotation for rows and columns
  # Default annotation parameters
  annot_default <- list(dist = annot_dist, gap = annot_gap, size = annot_size,
                        show_names = show_annot_names, border_col = annot_border_col,
                        border_lwd = annot_border_lwd, border_lty = annot_border_lty)
  # Deal with deprecated annot name params
  annot_rows_names_strategy <- check_annot_names_deprecated(new_params = annot_rows_names_params,
                                                            old_params = annot_rows_name_params,
                                                            context = "rows")
  annot_rows_names_params <- switch(annot_rows_names_strategy, "geom" = annot_rows_names_params,
                                    "grid" = annot_rows_name_params)

  annot_cols_names_strategy <- check_annot_names_deprecated(new_params = annot_cols_names_params,
                                                            old_params = annot_cols_name_params,
                                                            context = "cols")
  annot_cols_names_params <- switch(annot_cols_names_strategy, "geom" = annot_cols_names_params,
                                    "grid" = annot_cols_name_params)

  if (is.data.frame(annot_rows_df)) {
    annot_rows_prep <- prepare_annotation(annot_df = annot_rows_df, annot_defaults = annot_default,
                                          annot_params = annot_rows_params, annot_side = annot_rows_side,
                                          context = "rows", annot_name_params = annot_rows_names_params,
                                          annot_names_size = annot_names_size,
                                          annot_names_side = annot_rows_names_side, data_size = ncol(x),
                                          x_long = x_long, annot_names_strategy = annot_rows_names_strategy)
    annot_rows_df <- annot_rows_prep[[1]]; annot_rows_params <- annot_rows_prep[[2]];
    annot_rows_pos <- annot_rows_prep[[3]]; annot_rows_names_params <- annot_rows_prep[[4]]
    annot_rows_names_side <- annot_rows_prep[[5]]
  }

  if (is.data.frame(annot_cols_df)) {
    annot_cols_prep <- prepare_annotation(annot_df = annot_cols_df, annot_defaults = annot_default,
                                          annot_params = annot_cols_params, annot_side = annot_cols_side,
                                          context = "cols", annot_name_params = annot_cols_names_params,
                                          annot_names_size = annot_names_size,
                                          annot_names_side = annot_cols_names_side, data_size = nrow(x),
                                          x_long = x_long, annot_names_strategy = annot_cols_names_strategy)
    annot_cols_df <- annot_cols_prep[[1]]; annot_cols_params <- annot_cols_prep[[2]];
    annot_cols_pos <- annot_cols_prep[[3]]; annot_cols_names_params <- annot_cols_prep[[4]]
    annot_cols_names_side <- annot_cols_prep[[5]]
  }

  # Generate dendrograms, positions depend on annotation sizes
  dend_defaults <- list(dist = dend_dist, col = dend_col, height = dend_height, lwd = dend_lwd, lty = dend_lty)

  check_logical(show_dend_rows = show_dend_rows)
  check_logical(show_dend_cols = show_dend_cols)

  if (lclust_rows & isTRUE(show_dend_rows)) {
    dendro_rows <- prepare_dendrogram(dendro_in = row_clustering$dendro, context = "rows",
                                      dend_side = dend_rows_side,
                                      dend_defaults = dend_defaults,
                                      dend_params = dend_rows_params,
                                      full_plt = full_plt, layout = layout, x_long = x_long,
                                      annot_df = annot_rows_df, annot_side = annot_rows_side,
                                      annot_pos = annot_rows_pos, annot_size = annot_rows_params$size)

    # Check that the dendrogram labels are in the correct positions after mirroring and moving
    dendro_rows <- check_dendrogram_pos(dat = x_long, context = "row", dendro = dendro_rows)
  }

  if (lclust_cols & isTRUE(show_dend_cols)) {
    dendro_cols <- prepare_dendrogram(dendro_in = col_clustering$dendro, context = "cols",
                                      dend_side = dend_cols_side,
                                      dend_defaults = dend_defaults,
                                      dend_params = dend_cols_params,
                                      full_plt = full_plt, layout = layout, x_long = x_long,
                                      annot_df = annot_cols_df, annot_side = annot_cols_side,
                                      annot_pos = annot_cols_pos, annot_size = annot_cols_params$size)
    dendro_cols <- check_dendrogram_pos(dat = x_long, context = "col", dendro = dendro_cols)
  }


  # Generate colour scales according to specifications
  # Skip this whole part if the function call comes directly from ggcorrhm, as it is already handled there
  if (!grepl("^ggcorrhm\\(", deparse(sys.call(-1))[1])) {
    # Get scales and their orders
    scale_order <- make_legend_order(mode = mode,
                                     col_scale = col_scale,
                                     size_scale = size_scale, annot_rows_df = annot_rows_df,
                                     annot_cols_df = annot_cols_df,
                                     bins = bins, limits = limits, na_col = na_col,
                                     legend_order = legend_order)

    # Prepare scales for mixed layouts
    if (length(layout) == 2) {
      bins <- prepare_mixed_param(bins, "bins")
      limits <- prepare_mixed_param(limits, "limits")
      na_col <- prepare_mixed_param(na_col, "na_col")
      col_name <- prepare_mixed_param(col_name, "col_name")
      col_scale <- prepare_mixed_param(col_scale, "col_scale")
      size_name <- prepare_mixed_param(size_name, "size_name")
      size_scale <- prepare_mixed_param(size_scale, "size_scale")
    }

    # Generate the necessary scales
    main_scales <- prepare_scales(scale_order = scale_order, context = "gghm",
                                  layout = layout,
                                  val_type = ifelse(is.character(x_long[["value"]]) | is.factor(x_long[["value"]]), "discrete", "continuous"),
                                  col_scale = col_scale, col_name = col_name,
                                  size_scale = size_scale, size_name = size_name,
                                  na_col = na_col, limits = limits, bins = bins)

    # Annotation scales
    annot_scales <- prepare_scales_annot(scale_order = scale_order, na_col = annot_na_col,
                                         annot_rows_df = annot_rows_df, annot_cols_df = annot_cols_df,
                                         annot_rows_col = annot_rows_col, annot_cols_col = annot_cols_col)

    # Generate the scale lists to pass to gghm
    col_scale <- extract_scales(main_scales, scale_order, c("fill", "col"), layout)
    size_scale <- extract_scales(main_scales, scale_order, "size", layout)
  } else {
    annot_scales <- list("rows" = annot_rows_col, "cols" = annot_cols_col)
  }

  # Check that rows and columns in cell label input exist (if matrix/data frame)
  if (length(layout) == 2 && is.vector(cell_labels)) {
    cell_labels <- lapply(cell_labels, function(x) check_cell_labels(x, x_long))
  } else {
    cell_labels <- check_cell_labels(cell_labels, x_long)
  }

  # Build plot
  check_logical(show_names_diag = show_names_diag)

  if (length(layout) == 1) {
    plt <- make_heatmap(x_long = x_long, plt = NULL, mode = mode, include_diag = include_diag,
                        invisible_diag = isSymmetric(as.matrix(x)) && isTRUE(show_names_diag),
                        border_lwd = border_lwd, border_col = border_col, border_lty = border_lty,
                        show_names_diag = show_names_diag, show_names_x = show_names_x, show_names_y = show_names_y,
                        names_x_side = names_x_side, names_y_side = names_y_side,
                        col_scale = col_scale, size_scale = size_scale,
                        cell_labels = cell_labels, cell_label_col = cell_label_col,
                        cell_label_size = cell_label_size, cell_label_digits = cell_label_digits,
                        cell_bg_col = cell_bg_col, cell_bg_alpha = cell_bg_alpha,
                        split_rows_names = split_rows_names, split_cols_names = split_cols_names,
                        split_rows_side = split_rows_side, split_cols_side = split_cols_side)
    if (isTRUE(show_names_diag)) {
      plt <- add_diag_names(plt = plt, x_long = x_long, names_diag_params = names_diag_params)
    }
  } else if (length(layout) == 2) {

    # Avoid name clash
    lt <- layout
    # First half of the plot
    plt <- make_heatmap(x_long = dplyr::filter(x_long, layout == lt[1]), plt = NULL,
                        mode = mode[1], include_diag = include_diag, invisible_diag = TRUE,
                        border_lwd = border_lwd[[1]], border_col = border_col[[1]], border_lty = border_lty[[1]],
                        show_names_diag = show_names_diag, show_names_x = show_names_x, show_names_y = show_names_y,
                        names_x_side = names_x_side, names_y_side = names_y_side,
                        col_scale = col_scale[[1]], size_scale = size_scale[[1]],
                        cell_labels = cell_labels[[1]], cell_label_col = cell_label_col[[1]],
                        cell_label_size = cell_label_size[[1]], cell_label_digits = cell_label_digits[[1]],
                        cell_bg_col = cell_bg_col[[1]], cell_bg_alpha = cell_bg_alpha[[1]],
                        split_rows_names = split_rows_names, split_cols_names = split_cols_names,
                        split_rows_side = split_rows_side, split_cols_side = split_cols_side)
    # Remaining half
    # Add new scales if multiple are provided
    if (isTRUE(col_scale[[1]][["aesthetics"]] == col_scale[[2]][["aesthetics"]])) {
      plt <- plt + ggnewscale::new_scale(col_scale[[1]][["aesthetics"]])
    }
    if (!is.null(size_scale[[2]])) {plt <- plt + ggnewscale::new_scale(new_aes = "size")}

    plt <- make_heatmap(x_long = dplyr::filter(x_long, layout == lt[2]), plt = plt,
                        mode = mode[2], include_diag = FALSE, invisible_diag = FALSE,
                        border_lwd = border_lwd[[2]], border_col = border_col[[2]], border_lty = border_lty[[2]],
                        show_names_diag = FALSE, show_names_x = show_names_x, show_names_y = show_names_y,
                        names_x_side = names_x_side, names_y_side = names_y_side,
                        col_scale = col_scale[[2]], size_scale = size_scale[[2]],
                        cell_labels = cell_labels[[2]], cell_label_col = cell_label_col[[2]],
                        cell_label_size = cell_label_size[[2]], cell_label_digits = cell_label_digits[[2]],
                        cell_bg_col = cell_bg_col[[2]], cell_bg_alpha = cell_bg_alpha[[2]])
    if (show_names_diag) {
      plt <- add_diag_names(plt = plt, x_long = x_long, names_diag_params = names_diag_params)
    }
  }

  # Add row and column annotations
  if (is.data.frame(annot_rows_df)) {
    plt <- add_annotation(plt = plt, context = "rows", annot_df = annot_rows_df, annot_pos = annot_rows_pos,
                          annot_size = annot_rows_params$size, annot_border_lwd = annot_rows_params$border_lwd,
                          annot_border_col = annot_rows_params$border_col,
                          annot_border_lty = annot_rows_params$border_lty,
                          show_annot_names = annot_rows_params$show_names,
                          na_remove = annot_na_remove, col_scale = annot_scales[["rows"]],
                          names_side = annot_rows_names_side, name_params = annot_rows_names_params,
                          names_strategy = annot_rows_names_strategy)
  }

  if (is.data.frame(annot_cols_df)) {
    plt <- add_annotation(plt = plt, context = "cols", annot_df = annot_cols_df, annot_pos = annot_cols_pos,
                          annot_size = annot_cols_params$size, annot_border_lwd = annot_cols_params$border_lwd,
                          annot_border_col = annot_cols_params$border_col,
                          annot_border_lty = annot_cols_params$border_lty,
                          show_annot_names = annot_cols_params$show_names,
                          na_remove = annot_na_remove, col_scale = annot_scales[["cols"]],
                          names_side = annot_cols_names_side, name_params = annot_cols_names_params,
                          names_strategy = annot_cols_names_strategy)
  }

  # Add dendrograms
  if (lclust_rows & isTRUE(show_dend_rows)) {
    plt <- add_dendrogram(plt = plt, dendro = dendro_rows, dend_col = dendro_rows$params$col,
                          dend_lwd = dendro_rows$params$lwd, dend_lty = dendro_rows$params$lty)
  }

  if (lclust_cols & isTRUE(show_dend_cols)) {
    plt <- add_dendrogram(plt = plt, dendro = dendro_cols, dend_col = dendro_cols$params$col,
                          dend_lwd = dendro_cols$params$lwd, dend_lty = dendro_cols$params$lty)
  }

  if (return_data) {

    # If layout is included (for mixed layouts), rename column
    if ("lt" %in% colnames(x_long)) {x_long <- dplyr::rename(x_long, layout = lt)}

    # Data to return. If not drawing the diagonal, skip those values
    data_out <- if (!include_diag) {
      dplyr::filter(x_long, as.character(row) != as.character(col))
    } else {
      x_long
    }
    list_out <- list("plot" = plt, "plot_data" = data_out)

    if (!isFALSE(cluster_rows)) {
      list_out[["row_clustering"]] <- row_clustering[["clust"]]
    }
    if (!isFALSE(cluster_cols)) {
      list_out[["col_clustering"]] <- col_clustering[["clust"]]
    }

    return(list_out)

  } else {
    return(plt)
  }
}


#' Scale data rows or columns.
#'
#' @keywords internal
#'
#' @param x Matrix to scale. If NULL, it is returned as is.
#' @param scl String of dimension to scale ("rows", "columns", "none" (or NULL), or a substring of the beginning).
#' The string is matched literally as a prefix of the allowed values (it is not treated as a regular expression).
#'
#' @returns Scaled (or not scaled) matrix. Rows are scaled by transposing, calling `scale()` and transposing back,
#' columns by calling `scale()` directly. An error of class `scale_data_error` is thrown if `scl` is not a valid choice.
#'
scale_mat <- function(x, scl = NULL) {
  # Nothing to scale, or no scaling requested (NULL or zero-length input)
  if (is.null(x) || is.null(scl) || length(scl) == 0) {
    return(x)
  }

  # Only a single, non-missing string can be a (partial) match of the allowed values
  valid_input <- is.character(scl) && length(scl) == 1 && !is.na(scl)

  # Literal prefix matching, checked in the order none -> rows -> columns
  # (an empty string is a prefix of everything and therefore means no scaling)
  if (valid_input && startsWith("none", scl)) {
    return(x)
  }
  if (valid_input && startsWith("rows", scl)) {
    return(t(scale(t(x))))
  }
  if (valid_input && startsWith("columns", scl)) {
    return(scale(x))
  }

  cli::cli_abort("{.var scale_data} must be NULL or 'none' (no scaling), 'rows' or 'columns' (or a substring of the beginning).",
                 class = "scale_data_error")
}

#' Prepare parameters for mixed layouts.
#'
#' @keywords internal
#'
#' @param param Parameter to prepare.
#' @param param_name Parameter name (for error messages and handling special parameter).
#'
#' @returns A list (or vector) of length two, with one element per triangle.
#' * A scale parameter (name ending in `_scale`) given as a list with a single scale object is returned as
#'   that object followed by NULL (the object is not repeated).
#' * NULL is returned as a list of two NULLs for scale parameters, parameters ending in `_digits`, and
#'   `size_range`, `limits` and `bins`.
#' * Any other list of length one has its content repeated.
#' * Non-list `size_range` and `limits` are repeated as whole vectors.
#' * Other input of length one (and matrix or data frame `cell_labels`) is repeated.
#' * Input of length two is returned as is.
#' * Any other input results in an error of class `param_len_error`.
#'
prepare_mixed_param <- function(param, param_name) {

  is_scale_param <- grepl("_scale$", param_name)
  is_single_list <- is.list(param) && length(param) == 1

  if (is_scale_param && is_single_list && inherits(param[[1]], c("Scale", "ggproto", "gg"))) {
    # If a scale object, put it in a list but don't repeat it
    param_out <- list(param[[1]], NULL)

  } else if (is.null(param) && (is_scale_param || grepl("_digits$", param_name) ||
                                param_name %in% c("size_range", "limits", "bins"))) {
    # Return a list of NULLs if NULL
    param_out <- list(NULL, NULL)

  } else if (is_single_list) {
    # If a list of length one, repeat its content. This also covers scale parameters
    # whose single element is a character or NULL (e.g. list("Blues") or list(NULL)),
    # so that the output is always assigned
    param_out <- list(param[[1]], param[[1]])

  } else if (!is.list(param) && param_name %in% c("size_range", "limits")) {
    # Scale parameters that can be a vector
    param_out <- list(param, param)

  } else if (length(param) == 1 || (param_name == "cell_labels" && (is.matrix(param) || is.data.frame(param)))) {
    # Recycle if length one, or if cell_labels is a data frame or matrix for cell labels
    param_out <- list(param, param)

  } else if (length(param) != 2) {
    # Wrong length, pick the error message matching the parameter
    msg <- if (param_name == "col_scale") {
      "In a mixed layout, {.var {param_name}} must be either one character specifying a scale (used for all),
       or a list with up to two scales (character, scale object or NULL). See the details of 'gghm' for more on usage."
    } else if (param_name == "size_scale") {
      "In a mixed layout, {.var {param_name}} must be either NULL (use default),
       or a list with up to two scales (scale object or NULL). See the details of 'gghm' for more on usage."
    } else {
      "In a mixed layout, {.var {param_name}} must be either one (used for all) or two (used for each triangle) values,
                          or a list of length two with a vector for each triangle. See the details of 'gghm' for more on usage."
    }

    cli::cli_abort(msg, class = "param_len_error")

  } else {
    # Length two input is used as is (one element per triangle)
    param_out <- param
  }

  return(param_out)
}