R/biv_density_plot.R

Defines functions biv_dense_plot densePlot

Documented in biv_dense_plot

# CUSTOMISED GGPLOT ----

#' A util function to plot a customized ggplot
#' @noRd
densePlot <- function(data, numVar, catVar, colors = NULL){
  data %>%
    ggplot2::ggplot(ggplot2::aes_string(numVar, fill = catVar)) +
    ggplot2::geom_density(alpha = 0.3, na.rm = TRUE) +
    ggplot2::scale_fill_manual(values = colors) +
    ggplot2::labs(title = paste0("Distribution of ", numVar, " Based on ", catVar)) +
    ggplot2::theme_minimal()
}

# DENSITY PLOTS FOR NUMERIC FEATURES SPLIT IN TARGET FEAT CATEGORIS ----

#' A function to display or save density plots created on all numeric features.
#'
#' @description Creates (or saves as png if asked) density plots for all numeric features. Splits the density plots based on target feature categories.
#'
#' @param dataset Name of the data frame object
#' @param classVar Name of the target feature
#' @param order A vector listing the target feature labels in the desired order. To use default order leave this parameter. Default value NULL.
#' @param colors A vector listing which color to use to represent which target feature label. To have the function pick color leave this parameter. Deafult value NULL.
#' @param loc A string with the directory where you want to save the plots. If no location is provided the plots will be created and displayed but not stored as image files.
#' @param facet Name of the features along which to separate the plots as facets
#'
#' @return
#'
#' Returns three outputs:
#' 1. If loc = NULL, returns plots and displays in the RStudio Plots window,
#' 2. If loc has location provided, creates and saves the plots. Doesn't display in RStudio.
#'
#' @examples
#'
#' library(dplyr)
#' library(ggplot2)
#' biv_dense_plot(dataset = iris,
#' classVar = Species,
#' order = c("virginica", "versicolor", "setosa"),
#' colors = c("virginica" = "#32a897", "versicolor" = "#328bab", "setosa" = "#8031ad"),
#' loc = NULL)
#'
#'
#' @export

biv_dense_plot <- function(dataset, classVar, order = NULL, colors = NULL, facet = NULL, loc = NULL) {

  x <- rlang::enquo(classVar) %>% rlang::get_expr()
  nLevels <- dplyr::select(dataset, {{classVar}}) %>% unique() %>% nrow()

  # producing random color n case no color is provided
  if(is.null(colors)){
    colors = randomcoloR::randomColor(nLevels, luminosity = "bright")
  }

  print("plotting...")
  if(is.null(loc)){
    for(i in names(dplyr::select(dataset, where(is.numeric)))) {
      print(dataset %>%
              densePlot(i, catVar = x, colors = colors) +
              wrap_by({{facet}})
              )
    }
  } else{

    for(i in names(dplyr::select(dataset, where(is.numeric)))) {

      png(paste0(loc, "/denseplot_", i, ".PNG"), width = 627, height = 453)
      plot <- dataset %>%
        densePlot(i, catVar = x, colors = colors) +
        wrap_by({{facet}})
      print(plot)
      dev.off()
    }
  }
}
Curious-Joe/fastEda documentation built on March 23, 2022, 12:13 p.m.