PPBstats: An R package to perform analysis found within PPB programmes

Documented in plot.parameter_groups

#' Get ggplot to visualize output from \code{\link{parameter_groups}}
#'
#' @description
#' \code{plot.parameter_groups} returns ggplot to visualize outputs from \code{\link{parameter_groups}}
#'
#' @param x Output from \code{\link{parameter_groups}}
#'
#' @param ind_to_highlight individual to higlight on the PCA plot
#'
#' @param ... further arguments passed to or from other methods
#'
#' @details
#' S3 method.
#' See examples for AMMI, GGE and hierarchical bayesian GxE model : https://priviere.github.io/PPBstats_book/family-2.html
#' 
#' @return 
#' It returns list of ggplot object
#'   \itemize{
#'    \item pca : a list with three elements on the PCA on the group of parameters :
#'     \itemize{
#'      \item composante_variance : variance caught by each dimension of the PCA
#'      \item ind : graph of individuals
#'      \item var : graph of variables
#'     }
#'    \item clust : output from \code{factextra::fviz_nbclust()}. See \code{?factoextra::fviz_nbclust} for more details, 
#'    a list of number of cluster + 1 element
#'   }
#'   
#' @author Pierre Riviere
#' 
#' @seealso \code{\link{parameter_groups}}
#' 
#' @export
#' 
#' @import dplyr
#' @import factoextra
#' @import ggplot2
#' 
plot.parameter_groups <- function(x, ind_to_highlight = NULL, ...){
  y = clust = NULL  # to avoid no visible binding for global variable
  
  pca = x$obj.pca
  res.hcpc = x$clust$res.hcpc
  
  # ind_to_highlight ----------
  if( !is.null(ind_to_highlight) ){
    if( !is.element(ind_to_highlight, rownames(res.hcpc$call$X)) ) { 
      warning(ind_to_highlight, " is not present in the data set.")
      highlight = FALSE
    } else { highlight = TRUE }
  } else { highlight = FALSE }
  
  res = res.hcpc
  
  # Get one plot per cluster with the rigth legend ----------
  nb_clust = nlevels(res.hcpc$call$X$clust)

  p_all = fviz_cluster(res.hcpc, repel = TRUE) 
  if(highlight){
    D = p_all$data
    coord = D[grep(ind_to_highlight,D$name),c("x","y")]
    p_all = p_all + geom_point(data=coord,mapping=aes(x=x,y=y))
  }

  list_p_clust = list(p_all)
  for(c in 1:nb_clust){
    d = res
    dX = dplyr::filter(d$call$X, clust == c)
    rownames(dX) = rownames(d$call$X)[which(d$call$X$clust == c)]
    d$call$X = dX
    levels(d$call$X$clust) = c(1:nb_clust)
    res.hcpc = d
    
    p1 = fviz_cluster(res.hcpc, repel = TRUE)
    
    xlim = range(p1$data$x)
    ylim = range(p1$data$y)
    levels(d$call$X$clust) = c(1:nb_clust)
    for(cc in 1:nb_clust){ d$call$X = rbind.data.frame(d$call$X, c(NA, NA, cc, 1)) }
    rownames(d$call$X)[(nrow(d$call$X) - nb_clust + 1): nrow(d$call$X)] = paste("cluster", c(1:nb_clust))

    p = fviz_cluster(d, repel = TRUE, ellipse = FALSE) 
    p = p + coord_cartesian(xlim = xlim, ylim = ylim)
    
    if(highlight){
      D = p$data
      coord = D[grep(ind_to_highlight,D$name),c("x","y")]
      if(nrow(coord)>0){p = p + geom_point(data=coord,mapping=aes(x=x,y=y))}
    }


    list_p_clust = c(list_p_clust, list(p))
  }
  names(list_p_clust) = paste("cluster", c("all", c(1:nb_clust)), sep = "_")
  
  # Return results ----------
  out = list(
    "pca" = list(
      "composante_variance" = fviz_eig(pca),
      "ind" = fviz_pca_ind(pca, repel = TRUE),
      "var" = fviz_pca_var(pca, repel = TRUE)
    ),
    "clust" = list_p_clust
  )
  
  return(out)
}