flowR: R-shiny interface for the analysis of flow cytometry data

Documented in add_columns_from_metadata add_gate add_gates_flowCore add_gate_to_plot asinh_transform build_flowset_from_df call_plot_function copy_gate dim_reduction ellipse_path find_all_parent_gates format_plot get_all_ancestors get_all_descendants get_cluster get_data_gs get_gate_coordinates get_gates_from_gs get_gates_from_ws get_gates_from_ws_diva get_groups_from_ws get_parameters_gs get_plot_data get_plot_data_range getPopStatsPlus get_spillover_matrices_from_ws get_spillover_matrices_from_ws_diva get_templates_from_ws_diva gh_get_gate_names gs_get_fs_subset parseCompensationDiva parseGate parseGateDiva parseGroupNodes parseSampleNodes parseSpillover parseSpilloverMatrix parseSpilloverMatrixDiva parseTemplatesNodesDiva plot_bar plot_contour plot_dots plot_gate plot_gh plot_gs plot_gs_ggcyto plot_heatmap plot_hexagonal plot_histogram plot_pca plot_stat plot_tile plot_tree scale_values transform_gates

utils::globalVariables(c("df", "xvar", "yvar", "x", "y"))

###### Parse Diva workspace (.xml Diva workspace files) ######################################################

#' Return the name of 'template' xml_node
#' from a Diva xml workspace
#' @param templateNode a 'template' xml_node from a Diva xml workspace
#' @import xml2
parseTemplatesNodesDiva <- function(templateNode){
  x <- templateNode
  attrs <- as.list(xml_attrs(x))
  if("name" %in% names(attrs)){
    return(attrs$name)
  }else{return(NA)}
}

#' Return the names of all 'templates'
#' from a Diva xml workspace
#' @param ws_path path to the workspace
#' @import xml2
get_templates_from_ws_diva <- function(ws_path){
  ws <- read_xml(ws_path)
  templates <-  xml_find_all(ws, ".//worksheet_template")
  template_names <- unlist(lapply(templates, parseTemplatesNodesDiva))
  return(template_names[!is.na(template_names)])
}

#' Extract all gates from a Diva xml workspace
#' @param ws_path path to the workspace
#' @param template Names of the template to consider
#' @import xml2
#' @importFrom flowCore rectangleGate polygonGate
get_gates_from_ws_diva <- function(ws_path, template = NULL){
  xt <- read_xml(ws_path)
  templates <-  xml_find_all(xt, ".//worksheet_template")
  template_names <- unlist(lapply(templates, parseTemplatesNodesDiva))
  
  idx_template <- 1
  if(!is.null(template)){
    if(template %in% template_names){
      idx_template <- which(template_names == template)
    }
  }
  
  gatesNode <- xml_find_first(templates[[idx_template]], ".//gates")
  gate_set <- xml_find_all(gatesNode, ".//gate")
  gates <- lapply(gate_set, parseGateDiva)
  
  gate_list <- list()
  
  for(i in 1:length(gates)){
    if(!is.null(gates[[i]])){
      parent <- gates[[i]]$parent_long
      name <- gates[[i]]$name_long
      
      #parent <- gsub(" ", "_", parent)
      #name <- gsub(" ", "_", name)
      
      if(gates[[i]]$type == "RectangleGate"){
        boundaries <- gates[[i]]$boundaries
        g <- flowCore::rectangleGate(.gate = boundaries, filterId = basename(name))
        gate_list[[name]] <- list(gate = g, parent = parent)
      }else if(gates[[i]]$type == "PolygonGate"){
        polygon <- gates[[i]]$polygon
        g <- flowCore::polygonGate(.gate = polygon, filterId = basename(name) )
        gate_list[[name]] <- list(gate = g, parent = parent)
      }else{
        warning(paste("gate type", gates[[i]]$type, "not supported"))
        #g <- NULL
        #gate_list[[name_long]] <- list(gate = g, parent = parent)
      }
    }
    
  } 
  return(gate_list)
  
  return(gates)
}

#' Return relevant info from a 'gate' xml_node
#' from a Diva xml workspace
#' @param gateNode a 'gate' xml_node from a Diva xml workspace
#' @import xml2
parseGateDiva <- function(gateNode){
  
  res <- list()
  gate <- gateNode
  
  fullname <- xml_attr(gate, "fullname")
  
  if(fullname == "All Events"){
    return(NULL)
  }
  
  name_long <- gsub(fixed = FALSE, pattern = "\\\\", replacement = "/", x= fullname)
  name_long <- gsub("All Events", "", name_long)
  
  name <- xml_text(xml_find_all(gate, ".//name"))
  parent <- xml_text(xml_find_all(gate, ".//parent"))
  is_x_parameter_log <- xml_text(xml_find_all(gate, ".//is_x_parameter_log"))
  is_x_parameter_scaled <- xml_text(xml_find_all(gate, ".//is_x_parameter_scaled"))
  x_parameter_scale_value <- xml_text(xml_find_all(gate, ".//x_parameter_scale_value"))
  is_y_parameter_log <- xml_text(xml_find_all(gate, ".//is_y_parameter_log"))
  is_y_parameter_scaled <- xml_text(xml_find_all(gate, ".//is_y_parameter_scaled"))
  y_parameter_scale_value <- xml_text(xml_find_all(gate, ".//y_parameter_scale_value"))
  
   # print(name)
   # print(is_x_parameter_log)
   # print(is_x_parameter_scaled)
   # print(x_parameter_scale_value)
   # print(is_y_parameter_log)
   # print(is_y_parameter_scaled)
   # print(y_parameter_scale_value)
  
  parent <- gsub(fixed = FALSE, pattern = "\\\\", replacement = "/", x= parent)
  if(parent == "All Events"){
    parent <- "root"
  }else{
    parent <- gsub("All Events", "", parent)
  }
  parent_long <- parent
  parent <- basename(parent)
  
  
  res <- c(res, list("name" = name,
                     "parent" =  parent, 
                     "name_long" = name_long, 
                     "parent_long" = parent_long
  ))
  
  region <- xml_find_all(gate, ".//region")
  
  xparm <- xml_attr(region, "xparm")
  yparm <- xml_attr(region, "yparm")
  type <- xml_attr(region, "type")
  
  region <- xml_find_all(gate, ".//region")
  points <- xml_find_first(region, ".//points")
  vertexes <- xml_find_all(points, ".//point")
  
  m <- do.call(rbind, lapply(vertexes, function(v){
    x <- as.numeric(xml_attr(v, "x"))
    if(is_x_parameter_log == "true" & is_x_parameter_scaled == "false"){x <- 10^x}
    y <- as.numeric(xml_attr(v, "y"))
    if(is_y_parameter_log == "true" & is_y_parameter_scaled == "false"){y <- 10^y}
    return(data.frame(x = x,
                      y = y))
  }))
  m <- as.matrix(m)
  colnames(m) <- c(xparm, yparm)
  
  if(type == "INTERVAL_REGION"){
    res <- c(res, list("type" = "RectangleGate",
                       "boundaries" = rbind(m[1,1], m[2,1])
    ))
  }else if(type %in% c("RECTANGLE_REGION", "POLYGON_REGION")){
    res <- c(res, list("type" = "PolygonGate",
                       "polygon" = m
    ))
  }
  
  return(res)
  
}

#' Extract spillover matrices from a Diva xml workspace
#' @param ws_path path to the workspace
#' @import xml2
get_spillover_matrices_from_ws_diva <- function(ws_path){
  ws <- read_xml(ws_path)
  settingsNodes <-  xml_find_all(ws, ".//instrument_settings")
  spill_list <- lapply(settingsNodes[1], parseSpilloverMatrixDiva)
  spill_names <- unlist(lapply(settingsNodes[1], function(x){as.list(xml_attrs(x))$name}))
  names(spill_list) <- spill_names
  return(spill_list)
}

#' Return the spillover matrix associated with a 'instrument_settings' xml_node
#' from a Diva xml workspace
#' @param settingsNode a 'instrument_settings' xml_node from a Diva xml workspace
#' @import xml2
#' @importFrom reshape2 acast
parseSpilloverMatrixDiva <- function(settingsNode){
  x <- settingsNode
  parameterNodes <- xml_find_all(x, ".//parameter")
  
  spill_parameters <- unlist(lapply(parameterNodes, function(x){
    name <- as.list(xml_attrs(x))$name
    can_be_comp <- xml_text(xml_find_first(x, ".//can_be_compensated"))
    is_comp <- FALSE
    if(!is.na(can_be_comp)){
      if(can_be_comp == "true"){
        is_comp <- TRUE
      }
    }
    if(is_comp){
      return(name)
    }else{
      return(NULL)
    }
  }))
  
  df_spillover_list <- lapply(parameterNodes, function(x){
    name <- as.list(xml_attrs(x))$name
    if(name %in% spill_parameters){
      df <- parseCompensationDiva(x)
      df$parameter <- spill_parameters
      return(df)
    }else{
      return(NULL)
    }
  })
  
  df_spillover <- do.call(rbind, df_spillover_list)
  compMat <- reshape2::acast(df_spillover, input ~ parameter)
  return(compMat)
}

#' Return the spillover coefficients associated with a 'parameter' xml_node
#' from a Diva xml workspace
#' @param parameterNode a 'parameter' xml_node from a Diva xml workspace
#' @import xml2
parseCompensationDiva <- function(parameterNode){
  x <- parameterNode
  name <- as.list(xml_attrs(x))$name
  compensationNode <- xml_find_first(x, ".//compensation")
  coeffNodes <- xml_find_all(compensationNode, ".//compensation_coefficient")
  coeffs <- unlist(lapply(coeffNodes, function(x){xml_double(x)}))
  if(!is.null(coeffs)){
    df <- data.frame(value = coeffs)
    df$input <- name
    return(df)
  }else{
    return(NULL)
  }
}

###### Parse FlowJO workspace (.wsp flowJO workspace files) ##################################################

#' Return the name and ID of a SampleNode xml_node 
#' from a FlowJO wsp
#' @param x a xml_document object 
#' @import xml2
parseSampleNodes <- function(x){
  name <- xml_text(xml_find_all(x, ".//@name"))[1]
  sampleID <- xml_integer(xml_find_all(x, ".//@sampleID"))[1]
  return(list("name" = name, "sampleID" = sampleID))
}

#' Return the name and IDs of samples in a  GroupNode xml_node
#' from a flowJO wsp
#' @param x a xml_document object
#' @import xml2
parseGroupNodes <- function(x){
  name <- xml_text(xml_find_all(x, ".//@name"))[1]
  sampleID <- xml_integer(xml_find_all(xml_find_all(x, ".//SampleRefs"), ".//@sampleID"))
  return(list("name" = name, "sampleID" = sampleID))
}

#' find, in a recursive manner, all parent gates of a given Gate xml_node
#' from a FlowJO wsp
#' @param x a Gate xml_node from a FlowJO wsp
#' @import xml2
find_all_parent_gates <- function(x){
  all_parents <- NULL
  y <- x
  while(xml_name( xml_parent(xml_parent(xml_parent(y))) ) == "Population"){
    all_parents <- c(xml_text(xml_find_all( xml_parent(xml_parent(xml_parent(y))), ".//@name")[1]), 
                     all_parents)
    y <- xml_parent(xml_parent(xml_parent(y)))
    idx_gate <- which( xml_name( xml_children(y) ) == "Gate")
    if(length(idx_gate)>0){
      y <- xml_children(y)[[idx_gate]]
    }else{
      break
    }
    
  }
  return(all_parents)
}

#' Return the names of all 'groups'
#' from a FlowJO workspace
#' @param ws_path path to the workspace
#' @import xml2
get_groups_from_ws <- function(ws_path){
  ws <- read_xml(ws_path)
  GroupNodes <- xml_find_all(ws, "//GroupNode")
  group_names <- unlist(lapply(GroupNodes, function(x){
    parseGroupNodes(x)$name
    }))
  return(group_names)
}

#' Extract all gates from a FlowJO workspace
#' @param ws_path path to the workspace
#' @param group Names of the sample groups to be considered
#' @import xml2
#' @importFrom flowCore rectangleGate polygonGate
get_gates_from_ws <- function(ws_path, group = NULL){
  
  ws <- read_xml(ws_path)
  
  # get Groups info
  GroupNodes <- xml_find_all(ws, "//GroupNode")
  group_info <- lapply(GroupNodes, parseGroupNodes)
  group_info <- data.frame( do.call(rbind, group_info ) )
  #print(group_info)
  
  # get Samples info
  SampleNodes <- xml_find_all(ws, "//SampleNode")
  sample_info <- lapply(SampleNodes , parseSampleNodes)
  sample_info <- data.frame( do.call(rbind, sample_info ) )
  #print(sample_info)

  if(is.null(group)){
    group_selected <- unlist(group_info$name)[1]
  }else{
    group_selected <- group
  }

  
  # get Gates for first sample in group
  sampleID <- group_info$sampleID[[which(unlist(group_info$name) == group_selected)]][1]
  if(length(sampleID) > 0){
    SampleNode <- SampleNodes[ which(unlist(sample_info$sampleID) == sampleID) ]
  }else{
    stop("Could not find sample in group")
  }
  
  #print(SampleNode)
  gates <- lapply(xml_find_all(SampleNode, ".//Gate"), parseGate)
  
  if(length(gates)==0){
    warning("Could not find gates defined in the first sample of the group")
    return(list())
  }
  
  gate_list <- list()
  
  for(i in 1:length(gates)){
    
    parent <- gates[[i]]$parent_long
    name <- gates[[i]]$name_long
    
    #parent <- gsub(" ", "_", parent)
    #name <- gsub(" ", "_", name)
    
    if(gates[[i]]$type == "RectangleGate"){
      boundaries <- gates[[i]]$boundaries
      g <- flowCore::rectangleGate(.gate = boundaries, filterId = basename(name))
      gate_list[[name]] <- list(gate = g, parent = parent)
    }else if(gates[[i]]$type == "PolygonGate"){
      polygon <- gates[[i]]$polygon
      g <- flowCore::polygonGate(.gate = polygon, filterId = basename(name) )
      gate_list[[name]] <- list(gate = g, parent = parent)
    }else{
      warning(paste("gate type", gates[[i]]$type, "not supported"))
      #g <- NULL
      #gate_list[[name_long]] <- list(gate = g, parent = parent)
    }
    
    
  } 
  return(gate_list)
  
}

#' Return relevant info from a Gate xml_node
#' @param x a Gate xml_node from a FlowJO wsp
#' @import xml2
parseGate <- function(x){
  res <- list()
  
  name <- xml_text( xml_find_all(xml_parent(x), ".//@name")[1] )
  
  if( xml_name( xml_parent(xml_parent(xml_parent(x))) ) == "Population"){
    parent <- xml_text(xml_find_all( xml_parent(xml_parent(xml_parent(x))), ".//@name")[1])
  }else{
    parent <- "root"
  }
  
  # find all parent gates recursively
  all_parents <- find_all_parent_gates(x)
  
  if(length(all_parents)>0){
    parent_long <- paste("/",paste(all_parents, collapse = "/"), sep = "")
  }else{
    parent_long <- "root"
  }
  
  name_long <- paste("/",paste(c(all_parents, name), collapse = "/"), sep = "")
  
  type <- xml_name(xml_child(x))
  dim <- xml_text(xml_find_all(xml_find_all(x, ".//gating:dimension"), ".//@data-type:name"))
  res <- c(res, list("name" = name, 
                     "parent" =  parent, 
                     "name_long" = name_long, 
                     "parent_long" = parent_long, 
                     "type" = type, 
                     "dim" = dim))
  
  if(type == "RectangleGate"){
    min <- xml_double(xml_find_all(x, ".//@gating:min"))
    max <- xml_double(xml_find_all(x, ".//@gating:max"))
    m <- rbind(min, max)
    colnames(m) <- dim
    res <- c(res, list("boundaries" = m))
  }
  if(type == "PolygonGate" ){
    vertexes <- xml_double(
      xml_find_all(
        xml_find_all(x, ".//gating:vertex"), ".//@data-type:value"))
    polygon <- matrix(vertexes, nrow = 2)
    polygon <- t(polygon)
    colnames(polygon) <- res[["dim"]]
    res <- c(res, list("polygon" = polygon))
  }
  return(res)
}

#' Extract spillover matrices from a FlowJO workspace
#' @param ws_path path to the workspace
#' @import xml2
get_spillover_matrices_from_ws <- function(ws_path){
  ws <- read_xml(ws_path)
  spilloverMatrixNodes <- xml_children(xml_find_first(ws, ".//Matrices"))
  spill_list <- lapply(spilloverMatrixNodes, parseSpilloverMatrix)
  spill_names <- unlist(lapply(spilloverMatrixNodes, function(x){as.list(xml_attrs(x))$name}))
  names(spill_list) <- spill_names
  return(spill_list)
}

#' Return the spillover matrix associated with a spilloverMatrix xml_node
#' from a flowJO wsp
#' @param x a spilloverMatrix xml_node from a FlowJO wsp
#' @import xml2
#' @importFrom reshape2 acast
parseSpilloverMatrix <- function(x){
  params_list <- xml_find_all(xml_find_first(x, ".//data-type:parameters"), ".//data-type:parameter")
  parameters <- unlist(lapply(params_list, function(x){as.list(xml_attrs(x))$name}))
  spilloverNodes <- xml_find_all(x, ".//transforms:spillover")
  df_spillover_list <- lapply(spilloverNodes, parseSpillover)
  df_spillover <- do.call(rbind, df_spillover_list)
  compMat <- reshape2::acast(df_spillover, input ~ parameter)
  return(compMat)
}

#' Return the spillover coefficients associated with a spillover xml_node
#' from a flowJO wsp
#' @param x a spillover xml_node from a FlowJO wsp
#' @import xml2
parseSpillover <- function(x){
  parameter <- as.list(xml_attrs(x))$parameter
  coeffNodes <- xml_find_all(x, ".//transforms:coefficient")
  coeffs <- lapply(coeffNodes, function(x){xml_attrs(x)})
  df <- as.data.frame(do.call(rbind, coeffs), stringsAsFactors = FALSE)
  df$input <- parameter
  df$value <- as.numeric(df$value)
  return(df)
}
###### Transformations #########################################################################


#' @importFrom flowWorkspace flowJoTrans flow_trans
flowJo_biexp_inverse_trans <- function (..., n = 6, equal.space = FALSE){
  trans <- flowWorkspace::flowJoTrans(..., inverse = TRUE)
  inv <- flowWorkspace::flowJoTrans(...)
  flow_trans(name = "flowJo_biexp_inverse", trans.fun = trans, inverse.fun = inv, 
             n = n, equal.space = equal.space)
}

#' Scaled hyperbolic arc-sine function
#' @param scale scale parameter
#' @param inverse use inverse function?
asinh_transform <- function(scale=5, inverse = FALSE){
  if(inverse){
    function(x){scale*sinh(x)} 
  }else{
    function(x){asinh(x/scale)} 
  }
}

#' Scaled hyperbolic arc-sine transformation
#' @param ... arguments passed to \code{asinh_transform()}
#' @param n desired number of breaks (see \code{flow_trans()})
#' @param equal.space whether breaks at equal-spaced intervals (see \code{flow_trans()})
#' @importFrom flowWorkspace flow_trans
asinh_trans <- function (..., n = 6, equal.space = FALSE){
  trans <- asinh_transform(...)
  inv <- asinh_transform(..., inverse = TRUE)
  flow_trans(name = "asinh", trans.fun = trans, inverse.fun = inv, 
             n = n, equal.space = equal.space)
}


### Gating #####################################################################################


#' Return coordinates of flowCore gate.
#' @param gate a flowCore gate either from class "polygonGate", "rectangleGate" or 
#' "ellipsoidGate"
get_gate_coordinates <- function(gate){
  
  polygon <- NULL
  
  if(class(gate) == "polygonGate" ){
    if(length(unique(colnames(gate@boundaries)))>1){
      polygon <- as.data.frame(gate@boundaries)
    }
  }else if(class(gate) == "rectangleGate"){
    if(length(gate@min)>1){
      polygon <- data.frame(x = c(gate@min[1], gate@max[1], gate@max[1], gate@min[1]),
                            y = c(gate@min[2], gate@min[2], gate@max[2], gate@max[2]))
    }else{
      polygon <- data.frame(x = c(gate@min[1], gate@max[1]))
    }
    colnames(polygon) <- names(gate@min)
    
  }else if(class(gate) == "ellipsoidGate"){
    cov <- gate@cov
    mean <- gate@mean
    polygon <- ellipse_path(cov = cov, mean = mean)
  }else{
    warning("gate format not supported")
  }
  
  return(polygon)
  
}

#' Return coordinates of points along an ellipse defined by its 
#' covariance matrix and its center
#' @param cov covariance matrix
#' @param mean coordinates of the center of the ellipse
#' @param n number of points to return along the ellipse
#' @return a data.frame with point cordinates
ellipse_path <- function(cov, mean, n = 100){
  
  eg <- eigen(cov)
  a <- sqrt(eg$values[1])
  b <- sqrt(eg$values[2])
  alpha <- acos(eg$vectors[1,1])
  
  x <- NULL
  y <- NULL

  for(i in 1:(n+1)){
    theta <- (i-1)*pi*2/n
    xr <- a*cos(theta)
    yr <- b*sin(theta)
    x <- c(x, cos(alpha)*xr - sin(alpha)*yr + mean[1])
    y <- c(y, sin(alpha)*xr + cos(alpha)*yr + mean[2])
  }
  
  df <- data.frame(x = x, y= y)
  names(df)[1:2] <- colnames(cov)
  
  return(df)
}

#' Return all descendants from a set of nodes in a tree
#' @param named_list a list representing a tree. It must be named 
#' according to tree node names and each of its element must have a field 'parent' 
#' containing the name of its parent node.
#' @param names Names of the nodes for which all descendants must be returned
get_all_descendants <- function(named_list, names){
  
  parents <- sapply(named_list, function(x){x$parent}) 
  children <- names(named_list)[parents %in% names]
  children_all <- children
  while(length(children)>0){
    children <- get_all_descendants(named_list, children)
    children_all <- unique(c(children_all, children))
  }
  return(children_all)
  
}

#' Return all ancestors from a set of nodes in a tree
#' @param named_list a list representing a tree. It must be named 
#' according to tree node names and each of its element must have a field 'parent' 
#' containing the name of its parent node.
#' @param names Names of the nodes for which all ancestors must be returned
get_all_ancestors <- function(named_list, names){
  
  parents <- sapply(named_list, function(x){x$parent}) 
  parents <- unlist(parents[names(named_list) %in% names])
  parents_all <- parents
  while(length(parents)>0){
    parents <- get_all_ancestors(named_list, parents)
    parents_all <- unique(c(parents_all, parents))
  }
  return(parents_all)
  
}

#' Get all gate names from a GatingHierarchy
#' @param gh a GatingHierarchy
#' @importFrom flowWorkspace gs_pop_get_children
gh_get_gate_names <- function(gh){
  children <- flowWorkspace::gs_pop_get_children(gh, "root")
  children_all <- c("root", children)
  while(length(children)>0){
    children <- unlist(sapply(children, 
                       function(x){flowWorkspace::gs_pop_get_children(gh, x)}))
    children_all <- unique(c(children_all, children))
  }
  return(children_all)  
}

#' Build a gating hierarchy from a GatingSet
#' @param gs a GatingSet
#' @return a named list representing the gating hierarchy. 
#' Each element has a field 'gate' with a flowCore filter object 
#' and a field 'parent' with the name of its parent gate.
#' @importFrom flowWorkspace gs_get_pop_paths gh_pop_get_gate gs_pop_get_parent
get_gates_from_gs <- function(gs){
  
  nodes <- gh_get_gate_names(gs[[1]])
  
  nodes <- gh_get_gate_names(gs[[1]])
  
  gates <- list()
  
  for(node in setdiff(nodes, "root")){
    g <- flowWorkspace::gs_pop_get_gate(gs, node)
    parent <- flowWorkspace::gs_pop_get_parent(gs, node)
    gates[[node]] <- list(gate = g, parent = parent)
  } 
  
  return(gates)
}

#' Add gates from a gating hierarchy to a GatingSet
#' @param gs a GatingSet
#' @param gates a named list representing the gating hierarchy. 
#' Each element must have a field 'gate' with a flowCore filter object 
#' and a field 'parent' with the name of its parent gate.
#' @importFrom flowWorkspace gs_get_pop_paths gs_pop_add recompute colnames
add_gates_flowCore <- function(gs, gates){
  
  #print(sampleNames(gs))
  
  #gates are expected to share the same hierarchy and dimensions across samples
  # so focus only on the first sample
  new_gates_name <- setdiff(names(gates), gh_get_gate_names(gs[[1]]))
  if(length(new_gates_name)==0){
    warning("All gates already exist in GatingSet. No gates added")
    return(gs)
  }
  if(!setequal(new_gates_name, names(gates))){
    warning(paste("Some of the gates already exist in GatingSet. Adding only ", 
                  paste(new_gates_name, collapse = ", ")))
  }
  gates <- gates[new_gates_name]
  
  ngates <- length(gates)

  
  if(ngates>0){
    
    idx <- 1:ngates
    
    while(length(idx)>0){
      
      i_added <- NULL
      
      for(i in 1:length(idx)){
        
        g <- gates[[idx[i]]]

        print("gate check")
        print(g)
        
        if(g$parent %in% union(gh_get_gate_names(gs[[1]]), "root") ){
          if(class(g$gate) == "list"){
            
            # check that all samples have a gate defined
            samples_to_gate <- intersect(names(g$gate), flowWorkspace::sampleNames(gs))
            if(!setequal(samples_to_gate, flowWorkspace::sampleNames(gs))){
              stop("Names of gates do not match sample names")
            }else{
              g$gate <- g$gate[samples_to_gate]
            }
            
            first_gate <- g$gate[[1]]
          }else{
            first_gate <- g$gate
          }
          gate_class <- class(first_gate)
          pass_check <- FALSE
          if(gate_class != "booleanFilter"){
            if( !is.null(names(first_gate@parameters)) & 
                length( setdiff( names(first_gate@parameters), flowWorkspace::colnames(gs@data)) ) == 0 ){
                pass_check <- TRUE
            }else{
              warning("Could not find gate parameters in flowData")
            }
          }else{
            pass_check <- TRUE
          }
          
          if(pass_check){
            flowWorkspace::gs_pop_add(gs = gs,
                                      gate = g$gate,
                                      parent = g$parent,
                                      name = first_gate@filterId)
          }
          
          i_added <- c(i_added, i)
        }
      }
      if(!is.null(i_added)){
        idx <- idx[-i_added]
      }else{
        break
      }
      
    }
    flowWorkspace::recompute(gs)
  }
  
  return(gs)
}


#' Transform gates coordinates and modify names of parameters.
#' @param gates a named list representing the gating hierarchy.
#' @param transformation A list of trans objects.
#' Each element must be named after a parameter and contain the transfomation 
#' to apply for this parameter.
#' @param pattern pattern to be replaced in the names of gate coordinates
#' @param replacement Character string that is to replace 'pattern' in in the 
#' names of gate coordinates
#' @param time_step value of the time step used to transform gates with 
#' the 'Time' parameter. Ignored if NULL.
#' @importFrom flowCore polygonGate rectangleGate
transform_gates <- function(gates,
                            transformation = NULL, 
                            pattern = "[\\<|\\>]",
                            replacement = "",
                            time_step = NULL ){
  
  # transform gate coordinates
  
  ngates <- length(gates)
  
  if(ngates>0){
    
    for(i in 1:ngates){
      
      g <- gates[[i]]
      
      if(class(g$gate) == "polygonGate"){
        
        polygon <- g$gate@boundaries
        if(!is.null(pattern)){
          colnames(polygon) <- gsub(pattern = pattern, 
                                    replacement = replacement, 
                                    colnames(polygon))
        }
        
        if(!is.null(time_step)){
          idx_time <- grep("^Time", colnames(polygon))
          if(length(idx_time)>0){
            for(j in idx_time){
              polygon[,j] <- polygon[,j]/time_step
            }
          }
        }
        
        if(!is.null(transformation)){
          for(j in 1:length(colnames(polygon))){
            if(colnames(polygon)[j] %in% names(transformation)){
              polygon[,j] <- transformation[[colnames(polygon)[j]]]$transform(polygon[,j])
            }
          }
        }

        
        trans_gate <- flowCore::polygonGate(.gate = polygon, filterId=g$gate@filterId)
      }
      
      if(class(g$gate) == "rectangleGate"){
        
        polygon <- rbind(g$gate@min, g$gate@max)
        if(dim(polygon)[2]==1){
          colnames(polygon) <- names(g$gate@parameters)
        }
        if(!is.null(pattern)){
          colnames(polygon) <- gsub(pattern = pattern,
                                    replacement = replacement,
                                    colnames(polygon))
        }

        if(!is.null(time_step)){
          idx_time <- grep("^Time", colnames(polygon))
          if(length(idx_time)>0){
            for(j in idx_time){
              polygon[,j] <- polygon[,j]/time_step
            }
          }
        }
        
        if(!is.null(transformation)){
          for(j in 1:length(colnames(polygon))){
            if(colnames(polygon)[j] %in% names(transformation)){
              polygon[,j] <- transformation[[colnames(polygon)[j]]]$transform(polygon[,j])
            }
          }
        }
        
        trans_gate <- flowCore::rectangleGate(.gate = polygon, filterId=g$gate@filterId)
      }
      
      if(class(g$gate) == "ellipsoidGate"){
        
        cov <- g$gate@cov
        mean <- g$gate@mean
        polygon <- as.matrix(ellipse_path(cov = cov, mean = mean))
        
        if(!is.null(pattern)){
          colnames(polygon) <- gsub(pattern = pattern, 
                                    replacement = replacement, 
                                    colnames(polygon))
        }

        if(!is.null(time_step)){
          idx_time <- grep("^Time", colnames(polygon))
          if(length(idx_time)>0){
            for(j in idx_time){
              polygon[,j] <- polygon[,j]/time_step
            }
          }
        }
        
        if(!is.null(transformation)){
          for(j in 1:length(colnames(polygon))){
            if(colnames(polygon)[j] %in% names(transformation)){
              polygon[,j] <- transformation[[colnames(polygon)[j]]]$transform(polygon[,j])
            }
          }
        }
        trans_gate <- flowCore::polygonGate(.gate = polygon, filterId=g$gate@filterId)
      }
      
      gates[[i]] <- list(gate = trans_gate, parent = g$parent)
    }
    
  }
  
  return(gates)
  
}

#' Copy a gate and its children as children of another parent gate(optionnal)
#' @param gs a GatingSet
#' @param name name of the gate to copy
#' @param parent name of the parent gate
#' @param copy_children_gates logical. Should children gates be copied as well 
#' (the hierarchy of children gates will be conserved)
copy_gate <- function(gs, name, parent, copy_children_gates = TRUE){
  
  gates <- get_gates_from_gs(gs)
  
  preffix <- ifelse(parent == "root", "/", parent)
  
  new_name <- paste(preffix, basename(name), sep = "/")
  gate <- list()
  gate[[new_name]] <- gates[[name]]
  gate[[new_name]]$parent <- parent
  
  if(copy_children_gates){
    children <- get_all_descendants(gates, name)
    children_gates <- gates[children]
    children_gates <- lapply(children_gates, function(x){
      x$parent <- gsub(pattern = name, 
                       replacement = new_name, 
                       x = x$parent, 
                       fixed = TRUE)
      return(x)
    })
    names(children_gates) <- gsub(pattern = name, 
                                  replacement = new_name, 
                                  x = names(children_gates), 
                                  fixed = TRUE)
    add_gates_flowCore(gs, c(gate, children_gates))
  }else{
    add_gates_flowCore(gs, gate)
  }
  
  return(gs)
}

### Getting data ###############################################################################

#' Get parameters from a GatingSet
#' @param gs a GatingSet
#' @return a list
#' @importFrom flowWorkspace pData gs_get_pop_paths sampleNames
#' @importFrom flowCore parameters
#' @export
get_parameters_gs <- function(gs){
  
  ff <- gs@data[[1]]
  pdata <- flowWorkspace::pData(gs)
  params <- flowCore::parameters(ff)@data
  params$name <- as.character(params$name)
  params$desc <- as.character(params$desc)
  
  params$display <- unlist(sapply(rownames(params), FUN = function(x){
    kw <- substr(x, start = 2, stop = nchar(x))
    kw <- paste(kw, "DISPLAY", sep = "")
    disp <- ff@description[[kw]]
    if(is.null(disp)){
      disp <- "NA"
    }
    return(disp)
  }))
  
  
  params$vartype <- unlist(sapply(rownames(params), FUN = function(x){
    kw <- paste(x, "VARTYPE", sep = "")
    vartype <- ff@description[[kw]]
    if(is.null(vartype)){
      vartype <- "numeric"
    }
    return(vartype)
  }))
  
  axis_limits <- lapply(1:length(params$name), function(x){
    return(as.numeric(c(params$minRange[x], params$maxRange[x])))})
  
  labels <- sapply(1:length(params$name), function(x){
    if(is.na(params$desc[x])){
      params$name[x]
    }else{
      paste(params$name[x], "(", params$desc[x], ")")
    }
  })
  
  plot_var <- params$name
  names(plot_var) <- labels
  names(labels) <- params$name
  names(axis_limits) <- params$name
  
  return( 
    list(sample = flowWorkspace::sampleNames(gs),
         subset = gh_get_gate_names(gs[[1]]),
         plot_var = plot_var,
         labels = labels,
         axis_limits = axis_limits,
         metadata = pdata,
         params = params,
         meta_var = names(pdata),
         transformation = gs@transformation,
         compensation = lapply(gs@compensation, as.matrix),
         gates = get_gates_from_gs(gs)
    )
  )
}  

#' Return a flowSet from a given subset in a GatingSet
#' @param gs a GatingSet
#' @param spill spillover matrix. If NULL, uncompensated data is used for gating
#' @param subset Name of the subset
#' @importFrom flowWorkspace GatingSet gs_pop_get_data sampleNames
#' @importFrom flowCore compensate
gs_get_fs_subset <- function(gs, spill = NULL, subset){
  
  fs <- gs@data[flowWorkspace::sampleNames(gs)]
  gates <- get_gates_from_gs(gs) 
  
  if(!is.null(spill)){
      if(all(sampleNames(fs) %in% names(spill))){
        fs <- flowCore::compensate(fs, spill)
      }else{
        message("Could not compensate data")
      }
  }
  
  gs_comp <- flowWorkspace::GatingSet(fs)
  gs_comp <- add_gates_flowCore(gs_comp, gates)
  fs_comp <- flowWorkspace::gs_pop_get_data(gs_comp, subset)
  return(fs_comp)
}

#' Return statistics for all subsets ans samples in a GatingSet
#' @param gs a GatingSet
#' @param spill spillover matrix. If NULL, uncompensated data is used for gating
#' @param filter a filter object applied before computing statistics. Ignored if NULL.
#' @importFrom flowCore Subset
#' @importFrom flowWorkspace GatingSet gs_pop_get_count_fast sampleNames
getPopStatsPlus <- function(gs, spill = NULL, filter = NULL){
  
  fs <- gs@data
  gates <- get_gates_from_gs(gs) 
  if(!is.null(filter)){
    fs <- flowCore::Subset(fs, filter)
  }
  
  if(!is.null(spill)){
    fs <- compensate(fs, spill)
  }
  
  gs_comp <- flowWorkspace::GatingSet(fs)
  gs_comp <- add_gates_flowCore(gs_comp, gates)
  df <- flowWorkspace::gs_pop_get_count_fast(gs_comp)
  
  df$name <- sapply(df$name, function(x){strsplit(x, split = "_[0-9]+$")[[1]][1]})
  df_root <- data.frame(name = flowWorkspace::sampleNames(fs))
  df_root$Population <- "root"
  df_root$Count <- sapply(1:length(fs), function(x){dim(fs[[x]]@exprs)[1]})
  df_root$Parent <- NA
  df_root$ParentCount <- NA
  
  df_merge <- rbind(df, df_root)
  df_merge
}

#' Return data from a GatingSet
#' @param gs a GatingSet
#' @param sample Names of samples from the GatingSet 
#' (as returned by \code{pData(gs)$name})
#' @param subset Names of subsets from the GatingSet 
#' (as returned by \code{gh_get_gate_names(gs[[1]])})
#' @param Ncells Maximum number of cells per sample and subset sampled from the GatingSet
#' @param spill spillover matrix. If NULL, uncompensated data is used for gating. 
#' Uncompensated data is returned if parameter 'return_comp_data' is TRUE.
#' @param return_comp_data logical. Should compensated data be returned ?
#' @param updateProgress function used in shiny to update a progress bar
#' @return a data.frame
#' @importFrom flowWorkspace sampleNames gs_get_pop_paths colnames GatingSet gh_pop_get_indices pData
#' @importFrom flowCore compensate
get_data_gs <- function(gs,
                        sample = NULL,
                        subset = NULL,
                        Ncells = NULL,
                        spill = NULL,
                        return_comp_data = TRUE,
                        updateProgress = NULL
){
  
  if(is.null(sample)){sample <- flowWorkspace::sampleNames(gs)}
  if(is.null(subset)){subset <- gh_get_gate_names(gs[[1]])}
  
  #idx <- which(sample %in% flowWorkspace::sampleNames(gs))
  idx <- match(sample, flowWorkspace::sampleNames(gs))
  idx <- idx[!is.na(idx)]
  
  if(length(idx) == 0){
    return(NULL)
  }
  
  gs_comp <- gs
  
  
  if(!is.null(spill)){
    
    if( setequal(names(spill),  flowWorkspace::sampleNames(gs)) ){
      gates <- get_gates_from_gs(gs)
      fs <- gs@data[idx]
      fs <- flowCore::compensate(fs, spill[idx])
      gs_comp <- flowWorkspace::GatingSet(fs)
      gs_comp <- add_gates_flowCore(gs_comp, gates)
    }
   
  }
  
  df <- list()
  count <- 0
  
  for(i in 1:length(idx)){
    
    for(k in 1:length(subset)){
      
      idx_subset <- NULL
      if(!is.null(spill)){
        idx_comp <- match(flowWorkspace::sampleNames(gs)[idx[i]], 
                          flowWorkspace::sampleNames(gs_comp))
      }
      
      if(subset[k] != "root"){
        if(!is.null(spill)){
          idx_subset <- flowWorkspace::gh_pop_get_indices(gs_comp[[idx_comp]], subset[k])
        }else{
          idx_subset <- flowWorkspace::gh_pop_get_indices(gs[[idx[i]]], subset[k])
        }
      }
      
      if(return_comp_data & !is.null(spill) ){
        ff <- gs_comp@data[[idx_comp]]
      }else{
        ff <- gs@data[[idx[i]]]
      }
      

      df_int <- as.data.frame(ff@exprs)
      if(!is.null(idx_subset)){
        df_int <- df_int[idx_subset, ]
      }

      
      
      if(dim(df_int)[1]>0){
        
        df_int[["name"]] <- flowWorkspace::sampleNames(gs)[idx[i]]
        df_int[["subset"]] <- subset[k]
        #df <- rbind(df, df_int)
        
        if(!is.null(Ncells)){
          if(Ncells < dim(df_int)[1]){
            df_int <- df_int[sample(1:dim(df_int)[1], Ncells, replace = FALSE), ] 
          }
        }
        count <- count + 1
        df[[count]] <- df_int
      }
      
      
      if(is.function(updateProgress)){
        value <- count / (length(subset)*length(idx))*100
        updateProgress(value = value, detail = paste(format(value, digits=0), "%", sep = ""))
      }
        
        
      
      
    }
  }
  
  df_tot <- do.call(rbind, df)
  df_tot[["subset"]] <- factor(df_tot[["subset"]], levels = subset)
  df_tot[["name"]] <- factor(df_tot[["name"]], levels = flowWorkspace::sampleNames(gs)[idx])
  
  if(length(df_tot[["name"]]) > 0){
    return(df_tot)
  }else{
    return(NULL)
  }
  
}

#' Add metadata columns
#' @description  Add metadata columns
#' @param df data.frame with a column \code{name} used to map metadata.
#' Metadata should also contain a column \code{name}
#' @param metadata a data.frame containing metadata associated to samples. 
#' Must have a column \code{name} used for mapping.
#' @return a data.frame with additional columns
add_columns_from_metadata <- function(df,
                                      metadata
                                      ){

  
  if(! "name" %in% names(df)){
    warning("Could not find column 'name' in data.frame. No metadata added.")
    return(df)
  }
  
  new_vars <- unique(setdiff(names(metadata), names(df)))
  
  if(length(new_vars)>0){
    for(variable in new_vars){
      df[[variable]] <- metadata[[variable]][match(df[["name"]], metadata$name)]
    }
  }

  return(df)
}

#' @importFrom reshape2 melt dcast
#' @importFrom scales identity_trans log_trans
#' @importFrom stats as.formula
#' @importFrom dplyr rename
compute_stats <- function(df = NULL,
                          gs = NULL,
                          spill = NULL,
                          transformation=NULL,
                          stat_function = "mean",
                          y_trans = identity_trans(),
                          apply_inverse = TRUE,
                          yvar = NULL,
                          var_names = NULL,
                          id.vars = c("name", "subset")
){
  
  inverse <- NULL
  
  if(is.null(yvar)){
    yvar <- setdiff(names(df), id.vars)
  }
  
  custom_name <- NULL
  
  if(stat_function == "GeoMean"){
    y_trans = scales::log_trans()
    apply_inverse = TRUE
    stat_function = "mean"
    custom_name <- "GeoMean"
    warning("Note that negative values will be discarded when computing the geometric mean")
  }
  
  if(stat_function == "median"){
    y_trans = scales::identity_trans()
    apply_inverse = FALSE
  }
  
  if(is.null(var_names)){
    var_names <- yvar
    names(var_names) <- yvar
  }
  
  if(! stat_function %in% c("cell count", "percentage")){
    if(!is.null(yvar)){
      
      if(!is.null(y_trans)){
        transformation <- lapply(yvar, function(x){y_trans})
        names(transformation) <- yvar
      }
      
      
      for(i in 1:length(yvar)){
        df[[yvar[i]]] <- transformation[[yvar[i]]]$transform(df[[yvar[i]]])
      }
      
      
      df_melt <- reshape2::melt(df, id.vars = id.vars, measure.vars = yvar)
      df_melt <- df_melt[is.finite(df_melt$value), ]
      
      
      stat.fun <- function(...){do.call(stat_function, args = list(...))}
      df_cast <- reshape2::dcast(df_melt, 
                                 formula = stats::as.formula(
                                   paste(
                                     paste(id.vars, collapse = " + "), 
                                     " ~ variable", 
                                     sep ="")), 
                                 fun.aggregate =  stat.fun, 
                                 na.rm = TRUE)
      
      if(apply_inverse){
        for(i in 1:length(yvar)){
          df_cast[[yvar[i]]] <- transformation[[yvar[i]]]$inverse(df_cast[[yvar[i]]])
          if(transformation[[yvar[i]]]$name != "identity"){
            inverse <- "inverse"
          }
        }
      }
      
      
      # for(i in 1:length(yvar)){
      #   idx <- which(names(df_cast) == yvar[i])
      #   trans_name <- NULL
      #   if(transformation[[yvar[i]]]$name != "identity"){
      #     trans_name <- transformation[[yvar[i]]]$name
      #   }
      #   if(is.null(custom_name)){
      #     names(df_cast)[idx] <- paste(stat_function, trans_name, inverse, var_names[[i]])
      #   }else{
      #     names(df_cast)[idx] <- paste(custom_name,  var_names[[i]])
      #   }
      #   
      # }
      
      
    }
    
  }else{
    if(!is.null(gs)){
      variable <- switch(stat_function,
                         "cell count" = "Count",
                         "percentage" = "perc_parent")
      
      df_pop_stat <- as.data.frame(getPopStatsPlus(gs, spill = spill))
      df_pop_stat <- dplyr::rename(df_pop_stat, subset = "Population")
      df_pop_stat[['perc_parent']] <- df_pop_stat$Count / df_pop_stat$ParentCount * 100
      df_cast <- df_pop_stat[c("name", "subset", variable)]
      
      df_cast <- df_cast[df_cast$name %in% unique(as.character(df$name)) & 
                           df_cast$subset %in% unique(as.character(df$subset)), ]
      
    }
  }
  
  return(df_cast)
  
}

#' Return data used for plotting a GatingSet
#' @param gs a GatingSet
#' @param df data.frame with columns \code{name} and \code{subset} 
#' containing sample and subset names respectively and
#' columns with plot variables. 
#' Ignored if \code{NULL}. 
#' Otherwise supersedes parameters 'gs', 'sample', 'spill', 'metadata'.
#' @param sample Names of samples from the GatingSet 
#' (as returned by \code{pData(gs)$name})
#' @param subset Names of subsets from the GatingSet
#' (as returned by \code{gs_get_pop_paths(gs)})
#' @param Ncells number of cells to sample from the GatingSet
#' @param spill spillover matrix. If NULL, uncompensated data is returned and used for gating.
#' @param metadata a data.frame containing metadata associated to samples.
#' @param vartype named character vector specifying variable type conversion.
#' (either "factor", "integer" or "character")
#' Must have a column \code{name} used for mapping.
#' @importFrom flowWorkspace pData
#' @return a data.frame
get_plot_data <- function(gs,
                          df=NULL, 
                          sample,
                          subset,
                          Ncells = NULL,
                          spill = NULL,
                          metadata = NULL,
                          vartype = NULL){
  
  
  if(is.null(df)){
    df <- get_data_gs(gs = gs,
                      sample = sample,
                      subset = subset,
                      spill = spill,
                      Ncells = Ncells)
  }else{
    df <- df[df$name %in% sample & df$subset %in% subset, ]
  }
  
  if(is.null(metadata) & !is.null(gs)){
    metadata <- flowWorkspace::pData(gs)
  }
  
  if(!is.null(metadata)){
    df <- add_columns_from_metadata(df,
                                    metadata = metadata)
  }
  
  if(!is.null(vartype)){
    for(var in names(vartype)){
      if(vartype[[var]] %in% c("factor", "integer", "character")){
        df[[var]] <- do.call(paste("as.", vartype[[var]], sep = ""), args = list(df[[var]]) )
      }
    }
  }
  
  # if("cluster" %in% names(df)){
  #   df[["cluster"]] <- as.factor(df[["cluster"]])  
  # }
  
  return(df)
  
}


### Plotting ##################################################################################

#' Generates a plot from data
#' @param data data.frame with plot data (as returned by \code{get_plot_data})
#' @param plot_type Name of the type of plot to generate. 
#' Available types are 'hexagonal', 'histogram', 'dots', 'contour' (for single cell data) and 
#' 'heatmap', 'bar', 'tile', 'pca' (for aggregated data). 
#' The plot function corresponding to a given plot type must have the same name 
#' as the plot type with the preffix 'plot_' (for instance 'plot_hexagonal()')
#' @param plot_args list of arguments passed to the plot function
#' @importFrom flowWorkspace pData
#' @return a plot (plot class depends on the plot function)
call_plot_function <- function(data,
                         plot_type,
                         plot_args = list()
                         ){
  # Make sure metadata column 'name' has the correct values 
  #(not the case in the flowAI::Bcells dataset)
  if(class(data) %in% c("ncdfFlowSet", "flowSet")){
    pdata <- flowWorkspace::pData(data)
    pdata$name <- row.names(pdata)
    flowWorkspace::pData(data) <- pdata
  }
  
  p <- do.call(paste("plot", plot_type, sep="_"), 
               list(args = c(list(data=data), plot_args)))

  return(p)
}


### Plots for data with single cell resolution (plotGatingSetInput_module)

#' Generates a hexagonal heatmap of 2d bin counts (see ggplot2::geom_hex)
#' @param args list of arguments. 
#' Mandatory arguments : a data.frame 'df', x and y plot variables 'xvar' and 'yvar'.
#' Other arguments can include :
#' 'bins' : numeric, number of bins, passed to 'ggplot2::geom_hex()'
#' 'use_log10_count' : logical, transform bin counts using log10
#' 'option' : name of the viridis palette
#' @import ggplot2
#' @importFrom ggcyto ggcyto
#' @importFrom viridis scale_fill_viridis
plot_hexagonal <- function(args = list()){
  
  plot_type <- "hexagonal"
  max_nrow_to_plot <- Inf
  bins <- 100
  use_log10_count <- TRUE
  option <- "viridis"
  if(length(unlist(args[c("xvar", "yvar")])) != 2 ){
    warning("Incorrect dimensions")
    return(NULL)
  }
  
  for(var in names(args)){
    assign(var, args[[var]])
  }
  
  if(class(data) %in% c("ncdfFlowSet", "flowSet")){
    stop("Plot type not supported for flowSet objects")
    # p <- ggcyto::ggcyto(data,
    #                     aes_string(x = as.name( xvar ),
    #                                y = as.name( yvar )),
    #                     max_nrow_to_plot = max_nrow_to_plot)
  }else{
    p <- ggplot(data,
                        aes_(x = as.name( xvar ), 
                             y = as.name( yvar ) ) )
  }
  
  #p <- p + coord_cartesian()
  p <- p + geom_hex(bins = bins)
  
  if(use_log10_count){
    p <- p + scale_fill_viridis(trans = log10_trans(), option = option)
  }else{
    p <- p + scale_fill_viridis(option = option)
  }
  
  p
}

#' Generates an histogram or a density plot
#' @param args list of arguments. 
#' Mandatory arguments : a data.frame 'df', x plot variable 'xvar'.
#' Other arguments can include :
#' 'color_var' : variable used for the aesthetic 'color'
#' 'group_var' : variable used for the aesthetic 'group'
#' 'smooth' : logical. Should a density plot be generated?
#' 'ridges': logical. Ignored if 'smooth' is FALSE. Shift different density plots according to 'yridges_var'
#' 'yridges_var' : variable used for the aesthetic 'y' in 'geom_density_ridges'. Ignored if 'ridges' is FALSE. 
#' 'norm_density' : logical. Set maximal y value to 1?
#' 'bins' : number of bins.
#' (If 'smooth' is TRUE, the inverse of 'bins' is used as the value for the bandwidth parameter 'bw')
#' 'alpha' : transparency (between 0 and 1)
#' @import ggplot2
#' @importFrom ggcyto ggcyto
#' @importFrom ggridges geom_density_ridges
plot_histogram <- function(args = list()){
  
  plot_type <- "histogram"
  
  max_nrow_to_plot = Inf
  color_var <- NULL
  group_var <- NULL
  smooth <- FALSE
  ridges <- FALSE
  yridges_var <- "name"
  norm_density <- TRUE
  bins <- 100
  alpha <- 0.25
  
  if(is.null(args["xvar"])){
    warning("Incorrect dimensions")
    return(NULL)
  }
  
  for(var in names(args)){
    assign(var, args[[var]])
  }
  

  if(class(data) %in% c("ncdfFlowSet", "flowSet")){
    p <- ggcyto::ggcyto(data,
                        aes_(x = as.name( xvar )),
                        max_nrow_to_plot=max_nrow_to_plot)
    df <- data.frame(exprs(data[[1]]), check.names = FALSE)
  }else{
    p <- ggplot(data, aes_(x = as.name( xvar )))
    df <- data
  }
  
  
  
  if(typeof(df[[xvar]])!= "double"){
    warning("Cannot plot histogram : x variable is not continuous.")
    return(NULL)
  }
    
  if(norm_density){
      stat_var <- "stat(ndensity)"
  }else{
      stat_var <- "stat(density)"
    
  }
  
  if(!is.null(color_var)){
    if(color_var == "none"){
      color_var <- NULL
    }
  }
  
  if(!is.null(color_var)){
    if(color_var %in% names(df)){
      color_var <- as.name(color_var)
    }
  }
  
  if(!is.null(group_var)){
    if(group_var == "none"){
      group_var <- NULL
    }
  }
  
  if(!is.null(group_var)){
    if(group_var %in% names(df)){
      group_var <- as.name(group_var)
    }
  }
  
  if(!is.null(yridges_var)){
    if(yridges_var %in% names(df)){
      yridges_var <- as.name(yridges_var)
    }
  }

  if(smooth){
    if(ridges){
      p <- p + geom_density_ridges(mapping = aes_string(fill = color_var, 
                                                        color = color_var, 
                                                        group = group_var,
                                                        y = yridges_var, 
                                                        height = stat_var), 
                                   alpha = alpha, 
                                   bw = 1/bins, 
                                   stat = "density")
    }else{
      p <- p + geom_density(mapping = aes_string(fill = color_var, 
                                                 color = color_var, 
                                                 group = group_var,
                                                 y = stat_var), 
                            alpha = alpha,
                            bw = 1/bins)
    }
  }else{
    p <- p + geom_histogram(mapping = aes_string(fill = color_var, 
                                                 color = color_var, 
                                                 group = group_var,
                                                 y = stat_var), 
                            alpha = alpha,  
                            bins = bins,
                            position = "identity",
                            boundary = 0
                            ) 
  }
  
  return(p)
  
}

#' Generates a dot plot
#' @param args list of arguments. 
#' Mandatory arguments : a data.frame 'df', x and y plot variable 'xvar' and 'yvar'.
#' Other arguments can include :
#' 'color_var' : variable used for the aesthetic 'color'
#' 'group_var' : variable used for the aesthetic 'group'
#' 'alpha' : dot transparency (between 0 and 1)
#' 'size' : dot size
#' 'show_label' : logical; add labels for each group (as defined by 'id.vars')
#' 'id.vars' : variable defining groups for which a label should be displayed 
#' (superseded by 'color_var' and 'group_var')
#' @import ggplot2
#' @importFrom ggcyto ggcyto
#' @importFrom ggrepel geom_label_repel
#' @importFrom ggpointdensity geom_pointdensity
plot_dots <-function(args = list()){
  
  plot_type <- "dots"
  
  transform_function <- "identity"
  max_nrow_to_plot <- Inf
  adjust <- 1
  use_pointdensity <- FALSE
  id.vars <- NULL
  show_label <- FALSE
  color_var <- NULL
  group_var <- NULL
  alpha <- 0.1
  size <- 0.1
  pch <- 16
  
  if(length(unlist(args[c("xvar", "yvar")])) != 2 ){
    warning("Incorrect dimensions")
    return(NULL)
  }
  
  for(var in names(args)){
    assign(var, args[[var]])
  }
  
  if(class(data) %in% c("ncdfFlowSet", "flowSet")){
    df <- data.frame(exprs(data[[1]]), check.names = FALSE)
  }else{
    df <- data
  }
  
  if(!is.null(color_var)){
    if(color_var == "none"){
      color_var <- NULL
    }else if(color_var == "density"){
      use_pointdensity <- TRUE
    }
    else{
      if(color_var %in% names(df)){
        id.vars <- color_var
      }
    }
  }
  
  if(!is.null(color_var)){
    if(color_var %in% names(df)){
      color_var <- as.name(color_var)
    }
  }
  
  if(!is.null(group_var)){
    if(group_var == "none"){
      group_var <- NULL
    }else{
      if(group_var %in% names(df)){
        id.vars <- group_var
      }
    }
  }
  
  if(!is.null(group_var)){
    if(group_var %in% names(df)){
      group_var <- as.name(group_var)
    }
  }
  
  mapping <- aes_string(x = as.name( xvar ),
                  y = as.name( yvar ),
                  colour = color_var,
                  group = group_var)
  
  if(use_pointdensity){
    mapping <- aes_string(x = as.name( xvar ),
                          y = as.name( yvar ))
  }
  
  if(class(data) %in% c("ncdfFlowSet", "flowSet")){
    p <- ggcyto::ggcyto(data = data, mapping=mapping, max_nrow_to_plot=max_nrow_to_plot)
  }else{
    p <- ggplot(data, mapping) 
  }
  
  if(use_pointdensity){
    adjust_default <- sapply(max(df[[xvar]]), transform_function)/30
    p <- p + ggpointdensity::geom_pointdensity(alpha = alpha, 
                                               size = size,
                                               adjust = adjust_default * adjust)
  }else{
    p <- p +  geom_point(alpha = alpha,
                          size = size, pch=pch)
  }
  

  if(show_label & ! class(data) %in% c("ncdfFlowSet", "flowSet")){
    df_stat <- compute_stats(df = df,
                             stat_function = "median",
                             yvar = c(xvar, yvar),
                             id.vars = id.vars)

    p <- p + geom_label_repel(mapping = aes_string(x = as.name( xvar ),
                                                  y = as.name( yvar ),
                                                  color = id.vars,
                                                  label = id.vars),
                             data = df_stat,
                             fill = "white")
  }
  
  return(p)
  
}

#' Generates a contour plot
#' @param args list of arguments. 
#' Mandatory arguments : a data.frame 'df', x and y plot variable 'xvar' and 'yvar'.
#' Other arguments can include :
#' 'color_var' : variable used for the aesthetic 'color'
#' 'group_var' : variable used for the aesthetic 'group'
#' 'show_outliers' : logical; Display all cells in the background
#' 'fill' : fill parameter for contour plot (passed to 'ggplot2::stat_density_2d()')
#' 'bins' : number of grid points in each direction. (passed as parameter 'n' to 'ggplot2::geom_density_2d()')
#' 'alpha' : contour line transparency (between 0 and 1). If 'show_outliers' is TRUE, used to set outliers dot transparency.
#' 'size' : contour line size. If 'show_outliers' is TRUE, used to set outliers dot size.
#' @import ggplot2
#' @importFrom ggcyto ggcyto
plot_contour <-function(args = list()){
  
  plot_type <- "contour"

  max_nrow_to_plot <- Inf
  color_var <- NULL
  group_var <- NULL
  
  bins <- 50
  breaks <- 10^(seq(from = -1.5, to = 0, length.out = 30))
  alpha <- 0.75
  size <- 0.2
  show_outliers <- FALSE
  pch <- 16
  
  if(length(unlist(args[c("xvar", "yvar")])) != 2 ){
    warning("Incorrect dimensions")
    return(NULL)
  }
  
  for(var in names(args)){
    assign(var, args[[var]])
  }
  
  if(class(data) %in% c("ncdfFlowSet", "flowSet")){
    df <- data.frame(exprs(data[[1]]), check.names = FALSE)
  }else{
    df <- data
  }
  
  if(!is.null(color_var)){
    if(color_var == "none" ){
      color_var <- NULL
    }
  }
  
  if(!is.null(color_var)){
    if(color_var %in% names(df)){
      color_var <- as.name(color_var)
    }
  }
  
  if(!is.null(group_var)){
    if(group_var == "none"){
      group_var <- NULL
    }
  }
  
  if(!is.null(group_var)){
    if(color_var %in% names(df)){
      group_var <- as.name(group_var)
    }
  }
  
  if(class(data) %in% c("ncdfFlowSet", "flowSet")){
    p <- ggcyto::ggcyto(data,
                aes_string(x = as.name( xvar ),
                           y = as.name( yvar ),
                           colour = color_var,
                           group = group_var),
                max_nrow_to_plot = max_nrow_to_plot)
  }else{
    p <- ggplot(data,
                aes_string(x = as.name( xvar ),
                           y = as.name( yvar ),
                           colour = color_var,
                           group = group_var))
  }
  
  if(show_outliers){
    p <- p + geom_point(size = size, alpha = alpha, pch = pch)
    size <- 0.1
    alpha <- 1
  }
  
  
  
   if(!is.null(color_var)){
     
     if(show_outliers){
       p <- p + stat_density2d(aes_string(colour = color_var, group = group_var),
                               fill = "white",
                               size=0,
                               geom="polygon",
                               n=bins,
                               contour_var = "ndensity",
                               breaks = breaks
       )
     }
     
    p <- p + geom_density2d(aes_string(colour = color_var, group = group_var),
                            size=size,
                            alpha= alpha,
                            n=bins,
                            contour_var = "ndensity",
                            breaks = breaks
    )
      
   }else{
     if(show_outliers){
       p <- p + stat_density2d(aes_string(group = group_var),
                               fill = "white",
                               size=0,
                               geom="polygon",
                               n=bins,
                               contour_var = "ndensity",
                               breaks = breaks
       )
     }
     
     p <- p + geom_density2d(aes_string(group = group_var),
                             color = "black",
                             size=size,
                             alpha= alpha,
                             n=bins,
                             contour_var = "ndensity",
                             breaks = breaks
     )
    
  }

  return(p)
}


### Plot for aggregated data (plotStatInput_module)

#' Generates a heatmap
#' @param args list of arguments. 
#' Mandatory argument : a data.frame or a matrix 'df'
#' Other arguments can include :
#' 'stat_var' : names of numeric columns to include in the heatmap
#' 'group_var' : name of the column used to order x coordinates
#' 'cluster_y' : logical; cluster y axis variables
#' 'cluster_x' : logical; cluster x axis variables
#' 'show.legend' : logical; show legend
#' 'option' : name of the viridis palette
#' @importFrom viridis viridis
#' @importFrom pheatmap pheatmap
plot_heatmap <-function(args = list()){
  
  plot_type <- "heatmap"
  stat_var <- NULL
  annotation_vars <- NULL
  group_var <- NULL
  cluster_y <- FALSE
  cluster_x <- FALSE
  show.legend <- TRUE
  option <- "viridis"
  
  if(is.null(args["df"])){
    return(NULL)
  }
  
  for(var in names(args)){
    assign(var, args[[var]])
  }
  
  df <- as.data.frame(df)
  
  labels_col <- 1:dim(df)[1]
  
  if(!is.null(group_var)){
    df <- df[order(df[[group_var[1]]]), ]
    #labels_col <- df$group_var
  }
  
  row.names(df) <- 1:dim(df)[1]

  
  if(is.null(annotation_vars)){
    annotation_vars <- c("name", "subset")
  }
  idx <- which(names(df) %in% annotation_vars)
  idx_annot <- idx
  
  df_stat <- df[-idx]
  
  if(!is.null(stat_var)){
    df_stat <- df_stat[which(names(df_stat) %in% stat_var)]
  }else{
    df_stat <- df_stat[which(sapply(df_stat, is.numeric))]
  }
  
  annotation <- df[idx_annot]
  
  df_plot <- t(df_stat)
  colnames(df_plot) <- 1:dim(df_plot)[2]
  
  if(dim(df_plot)[1]<2){
    cluster_y <- FALSE
  }
  if(dim(df_plot)[2]<2){
    cluster_x <- FALSE
  }
  
  p <- pheatmap(df_plot, show_colnames = FALSE, 
                color = viridis(16, option = option),
                labels_col = labels_col,
                scale = "none",
                annotation_col = annotation,
                cluster_rows = cluster_y,
                cluster_cols = cluster_x,
                legend = show.legend
  )
  
  return(p)
}

#' Generates a bar plot
#' @param args list of arguments. 
#' Mandatory argument : a data.frame 'df'
#' Other arguments can include :
#' 'stat_var' : names of numeric columns to include in the plot
#' 'group_var' : name of the column used to define x axis groups
#' 'color_var' : name of the column used for the aesthetic 'color' in 'ggplot2::geom_point()'
#' 'show.legend' : logical; show legend
#' @import ggplot2
#' @importFrom reshape2 melt
plot_bar <-function(args = list()){
  
  plot_type <- "bar"
  stat_var <- NULL
  group_var <- NULL
  color_var <- NULL
  show.legend <- TRUE
  pch <- 16
    
  if(is.null(args["df"])){
    return(NULL)
  }
  
  for(var in names(args)){
    assign(var, args[[var]])
  }
  
  df <- as.data.frame(df)
  
  id.vars <- names(df)[which(!sapply(df, is.numeric))]
  df_melt <- reshape2::melt(df, id.vars = id.vars)
  
  if(is.null(stat_var)){
    stat_var <- names(df)[which(sapply(df, is.numeric))]
  }
  
  if(!is.null(group_var)){
    if(group_var %in% names(df)){
      group_var <- as.name(group_var)
    }
  }
  
  if(!is.null(color_var)){
    if(color_var %in% names(df)){
      color_var <- as.name(color_var)
    }
  }
  
  df_melt <- df_melt[df_melt$variable %in% stat_var, ]
  
  p <- ggplot(df_melt, aes_string(x = group_var, y = "value"))
  
  p <- p + 
    geom_bar(mapping = aes_string(fill = group_var), alpha = 0.5, stat = "summary", fun.y = "mean") + 
    geom_point( mapping = aes_string(colour = color_var), 
                inherit.aes = TRUE, 
                position = position_jitter(width = 0.25, height = 0),
                alpha = 0.5,
                size = 3,
                pch = pch,
                show.legend = show.legend)

  
  return(p)
  
}

#' Generates a tile plot
#' @param args list of arguments. 
#' Mandatory argument : a data.frame 'df'
#' Other arguments can include :
#' 'stat_var' : names of numeric columns to include in the plot
#' 'group_var' : name of the column used to define x axis groups
#' 'show.legend' : logical; show legend
#' 'option' : name of the viridis palette
#' @import ggplot2
#' @importFrom viridis scale_fill_viridis
#' @importFrom reshape2 melt
plot_tile <-function(args = list()){
  
  plot_type <- "tile"
  stat_var <- NULL
  group_var <- NULL
  show.legend <- TRUE
  option <- "viridis"
  
  if(is.null(args["df"])){
    return(NULL)
  }
  
  for(var in names(args)){
    assign(var, args[[var]])
  }
  
  df <- as.data.frame(df)
  
  id.vars <- names(df)[which(!sapply(df, is.numeric))]
  df_melt <- reshape2::melt(df, id.vars = id.vars)
  
  if(is.null(stat_var)){
    stat_var <- names(df)[which(sapply(df, is.numeric))]
  }
  
  if(!is.null(group_var)){
    if(group_var %in% names(df)){
      group_var <- as.name(group_var)
    }
  }

  
  df_melt <- df_melt[df_melt$variable %in% stat_var, ]
  
  p <- ggplot(df_melt, aes_string(x = group_var, y = "variable", fill = "value")) +
    geom_tile(show.legend = show.legend) +
    scale_fill_viridis(option = option)
  
  return(p)
  
}

#' Perform a PCA and plot the result
#' @param args list of arguments. 
#' Mandatory argument : a data.frame 'df'
#' Other arguments can include :
#' 'stat_var' : names of numeric columns used to perform the PCA.
#' All numeric variables are used by default.
#' 'PCx' : x axis variable ("PC1" by default)
#' 'PCy' : y axis variable ("PC2" by default)
#' 'color_var' : name of the column used to color points
#' 'label_var' : name of the column used to label points
#' 'scale' : logical; scale values by variable before performing the PCA
#' @import ggplot2
#' @importFrom ggrepel geom_text_repel
#' @importFrom stats prcomp
plot_pca <-function(args = list()){
  
  plot_type <- "pca"
  PCx <- "PC1"
  PCy <- "PC2"
  stat_var <- NULL
  annotation_vars <- NULL
  color_var <- NULL
  label_var <- "name"
  scale <- FALSE
  pch <- 16
  
  if(is.null(args["df"])){
    return(NULL)
  }
  
  for(var in names(args)){
    assign(var, args[[var]])
  }
  
  df <- as.data.frame(df)
  
  idx <- which(names(df) %in% c("name", "subset", color_var, label_var))
  idx_annot <- idx
  
  df_stat <- df[-idx]
  if(!is.null(stat_var)){
    df_stat <- df_stat[which(names(df_stat) %in% stat_var)]
  }
  
  idx_cols <- which(sapply(df_stat, is.numeric))
  if(length(idx_cols)>1){
    df_stat <- df_stat[ , idx_cols ] 
  }else{
    stop("Not enough numeric variables to perform PCA")
  }
  
  rownames(df_stat) <- 1:dim(df_stat)[1]
  
  annotation <- df[idx_annot]
  rownames(annotation) <- 1:dim(annotation)[1]
  
  pca_res <- stats::prcomp( df_stat, center = scale, scale. = scale)
  
  df_pca <- as.data.frame(pca_res$x)
  df_pca <- cbind(df_pca, annotation[match(row.names(annotation), row.names(df_pca)), ])
  
  if(!is.null(color_var)){
    if(color_var %in% names(df_pca)){
      color_var <- as.name(color_var)
    }
  }
  if(!is.null(label_var)){
    if(label_var %in% names(df_pca)){
      label_var <- as.name(label_var)
    }
  }
  
  p <- ggplot(df_pca, aes_string(x=as.name(PCx), 
                                 y=as.name(PCy),
                                 color = color_var, 
                                 label = label_var)) +
    geom_point(pch=pch) +
    geom_text_repel(show.legend = FALSE)
  
  return(p)
}



### Add plot layers

#' @import ggplot2
#' @importFrom grDevices rgb
#' @importFrom ggrepel geom_label_repel
add_polygon_layer <- function(p,
                             polygon = NULL,
                             idx_selected = NULL,
                             label = NULL){
  
  #if(p$plot_env$plot_type != "histogram" & setequal(names(polygon), c("x", "y"))){
  if(all(c("x", "y") %in% names(polygon))){
    if(!is.null(polygon$x)){
      
      if(length(polygon$x)>0){
        polygon <- data.frame(x = polygon$x, y = polygon$y)
        polygon <- rbind(polygon, polygon[1,])
        

        # adjust plot limits
        layer_info <- layer_scales(p)
        
        update_range_x <- FALSE
        
        if(!is.null(layer_info$x$limits) & 
           "RangeContinuous" %in% class(layer_info$x$range) ){
          
          xrange <- layer_info$x$trans$inverse(layer_info$x$limits)
          if(!is.null(xrange)){
            if(max(polygon$x) > max(xrange)){
              update_range_x <- TRUE
              xrange[2] <- max(polygon$x)
            }
            if(min(polygon$x) < min(xrange)){
              update_range_x <- TRUE
              xrange[1] <- min(polygon$x)
            }
          }
        }
        
        if(update_range_x){
          
          p <- p + scale_x_continuous(name = layer_info$x$name, 
                                      trans = layer_info$x$trans, 
                                      limits = xrange)
          
        }
        
        update_range_y <- FALSE
        
        if(!is.null(layer_info$y$limits) & 
           "RangeContinuous" %in% class(layer_info$y$range) ){
          
          yrange <- layer_info$y$trans$inverse(layer_info$y$limits)
          if(!is.null(yrange)){
            if(max(polygon$y) > max(yrange)){
              update_range_y <- TRUE
              yrange[2] <- max(polygon$y)
            }
            if(min(polygon$y) < min(yrange)){
              update_range_y <- TRUE
              yrange[1] <- min(polygon$y)
            }
          }
        }
        if(update_range_y ){
          
          p <- p + scale_y_continuous(name = layer_info$y$name, 
                                      trans = layer_info$y$trans, 
                                      limits = yrange)
        }
        
        # add polygon layer

        p <- p +
          geom_path(data = polygon, mapping = aes(x=x, y=y), 
                    color = "red", inherit.aes = FALSE) +
          geom_polygon(data=polygon, mapping = aes(x=x, y=y), 
                       inherit.aes = FALSE,
                       fill="red",
                       alpha=0.05) +
          geom_point(data = polygon, mapping = aes(x=x, y=y), 
                     color = "red", inherit.aes = FALSE, alpha = 0.5, size = 2, pch=16) +
          geom_point(data = polygon[length(polygon$x)-1, ], mapping = aes(x=x, y=y), 
                     shape = 21, color = "red", fill = NA, inherit.aes = FALSE, alpha = 0.5, size = 6, pch=16)
        
        if(!is.null(idx_selected)){
          p <- p + geom_point(data = polygon[idx_selected, ], mapping = aes(x=x, y=y), shape = 21,
                              color = "red", fill = "yellow", inherit.aes = FALSE, alpha = 0.5, size = 6, pch=16)
        }
          
        if(!is.null(label)){
          df_label <- data.frame(x=mean(polygon$x), y= mean(polygon$y))
          p <- p +  geom_label_repel(data = df_label, force = 4, inherit.aes = FALSE,
                                     mapping = aes(x=x, y=y), 
                                     label = label, 
                                     fill = grDevices::rgb(1,1,1,0.85), 
                                     color = "red", 
                                     nudge_y = 0, 
                                     nudge_x =0, 
                                     point.padding = 0)
        }
      }
      

    }
    
  }
  return(p)
  
}

#' Add a gate layer to plot
#' @param p a plot
#' @param gate a gate object
#' @importFrom sp point.in.polygon
#' @importFrom rlang quo_get_expr
add_gate <- function(p, gate){
  
  if(is.null(gate)){
    return(p)
  }
  
  polygon <- get_gate_coordinates(gate)
  
  
  xvar <- NULL
  yvar <- NULL
  color_var <- NULL
  
  if("x" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$x)){
      xvar <- as.character(rlang::quo_get_expr(p$mapping$x))
    }
  }
  
  if("y" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$x)){
      yvar <- as.character(rlang::quo_get_expr(p$mapping$y))
    }
  }
  
  if("colour" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$colour)){
      color_var <- as.character(rlang::quo_get_expr(p$mapping$colour))
    }
  }
  
  if(setequal(c(xvar, yvar), names(polygon))){ 
    if(dim(polygon)[2] >1){
      in_poly <- sp::point.in.polygon(p$data[[xvar]], 
                                      p$data[[yvar]], 
                                      polygon[[xvar]],
                                      polygon[[yvar]], 
                                      mode.checked=FALSE)
      
      perc_in_poly <- sprintf("%.1f", sum(in_poly)/length(in_poly)*100)
      
      idx_match <- match(c(xvar, yvar), names(polygon))
      names(polygon)[idx_match] <- c("x", "y")
      
      label <- paste(gate@filterId, " (", perc_in_poly, "%)", sep="")
      p <- add_polygon_layer(p, polygon = polygon, label = label)
    }else{
      p <- p + geom_area(data = data.frame(x = polygon[[xvar]], y = c(1,1)), 
                         mapping = aes(x=x, y = y), 
                         alpha = 0.2, 
                         color = "red", fill = "red")
      perc_in_poly <- sum(p$data[[xvar]] <= max(polygon[[xvar]]) & 
                            p$data[[xvar]] >= min(polygon[[xvar]]))/ 
        length(p$data[[xvar]])*100
      perc_in_poly <- sprintf("%.1f", perc_in_poly)
      label <- paste(gate@filterId, " (", perc_in_poly, "%)", sep="")
      df_label <- data.frame(x=mean(polygon[[xvar]]), y= 0.5)
      p <- p +  geom_label_repel(data = df_label, force = 4, inherit.aes = FALSE,
                                 mapping = aes(x=x, y=y),
                                 label = label,
                                 fill = grDevices::rgb(1,1,1,0.85),
                                 color = "red",
                                 nudge_y = 0,
                                 nudge_x =0,
                                 point.padding = 0)
      
    }
    
  }
  
  return(p)
  
}

#' Add a gate layer to plot
#' @param p a plot
#' @param gate a gate object
#' @importFrom sp point.in.polygon
#' @importFrom rlang quo_get_expr
#' @importFrom ggcyto geom_gate geom_stats
add_gate_to_plot <- function(p, gate){
  
  if(is.null(gate)){
    return(p)
  }
  if(class(gate[[1]]) == "booleanFilter"){
    warning("Gates of class booleanFilter cannot be displayed")
    return(p)
  }
    
  polygon <- get_gate_coordinates(gate[[1]])
  
  xvar <- NULL
  yvar <- NULL
  color_var <- NULL
  
  if("x" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$x)){
      xvar <- as.character(rlang::quo_get_expr(p$mapping$x))
    }
  }
  
  if("y" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$x)){
      yvar <- as.character(rlang::quo_get_expr(p$mapping$y))
    }
  }
  
  if(all(names(polygon) %in% c(xvar, yvar))){ 
    
    p <- p + ggcyto::geom_gate(gate) + 
      ggcyto::geom_stats(gate = gate, nudge_y = 0.5,
                                              type = c("gate_name", "percent"), label.padding = unit(0.5, "lines"),
                                              fill = grDevices::rgb(1,1,1,0.75))
  }
  
  return(p)
  
}

#' Get data ranges from a plot
#' @param p a plot
#' @importFrom sp point.in.polygon
#' @importFrom rlang quo_get_expr
#' @importFrom scales expand_range
get_plot_data_range <- function(p){

  xlim <- NULL
  ylim <- NULL
  xvar <- NULL
  yvar <- NULL
  
  data_range <- list()
  
  if("x" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$x)){
      xvar <- as.character(rlang::quo_get_expr(p$mapping$x))
    }
  }
  
  if("y" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$x)){
      yvar <- as.character(rlang::quo_get_expr(p$mapping$y))
    }
  }
  
  if(!is.null(xvar)){
    if(class(p$data) %in% c("ncdfFlowSet", "flowSet")){
      xvalues <- exprs(p$data[[1]])[,xvar]
    }else{
      xvalues <- p$data[[xvar]]
    }
    xlim <- range(xvalues)
    data_range[[xvar]] <- scales::expand_range(xlim, add = 1)
  }
  
  if(!is.null(yvar)){
    if(class(p$data) %in% c("ncdfFlowSet", "flowSet")){
      yvalues <- exprs(p$data[[1]])[,yvar]
    }else{
      yvalues <- p$data[[yvar]]
    }
    ylim <- range(yvalues)
    data_range[[yvar]] <- scales::expand_range(ylim, add=1)
  }
  
  return(data_range)
}

#' Build a tree graph from a named list
#' @param gates a named list. Each list element should contain a item 'parent' with 
#' the name of its parent list element
#' @param attrs parameter passed to Rgraphviz::layoutGraph()
#' @importFrom graph addEdge nodes
#' @importFrom Rgraphviz renderGraph layoutGraph
#' @importFrom methods new
plot_tree <- function(gates, 
                      attrs = list(graph=list(rankdir="LR"),
                                   node=list(fixedsize = FALSE,
                                             fillcolor = "gray",
                                             fontsize = 40,
                                             shape = "ellipse"))
                      ){
  
  gR = methods::new("graphNEL", nodes = union("root", names(gates)), edgemode = "directed")
  
  for(i in 1:length(gates)){
    if(!is.null(gates[[i]]$parent)){
      gR = graph::addEdge(gates[[i]]$parent,  names(gates)[i], gR)
    }
  }
  
  nAttrs <- list()
  nodeNames <- basename(graph::nodes(gR))
  names(nodeNames) <- graph::nodes(gR)
  nAttrs$label <- nodeNames
  
  p <- Rgraphviz::renderGraph(
    Rgraphviz::layoutGraph(gR,
                           nodeAttrs=nAttrs,
                           attrs=attrs
    )
  )
  return(p)
}

### Format plot (legend, scale, labels ...) #####################################################

#' Format a ggplot object
#' @param p a ggplot object
#' @param options  list of plot format options. Names of options include:
#' xlim : x-axis range
#' ylim : y-axis range
#' transformation : named list of trans objects 
#' default_trans : default trans object (set to 'identity_trans()' by default). 
#' Used only if 'transformation' is not an element of 'options'.
#' axis_labels : named list with axis labels (each element should be named after a plot variable)
#' color_var_name : name to display for color variable
#' facet_var : names of the variables used for facetting plots along the x-axis
#' facet_yvar : names of the variables used for facetting plots along the y-axis
#' scales : control scaling across facets (passed to 'facet_grid()'), Set to "fixed" by default
#' option : name of the viridis palette
#' theme : name of the ggplot theme ("gray" by default)
#' legend.position : legend position
#' @import ggplot2
#' @import viridis
#' @importFrom stats as.formula
#' @importFrom rlang quo_get_expr
#' @importFrom scales identity_trans
#' @importFrom flowCore exprs
#' @return a ggplot object
format_plot <- function(p,
                        options = list()){
  
  if(! "ggplot" %in% class(p) ){
    stop("p is not an object of class 'ggplot' ")
  }
  
  xvar <- NULL
  yvar <- NULL
  color_var <- NULL
  title <- NULL
  
  if("x" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$x)){
      xvar <- as.character(rlang::quo_get_expr(p$mapping$x))
    }
  }
  
  if("y" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$x)){
      yvar <- as.character(rlang::quo_get_expr(p$mapping$y))
    }
  }
  
  xlim <- NULL
  ylim <- NULL
  
  transformation <- list()
  axis_labels <- list()
  axis_limits <- list()
  
  if("colour" %in% names(p$mapping)){
    if("quosure" %in% class(p$mapping$colour)){
      color_var <- as.character(rlang::quo_get_expr(p$mapping$colour))
      print(color_var)
    }
  }

  facet_yvar <- NULL
  if(!is.null(p$plot_env$plot_type)){
    if(p$plot_env$plot_type == "bar"){
      facet_yvar <- "variable"
    }
  }
  
  
  #### default parameters ###
  
  var_options <- c("xlim", "ylim", "transformation", "default_trans",
                   "axis_labels", "axis_limits", "color_var_name", "facet_var", "facet_yvar",
                   "scales", "option", "theme", "legend.position", "title")
  
  for(var in intersect(names(options), var_options)){
    assign(var, options[[var]])
  }

  #facet scales
  if(is.null(options$scales)){
    scales <- "fixed"
  }
  
  #default viridis palette
  if(is.null(options$option)){
    option <- "viridis"
  }

  #default transformation
  if(is.null(options$default_trans)){
    default_trans <- scales::identity_trans()
  }
  
  ### transformations ####
  
  if(!is.null(xvar)){
    if(length(xvar) == 1){

      xvalues <- p$data[[xvar]]
      labx <- ifelse(xvar %in% names(axis_labels), 
                     axis_labels[[xvar]], 
                     xvar)
      trans_x <- default_trans
      if(xvar %in% names(transformation)){
        trans_x <- transformation[[xvar]]
      }
      xlim <- axis_limits[[xvar]]
      
      if(is.double(xvalues)){
        
        if(!is.null(xlim)){
          names(xlim) <- c("min", "max")
        }
        p$coordinates$limits$x <- xlim
        
        p <- p + scale_x_continuous(name = labx, 
                                    trans = trans_x, limits = xlim ) 
        
      }else if(is.integer(xvalues)){
        limits <- NULL
        if(!is.null(xlim)){limits <- seq(xlim[1], xlim[2])}
        p <- p + scale_x_discrete(name = labx,  limits = limits) 
      }else{
        p <- p + scale_x_discrete(name = labx) 
      }
     
    }
  }
  
  if(!is.null(yvar)){
    if(length(yvar) == 1){
      
      yvalues <- p$data[[yvar]]
      laby <- ifelse(yvar %in% names(options$axis_labels), 
                     options$axis_labels[[yvar]], 
                     yvar)
      trans_y <- default_trans
      if(yvar %in% names(transformation)){
        trans_y <- transformation[[yvar]]
      }
      ylim <- axis_limits[[yvar]]
      
      if(is.double(yvalues)){
        
        if(!is.null(ylim)){
          names(ylim) <- c("min", "max")
        }
        p$coordinates$limits$y <- ylim
        
        p <- p + scale_y_continuous(name = laby, 
                                    trans = trans_y, limits = ylim) 
      }else if(is.integer(yvalues)){
        limits <- NULL
        if(!is.null(ylim)){limits <- seq(ylim[1], ylim[2])}
        p <- p + scale_y_discrete(name = laby,  limits = limits) 
      }else{
        p <- p + scale_y_discrete(name = laby) 
      }
        
    }
  }
  
  if("GeomPoint" %in% class(p$layers[[1]]$geom)){
  #if(!is.null(p$plot_env$plot_type)){
    #if(p$plot_env$plot_type == "dots"){
      
      if(!is.null(color_var)){
        if(length(color_var) == 1){

          print("OK color")
          label_color <- ifelse(color_var %in% 
                                  names(options$axis_labels), 
                                options$axis_labels[[color_var]], 
                                color_var)
          trans_col <- default_trans
          
          if(color_var %in% names(transformation)){
            trans_col <- transformation[[color_var]]
          }
          
          color_lim <- axis_limits[[color_var]]
          
          is_cont <- FALSE
          
          if(color_var %in% names(p$data)){
            is_cont <- is.double(p$data[[color_var]])
          }
          
          #is_cont <- ifelse(color_var %in% names(p$data), is.double(p$data[[color_var]]), FALSE)
          
          if(is_cont){
            print(trans_col)
            print(color_lim)
            p <- p + viridis::scale_colour_viridis(trans = trans_col,
                                                   name = label_color,
                                                   option = option, 
                                                   limits = color_lim)
          }
        }
      }
    
  }

  if("StatPointdensity" %in% class(p$layers[[1]]$stat)){
    p <- p + viridis::scale_colour_viridis(option = option)
  }
  
  ### facet ####
  if(!is.null(options$facet_var) | !is.null(facet_yvar)){
    
    left_formula <- paste(facet_yvar, collapse = " + ")
    right_formula <- "."
    if(!is.null(options$facet_var)){
      if(options$facet_var != ""){
        right_formula <- paste(options$facet_var, collapse = " + ")
      }
    }
    
    #print(paste(left_formula, "~", right_formula))
    formula_facet <- stats::as.formula(paste(left_formula, "~", right_formula))
    
    p <- p + facet_grid(formula_facet,
                        labeller = label_both,
                        #scales = scale_y,
                        scales = scales)
  }else{
    p <- p + facet_wrap(NULL)
  }
  
  ### theme ####
  if(!is.null(title)){
    p <- p + ggtitle(title)
  }
  
  if("theme" %in% names(options)){
    if(!is.null(options$theme)){
      if(options$theme != ""){
        theme_name = paste("theme_", options$theme, sep = "")
        theme_function <- function(...){
          do.call(theme_name, list(...))
        }
        p <- p + theme_function()
      }
    }
    
  }
  
  
  if(!is.null(options$legend.position)){
    p <- p + theme(legend.position = options$legend.position)
  }
  
  p <- p + theme(plot.title = element_text(face = "bold"))

  return(p)
  
}


### Main plot functions #######################################################################


#' Plot a GatingSet
#' @param df a data.frame with plot data resulting from a call of \code{get_plot_data}. 
#' Supersedes parameters 'gs', 'sample', 'spill', 'metadata'
#' @param gs a GatingSet
#' @param sample Names of samples from the GatingSet 
#' (as returned by \code{pData(gs)$name})
#' @param subset Names of subsets from the GatingSet 
#' (as returned by \code{gs_get_pop_paths(gs)})
#' @param spill spillover matrix. If NULL, uncompensated data is used for gating and plotting.
#' @param metadata a data.frame containing metadata associated to samples.
#' Must have a column \code{name} used for mapping.
#' @param plot_type name of the plot type
#' @param plot_args  list of plot parameters passed to the plot function. 
#' Plot parameters depend on the plot type selected.
#' @param options  list of plot format options passed to \code{format_plot()}
#' @param gate_name Names of the gates to add to the plot (if it is compatible with plot parameters).
#' Ignored if NULL.
#' @param Ncells Maximum number of cells per sample and subset. If NULL, all cells are used.
#' @importFrom flowWorkspace gs_get_pop_paths gh_pop_get_gate sampleNames
#' @return a plot
plot_gs <- function(gs,
                    df = NULL,
                    sample = NULL,
                    subset = NULL,
                    spill = NULL,
                    metadata = NULL,
                    gate_name = NULL,
                    Ncells = NULL,
                    plot_type = "hexagonal",
                    plot_args = list(),
                    options = list()){
  
  
  if(! "xvar" %in% names(plot_args)){
    plot_args[["xvar"]] <- colnames(gs@data)[1]
  }
  if(! "yvar" %in% names(plot_args)){
    plot_args[["yvar"]] <- colnames(gs@data)[2]
  }
  
  if(is.null(sample)) sample <-  flowWorkspace::sampleNames(gs)[1]
  if(is.null(subset)) subset <- gh_get_gate_names(gs[[1]])[1]
  
  df <- get_plot_data(df = df,
                      gs = gs,
                      sample = sample,
                      subset = subset,
                      Ncells = Ncells,
                      spill = spill, 
                      metadata = metadata)
  
  p <- call_plot_function(data = df,
                          plot_type = plot_type,
                          plot_args = plot_args)
  
  p <- format_plot(p, options = options)
  
  # if(!is.null(gate_name)){
  #   for(gateName in setdiff(gate_name, "root")){
  #     g <- flowWorkspace::gs_pop_get_gate(gs, gateName)
  #     p <- add_gate(p, g[[sample[1]]])
  #   }
  # }
  
  return(p)
}

#' Plot a GatingSet
#' @param gs a GatingSet
#' @param sample Names of samples from the GatingSet 
#' (as returned by \code{pData(gs)$name})
#' @param subset Names of subsets from the GatingSet 
#' (as returned by \code{gs_get_pop_paths(gs)})
#' @param spill spillover matrix. If NULL, uncompensated data is used for gating and plotting.
#' @param metadata a data.frame containing metadata associated to samples.
#' Must have a column \code{name} used for mapping.
#' @param plot_type name of the plot type
#' @param plot_args  list of plot parameters passed to the plot function. 
#' Plot parameters depend on the plot type selected.
#' @param options  list of plot format options passed to \code{format_plot()}
#' @param gate_name Names of the gates to add to the plot (if it is compatible with plot parameters).
#' Ignored if NULL.
#' @importFrom flowWorkspace gs_get_pop_paths gh_pop_get_gate sampleNames
#' @importFrom ggcyto as.ggplot

#' @return a plot
plot_gs_ggcyto <- function(gs,
                    sample = NULL,
                    subset = NULL,
                    spill = NULL,
                    metadata = NULL,
                    gate_name = NULL,
                    plot_type = "hexagonal",
                    plot_args = list(),
                    options = list()){
  
  
  if(! "xvar" %in% names(plot_args)){
    plot_args[["xvar"]] <- colnames(gs@data)[1]
  }
  if(! "yvar" %in% names(plot_args)){
    plot_args[["yvar"]] <- colnames(gs@data)[2]
  }
  
  
  if(is.null(sample)) sample <-  flowWorkspace::sampleNames(gs)[1]
  if(is.null(subset)) subset <- gh_get_gate_names(gs[[1]])[1]
  
  fs <- gs_get_fs_subset(gs[sample], spill = spill, subset = subset)
  options[["title"]] <- subset
  
  # if(!is.null(spill)){
  #   fs <- flowCore::compensate(fs, gs@compensation)
  # }
  
  p <- call_plot_function(data = fs,
                          plot_type = plot_type,
                          plot_args = plot_args)
  
  if(!is.null(gate_name)){
    for(gateName in setdiff(gate_name, "root")){
      g <- flowWorkspace::gs_pop_get_gate(gs, gateName)
      p <- add_gate_to_plot(p, g)
    }
  }
  
  p <- ggcyto::as.ggplot(p)
  
  p <- format_plot(p, options = options)
  
  return(p)
}

#' Plot aggregated data from a GatingSet
#' @param df a data.frame with plot data resulting from a call of \code{get_plot_data}. 
#' Supersedes parameters 'gs', 'sample', 'spill'
#' @param gs a GatingSet
#' @param sample Names of samples from the GatingSet 
#' (as returned by \code{pData(gs)$name})
#' @param subset Names of subsets from the GatingSet 
#' (as returned by \code{gs_get_pop_paths(gs)})
#' @param spill spillover matrix. If NULL, uncompensated data is used for gating and plotting.
#' @param metadata a data.frame containing metadata associated to samples.
#' Must have a column \code{name} used for mapping.
#' @param transformation A list of trans objects. 
#' Each element must be named after a parameter and contain the transfomation to apply for this parameter.
#' If NULL, the default transformation 'y_trans' is applied.
#' @param stat_function Name of the function to be applied on transformed data for each sample and subset.
#' @param y_trans Default trans object (set to 'identity_trans()' by default). 
#' Used only if parameter 'transformation' is NULL. 
#' @param apply_inverse logical; Apply inverse transformation before returning the data.
#' @param yvar Names of the variables for which to compute statistics
#' @param var_names Replace 'yvar' with custom names
#' @param scale logical; Should data be scaled for each 'yvar' variable?
#' @param plot_type name of the plot type
#' @param plot_args  list of plot parameters passed to the plot function. 
#' Plot parameters depend on the plot type selected.
#' @param options  list of plot format options passed to \code{format_plot()}
#' @importFrom flowWorkspace gs_get_pop_paths sampleNames
#' @importFrom scales identity_trans
#' @return a list with a plot and the corresponding plot data
plot_stat <- function(df = NULL,
                      gs,
                      sample = NULL,
                      subset = NULL,
                      spill = NULL,
                      metadata = NULL,
                      transformation=NULL,
                      stat_function = "mean",
                      y_trans = identity_trans(),
                      apply_inverse = TRUE,
                      yvar = NULL,
                      var_names = NULL,
                      scale = FALSE,
                      plot_type = "heatmap",
                      plot_args = list(),
                      options = list() ){
                        
  
  
  if(is.null(sample)) sample <- flowWorkspace::sampleNames(gs)[1]
  if(is.null(subset)) subset <- gh_get_gate_names(gs[[1]])[1]
  
  if(is.null(df)){
    df <- get_plot_data(df = df,
                        gs = gs,
                        sample = sample,
                        subset = subset,
                        spill = spill, 
                        metadata = NULL)
  }
  
  df <- df[df$name %in% sample & df$subset %in% subset, ]
  
  df_stat <- compute_stats(df = df,
                      gs = gs,
                      spill = spill,
                      transformation = transformation,
                      stat_function = stat_function,
                      y_trans = y_trans,
                      apply_inverse = apply_inverse,
                      yvar = yvar,
                      var_names = var_names,
                      id.vars = c("name", "subset"))
  
  if(scale){
    df_stat <- scale_values(df_stat, id.vars = c("name", "subset"))
  }                          
  
  df_stat <- add_columns_from_metadata(df_stat, metadata = metadata)
  
  plot_args$stat_var <- switch(stat_function,
                               "cell count" = "Count",
                               "percentage" = "perc_parent",
                               yvar)
  
  plot_args$annotation_vars <- unique(c("name", "subset", names(metadata)))
  
  p <- call_plot_function(data = df_stat,
                          plot_type = plot_type,
                          plot_args = plot_args)
  
  
  if("plot_type" %in% names(p$plot_env)){
   p <- format_plot(p, options = options)
  }
  
  return( list(plot = p, data = df_stat) )
}

#' Plot all gates for a given sample of a GatingSet
#' @description  Plot all gates for a given sample of a gating set
#' @param df data.frame with columns \code{name} and \code{subset} 
#' containing sample and subset names respectively and
#' columns with plot variables. Ignored if \code{NULL}. 
#' Otherwise supersedes parameters 'gs', 'sample', 'spill', 'metadata'.
#' @param gs a GatingSet
#' @param sample sample names
#' @param Ncells number of cells to sample from the GatingSet
#' @param selected_subsets subset names. if NULL, all gates are drawn.
#' @param spill spillover matrix. If NULL, uncompensated data is used both for gating and plotting.
#' @param plot_type name of the plot type
#' @param plot_args  list of plot parameters passed to \code{plot_gs()}
#' @param options  list of plot format options passed to \code{format_plot()}
#' @return a list of ggplot objects
#' @importFrom flowWorkspace gs_get_pop_paths gs_pop_get_parent gs_pop_get_children sampleNames
  plot_gh <- function( gs, 
                      df = NULL,
                      sample = NULL,
                      Ncells = NULL,
                      selected_subsets = NULL,
                      spill = gs@compensation,
                      plot_type = "hexagonal",
                      plot_args = list(), 
                      options = list()){
  
  if(is.null(sample)){sample = flowWorkspace::sampleNames(gs)[1]}
  
  idx <- match(sample, flowWorkspace::sampleNames(gs))
  
  if(is.null(selected_subsets)){
    selected_subsets <- setdiff(gh_get_gate_names(gs[[1]]), "root")
    subset <- gh_get_gate_names(gs[[1]])
  }else{
    subset <- selected_subsets[selected_subsets %in% gh_get_gate_names(gs[[1]])]
    parent_subsets <- sapply(subset, function(x){flowWorkspace::gs_pop_get_parent(gs[[idx[1]]], x)})
    subset <- union(subset, parent_subsets)
  }
  

  # if(is.null(df)){
  #   
  #   df <- get_data_gs(gs = gs,
  #                     sample = sample,
  #                     subset = subset,
  #                     spill = spill,
  #                     Ncells = Ncells)
  #   
  # }
  
  child_nodes <- flowWorkspace::gs_pop_get_children(gs[[idx[1]]], "root")
  child_nodes <- child_nodes[child_nodes %in% selected_subsets]
  
  
  plist <- list()
  count <- 0
  
  #plot gates descending the gh until there are no more children gates
  while(length(child_nodes)>0){
    
    child_nodes_int <- NULL
    nodes_to_plot <- child_nodes
    all_parents <- sapply(nodes_to_plot, function(x){flowWorkspace::gs_pop_get_parent(gs[[idx[1]]], x)})
    names(all_parents) <- NULL
    
    for(parent in unique(all_parents)){
      
      idx_parent <- which(all_parents == parent)
      
      nodes_to_plot_parent <- nodes_to_plot[idx_parent]
      
      #plot together gates that share the same set of parameters
      
      while(length(nodes_to_plot_parent) > 0){
        
        
        par_nodes <- lapply(nodes_to_plot_parent, function(x){
          
          g <- flowWorkspace::gh_pop_get_gate(gs[[idx[1]]], x)

          if(class(g) %in% c("polygonGate")){
            try(colnames(g@boundaries), silent = TRUE)
          }else if(class(g) %in% c("ellipsoidGate")){
            try(colnames(g@cov), silent = TRUE)
          }else if(class(g) %in% c("rectangleGate")){
            try(names(g@min), silent = TRUE)
          }
          
        })
        
        same_par <- sapply(par_nodes, function(x){setequal(x, par_nodes[[1]])})
        
        count <- count + 1

        plot_args$xvar <- par_nodes[[1]][1]
        plot_type_gate <- plot_type
        if(length(par_nodes[[1]]) > 1){
          plot_args$yvar <- par_nodes[[1]][2]
        }else{
          plot_type_gate <- "histogram"
        }
        
        plist[[count]] <- plot_gs_ggcyto(gs=gs, 
                                   sample=sample,
                                   subset = parent, 
                                   spill = spill,
                                   gate_name = nodes_to_plot_parent[same_par], 
                                   plot_type = plot_type_gate,
                                   plot_args = plot_args,
                                   options = options)
        
        all_children <- unlist(sapply(nodes_to_plot_parent[same_par], function(x){flowWorkspace::gs_pop_get_children(gs[[1]], x)}))
        names(all_children) <- NULL
        
        child_nodes_int <- c(child_nodes_int, all_children)
        nodes_to_plot_parent <- setdiff(nodes_to_plot_parent, nodes_to_plot_parent[same_par])
        
      }
      
    }
    
    child_nodes <- child_nodes_int[child_nodes_int %in% selected_subsets]
    
  }
  return(plist)
}

#' Plot a gate from a GatingSet
#' @param gate_name name of the gate
#' @param df a data.frame with plot data resulting from a call of \code{get_plot_data}. 
#' Supersedes parameters 'gs', 'sample', 'spill', 'metadata'
#' @param gs a GatingSet
#' @param sample Set of samples from 'gs'
#' @param spill compensation 
#' @param metadata a data.frame containing metadata associated to samples.
#' Must have a column \code{name} used for mapping.
#' @param plot_type name of the plot type
#' @param plot_args  list of plot parameters passed to \code{plot_gs()}
#' @param options  list of plot format options passed to \code{format_plot()}
#' @importFrom flowWorkspace gh_pop_get_gate sampleNames
#' @importFrom ggcyto as.ggplot
#' @importFrom flowCore compensate
plot_gate <- function(gate_name,
                     df = NULL,
                     gs,
                     sample = NULL,
                     spill = NULL,
                     metadata = NULL,
                     plot_type = "hexagonal",
                     plot_args = list(),
                     options = list()){
  
  gate <- flowWorkspace::gs_pop_get_gate(gs, gate_name)
  polygon <- get_gate_coordinates(gate[[1]])
  
  subset <- flowWorkspace::gs_pop_get_parent(gs,  gate_name)
  plot_args[["xvar"]] <- names(polygon)[1]

  if(length(names(polygon))>1){
    plot_args$yvar <- names(polygon)[2]
  }else{
    plot_type = "histogram"
  }
  
  if(is.null(sample)) sample <-  flowWorkspace::sampleNames(gs)[1]

  # df <- get_plot_data(df = df,
  #                     gs = gs,
  #                     sample = sample,
  #                     subset = parent,
  #                     spill = spill,
  #                     metadata = metadata)
  
  fs <- gs_pop_get_data(gs[sample], subset)
  
  if(!is.null(spill)){
    fs <- flowCore::compensate(fs, gs@compensation)
  }
  
  p <- call_plot_function(data = fs,
                    plot_type = plot_type,
                    plot_args = plot_args)
  
  p <- add_gate_to_plot(p, gate)
  
  p <- ggcyto::as.ggplot(p)
    
  p <- format_plot(p, options = options)
  
  
  
  return(p)
}



#' scale column of a data frame
#' @param df a data.frame
#' @param id.vars Names of df's columns that should not be scaled
#' @return a data.frame
scale_values <- function(df, id.vars = NULL){
  
  if(is.null(id.vars)){
    id.vars <- names(df)[which(!sapply(df, is.numeric))]
  }
  
  df_scale <- df
  df_scale[-which(names(df) %in% id.vars)] <- scale(df[-which(names(df) %in% id.vars)])
  
  df_scale
}

### compensation ##################################################################################

matrix_equal <- function(x, y){
  is.matrix(x) && is.matrix(y) && dim(x) == dim(y) && all(x == y)
}
#' @importFrom htmlwidgets JS
#' @importFrom DT datatable formatRound formatStyle styleInterval
#' @importFrom magrittr %>%
#' @importFrom RColorBrewer brewer.pal
format_style_comp_matrix <- function(df, editable = 'none', rownames = TRUE){
  
  `%>%` <- DT::`%>%`() 
    
  df <- as.matrix(df)
  do_formatting <- is.numeric(df[1])
  
  if(do_formatting){
    
    headerCallback <- c(
      "function(thead, data, start, end, display){",
      "  var $ths = $(thead).find('th');",
      "  $ths.css({'vertical-align': 'bottom', 'white-space': 'nowrap'});",
      "  var betterCells = [];",
      "  $ths.each(function(){",
      "    var cell = $(this);",
      "    var newDiv = $('<div>', {height: 'auto', width: cell.height()});",
      "    var newInnerDiv = $('<div>', {text: cell.text()});",
      "    newDiv.css({margin: 'auto'});",
      "    newInnerDiv.css({",
      "      transform: 'rotate(180deg)',",
      "      'writing-mode': 'tb-rl',",
      "      'white-space': 'nowrap'",
      "    });",
      "    newDiv.append(newInnerDiv);",
      "    betterCells.push(newDiv);",
      "  });",
      "  $ths.each(function(i){",
      "    $(this).html(betterCells[i]);",
      "  });",
      "}"
    )
    
    colors <- c(RColorBrewer::brewer.pal(n = 9, name = "Blues")[10-(1:9)], 
                RColorBrewer::brewer.pal(n = 9, name = "Reds")[1:9])
    # colnames(df) <- unlist(lapply(strsplit(colnames(df), split="-"), function(x){
    #   paste(unlist(x[2:(length(x)-1)]), collapse = "-")}))
    # row.names(df) <- unlist(lapply(strsplit(row.names(df), split="-"), function(x){
    #   paste(unlist(x[2:(length(x)-1)]), collapse = "-")}))
    df <- DT::datatable(df*100,
                        rownames = rownames, 
                        selection = list(mode = 'single', target = 'cell'), 
                        editable  = editable, 
                        options = list(
                          initComplete = htmlwidgets::JS(
                            "function(settings, json) {",
                            "$(this.api().table().container()).css({'font-size': '12px'});",
                            "}"),
                          headerCallback = htmlwidgets::JS(headerCallback),
                          autoWidth = FALSE,
                          scrollX=TRUE
                          #columnDefs = list(list(width = '10px', targets = "_all"))
                        )) %>%
      DT::formatRound(columns = colnames(df), digits = 2, ) %>%
      #DT::formatStyle(columns = colnames(df), fontSize = '50%') %>%
      DT::formatStyle(
        columns = colnames(df),
        backgroundColor = DT::styleInterval(cuts = seq(-125, 125, 250/(length(colors)-2)), values = colors),
      )
    
  }else{
    df <- DT::datatable(df, rownames = rownames)
  }
  return(df)
}


plot_comp_as_heatmap <- function(df, name = ""){
  
  maxval <- 100*max(c(1.25, max(abs(df))))
  limits <- c(-maxval, maxval)
  df <- as.data.frame(100*df)
  df <- signif(df, digits = 2)
  df[df == 0] <- NA

  colors <- c(RColorBrewer::brewer.pal(n = 9, name = "Blues")[10-(1:9)], 
              RColorBrewer::brewer.pal(n = 9, name = "Reds")[1:9])
  
  p <- heatmaply::heatmaply(df,
                            colors = colors,
                            plot_method="plotly",
                            limits = limits,
                            Rowv = NULL,
                            Colv = NULL,
                            column_text_angle = 90,
                            xlab = "detection channel",
                            ylab = "emitting fluorophore",
                            fontsize_row = 10,
                            fontsize_col = 10,
                            cellnote_size = 6,
                            hide_colorbar = FALSE,
                            main = paste(name, "spillover (%)"),
                            margins = c(50, 50, 50, 0)
  )
}

### Dimensionality Reduction ###################################################################

#' Perform dimensionality reduction
#' @description  Perform dimensionality reduction
#' @param df a data.frame with only numeric variables.
#' @param yvar names of df's variables used to perform dimensionality reduction
#' @param Ncells Maximum number of cells without any NA values sampled from df. 
#' If NULL, all cells without any NA values are used
#' @param transformation  Named list of \code{trans} objects. 
#' List names should correspond to variable names.
#' @param y_trans default \code{trans} object to be used if \code{transformation} is NULL.
#' @param perplexity t-SNE perplexity parameter (passed to \code{Rtsne:Rstne()})
#' @param dims Number of dimensions (passed to \code{Rtsne:Rstne()})
#' @param method Name of the method used. Either "tSNE" or "umap"
#' @param check_duplicates logical. Checks whether duplicates are 
#' present (passed to \code{Rtsne:Rstne()})
#' @return a data.frame with additionnal columns : 
#' "tSNE1" and "tSNE2" for method 'tSNE', "UMAP1" and "UMAP2" for method 'umap'
#' @importFrom Rtsne Rtsne
#' @importFrom umap umap
#' @importFrom scales log10_trans
dim_reduction <- function(df,
                          yvar,
                          Ncells = NULL,
                          transformation = NULL,
                          y_trans = identity_trans(),
                          perplexity = 50,
                          dims = 2,
                          method = "tSNE",
                          check_duplicates = FALSE){
  
  yvar <- as.character(yvar)
  
  idx_cells_kept <- 1:dim(df)[1]
  
  if(is.numeric(Ncells)){
    if(Ncells<=0){
      warning("Parameter Ncells must be > 0")
      return(NULL)
    }
  }
  
  if(!is.null(y_trans) & is.null(transformation)){
    transformation <- lapply(yvar, function(x){y_trans})
    names(transformation) <- yvar
  }
  
  trans_name <-  unique(unlist(sapply(transformation[yvar], function(tf){tf$name})))
  
  df_trans <- df
  df_filter <- df
  
  for(i in 1:length(yvar)){
    df_trans[[yvar[i]]] <- transformation[[yvar[i]]]$transform(df[[yvar[i]]])
  }

  cell_has_non_finite <- apply(X = df_trans[, yvar], MARGIN = 1, FUN = function(x){sum(!is.finite(x) )>0})
  cell_has_na <- rowSums(is.na(df_trans[, yvar])) > 0
  idx_filter <- which(cell_has_na | cell_has_non_finite)
  
  if(length(idx_filter)>0){
    message(paste("Filter out ", length(idx_filter), " cells with NA or non-finite values", sep =""))
    df_trans <- df_trans[-idx_filter, ]
    df_filter <- df_filter[-idx_filter, ]
    idx_cells_kept <- idx_cells_kept[-idx_filter]
  }
  
  if(!is.null(Ncells) & is.numeric(Ncells)){
    Ncells_used <- min(dim(df_trans)[1], Ncells)
    idx_cells <- sample(1:dim(df_trans)[1], Ncells_used, replace = FALSE)
  }else{
    Ncells_used <- dim(df_trans)[1]
    idx_cells <- 1:dim(df_trans)[1]
  }
  
  idx_cells_kept <- idx_cells_kept[idx_cells]
  
  message(paste("Running ", method, " with ", Ncells_used, " cells and ",  length(yvar), " parameters", sep = ""))
  
  if(Ncells_used > 3000){
    message("This may take a while... Try with less cells.")
  }

  if(method == "tSNE"){
    tSNE <- Rtsne::Rtsne(df_trans[ idx_cells , yvar], perplexity = perplexity, dims = dims, check_duplicates = check_duplicates)
    df_tSNE <- tSNE$Y
    colnames(df_tSNE) <- c("tSNE1","tSNE2")
    return(list( df = cbind(df_filter[idx_cells, ], df_tSNE), keep = idx_cells_kept, var_names = c("tSNE1","tSNE2")))
  }
  
  if(method == "umap"){
    df_umap <- umap::umap(df_trans[ idx_cells , yvar])
    df_umap <- df_umap$layout
    colnames(df_umap) <- c("UMAP1","UMAP2")
    return(list( df = cbind(df_filter[idx_cells, ], df_umap), keep = idx_cells_kept, var_names = c("UMAP1","UMAP2")))
  }
  
  return(NULL)
  
}

### Clustering ##################################################################################

#' Identify clusters
#' @description  Identify clusters
#' @param df a data.frame with only numeric variables.
#' @param yvar names of df's variables used to find clusters
#' @param transformation  Named list of \code{trans} objects. 
#' List names should correspond to variable names.
#' @param y_trans default \code{trans} object to be used if \code{transformation} is NULL.
#' @param dc ClusterX dc parameter
#' @param alpha ClusterX alpha parameter
#' @param method Name of the method used. Either "FlowSOM", "ClusterX", "Rphenograph".
#' @param k integer; number of nearest neighbours (passed to \code{Rphenograph()})
#' @param k_meta Maximum number of clusters to try out 
#' (passed to \code{FlowSOM::MetaClustering()})
#' @param scale logical; Scale values before building SOM (for method 'FlowSOM' only)
#' @return a data.frame with the additionnal column "cluster"
#' @importFrom FlowSOM BuildSOM BuildMST MetaClustering
#' @importFrom igraph membership
#' @importFrom scales identity_trans
get_cluster <- function(df,
                        yvar,
                        transformation = NULL,
                        y_trans = identity_trans(),
                        dc=3, 
                        alpha = 0.001,
                        k = 100,
                        k_meta = 8,
                        scale = FALSE,
                        method = "FlowSOM"){
  
  yvar <- as.character(yvar)
  
  idx_cells_kept <- 1:dim(df)[1]
  
  if(!is.null(y_trans) & is.null(transformation)){
    transformation <- lapply(yvar, function(x){y_trans})
    names(transformation) <- yvar
  }
  
  trans_name <-  unique(unlist(sapply(transformation[yvar], function(tf){tf$name})))
  
  df_trans <- df
  df_filter <- df
  
  for(i in 1:length(yvar)){
    df_trans[[yvar[i]]] <- transformation[[yvar[i]]]$transform(df[[yvar[i]]])
  }
  
  cell_has_non_finite <- apply(X = df_trans[, yvar], 
                               MARGIN = 1, 
                               FUN = function(x){sum(!is.finite(x) )>0})
  cell_has_na <- rowSums(is.na(df_trans[, yvar])) > 0
  idx_filter <- which(cell_has_na | cell_has_non_finite)
  
  if(length(idx_filter)>0){
    message(paste("Filter out ", length(idx_filter), 
                  " cells with NA or non-finite values", sep =""))
    df_trans <- df_trans[-idx_filter, ]
    df_filter <- df_filter[-idx_filter, ]
    idx_cells_kept <- idx_cells_kept[-idx_filter]
  }
  
  if(method == "FlowSOM"){
    
    data <- as.matrix(df_trans[, which(names(df_trans) %in% yvar)])
    fSOM <- list(data = data,
                 compensate = FALSE,
                 spillover = NULL,
                 transform = FALSE,
                 scale = scale,
                 prettyColnames = colnames(data))
    
    message(paste("Clustering ", dim(data)[1], " cells using 'FlowSOM' on ", 
                  length(yvar), " parameters", sep = ""))
    
    fSOM <- BuildSOM(fSOM, colsToUse = which(colnames(data) %in% yvar))
    fSOM <- BuildMST(fSOM)
    fSOM$metaClustering <- MetaClustering(fSOM$map$codes, 
                                          "metaClustering_consensus", max=k_meta)
    
    metaClustering_perCell <- fSOM$metaClustering[fSOM$map$mapping[,1]]
    df_filter$cluster_fsom <- as.factor(fSOM$map$mapping[,1])
    df_filter$cluster <- as.factor(metaClustering_perCell)
    var_names <- c("cluster", "cluster_fsom")
    return(list(df = df_filter, keep = idx_cells_kept,  var_names = var_names, fSOM = fSOM))
  }else{
    stop("Clustering method not supported")
  }
}



### Build FlowSet ###############################################################################

#' Build a flowSet from a data.frame
#' @description Build a flowSet from a data.frame
#' @param df data.frame with a column \code{sample_col} containing sample names and
#' columns with flow variables.
#' @param origin flowSet from which to retrieve flowFrames description and parameters slots. 
#' Ignored if NULL.
#' @param chanel_col Names of df's columns to be used as flow variables 
#' @param sample_col Name of df's column containing sample names
#' @return a flowSet
#' @importFrom flowCore description parameters flowFrame flowSet
#' @importFrom flowWorkspace pData sampleNames
#' @examples
#' \dontrun{
#' utils::data("GvHD", package = "flowCore")
#' gs <- GatingSet(GvHD)
#' samples <- flowWorkspace::sampleNames(gs)[1:3]
#' df <- get_data_gs(gs = gs, sample = samples, subset = "root", Ncells = 1000)
#' fs <- build_flowset_from_df(df = df, origin = gs@data)
#' pData(fs)}
build_flowset_from_df <- function(df,
                                  origin = NULL,
                                  chanel_col = setdiff(names(df), c("name", "subset")), 
                                  sample_col = "name"){
  
  samples <- unique(df[[sample_col]])
  ff_list <- list()
  
  for(sample in samples){
    
    idx_cells <- which(df[[sample_col]] == sample)
    ncells <- length(idx_cells)
    if(ncells >0){
      df_sample <- df[idx_cells , chanel_col]
      
      df_exprs <- data.frame(lapply(df_sample, as.numeric), check.names = FALSE)
      M <- as.matrix(df_exprs)
      
      par <- NULL
      desc <- NULL
      
      if(!is.null(origin)){
        
        idx <- match(sample, flowWorkspace::sampleNames(origin))
        
        if(!is.na(idx)){
          
          par <- parameters(origin[[idx]])
          #par <- origin$par[[idx]]
          
          par@data$name <- as.character(par@data$name)
          par@data$desc <- as.character(par@data$desc)
          
          desc <- flowCore::description(origin[[idx]])
          #desc <- origin$desc[[idx]]
          new_par <- setdiff(chanel_col, par@data$name)
          npar <- length(par@data$name)
          
          for(i in 1:length(par@data$name)){
            param <- par@data$name[i]
            if(! paste("$P",i,"VARTYPE",sep="") %in% names(desc)){
              desc[[paste("$P",i,"VARTYPE",sep="")]] <- class(df_sample[[param]])
            }
          }
          
          for(param in new_par){
            npar <- npar + 1
            rg <- c(NA, NA)
            
            if(is.numeric(df_sample[[param]])){
              rg <- range(df_sample[[param]])
            }
            
            par@data <- rbind(par@data, c(param, NA, diff(rg), rg[1], rg[2]))
            rownames(par@data)[npar] <- paste("$P",npar, sep = "")
            desc[[paste("$P",npar,"DISPLAY",sep="")]] <- NA
            desc[[paste("$P",npar,"VARTYPE",sep="")]] <- class(df_sample[[param]])
            #print(class(df_sample[[param]]))
          }
          
          # par@data$vartype <- sapply(par@data$name, function(x){typeof(df_sample[[x]])})
          # rn <- row.names(par@varMetadata)
          # par@varMetadata <- rbind(par@varMetadata, "vartype")
          # row.names(par@varMetadata)<- c(rn, "vartype")
          
          
          desc[["$TOT"]] <- dim(df_sample)[1]
        }
      }
      
      if(!is.null(par) & !is.null(desc)){
        ff_list[[sample]] <- flowFrame(exprs = M,
                                       parameters = par,
                                       description = desc)
      }else{
        ff_list[[sample]] <- flowFrame(exprs = M)
      }

    }

  }
  
  if(length(ff_list)>0){
    fs_new <- flowSet(ff_list)
    if("flowSet" %in% class(origin) ){
      pdata <- data.frame(flowWorkspace::pData(origin))
      idx_match <- match(samples, flowWorkspace::sampleNames(origin))
      if(length(colnames(pdata))>1){
        flowWorkspace::pData(fs_new) <- pdata[idx_match, ]
      }else{
        flowWorkspace::pData(fs_new)$name <- pdata[idx_match, "name"]
      }
    }
  }else{
    fs_new <- NULL
  }
  
  return(fs_new)
  
}

#' @importFrom flowWorkspace GatingSet
build_gatingset_from_df <- function(df, gs_origin = NULL){
  fs <- build_flowset_from_df(df = df, origin = gs_origin@data)
  gs <- GatingSet(fs)
  choices <- get_parameters_gs(gs)
  gates <- get_gates_from_gs(gs_origin)
  add_gates_flowCore(gs, gates)
  sample <- choices$sample[choices$sample %in% names(gs_origin@compensation)]
  gs@compensation <- gs_origin@compensation[sample]
  params <- choices$params$name[choices$params$name %in% names(gs_origin@transformation)]
  gs@transformation <- gs_origin@transformation[params]
  return(gs)
}
VoisinneG/flowR documentation built on June 1, 2021, 6:42 p.m.
rdrr.io home R language documentation Run R code online
CRAN packages Bioconductor packages R-Forge packages GitHub packages
Note that we can't provide technical support on individual packages. You should contact the package authors for that.
VoisinneG/flowR
R-shiny interface for the analysis of flow cytometry data

R/flowR.R
In VoisinneG/flowR: R-shiny interface for the analysis of flow cytometry data

R Package Documentation

Browse R Packages

We want your feedback!

VoisinneG/flowR R-shiny interface for the analysis of flow cytometry data

R/flowR.R In VoisinneG/flowR: R-shiny interface for the analysis of flow cytometry data

R Package Documentation

Browse R Packages

We want your feedback!

VoisinneG/flowR
R-shiny interface for the analysis of flow cytometry data

R/flowR.R
In VoisinneG/flowR: R-shiny interface for the analysis of flow cytometry data