ENMTools: Analysis of Niche Evolution using Niche and Distribution Models

Documented in multistack.pca

#' multistack.pca, simultaneous PCA on more than one stack of environmental rasters
#'
#' Pools the cell values of every input stack, runs one centred and scaled
#' PCA (\code{prcomp}) on the cells that have no missing values, and writes
#' the resulting scores back into rasters with the geometry of each input.
#' Each density plot is also printed as a side effect while it is built.
#'
#' @param ... Two or more environmental raster stacks or bricks. Every stack
#'   must contain the same layer names; the order of the layers may differ,
#'   values are aligned to the layer order of the first stack before pooling.
#' @param n The number of PCA layers to return. A single whole number between
#'   1 and the number of layers in the stacks. Must be passed by name.
#'
#' @return A list containing a stack or brick of rasters for each input set
#'   representing the top n pca axes of the initial environmental variables
#'   (\code{raster.stacks}), some useful plots showing the distribution of
#'   each PC in the different stacks (\code{pc.plots}), and the pca object
#'   from the analysis that produced them (\code{pca.object}).
#'
#' @keywords raster pca environment
#'
#' @examples
#' test1 <- terra::crop(euro.worldclim, terra::ext(-10, -5, 40, 43))
#' test2 <- terra::crop(euro.worldclim, terra::ext(-5, 5, 40, 48))
#' test3 <- terra::crop(euro.worldclim, terra::ext(5, 15, 44, 48))
#' multistack.pca(test1, test2, test3)

multistack.pca <- function(..., n = 2){

  # Get raster stacks into a list
  stacks <- list(...)
  if(length(stacks) <= 1){
    stop("One or fewer raster stacks passed!")
  }

  # Name each stack after the expression the caller typed for it.
  # expand.dots = FALSE keeps the dots separate from n, so n never has to be
  # filtered out; collapsing deparse() guarantees exactly one string per stack
  # even when the expression is long enough to deparse onto several lines.
  dot.calls <- as.list(match.call(expand.dots = FALSE)$...)
  stacknames <- vapply(dot.calls,
                       function(x) paste(deparse(x), collapse = " "),
                       character(1))
  names(stacks) <- unname(stacknames)

  # Make sure all stacks have the same layers.
  # This will be set to true if there are any name mismatches
  mismatch <- FALSE

  for(i in seq_along(stacks)){
    for(j in seq_along(stacks)){
      missing.layers <- setdiff(names(stacks[[i]]), names(stacks[[j]]))
      if(length(missing.layers) > 0){
        print(paste("Layers in", names(stacks)[[i]],
                    "missing from", names(stacks)[[j]], ":"))

        print(missing.layers)
        mismatch <- TRUE
      }
    }
  }
  if(mismatch){stop("Layer mismatch!")}

  # The first stack defines the reference layer order
  layer.names <- names(stacks[[1]])

  # Validate n before doing any heavy lifting
  if(!is.numeric(n) || length(n) != 1 || is.na(n) || n < 1 || n != round(n)){
    stop("n must be a single positive whole number!")
  }
  if(n > length(layer.names)){
    stop("n cannot be larger than the number of layers in the stacks!")
  }

  # Get all values. rbind() on matrices binds columns by POSITION, not by
  # name, so stacks holding the same layers in a different order must be
  # reordered to the reference order or variables would be mixed up.
  env.val <- lapply(stacks, function(x){
    vals <- terra::values(x)
    if(!identical(names(x), layer.names)){
      vals <- vals[, match(layer.names, names(x)), drop = FALSE]
    }
    vals
  })

  # Figure out which cells have complete cases and which have at least one NA
  complete <- lapply(env.val, complete.cases)
  keepers <- lapply(complete, which)
  nas <- lapply(complete, function(x) which(!x))

  # Do PCA on the pooled complete cells. Rows stay in stack order, so the
  # scores of stack i occupy one contiguous run of rows in pca$x.
  pca.df <- do.call("rbind", env.val)
  pca.df <- pca.df[unlist(complete, use.names = FALSE), , drop = FALSE]
  if(nrow(pca.df) == 0){
    stop("No cells with complete data in any of the stacks!")
  }
  pca <- prcomp(pca.df, retx = TRUE, scale. = TRUE)
  if(n > ncol(pca$x)){
    stop("n is larger than the number of principal components available!")
  }

  # Build dummy layers: the first n layers of each stack serve purely as
  # templates carrying the right geometry, their values get overwritten
  env.pca <- lapply(stacks, function(x) x[[seq_len(n)]])

  # Add scores and NAs where appropriate
  # the offset is going to be used so that we start
  # on the right row of the PCA values for each set of layers
  offset <- 0
  for(i in seq_along(env.pca)){
    n.keep <- length(keepers[[i]])
    # seq_len() yields an empty index for a stack without complete cells,
    # where (offset + 1):(offset + 0) would count backwards instead
    score.rows <- offset + seq_len(n.keep)

    for(j in seq_len(n)){
      thislayer <- env.pca[[i]][[j]]
      if(length(nas[[i]]) > 0){
        thislayer[nas[[i]]] <- NA
      }
      if(n.keep > 0){
        thislayer[keepers[[i]]] <- pca$x[score.rows, j]
      }
      env.pca[[i]][[j]] <- thislayer
    }
    offset <- offset + n.keep

    # Rename layers and ship it out
    names(env.pca[[i]]) <- paste0("PC", seq_len(n))
    env.pca[[i]] <- terra::setMinMax(env.pca[[i]])
  }

  # Now we'll make some plots of the distribution of each PC in each stack
  pc.plots <- list()

  # Vector of stack names going with each observation in pca, in row order
  nkeepers <- vapply(keepers, length, integer(1))
  data.source <- rep(names(keepers), times = nkeepers)

  plot.df <- as.data.frame(pca$x)

  # aes() is evaluated lazily, so each plot needs its own environment holding
  # its own copy of i; otherwise every plot would end up showing the last PC
  for (i in seq_len(n)) {
    pc.name <- colnames(plot.df)[i]
    pc.plots[[pc.name]] <- local({
      i <- i

      p1 <- ggplot(data = plot.df, aes(x = .data[[paste0("PC", i)]], fill = data.source, alpha = 0.3)) +
        geom_density() +  xlab(pc.name) + guides(alpha = "none") +
        labs(fill = "Data source", color = "Data source")
      # print() draws the plot and invisibly returns it, so the plot object
      # itself is what gets stored in pc.plots
      print(p1)
    })
  }

  output <- list(raster.stacks = env.pca,
                 pc.plots = pc.plots,
                 pca.object = pca)

  return(output)
}

danlwarren/ENMTools documentation built on Jan. 17, 2025, 8:42 a.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

danlwarren/ENMTools
Analysis of Niche Evolution using Niche and Distribution Models

R/multistack.pca.R
In danlwarren/ENMTools: Analysis of Niche Evolution using Niche and Distribution Models

Defines functions multistack.pca

Documented in multistack.pca

R Package Documentation

Browse R Packages

We want your feedback!

danlwarren/ENMTools Analysis of Niche Evolution using Niche and Distribution Models

R/multistack.pca.R In danlwarren/ENMTools: Analysis of Niche Evolution using Niche and Distribution Models

Defines functions multistack.pca

Documented in multistack.pca

R Package Documentation

Browse R Packages

We want your feedback!

danlwarren/ENMTools
Analysis of Niche Evolution using Niche and Distribution Models

R/multistack.pca.R
In danlwarren/ENMTools: Analysis of Niche Evolution using Niche and Distribution Models