# LeyLabRMisc: Ley Lab misc R functions, rmd templates, etc.
#
# Documented in calculate_rarefaction_curves estimate_rarified_richness phyloseq2df phyloseq_rel_abund

#' Convert a sub-object of a phyloseq object to a dataframe
#'
#' A helper function for converting OTU, taxonomy, and metadata to dataframes.
#' The row names of the extracted table are moved into an explicit column
#' (`OTU`, or `Sample` for `sample_data` and for flipped tables) before the
#' table is returned as a tibble.
#'
#' @param physeq_obj The phyloseq object
#' @param physeq_func Which object do you want: `otu_table`, `tax_table`, or
#'   `sample_data`. May be given as a bare function name, as a qualified
#'   function (e.g. `phyloseq::otu_table`), or as a string naming a function
#'   that is visible to the caller.
#' @param long Do you want the table in "long" format ("gathered")
#' @param flip Flip (transpose) the table? When `TRUE`, the row-name column of
#'   an `otu_table`/`tax_table` is called `Sample` instead of `OTU`.
#' @return A tibble
#' @export
#' @importFrom tidyr gather
#' @importFrom tibble as_tibble
phyloseq2df <- function(physeq_obj, physeq_func, long = FALSE, flip = FALSE) {
  # Capture the unevaluated argument first: once `physeq_func` is reassigned
  # below, substitute() could no longer recover what the caller typed.
  func_expr <- substitute(physeq_func)

  if (is.character(physeq_func) && length(physeq_func) == 1L) {
    # Accessor given by name: use the string itself as the label and resolve
    # it to a function in the caller's scope.
    func_str <- physeq_func
    physeq_func <- match.fun(physeq_func)
  } else {
    # A qualified accessor such as `phyloseq::otu_table` becomes
    # c("::", "phyloseq", "otu_table"); only the last piece is the function
    # name. Keeping a single string also keeps the scalar `==` tests valid.
    func_parts <- as.character(func_expr)
    func_str <- func_parts[length(func_parts)]
  }

  tbl <- as.data.frame(physeq_func(physeq_obj), stringsAsFactors = FALSE)
  if (flip == TRUE) {
    tbl <- as.data.frame(t(tbl))
  }

  # Preserve the row names as a regular column; tibbles do not keep row names.
  if (func_str %in% c("otu_table", "tax_table")) {
    if (flip == TRUE) {
      tbl$Sample <- rownames(tbl)
    } else {
      tbl$OTU <- rownames(tbl)
    }
  } else if (func_str == "sample_data") {
    tbl$Sample <- rownames(tbl)
  }
  # seq_len() rather than 1:nrow(): 1:0 is c(1, 0), which is rejected as
  # row names for a zero-row table.
  rownames(tbl) <- seq_len(nrow(tbl))

  if (long == TRUE) {
    if (func_str == "otu_table") {
      if (flip == TRUE) {
        tbl <- tidyr::gather(tbl, OTU, Count, -Sample)
      } else {
        tbl <- tidyr::gather(tbl, Sample, Count, -OTU)
      }
    } else if (func_str == "tax_table") {
      # NOTE(review): this excludes the `OTU` column, which only exists when
      # flip is FALSE -- confirm whether flip + long is meant to be supported
      # for tax_table.
      tbl <- tidyr::gather(tbl, Tax_level, Tax_name, -OTU)
    } else if (func_str == "sample_data") {
      tbl <- tidyr::gather(tbl, Metadata_key, Metadata_value, -Sample)
    }
  }

  return(suppressWarnings(tibble::as_tibble(tbl)))
}

#' Convert counts to relative abundances
#'
#' Thin wrapper around phyloseq::transform_sample_counts() that applies
#' `x / sum(x)` (optionally multiplied by 100) to the counts.
#'
#' @param physeq_obj The phyloseq object
#' @param percent_abund If TRUE, abundances are expressed as percentages
#'   (fraction * 100); otherwise as plain fractions
#' @return A phyloseq object
#' @export
phyloseq_rel_abund <- function(physeq_obj, percent_abund=TRUE) {
  as_fraction <- function(x) x / sum(x)
  as_percent <- function(x) x / sum(x) * 100

  # Pick the rescaling function once, then hand it to phyloseq.
  rescale <- if (percent_abund == TRUE) as_percent else as_fraction
  phyloseq::transform_sample_counts(physeq_obj, rescale)
}

#' phyloseq::estimate_richness, but includes Faith's PD
#'
#' See phyloseq::estimate_richness for full details
#'
#' @param physeq Phyloseq object
#' @param split If TRUE (default), measures are computed from the OTU table
#'   with samples as rows; if FALSE, from the pooled taxa sums
#' @param measures Which diversity measures: "Observed", "Chao1", "ACE",
#'   "Shannon", "Simpson", "InvSimpson", "Fisher" and/or "FaithPD"
#'   (Faith's PD; uses the tree stored in `physeq`). The default `NULL`
#'   computes all of them except "FaithPD".
#' @return Dataframe
#' @export
estimate_richness_phy <- function (physeq, split = TRUE, measures = NULL){
  if (!any(phyloseq::otu_table(physeq) == 1)) {
    warning("The data you have provided does not have\n",
            "any singletons. This is highly suspicious. Results of richness\n",
            "estimates (for example) are probably unreliable, or wrong, if you have already\n",
            "trimmed low-abundance taxa from the data.\n", "\n",
            "We recommended that you find the un-trimmed data and retry.")
  }

  if (!split) {
    OTU <- phyloseq::taxa_sums(physeq)
  } else {
    OTU <- as(phyloseq::otu_table(physeq), "matrix")
    # the vegan/picante calls below are given samples as rows
    if (phyloseq::taxa_are_rows(physeq)) {
      OTU <- t(OTU)
    }
  }

  # names = column/index names produced by vegan, values = public names
  renamevec <- c(S.obs = "Observed", S.chao1 = "Chao1", S.ACE = "ACE",
                 shannon = "Shannon", simpson = "Simpson",
                 invsimpson = "InvSimpson", fisher = "Fisher")
  if (is.null(measures)) {
    measures <- as.character(renamevec)
  }
  # Translate vegan-style aliases element by element so every alias maps to
  # its own public name regardless of the order in which they were given.
  is_alias <- measures %in% names(renamevec)
  if (any(is_alias)) {
    measures[is_alias] <- renamevec[measures[is_alias]]
  }
  # "FaithPD" is not part of renamevec, so it has to be accepted explicitly;
  # otherwise requesting only Faith's PD would be rejected here.
  if (!any(measures %in% c(renamevec, "FaithPD"))) {
    stop("None of the `measures` you provided are supported. Try default `NULL` instead.")
  }

  outlist <- vector("list")
  estimRmeas <- c("Chao1", "Observed", "ACE")
  if (any(estimRmeas %in% measures)) {
    outlist <- c(outlist, list(t(data.frame(vegan::estimateR(OTU)))))
  }
  if ("Shannon" %in% measures) {
    outlist <- c(outlist, list(shannon = vegan::diversity(OTU, index = "shannon")))
  }
  if ("Simpson" %in% measures) {
    outlist <- c(outlist, list(simpson = vegan::diversity(OTU, index = "simpson")))
  }
  if ("InvSimpson" %in% measures) {
    outlist <- c(outlist, list(invsimpson = vegan::diversity(OTU,
                                                             index = "invsimpson")))
  }
  if ("Fisher" %in% measures) {
    # fisher.alpha()/fisherfit() are vegan functions (as used by
    # phyloseq::estimate_richness).
    fisher <- tryCatch(vegan::fisher.alpha(OTU, se = TRUE), warning = function(w) {
      warning("phyloseq::estimate_richness: Warning in fisher.alpha(). See `?fisher.fit` or ?`fisher.alpha`. Treat fisher results with caution")
      refit <- suppressWarnings(vegan::fisher.alpha(OTU, se = TRUE))
      # Only a two-dimensional result has "alpha"/"se" columns to select;
      # a plain vector of alphas is returned unchanged.
      if (!is.null(dim(refit))) {
        refit <- refit[, c("alpha", "se")]
      }
      refit
    })
    if (!is.null(dim(fisher))) {
      colnames(fisher)[1:2] <- c("Fisher", "se.fisher")
      outlist <- c(outlist, list(fisher))
    } else {
      outlist <- c(outlist, Fisher = list(fisher))
    }
  }

  if ("FaithPD" %in% measures) {
    # With split = FALSE the pooled counts are a plain named vector; wrap them
    # as a one-row matrix so picante::pd() receives a community matrix.
    pd_input <- if (is.matrix(OTU)) {
      OTU
    } else {
      matrix(OTU, nrow = 1, dimnames = list(NULL, names(OTU)))
    }
    faith <- picante::pd(samp = pd_input, tree = phyloseq::phy_tree(physeq),
                         include.root = TRUE)
    # first row of the transposed result is the PD value for each sample
    outlist <- c(outlist, list(FaithPD = t(faith)[1, ]))
  }

  out <- do.call("cbind", outlist)
  namechange <- intersect(colnames(out), names(renamevec))
  colnames(out)[colnames(out) %in% namechange] <- renamevec[namechange]
  # keep each requested measure plus its standard-error column, if any
  colkeep <- lapply(paste0("(se\\.){0,}", measures), grep, colnames(out),
                    ignore.case = TRUE)
  out <- out[, sort(unique(unlist(colkeep))), drop = FALSE]
  out <- as.data.frame(out)
  return(out)
}

#' Helper Function for rarefaction analysis
#'
#' Drops the samples with fewer than `depth` counts, rarefies the remaining
#' samples to `depth`, and computes alpha diversity with
#' estimate_richness_phy().
#'
#' @param psdata phyloseq object
#' @param measures Which diversity measures
#' @param depth The sampling depth
#' @return molten alpha diversity object (columns `Sample`, `Measure`,
#'   `Alpha_diversity`), or `NULL` if no sample has at least `depth` counts
#' @export
estimate_rarified_richness <- function(psdata, measures, depth) {
  counts_per_sample <- phyloseq::sample_sums(psdata)

  # nothing can be rarefied to this depth
  if (max(counts_per_sample) < depth) {
    return(NULL)
  }
  psdata <- phyloseq::prune_samples(counts_per_sample >= depth, psdata)

  rarified_psdata <- phyloseq::rarefy_even_depth(psdata, depth, verbose = FALSE)

  # estimate_richness_phy() is defined in this package, not in phyloseq, so it
  # must not be called through the phyloseq:: namespace.
  alpha_diversity <- estimate_richness_phy(rarified_psdata, measures = measures)

  # as.matrix forces the use of melt.array, which includes the Sample names (rownames)
  molten_alpha_diversity <- reshape2::melt(as.matrix(alpha_diversity),
                                           varnames = c('Sample', 'Measure'),
                                           value.name = 'Alpha_diversity')
  return(molten_alpha_diversity)
}

#' Rarefaction curves of alpha diversity
#'
#' Calls estimate_rarified_richness() once per requested depth and stacks the
#' results into a single data frame.
#'
#' @param psdata phyloseq object
#' @param measures Which diversity measures (see vegan package)
#' @param depths Which sequencing depths? Example: c(10, 100, 1000)
#' @param parallel Passed to plyr::ldply() as `.parallel`
#' @return A dataframe with a numeric `Depth` column followed by the columns
#'   returned by estimate_rarified_richness()
#' @export
calculate_rarefaction_curves <- function(psdata, measures, depths, parallel=FALSE) {
  # Naming each depth after itself makes ldply() record it in the `Depth` column.
  names(depths) <- depths

  # show a text progress bar only in interactive sessions
  progress_style <- if (interactive()) 'text' else 'none'

  curves <- plyr::ldply(.data = depths,
                        .fun = estimate_rarified_richness,
                        psdata = psdata,
                        measures = measures,
                        .id = 'Depth',
                        .progress = progress_style,
                        .parallel = parallel)

  # Depth comes back as a factor; map each entry to its numeric level value.
  depth_factor <- curves$Depth
  curves$Depth <- as.numeric(levels(depth_factor))[depth_factor]

  curves
}

# leylabmpi/LeyLabRMisc documentation built on June 13, 2025, 9:29 a.m.
#
# rdrr.io home R language documentation Run R code online
#
# CRAN packages Bioconductor packages R-Forge packages GitHub packages
#
# Note that we can't provide technical support on individual packages. You should contact the package authors for that.
#
# leylabmpi/LeyLabRMisc
# Ley Lab misc R functions, rmd templates, etc.
#
# R/phyloseq.R
# In leylabmpi/LeyLabRMisc: Ley Lab misc R functions, rmd templates, etc.
#
# Defines functions calculate_rarefaction_curves estimate_rarified_richness phyloseq_rel_abund phyloseq2df
#
# Documented in calculate_rarefaction_curves estimate_rarified_richness phyloseq2df phyloseq_rel_abund
#
# R Package Documentation
#
# Browse R Packages
#
# We want your feedback!
#
# leylabmpi/LeyLabRMisc Ley Lab misc R functions, rmd templates, etc.
#
# R/phyloseq.R In leylabmpi/LeyLabRMisc: Ley Lab misc R functions, rmd templates, etc.
#
# Defines functions calculate_rarefaction_curves estimate_rarified_richness phyloseq_rel_abund phyloseq2df
#
# Documented in calculate_rarefaction_curves estimate_rarified_richness phyloseq2df phyloseq_rel_abund
#
# R Package Documentation
#
# Browse R Packages
#
# We want your feedback!
#
# leylabmpi/LeyLabRMisc
# Ley Lab misc R functions, rmd templates, etc.
#
# R/phyloseq.R
# In leylabmpi/LeyLabRMisc: Ley Lab misc R functions, rmd templates, etc.