
# Defines function: plotRarefactionCurve

# Documented in: plotRarefactionCurve

#' Plot rarefaction and extrapolation curves for samples
#'
#' Given a study table, for each sample plot rarefaction curves to estimate
#' repertoire diversity. The method used to generate the rarefaction curve
#' is derived from Chao et al., (2014) using the iNEXT library.
#'
#' @param study_table A tibble consisting of antigen receptor sequencing
#' data imported by the LymphoSeq2 function [readImmunoSeq()]. "junction_aa",
#' "duplicate_count", and "duplicate_frequency" are required columns. Rows
#' are split into samples by the "repertoire_id" column.
#' @return A ggplot object showing, for each `repertoire_id`, the diversity
#' estimate (`qD`) against the number of sequences (`m`) as a line, with a
#' ribbon spanning `qD.LCL` to `qD.UCL`. Line type distinguishes interpolated
#' from extrapolated segments.
#' @seealso [LymphoSeq2::runINext()]
#' @examples
#' file_path <- system.file("extdata", "TCRB_sequencing",
#'  package = "LymphoSeq2")
#' study_table <- LymphoSeq2::readImmunoSeq(path = file_path, threads = 1)
#' study_table <- LymphoSeq2::topSeqs(study_table, top = 100)
#' LymphoSeq2::plotRarefactionCurve(study_table)
#' @export
plotRarefactionCurve <- function(study_table) {
  # Run the estimator once per sample, then stack the per-sample results into
  # a single table so they can be recoded and plotted together.
  # NOTE(review): assumes runINext() returns one data frame per sample with
  # columns m, qD, qD.LCL, qD.UCL, Method and repertoire_id -- confirm.
  rarefaction_tables <- study_table |>
    dplyr::group_by(repertoire_id) |>
    dplyr::group_split() |>
    purrr::map(runINext) |>
    dplyr::bind_rows()
  # Collapse the three Method labels into two so that observed and rarefied
  # points share one line type and only extrapolated points differ.
  rarefaction_tables <- rarefaction_tables |>
    dplyr::mutate(Method = dplyr::recode(Method,
      Observed = "Interpolated",
      Rarefaction = "Interpolated", Extrapolation = "Extrapolated"
    ))
  rarefaction_curves <- ggplot2::ggplot(rarefaction_tables,
      ggplot2::aes(x = m, y = qD, fill = repertoire_id)) +
    ggplot2::geom_line(ggplot2::aes(linetype = Method, color = repertoire_id),
                       size = 1.5) +
    # The ribbon inherits fill = repertoire_id from the top-level aesthetics.
    ggplot2::geom_ribbon(ggplot2::aes(ymin = qD.LCL, ymax = qD.UCL),
                         alpha = 0.5) +
    # Unnamed values are matched to the Method values in order, so
    # "Extrapolated" is drawn dashed and "Interpolated" solid.
    ggplot2::scale_linetype_manual(
      values = c("dashed", "solid"),
      labels = c("Extrapolated", "Interpolated")
    ) +
    ggplot2::theme_classic() +
    ggplot2::xlab("Total number of sequences") +
    ggplot2::ylab("TCR diversity") +
    ggplot2::labs(fill = "Sample", color = "Sample", linetype = "Method")
  # Return the plot visibly so that calling the function at top level prints it.
  rarefaction_curves
}
# shashidhar22/LymphoSeq2 documentation built on Jan. 16, 2024, 4:29 a.m.