R/extract_sigma.R
In nichetools: Complementary Package to 'nicheROVER' and 'SIBER'

Documented in extract_sigma

#' extract \eqn{\Sigma}
#'
#' Extract Bayesian estimates of \eqn{\Sigma} from data objects created by
#' [{nicheROVER}](https://cran.r-project.org/package=nicheROVER)
#' or [{SIBER}](https://cran.r-project.org/package=SIBER).
#'
#' @param data a `list` created by the function `niw.post()` or `siberMVN()`
#' in the package
#' [{nicheROVER}](https://cran.r-project.org/package=nicheROVER)
#' or [{SIBER}](https://cran.r-project.org/package=SIBER), respectively.
#' @param pkg a `character` string that is the name of the package that
#' you're using. Defaults to `"nicheROVER"`.
#' Alternatively the user can supply the argument with `"SIBER"`.
#' @param isotope_n a `numeric` either `2` or `3` that is the number of isotopes
#' used in the analysis. Will default to `2`.
#' @param isotope_names a `character` vector used to change the column names
#' of the isotopes used in the analysis. Defaults to `c("d13c", "d15n")`.
#' @param data_format a `character` string that decides whether the returned object is
#' in long or wide format. Default is `"wide"`, with the alternative supplied being `"long"`.
#'
#' @return Returns a `tibble` of extracted estimates of \eqn{\Sigma} created by
#' the function `niw.post()` or `siberMVN()` in the packages
#' [{nicheROVER}](https://cran.r-project.org/package=nicheROVER)
#' and [{SIBER}](https://cran.r-project.org/package=SIBER).
#'
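#' When `data_format` is set to `"wide"`, the returned object will contain the
#' columns `metric`, `sample_name`, `isotope`, and `sample_number`, followed by
#' one column of posterior samples of \eqn{\Sigma} per isotope
#' (e.g., `d13c` and `d15n`). When `data_format` is set to `"long"`, the
#' columns are `metric`, `id`, `sample_name`, `isotope`, `sample_number`,
#' and `post_sample`.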
#'
#' @seealso [nicheROVER::niw.post()] and [SIBER::siberMVN()]
#' @examples
#' extract_sigma(
#' data = niw_fish_post
#' )
#'
#' extract_sigma(
#' data = post_sam_siber,
#' pkg = "SIBER"
#' )
#'
#' @import dplyr
#' @import purrr
#' @import tibble
#' @import tidyr
#' @export

extract_sigma <- function(data,
                          pkg = NULL,
                          isotope_n = NULL,
                          isotope_names = NULL,
                          data_format = NULL) {
  # Reshape posterior draws of Sigma, taken from the list in `data`, into a
  # tibble. `pkg` selects how `data` is read: for "nicheROVER" the second
  # element of every list entry is used, for "SIBER" the first four columns of
  # every list entry are used. `data_format` selects a wide layout (one column
  # per isotope) or a long layout (a single `post_sample` column).
  # `isotope_n` is only consulted when `pkg` is "nicheROVER".

  # ---- argument defaults ----
  if (is.null(pkg)) {
    pkg <- "nicheROVER"
  }
  if (is.null(data_format)) {
    data_format <- "wide"
  }

  # ---- argument validation ----
  # The length checks keep `if ()` from failing with an unrelated
  # "condition has length > 1" error when a vector is supplied.
  if (length(pkg) != 1 || !(pkg %in% c("nicheROVER", "SIBER"))) {
    cli::cli_abort("Invalid characters for 'pkg'. Allowed character strings are
                   'nicheROVER' or 'SIBER'.")
  }

  if (length(data_format) != 1 || !(data_format %in% c("wide", "long"))) {
    cli::cli_abort("Invalid characters for 'data_format'. Allowed character
    strings are 'wide' or 'long'.")
  }

  if (!inherits(data, "list")) {
    cli::cli_abort("Input 'data' must be a list.")
  }

  # Number of isotope names to expect: user-controlled for nicheROVER,
  # always two for SIBER.
  if (pkg == "nicheROVER") {
    if (is.null(isotope_n)) {
      isotope_n <- 2
    }
    if (!is.numeric(isotope_n) || length(isotope_n) != 1 ||
        !(isotope_n %in% c(2, 3))) {
      cli::cli_abort("Argument 'isotope_n' must be a numeric value and either 2 or 3.")
    }
    n_isotopes <- isotope_n
  } else {
    n_isotopes <- 2
  }

  if (is.null(isotope_names)) {
    isotope_names <- c("d13c", "d15n", "d34s")[seq_len(n_isotopes)]
  }

  if (!is.vector(isotope_names) || !is.character(isotope_names)) {
    cli::cli_abort("The supplied argument for 'isotope_names' must be a vector of characters.")
  }

  if (length(isotope_names) != n_isotopes) {
    if (n_isotopes == 2) {
      cli::cli_abort("The 'isotope_names' vector must have exactly 2 elements, representing isotope_a and isotope_b.")
    } else {
      cli::cli_abort("The 'isotope_names' vector must have exactly 3 elements, representing isotope_a,  isotope_b, and isotope_c.")
    }
  }

  # ---- nicheROVER ----
  if (pkg == "nicheROVER") {
    # Second element of every list entry, converted to a tibble.
    sigma_by_group <- data |>
      purrr::map(\(group) purrr::pluck(group, 2)) |>
      purrr::map(\(sigma) tibble::as_tibble(sigma))

    # Every group must have exactly `isotope_n` rows. `any()` keeps the check
    # well-defined when groups disagree with each other.
    n_rows <- purrr::map_int(sigma_by_group, nrow)
    if (any(n_rows != isotope_n)) {
      cli::cli_abort("Argument 'isotope_n' does not match the number of isotopes
                       being used.")
    }

    sigma_long <- sigma_by_group |>
      purrr::imap(\(sigma, group_name) {
        dplyr::mutate(
          sigma,
          metric = "sigma",
          id = isotope_names,
          sample_name = group_name
        )
      }) |>
      dplyr::bind_rows() |>
      tidyr::pivot_longer(
        cols = -c("id", "sample_name", "metric"),
        names_to = "isotope",
        values_to = "post_sample"
      ) |>
      # Column names are split on "." into an isotope and a sample number.
      tidyr::separate(isotope,
                      into = c("isotope", "sample_number"),
                      sep = "\\.")

    if (data_format == "long") {
      return(sigma_long)
    }

    sigma_wide <- tidyr::pivot_wider(
      sigma_long,
      names_from = id,
      values_from = post_sample
    )
    return(sigma_wide)
  }

  # ---- SIBER ----
  # Columns 1:4 of every list entry are reshaped row-by-row into a two-column
  # layout, so every input row contributes two output rows.
  # NOTE(review): presumably columns 1:4 hold the Sigma draws - confirm
  # against SIBER::siberMVN().
  sigma_wide <- data |>
    purrr::map(\(post) {
      sigma <- post[, 1:4] |>
        t() |>
        as.numeric() |>
        matrix(ncol = 2, byrow = TRUE) |>
        as.data.frame() |>
        tibble::as_tibble()

      n_out <- nrow(sigma)

      dplyr::mutate(
        sigma,
        sample_number = rep(seq_len(ceiling(n_out / 2)),
                            each = 2,
                            length.out = n_out),
        isotope = rep(isotope_names, times = n_out / 2)
      )
    }) |>
    dplyr::bind_rows(.id = "sample_name") |>
    dplyr::mutate(metric = "sigma") |>
    # Named vector c(new = "old") renames V1/V2 to the isotope names.
    dplyr::rename(
      dplyr::all_of(stats::setNames(c("V1", "V2"), isotope_names))
    ) |>
    dplyr::select(
      dplyr::all_of(
        c("metric", "sample_name", "isotope", "sample_number", isotope_names)
      )
    )

  if (data_format == "wide") {
    return(sigma_wide)
  }

  # Long layout: the row label becomes `id`, the isotope columns are stacked
  # into `isotope` / `post_sample`.
  sigma_long <- sigma_wide |>
    dplyr::rename(id = "isotope") |>
    tidyr::pivot_longer(
      cols = dplyr::all_of(isotope_names),
      names_to = "isotope",
      values_to = "post_sample"
    ) |>
    dplyr::select(
      dplyr::all_of(
        c("metric", "id", "sample_name", "isotope", "sample_number",
          "post_sample")
      )
    ) |>
    dplyr::arrange(id)

  # Returned as a plain value so the result is visible at the console.
  sigma_long
}