R/get_performance_metrics.R

Defines functions get_performance_metrics get_performance_by_pgs_id get_performance_by_ppm_id get_performance_all get_performance

Documented in get_performance_metrics

# Fetch a single REST resource and return it as tidy tables.
#
# `resource` is forwarded as `resource_url`, together with `limit`, `verbose`,
# `warnings` and `progress_bar`, to `get()`; whatever `get()` returns is then
# handed to `as_tidy_tables_performance_metrics()` and that result is returned.
#
# NOTE(review): `get()` is called here with a `resource_url` argument, so it is
# presumably a package-internal helper rather than base::get() -- confirm.
get_performance <- function(resource,
                            limit = 20L,
                            verbose = FALSE,
                            warnings = TRUE,
                            progress_bar = TRUE) {

  as_tidy_tables_performance_metrics(
    get(
      resource_url = resource,
      limit = limit,
      verbose = verbose,
      warnings = warnings,
      progress_bar = progress_bar
    )
  )
}


# Fetch the '/rest/performance/all' resource.
#
# Thin wrapper: every argument is passed straight through to
# `get_performance()`, whose result is returned unchanged.
get_performance_all <- function(limit = 20L, verbose = FALSE, warnings = TRUE, progress_bar = TRUE) {

  get_performance(
    resource = '/rest/performance/all',
    limit = limit,
    verbose = verbose,
    warnings = warnings,
    progress_bar = progress_bar
  )
}


# Fetch performance metrics for each element of `ppm_id`.
#
# One resource URL of the form '/rest/performance/<ppm_id>' is built per
# element of `ppm_id`, and `get_performance()` is called once per URL. The
# per-URL results are then combined position by position with
# `dplyr::bind_rows()` (via `purrr::pmap()`).
get_performance_by_ppm_id <- function(ppm_id, limit = 20L, verbose = FALSE, warnings = TRUE, progress_bar = TRUE) {

  endpoint <- '/rest/performance'
  urls <- sprintf("%s/%s", endpoint, ppm_id)

  # One result per URL, in the same order as `ppm_id`.
  per_url_tables <- purrr::map(
    .x = urls,
    .f = get_performance,
    limit = limit,
    warnings = warnings,
    verbose = verbose,
    progress_bar = progress_bar
  )

  # Row-bind the i-th table of every result into a single i-th table.
  purrr::pmap(per_url_tables, dplyr::bind_rows)
}

# Fetch performance metrics for each element of `pgs_id`.
#
# One resource URL of the form '/rest/performance/search?pgs_id=<pgs_id>' is
# built per element of `pgs_id`, and `get_performance()` is called once per
# URL. The per-URL results are then combined position by position with
# `dplyr::bind_rows()` (via `purrr::pmap()`).
get_performance_by_pgs_id <- function(pgs_id, limit = 20L, verbose = FALSE, warnings = TRUE, progress_bar = TRUE) {

  endpoint <- '/rest/performance/search'
  urls <- sprintf("%s?pgs_id=%s", endpoint, pgs_id)

  # One result per URL, in the same order as `pgs_id`.
  per_url_tables <- purrr::map(
    .x = urls,
    .f = get_performance,
    limit = limit,
    warnings = warnings,
    verbose = verbose,
    progress_bar = progress_bar
  )

  # Row-bind the i-th table of every result into a single i-th table.
  purrr::pmap(per_url_tables, dplyr::bind_rows)
}

#' Get PGS Catalog Performance Metrics
#'
#' Retrieves performance metrics via the PGS Catalog REST API. The REST
#' API is queried multiple times with the criteria passed as arguments (see
#' below). By default all performance metrics that match the criteria supplied
#' in the arguments are retrieved: this corresponds to the default option
#' \code{set_operation} set to \code{'union'}. If you would rather have only
#' the performance metrics that match simultaneously all criteria provided,
#' then set \code{set_operation} to \code{'intersection'}.
#'
#' Please note that all search criteria are vectorised, thus allowing for batch
#' mode search.
#'
#' @param ppm_id A character vector of PGS Catalog performance metrics accession
#'   identifiers.
#' @param pgs_id A \code{character} vector of PGS Catalog score accession
#'   identifiers.
#' @param set_operation Either \code{'union'} or \code{'intersection'}. This
#'   tells how performance metrics retrieved by different criteria should be
#'   combined: \code{'union'} binds together all results removing duplicates and
#'   \code{'intersection'} only keeps same performance metrics found with
#'   different criteria.
#' @param interactive A \code{logical} (either \code{TRUE} or \code{FALSE}). If
#'   all performance metrics are requested, whether to ask interactively if we
#'   really want to proceed.
#' @param verbose A \code{logical} indicating whether the function should be
#'   verbose about the different queries or not.
#' @param warnings A \code{logical} indicating whether to print warnings, if any.
#' @param progress_bar A \code{logical} (either \code{TRUE} or \code{FALSE})
#'   indicating whether to show a progress bar as the queries are performed.
#'
#' @return A \linkS4class{performance_metrics} object.
#' @examples
#' \dontrun{
#' # Get performance metrics catalogued with identifier 'PPM000001'
#' get_performance_metrics(ppm_id = 'PPM000001')
#'
#' # Get performance metrics associated with polygenic score id 'PGS000001'
#' get_performance_metrics(pgs_id = 'PGS000001')
#'
#' # To retrieve all catalogued performance metrics in PGS Catalog you simply
#' # leave the parameters `ppm_id` and `pgs_id` as `NULL`.
#' get_performance_metrics()
#' }
#'
#' @export
get_performance_metrics <- function(
  ppm_id = NULL,
  pgs_id = NULL,
  set_operation = 'union',
  interactive = TRUE,
  verbose = FALSE,
  warnings = TRUE,
  progress_bar = TRUE) {

  # A valid flag is a single, non-missing logical value.
  is_flag <- function(x) is.logical(x) && length(x) == 1L && !is.na(x)

  # Validate everything up front so that bad input fails with a clear message
  # before any request is made.
  if (!(is.character(set_operation) &&
        length(set_operation) == 1L &&
        set_operation %in% c('union', 'intersection'))) {
    stop("set_operation must be either 'union' or 'intersection'")
  }

  if (!is_flag(verbose)) {
    stop("verbose must be either TRUE or FALSE")
  }

  if (!is_flag(warnings)) {
    stop("warnings must be either TRUE or FALSE")
  }

  if (!is_flag(interactive)) {
    stop("interactive must be either TRUE or FALSE")
  }

  if (!is_flag(progress_bar)) {
    stop("progress_bar must be either TRUE or FALSE")
  }

  # One entry per search criterion that was actually supplied.
  list_of_ppm <- list()

  if (!is.null(ppm_id)) {
    list_of_ppm[['get_performance_by_ppm_id']] <-
      coerce_to_s4_performance_metrics(
        get_performance_by_ppm_id(
          ppm_id = ppm_id,
          verbose = verbose,
          warnings = warnings,
          progress_bar = progress_bar
        )
      )
  }

  if (!is.null(pgs_id)) {
    list_of_ppm[['get_performance_by_pgs_id']] <-
      coerce_to_s4_performance_metrics(
        get_performance_by_pgs_id(
          pgs_id = pgs_id,
          verbose = verbose,
          warnings = warnings,
          progress_bar = progress_bar
        )
      )
  }

  # If no criteria have been passed, i.e. all are NULL, then go fetch all
  # Performance Metrics.
  if (length(list_of_ppm) == 0L) {
    msg1 <- "You are about to download all Performance Metrics from the PGS Catalog.\nThis might take a while."
    msg2 <- 'Returning an empty performance_metrics object!'
    msg3 <- 'OK! Getting all Performance Metrics then. This is going to take a while...'

    # NULL means "ask the user"; 'y' answers the question on their behalf.
    default_answer <- if (interactive) NULL else 'y'

    proceed <- sure(
      before_question = msg1,
      after_saying_no = msg2,
      after_saying_yes = msg3,
      default_answer = default_answer
    )

    if (proceed) {
      return(
        coerce_to_s4_performance_metrics(
          get_performance_all(
            verbose = verbose,
            warnings = warnings,
            progress_bar = progress_bar
          )
        )
      )
    } else {
      return(coerce_to_s4_performance_metrics(NULL))
    }
  }

  # `set_operation` was validated above, so exactly one branch matches.
  combine <- switch(
    set_operation,
    union = union,
    intersection = intersect
  )

  purrr::reduce(list_of_ppm, combine)
}

Try the quincunx package in your browser

Any scripts or data that you put into this service are public.

quincunx documentation built on July 9, 2023, 7:32 p.m.