playaxr: Create R plots conforming to the Playax standards.

Documented in abbrv_large

#' Abbreviated labels for \href{https://en.wikipedia.org/wiki/Names_of_large_numbers}{large numbers}.
#'
#' `abbrv_large` takes a numeric vector and returns a character vector containing
#'  abbreviated names of the form `[DDD].[S+]C`, where `[DDD].[S+]` is a
#'  variable-length prefix of the original number containing its most significant
#'  digits, and `C` is an abbreviation which summarises its magnitude (one of the
#'  units listed in `RANGES`). In addition, `abbrv_large` may add decimal places
#'  to the abbreviated number to disambiguate it from other numbers close in the
#'  scale.
#'
#'  For example, `1e6` will be typically mapped into `1M`, and `123845` to `123k`.
#'  However, `abbrv_large` may add decimal places if more than one number in the input
#'  maps into the same abbreviated representation. The number of decimal places
#'  kept is chosen so that all of the abbreviated representations within a unit
#'  are distinct (see examples).
#'
#'  Numbers are _truncated_, not rounded, into their large number representation.
#'
#' @param x A numeric vector.
#' @param decimals Either `NULL` (the default), in which case the number of
#'  decimal places for each unit is computed from `x`, or a named list mapping a
#'  unit (e.g. `"k"`) to the number of decimal places to keep for that unit.
#'  Units missing from the list use `0` decimal places.
#'
#' @return A character vector with the same length as `x`. Values whose absolute
#'  value is below the smallest magnitude in `RANGES` are truncated to an integer
#'  and returned without a unit. Values whose absolute value is at or above
#'  `1000` times the largest magnitude in `RANGES` match no range and are
#'  returned as `NA`.
#'
#' @examples
#'
#'  # All abbreviations are unique, do not add decimal places.
#'  abbrv_large(c(123456, 28475777, 125, 1.3, 0.1))
#'  # [1] "123k" "28M"  "125"  "1"    "0"
#'
#'  # Adds one decimal place to the `k` range to disambiguate 123.4k from 123.5k.
#'  abbrv_large(c(123456, 123556, 28475777, 125, 1.3, 0.1, 1))
#'  # [1] "123.4k" "123.5k" "28M"    "125"    "1"      "0"      "1"
#'
#' @export
abbrv_large <- function(x, decimals = NULL) {
  if (is.null(decimals)) {
    decimals <- compute_decimals(x)
  }

  # Start with everything unlabelled; each pass fills in the elements that
  # belong to one magnitude range and leaves the rest untouched.
  x_str <- rep(NA_character_, length(x))
  for (i in seq_len(nrow(RANGES))) {
    unit <- RANGES$unit[i]
    magnitude <- RANGES$magnitude[i]

    # Units without an explicit entry keep no decimal places.
    unit_decimals <- decimals[[unit]]
    round_to <- if (is.null(unit_decimals)) 0 else unit_decimals

    x_str <- coalesce(
      abbrv_range(x, magnitude, unit, decimals = round_to),
      x_str
    )
  }

  # Anything below the smallest magnitude is shown as a plain truncated integer.
  mag_floor <- min(RANGES$magnitude)
  if_else(abs(x) < mag_floor, as.character(trunc(x)), x_str)
}

# Abbreviates the elements of `x` that fall within a single magnitude range.
#
# An element belongs to the range when `magnitude <= abs(x) < magnitude * 1000`.
# Such elements are divided by `magnitude`, passed through `truncate()` with the
# requested number of `decimals`, and suffixed with `unit`. Every other element
# (including those outside the range) yields `NA_character_`, so the result can
# be merged with other ranges via `coalesce()`.
#
# NOTE(review): `truncate()` is not defined in this part of the file; it is
# presumably a package helper that truncates to `decimals` decimal places --
# confirm against its definition.
#
# The `false` branch is `NA_character_` rather than a bare (logical) `NA` so
# that both branches of `if_else()` have the same type.
abbrv_range <- function(x, magnitude, unit, decimals) {
  abs_x <- abs(x)
  in_range <- magnitude <= abs_x & abs_x < magnitude * 1000
  scaled <- truncate(x / magnitude, decimals = decimals)
  if_else(
    in_range,
    sprintf("%s%s", as.character(scaled), unit),
    NA_character_
  )
}

# Computes, for each unit in `RANGES`, how many decimal places are needed so
# that distinct values of `x` within that unit keep distinct abbreviations.
#
# Returns a named list mapping unit -> number of decimal places. Units holding
# fewer than two distinct magnitudes (after taking absolute values and dropping
# `NA`s) get no entry. Gaps between neighbouring values are rounded to whole
# numbers, so values closer than 0.5 apart are treated as indistinguishable
# and do not contribute to the result.
compute_decimals <- function(x) {
  decimals <- list()
  # TODO This makes things easier, but we should actually apply separate
  # truncations for positive and negative numbers.
  abs_x <- abs(x[!is.na(x)])
  # The last range is open-ended here: everything from the largest magnitude up.
  mags <- c(RANGES$magnitude, +Inf)
  units <- RANGES$unit

  for (i in seq_len(nrow(RANGES))) {
    # De-duplicate before the length check: repeated values (or +v / -v pairs)
    # need no disambiguation and would otherwise leave `diff()` empty.
    x_range <- unique(abs_x[mags[i] <= abs_x & abs_x < mags[i + 1]])
    if (length(x_range) <= 1) {
      next
    }

    # Gaps that round to zero would give log10(0) = -Inf and therefore an
    # infinite number of decimals, so they are ignored.
    diffs <- round(diff(sort(x_range)))
    diffs <- diffs[diffs > 0]
    if (length(diffs) == 0) {
      next
    }

    # The smallest gap has order of magnitude 10^k; keeping
    # log10(magnitude) - k decimals resolves differences of that size.
    decimals[[units[i]]] <- max(0, log10(mags[i]) - min(floor(log10(diffs))))
  }

  decimals
}

# Lookup table of the supported magnitude ranges: one row per unit, holding the
# lower bound of the range (`magnitude`) and the suffix used for it (`unit`),
# in increasing order of magnitude.
RANGES <- local({
  lower_bounds <- c(k = 1e3, M = 1e6, B = 1e9, T = 1e12)
  data.frame(
    magnitude = unname(lower_bounds),
    unit = names(lower_bounds),
    stringsAsFactors = FALSE
  )
})