stocks: Stock Market Analysis

Documented in plot_metrics

#' Plot One Performance Metric (Sorted Bar Plot) or One vs. Another
#' (Scatterplot) for a Group of Individual Funds
#'
#' Useful for visualizing the performance of individual funds. For 2- and 3-fund
#' portfolios, see \code{plot_metrics_2funds} and \code{plot_metrics_3funds}.
#' To visualize any combination of single funds and 2- and 3-fund portfolios,
#' see \code{link{plot_metrics_123}}.
#'
#'
#' @param metrics "Long" data frame with Fund column and column for each metric
#' you want to plot. Typically the result of a prior call to
#' \code{\link{calc_metrics}}.
#' @param formula Formula specifying what to plot, e.g. \code{cagr ~ mdd} for
#' CAGR vs. MDD, \code{cagr ~ .} for just CAGR, or \code{. ~ mdd} for just MDD.
#' See \code{?calc_metrics} for list of metrics to choose from.
#' @param tickers Character vector of ticker symbols that Yahoo! Finance
#' recognizes, if you want to download data on the fly.
#' @param ... Arguments to pass along with \code{tickers} to
#' \code{\link{load_gains}}.
#' @param gains Data frame with one column of gains for each investment and a
#' date variable named Date.
#' @param prices Data frame with one column of prices for each investment and a
#' date variable named Date.
#' @param benchmark Character string specifying which fund to use as a
#' benchmark for metrics that require one.
#' @param y.benchmark Character string specifying which fund to use as benchmark
#' for y-axis metric.
#' @param x.benchmark Character string specifying which fund to use as benchmark
#' for x-axis metric.
#' @param plotly Logical value for whether to convert the
#' \code{\link[ggplot2]{ggplot}} to a \code{\link[plotly]{plotly}} object
#' internally.
#' @param title Character string.
#' @param base_size Numeric value.
#' @param label_size Numeric value.
#' @param ticklabel_size Numeric value.
#' @param return Character string specifying what to return. Choices are
#' \code{"plot"}, \code{"data"}, and \code{"both"}.
#'
#'
#' @return
#' Depending on \code{return}, a \code{\link[ggplot2]{ggplot}}, a data frame
#' with the source data, or a list containing both.
#'
#'
#' @references
#' Jeffrey A. Ryan and Joshua M. Ulrich (2019). quantmod: Quantitative Financial
#' Modelling Framework. R package version 0.4-15.
#' \url{https://CRAN.R-project.org/package=quantmod}
#'
#'
#' @examples
#' \dontrun{
#' # Plot Sharpe ratio for FANG stocks
#' plot_metrics(formula = sharpe ~ ., tickers = fang)
#'
#' # Create previous plot in step-by-step process with pipes
#' fang %>%
#'   load_gains() %>%
#'   calc_metrics("sharpe") %>%
#'   plot_metrics(. ~ sharpe)
#'
#' # Plot CAGR vs. max drawdown for SPY and BRK-B
#' plot_metrics(formula = cagr ~ mdd, tickers = c("SPY", "BRK-B"))
#'
#' # Create previous plot in step-by-step process with pipes
#' c("SPY", "BRK-B") %>%
#'   load_gains() %>%
#'   calc_metrics("cagr", "mdd") %>%
#'   plot_metrics(cagr ~ mdd)
#' }
#'
#'
#' @export
plot_metrics <- function(metrics = NULL,
                         formula = cagr ~ mdd,
                         tickers = NULL,
                         ...,
                         gains = NULL,
                         prices = NULL,
                         benchmark = "SPY",
                         y.benchmark = benchmark,
                         x.benchmark = benchmark,
                         plotly = FALSE,
                         title = NULL,
                         base_size = 16,
                         label_size = 5,
                         ticklabel_size = 8,
                         return = "plot") {

  # Extract info from formula
  all.metrics <- all.vars(formula, functions = FALSE)

  # If metrics is specified but doesn't include the expected variables, set defaults
  if (! is.null(metrics) & ! all(unlist(metric_label(all.metrics)) %in% names(metrics))) {
    all.metrics <- unlist(label_metric(names(metrics)))
    if (length(all.metrics) == 1) {
      all.metrics <- c(all.metrics, ".")
    } else if (length(all.metrics) >= 2) {
      all.metrics <- all.metrics[1: 2]
    } else {
      stop("The input 'metrics' must have at least one column with a performance metric")
    }
  }
  y.metric <- x.metric <- NULL
  if (all.metrics[1] != ".") y.metric <- all.metrics[1]
  if (all.metrics[2] != ".") x.metric <- all.metrics[2]
  all.metrics <- c(y.metric, x.metric)

  xlabel <- metric_label(x.metric)
  ylabel <- metric_label(y.metric)

  # Set benchmarks to NULL if not needed
  if (! any(c("alpha", "alpha.annualized", "beta", "r.squared", "r", "rho") %in% all.metrics)) {
    benchmark <- y.benchmark <- x.benchmark <- NULL
  }

  # Check that requested metrics are valid
  invalid.requests <- all.metrics[! (all.metrics %in% c(metric.choices, "allocation") | grepl("growth.", all.metrics, fixed = TRUE))]
  if (length(invalid.requests) > 0) {
    stop(paste("The following metrics are not allowed (see ?calc_metrics for choices):",
               paste(invalid.requests, collapse = ", ")))
  }

  # Calculate performance metrics if not pre-specified
  if (is.null(metrics)) {

    # Determine gains if not pre-specified
    if (is.null(gains)) {

      if (! is.null(prices)) {

        date.var <- names(prices) == "Date"
        gains <- cbind(prices[-1, date.var, drop = FALSE],
                       sapply(prices[! date.var], pchanges))

      } else if (! is.null(tickers)) {

        gains <- load_gains(tickers = unique(c(y.benchmark, x.benchmark, tickers)), ...)
        tickers <- setdiff(names(gains), c("Date", y.benchmark, x.benchmark))

      } else {

        stop("You must specify 'metrics', 'gains', 'prices', or 'tickers'")

      }

    }

    # If tickers is NULL, set to all funds in gains, excluding benchmarks
    if (is.null(tickers)) {
      tickers <- setdiff(names(gains), c("Date", y.benchmark, x.benchmark))
    }

    # Figure out conversion factor in case CAGR or annualized alpha is requested
    min.diffdates <- min(diff(unlist(head(gains$Date, 10))))
    units.year <- ifelse(min.diffdates == 1, 252, ifelse(min.diffdates <= 30, 12, 1))

    # Extract benchmark gains
    if (! is.null(y.benchmark)) {
      y.benchmark.gains <- gains[[y.benchmark]]
    } else {
      y.benchmark.gains <- NULL
    }
    if (! is.null(x.benchmark)) {
      x.benchmark.gains <- gains[[x.benchmark]]
    } else {
      x.benchmark.gains <- NULL
    }

    df <- data.frame(Fund = tickers)

    if (! is.null(y.metric)) {
      df[[ylabel]] <- sapply(gains[tickers], function(x) {
        calc_metric(gains = x, metric = y.metric, units.year = units.year, benchmark.gains = y.benchmark.gains)
      })
    }

    if (! is.null(x.metric)) {
      df[[xlabel]] <- sapply(gains[tickers], function(x) {
        calc_metric(gains = x, metric = x.metric, units.year = units.year, benchmark.gains = x.benchmark.gains)
      })
    }

  } else {
    df <- as.data.frame(metrics)
  }

  # Drop benchmarks and funds with missing metrics
  df <- df[! df$Fund %in% c(y.benchmark, x.benchmark) & complete.cases(df[, c(xlabel, ylabel)]), ]

  # Create plot
  if (is.null(x.metric)) {

    # For y.metric only
    df$tooltip <- paste(df$Fund, "<br>",
                        metric_title(y.metric), ": ", formatC(df[[ylabel]], metric_decimals(y.metric), format = "f"), metric_units(y.metric), sep = "")
    p <- ggplot(df, aes(y = .data[[ylabel]],
                        x = reorder(Fund, .data[[ylabel]]),
                        text = tooltip)) +
      geom_col() +
      scale_y_continuous(limits = range(c(0, df[[ylabel]])) * 1.03, expand = c(0, 0)) +
      theme(axis.text = element_text(size = ticklabel_size)) +
      labs(title = ifelse(! is.null(title), title, paste(metric_title(y.metric), "for Various Funds")),
           y = ylabel, x = NULL)

  } else if (is.null(y.metric)) {

    # For x.metric only
    df$tooltip <- paste(df$Fund, "<br>", metric_title(x.metric), ": ",
                        formatC(df[[xlabel]], metric_decimals(x.metric), format = "f"), metric_units(x.metric), sep = "")
    p <- ggplot(df, aes(y = .data[[xlabel]], x = reorder(Fund, .data[[xlabel]]), text = tooltip)) +
      geom_col() +
      theme(axis.text = element_text(size = ticklabel_size)) +
      coord_flip(ylim = range(c(0, df[[xlabel]])) * 1.03, expand = 0) +
      labs(title = ifelse(! is.null(title), title, paste(metric_title(x.metric), "for Various Funds")),
           y = xlabel, x = NULL)

  } else {

    df$tooltip <- paste(
      df$Fund,
      "<br>", metric_title(x.metric), ": ", formatC(df[[xlabel]], metric_decimals(x.metric), format = "f"), metric_units(x.metric),
      "<br>", metric_title(y.metric), ": ", formatC(df[[ylabel]], metric_decimals(y.metric), format = "f"), metric_units(y.metric), sep = ""
    )
    p <- ggplot(df, aes(y = .data[[ylabel]],
                        x = .data[[xlabel]],
                        group = Fund, label = Fund, text = tooltip)) +
      geom_point() +
      geom_label_repel(size = label_size) +
      ylim(range(c(0, df[[ylabel]])) * 1.03) +
      xlim(range(c(0, df[[xlabel]])) * 1.03) +
      theme_gray(base_size = base_size) +
      labs(title = ifelse(! is.null(title), title, paste(metric_title(y.metric), "vs.", metric_title(x.metric))),
           y = ylabel, x = xlabel)

  }

  if (plotly) {
    p <- ggplotly(p, tooltip = "tooltip") %>%
      style(hoverlabel = list(font = list(size = 15)))
  }

  if (return == "plot") return(p)
  if (return == "data") return(df)
  return(list(plot = p, data = df))

}