NaiveBayes: Gaussian Naive Bayes model

Documented in naive_bayes predict.naive_bayes

#' Naive Bayes model
#'
#' Fits a Gaussian Naive Bayes model: for every class it computes the mean
#' and standard deviation of each feature, and it also calculates the prior
#' class probabilities as the class proportions in the training data.
#'
#' A class that contains a single observation has an undefined (`NA`)
#' standard deviation, because `sd()` of one value is `NA`.
#'
#' @param X data matrix which stores observations as rows and
#'   features as columns
#'
#' @param y class label of each observation, given either as a one-column
#'   matrix or as a plain vector with one entry per row of `X`. Labels may
#'   be any values that can be compared and sorted (they do not have to be
#'   coded `0, 1, ..., k - 1`).
#'
#' @return An object of class `"naive_bayes"`: a list with the elements
#'   `X` and `y` (the training data as supplied), `summaries` (a
#'   `k x d x 2` array; slice `[, , 1]` holds the per-class feature means and
#'   slice `[, , 2]` the per-class feature standard deviations), `prior`
#'   (the class proportions) and `levels` (the sorted distinct class labels;
#'   row `i` of `summaries` and `prior[i]` belong to `levels[i]`).
#'
#' @import stats
#' @export
#'
#' @examples
#' X <- matrix(c(1, 2, 3, 10, 11, 12, 5, 6, 7, 20, 21, 22), ncol = 2)
#' y <- matrix(c(0, 0, 0, 1, 1, 1), ncol = 1)
#' fit <- naive_bayes(X, y)
#' fit$prior
#' fit$summaries[, , 1]
naive_bayes <- function(X, y) {
  stopifnot(length(dim(X)) == 2L)
  n <- nrow(X)
  d <- ncol(X)

  # Work on a plain label vector so that both a one-column matrix and an
  # ordinary vector are accepted (factors become their character labels).
  y_vec <- as.vector(if (is.null(dim(y))) y else y[, 1])
  stopifnot(length(y_vec) == n)

  class_levels <- sort(unique(y_vec))
  k <- length(class_levels)

  # calculate prior class probabilities
  prior <- vapply(
    seq_len(k),
    function(i) sum(y_vec == class_levels[i]) / n,
    numeric(1)
  )

  # create a 3D array containing the mean and sd of the data
  # split by classes and features
  summaries <- array(1, dim = c(k, d, 2))
  for (i in seq_len(k)) {
    # Select rows by the actual label (not by i - 1) and keep the matrix
    # shape even when the class has one row or X has one column.
    X_k <- X[which(y_vec == class_levels[i]), , drop = FALSE]
    summaries[i, , 1] <- apply(X_k, 2, mean)
    summaries[i, , 2] <- apply(X_k, 2, sd)
  }

  # create an S3 object
  nb <- list(
    X = X,
    y = y,
    summaries = summaries,
    prior = prior,
    levels = class_levels
  )
  class(nb) <- "naive_bayes"
  nb
}

#' Predictions for Naive Bayes
#'
#' Makes predictions based on the fitted naive_bayes model by using a
#' Gaussian assumption that each variable is normally distributed. For each
#' observation the log prior of a class is added to the sum of the Gaussian
#' log densities of its features, and the class with the largest total is
#' predicted.
#'
#' @param object instance of naive_bayes class
#' @param x_new test data matrix with observations as rows and features as
#'   columns; a plain vector is treated as a single observation
#' @param ... not used; accepted for compatibility with the `predict` generic
#'
#' @return one-column matrix of predicted class labels, one row per
#'   observation in `x_new`. Labels are taken from the model's `levels`
#'   element when present, otherwise from the sorted distinct values of the
#'   stored training labels `y`; if neither yields one label per class the
#'   labels `0, 1, ..., k - 1` are used.
#' @import stats
#' @export
#'
#' @examples
#' X <- matrix(c(1, 2, 3, 10, 11, 12, 5, 6, 7, 20, 21, 22), ncol = 2)
#' y <- matrix(c(0, 0, 0, 1, 1, 1), ncol = 1)
#' fit <- naive_bayes(X, y)
#' predict(fit, matrix(c(2, 11, 6, 21), ncol = 2))
predict.naive_bayes <- function(object, x_new, ...) {
  prior <- object$prior
  summaries <- object$summaries
  k <- dim(summaries)[1]

  # a single observation supplied as a plain vector becomes one row
  if (is.null(dim(x_new))) {
    x_new <- matrix(x_new, nrow = 1)
  }
  n <- nrow(x_new)
  d <- ncol(x_new)

  # Resolve the label of each class index. Hard-coding `index - 1` is only
  # right when the training labels happen to be 0, 1, ..., k - 1.
  class_labels <- object[["levels"]]
  if (is.null(class_labels) && !is.null(object$y)) {
    y_train <- object$y
    y_train <- as.vector(if (is.null(dim(y_train))) y_train else y_train[, 1])
    class_labels <- sort(unique(y_train))
  }
  if (length(class_labels) != k) {
    class_labels <- seq_len(k) - 1
  }

  # calculate (unnormalised) log posterior class probabilities for every
  # observation; each feature's log density is added for all rows at once
  result <- matrix(0, nrow = n, ncol = k)
  for (cls in seq_len(k)) {
    log_post <- rep(log(prior[cls]), n)
    for (feat in seq_len(d)) {
      mu <- summaries[cls, feat, 1]
      sigma <- summaries[cls, feat, 2]
      log_post <- log_post + dnorm(x_new[, feat], mu, sigma, log = TRUE)
    }
    result[, cls] <- log_post
  }

  # obtain predictions by taking the largest posterior
  # class probability
  pred <- vapply(
    seq_len(n),
    function(i) which.max(result[i, ]),
    integer(1)
  )
  matrix(class_labels[pred], ncol = 1)
}