# R/calculateRMSEs.R

#' Root mean squared errors (RMSEs) for the given forecast data
#'
#' This function calculates and returns a list of two data frames,
#' where the first data frame contains RMSEs for the given data, different horizons and methods,
#' and the second one contains the ranks of the methods according to their RMSEs.
#' The function also plots RMSEs for different horizons and methods.
#'
#' @aliases calculateRMSEs
#' @param frame A data frame containing columns "actual", "forecast", "method", and "horizon".
#' @param sort logical. If TRUE, the rows of the RMSE data frame are ordered by
#' average RMSE and the rows of the rank data frame are ordered by average rank.
#' @return A list with two data frames, both with one row per method (in order
#' of first appearance in \code{frame}, unless \code{sort = TRUE}):
#' \describe{
#'   \item{RMSE}{one column per horizon, named \code{"horizon = <value>"}, plus
#'   the row mean in the column \code{" average RMSE"} (the name starts with a
#'   space).}
#'   \item{rank}{the rank of every method within each horizon (1 = smallest
#'   RMSE, ties receive the average rank), plus the row mean in the column
#'   \code{"average rank"}.}
#' }
#' As a side effect the function prints a plot of the RMSEs for different horizons and methods.
#' @author Sai Van Cuong, Maxim Shcherbakov and Andrey Davydenko
#' @seealso \code{\link{calculateAvgRelMAEs}}, \code{\link{calculateGMAPEs}}, \code{\link{calculateGMRAEs}},
#' \code{\link{calculateMAD_MEAN_ratio}}, \code{\link{calculateMAEs}}, \code{\link{calculateMAPEs}},
#' \code{\link{calculateMASEs}}, \code{\link{calculateMdAPEs}}, \code{\link{calculateMPEs}}, \code{\link{calculateMSEs}},
#' \code{\link{calculatePB_MAEs}}, \code{\link{calculateSMAPEs}}, \code{\link{calculateSMdAPEs}}.
#' @references Rob J. Hyndman, Anne B. Koehler (2006) Volume title: "International Journal of Forecasting".
#' Chapter title: \emph{Another look at measures of forecast accuracy}. Chapter pages : (p.679-688).
#' \url{http://eva.fcea.edu.uy/pluginfile.php/109034/mod_resource/content/0/2006_Hyndman_Predicc.pdf}.
#' @keywords dataframe
#' @examples
#' calculateRMSEs(frame = FORAYearForecast)
#' calculateRMSEs(frame = FORAYearForecast, sort = TRUE)
#' data1 <- subset(FORAYearForecast, actual >= 5000| forecast < 8000)
#' data2 <- FORAYearForecast[1:300,]
#' calculateRMSEs(frame = data1, sort = TRUE)
#' calculateRMSEs(frame = data2, sort = TRUE)
#'
#' @export
calculateRMSEs <- function(frame, sort = FALSE) {
  required <- c("actual", "forecast", "method", "horizon")
  absent <- setdiff(required, names(frame))
  if (length(absent) > 0) {
    stop(
      "`frame` is missing required column(s): ",
      paste(absent, collapse = ", "),
      call. = FALSE
    )
  }

  # Distinct methods/horizons in order of first appearance; as.vector() turns
  # factors into plain character vectors.
  methods <- as.vector(unique(frame$method))
  horizons <- as.vector(unique(frame$horizon))
  methods <- methods[!is.na(methods)]
  horizons <- horizons[!is.na(horizons)]
  if (length(methods) == 0 || length(horizons) == 0) {
    stop("`frame` contains no method/horizon combinations.", call. = FALSE)
  }

  # RMSE per (method, horizon) cell. Cells are addressed by position, so the
  # result is correct for any horizon values (not only 1..H) and the column
  # labels always show the horizon the column really belongs to.
  squared_error <- (frame$actual - frame$forecast)^2
  rmse <- matrix(
    NA_real_,
    nrow = length(methods), ncol = length(horizons),
    dimnames = list(as.character(methods), paste0("horizon = ", horizons))
  )
  for (h in seq_along(horizons)) {
    in_horizon <- frame$horizon == horizons[h]
    for (m in seq_along(methods)) {
      # which() drops rows whose method or horizon is NA.
      cell <- which(in_horizon & frame$method == methods[m])
      rmse[m, h] <- sqrt(mean(squared_error[cell], na.rm = TRUE))
    }
  }

  # Rank the methods within every horizon (missing RMSEs keep a missing rank).
  ranks <- rmse
  for (h in seq_along(horizons)) {
    ranks[, h] <- rank(rmse[, h])
  }

  rmse_df <- data.frame(rmse, check.names = FALSE)
  rank_df <- data.frame(ranks, check.names = FALSE)
  # The leading space in " average RMSE" is part of the established output
  # format and is kept for backward compatibility.
  rmse_df[[" average RMSE"]] <- unname(rowMeans(rmse, na.rm = TRUE))
  rank_df[["average rank"]] <- unname(rowMeans(ranks, na.rm = TRUE))

  # Long format for plotting: all horizons of the first method, then all
  # horizons of the second method, and so on.
  plot_data <- data.frame(
    RMSE = as.vector(t(rmse)),
    horizon = rep(horizons, times = length(methods)),
    # A factor guarantees a discrete colour/shape scale and a valid level
    # count regardless of the stringsAsFactors default.
    method = factor(rep(as.character(methods), each = length(horizons)))
  )

  # Plot RMSEs against the horizon, one line per method.
  rmse_plot <- ggplot2::ggplot(
    plot_data,
    ggplot2::aes(
      x = horizon, y = RMSE, group = method, color = method, shape = method
    )
  ) +
    ggplot2::scale_shape_manual(values = seq_len(nlevels(plot_data$method))) +
    ggplot2::labs(title = "RMSE for different horizons and methods") +
    ggplot2::geom_line() +
    ggplot2::geom_point(size = 3) +
    ggplot2::theme(plot.title = ggplot2::element_text(hjust = 0.5))
  print(rmse_plot)

  if (isTRUE(as.logical(sort))) {
    rmse_df <- rmse_df[order(rmse_df[[" average RMSE"]]), , drop = FALSE]
    rank_df <- rank_df[order(rank_df[["average rank"]]), , drop = FALSE]
  }
  list("RMSE" = rmse_df, "rank" = rank_df)
}
# svcuonghvktqs/FORA documentation built on May 20, 2019, 9:57 a.m.