modRMSE: Model evaluation parameters

Documented in metricsloop

#' metricsloop
#'
#' @importFrom epiR epi.ccc
#'
#' @param d a data frame.
#' @param var a vector of varibales in the data set.
#' @param MT a model type, such as "lm" or "lmer".
#' @param m a model such as "x + y", or "x + y + (1|random)", or "x + y, family = Gamma". Varibales have to be present in the dataset d.
#' @param PF function for calculate the prediction of the model such as "predict.glm", if empty it will use "predict".
#' @param s significant digits
#'  empty:  return all values.
#'  number 1 to 6: will return the desired significant digits.
#'  "std1": will return number as character in a predefined format.
#' @return a data frame with different parameters to evaluate the model
#'
#' @export
metricsloop <- function(d, var, MT, m, PF, s) {

  out <- NULL

  if(missing(PF) | PF == FALSE){
    for(i in var){
      for(j in m){

          o <- d[[i]]
          p <- predict(eval(parse(text = paste0(MT, "(", i , "~", j, ",", deparse(substitute(d)), ")"))))

          data <- data.frame(o, p)
          data$res = data$o - data$p
          data <- subset(data, is.na(data$res)==FALSE)
          o <- data$o
          p <- data$p
          res <- data$res
          meano <- mean(o, na.rm=TRUE)
          meanp <- mean(p, na.rm=TRUE)
          PMeanBias <- t.test(res)$p.value
          PMeanBias <- ifelse(PMeanBias < 0.0001, 0.0001, PMeanBias)
          PSlope <- anova(lm(res~p))[1,5]
          PSlope <- ifelse(PSlope < 0.0001, 0.0001, PSlope)
          res2=res^2;
          rm=sqrt(mean(res2, na.rm=TRUE));
          uss=sum(res2, na.rm=TRUE);
          lo <- ifelse(is.na(o)==FALSE, 1, 0)
          n=sum(lo);
          meano=mean(o, na.rm=TRUE);
          mb=sum(res, na.rm=TRUE)/n;
          sse <- anova(lm(res~p))[2,2];
          msb <- mb^2;
          mspe <- rm^2;
          msre <- sse/n;
          msslope <- mspe-msre-msb;
          mean <- msb/mspe*100;
          slope <- msslope/mspe*100;
          residual <- msre/mspe*100;
          check <- mean+slope+residual
          rsr <- rm/sd(o, na.rm=TRUE)
          ccc <- epi.ccc(o,p)$rho.c[1]
          MAE <- mean(abs(res))    # added by Giulio Giagnoni
          MAEp <- mean(abs(res))/meano*100   # added by Giulio Giagnoni
          rmp = rm/meano*100
          mb <- mean(res, na.rm=TRUE)
          sb <- coef(lm(res~p))[2]

          Values <- c(n, meano, meanp, rm, rmp, mean, slope, residual, mb, sb,
                      msre, PMeanBias, PSlope, rsr, ccc[,1], MAE, MAEp)

          Values <- if(missing(s)){
            Values
          }
          else if (s == 'std1'){
             ifelse(Values >= 0.01, round(Values, digits = 2), ifelse(Values < 0.01 & Values >= 0.001,  round(Values, digits = 3), ifelse(Values < 0.001, "<0.001", as.character(Values))))
          }
          else if (s >= 1 & s <= 6){
            formatC(Values, digits=s, format = "fg", flag = "#")
          }
          else {
            stop(sQuote(s), " not implemented")
          }

          Values <- cbind(as.data.frame(rbind(Values)), i, MT, j)

          out <- rbind(out, Values)
        }
    }
  }


  else{

    for(i in var){
      for(j in m){

            o <- d[[i]]
            p <- eval(parse(text = paste0(PF, "(", MT, "(", i , "~", j, ",", deparse(substitute(d)), ")", ")")))

            data <- data.frame(o, p)
            data$res = data$o - data$p
            data <- subset(data, is.na(data$res)==FALSE)
            o <- data$o
            p <- data$p
            res <- data$res
            meano <- mean(o, na.rm=TRUE)
            meanp <- mean(p, na.rm=TRUE)
            PMeanBias <- t.test(res)$p.value
            PMeanBias <- ifelse(PMeanBias < 0.0001, 0.0001, PMeanBias)
            PSlope <- anova(lm(res~p))[1,5]
            PSlope <- ifelse(PSlope < 0.0001, 0.0001, PSlope)
            res2=res^2;
            rm=sqrt(mean(res2, na.rm=TRUE));
            uss=sum(res2, na.rm=TRUE);
            lo <- ifelse(is.na(o)==FALSE, 1, 0)
            n=sum(lo);
            meano=mean(o, na.rm=TRUE);
            mb=sum(res, na.rm=TRUE)/n;
            sse <- anova(lm(res~p))[2,2];
            msb <- mb^2;
            mspe <- rm^2;
            msre <- sse/n;
            msslope <- mspe-msre-msb;
            mean <- msb/mspe*100;
            slope <- msslope/mspe*100;
            residual <- msre/mspe*100;
            check <- mean+slope+residual
            rsr <- rm/sd(o, na.rm=TRUE)
            ccc <- epi.ccc(o,p)$rho.c[1]
            MAE <- mean(abs(res))    # added by Giulio
            MAEp <- mean(abs(res))/meano*100   # added by Giulio
            rmp = rm/meano*100
            mb <- mean(res, na.rm=TRUE)
            sb <- coef(lm(res~p))[2]

            Values <- c(n, meano, meanp, rm, rmp, mean, slope, residual, mb, sb,
                        msre, PMeanBias, PSlope, rsr, ccc[,1], MAE, MAEp)

            Values <- if(missing(s)){
              Values
            }
            else if (s == 'std1'){
               ifelse(Values >= 0.01, round(Values, digits = 2), ifelse(Values < 0.01 & Values >= 0.001,  round(Values, digits = 3), ifelse(Values < 0.001, "<0.001", as.character(Values))))
            }
            else if (s >= 1 & s <= 6){
              formatC(Values, digits=s, format = "fg", flag = "#")
            }
            else {
              stop(sQuote(s), " not implemented")
            }

            Values <- cbind(as.data.frame(rbind(Values)), i, MT, j, PF)

            out <- rbind(out, Values)
          }
    }
  }


  colnames(out) <- if(missing(PF) | PF == FALSE){
    c("N", "Observed Mean", "Predicted Mean", "RMSE", "RMSE, % mean",
      "Mean Bias, % MSE", "Slope Bias, % MSE", "Dispersion, % MSE",
      "Mean Bias", "Slope Bias", "Dispersion Bias", "P-Mean Bias",
      "P-Slope Bias", "RSR", "CCC", "MAE", "MAE, % mean", "Var", "ModelType", "Model")
  }
  else{
    c("N", "Observed Mean", "Predicted Mean", "RMSE", "RMSE, % mean",
      "Mean Bias, % MSE", "Slope Bias, % MSE", "Dispersion, % MSE",
      "Mean Bias", "Slope Bias", "Dispersion Bias", "P-Mean Bias",
      "P-Slope Bias", "RSR", "CCC", "MAE", "MAE, % mean", "Var", "ModelType", "Model", "Predict")
  }

  return(out)
}