R/predict.cv.splitSelect.R
In splitSelect: Best Split Selection Modeling for Low-Dimensional Data

Documented in predict.cv.splitSelect

#' 
#' @importFrom stats predict
#' 
#' @title Predictions for cv.splitSelect object
#'
#' @description \code{predict.cv.splitSelect} returns the prediction for cv.splitSelect for new data.
#' 
#' @param object An object of class cv.splitSelect.
#' @param newx A matrix with the new data.
#' @param optimal.only A boolean variable (TRUE default) to indicate if only the predictions of the optimal split are returned.
#' @param ... Additional arguments for compatibility.
#' 
#' @return A matrix with the predictions of the \code{cv.splitSelect} object.
#' 
#' @export
#' 
#' @author Anthony-Alexander Christidis, \email{anthony.christidis@stat.ubc.ca}
#' 
#' @examples
#' # Setting the parameters
#' p <- 4
#' n <- 30
#' n.test <- 5000
#' beta <- rep(5,4)
#' rho <- 0.1
#' r <- 0.9
#' SNR <- 3
#' # Creating the target matrix with "kernel" set to rho
#' target_cor <- function(r, p){
#'   Gamma <- diag(p)
#'   for(i in 1:(p-1)){
#'     for(j in (i+1):p){
#'       Gamma[i,j] <- Gamma[j,i] <- r^(abs(i-j))
#'     }
#'   }
#'   return(Gamma)
#' }
#' # AR Correlation Structure
#' Sigma.r <- target_cor(r, p)
#' Sigma.rho <- target_cor(rho, p)
#' sigma.epsilon <- as.numeric(sqrt((t(beta) %*% Sigma.rho %*% beta)/SNR))
#' # Simulate some data
#' x.train <- mvnfast::rmvn(30, mu=rep(0,p), sigma=Sigma.r)
#' y.train <- 1 + x.train %*% beta + rnorm(n=n, mean=0, sd=sigma.epsilon)
#' x.test <- mvnfast::rmvn(n.test, mu=rep(0,p), sigma=Sigma.rho)
#' y.test <- 1 + x.test %*% beta + rnorm(n.test, sd=sigma.epsilon)
#' 
#' # Generating the coefficients for a fixed split
#' \donttest{
#' split.out <- cv.splitSelect(x.train, y.train, G=2, use.all=TRUE,
#'                             fix.partition=list(matrix(c(2,2), 
#'                                                ncol=2, byrow=TRUE)), 
#'                             fix.split=NULL,
#'                             intercept=TRUE, group.model="glmnet", alphas=0)
#' predict(split.out, newx=x.test)
#' }
#' 
#' @seealso \code{\link{cv.splitSelect}}
#' 
predict.cv.splitSelect <- function(object, newx, optimal.only=TRUE, ...){
  
  # Check input data
  if(!any(class(object) %in% "cv.splitSelect"))
    stop("The object should be of class \"cv.splitSelect\"")
  if(is.matrix(newx)){
    if(ncol(newx)!=ncol(object$splits))
      stop("The dimension of newx is invalid.")
  } else if(length(newx)!=ncol(object$splits))
    stop("The number of variables for newx is invalid.")
  
  # Removing the intercepts
  if(!is.null(object$intercepts))
    object$betas <- object$betas[-1,]
  
  if(optimal.only){
    
    if(object$family=="gaussian"){
      # Variable to store the predictions
      predictions <- numeric(nrow(newx))
      
      # Computing the predictions
      for(newx.id in 1:nrow(newx)){
        predictions[newx.id] <- newx[newx.id,] %*% object$betas[,object$optimal.split, drop=FALSE]
      }
      
      # Adding the intercepts
      if(!is.null(object$intercepts))
        predictions <- predictions + object$intercepts[object$optimal.split]
      
      # Returning the coefficients
      return(predictions)
      
    } else if(object$family=="binomial"){
      
      # Variable to store the predictions
      predictions <- numeric(nrow(newx))
      
      # Computing the predictions
      for(newx.id in 1:nrow(newx)){
        predictions[newx.id] <- exp(newx[newx.id,] %*% object$betas[,object$optimal.split, drop=FALSE])/
          (1+exp(newx[newx.id,] %*% object$betas[,object$optimal.split, drop=FALSE]))
      }
      
      # Getting the binary prediction
      predictions <- round(predictions, 0)
      
      # Returning the coefficients
      return(predictions)
    }
    
  } else{
    
    if(object$family=="gaussian"){
      
      # Matrix to store the predictions
      predictions <- matrix(nrow=nrow(newx), ncol=nrow(object$splits))
      
      # Computing the predictions
      for(newx.id in 1:nrow(newx)){
        for(split.id in 1:nrow(object$splits)){
          predictions[newx.id, split.id] <- newx[newx.id,] %*% object$betas[, split.id, drop=FALSE]
        }
      }
      
      # Adding the intercepts
      if(!is.null(object$intercepts))
        for(split.id in 1:nrow(object$splits))
          predictions[,split.id] <- predictions[,split.id] + object$intercepts[split.id]
        
        # Returning the coefficients
        return(predictions)
      
    } else if(object$family=="binomial"){
      
      # Matrix to store the predictions
      predictions <- matrix(nrow=nrow(newx), ncol=nrow(object$splits))
      
      # Computing the predictions
      for(newx.id in 1:nrow(newx)){
        for(split.id in 1:nrow(object$splits)){
          predictions[newx.id, split.id] <- exp(newx[newx.id,] %*% object$betas[, split.id, drop=FALSE])/
            (1+exp(newx[newx.id,] %*% object$betas[, split.id, drop=FALSE]))
        }
      }
      
      # Getting the binary prediction
      predictions <- round(predictions, 0)
      
      # Returning the coefficients
      return(predictions)
    }
  }
}