R/pred_intervals_new_initials_GS.R
In bartBMA: Bayesian Additive Regression Trees using Bayesian Model Averaging

Documented in pred_intervals_new_initials_GS

#' @title Prediction intervals for bart-bma output
#' 
#' @description This function produces prediction intervals for BART-BMA estimates by post-hoc Gibbs-sampling from the full conditionals of the terminal node parameters and the variance of the error term. See Hernandez et al. (2018) Appendix D for details.
#' @param object bartBMA object obtained from function bartBMA
#' @param num_iter Total number of iterations of the Gibbs sampler (including burn-in).
#' @param burnin Number of burn-on iterations of the Gibbs sampler.
#' @param l_quant Lower quartile of the prediction interval.
#' @param u_quant Upper quartile of the prediction interval.
#' @param newdata Test data for which predictions are to be produced. Default = NULL. If NULL, then produces prediction intervals for training data if no test data was used in producing the bartBMA object, or produces prediction intervals for the original test data if test data was used in producing the bartBMA object.
#' @param update_resids Option for whether to update the partial residuals in the gibbs sampler. If equal to 1, updates partial residuals, if equal to zero, does not update partial residuals. The defaullt setting is to update the partial residuals.
#' @param trainingdata The matrix of training data.
#' @export 
#' @return The output is a list of length 2:
#' \item{PI}{A 3 by n matrix, where n is the number of observations. The first row gives the l_quant*100 quantiles. The second row gives the medians. The third row gives the u_quant*100 quantiles.} 
#' \item{meanpreds}{An n by 1 matrix containing the estimated means.} 
#' @examples 
#' 
#' #load the package
#' library(bartBMA)
#' #set the seed
#' set.seed(100)
#' #simulate some data
#' N <- 100
#' p<- 100
#' epsilon <- rnorm(N)
#' xcov <- matrix(runif(N*p), nrow=N)
#' y <- sin(pi*xcov[,1]*xcov[,2]) + 20*(xcov[,3]-0.5)^2+10*xcov[,4]+5*xcov[,5]+epsilon
#' epsilontest <- rnorm(N)
#' xcovtest <- matrix(runif(N*p), nrow=N)
#' ytest <- sin(pi*xcovtest[,1]*xcovtest[,2]) + 20*(xcovtest[,3]-0.5)^2+10*xcovtest[,4]+
#'   5*xcovtest[,5]+epsilontest
#' 
#' #Train the object 
#' bart_bma_example <- bartBMA(x.train = xcov,y.train=y,x.test=xcovtest,zero_split = 1, 
#'                             only_max_num_trees = 1,split_rule_node = 0)
#' #Obtain the prediction intervals
#' pred_intervals_new_initials_GS(bart_bma_example,1000,100,0.025,0.975,
#' newdata=NULL,update_resids=1,xcov)

pred_intervals_new_initials_GS<-function(object,num_iter,burnin,l_quant,u_quant,newdata=NULL,update_resids=1,trainingdata){
  if(l_quant>0.5 ||u_quant<0 ||u_quant>1){stop("Lower quantile must be lower than 0.5 and greater than 0")}
  if(u_quant<0.5 ||u_quant<0 ||u_quant>1){stop("Upper quantile must be greater than 0.5 and less than 1")}
  
  
  scaled_train_y <- scale_response(min(object$response),max(object$response),-0.5,0.5,object$response)
  
  # diff_inital_resids <- list()
  # resid_length <- length(object$sum_residuals[[1]][[1]])
  # #initial_partial_resids <- rep(0.8*mean(scaled_train_y),resid_length )
  # 
  # 
  # for(i in 1:length(object$sum_residuals)){
  #   diff_inital_resids[[i]] <- rep(list(scaled_train_y- ((length(object$sum_residuals[[i]])-1 )/ length(object$sum_residuals[[i]]))*mean(scaled_train_y)), 
  #                                  length(object$sum_residuals[[i]])) 
  # }
  # 
  get_resids <- get_initial_resids(trainingdata,object$sumoftrees,scaled_train_y)
  diff_inital_resids<- get_resids[[1]]
  new_pred_list1 <- get_resids[[2]]
  
  
  #object will be bartBMA object.
  if(update_resids==0){
    if(is.null(newdata) && length(object)==16){
      #if test data specified separately
      gs_chains<-gibbs_sampler_no_update_new_inits(object$sumoftrees,object$obs_to_termNodesMatrix,object$response,object$bic,num_iter, burnin,object$nrowTrain,
                                                   nrow(object$test_data),object$a,object$sigma,0,object$nu,object$lambda,
                                                   diff_inital_resids,
                                                   object$test_data,
                                                   new_pred_list1)
    }else if(is.null(newdata) && length(object)==14){
      #else return Pred Ints for training data
      gs_chains<-gibbs_sampler_no_update2_new_inits(object$sumoftrees,object$obs_to_termNodesMatrix,object$response,object$bic,num_iter, burnin,object$nrowTrain,
                                                    object$a,object$sigma,0,object$nu,object$lambda,
                                                    diff_inital_resids,
                                                    new_pred_list1)
      
    }else{
      #if test data included in call to object
      gs_chains<-gibbs_sampler_no_update_new_inits(object$sumoftrees,object$obs_to_termNodesMatrix,object$response,object$bic,num_iter, burnin,object$nrowTrain,
                                                   nrow(newdata), object$a,object$sigma,0,object$nu,object$lambda,
                                                   diff_inital_resids,
                                                   newdata,
                                                   new_pred_list1)
    }
  }else{
    if(is.null(newdata) && length(object)==16){
      #if test data specified separately
      gs_chains<-gibbs_sampler_new_inits(object$sumoftrees,object$obs_to_termNodesMatrix,object$response,object$bic,num_iter, burnin,object$nrowTrain,
                                         nrow(object$test_data),object$a,object$sigma,0,object$nu,object$lambda,
                                         diff_inital_resids,
                                         object$test_data,
                                         new_pred_list1)
    }else if(is.null(newdata) && length(object)==14){
      #else return Pred Ints for training data
      gs_chains<-gibbs_sampler2_new_inits(object$sumoftrees,object$obs_to_termNodesMatrix,object$response,object$bic,num_iter, burnin,object$nrowTrain,
                                          object$a,object$sigma,0,object$nu,object$lambda,
                                          diff_inital_resids,
                                          new_pred_list1)
      
    }else{
      #if test data included in call to object
      gs_chains<-gibbs_sampler_new_inits(object$sumoftrees,object$obs_to_termNodesMatrix,object$response,object$bic,num_iter, burnin,object$nrowTrain,
                                         nrow(newdata), object$a,object$sigma,0,object$nu,object$lambda,
                                         diff_inital_resids,
                                         newdata,
                                         new_pred_list1)
    }
  }
  #  y_posterior_sum_trees<-gs_chains[[4]]
  #  y_orig_post_sum_trees<-gs_chains[[5]]
  #  sigma_chains<-gs_chains[[3]]
  if(is.null(newdata) && length(object)==16){
    #y_posterior_sum_trees<-gs_chains[[1]] #[[8]]
    y_orig_post_sum_trees<-gs_chains[[2]] #[[9]]
    sigma_chains<-gs_chains[[1]] # [[3]]
  }else if(is.null(newdata) && length(object)==14){
    #y_posterior_sum_trees<-gs_chains[[4]] 
    y_orig_post_sum_trees<-gs_chains[[2]]
    sigma_chains<-gs_chains[[1]]
    
  }else{
    #y_posterior_sum_trees<-gs_chains[[1]] #[[8]]
    y_orig_post_sum_trees<-gs_chains[[2]] #[[9]]
    sigma_chains<-gs_chains[[1]]
  } 
  
  sum_of_tree_BIC<- -0.5*object$bic
  weights<-exp(sum_of_tree_BIC-(max(sum_of_tree_BIC)+log(sum(exp(sum_of_tree_BIC-max(sum_of_tree_BIC))))))
  #final_length<-num_iter-burnin
  num_its_to_sample<-round(weights*(num_iter-burnin))
  #final_sigma_chain<-numeric(0)
  
  #final_y_chain<-matrix(nrow=0,ncol=ncol(y_posterior_sum_trees[[1]]))
  final_yorig_chain<-matrix(nrow=0,ncol=ncol(y_orig_post_sum_trees[[1]]))
  
  for(i in 1:length(sigma_chains)){
    sample_its<-sample(burnin:num_iter,num_its_to_sample[i])
    #final_sigma_chain<-c(final_sigma_chain,sigma_chains[[i]][sample_its])
    #now do the same for predicted response updates
    #post_y_i<-y_posterior_sum_trees[[i]]
    post_yorig_i<-y_orig_post_sum_trees[[i]]
    #final_y_chain<-rbind(final_y_chain,post_y_i[sample_its,])
    final_yorig_chain<-rbind(final_yorig_chain,post_yorig_i[sample_its,])
    
  }
  PI<-apply(final_yorig_chain,2,function(x)quantile(x,probs=c(l_quant,0.5,u_quant)))
  meanpreds<-apply(final_yorig_chain,2,mean)
  
  
  ret<-list()
  length(ret)<-2
  ret[[1]]<-PI
  ret[[2]] <- meanpreds
  
  class(ret)<-"pred_intervals.bartBMA"  
  ret
}