CAMP_RST: CAMP RST R Routines

Documented in plotbsSpline

#' @export
#' 
#' @title plotbsSpline
#'   
#' @description Plot the results of fitting a temporal b-spline.
#'   
#' @param X The basis b-spline matrix resulting from a call to function 
#'   \code{bs}.
#'   
#' @param fit The generalized linear model resulting from a call to function 
#'   \code{glm}.
#'   
#' @param beg.x The POSIX-formatted start date to use for plotting.
#'   
#' @param end.x The POSIX-formatted end date to use for plotting.
#'   
#' @param eff0 The default data frame containing efficiency trials for a
#'   particular \code{TrapPositionID}.  Typically \code{tmp.df}.
#'   
#' @param option The plotting option.  Value \code{option=1} incorporates logic 
#'   surrounding spline knots, while \code{option=2} does not.
#'   
#' @param bd2 The \code{batchDate2} column, typically from data frame \code{df},
#'   containing the \code{batchDate}s mapped to the 1959-1960 spline paradigm.
#'   
#' @param ... Additional plotting control.  Currently accepted but not 
#'   forwarded to any plotting call.
#'   
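#' @return A plot of the fitted cubic spline, its originating data points, and 
#'   the knots utilized to achieve the fit.  When \code{option=2}, a list with
#'   elements \code{X}, \code{pred}, and \code{DF} is also returned.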
#'   
#' @details Function \code{plotbsSpline} simply organizes all the pieces 
#'   necessary to graph the prediction cubic piecewise polynomial resulting from
#'   the use of a b-spline.  It plots not only the (necessarily) smooth spline, 
#'   but also the original points used to estimate it.  It also plots all knots,
#'   i.e., both boundary and interior.  It calculates the prediction via matrix 
#'   multiplication of the provided matrix basis \eqn{X} and the vector of 
#'   parameter \eqn{\beta} coefficients from object \code{fit}.
#'   
#'   This function is customized for use with the CAMP project, and will not 
#'   work for splines derived from data originating elsewhere without 
#'   modification.
#'   
#' @seealso \code{F.efficiency.model.enh}
#'   
#' @author WEST Inc.
#'   
#' @examples
#' \dontrun{
#' #   ---- Plot results from an efficiency model.  Arguments option and bd2
#' #   ---- have no defaults, so both must be supplied; bd2 needs one entry
#' #   ---- per row of X.
#' plotbsSpline(X,fit,beg.x,end.x,tmp.df,option=2,bd2=df$batchDate2)
#' }
plotbsSpline <- function(X,fit,beg.x,end.x,eff0,option,bd2,...){
  
  #   ---- Plot a fitted temporal b-spline together with the efficiency trials 
  #   ---- in eff0.  With option == 1, the curve is drawn over every row of X 
  #   ---- and the boundary / interior knots are marked; nothing is returned.  
  #   ---- With option == 2, the curve is drawn only on the batchDate2 values 
  #   ---- found in eff0, and a list(X, pred, DF) is returned.  Any other value 
  #   ---- of option draws nothing and returns NULL invisibly.
  #   ---- NOTE:  '...' is accepted but not forwarded to any plotting call.
  
  #   ---- For CAMP work, we assume there is no intercept.  Check for this.
  #   ---- A missing attribute is reported explicitly, rather than failing 
  #   ---- inside if() with "argument is of length zero".
  int <- attr(X,"intercept")
  if(is.null(int)){
    stop(paste0("ERROR:  Object ",deparse(substitute(X))," has no 'intercept' attribute; a bs object is expected.\n"))
  }
  if(int != FALSE){
    stop(paste0("ERROR:  This function assumes no intercept in bs object ",deparse(substitute(X)),".\n"))
  }
  Boundary.knots <- attr(X,"Boundary.knots")
  knots <- attr(X,"knots")
  
  #   ---- Preserve the bs object before manipulation; predict() needs it.  
  bspl <- X
  
  #   ---- Identify if the bspl object is really just a vector of 1s.  Require 
  #   ---- a single column, so a multi-column basis that happens to contain 
  #   ---- nrow(X) entries equal to 1 is not mistaken for an intercept.
  intOnly <- ncol(X) == 1L && isTRUE(all(X == 1))
  
  #   ---- Id the beta vector.  
  b <- coef(fit)
  
  #   ---- Covariates beyond time are present when there are more coefficients 
  #   ---- than one intercept plus the spline columns.  
  hasCovars <- length(b) > (ncol(bspl) + 1)
  
  #   ---- Inverse logit; maps the linear predictor to an efficiency.  
  invLogit <- function(eta) 1/(1 + exp(-1*eta))
  
  #   ---- Draw the fitted curve.  NA values are dropped when setting the upper 
  #   ---- y-limit, since a single NA would otherwise make ylim non-finite.
  drawCurve <- function(DF){
    yM <- max(eff0$efficiency,DF$p,na.rm=TRUE)
    title <- paste0("Enhanced Efficiency Cubic Spline Trap ",fit$data$TrapPositionID[1])
    plot(DF$batchDate2,DF$p,xlim=as.numeric(c(beg.x,end.x)),ylim=c(0,yM),xlab="Time",ylab="Efficiency",type="l",col="black",main=title)
  }
  
  #   ---- Overlay the observed efficiency trials, with point size scaled by  
  #   ---- nReleased relative to its mean.  NOTE(review):  cex comes from 
  #   ---- fit$data while the coordinates come from eff0; this presumably 
  #   ---- assumes the two are row-aligned -- confirm against the caller.
  drawTrials <- function(){
    points(eff0$batchDate2,eff0$efficiency,pch=19,col="red",cex=(fit$data$nReleased)/mean((fit$data$nReleased))  )
  }
  
  #   ---- In CAMP work, and in general, the X (bspl) matrix may not be sorted 
  #   ---- by row, because several years of data are collapsed onto one 
  #   ---- reference year.  The same x-value can therefore appear in two or 
  #   ---- more rows.  This does not affect estimation, but for plotting the 
  #   ---- rows must be sorted and de-duplicated via batchDate2.
  
  if(option == 1){
    
    #   ---- See if we have covariates other than time we need to do something with.
    if( hasCovars ){
      
      #   ---- Take covariate columns in coefficient order, so each mean lines 
      #   ---- up with its own beta regardless of column order in fit$data.
      covarNames <- names(b)[names(b) %in% colnames(fit$data)]
      if( length(covarNames) != (length(b) - ncol(bspl) - 1) ){
        stop("ERROR:  Could not match every non-spline coefficient of fit to a column of fit$data.\n")
      }
      dat <- fit$data[,covarNames,drop=FALSE]
      
      #   ---- Hold each covariate at its mean.  Non-numeric columns give NA 
      #   ---- (warning suppressed), as apply() coerces dat to a matrix first.
      covarMeans <- suppressWarnings(apply(dat,2,function(x) mean(as.numeric(x))))
      X <- cbind(rep(1,nrow(X)),X,matrix(covarMeans,ncol=length(covarMeans),nrow=nrow(X),byrow=TRUE))
      colnames(X) <- names(b)
      
    } else if(!intOnly){
      
      #   ---- Tack on the intercept column, if necessary.
      X <- cbind(rep(1,nrow(X)),X)
    }
    
    #   ---- Linear predictor and fitted efficiency on every row of X.  
    y <- X %*% b
    p <- invLogit(y)
    DF <- data.frame(X,y=y,p=p)
    
    #   ---- Get the y-coordinates for the boundary and interior knots.
    if( intOnly ){
      yboundary <- DF$p[1:2]
      yknots <- numeric(0)
    } else {
      
      #   ---- Evaluate the fitted curve at arbitrary x-values.  Covariate 
      #   ---- means are appended only when the model has covariates.  
      fitAt <- function(at){
        D <- cbind(rep(1,length(at)),predict(bspl,at))
        if( hasCovars ){
          D <- cbind(D,matrix(covarMeans,ncol=length(covarMeans),nrow=length(at),byrow=TRUE))
        }
        invLogit(D %*% b)
      }
      yboundary <- fitAt(Boundary.knots)
      yknots <- if(length(knots) > 0) fitAt(knots) else numeric(0)
    }
    
    #   ---- Sort DF, and keep one row per batchDate2.
    DF$batchDate2 <- bd2
    DF <- DF[order(DF$batchDate2),]
    DF <- DF[!duplicated(DF$batchDate2),]
    
    #   ---- Plot.  points() adds to the existing plot, so par(new=TRUE) is not 
    #   ---- set; setting it would leak into the caller's next plot() call.
    drawCurve(DF)
    points(Boundary.knots,yboundary,pch=19,col="blue")
    drawTrials()
    if(length(knots) > 0){
      points(knots,yknots,pch=19,col="blue")
    }
    
  } else if(option == 2){
    
    #   ---- Build a design matrix for the days on which we have observations.  
    #   ---- Spline columns are renamed to match the names in coef(fit), and 
    #   ---- all.y=TRUE keeps every row of eff0, matched in X or not.
    colnames(X) <- paste0("tmp.bs",colnames(X))
    X <- data.frame("(Intercept)"=rep(1,nrow(X)),X,"batchDate2"=bd2,check.names=FALSE)
    X <- merge(X,eff0,by=c("batchDate2"),all.y=TRUE)
    X <- X[,c("batchDate2",names(coef(fit)))]
    
    D <- X
    D$batchDate2 <- NULL
    D <- as.matrix(D)
    
    #   ---- Build estimates.  Rows of eff0 with no match in X give NA.  
    y <- D %*% b
    p <- invLogit(y)
    DF <- data.frame(X,y=y,p=p)
    
    #   ---- Keep one row per batchDate2, then sort.
    DF <- DF[!duplicated(DF$batchDate2),]
    DF <- DF[order(DF$batchDate2),]
    
    #   ---- Plot.  Knots are not drawn under this option.  
    drawCurve(DF)
    drawTrials()
    return(list(X=X,pred=p,DF=DF))
    
  }
  
  invisible(NULL)
}