# R/convdiag_bmrm.R

#' Convergence Diagnostics on MCMC samples in \code{bmrm}
#' @description Compute convergence diagnostics of
#'  Geweke (1992), Heidelberger and Welch (1983), and Raftery and Lewis (1992).
#' @usage convdiag_bmrm(x, var = "P", convdiag = "geweke", print = TRUE, ...)
#' @param x an object of class \code{bmrm}, the output of the \code{bmrm} function
#' @param var name of the variable to which the convergence diagnostics apply. It should be one of "A" (source contribution matrix),
#' "P" (source composition or profile matrix), or "Sigma" (error variance).
#' @param convdiag vector of convergence diagnostic methods. It should be a subset
#'  of c("geweke", "heidel", "raftery") (default = "geweke").
#' @param print TRUE/FALSE, whether to print the convergence diagnostics results (default = TRUE)
#' @param ... arguments to be passed to methods
#'
#' @return A list of convergence diagnostics results
#' \describe{
#'   \item{convdiag}{selected convergence diagnostic methods}
#'   \item{geweke}{Geweke's z-scores and p-values if \code{convdiag}
#'  includes "geweke"; NULL if \code{convdiag} does not include "geweke"}
#'   \item{heidel}{Heidelberger and Welch's stationarity test results
#' and p-values if \code{convdiag} includes "heidel"; NULL if
#' \code{convdiag} does not include "heidel"}
#'   \item{raftery}{Raftery and Lewis's estimates of burn-in (M), required number
#' of iterations (N), and minimum sample size (Nmin) if \code{convdiag} includes
#' "raftery"; NULL if \code{convdiag} does not include "raftery"}
#' }
#'
#' @details
#'  Geweke's convergence diagnostic for Markov chains is based on
#'  a test for equality of the means of the first and last part of a Markov chain
#'  (by default the first 10\% and the last 50\%).
#'  If the samples are drawn from the stationary distribution of the chain,
#'  the two means should be equal and Geweke's statistic has an asymptotically
#'  standard normal distribution. We use the function \code{geweke.diag} in the \bold{coda}
#'   package (with default options), which provides the test statistics
#'   (standard z-scores), from which two-sided p-values are computed.
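#'
#'  A minimal sketch of this computation (here \code{mcmcSamples} stands for any
#'  numeric matrix of posterior draws, one column per monitored parameter):
#'  \preformatted{
#'  gd <- coda::geweke.diag(mcmcSamples, frac1 = 0.1, frac2 = 0.5)
#'  2 * stats::pnorm(-abs(gd$z))   # two-sided p-values from the z-scores
#'  }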
#'
#'  Heidelberger and Welch's convergence diagnostic tests the
#'  null hypothesis that the sampled values come from a stationary distribution.
#'   The test is successively applied, firstly to the whole chain, then after
#'    discarding the first 10\%, 20\%, ... of the chain until either
#'    the null hypothesis is accepted, or 50\% of the chain has been discarded.
#'    We use the function \code{heidel.diag} (with default options),
#'    which provides the stationarity test results and p-values.
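#'
#'    A minimal sketch of this computation (again with \code{mcmcSamples} standing
#'    for a matrix of posterior draws):
#'    \preformatted{
#'    hd <- coda::heidel.diag(mcmcSamples, eps = 0.1, pvalue = 0.05)
#'    hd[, 1]   # stationarity test result (1 = passed, 0 = failed)
#'    hd[, 3]   # p-value of the stationarity test
#'    }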
#'
#'  Raftery and Lewis's diagnostic estimates the burn-in (M), the required number
#'  of iterations (N), and the minimum sample size (Nmin) needed to estimate a
#'  posterior quantile \eqn{q} of the parameters of interest to a specified accuracy.
#'  The conditions are specified by the posterior quantile \eqn{q}, an acceptable
#'  tolerance (accuracy) \eqn{r} for \eqn{q}, and a probability \eqn{s} of being
#'  within the interval \eqn{(q-r, q+r)}.
#'  We use the function \code{raftery.diag} in the \bold{coda} package (with default options).
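#'
#'  A minimal sketch of this computation and of the columns of the result:
#'  \preformatted{
#'  rd <- coda::raftery.diag(mcmcSamples, q = 0.025, r = 0.005, s = 0.95)
#'  rd$resmatrix   # columns: M (burn-in), N (required iterations),
#'                 #          Nmin (minimum sample size), I (dependence factor)
#'  }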
#'
#' @references Geweke, J. (1992) Evaluating the accuracy of sampling-based
#' approaches to calculating posterior moments. In Bayesian Statistics 4
#' (eds J. M. Bernardo, J. O. Berger, A. P. Dawid and A. F. M. Smith). Clarendon Press, Oxford, UK.
#' @references Heidelberger, P. and Welch, P.D. (1981) A spectral method for
#' confidence interval generation and run length control in simulations.
#' Comm. ACM, 24, 233-245.
#' @references Heidelberger, P. and Welch, P.D. (1983) Simulation run length
#' control in the presence of an initial transient.
#' Opns Res., 31, 1109-1144.
#' @references Plummer, M., Best, N., Cowles, K. and Vines K. (2006) CODA:
#' Convergence Diagnosis and Output Analysis for MCMC, R News, Vol 6, pp. 7-11.
#' @references Raftery, A.E. and Lewis, S.M. (1992). One long run with diagnostics:
#' Implementation strategies for Markov chain Monte Carlo. Statistical Science, 7, 493-497.
#' @references Raftery, A.E. and Lewis, S.M. (1995). The number of iterations,
#'  convergence diagnostics and generic Metropolis algorithms. In Practical Markov Chain Monte
#'  Carlo (W.R. Gilks, D.J. Spiegelhalter and S. Richardson, eds.). London, U.K.: Chapman and Hall.
#' @export
#' @examples
#' \dontrun{
#' data(Elpaso)
#' Y=Elpaso$Y ; muP=Elpaso$muP
#' q=nrow(muP)
#' out.Elpaso <- bmrm(Y,q,muP, nAdapt=1000,nBurnIn=5000,nIter=5000,nThin=1)
#' conv1<-convdiag_bmrm(out.Elpaso,var="P",convdiag="raftery" )
#' conv2<-convdiag_bmrm(out.Elpaso,var="A", convdiag="geweke")
#' conv3<-convdiag_bmrm(out.Elpaso,var="Sigma", convdiag=c("geweke","heidel"))
#' conv4<-convdiag_bmrm(out.Elpaso,var="Sigma", convdiag=c("geweke","heidel", "raftery"))
#' }


convdiag_bmrm <- function(x, var = "P", convdiag = "geweke", print = TRUE, ...){

  if (!inherits(x, "bmrm")) { stop("'x' must be an object of class 'bmrm'", call. = FALSE) }
  T<-x$nobs
  q<-x$nsource
  J<-x$nvar
  var.codaSamples=list()
  geweke_table = heidel_table = raftery_table=NULL
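  # Assumed column layout of each chain in x$codaSamples (as used in the slicing
  # below): A occupies columns 1..(T*q), P the next q*J columns, Sigma the last J.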
  if (var == "P"){
        for (ic in 1:length(x$codaSamples)) {
           var.codaSamples[[ic]]=x$codaSamples[[ic]][,(T*q+1):(T*q+q*J)] }
  } else if (var == "A"){
    for (ic in 1:length(x$codaSamples)) {
      var.codaSamples[[ic]]=x$codaSamples[[ic]][,1:(T*q)] }
  } else if (var == "Sigma"){
      for (ic in 1:length(x$codaSamples)) {
        var.codaSamples[[ic]]=x$codaSamples[[ic]][,(T*q+q*J+1):(T*q+q*J+J)] }
  } else {
      stop("unknown 'var' name: it should be one of 'A', 'P' or 'Sigma'", call. = FALSE)
  }

  class(var.codaSamples)<-"mcmc.list"
  if (!("geweke" %in% convdiag)&
      !("heidel" %in% convdiag)&
      !("raftery" %in% convdiag)) {
    stop("incorrect type of convergence diagnostics", call.=FALSE) }


  if ("geweke" %in% convdiag){
  #geweke: a test for equality of the means of the first and last part of
  #a Markov chain (by default the first 10% and the last 50%)

    mcmcSamples = base::as.matrix(var.codaSamples)
    geweke1 = coda::geweke.diag(mcmcSamples, frac1=0.1, frac2=0.5)
    if (inherits(geweke1, "list")) geweke1 <- geweke1[[1]]
    geweke_pvalue <- 2*stats::pnorm(-base::abs(geweke1$z))
    geweke_table <- base::data.frame('z-score' = geweke1$z,
                                     'p value' =
                                      round(geweke_pvalue, digits = 4))

    if(print){
      cat("\n\n")
      cat("Geweke Diagnostics :\n\n")
      base::print(utils::head(geweke_table,n=10))
      if(nrow(geweke_table)>10)
        base::cat(paste("...",nrow(geweke_table)-10," more rows"))
      cat("\n\n")
    }
  }

  if ("heidel" %in% convdiag){
    mcmcSamples=base::as.matrix(var.codaSamples)

    heidel1 <- coda::heidel.diag(mcmcSamples, eps=0.1, pvalue=0.05)
    if (inherits(heidel1, "list")) heidel1 <- heidel1[[1]]
    heidel_table <- base::data.frame('stest' = heidel1[,1],
                                        'p value' =round(heidel1[,3], 4))

    #print("Put")
    if(print){
      base::cat("\n\n")
      base::cat("Heidel Diagnostics:\n\n")
      base::print(utils::head(heidel_table,n=10))
      if(nrow(heidel_table)>10)
        base::cat(paste("...",nrow(heidel_table)-10," more rows"))
      base::cat("\n\n" )
    }
  }

  if ("raftery" %in% convdiag){
    mcmcSamples=base::as.matrix(var.codaSamples)

    raftery1 <- coda::raftery.diag(mcmcSamples,q=0.025,
                                   r=0.005, s=0.95, converge.eps=0.001)
    if (inherits(raftery1, "list")) raftery1 <- raftery1[[1]]
    raftery1 <- raftery1$resmatrix
    raftery_table <- base::data.frame('burn in (M)' = raftery1[,1],
                                      'required iterations (N)' = raftery1[,2],
                                      'min sample size (Nmin)' = raftery1[,3])

    if(print){
      base::cat("\n\n")
      base::cat("Raftery Diagnostics:\n\n")
      base::print(utils::head(raftery_table,n=10))
      if(nrow(raftery_table)>10)
        base::cat(paste("...",nrow(raftery_table)-10," more rows"))
      base::cat("\n\n" )
    }
  }
  return(list(convdiag = convdiag,
              geweke=geweke_table,
              heidel=heidel_table,
              raftery=raftery_table))
}
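
# Hedged, standalone sketch (not part of the bayesMRM API; the helper name below
# is illustrative only): convdiag_bmrm() pools the chains with base::as.matrix()
# before running the diagnostics, whereas the coda functions also accept an
# mcmc.list directly and then report each chain separately.
.convdiag_by_chain_sketch <- function(samples) {
  # 'samples' is any coda::mcmc.list; each coda call recurses over the chains
  list(geweke  = coda::geweke.diag(samples, frac1 = 0.1, frac2 = 0.5),
       heidel  = coda::heidel.diag(samples, eps = 0.1, pvalue = 0.05),
       raftery = coda::raftery.diag(samples, q = 0.025, r = 0.005, s = 0.95))
}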