Nothing
#' Convergence plots
#'
#' The function produces a .pdf file containing some convergence plots for the Monte Carlo draws.
#' @param model an object of class \code{`flexreg`}.
#' @param file a character string giving the name of the file (with extension .pdf).
#' @param plotfun an optional character vector of diagnostics plots. The default is to compute \code{all} plots, otherwise one can specify a selection of plots among \code{density}, \code{trace}, \code{intervals}, \code{rate}, \code{rhat}, and \code{acf}.
#' @param pars an optional character vector of parameter names. If \code{pars} is not specified, all parameters in the regression models are evaluated.
#' @param point_est an optional character to specify the point estimate to be shown between \code{median} (the default), \code{mean}, or \code{none}.
#' @param prob the probability mass to be included in the inner interval (\code{intervals} plot) or in the shaded region (for \code{density} plot). The default is 0.5.
#' @param prob_outer the probability mass to be included in the outer interval of the \code{intervals} plot. The default is 0.9.
#' @param lags the number of lags to be shown in the \code{acf} plot. The default is 10.
#' @param width,height the width and height of the graphics region of each plot in inches. The default values are 7.
#' @param warmup a logical scalar indicating whether to include the warmup draws or not (default).
#'
#' @return A .pdf file with one plot per page.
#'
#' @import bayesplot ggplot2
#'
#' @references {
#' Brooks, SP., Gelman, A. (1998). General methods for monitoring convergence of iterative simulations. Journal of Computational and Graphical Statistics, \bold{7}, 434-455. \cr
#' \cr
#' Stan Development Team (2020). RStan: the R interface to Stan. R package version 2.19.3. https://mc-stan.org
#' }
#'
#' @details The plots can be further customized using the \code{ggplot2} package.
#' \itemize{
#' \item \code{density} returns a density plot for each parameter in \code{pars} computed from the posterior draws. See \code{bayesplot::mcmc_areas} for further details.
#' \item \code{trace} returns a trace plot for each parameter in \code{pars} computed from the posterior draws. See \code{bayesplot::mcmc_trace} for further details.
#' \item \code{intervals} returns a plot of uncertainty interval for each parameter in \code{pars} computed from the posterior draws. See \code{bayesplot::mcmc_intervals} for further details.
#' \item \code{rate} returns a plot for each parameter in \code{pars} with the number of iterations on the x-axis and the Monte Carlo mean until iteration i-th on the y-axis.
#' \item \code{rhat} returns a plot with the Rhat values for each parameter in \code{pars}. See \code{bayesplot::mcmc_rhat} for further details.
#' \item \code{acf} returns the autocorrelation plots (one for each parameter in \code{pars}). See \code{bayesplot::mcmc_acf} for further details.
#'
#' }
#'
#' @export
#'
convergence.plot <- function(model, file = "convergence-output.pdf", #compress = F,
plotfun = "all", pars = NULL, point_est = "median",
prob = 0.5, prob_outer = 0.9, lags = 10, warmup = F,
width = 7, height = 7)
{
posterior <- model$model
if (is.null(pars)) pars <- extract.pars(posterior = posterior)
chains <- rstan::extract(posterior, pars, inc_warmup = warmup, permuted=F)#ottengo degli array
n.iter <- dim(posterior)[1]
n.warmup <- dim(chains)[1]-n.iter
if ("beta" %in% pars) {
pars.full <- names(posterior)
pars <- c(pars.full[grep("beta",pars.full)], pars)
pars <- pars[-which(pars=="beta")]
}
if ("psi" %in% pars) {
pars.full <- names(posterior)
pars <- c(pars.full[grep("psi",pars.full)], pars)
pars <- pars[-which(pars=="psi")]
}
D <- length(pars)
#tools::file_ext(file)
file.extension.position <- regexpr("\\.([[:alnum:]]+)$",file)
file.extension <- tolower(substr(file, file.extension.position +
1, nchar(file)))
file.name <- substr(file, 1, file.extension.position - 1)
#file.rendered <- paste(file.name, "Rmd", sep = ".")
#density plot
if (any(plotfun %in% c("all", "density"))){
pp <- lapply(pars, function(x) mcmc_areas(posterior, pars = x, prob = prob))
title.plot <- lapply(pars, function(x) ggtitle(paste("Posterior distribution of ", x,
"with", point_est,"and", prob*100, "% intervals", sep=" ")))
plot1 <- lapply(1:D, function(x) pp[[x]] + title.plot[[x]])
} else plot1 <- NULL
#trace plot
if (any(plotfun %in% c("all", "trace"))){
n_warmup <- ifelse(warmup==F, 0, n.warmup)
pp <- lapply(pars, function(x) mcmc_trace(chains, pars = x, n_warmup = n_warmup))
title.plot <- lapply(pars, function(x) ggtitle(paste("Traceplot of ", x, sep=" ")))
plot2 <- lapply(1:D, function(x) pp[[x]] + title.plot[[x]]+theme(axis.title.y=element_text(angle=0,hjust=1)) )
} else plot2 <- NULL
#intervals plot
if (any(plotfun %in% c("all", "intervals"))){
pp <- lapply(pars, function(x) mcmc_intervals(posterior, pars = x, prob = prob, prob_outer = prob_outer))
title.plot <- lapply(pars, function(x) ggtitle(paste("Posterior interval estimates of ", x, sep=" ")))
plot3 <- lapply(1:D, function(x) pp[[x]] + title.plot[[x]])
} else plot3 <- NULL
#rate plot
if (any(plotfun %in% c("all", "rate"))){
plot4 <- rate_plot(chains, pars, n.warmup = n.warmup)
} else plot4 <- NULL
#rhat plot
if (any(plotfun %in% c("all", "rhat"))){
plot5 <- mcmc_rhat(rhat = rhat(posterior, pars = pars)) + yaxis_text(hjust = .0)
} else plot5 <- NULL
#non mi piace il plot4, al massimo lo togliamo
#plot4 <- mcmc_neff( neff_ratio(posterior, pars = pars), size = 2)
#acf plot
if (any(plotfun %in% c("all", "acf"))){
plot6 <- mcmc_acf(posterior, pars = pars, lags = lags)
} else plot6 <- NULL
plot.final <- c(plot1, plot2, plot3, plot4, list(plot5, plot6))
# if (compress == F){
# plot.final <- list(plot1, plot2, plot3, plot4, plot5)
# } else {
# #fa giĆ print, quindi va spostato
# plot.final <- Rmisc::multiplot(plotlist = plot1, layout = matrix(1:D, nrow = length(plot1), byrow = T))
# }
# sink(file.rendered)
# sink()
#
if (is.null(file)){
for(i in 1:length(plot.final)){
question <- utils::menu(c("Yes", "No"), title=paste0("Plot ", i, "/",length(plot.final), "\nDo you want to see it?"))
#grDevices::devAskNewPage(ask = TRUE)
if (question ==1)
invisible(utils::capture.output(print(plot.final[[i]]))) else break()#oppure next()
}
#grDevices::devAskNewPage(ask = FALSE)
} else if (file.extension == "pdf") {
grDevices::pdf(file, width = width, height = height)
invisible(utils::capture.output(print(plot.final)))
garbage <- grDevices::dev.off()
} else stop("File extension not supported")
#
# }
#mcmc_violin requires multiple chains
#aggiungere file che stampa che hai ottenuto il pdf
}
extract.pars <- function(posterior){
pars.full <- names(posterior)
pars <- c()
pars <- c(pars, pars.full[grep("beta",pars.full)])
pars <- c(pars, pars.full[grep("psi",pars.full)])#if model.phi is TRUE or if model.theta is TRUE
pars <- c(pars, pars.full[which(pars.full=="phi")])#if model.phi or model.theta is FALSE
pars <- c(pars, pars.full[grep("omega0",pars.full)])#for 0 augmentation
pars <- c(pars, pars.full[grep("omega1",pars.full)])#for 1 augmentation
pars <- c(pars, pars.full[which(pars.full=="theta")])#if model.theta is FALSE
pars <- c(pars, pars.full[which(pars.full=="p")])#if type is FB, VIB, or FBB
pars <- c(pars, pars.full[which(pars.full=="w")])#if type is FB or FBB
pars <- c(pars, pars.full[which(pars.full=="k")])#if type is VIB
return(pars)
}
#plot for rate of convergence
rate_plot <- function(chains, pars, n.warmup = n.warmup )
{
S <- dim(chains)[1]#n.iter
n.chain <- dim(chains)[2]#n.chain
sum.parz <- apply(chains, 3, cumsum)
dim(sum.parz) <- dim(chains)
mean.parz <- apply(sum.parz, 3, function(x) x/(1:S))
data.plot <- as.data.frame(mean.parz)
names(data.plot) <- pars
if (n.chain > 1) {
data.plot$Chain <- as.factor(rep(1:n.chain, each=S))
data.plot$iter <- rep( 1:S, n.chain)
} else {
data.plot$iter <- 1:S
data.plot$Chain <- as.factor(rep(1, S))
}
plot.out <- lapply(pars, function(g) ggplot(data.plot, aes_string(x="iter", y=as.name(g), color= "Chain"))+
annotate("rect",xmin = 0,xmax = n.warmup,
ymin = -Inf, ymax = Inf, fill = "grey20", alpha = 0.1)+
geom_line()+ theme(legend.position = 'none',panel.grid.major = element_blank(), panel.grid.minor = element_blank(),
panel.background = element_blank(),
axis.title.x = element_blank(),
axis.title.y=element_text(angle=0,hjust=1),
axis.line = element_line(colour = "black")))
return(plot.out)
}
#' Convergence diagnostics
#'
#' The function returns some diagnostics to check for convergence to the equilibrium distribution of the Markov Chain(s).
#' Moreover, it prints the number (and percentage) of iterations that ended with a divergence and that saturated the max treedepth, and the E-BFMI values for each chain for which E-BFMI is less than 0.2.
#'
#' @param model an object of class \code{`flexreg`}.
#' @param diagnostics an optional character vector of diagnostics names. The default is to compute \code{all} diagnostics, otherwise one can specify a selection of diagnostics among \code{Rhat}, \code{geweke}, \code{gaftery}, \code{heidel}, and \code{gelman}.
#' @param pars an optional character vector of parameter names. If \code{pars} is not specified, all parameters in the regression models are evaluated.
#' @param additional.args a list containing additional arguments (see details)
#'
#' @return A print from \code{check_hmc_diagnostics} function and a list of convergence diagnostics.
#'
#'
#' @references {
#' Brooks, SP., Gelman, A. (1998). General methods for monitoring convergence of iterative simulations. Journal of Computational and Graphical Statistics, \bold{7}, 434-455. \cr
#' \cr
#' Geweke, J. (1992). Evaluating the accuracy of sampling-based approaches to calculating posterior moments. In Bayesian Statistics 4 (ed JM Bernado, JO Berger, AP Dawid and AFM Smith). Clarendon Press, Oxford, UK. \cr
#' \cr
#' Heidelberger P., Welch P.D. (1981). A spectral method for confidence interval generation and run length control in simulations. Comm. ACM. \bold{24}, 233-245.\cr
#' \cr
#' Raftery, A.E. and Lewis, S.M. (1992). One long run with diagnostics: Implementation strategies for Markov chain Monte Carlo. Statistical Science, \bold{7}, 493-497.\cr
#' \cr
#' Stan Development Team (2020). RStan: the R interface to Stan. R package version 2.19.3. https://mc-stan.org
#' }
#'
#' @details \itemize{
#' \item \code{R-hat} returns the potential scale reduction factor on split chains. An R-hat greater than 1 is indicative of a bad mix of the chains. At convergence R-hat has to be less than 1.05. See \code{rstan::Rhat} for further details.
#' \item \code{geweke} returns the z-scores, one for each parameter, for a test of equality between the means of the first 10\% and last 50\% of the chain. The fraction to use from the first and last part of the chain can be edited through the additional arguments \code{frac1} and \code{frac2}. The sum of \code{frac1} and \code{frac2} has to be strictly less than 1. See \code{coda::geweke.diag} for further details.
#' \item \code{raftery} returns the length of "burn-in" (\eqn{M}), the required sample size (\eqn{N}), the minimum sample size for a chain with zero autocorrelation (\eqn{Nmin}), and the estimate of the "dependence factor" (\eqn{I = (M+N)/Nmin}). Values of \eqn{I} greater than 5 may be indicative of a strong autocorrelation.
#' Additional parameters such as the quantile to be estimated (\code{q}), the desired margin of error of the estimate (\code{r}), and the probability (\code{s}) of obtaining an estimate between \eqn{q-r} and \eqn{q+r} can be passed as list in the \code{additional.args} argument. See \code{coda::raftery.diag} for further details.
#' \item \code{heidel} returns a p-value referred to a convergence test where the null hypothesis is that the sampled values come from a stationary distribution. It is possible to set the target value for ratio of halfwidth to sample mean (\code{eps}) and the significance level of the test (\code{pvalue}) into the \code{additional.args} argument. See \code{coda::heidel.diag} for further details.
#' \item \code{gelman} returns the estimate of the potential scale reduction factor and the upper confidence limit. At least two chains are needed to compute the Gelman and Rubin's convergence diagnostics. Additional parameters such as the confidence level (\code{confidence}), a logical flag indicating whether variables should be transformed (\code{transform}),
#' a logical flag indicating whether only the second half of the series should be used in the computation (\code{autoburnin}), and a logical flag indicating whether the multivariate potential scale reduction factor should be calculated for multivariate chains (\code{multivariate}) can be passed as list in the \code{additional.args} argument. See \code{coda::gelman.diag} for further details.
#' }
#'
#' @import rstan
#'
#' @export
#'
convergence.diag <- function(model, diagnostics = "all", pars = NULL, additional.args=list())
{
posterior <- model$model
hmc.diag <- rstan::check_hmc_diagnostics(posterior)
if (is.null(pars)) pars <- extract.pars(posterior = posterior)
mcmc <- rstan::extract(posterior, pars=pars, permuted=F)
if(any(diagnostics == "all")) diagnostics <- c("Rhat", "geweke", "raftery", "heidel", "gelman")
#Rhat diag
if (any(diagnostics %in% "Rhat")){
rhat <- apply(mcmc, 3, function(x) rstan::Rhat(x))
} else rhat <- NULL
diagnostics <- diagnostics[-which(diagnostics=="Rhat")]
mcmc <- rstan::As.mcmc.list(posterior, pars=pars)
#gestiamo gli argomenti aggiuntivi
arg.coda <- lapply(diagnostics, function(x)
formals(utils::getFromNamespace(paste0(x,".diag"), "coda"))[-1])
names(arg.coda) <- diagnostics
if(length((additional.args))>0){
arg.coda <- unlist(arg.coda)
arg.match <- lapply(names(additional.args), function(x) grepl(x,names(arg.coda)))
for(i in 1:length(arg.match)) arg.coda[arg.match[[i]]] <- additional.args[i]
}
arg.coda <- unlist(arg.coda)
e <- names(arg.coda)
out <- within(as.list(arg.coda),{
if (any(diagnostics %in% "gelman")){
if(is.null(model$call$n.chain)) model$call$n.chain <- 1
if (model$call$n.chain < 2){
diagnostics <- diagnostics[-which(diagnostics=="gelman")]
warning("You need at least two chains to compute Gelman and Rubin's convergence diagnostic")}
}
other.diag <- lapply(diagnostics, function(x)
do.call(utils::getFromNamespace(paste0(x,".diag"), "coda"),append(list(mcmc),
lapply(e[startsWith(e,x)], function(a) get(a)))))
names(other.diag) <- diagnostics
})
return(list(Rhat=rhat, out$other.diag))
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.