# finmix: An R package for Bayesian estimation of finite mixture distributions

## Copyright (C) 2013 Lars Simon Zehnder
#
# This file is part of finmix.
#
# finmix is free software: you can redistribute it and/or modify it
# under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# finmix is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with finmix. If not, see <http://www.gnu.org/licenses/>.

#' Calculate point estimators from MCMC samples
#' 
#' @description 
#' Calling [mcmcestimate()] calculates the following point estimates from the 
#' MCMC samples: 
#' * MAP: The maximum a posteriori estimate is defined as the mode of the 
#'   (joint) posterior density.
#' * BML: The Bayesian maximum likelihood estimator is based on the mixture 
#'   log-likelihood function and defines the mode of this function.
#' * EAVG: The ergodic average is calculated as an average over the MCMC traces 
#'   of component parameters and weights (in case of unknown parameters).  
#' * IEAVG: The identified ergodic average is defined similar to the EAVG, 
#'   however, in contrast to the latter it is based on re-labeled MCMC traces. 
#'   This is especially important in case of random permutation during MCMC
#'   sampling as component parameters then have to be re-assigned to their 
#'   (probably) correct component.
#'   
#' For a more detailed overview of point estimators from Bayesian mixture model 
#' estimation, see Fr\"uhwirth-Schnatter (2006).
#' 
#' @param mcmcout An `mcmcoutput` object containing the sampled parameters and 
#'   information about the finite mixture model.
#' @param method A character defining the re-labeling method in case of a model 
#'   with unknown indicators. For most distributions there exists only a single 
#'   choice, namely "kmeans". For Poisson and Binomial distributions the 
#'   re-labeling algorithms "Stephens1997a" and "Stephens1997b" can be chosen. 
#' @param fdata An `fdata` model containing the observations. Optional.
#' @param permOut A logical indicating, if the permuted MCMC samples should be 
#'   returned as well. Optional.
#' @param opt_ctrl A list with an element `max_iter` controlling the number of 
#'   iterations in case the "Stephens1997a" re-labeling algorithm is chosen.
#' @return An `mcmcest` object containing the point estimates together with 
#'   additional information about the underlying finite mixture model, MCMC 
#'   sampling hyper-parameters and the data. In case `permOut` is set to 
#'   `TRUE`, the output of this function is a named list with an `mcmcest` 
#'   object containing parameter estimates and in addition an `mcmcoutputperm` 
#'   object containing the permuted (re-labeled) MCMC samples.
#' @export
#' @name mcmcestimate
#'   
#' @seealso 
#' * [mcmcestfix-class] for object storing the parameter estimates in case of 
#'   fixed indicators
#' * [mcmcestind-class] for object storing the parameter estimates in case of 
#'   unknown indicators
#' * [mcmcoutputperm-class] for classes storing re-labeled 
#'   MCMC samples
"mcmcestimate" <- function(mcmcout, method = "kmeans", fdata = NULL,
                           permOut = FALSE, opt_ctrl = list(max_iter = 200L)) {
  # Reject malformed input before any slot is read.
  .check.args.Mcmcestimate(mcmcout, method, fdata, permOut, opt_ctrl)

  # Model description and sampler settings stored in the MCMC output.
  n_comp <- mcmcout@model@K
  n_draws <- mcmcout@M
  family <- mcmcout@model@dist
  indic_model <- mcmcout@model@indicmod
  random_perm <- mcmcout@ranperm
  fixed_indic <- mcmcout@model@indicfix

  # An 'mcmcoutputperm' object already carries re-labeled samples.
  relabeled_input <- inherits(mcmcout, what = "mcmcoutputperm")

  # Estimates taken from the raw traces: the draw with the highest
  # 'mixlik + mixprior' (MAP), the draw with the highest 'mixlik' (BML) and
  # the ergodic average (EAVG).
  map <- .extract.Mcmcestimate(mcmcout, .map.Mcmcestimate(mcmcout))
  bml <- .extract.Mcmcestimate(mcmcout, .bml.Mcmcestimate(mcmcout))
  eavg <- .eavg.Mcmcestimate(mcmcout)

  # --- Fixed indicators: the ergodic average is used as 'ieavg' -----------
  if (fixed_indic) {
    sdpost <- .sdpost.Mcmcestimate(mcmcout, relabeled_input)
    return(.mcmcestfix(
      dist = family, K = n_comp, M = n_draws, burnin = mcmcout@burnin,
      ranperm = random_perm, relabel = "none",
      indicmod = indic_model, map = map, bml = bml, ieavg = eavg,
      sdpost = sdpost
    ))
  }

  # --- Sampled indicators without random permutation: no re-labeling ------
  if (!random_perm) {
    sdpost <- .sdpost.Mcmcestimate(mcmcout, relabeled_input)
    return(.mcmcestfix(
      dist = family, K = n_comp, indicmod = indic_model,
      M = n_draws, burnin = mcmcout@burnin,
      ranperm = random_perm, relabel = "none",
      map = map, bml = bml, ieavg = eavg, sdpost = sdpost
    ))
  }

  # --- Random permutation, input has been re-labeled beforehand -----------
  if (relabeled_input) {
    if (mcmcout@Mperm > 0) {
      # The ergodic average of an 'mcmcoutputperm' object is taken over the
      # re-labeled traces.
      ieavg <- .eavg.Mcmcestimate(mcmcout)
      sdpost <- .sdpost.Mcmcestimate(mcmcout, relabeled_input)
      return(.mcmcestfix(
        dist = family, K = n_comp,
        indicmod = indic_model, M = mcmcout@Mperm,
        burnin = mcmcout@burnin, ranperm = random_perm,
        relabel = mcmcout@relabel, map = map, bml = bml,
        ieavg = ieavg, sdpost = sdpost
      ))
    }
    warning(paste0(
      "No identification possible. Not a single ",
      "draw is a permutation"
    ))
    sdpost <- .sdpost.unidentified.Mcmcestimate(mcmcout)
    # NOTE(review): 'eavg' is handed to the 'mcmcestfix' generator here while
    # every other 'mcmcestfix' call passes 'ieavg' -- confirm that the class
    # accepts an 'eavg' slot.
    return(.mcmcestfix(
      dist = family, K = n_comp,
      indicmod = indic_model, M = n_draws,
      burnin = mcmcout@burnin, ranperm = random_perm,
      relabel = method, map = map, bml = bml,
      eavg = eavg, sdpost = sdpost
    ))
  }

  # --- Random permutation, re-labeling still has to be done ---------------
  relabeled <- mcmcpermute(mcmcout,
    method = method, fdata = fdata,
    opt_ctrl = opt_ctrl
  )
  if (relabeled@Mperm > 0) {
    ieavg <- .eavg.Mcmcestimate(relabeled)
    sdpost <- .sdpost.Mcmcestimate(relabeled, TRUE)
    estimate <- .mcmcestind(
      dist = family, K = n_comp,
      indicmod = indic_model, M = relabeled@Mperm,
      burnin = mcmcout@burnin, ranperm = random_perm,
      relabel = method, map = map, bml = bml,
      ieavg = ieavg, eavg = eavg, sdpost = sdpost
    )
  } else {
    warning(paste0(
      "No identification possible. Not a single ",
      "draw is a permutation"
    ))
    sdpost <- .sdpost.unidentified.Mcmcestimate(mcmcout)
    # Without a single identified draw the identified average stays empty.
    estimate <- .mcmcestind(
      dist = family, K = n_comp,
      indicmod = indic_model, M = n_draws,
      burnin = mcmcout@burnin, ranperm = random_perm,
      relabel = method, map = map, bml = bml,
      ieavg = list(), eavg = eavg, sdpost = sdpost
    )
  }

  # On request the re-labeled samples are returned next to the estimates.
  if (permOut) {
    return(list(mcmcest = estimate, mcmcoutputperm = relabeled))
  }
  estimate
}

### Private functions
### These functions are not exported.

#' Check arguments for [mcmcestimate()]
#' 
#' @description 
#' For internal usage only. This function checks the arguments to the 
#' [mcmcestimate()] function and throws an error, if the checks do not pass. 
#' More specifically it checks for the classes of objects and the choices in 
#' case of a character argument.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing MCMC 
#'   samples.
#' @param arg2 The second argument (`method`) to the `mcmcestimate()` function. 
#' @param arg3 The third argument (`fdata`) to the `mcmcestimate()` function. 
#' @param arg4 The fourth argument (`permOut`) to the `mcmcestimate()` function. 
#' @param arg5 The fifth argument (`opt_ctrl`) to the `mcmcestimate()` function.
#' @return None. If checks do not pass, an error is thrown with a user-friendly 
#'   message.
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function 
".check.args.Mcmcestimate" <- function(obj, arg2, arg3, arg4, arg5) {
  # Argument 1: sampler output, either raw or already re-labeled.
  is_mcmc_output <- inherits(obj, c("mcmcoutput", "mcmcoutputperm"))
  if (!is_mcmc_output) {
    stop(paste0(
      "Wrong argument: Argument 1 must be an object ",
      "either of class 'mcmcoutput' or of type ",
      "'mcmcoutputperm'."
    ))
  }

  # Argument 2: match.arg() raises its own error for an unknown method.
  match.arg(arg2, c("kmeans", "Stephens1997a", "Stephens1997b"))

  # Argument 3: optional, so NULL passes as well.
  if (!(is.null(arg3) || inherits(arg3, "fdata"))) {
    stop(paste0(
      "Wrong argument: Argument 3 must be an object ",
      "of class 'fdata'."
    ))
  }

  # Argument 4: flag for returning the permuted samples.
  if (!is.logical(arg4)) {
    stop("Wrong argument: Argument 4 must be of type 'logical'.")
  }

  # Argument 5: an empty control list is accepted; a non-empty one needs a
  # numeric 'max_iter' entry.
  if (length(arg5) == 0) {
    return(invisible(NULL))
  }
  if (!("max_iter" %in% names(arg5))) {
    stop(paste0(
      "Wrong argument: Argument 5 must contain a variable ",
      "'max_iter' of type integer."
    ))
  }
  if (!is.numeric(arg5$max_iter)) {
    stop(paste0(
      "Wrong argument: In argument 5 'max_iter' ",
      "has to be of type integer."
    ))
  }
  invisible(NULL)
}

#' Calculates the MAP
#' 
#' @description 
#' For internal usage only. This function calculates the MAP estimates from the 
#' MCMC samples. 
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object storing the MCMC 
#'   samples.
#' @return An integer specifying the index of the parameter values that lead 
#'   to the highest posterior log likelihood. 
#' @noRd
#' @seealso 
#' * [mcmcestimate()] for the calling function
".map.Mcmcestimate" <- function(obj) {
  # Per-draw sum of the stored 'mixlik' and 'mixprior' log traces.
  log_posterior <- obj@log$mixlik + obj@log$mixprior
  # Ascending sort: the position of the largest value comes last in 'ix'.
  ascending <- sort.int(log_posterior, index.return = TRUE)$ix
  as.integer(ascending[length(ascending)])
}

#' Calculates the BML
#' 
#' @description 
#' For internal usage only. This function calculates the BML estimates from the 
#' MCMC samples. 
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object storing the MCMC 
#'   samples.
#' @return An integer specifying the index of the parameter values that lead 
#'   to the highest mixture log-likelihood. 
#' @noRd
#' @importFrom utils tail
#' @seealso 
#' * [mcmcestimate()] for the calling function
".bml.Mcmcestimate" <- function(obj) {
  # Rank the draws by their stored mixture log-likelihood ('mixlik'); the
  # last entry of the ascending ordering points at the largest value.
  ranking <- sort.int(obj@log$mixlik, index.return = TRUE)$ix
  ranking[length(ranking)]
}

#' Extract estimates from MCMC samples
#' 
#' @description 
#' For internal usage only. This function extracts a row of MCMC samples by 
#' index. The index in this case are the indices at which the log-likelihood 
#' functions have their empirical mode.
#' 
#' @param obj An `mcmcoutput` object containing the MCMC samples.
#' @param m An integer defining the index at which index parameters and 
#'   log-likelihood function values should be extracted.
#' @return A named list with elements `par` containing the extracted 
#'   parameters and `log` containing the log-likelihood values.
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".extract.Mcmcestimate" <- function(obj, m) {
  n_comp <- obj@model@K
  family <- obj@model@dist
  # Only objects inheriting from 'mcmcoutputbase' are asked for weights.
  has_weights <- inherits(obj, what = "mcmcoutputbase")
  draws <- obj@par

  # Pick draw 'm' of every parameter the distribution family defines. The
  # assignment happens inside the branch so that an unknown family leaves
  # 'par_est' undefined.
  switch(family,
    poisson = ,
    cond.poisson = ,
    exponential = {
      par_est <- list(lambda = as.array(draws$lambda[m, ]))
    },
    binomial = {
      par_est <- list(p = as.array(draws$p[m, ]))
    },
    normal = {
      par_est <- list(
        mu = as.array(draws$mu[m, ]),
        sigma = as.array(draws$sigma[m, ])
      )
    },
    student = {
      par_est <- list(
        mu = as.array(draws$mu[m, ]),
        sigma = as.array(draws$sigma[m, ]),
        df = as.array(draws$df[m, ])
      )
    },
    normult = {
      par_est <- list(
        mu = as.array(draws$mu[m, , ]),
        sigma = qinmatrmult(draws$sigma[m, , ]),
        sigmainv = qinmatrmult(draws$sigmainv[m, , ])
      )
    },
    studmult = {
      par_est <- list(
        mu = as.array(draws$mu[m, , ]),
        sigma = qinmatrmult(draws$sigma[m, , ]),
        sigmainv = qinmatrmult(draws$sigmainv[m, , ]),
        df = as.array(draws$df[m, ])
      )
    }
  )

  # Weights are reported only for more than one component.
  if (has_weights && n_comp > 1) {
    return(list(
      par = par_est,
      weight = as.array(obj@weight[m, ]),
      log = obj@log$mixlik[m]
    ))
  }
  list(par = par_est, log = obj@log$mixlik[m])
}

#' Calculate the EAVG
#' 
#' @description 
#' For internal usage only. This function calculates the identified ergodic 
#' average from the (re-labeled) MCMC traces. In the case of permuted MCMC 
#' samples the ergodic average is the so-called identified ergodic average.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing MCMC 
#'   samples.
#' @return A list containing the ergodic average estimates for the component 
#'   parameters in element `par` and the corresponding weight estimates in 
#'   element `weight`.
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".eavg.Mcmcestimate" <- function(obj) {
  # Averages every parameter trace (and, where present, the weight trace)
  # over its first dimension, ignoring NA entries.
  #
  # obj:     S4 object with slots 'model' and 'par'; objects inheriting from
  #          'mcmcoutputperm' are read from 'parperm'/'weightperm' instead of
  #          'par'/'weight'.
  # returns: list(par = <named list of averages>) and, for objects
  #          inheriting from 'mcmcoutputbase', an additional 'weight' entry.
  # raises:  an error for a distribution name not handled below.
  dist <- obj@model@dist
  indicfix <- !inherits(obj, what = "mcmcoutputbase")
  perm <- inherits(obj, what = "mcmcoutputperm")

  # Select the trace source once instead of duplicating each branch.
  draws <- if (perm) obj@parperm else obj@par

  # Mean per column of a matrix-shaped trace.
  avg_cols <- function(x) {
    as.array(apply(x, 2, mean, na.rm = TRUE))
  }
  # Mean per (dim 2, dim 3) cell of a three-dimensional trace.
  avg_cells <- function(x) {
    apply(x, c(2, 3), mean, na.rm = TRUE)
  }

  if (dist %in% c("poisson", "cond.poisson", "exponential")) {
    par.eavg <- list(lambda = avg_cols(draws$lambda))
  } else if (dist == "binomial") {
    par.eavg <- list(p = avg_cols(draws$p))
  } else if (dist == "normal") {
    par.eavg <- list(
      mu = avg_cols(draws$mu),
      sigma = avg_cols(draws$sigma)
    )
  } else if (dist == "student") {
    par.eavg <- list(
      mu = avg_cols(draws$mu),
      sigma = avg_cols(draws$sigma),
      df = avg_cols(draws$df)
    )
  } else if (dist == "normult") {
    # The averaged (co)variance traces are transposed, the mean trace is not.
    par.eavg <- list(
      mu = as.array(avg_cells(draws$mu)),
      sigma = as.array(t(avg_cells(draws$sigma))),
      sigmainv = as.array(t(avg_cells(draws$sigmainv)))
    )
  } else if (dist == "studmult") {
    par.eavg <- list(
      mu = as.array(avg_cells(draws$mu)),
      sigma = as.array(t(avg_cells(draws$sigma))),
      sigmainv = as.array(t(avg_cells(draws$sigmainv))),
      # 'na.rm' is spelled out; the former 'na = TRUE' relied on partial
      # argument matching.
      df = avg_cols(draws$df)
    )
  } else {
    stop(paste0(
      "Unsupported distribution '", dist,
      "' for computing ergodic averages."
    ))
  }

  # Objects that do not inherit from 'mcmcoutputbase' report no weights.
  if (indicfix) {
    return(list(par = par.eavg))
  }
  weights <- if (perm) obj@weightperm else obj@weight
  list(par = par.eavg, weight = avg_cols(weights))
}

#' Calculate the standard deviation of the posterior
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @param perm A logical indicating, if the samples have been re-labeled.
#' @return A list containing the standard deviations of the posterior 
#'   densities. 
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.Mcmcestimate" <- function(obj, perm) {
  # Hand over to the worker of the model's distribution family. A family
  # without a worker falls through and yields an invisible NULL.
  switch(obj@model@dist,
    poisson = ,
    cond.poisson = ,
    exponential = .sdpost.poisson.Mcmcestimate(obj, perm),
    binomial = .sdpost.binomial.Mcmcestimate(obj, perm),
    normal = .sdpost.normal.Mcmcestimate(obj, perm),
    student = .sdpost.student.Mcmcestimate(obj, perm),
    normult = .sdpost.normult.Mcmcestimate(obj, perm),
    studmult = .sdpost.studmult.Mcmcestimate(obj, perm)
  )
}

# TODO: Throws error that weights are not available, if `indicfix=TRUE` 
#' Calculate the standard deviation of the posterior from Poisson mixtures
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @param perm A logical indicating, if the samples have been re-labeled.
#' @return A list containing the standard deviations of the posterior 
#'   densities. 
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.poisson.Mcmcestimate" <- function(obj, perm) {
  # Standard deviation per column, skipping NA entries.
  col_sd <- function(trace) {
    apply(trace, 2, sd, na.rm = TRUE)
  }

  if (!perm) {
    # Only the raw traces exist; the weight entry is left out when the
    # model's indicators are fixed.
    lambda_sd <- col_sd(obj@par$lambda)
    identified <- if (obj@model@indicfix) {
      list(par = list(lambda = lambda_sd))
    } else {
      list(par = list(lambda = lambda_sd), weight = col_sd(obj@weight))
    }
    return(list(identified = identified))
  }

  # Re-labeled output: report the re-labeled ('identified') and the raw
  # ('unidentified') traces side by side.
  list(
    identified = list(
      par = list(lambda = col_sd(obj@parperm$lambda)),
      weight = col_sd(obj@weightperm)
    ),
    unidentified = list(
      par = list(lambda = col_sd(obj@par$lambda)),
      weight = col_sd(obj@weight)
    )
  )
}

#' Calculate the standard deviation of the posterior from Binomial mixtures
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @param perm A logical indicating, if the samples have been re-labeled.
#' @return A list containing the standard deviations of the posterior 
#'   densities. 
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.binomial.Mcmcestimate" <- function(obj, perm) {
  # Column-wise standard deviations (NA entries skipped) of the sampled
  # success probabilities 'p' and of the weights.
  #
  # obj:     S4 object with slots 'par' and 'model'; 'weight' is read unless
  #          the model has fixed indicators; 'parperm'/'weightperm' are read
  #          when 'perm' is TRUE.
  # perm:    logical; TRUE if 'obj' carries re-labeled samples.
  # returns: list with element 'identified' and, for perm = TRUE, also
  #          'unidentified' (computed from the raw traces).
  if (perm) {
    sdpar <- apply(obj@parperm$p, 2, sd, na.rm = TRUE)
    sdparpre <- apply(obj@par$p, 2, sd, na.rm = TRUE)
    sdweight <- apply(obj@weightperm, 2, sd, na.rm = TRUE)
    sdweightpre <- apply(obj@weight, 2, sd, na.rm = TRUE)
    identified <- list(
      par = list(p = sdpar),
      weight = sdweight
    )
    unidentified <- list(
      par = list(p = sdparpre),
      weight = sdweightpre
    )
    sdlist <- list(
      identified = identified,
      unidentified = unidentified
    )
  } else {
    sdpar <- apply(obj@par$p, 2, sd, na.rm = TRUE)
    # Same guard as in the Poisson variant: the weight trace is only read
    # when the indicators were sampled, so fixed-indicator output no longer
    # fails on the weight access.
    if (!obj@model@indicfix) {
      sdweight <- apply(obj@weight, 2, sd, na.rm = TRUE)
      identified <- list(par = list(p = sdpar), weight = sdweight)
    } else {
      identified <- list(par = list(p = sdpar))
    }
    sdlist <- list(identified = identified)
  }
  sdlist
}

#' Calculate the standard deviation of the posterior from Normal mixtures
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @param perm A logical indicating, if the samples have been re-labeled.
#' @return A list containing the standard deviations of the posterior 
#'   densities. 
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.normal.Mcmcestimate" <- function(obj, perm) {
  # Column-wise standard deviations (NA entries skipped) of the sampled
  # 'mu' and 'sigma' traces and of the weights.
  #
  # obj:     S4 object with slots 'par' and 'model'; 'weight' is read unless
  #          the model has fixed indicators; 'parperm'/'weightperm' are read
  #          when 'perm' is TRUE.
  # perm:    logical; TRUE if 'obj' carries re-labeled samples.
  # returns: list with element 'identified' and, for perm = TRUE, also
  #          'unidentified' (computed from the raw traces).
  if (perm) {
    sdmu <- apply(obj@parperm$mu, 2, sd, na.rm = TRUE)
    sdmupre <- apply(obj@par$mu, 2, sd, na.rm = TRUE)
    sdsigma <- apply(obj@parperm$sigma, 2, sd, na.rm = TRUE)
    sdsigmapre <- apply(obj@par$sigma, 2, sd, na.rm = TRUE)
    sdweight <- apply(obj@weightperm, 2, sd, na.rm = TRUE)
    sdweightpre <- apply(obj@weight, 2, sd, na.rm = TRUE)
    identified <- list(
      par = list(mu = sdmu, sigma = sdsigma),
      weight = sdweight
    )
    unidentified <- list(
      par = list(mu = sdmupre, sigma = sdsigmapre),
      weight = sdweightpre
    )
    sdlist <- list(
      identified = identified,
      unidentified = unidentified
    )
  } else {
    sdmu <- apply(obj@par$mu, 2, sd, na.rm = TRUE)
    sdsigma <- apply(obj@par$sigma, 2, sd, na.rm = TRUE)
    # Same guard as in the Poisson variant: the weight trace is only read
    # when the indicators were sampled, so fixed-indicator output no longer
    # fails on the weight access.
    if (!obj@model@indicfix) {
      sdweight <- apply(obj@weight, 2, sd, na.rm = TRUE)
      identified <- list(
        par = list(mu = sdmu, sigma = sdsigma),
        weight = sdweight
      )
    } else {
      identified <- list(par = list(mu = sdmu, sigma = sdsigma))
    }
    sdlist <- list(identified = identified)
  }
  sdlist
}

#' Calculate the standard deviation of the posterior from Student-t mixtures
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @param perm A logical indicating, if the samples have been re-labeled.
#' @return A list containing the standard deviations of the posterior 
#'   densities. 
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.student.Mcmcestimate" <- function(obj, perm) {
  # Column-wise standard deviations (NA entries skipped) of the sampled
  # 'mu', 'sigma' and 'df' traces and of the weights.
  #
  # obj:     S4 object with slots 'par' and 'model'; 'weight' is read unless
  #          the model has fixed indicators; 'parperm'/'weightperm' are read
  #          when 'perm' is TRUE.
  # perm:    logical; TRUE if 'obj' carries re-labeled samples.
  # returns: list with element 'identified' and, for perm = TRUE, also
  #          'unidentified' (computed from the raw traces).
  if (perm) {
    sdmu <- apply(obj@parperm$mu, 2, sd, na.rm = TRUE)
    sdmupre <- apply(obj@par$mu, 2, sd, na.rm = TRUE)
    sdsigma <- apply(obj@parperm$sigma, 2, sd, na.rm = TRUE)
    sdsigmapre <- apply(obj@par$sigma, 2, sd, na.rm = TRUE)
    sddf <- apply(obj@parperm$df, 2, sd, na.rm = TRUE)
    # The unidentified value comes from the raw 'par' trace like every
    # other '*pre' quantity; it was read from 'parperm' before.
    sddfpre <- apply(obj@par$df, 2, sd, na.rm = TRUE)
    sdweight <- apply(obj@weightperm, 2, sd, na.rm = TRUE)
    sdweightpre <- apply(obj@weight, 2, sd, na.rm = TRUE)
    identified <- list(
      par = list(
        mu = sdmu, sigma = sdsigma,
        df = sddf
      ),
      weight = sdweight
    )
    unidentified <- list(
      par = list(
        mu = sdmupre, sigma = sdsigmapre,
        df = sddfpre
      ),
      weight = sdweightpre
    )
    sdlist <- list(
      identified = identified,
      unidentified = unidentified
    )
  } else {
    sdmu <- apply(obj@par$mu, 2, sd, na.rm = TRUE)
    sdsigma <- apply(obj@par$sigma, 2, sd, na.rm = TRUE)
    # Degrees of freedom are taken from the 'df' trace; the 'sigma' trace
    # was used here before.
    sddf <- apply(obj@par$df, 2, sd, na.rm = TRUE)
    sdpar <- list(mu = sdmu, sigma = sdsigma, df = sddf)
    # Same guard as in the Poisson variant: the weight trace is only read
    # when the indicators were sampled.
    if (!obj@model@indicfix) {
      sdweight <- apply(obj@weight, 2, sd, na.rm = TRUE)
      identified <- list(par = sdpar, weight = sdweight)
    } else {
      identified <- list(par = sdpar)
    }
    sdlist <- list(identified = identified)
  }
  sdlist
}

#' Calculate the std. dev. of the posterior from multivariate Normal mixtures
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @param perm A logical indicating, if the samples have been re-labeled.
#' @return A list containing the standard deviations of the posterior 
#'   densities. 
#' @noRd
#' @importFrom stats cov
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.normult.Mcmcestimate" <- function(obj, perm) {
  # Covariance matrices of the sampled 'mu', 'sigma' and 'sigmainv' traces
  # and column-wise standard deviations of the weights.
  #
  # obj:     S4 object with slots 'par' and 'model' (the latter with 'r',
  #          'K' and 'indicfix'); 'weight' is read unless the model has
  #          fixed indicators; 'parperm'/'weightperm' are read when 'perm'
  #          is TRUE.
  # perm:    logical; TRUE if 'obj' carries re-labeled samples.
  # returns: list with element 'identified' and, for perm = TRUE, also
  #          'unidentified' (computed from the raw traces).
  r <- obj@model@r
  K <- obj@model@K
  # Width of the stored 'sigma'/'sigmainv' traces; presumably the number of
  # unique entries of a symmetric r x r matrix -- TODO confirm.
  s <- r * (r + 1) / 2

  # Covariance of a trace: one matrix for K == 1, otherwise a d x d x K
  # array with one covariance matrix per slice of the third dimension.
  comp_cov <- function(trace, d) {
    if (K == 1) {
      return(cov(trace))
    }
    out <- array(numeric(), dim = c(d, d, K))
    for (k in seq_len(K)) {
      out[, , k] <- cov(trace[, , k])
    }
    out
  }

  if (perm) {
    identified <- list(
      par = list(
        mu = comp_cov(obj@parperm$mu, r),
        sigma = comp_cov(obj@parperm$sigma, s),
        sigmainv = comp_cov(obj@parperm$sigmainv, s)
      ),
      weight = apply(obj@weightperm, 2, sd)
    )
    unidentified <- list(
      par = list(
        mu = comp_cov(obj@par$mu, r),
        sigma = comp_cov(obj@par$sigma, s),
        sigmainv = comp_cov(obj@par$sigmainv, s)
      ),
      weight = apply(obj@weight, 2, sd)
    )
    return(list(identified = identified, unidentified = unidentified))
  }

  sdpar <- list(
    mu = comp_cov(obj@par$mu, r),
    sigma = comp_cov(obj@par$sigma, s),
    sigmainv = comp_cov(obj@par$sigmainv, s)
  )
  # Same guard as in the Poisson variant: the weight trace is only read
  # when the indicators were sampled.
  if (!obj@model@indicfix) {
    identified <- list(par = sdpar, weight = apply(obj@weight, 2, sd))
  } else {
    identified <- list(par = sdpar)
  }
  list(identified = identified)
}

#' Calculate the std. dev. of the posterior from multivariate Student-t mixtures
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @param perm A logical indicating, if the samples have been re-labeled.
#' @return A list containing the standard deviations of the posterior 
#'   densities. 
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.studmult.Mcmcestimate" <- function(obj, perm) {
  # Covariance matrices of the sampled 'mu', 'sigma' and 'sigmainv' traces
  # and column-wise standard deviations of the 'df' and weight traces.
  #
  # obj:     S4 object with slots 'par' and 'model' (the latter with 'r',
  #          'K' and 'indicfix'); 'weight' is read unless the model has
  #          fixed indicators; 'parperm'/'weightperm' are read when 'perm'
  #          is TRUE.
  # perm:    logical; TRUE if 'obj' carries re-labeled samples.
  # returns: list with element 'identified' and, for perm = TRUE, also
  #          'unidentified' (computed from the raw traces).
  r <- obj@model@r
  K <- obj@model@K
  # Width of the stored 'sigma'/'sigmainv' traces; presumably the number of
  # unique entries of a symmetric r x r matrix -- TODO confirm.
  s <- r * (r + 1) / 2

  # Covariance of a trace: one matrix for K == 1, otherwise a d x d x K
  # array with one covariance matrix per slice of the third dimension.
  comp_cov <- function(trace, d) {
    if (K == 1) {
      return(cov(trace))
    }
    out <- array(numeric(), dim = c(d, d, K))
    for (k in seq_len(K)) {
      out[, , k] <- cov(trace[, , k])
    }
    out
  }

  if (perm) {
    identified <- list(
      par = list(
        mu = comp_cov(obj@parperm$mu, r),
        sigma = comp_cov(obj@parperm$sigma, s),
        sigmainv = comp_cov(obj@parperm$sigmainv, s),
        df = apply(obj@parperm$df, 2, sd)
      ),
      weight = apply(obj@weightperm, 2, sd)
    )
    unidentified <- list(
      par = list(
        mu = comp_cov(obj@par$mu, r),
        sigma = comp_cov(obj@par$sigma, s),
        sigmainv = comp_cov(obj@par$sigmainv, s),
        df = apply(obj@par$df, 2, sd)
      ),
      weight = apply(obj@weight, 2, sd)
    )
    return(list(identified = identified, unidentified = unidentified))
  }

  sdpar <- list(
    mu = comp_cov(obj@par$mu, r),
    sigma = comp_cov(obj@par$sigma, s),
    sigmainv = comp_cov(obj@par$sigmainv, s),
    df = apply(obj@par$df, 2, sd)
  )
  # Same guard as in the Poisson variant: the weight trace is only read
  # when the indicators were sampled.
  if (!obj@model@indicfix) {
    identified <- list(par = sdpar, weight = apply(obj@weight, 2, sd))
  } else {
    identified <- list(par = sdpar)
  }
  list(identified = identified)
}

#' Calculate the std. dev. for unidentified MCMC samples 
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution in case that no re-labeling has been 
#' performed.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @return A list containing the standard deviations of the posterior 
#'   densities in case of samples that are not re-labeled.
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.unidentified.Mcmcestimate" <- function(obj) {
  # Delegates unconditionally to the Poisson implementation, which reads
  # `obj@par$lambda` and `obj@weight`.
  # NOTE(review): no dispatch on `obj@model@dist` happens here, so mixtures
  # whose `par` list has no `lambda` entry presumably fail in the delegate --
  # confirm and add per-distribution variants if needed.
  .sdpost.unidentified.poisson.Mcmcestimate(obj)
}

#' Calculate the std. dev. for unidentified Poisson MCMC samples 
#' 
#' @description 
#' For internal usage only. This function calculates the standard deviations of 
#' the posterior parameter distribution in case that no re-labeling has been 
#' performed.
#' 
#' @param obj An `mcmcoutput` or `mcmcoutputperm` object containing the 
#'   sampled parameter values.
#' @return A list containing the standard deviations of the posterior 
#'   densities in case of samples that are not re-labeled.
#' @noRd
#' 
#' @seealso 
#' * [mcmcestimate()] for the calling function
".sdpost.unidentified.poisson.Mcmcestimate" <- function(obj) {
  # Column-wise standard deviations of the raw 'lambda' and weight traces,
  # reported under the single element 'unidentified'.
  list(
    unidentified = list(
      par = list(lambda = apply(obj@par$lambda, 2, sd)),
      weight = apply(obj@weight, 2, sd)
    )
  )
}
simonsays1980/finmix documentation built on Dec. 23, 2021, 2:25 a.m.
rdrr.io home R language documentation Run R code online
CRAN packages Bioconductor packages R-Forge packages GitHub packages
Note that we can't provide technical support on individual packages. You should contact the package authors for that.
simonsays1980/finmix
An R package for Bayesian estimation of finite mixture distributions

R/mcmcestimate.R
In simonsays1980/finmix: An R package for Bayesian estimation of finite mixture distributions

R Package Documentation

Browse R Packages

We want your feedback!

simonsays1980/finmix An R package for Bayesian estimation of finite mixture distributions

R/mcmcestimate.R In simonsays1980/finmix: An R package for Bayesian estimation of finite mixture distributions

R Package Documentation

Browse R Packages

We want your feedback!

simonsays1980/finmix
An R package for Bayesian estimation of finite mixture distributions

R/mcmcestimate.R
In simonsays1980/finmix: An R package for Bayesian estimation of finite mixture distributions