R/ppoislogn.R
In flexCountReg: Estimation of a Variety of Count Regression Models

Documented in dpLnorm ppLnorm rpLnorm

#' Poisson-Lognormal Distribution
#'
#' These functions provide density, distribution function, quantile function,
#' and random number generation for the Poisson-Lognormal (PLogN) Distribution
#'
#'
#' @param x numeric value or a vector of values.
#' @param q quantile or a vector of quantiles.
#' @param p probability or a vector of probabilities.
#' @param n the number of random numbers to generate.
#' @param mean numeric value or vector of mean values for the distribution (the
#'   values have to be greater than 0).
#' @param sigma single value or vector of values for the sigma parameter of the
#'   lognormal distribution (the values have to be greater than 0).
#' @param ndraws the number of Halton draws to use for the integration.
#' @param log logical; if TRUE, probabilities p are given as log(p).
#' @param log.p logical; if TRUE, probabilities p are given as log(p).
#' @param lower.tail logical; if TRUE, probabilities p are \eqn{P[X\leq x]}
#'   otherwise, \eqn{P[X>x]}.
#' @param hdraws and optional vector of Halton draws to use for the integration.
#'
#' @details
#' \code{dpLnorm} computes the density (PDF) of the Poisson-Lognormal
#' Distribution.
#'
#' \code{ppLnorm} computes the CDF of the Poisson-Lognormal Distribution.
#'
#' \code{qpLnorm} computes the quantile function of the Poisson-Lognormal
#' Distribution.
#'
#' \code{rpLnorm} generates random numbers from the Poisson-Lognormal
#' Distribution.
#'
#' The compound Probability Mass Function (PMF) for the Poisson-Lognormal
#' distribution is:
#' \deqn{f(y|\mu,\theta,\alpha)=
#'   \int_0^\infty \frac{\mu^y x^y e^{-\mu x}}{y!} 
#'   \frac{exp\left(-\frac{ln^2(x)}{2\sigma^2} \right)}{x\sigma\sqrt{2\pi}}dx}
#'
#' Where \eqn{\sigma} is a parameter for the lognormal distribution with the
#' restriction \eqn{\sigma>0}, and \eqn{y} is a non-negative integer.
#'
#' The expected value of the distribution is:
#' \deqn{E[y]=e^{X\beta+\sigma^2/2} = \mu e^{\sigma^2/2}}
#' Halton draws are used to perform simulation over the lognormal distribution
#' to solve the integral.
#' 
#' @returns dpLnorm gives the density, ppLnorm gives the distribution 
#'  function, qpLnorm gives the quantile function, and rpLnorm generates
#'  random  deviates.
#' 
#'  The length of the result is determined by n for rpLnorm, and is the 
#'  maximum of the lengths of the numerical arguments for the other functions.
#'
#' @examples
#' dpLnorm(0, mean=0.75, sigma=2, ndraws=10)
#' ppLnorm(c(0,1,2,3,5,7,9,10), mean=0.75, sigma=2, ndraws=10)
#' qpLnorm(c(0.1,0.3,0.5,0.9,0.95), mean=0.75, sigma=2, ndraws=10)
#' rpLnorm(30, mean=0.75,  sigma=2, ndraws=10)
#'
#' @importFrom stats runif qnorm
#' @importFrom randtoolbox halton
#' @export
#' @name PoissonLognormal
#' 
#' @importFrom Rcpp sourceCpp
#' @useDynLib flexCountReg
#' @rdname PoissonLognormal
#' @export
dpLnorm <- function(x, mean=1, sigma=1, ndraws=1500, log=FALSE, hdraws=NULL){
  if (!is.null(hdraws)){
    h <- qnorm(hdraws)
  }else{
    h <- randtoolbox::halton(ndraws, normal=TRUE)
  }
  
  p <- dpLnorm_cpp(x, mean, sigma, h)
  
  if (log) return(log(p))
  else return(p)
}
#' @rdname PoissonLognormal
#' @export
ppLnorm <- function(
    q, mean=1, sigma=1, ndraws=1500, lower.tail=TRUE, log.p=FALSE){
  
  # Input Validation
  if(any(mean <= 0) || any(sigma <= 0)) 
    warning("The values of `mean` and `sigma` must be greater than 0.")
  
  # 1. Generate Halton draws ONCE for the entire batch
  h <- randtoolbox::halton(ndraws, normal=FALSE)
  
  # 2. Vectorization Setup
  n <- max(length(q), length(mean), length(sigma))
  q <- rep_len(q, n)
  mean <- rep_len(mean, n)
  sigma <- rep_len(sigma, n)
  
  cdf <- numeric(n)
  
  # 3. Efficient Calculation
  # Group by parameters to avoid redundant PMF calculations if parameters are
  # shared
  # (Simplest approach shown here: loop over N, but use pre-calculated 'h')
  
  for(i in 1:n) {
    if(is.na(q[i]) || q[i] < 0) {
      cdf[i] <- 0
      next
    }
    
    # Calculate PMF for 0 to q[i]
    # Pass the PRE-GENERATED 'h' (hdraws) to dpLnorm
    y_seq <- 0:floor(q[i])
    probs <- dpLnorm(y_seq, mean[i], sigma[i], ndraws=ndraws, hdraws=h)
    
    cdf[i] <- sum(probs)
  }
  
  if(!lower.tail) cdf <- 1-cdf
  if(log.p) return(log(cdf))
  return(cdf)
}

#' @rdname PoissonLognormal
#' @export
qpLnorm <- Vectorize(function(p, mean=1, sigma=1, ndraws=1500) {
  if (mean <= 0 || sigma <= 0) {
    msg <- paste('The values of `mean`  and `sigma` have to",
                 "have values greater than 0.')
    warning(msg)
  }
  
  y <- 0
  p_value <- ppLnorm(y, mean, sigma=sigma, ndraws=ndraws)
  while(p_value < p){
    y <- y + 1
    p_value <- ppLnorm(y, mean, sigma=sigma, ndraws=ndraws)
  }
  return(y)
})


#' @rdname PoissonLognormal
#' @export
rpLnorm <- function(n, mean=1, sigma=1, ndraws=1500) {
  if(mean<=0  || sigma<=0) {
    msg <- 
      'The values of `mean` and `sigma` have to have values greater than 0.'
    warning(msg)
  }
  
  u <- stats::runif(n)
  y <- vapply(
    X = u, 
    FUN = \(p) qpLnorm(p, mean, sigma = sigma, ndraws = ndraws), 
    FUN.VALUE = numeric(1))
    return(y)
}