R/sensitivity_functions.R

Defines functions: get_bayesian_bootweights, calculate_nder_stan, calculate_nder_fixed_u, calculate_u_prime, calculate_nder, extract_nder_gform, extract_nder_gcomp, make_prior, make_dd_prior, make_prior_shell, simulate_data, and collapse_do_list

Documented in make_prior and simulate_data

#' Take a list with design matrices and outcomes and collapse it down to
#' unique data observation patterns with observation weights \code{w}
#' 
#' Assumes that the primary outcome design matrix \code{do_list$designs$x_y} 
#' contains M and all adjustment covariates that appear in the U and M models,
#' so that deduplicating on \code{x_y} plus \code{y} uniquely determines the
#' rows of \code{x_u} and \code{x_m} as well.
#' 
#' @param do_list Named list containing \code{designs} list (with named matrices
#' \code{x_u}, \code{x_m}, and \code{x_y}) and \code{outcomes} list (with named
#' vectors \code{m} and \code{y}); see \code{\link{simulate_data}} for example
#' expected input (but without the \code{df} element)
#' @return Named list with \code{designs} sublist of collapsed design matrices,
#' \code{outcomes} sublist of collapsed outcome vectors, and \code{w}, a vector 
#' of integer counts of the observation frequency patterns. Note that individual
#' design matrices and/or outcome vectors may contain duplicate elements.
#' @export
collapse_do_list <- function(do_list) {
  
  # Basic input checking
  # (stopifnot on a vector condition requires every element to be TRUE)
  stopifnot(c("designs", "outcomes") %in% names(do_list))
  stopifnot(c("x_u", "x_m", "x_y") %in% names(do_list$designs))
  stopifnot(c("m", "y") %in% names(do_list$outcomes))
  # The intercept column "(i)" is repurposed below as the aggregation target
  stopifnot("(i)" %in%  colnames(do_list$designs$x_y))
  
  # Merge to get unique covariate and outcome combinations
  # NOTE(review): x_y is typically a matrix here; relies on aggregate()'s
  # formula method accepting it like a data frame -- confirm
  alltogether <- cbind(do_list$designs$x_y, y = do_list$outcomes$y)
  
  # Deduplicate and get count of observation patterns: summing the all-ones
  # intercept column "(i)" within each unique row pattern yields its frequency
  deduped <- aggregate(`(i)` ~ ., data = alltogether, FUN = sum)
  colnames(deduped)[colnames(deduped) == "(i)"] <- "count"
  # Restore the intercept column that was consumed as the aggregate LHS
  deduped[["(i)"]] <- 1
  
  # Include U as a collapsed outcome iff it was provided initially
  # NOTE(review): deduped[["u"]] is only populated when "u" is a column of
  # x_y (as in the power-prior path of make_prior) -- confirm for other callers
  if ("u" %in% names(do_list$outcomes)) {
    outcomes <- list(m = deduped[["m"]],
                     y = deduped[["y"]],
                     u = deduped[["u"]])
  } else {
    outcomes <- list(m = deduped[["m"]],
                     y = deduped[["y"]])
  }
  
  # Rebuild each design by selecting its original columns (by name) from the
  # deduplicated table; "w" carries the pattern frequencies
  return(list(designs = list(x_u = deduped[, colnames(do_list$designs$x_u)],
                             x_m = deduped[, colnames(do_list$designs$x_m)],
                             x_y = deduped[, colnames(do_list$designs$x_y)]),
              outcomes = outcomes,
              w = deduped$count))
}



#' Calculate bias of posterior mean in Stan parameter samples
#' 
#' @param estimate Length-P vector of estimates
#' @param truth Length-P vector of true parameter values
#' @return Length-P (unnamed) vector of estimated bias
#' @export
calculate_bias <- function(estimate, truth) {
  # Elementwise difference, with any names stripped
  unname(estimate - truth)
}



#' Calculate posterior mean in Stan parameter samples
#' 
#' @param samples SxP matrix with each column corresponding to a parameter, or
#' a plain vector of draws for a single parameter
#' @return Length-P vector of posterior means (scalar for vector input)
#' @export
calculate_post_mean <- function(samples) {
  # A bare vector is a single parameter's draws
  if (is.vector(samples)) {
    return(mean(samples))
  }
  # Otherwise average each parameter (column) separately
  colMeans(as.matrix(samples))
}



#' Make credible interval from Stan samples
#' 
#' Uses equal-tailed 95\% intervals (2.5th and 97.5th percentiles).
#' 
#' @param samples SxP matrix with each column corresponding to a parameter, or
#' a vector of draws for a single parameter
#' @return Length-2 vector or Px2 matrix of credible interval bounds
#' @export
make_ci <- function(samples) {
  one_dim <- is.vector(samples) || (length(dim(samples)) == 1)
  if (one_dim) {
    bounds <- quantile(samples, probs = c(0.025, 0.975))
  } else {
    bounds <- matrixStats::colQuantiles(as.matrix(samples),
                                        probs = c(0.025, 0.975))
  }
  # Strip the "2.5%"/"97.5%" names produced by quantile()
  names(bounds) <- NULL
  bounds
}



#' Function to calculate width of credible intervals
#' 
#' @param ci Length-2 vector (lower, upper) or Px2 matrix of interval bounds
#' @return Scalar or length-P (unnamed) vector of CI widths
#' @export
get_ci_width <- function(ci) {
  # Vector input: single interval; matrix input: one interval per row
  width <- if (is.vector(ci)) ci[2] - ci[1] else ci[, 2] - ci[, 1]
  unname(width)
}



#' Evaluate Y/N credible interval coverage
#' 
#' Coverage is strict: the truth must lie strictly inside the interval.
#' 
#' @param ci Length-2 vector or Px2 matrix of CI lower and upper bounds
#' @param truth Length-P vector of true parameter values
#' @return Length-P logical vector of interval coverage
#' @export
check_coverage <- function(ci, truth) {
  if (is.vector(ci)) {
    return(unname((ci[1] < truth) & (ci[2] > truth)))
  }
  (ci[, 1] < truth) & (ci[, 2] > truth)
}



#' Return true DGP parameters for binary-binary sensitivity simulations
#' 
#' @param u_ei 0/1 flag for whether U should be exposure-induced
#' @param am_intx 0/1 flag for including A*M interaction in outcome model
#' @param yu_strength Strength of U -> Y relationship on log-odds scale
#' @param mu_strength Strength of U -> M relationship on log-odds scale
#' @return Named list of parameter values (coefficient vectors are named by
#' design matrix column, with "(i)" denoting the intercept)
#' @export
return_dgp_parameters <- function(u_ei, am_intx, yu_strength, mu_strength) {
  stopifnot(c(u_ei, am_intx) %in% 0:1, is.numeric(c(yu_strength, mu_strength)))
  
  yu <- unname(as.numeric(yu_strength))
  mu <- unname(as.numeric(mu_strength))
  
  # U model gains an exposure coefficient when U is exposure-induced
  gamma_vals  <- c(-0.4, 0, 0)
  gamma_names <- c("(i)", "z1", "z2")
  if (u_ei == 1) {
    gamma_vals  <- c(gamma_vals, 1.5)
    gamma_names <- c(gamma_names, "a")
  }
  gamma <- setNames(gamma_vals, gamma_names)
  
  # Outcome model optionally includes the A*M interaction
  if (am_intx == 1) {
    alpha <- setNames(c(-2, 0.3, 0.2, 1, 0.8, 1, yu),
                      c("(i)", "z1", "z2", "a", "m", "a:m", "u"))
  } else {
    alpha <- setNames(c(-2, 0.3, 0.2, 1, 0.8, yu),
                      c("(i)", "z1", "z2", "a", "m", "u"))
  }
  
  list(u_ei     = u_ei,
       am_intx  = am_intx,
       pz1      = 0.5, 
       pz2      = 0.5, 
       gamma    = gamma,
       beta     = setNames(c(-1.5, 0.3, 0.2, 0.7, mu),
                           c("(i)", "z1", "z2", "a", "u")),
       alpha    = alpha,
       a_params = setNames(c(-0.2, 0.5, 0.7),
                           c("(i)", "z1", "z2")))
}



#' Construct all 4 possible combinations of binary Z1 and Z2
#' 
#' Row order is that of \code{expand.grid} (z1 varies fastest):
#' (0,0), (1,0), (0,1), (1,1). Downstream code relies on this ordering.
#' 
#' @return Named data frame of the baseline covariate types
#' @export
make_bl_types <- function() {
  grid <- expand.grid(z1 = 0:1, z2 = 0:1)
  grid
}



#' Calculate population prevalence of baseline covariate types
#' 
#' Z1 and Z2 are assumed independent, so each type's weight is the product
#' of the marginal probabilities.
#' 
#' @param bl_types Data frame containing the 4 unique covariate types
#' @param pz1 P(Z1 = 1)
#' @param pz2 P(Z2 = 1), assumed to be independent of Z1
#' @return Length-4 vector of type probabilities, in \code{bl_types} row order
#' @export
make_bl_weights <- function(bl_types, pz1, pz2) {
  stopifnot(NROW(bl_types) == 4)
  marg1 <- ifelse(bl_types$z1 == 1, pz1, 1 - pz1)
  marg2 <- ifelse(bl_types$z2 == 1, pz2, 1 - pz2)
  marg1 * marg2
}



#' Construct design matrix for unmeasured confounder regression model
#' Can depend on A or not
#' 
#' @param z1 Length-N vector for baseline confounder Z1
#' @param z2 Length-N vector for baseline confounder Z2
#' @param a Length-N vector for observed or hypothetical A
#' @param u_ei 0/1 flag for whether U should be exposure-induced
#' @return NxP design matrix for the U outcome model ("(i)" is the intercept;
#' the "a" column is present only when \code{u_ei == 1})
#' @export
make_x_u <- function(z1, z2, a, u_ei) {
  base_cols <- cbind(`(i)` = 1, z1, z2)
  if (u_ei == 1) {
    cbind(base_cols, a)
  } else if (u_ei == 0) {
    base_cols
  }
}



#' Construct design matrix for mediator regression model
#' 
#' @param z1 Length-N vector for baseline confounder Z1
#' @param z2 Length-N vector for baseline confounder Z2
#' @param a Length-N vector for observed or hypothetical A
#' @param u Length-N vector for observed (true) or hypothetical U
#' @param type Whether to make naive matrix excluding U ("observed", the
#' default) or full matrix that includes U ("full")
#' @return NxP design matrix for the M outcome model
#' @export
make_x_m <- function(z1, z2, a, u = NULL, type = c("observed", "full")) {
  # match.arg resolves the default vector to "observed" and rejects bad input;
  # previously a missing `type` fed a length-2 condition to if(), which errors
  # on R >= 4.2 (and an unrecognized type silently returned NULL)
  type <- match.arg(type)
  if (type == "full") {
    cbind(`(i)` = 1, z1, z2, a, u)
  } else {
    cbind(`(i)` = 1, z1, z2, a)
  }
}



#' Construct design matrix for outcome regression model
#' 
#' @param z1 Length-N vector for baseline confounder Z1
#' @param z2 Length-N vector for baseline confounder Z2
#' @param a Length-N vector for observed or hypothetical A
#' @param m Length-N vector for observed or hypothetical M
#' @param u Length-N vector for observed (true) or hypothetical U
#' @param type Whether to make naive matrix excluding U ("observed", the
#' default) or full matrix that includes U ("full")
#' @param am_intx 0/1 Whether to include A*M interaction
#' @return NxP design matrix for the Y outcome model; the interaction column
#' (when requested) is named "a:m" and U (when requested) comes last
#' @export
make_x_y <- function(z1, z2, a, m, u = NULL, type = c("observed", "full"),
                     am_intx) {
  # match.arg resolves the default vector to "observed" and rejects bad input;
  # previously a missing `type` fed a length-2 condition to if(), which errors
  # on R >= 4.2 (and an unrecognized type silently returned NULL)
  type <- match.arg(type)
  base <- cbind(`(i)` = 1, z1, z2, a, m)
  if (am_intx == 1) {
    base <- cbind(base, a * m)
    colnames(base)[ncol(base)] <- "a:m"
  }
  if (type == "full") {
    return(cbind(base, u))
  }
  base
}



#' Simulate data set
#' 
#' @param n Number of observations to simulate
#' @param u_ei 0/1 flag for whether U should be exposure-induced (ignored when
#' \code{params} is supplied)
#' @param am_intx 0/1 flag for A*M interaction in outcome model
#' @param yu_strength Log-OR of U in outcome model
#' @param mu_strength Log-OR of U in mediator model
#' @param params (Optional) List of data-generating parameters;
#' see \code{\link{return_dgp_parameters}} for details on structure
#' @return List containing: df (data frame with n rows),
#' outcomes (named list of m and y outcomes), and designs (named list of 
#' "observed"-type design matrices for the u, m, and y regression models)
#' @export
simulate_data <- function(n, u_ei, am_intx, yu_strength, mu_strength, params = NULL) {
  # Lazy evaluation: the flag arguments are only touched when params is NULL,
  # so callers supplying params may omit them entirely
  if (is.null(params)) {
    params <- return_dgp_parameters(u_ei = u_ei, am_intx = am_intx,
                                    yu_strength = yu_strength, 
                                    mu_strength = mu_strength)
  }
  
  # Baseline covariates and exposure
  z1 <- rbinom(n, size = 1, prob = params$pz1)
  z2 <- rbinom(n, size = 1, prob = params$pz2)
  a  <- rbinom(n, size = 1, prob = plogis(cbind(1, z1, z2) %*% params$a_params))
  
  # Unmeasured confounder
  x_u <- make_x_u(z1, z2, a, params$u_ei)
  u   <- rbinom(n, size = 1, prob = plogis(x_u %*% params$gamma))
  
  # Mediator: simulated from the full (U-inclusive) model, but the returned
  # design matrix is the naive "observed" version without U
  x_m_full <- make_x_m(z1, z2, a, u, type = "full")
  x_m      <- make_x_m(z1, z2, a, u, type = "observed")
  m        <- rbinom(n, size = 1, prob = plogis(x_m_full %*% params$beta))
  
  # Outcome: same full-vs-observed split as the mediator
  x_y_full <- make_x_y(z1, z2, a, m, u, type = "full", am_intx = params$am_intx)
  x_y      <- make_x_y(z1, z2, a, m, u, type = "observed", am_intx = params$am_intx)
  y        <- rbinom(n, size = 1, prob = plogis(x_y_full %*% params$alpha))
  
  list(df = data.frame(z1 = z1, z2 = z2, a = a, u = u, m = m, y = y),
       outcomes = list(y = y, m = m),
       designs = list(x_u = x_u, x_m = x_m, x_y = x_y))
}



#' Make template for prior distribution list
#' 
#' Each of alpha (Y model), beta (M model), and gamma (U model) gets a
#' placeholder sublist with \code{mean} and \code{vcov} slots.
#' 
#' @return Empty list with correct naming structure
make_prior_shell <- function() {
  empty_slot <- list(mean = NA, vcov = NA)
  list(alpha = empty_slot,
       beta  = empty_slot,
       gamma = empty_slot)
}



#' Make binary-binary data driven prior based on simulated or real external data
#' 
#' Make a list of prior mean and variance-covariance matrices using an external
#' data source. Assumes binary mediator and binary outcome (for now). The M and
#' Y models are fit with U appended as a final regressor, so their coefficient
#' vectors are one element longer than the corresponding design matrices.
#' 
#' @param small_data Data list with data set on which to base prior information 
#' (see \code{\link{simulate_data}} for format; must include \code{df$u})
#' @param partial_vague Whether or not to inflate prior variance for more 
#' identified parameters
#' @param inflate_factor Variance inflation factor (required if 
#' partial_vague = TRUE)
#' @return Named list with prior means and variances
#' @export
make_dd_prior <- function(small_data, partial_vague, inflate_factor = NULL) {
  
  # Fail early with a clear message instead of a cryptic sqrt(NULL) error
  if (partial_vague) {
    stopifnot(is.numeric(inflate_factor), inflate_factor > 0)
  }
  
  # Fit maximum likelihood models to small data set; -1 drops R's implicit
  # intercept because the design matrices carry their own "(i)" column
  fit_m <- glm(small_data$df$m ~ -1 + small_data$designs$x_m + small_data$df$u, 
               family = binomial(link = "logit"))
  fit_y <- glm(small_data$df$y ~ -1 + small_data$designs$x_y + small_data$df$u, 
               family = binomial(link = "logit"))
  fit_u <- glm(small_data$df$u ~ -1 + small_data$designs$x_u, 
               family = binomial(link = "logit"))
  
  # Set prior means and extract covariance matrices
  prior <- make_prior_shell()
  prior[["alpha"]][["mean"]] <- unname(coef(fit_y))
  prior[["beta"]][["mean"]]  <- unname(coef(fit_m))
  prior[["gamma"]][["mean"]] <- unname(coef(fit_u))
  a_vcov <- unname(vcov(fit_y))
  b_vcov <- unname(vcov(fit_m))
  g_vcov <- unname(vcov(fit_u))
  
  if (partial_vague) {
    # Inflate all variances and covariances by inflate_factor,
    # EXCEPT u-related parameters, which are all in the last row/column
    # (and obviously gamma is u-related, so it is left untouched)
    sd_inflate <- sqrt(inflate_factor)
    a_vcov <- a_vcov * inflate_factor
    a_vcov[, ncol(a_vcov)] <- a_vcov[, ncol(a_vcov)] / sd_inflate
    a_vcov[nrow(a_vcov), ] <- a_vcov[nrow(a_vcov), ] / sd_inflate
    
    b_vcov <- b_vcov * inflate_factor
    b_vcov[, ncol(b_vcov)] <- b_vcov[, ncol(b_vcov)] / sd_inflate
    b_vcov[nrow(b_vcov), ] <- b_vcov[nrow(b_vcov), ] / sd_inflate
  }
  
  # Set prior covariance matrices
  prior[["alpha"]][["vcov"]] <- a_vcov
  prior[["beta"]][["vcov"]]  <- b_vcov
  prior[["gamma"]][["vcov"]] <- g_vcov
  
  # Apply names. The Y and M fits include the extra U coefficient, so append
  # "u" to the design column names; previously the names vector was one short,
  # which silently left the last coefficient with an NA name
  names(prior[["alpha"]][["mean"]]) <- c(colnames(small_data$designs$x_y), "u")
  names(prior[["beta"]][["mean"]])  <- c(colnames(small_data$designs$x_m), "u")
  names(prior[["gamma"]][["mean"]]) <- colnames(small_data$designs$x_u)
  
  return(prior)
}



#' Construct prior list based on type of sensitivity analysis
#' 
#' @param params List of parameters (required for "unit", "partial", "strict")
#' @param prior_type Variance type: unit variance ("unit"), informative priors 
#' on non-identifiable parameters ("partial"), strong prior information 
#' ("strict"), data-driven ("dd") based on external or simulated data set, or
#' data pooling/power prior ("powerprior") based on the external or simulated 
#' data set
#' @param dd_control Named list of data-driven options. Supply EITHER
#' "small_data" formatted as output from \code{\link{simulate_data}}, OR both
#' "params" (as from \code{\link{return_dgp_parameters}}) and "small_n" to
#' simulate a secondary data source. Optional entries "partial_vague" and
#' "inflate_factor" override the prior_type-specific defaults.
#' @return Named list of prior means and variance-covariance matrices
#' @export
make_prior <- function(params, prior_type = c("unit", "partial", "strict", "dd", 
                                              "powerprior"),
                       dd_control = NULL) {

  # BUG FIX: resolve/validate prior_type. With the default vector, the original
  # code ran if() on a length-5 logical, which errors on R >= 4.2
  prior_type <- match.arg(prior_type)
  
  if (prior_type %in% c("unit", "partial", "strict")) {
    if (is.null(params)) {
      stop("Need to supply underlying parameters for this prior_type")
    }
    P_y <- length(params$alpha)
    P_m <- length(params$beta)
    P_u <- length(params$gamma)
    
    # Initialize container
    prior <- make_prior_shell()
    
    # Set prior means to be truth
    prior[["alpha"]][["mean"]] <- params$alpha
    prior[["beta"]][["mean"]]  <- params$beta
    prior[["gamma"]][["mean"]] <- params$gamma
    
    # Set prior variances according to specification
    if (prior_type == "unit") {
      prior[["alpha"]][["vcov"]] <- diag(P_y)
      prior[["beta"]][["vcov"]]  <- diag(P_m)
      prior[["gamma"]][["vcov"]] <- diag(P_u)
    } else if (prior_type == "partial") {
      # Only the U-related (trailing) coefficients get tight priors; with an
      # A*M interaction the last two alpha entries are U-related
      aa <- ifelse(params$am_intx == 1, 2, 1)
      prior[["alpha"]][["vcov"]] <- diag(c(rep(1, P_y - aa), rep(0.001, aa)))
      prior[["beta"]][["vcov"]]  <- diag(c(rep(1, P_m - 1), 0.001))
      prior[["gamma"]][["vcov"]] <- diag(P_u) * 0.001
    } else if (prior_type == "strict") {
      prior[["alpha"]][["vcov"]] <- diag(P_y) * 0.001
      prior[["beta"]][["vcov"]]  <- diag(P_m) * 0.001
      prior[["gamma"]][["vcov"]] <- diag(P_u) * 0.001
    }
    
    # Apply names
    names(prior[["alpha"]][["mean"]]) <- names(params$alpha)
    names(prior[["beta"]][["mean"]])  <- names(params$beta)
    names(prior[["gamma"]][["mean"]]) <- names(params$gamma)
    
  } else if (prior_type %in% c("dd", "powerprior")) {
    
    if (is.null(dd_control)) {
      stop("Need to specify input data set or simulation parameters for dd")
    }
    
    # Basic option checks
    valid_options <- c("params", "small_n", "small_data", 
                       "partial_vague", "inflate_factor")
    opts_given <- names(dd_control)
    stopifnot(opts_given %in% valid_options)
    
    # BUG FIX: the original branch chain used a length-2 condition with &&
    # (an error on R >= 4.3) and its final else unconditionally stopped
    # whenever small_data WAS supplied
    has_data <- "small_data" %in% opts_given
    has_sim  <- all(c("params", "small_n") %in% opts_given)
    if (has_data && any(c("params", "small_n") %in% opts_given)) {
      stop("Can only specify small_data OR params and small_n")
    } else if (has_sim) {
      dd_control$small_data <- simulate_data(n = dd_control$small_n, 
                                             params = dd_control$params)
    } else if (!has_data) {
      stop("Need to specify input data set or simulation parameters for dd")
    }
    
    # Defaults: "dd" inflates identified-parameter variances; the power prior
    # uses the external data at face value
    if (is.null(dd_control$partial_vague)) {
      dd_control$partial_vague <- (prior_type == "dd")
    }
    if (is.null(dd_control$inflate_factor)) {
      dd_control$inflate_factor <- if (prior_type == "dd") 100 else 1
    }
    
    prior <- make_dd_prior(small_data = dd_control$small_data, 
                           partial_vague = dd_control$partial_vague,
                           inflate_factor = dd_control$inflate_factor)
    
    # Also pass back small data set if doing power prior: U is promoted to an
    # outcome and appended to the M and Y designs, then the list is collapsed
    if (prior_type == "powerprior") {
      small_dl <- dd_control$small_data
      small_dl$outcomes$u <- small_dl$df$u
      small_dl$designs$x_m <- cbind(small_dl$designs$x_m, u = small_dl$df$u)
      small_dl$designs$x_y <- cbind(small_dl$designs$x_y, u = small_dl$df$u)
      prior$small_cdo <- collapse_do_list(do_list = small_dl)
    }
  }
  
  # Return
  return(prior)
}



#' Function to extract g-computation estimate of (r)NDE from Stan fit
#' 
#' @param stan_fit Result from bin_bin_sens_stan
#' @param statistic Posterior point estimate to report: "mean" (default) or
#' "median". (Previously this argument was accepted but silently ignored.)
#' @return Vector with scalar point estimate and 95\% CI
#' @export
extract_nder_gcomp <- function(stan_fit, statistic = "mean") {
  statistic <- match.arg(statistic, c("mean", "median"))
  samples <- unlist(extract(stan_fit, pars = "meffects[1]"))
  # Honor the requested posterior summary (default reproduces old behavior)
  pe <- switch(statistic,
               mean   = mean(samples),
               median = median(samples))
  ci <- make_ci(samples)
  return(c(pe, ci))
}



#' Calculate g-formula with Bayesian bootstrap version of (r)NDE
#' 
#' @param stan_fit Stan fit from bin_bin_sens_stan result list
#' @param df Data frame for bootstrapping covariates
#' @param u_ei Whether U is exposure-induced
#' @param am_intx Whether to include A-M interaction in Y model
#' @return Vector with scalar point estimate and 95\% CI
#' @export
extract_nder_gform <- function(stan_fit, df, u_ei, am_intx) {
  # K covariate patterns x R posterior draws of the conditional NDER
  draws_kr <- calculate_nder_stan(stan_fit, u_ei, am_intx)
  n_draws <- length(colMeans(draws_kr))
  # One Dirichlet weight vector over patterns per posterior draw
  wts <- get_bayesian_bootweights(df, R = n_draws)
  nder_draws <- colSums(wts * draws_kr)
  ci <- make_ci(nder_draws)
  c(mean(nder_draws), ci)
}



#' Calculate randomized interventional analog to natural direct effect
#'
#' Either \code{params} or all of \code{u_ei}, \code{am_intx},
#' \code{yu_strength}, and \code{mu_strength} must be supplied. When
#' \code{params} is supplied, its coefficient vectors override any
#' \code{alpha}/\code{beta}/\code{gamma} passed directly.
#'
#' @param params List of parameters (optional)
#' @param alpha Vector of Y regression coefficients (optional) 
#' @param beta Vector of M regression coefficients (optional) 
#' @param gamma Vector of U regression coefficients (optional)
#' @param u_ei Whether U is exposure-induced (optional if in \code{params})
#' @param am_intx Whether exposure-M interaction in outcome (optional if in
#' \code{params})
#' @param yu_strength U coefficient in Y regression (optional)
#' @param mu_strength U coefficient in M regression (optional)
#' @param z1 Vector containing levels of z1 covariate to evaluate conditional NDER
#' @param z2 Vector containing levels of z2 covariate to evaluate conditional NDER
#' @param mean Whether to average over covariate patterns (defaults FALSE)
#' @param weights Vector of weights for z1 and z2 combinations (optional). Default is to 
#' give every combination equal weight
#' @return Length-K vector of conditional NDERs, for each of K covariate
#' patterns (scalar if \code{mean = TRUE})
#' @export
calculate_nder <- function(params = NULL, 
                           alpha = NULL, beta = NULL, gamma = NULL, 
                           u_ei = NULL, am_intx = NULL, 
                           yu_strength = NULL, mu_strength = NULL,
                           z1 = 0:1, z2 = 0:1, mean = FALSE, weights = NULL) {
  
  if ((is.null(u_ei) | is.null(am_intx) | is.null(yu_strength) | 
       is.null(mu_strength)) & (is.null(params))) {
    stop("Need to specify u_ei, am_intx, yu_strength, and mu_strength if not 
         supplying params")
  }
  
  if (is.null(params)) {
    params  <- return_dgp_parameters(u_ei, am_intx, yu_strength, mu_strength)
    if (is.null(alpha)) {
      alpha <- params$alpha
    }
    if (is.null(beta)) {
      beta  <- params$beta
    }
    if (is.null(gamma)) {
      gamma <- params$gamma
    }
  } else {
    alpha <- params$alpha
    beta  <- params$beta
    gamma <- params$gamma
    # BUG FIX: previously u_ei and am_intx were left NULL when only params was
    # supplied, which broke the design matrix construction below
    if (is.null(u_ei)) {
      u_ei <- params$u_ei
    }
    if (is.null(am_intx)) {
      am_intx <- params$am_intx
    }
  }
  
  # All combinations of requested covariates, hypothetical U in the Y model,
  # and M; bl_type indexes the 4 baseline covariate patterns
  df <- expand.grid(z1 = z1, z2 = z2, u_for_y = 0:1, m = 0:1)
  bl_types <- make_bl_types()
  bl_types$bl_type <- seq_len(NROW(bl_types))
  if (mean == TRUE & is.null(weights)) {
    bl_types$weights <- 1 / NROW(bl_types)
  } else if (!is.null(weights)) {
    stopifnot(length(weights) == NROW(bl_types))
    bl_types$weights <- weights
  }
  df <- merge(df, bl_types, by = c("z1", "z2"))
  
  # for a = 0 world
  pu1_a0 <- plogis(make_x_u(df$z1, df$z2, a = 0, u_ei) %*% gamma)
  pu_for_y_a0 <- ifelse(df$u_for_y == 1, pu1_a0, 1 - pu1_a0)
  
  # for randomized intervention on m (only matters in a = 0 world):
  # marginalize the M model over the U distribution
  pm1_a0u0 <- plogis(make_x_m(df$z1, df$z2, a = 0, u = 0, "full") %*% beta)
  pm1_a0u1 <- plogis(make_x_m(df$z1, df$z2, a = 0, u = 1, "full") %*% beta)
  pm1_a0   <- pm1_a0u1 * pu1_a0 + pm1_a0u0 * (1 - pu1_a0)
  pm_a0    <- ifelse(df$m == 1, pm1_a0, 1 - pm1_a0)
  
  # for a = 1 world
  pu1_a1 <- plogis(make_x_u(df$z1, df$z2, a = 1, u_ei) %*% gamma)
  pu_for_y_a1 <- ifelse(df$u_for_y == 1, pu1_a1, 1 - pu1_a1)
  
  # mean y for covariate/m/u combinations
  ey_cf1 <- plogis(make_x_y(df$z1, df$z2, a = 1, df$m, df$u_for_y, "full", am_intx) 
                   %*% alpha)
  ey_cf2 <- plogis(make_x_y(df$z1, df$z2, a = 0, df$m, df$u_for_y, "full", am_intx)
                   %*% alpha)
  
  # CF1 : E[Y(a = 1, u = u(a = 1), m = g(a = 0))]
  w1 <- pm_a0 * pu_for_y_a1
  ECF1 <- vapply(bl_types$bl_type, function(type) {
    weighted.mean(ey_cf1[df$bl_type == type], w = w1[df$bl_type == type])
  }, numeric(1))
  
  # CF2 : E[Y(a = 0, u = u(a = 0), m = g(a = 0))]
  w2 <- pm_a0 * pu_for_y_a0
  ECF2 <- vapply(bl_types$bl_type, function(type) {
    weighted.mean(ey_cf2[df$bl_type == type], w = w2[df$bl_type == type])
  }, numeric(1))
  
  # Return
  if (mean == TRUE) {
    return(weighted.mean(ECF1 - ECF2, w = bl_types$weights))
  } else {
    return(ECF1 - ECF2)
  }
}



#' Calculate u_prime as true underlying population average value for u
#' 
#' Averages P(U = 1 | Z1, Z2) over the population distribution of the
#' baseline covariate types.
#' 
#' @param params List of true DGP
#' @return Scalar mean u for the interaction bias correction eval
#' @export
calculate_u_prime <- function(params) {
  design <- cbind(1, make_bl_types())
  # Population weight for each covariate pattern (Z1 and Z2 independent)
  type_wt <- ifelse(design$z1 == 1, params$pz1, 1 - params$pz1) * 
             ifelse(design$z2 == 1, params$pz2, 1 - params$pz2)
  # When U is exposure-induced, drop the trailing "a" coefficient (a = 0)
  gamma_use <- if (params$u_ei == 1) {
    head(params$gamma, length(params$gamma) - 1)
  } else {
    params$gamma
  }
  lp <- as.matrix(design) %*% gamma_use
  weighted.mean(plogis(lp), w = type_wt)
}



#' Calculate randomized interventional analog to natural direct effect
#' at a fixed level of u (u')
#'
#' Should not be used for exposure-induced U. Either \code{params} or all of
#' \code{u_ei}, \code{am_intx}, \code{yu_strength}, and \code{mu_strength}
#' must be supplied; when \code{params} is supplied its coefficient vectors
#' take precedence.
#'
#' @param params List of parameters (optional)
#' @param alpha Vector of Y regression coefficients (optional) 
#' @param beta Vector of M regression coefficients (optional) 
#' @param gamma Vector of U regression coefficients (optional)
#' @param u_ei Whether U is exposure-induced (optional if in \code{params})
#' @param am_intx Whether exposure-M interaction in outcome (optional if in
#' \code{params})
#' @param yu_strength U coefficient in Y regression (optional)
#' @param mu_strength U coefficient in M regression (optional)
#' @param z1 Vector containing levels of z1 covariate to evaluate conditional NDER
#' @param z2 Vector containing levels of z2 covariate to evaluate conditional NDER
#' @param u_prime Value at which to fix u (required)
#' @param mean Whether to average over covariate patterns (defaults FALSE)
#' @param weights Vector of weights for z1 and z2 combinations (optional). Default is to 
#' give every combination equal weight
#' @return Length-K vector of conditional NDERs, for each of K covariate
#' patterns (scalar if \code{mean = TRUE})
#' @export
calculate_nder_fixed_u <- function(params = NULL, 
                                   alpha = NULL, beta = NULL, gamma = NULL, 
                                   u_ei = NULL, am_intx = NULL, 
                                   yu_strength = NULL, mu_strength = NULL,
                                   z1 = 0:1, z2 = 0:1, 
                                   u_prime = NULL, 
                                   mean = FALSE, weights = NULL) {
  
  if ((is.null(u_ei) | is.null(am_intx) | is.null(yu_strength) | 
       is.null(mu_strength)) & (is.null(params))) {
    stop("Need to specify u_ei, am_intx, yu_strength, and mu_strength if not 
         supplying params")
  }
  # Fail clearly rather than propagating a NULL through expand.grid below
  if (is.null(u_prime)) {
    stop("Need to supply u_prime")
  }
  
  if (is.null(params)) {
    params  <- return_dgp_parameters(u_ei, am_intx, yu_strength, mu_strength)
    if (is.null(alpha)) {
      alpha <- params$alpha
    }
    if (is.null(beta)) {
      beta  <- params$beta
    }
    if (is.null(gamma)) {
      gamma <- params$gamma
    }
  } else {
    alpha <- params$alpha
    beta  <- params$beta
    gamma <- params$gamma
    # BUG FIX: pull flags from params when not given directly; previously they
    # stayed NULL and broke the warning check and design construction
    if (is.null(u_ei)) {
      u_ei <- params$u_ei
    }
    if (is.null(am_intx)) {
      am_intx <- params$am_intx
    }
  }
  
  # BUG FIX: this check originally ran before u_ei was resolved, so
  # `if (NULL == 1)` raised a length-zero-condition error
  if (isTRUE(u_ei == 1)) {
    warning("rNDE has strange interpretation if U is exposure-induced!")
  }
  
  # All combinations of requested covariates and M, with U fixed at u_prime
  df <- expand.grid(z1 = z1, z2 = z2, u_for_y = u_prime, m = 0:1)
  bl_types <- make_bl_types()
  bl_types$bl_type <- seq_len(NROW(bl_types))
  if (mean == TRUE & is.null(weights)) {
    bl_types$weights <- 1 / NROW(bl_types)
  } else if (!is.null(weights)) {
    stopifnot(length(weights) == NROW(bl_types))
    bl_types$weights <- weights
  }
  df <- merge(df, bl_types, by = c("z1", "z2"))
  
  # for randomized intervention on m (only matters in a = 0 world)
  pm1_a0 <- plogis(make_x_m(df$z1, df$z2, a = 0, u = u_prime, "full") %*% beta)
  pm_a0  <- ifelse(df$m == 1, pm1_a0, 1 - pm1_a0)
  
  # mean y for covariate/m/u combinations
  ey_cf1 <- plogis(make_x_y(df$z1, df$z2, a = 1, df$m, df$u_for_y, "full", am_intx) 
                   %*% alpha)
  ey_cf2 <- plogis(make_x_y(df$z1, df$z2, a = 0, df$m, df$u_for_y, "full", am_intx)
                   %*% alpha)
  
  # CF1 : E[Y(a = 1, u = u_prime, m = g(a = 0))]
  w1 <- pm_a0
  ECF1 <- vapply(bl_types$bl_type, function(type) {
    weighted.mean(ey_cf1[df$bl_type == type], w = w1[df$bl_type == type])
  }, numeric(1))
  
  # CF2 : E[Y(a = 0, u = u_prime, m = g(a = 0))]
  w2 <- pm_a0
  ECF2 <- vapply(bl_types$bl_type, function(type) {
    weighted.mean(ey_cf2[df$bl_type == type], w = w2[df$bl_type == type])
  }, numeric(1))
  
  # Return
  if (mean == TRUE) {
    return(weighted.mean(ECF1 - ECF2, w = bl_types$weights))
  } else {
    return(ECF1 - ECF2)
  }
}



#' Calculate (r)NDE from Stan sensitivity analysis fit
#' 
#' Not simulation-based! Closed form, g-formula.
#' Returns conditional on specific z1, z2 values.
#' 
#' @param stan_fit Result list with element stan_fit containing the stan fit
#' @param u_ei Whether unmeasured confounder is exposure-induced
#' @param am_intx Whether outcome model includes exposure-mediator interaction
#' @param \dots Parameters to pass to \code{\link{calculate_nder}}
#' @return K x R matrix of conditional NDER values for the K covariate patterns requested
#' from R MCMC iterations (excludes warmup)
#' @export
calculate_nder_stan <- function(stan_fit, u_ei, am_intx, ...) {
  alpha_draws <- extract(stan_fit, pars = "alpha")[["alpha"]]
  beta_draws  <- extract(stan_fit, pars = "beta")[["beta"]]
  gamma_draws <- extract(stan_fit, pars = "gamma")[["gamma"]]
  p_alpha <- ncol(alpha_draws)
  p_beta  <- ncol(beta_draws)
  
  # One conditional NDER vector per posterior draw; the last alpha and beta
  # coefficients are the U sensitivity parameters
  sapply(seq_len(nrow(alpha_draws)), function(r) {
    calculate_nder(params = NULL, 
                   alpha = alpha_draws[r, ], 
                   beta = beta_draws[r, ], 
                   gamma = gamma_draws[r, ], 
                   u_ei = u_ei, am_intx = am_intx,
                   yu_strength = alpha_draws[r, p_alpha], 
                   mu_strength = beta_draws[r, p_beta],
                   ...)
  })
}



#' Make matrix of covariate pattern weights for Bayesian bootstrap
#' 
#' Draws Dirichlet weight vectors over the 4 baseline covariate patterns by
#' normalizing independent Gamma(count, 1) draws within each replicate.
#' 
#' @param dat Data frame containing z1 and z2
#' @param R Number of weight replicates to draw
#' @return K x R matrix with dirichlet weights in columns (K = 4 right now),
#' rows ordered to match \code{make_bl_types()}
get_bayesian_bootweights <- function(dat, R = 1) {
  # Pattern order must match make_bl_types() / calculate_nder() row order:
  # (0,0), (1,0), (0,1), (1,1) -- inlined here so the alignment is explicit
  poss_patterns <- expand.grid(z1 = 0:1, z2 = 0:1)
  dat$.one <- 1
  obs_patterns <- aggregate(.one ~ z1 + z2, FUN = NROW, data = dat)
  
  # BUG FIX: merge() sorts rows by (z1, z2), silently permuting the counts
  # relative to the expand.grid pattern order (rows 2 and 3 swapped);
  # match() keeps counts aligned with poss_patterns
  idx <- match(paste(poss_patterns$z1, poss_patterns$z2),
               paste(obs_patterns$z1, obs_patterns$z2))
  counts <- obs_patterns$.one[idx]
  counts[is.na(counts)] <- 0
  
  # Gamma(shape = count, scale = 1) draws; a zero count yields exactly 0
  bootweights <- replicate(R, rgamma(n = length(counts), shape = counts, 
                                     scale = 1))
  
  # Normalize each replicate (column) to sum to 1.
  # BUG FIX: diag(x, nrow = R) is required -- with R = 1, diag(scalar) would
  # build an identity matrix of that (truncated) size instead of a 1x1 matrix
  return(bootweights %*% diag(1 / colSums(bootweights), nrow = R))
}
lcomm/rstanmed documentation built on Dec. 6, 2020, 9:11 a.m.