# R/ce_estimate_iptw_ate.R
# In CIMTx: Causal Inference for Multiple Treatments with a Binary Outcome
#
# Documented in ce_estimate_iptw_ate

#' Causal inference with multiple treatments using IPTW for ATE effects
#'
#' The function \code{ce_estimate_iptw_ate} implements
#' IPTW to estimate ATE effect with
#' multiple treatments using observational data.
#'
#' Inverse probability of treatment weights are obtained from a multinomial
#' logistic regression (\code{"IPTW-Multinomial"}), from
#' \code{twang::mnps} (\code{"IPTW-GBM"}) or from
#' \code{WeightIt::weightit} with \code{method = "super"}
#' (\code{"IPTW-SL"}). The outcome mean of each treatment group is the
#' weighted mean of \code{y} within that group, and every pair of groups is
#' compared on the risk difference (RD), relative risk (RR) and odds ratio
#' (OR) scales.
#'
#' Two settings are not formal arguments of this function; they are looked
#' up in the frame the function is called from:
#' \itemize{
#'   \item \code{trim_perc}: when a non-\code{NULL} value is found, the
#'   weights are passed through \code{trunc_fun(weights, trim_perc)} before
#'   the estimates are computed and \code{"-Trim"} is appended to the
#'   reported method.
#'   \item \code{sl_library}: only read for \code{"IPTW-SL"}; every entry
#'   must be the name of an \code{SL*} wrapper exported by
#'   \pkg{SuperLearner}.
#' }
#'
#' @param y A numeric vector (0, 1) representing a binary outcome.
#' @param w A numeric vector representing the treatment groups. Groups are
#' indexed by their sorted distinct values, so the usual coding
#' \code{1, 2, ..., K} maps onto itself.
#' @param x A dataframe, including all the covariates but not treatments.
#' @param method A character string. Users can select from the
#' following methods including \code{"IPTW-Multinomial"},
#' \code{"IPTW-GBM"}, \code{"IPTW-SL"}.
#' @param ... Other parameters that can be passed through to functions:
#' \code{twang::mnps} for \code{"IPTW-GBM"} and \code{WeightIt::weightit}
#' for \code{"IPTW-SL"}. They are not used by \code{"IPTW-Multinomial"}.
#'
#' @return A list of class \code{"CIMTx_IPTW"}. For every pair of treatment
#' groups \code{i < j} it holds an element named \code{ATEij}, a 3 x 1
#' matrix with rows \code{RD}, \code{RR}, \code{OR} and column \code{EST}.
#' It further holds \code{weight} (one weight per observation, in the order
#' of the input data), \code{method} and \code{estimand}.
#' A summary of the effect estimates can be obtained
#' with \code{summary} function. The weight distributions can be
#' visualized using \code{plot} function.
#' @importFrom nnet multinom
#' @importFrom WeightIt weightit
#' @references
#'
#' Venables, W. N. & Ripley, B. D. (2002)
#' \emph{Modern Applied Statistics with S}.
#' Fourth Edition. Springer, New York. ISBN 0-387-95457-0
#'
#' Matthew Cefalu, Greg Ridgeway, Dan McCaffrey,
#' Andrew Morral, Beth Ann Griffin and Lane Burgette (2021).
#' \emph{twang: Toolkit for Weighting and Analysis of Nonequivalent Groups}.
#' R package version 2.5. URL:\url{https://CRAN.R-project.org/package=twang}
#'
#' Noah Greifer (2021).
#' \emph{WeightIt: Weighting for Covariate Balance in Observational Studies}.
#' R package version 0.12.0.
#' URL:\url{https://CRAN.R-project.org/package=WeightIt}
ce_estimate_iptw_ate <- function(y, w, x, method, ...) {
  supported_methods <- c("IPTW-Multinomial", "IPTW-GBM", "IPTW-SL")
  if (!is.character(method) || length(method) != 1L ||
      !method %in% supported_methods) {
    # Previously an unknown method fell through every branch and the
    # function returned NULL without any diagnostic.
    stop(
      "method must be one of: ",
      paste0("\"", supported_methods, "\"", collapse = ", "),
      call. = FALSE
    )
  }
  if (length(y) != length(w)) {
    stop("y and w must have the same length", call. = FALSE)
  }

  # trim_perc (and sl_library below) are deliberately read from the calling
  # frame: that is the existing contract with the callers of this function.
  caller_env <- parent.frame()
  trim_perc <- caller_env$trim_perc

  xwdata <- as.data.frame(cbind(x, w = w))

  # Index the treatment groups by their sorted distinct values. This is the
  # order in which as.factor() lays out the levels, hence also the column
  # order of the fitted multinomial probabilities.
  trt_levels <- sort(unique(w))
  n_trt <- length(trt_levels)
  if (n_trt < 2L) {
    stop("w must contain at least two distinct treatment groups",
         call. = FALSE)
  }
  grp <- match(w, trt_levels)

  # One weight per observation, in the order of the input data. Only the
  # matching arm is evaluated, so sl_library is read for "IPTW-SL" only.
  weights <- switch(
    method,
    "IPTW-Multinomial" = .iptw_ate_weights_multinom(xwdata, grp),
    "IPTW-GBM" = .iptw_ate_weights_gbm(xwdata, names(x), ...),
    "IPTW-SL" = .iptw_ate_weights_sl(xwdata, caller_env$sl_library, ...)
  )

  trimmed <- !is.null(trim_perc)
  if (trimmed) {
    weights <- trunc_fun(weights, trim_perc)
  }

  # Weighted outcome mean within each treatment group
  mu_hat <- vapply(
    seq_len(n_trt),
    function(k) {
      in_grp <- grp == k
      sum(y[in_grp] * weights[in_grp]) / sum(weights[in_grp])
    },
    numeric(1)
  )

  result <- c(
    .iptw_ate_pairwise_effects(mu_hat),
    list(
      weight = weights,
      method = if (trimmed) paste0(method, "-Trim") else method,
      estimand = "ATE"
    )
  )
  class(result) <- "CIMTx_IPTW"
  result
}

# Inverse probability weights from a multinomial logistic regression of the
# treatment on all covariates. `grp` holds each subject's group index.
.iptw_ate_weights_multinom <- function(xwdata, grp) {
  ps_fit <- nnet::multinom(w ~ ., data = xwdata, trace = FALSE)
  ps <- stats::fitted(ps_fit)
  if (ncol(ps) == 1L) {
    # With two groups only the probability of the second one is returned.
    ps <- cbind(1 - ps, ps)
  }
  # Pick, for every subject, the fitted probability of the treatment that was
  # actually received. Matrix indexing keeps the weights aligned with the
  # rows of the data whatever the ordering of w is.
  received <- cbind(seq_along(grp), grp)
  stats::setNames(1 / ps[received], rownames(ps))
}

# ATE weights from generalized boosted models (twang::mnps); `...` carries
# the user's tuning arguments.
.iptw_ate_weights_gbm <- function(xwdata, covariates, ...) {
  xwdata$w <- as.factor(xwdata$w)
  ps_formula <- stats::as.formula(
    paste("w ~", paste(covariates, collapse = " + "))
  )
  ps_fit <- twang::mnps(ps_formula, data = xwdata, estimand = "ATE", ...)
  twang::get.weights(ps_fit, estimand = "ATE")
}

# ATE weights from WeightIt::weightit with a super learner; stops when
# sl_library names something that is not an exported SuperLearner wrapper.
.iptw_ate_weights_sl <- function(xwdata, sl_library, ...) {
  sl_exports <- getNamespaceExports("SuperLearner")
  sl_wrappers <- sl_exports[grepl(pattern = "^[S]L", sl_exports)]
  if (!all(sl_library %in% sl_wrappers)) {
    stop(
      "sl_library argument unrecognized; please use listWrappers() ",
      "in SuperLearner to find the list of supported values",
      call. = FALSE
    )
  }
  # A factor treatment, as in the GBM path, so that the groups are handled
  # as categories rather than as values of a continuous exposure.
  xwdata$w <- as.factor(xwdata$w)
  sl_fit <- WeightIt::weightit(
    w ~ .,
    data = xwdata,
    method = "super",
    estimand = "ATE",
    SL.library = sl_library,
    ...
  )
  sl_fit$weights
}

# RD, RR and OR for every pair i < j of group means, returned as a list of
# 3 x 1 matrices named "ATEij" in the order (1,2), (1,3), ..., (K-1,K).
.iptw_ate_pairwise_effects <- function(mu_hat) {
  pairs <- utils::combn(length(mu_hat), 2L, simplify = FALSE)
  effects <- lapply(pairs, function(p) {
    mu_i <- mu_hat[p[1]]
    mu_j <- mu_hat[p[2]]
    matrix(
      c(
        mu_i - mu_j,
        mu_i / mu_j,
        (mu_i / (1 - mu_i)) / (mu_j / (1 - mu_j))
      ),
      ncol = 1L,
      dimnames = list(c("RD", "RR", "OR"), "EST")
    )
  })
  names(effects) <- vapply(
    pairs,
    function(p) paste0("ATE", p[1], p[2]),
    character(1)
  )
  effects
}