# R/nonprob_dr.R
# In nonprobsvy: Inference Based on Non-Probability Samples

#' Doubly robust (DR) estimation for non-probability samples (internal)
#'
#' Fits the outcome model via `nonprob_mi()` and the selection model via
#' `nonprob_ipw()`, and combines both through `mu_hatDR()`. Two paths exist:
#'
#' * `control_inference$vars_selection` and `control_inference$vars_combine`
#'   both `TRUE`: the variables kept by either model are pooled and, per
#'   outcome, either the joint estimating equations (`u_theta_beta_dr`) are
#'   solved with `nleqslv::nleqslv()` (when `control_inference$bias_correction`
#'   is `TRUE`) or both models are refitted on the pooled variables.
#' * otherwise: both models are fitted once on the formulas as supplied.
#'
#' Standard errors are computed when `se = TRUE`, either analytically or with
#' `boot_dr()` depending on `control_inference$var_method`.
#'
#' Bias correction is only implemented on the variable-combination path; it
#' is rejected up front when that path is not active.
#'
#' @return A list of class `"nonprob"` holding the estimates (`output`),
#'   standard errors (`SE`), confidence intervals, fitted model objects,
#'   weights and predictions.
#'
#' @useDynLib nonprobsvy
#' @import Rcpp
#' @importFrom stats glm.fit
#' @importFrom stats model.frame
#' @importFrom stats model.matrix
#' @importFrom stats update
#' @importFrom stats qnorm
#' @importFrom stats binomial
#' @importFrom stats terms
#' @importFrom stats reformulate
#' @importFrom stats coef
#' @importFrom survey svytotal
#' @importFrom ncvreg cv.ncvreg
#' @importFrom MASS ginv
#' @importFrom Rcpp evalCpp
#' @importFrom formula.tools rhs
#' @importFrom formula.tools lhs
#' @noRd
nonprob_dr <- function(selection,
                       outcome,
                       data,
                       svydesign,
                       pop_totals,
                       pop_means,
                       pop_size,
                       method_selection,
                       method_outcome,
                       family_outcome,
                       strata,
                       case_weights,
                       na_action,
                       control_selection,
                       control_outcome,
                       control_inference,
                       start_outcome,
                       start_selection,
                       verbose,
                       se,
                       pop_size_fixed,
                       ...) {

  ## setting for the IPW
  method <- switch(method_selection,
                   "logit" = method_ps("logit"),
                   "probit" = method_ps("probit"),
                   "cloglog" = method_ps("cloglog"))

  estimation_method <- est_method_ipw(control_selection$est_method)

  ## multiple outcomes
  outcomes <- make_outcomes(outcome)
  output <- list()

  confidence_interval <- list()
  SE_values <- list()

  bias_corr <- control_inference$bias_correction

  ## scalar condition, hence `&&`
  combine_vars <- control_inference$vars_selection && control_inference$vars_combine

  ## The bias-corrected quantities returned at the end are only produced on the
  ## variable-combination path; fail early with a clear message instead of an
  ## "object not found" error after all models have been fitted.
  if (isTRUE(bias_corr) && !combine_vars) {
    stop("Bias correction requires `vars_selection = TRUE` and `vars_combine = TRUE` in `control_inference`.",
         call. = FALSE)
  }

  ## defined up front so that it exists even when no bootstrap is run
  boot_obj <- NULL

  # variable selection and combination --------------------------------------

  if (combine_vars) {

    ## estimate the mi
    if (verbose) {
      cat("MI variable selection in progress...\n")
    }

    results_mi <- nonprob_mi(outcome = outcome,
                             data = data,
                             svydesign = svydesign,
                             pop_totals = pop_totals,
                             pop_means = pop_means,
                             pop_size = pop_size,
                             method_outcome = method_outcome,
                             family_outcome = family_outcome,
                             strata = strata,
                             case_weights = case_weights,
                             na_action = na_action,
                             control_outcome = control_outcome,
                             control_inference = control_inference,
                             start_outcome = start_outcome,
                             verbose = verbose,
                             se = FALSE,
                             pop_size_fixed = pop_size_fixed)

    if (verbose) {
      cat("IPW variable selection in progress...\n")
    }

    results_ipw <- nonprob_ipw(selection = selection,
                               target = reformulate(outcomes[[1]]),
                               data = data,
                               svydesign = svydesign,
                               pop_totals = pop_totals,
                               pop_means = pop_means,
                               pop_size = pop_size,
                               method_selection = method_selection,
                               strata = strata,
                               case_weights = case_weights,
                               na_action = na_action,
                               control_selection = control_selection,
                               control_inference = control_inference,
                               start_selection = start_selection,
                               verbose = verbose,
                               se = FALSE,
                               pop_size_fixed = pop_size_fixed)

    ## variables kept by each model; the DR set is their union (no intercept)
    ipw_coefs_sel <- names(results_ipw$selection$coefficients)
    mi_coefs_sel <- lapply(results_mi$outcome, coef)
    dr_coefs_sel <- lapply(mi_coefs_sel, function(x) {
      mi_cols <- names(x[abs(x) > 0])
      combined <- sort(base::union(ipw_coefs_sel, mi_cols))
      combined[!grepl("Intercept", combined)]
    })

    if (verbose) {
      cat("IPW vars selected:", ipw_coefs_sel, "\n")
      cat("MI vars selected:\n")
      print(lapply(mi_coefs_sel, function(x) names(x[abs(x) > 0])))
      cat("DR combined vars:\n")
      print(dr_coefs_sel)
    }


    ## combining variables from the selection and the outcome formulas
    outcome_vars <- all.vars(formula.tools::rhs(outcome))
    selection_vars <- all.vars(formula.tools::rhs(selection))
    target_vars <- all.vars(formula.tools::lhs(outcome))
    combined_vars <- reformulate(union(outcome_vars, selection_vars))

    y_nons <- subset(data, select = target_vars)
    X_nons <- model.matrix(combined_vars, data)
    ## take into account information that svydesign might be not present...
    X_rand <- model.matrix(combined_vars, svydesign$variables)
    X_all <- rbind(X_rand, X_nons)

    ## model-matrix columns (without intercept) are attached to the data so the
    ## selected coefficient names can be used directly as formula terms
    X_nons <- cbind(y_nons, X_nons[, !grepl("Intercept", colnames(X_nons)), drop = FALSE])
    X_rand <- X_rand[, !grepl("Intercept", colnames(X_rand)), drop = FALSE]
    svydesign_ <- svydesign
    svydesign_$variables <- cbind(svydesign_$variables, X_rand)

    bias_corr_results_ipw <- bias_corr_results_mi <- results_mi_combined <- results_ipw_combined <- list()

    bias_corr_ys_rand_pred <- bias_corr_ys_nons_pred <- bias_corr_ys_resid <- list()

    mu_hat <- numeric()

    ## variables are already selected, so the refits must not select again
    control_inference_ <- control_inference
    control_inference_$vars_selection <- FALSE

    ## positions of the selection (theta) and outcome (beta) parameters in the
    ## stacked parameter vector used by the joint estimating equations
    n_par <- NCOL(X_all)
    coefs_ipw_inds <- seq_len(n_par)
    coefs_mi_inds <- n_par + seq_len(n_par)

    for (o in outcomes$f) {

      if (bias_corr) {

        ## consider different start
        par0 <- numeric(n_par * 2)
        names(par0) <- rep(colnames(X_all), times = 2)

        bias_corr_result <- nleqslv::nleqslv(
          x = par0,
          fn = u_theta_beta_dr,
          method = control_selection$nleqslv_method,
          global = control_selection$nleqslv_global,
          xscalm = control_selection$nleqslv_xscalm,
          jacobian = TRUE,
          control = list(
            scalex = rep(1, length(par0)),
            maxit = control_selection$maxit
          ),
          R = results_ipw$R,
          X = X_all,
          y = c(rep(0, sum(results_ipw$R == 0)), y_nons[, o]),
          weights = c(weights(svydesign_), results_ipw$case_weights),
          method_selection = method_selection,
          family_outcome = family_outcome
        )

        theta_hat <- bias_corr_result$x[coefs_ipw_inds]
        beta_hat <- bias_corr_result$x[coefs_mi_inds]

        bias_corr_ps <- method$make_link_inv(unname(drop(X_all %*% theta_hat)))
        bias_corr_ipw_weights <- 1 / bias_corr_ps[results_ipw$R == 1]
        ## drop = FALSE keeps a matrix even when a sample has a single row
        bias_corr_mu_rand_pred <- as.vector(
          get(family_outcome)()$linkinv(X_all[results_ipw$R == 0, , drop = FALSE] %*% beta_hat)
        )
        bias_corr_mu_nons_pred <- as.vector(
          get(family_outcome)()$linkinv(X_all[results_ipw$R == 1, , drop = FALSE] %*% beta_hat)
        )
        bias_corr_mu_resid <- bias_corr_mu_nons_pred - y_nons[, o]

        mu_hat[[o]] <- mu_hatDR(y_hat = weighted.mean(bias_corr_mu_rand_pred, weights(svydesign_)),
                                y_resid = as.matrix(bias_corr_mu_resid),
                                weights = results_ipw$case_weights,
                                weights_nons = bias_corr_ipw_weights,
                                N_nons = pop_size)


        ## split the joint solver output into an outcome part and a selection part
        bias_corr_results_mi[[o]] <- bias_corr_result
        bias_corr_results_ipw[[o]] <- bias_corr_result

        bias_corr_results_mi[[o]]$x <- bias_corr_results_mi[[o]]$x[coefs_mi_inds]
        bias_corr_results_mi[[o]]$fvec <- bias_corr_results_mi[[o]]$fvec[coefs_mi_inds]
        bias_corr_results_mi[[o]]$scalex <- bias_corr_results_mi[[o]]$scalex[coefs_mi_inds]
        bias_corr_results_mi[[o]]$jac <- bias_corr_results_mi[[o]]$jac[coefs_mi_inds, coefs_mi_inds]

        bias_corr_results_ipw[[o]]$x <- bias_corr_results_ipw[[o]]$x[coefs_ipw_inds]
        bias_corr_results_ipw[[o]]$fvec <- bias_corr_results_ipw[[o]]$fvec[coefs_ipw_inds]
        bias_corr_results_ipw[[o]]$scalex <- bias_corr_results_ipw[[o]]$scalex[coefs_ipw_inds]
        bias_corr_results_ipw[[o]]$jac <- bias_corr_results_ipw[[o]]$jac[coefs_ipw_inds, coefs_ipw_inds]

        bias_corr_ys_rand_pred[[o]] <- bias_corr_mu_rand_pred
        bias_corr_ys_nons_pred[[o]] <- bias_corr_mu_nons_pred
        bias_corr_ys_resid[[o]] <- bias_corr_mu_resid

      } else {
        ## this is not saved in the output list
        results_ipw_combined[[o]] <- nonprob_ipw(data = X_nons,
                                                 target = reformulate(o),
                                                 selection = reformulate(dr_coefs_sel[[o]]),
                                                 svydesign = svydesign_,
                                                 pop_totals = pop_totals,
                                                 pop_means = pop_means,
                                                 pop_size = pop_size,
                                                 method_selection = method_selection,
                                                 strata = strata,
                                                 case_weights = case_weights,
                                                 na_action = na_action,
                                                 control_selection = control_selection,
                                                 control_inference = control_inference_,
                                                 start_selection = start_selection,
                                                 verbose = verbose,
                                                 se = FALSE,
                                                 pop_size_fixed = pop_size_fixed)
        ## estimate the mi
        ## `reformulate(..., response = )` builds `o ~ terms` directly instead of
        ## pasting a formula object, which depends on how formulas are coerced
        ## to character
        results_mi_combined[[o]] <- nonprob_mi(outcome = reformulate(dr_coefs_sel[[o]], response = o),
                                               data = X_nons,
                                               svydesign = svydesign_,
                                               pop_totals = pop_totals,
                                               pop_means = pop_means,
                                               pop_size = pop_size,
                                               method_outcome = method_outcome,
                                               family_outcome = family_outcome,
                                               strata = strata,
                                               case_weights = case_weights,
                                               na_action = na_action,
                                               control_outcome = control_outcome,
                                               control_inference = control_inference_,
                                               start_outcome = start_outcome,
                                               verbose = verbose,
                                               se = FALSE,
                                               pop_size_fixed = pop_size_fixed)

        ## estimate in loop
        mu_hat[[o]] <- mu_hatDR(y_hat = results_mi_combined[[o]]$output$mean,
                                y_resid = do.call("cbind", results_mi_combined[[o]]$ys_resid),
                                weights = case_weights,
                                weights_nons = results_ipw_combined[[o]]$ipw_weights,
                                N_nons = pop_size)
      }

    }

    if (se) {

      for (o in outcomes$f) {

        if (control_inference$var_method == "analytic") {

          if (bias_corr) {

            sigma_hat <- switch(family_outcome,
                                "gaussian" = mean((bias_corr_ys_resid[[o]])^2),
                                "binomial" = bias_corr_ys_rand_pred[[o]] * (1 - bias_corr_ys_rand_pred[[o]]),
                                "poisson"  = bias_corr_ys_rand_pred[[o]])

            var_nonprob <- 1 / pop_size^2 *
              (sum((results_ipw$case_weights^2 - 2 * results_ipw$case_weights) * (bias_corr_ys_resid[[o]]^2)) +
                 sum(sigma_hat * weights(svydesign_)))

            if (is.null(pop_totals)) {

              ## work on a copy so the design returned to the caller is untouched
              svydesign_y <- stats::update(svydesign, y_rand = bias_corr_ys_rand_pred[[o]])
              svydesign_mean <- survey::svymean(~y_rand, svydesign_y)
              var_prob <- as.vector(attr(svydesign_mean, "var"))

            } else {
              var_prob <- 0
            }


          } else {
            ps_ <- results_ipw_combined[[o]]$ps_scores[results_ipw_combined[[o]]$R == 1]
            psd_ <- as.numeric(results_ipw_combined[[o]]$selection$selection_model$ps_nons_der)
            y_ <- results_mi_combined[[o]]$y[[o]]
            X_ <- results_ipw_combined[[o]]$X[results_ipw_combined[[o]]$R == 1, , drop = FALSE]
            ## the per-outcome refit holds a single outcome, hence `[[1]]`
            y_pred_ <- results_mi_combined[[o]]$ys_nons_pred[[1]]
            h_n_ <- 1 / pop_size * sum(y_ - y_pred_)

            b_var <- method$b_vec_dr(
              X = X_,
              ps = ps_,
              psd = psd_,
              y = y_,
              hess = results_ipw_combined[[o]]$selection$selection_model$hess,
              eta = as.numeric(X_ %*% as.matrix(results_ipw_combined[[o]]$selection$coefficients)),
              h_n = h_n_,
              y_pred = y_pred_,
              weights = case_weights,
              verbose = verbose
            )

            var_nonprob <- estimation_method$make_var_nonprob(
              ps = ps_,
              psd = psd_,
              y = y_,
              y_pred = results_mi_combined[[o]]$ys_nons_pred[[o]],
              h_n = h_n_,
              X = X_,
              b = b_var,
              N = pop_size,
              gee_h_fun = control_selection$gee_h_fun,
              method_selection = method_selection,
              weights = case_weights,
              pop_totals = pop_totals
            )

            if (is.null(pop_totals)) {

              t_comp <- estimation_method$make_t_comp(
                X = results_ipw_combined[[o]]$X[results_ipw_combined[[o]]$R == 0, , drop = FALSE],
                ps = as.numeric(results_ipw_combined[[o]]$selection$selection_model$est_ps_rand),
                psd = as.numeric(results_ipw_combined[[o]]$selection$selection_model$est_ps_rand_der),
                b = b_var,
                gee_h_fun = control_selection$gee_h_fun,
                y_rand = results_mi_combined[[o]]$ys_rand_pred[[1]],
                y_nons = results_mi_combined[[o]]$ys_nons_pred[[1]],
                N = pop_size,
                method_selection = method_selection,
                weights = case_weights
              )

              svydesign__ <- stats::update(svydesign_, t_comp = t_comp)
              svydesign_mean <- survey::svymean(~t_comp, svydesign__)
              var_prob <- as.vector(attr(svydesign_mean, "var"))

            } else {
              var_prob <- 0
            }
          }

          var_total <- var_nonprob + var_prob
          se_nonprob <- sqrt(var_nonprob)
          se_prob <- sqrt(var_prob)
          SE_values[[o]] <- data.frame(prob = se_prob, nonprob = se_nonprob)
          z <- stats::qnorm(1 - control_inference$alpha / 2)
          # confidence interval based on the normal approximation;
          # only the estimate of the current outcome enters its interval
          confidence_interval[[o]] <- data.frame(lower_bound = mu_hat[o] - z * sqrt(var_total),
                                                 upper_bound = mu_hat[o] + z * sqrt(var_total))
          output[[o]] <- data.frame(mean = mu_hat[o], SE = sqrt(var_total))
        }
      }

      if (control_inference$var_method == "bootstrap") {

        ## variable selection should and combination should be done within `boot_dr` function
        boot_obj <- boot_dr(selection = selection,
                            outcome = outcome,
                            target = reformulate(outcomes[[1]]),
                            data = data,
                            svydesign = svydesign,
                            pop_totals = pop_totals,
                            pop_means = pop_means,
                            pop_size = pop_size,
                            method_selection = method_selection,
                            method_outcome = method_outcome,
                            family_outcome = family_outcome,
                            strata = strata,
                            case_weights = case_weights,
                            na_action = na_action,
                            control_selection = control_selection,
                            control_outcome = control_outcome,
                            control_inference = control_inference,
                            start_outcome = start_outcome,
                            start_selection = start_selection,
                            verbose = verbose,
                            pop_size_fixed = pop_size_fixed)

        var_total <- apply(boot_obj, 2, var)
        SE_values <- replicate(NROW(outcomes[[1]]), data.frame(nonprob = NA, prob = NA), simplify = FALSE)
        SE <- sqrt(var_total)
        output <- list(data.frame(mean = mu_hat, SE = SE))
        alpha <- control_inference$alpha
        z <- stats::qnorm(1 - alpha / 2)
        # confidence interval based on the normal approximation
        confidence_interval <- list(data.frame(lower_bound = mu_hat - z * SE,
                                               upper_bound = mu_hat + z * SE))
      }
    } else {
      for (o in seq_len(outcomes$l)) {
        confidence_interval[[o]] <- data.frame(lower_bound = NA, upper_bound = NA)
        SE_values[[o]] <- data.frame(nonprob = NA, prob = NA)
        output[[o]] <- data.frame(mean = mu_hat[o], SE = NA)
      }
    }
  } else {

    # variable selection but without combination ------------------------------

    results_mi <- nonprob_mi(outcome = outcome,
                             data = data,
                             svydesign = svydesign,
                             pop_totals = pop_totals,
                             pop_means = pop_means,
                             pop_size = pop_size,
                             method_outcome = method_outcome,
                             family_outcome = family_outcome,
                             strata = strata,
                             case_weights = case_weights,
                             na_action = na_action,
                             control_outcome = control_outcome,
                             control_inference = control_inference,
                             start_outcome = start_outcome,
                             verbose = verbose,
                             se = FALSE,
                             pop_size_fixed = pop_size_fixed)

    results_ipw <- nonprob_ipw(selection = selection,
                               target = reformulate(outcomes[[1]]),
                               data = data,
                               svydesign = svydesign,
                               pop_totals = pop_totals,
                               pop_means = pop_means,
                               pop_size = pop_size,
                               method_selection = method_selection,
                               strata = strata,
                               case_weights = case_weights,
                               na_action = na_action,
                               control_selection = control_selection,
                               control_inference = control_inference,
                               start_selection = start_selection,
                               verbose = verbose,
                               se = FALSE,
                               pop_size_fixed = pop_size_fixed)

    ## doubly robust estimator
    mu_hat <- mu_hatDR(y_hat = results_mi$output$mean,
                       y_resid = do.call("cbind", results_mi$ys_resid),
                       weights = case_weights,
                       weights_nons = results_ipw$ipw_weights,
                       N_nons = pop_size)

    if (se) {
      if (control_inference$var_method == "analytic") {
        for (o in seq_len(outcomes$l)) {

          ps_ <- results_ipw$ps_scores[results_ipw$R == 1]
          psd_ <- as.numeric(results_ipw$selection$selection_model$ps_nons_der)
          y_ <- results_mi$y[[o]]
          X_ <- results_ipw$X[results_ipw$R == 1, , drop = FALSE]
          ## predictions of the current outcome (not always the first one)
          y_pred_ <- results_mi$ys_nons_pred[[o]]
          h_n_ <- 1 / pop_size * sum(y_ - y_pred_)

          b_var <- method$b_vec_dr(
            X = X_,
            ps = ps_,
            psd = psd_,
            y = y_,
            hess = results_ipw$selection$selection_model$hess,
            eta = as.numeric(X_ %*% as.matrix(results_ipw$selection$coefficients)),
            h_n = h_n_,
            y_pred = y_pred_,
            weights = case_weights,
            verbose = verbose
          )

          var_nonprob <- estimation_method$make_var_nonprob(
            ps = ps_,
            psd = psd_,
            y = y_,
            y_pred = y_pred_,
            h_n = h_n_,
            X = X_,
            b = b_var,
            N = pop_size,
            gee_h_fun = control_selection$gee_h_fun,
            method_selection = method_selection,
            weights = case_weights,
            pop_totals = pop_totals
          )

          if (is.null(pop_totals)) {
            t_comp <- estimation_method$make_t_comp(
              X = results_ipw$X[results_ipw$R == 0, , drop = FALSE],
              ps = as.numeric(results_ipw$selection$selection_model$est_ps_rand),
              psd = as.numeric(results_ipw$selection$selection_model$est_ps_rand_der),
              b = b_var,
              gee_h_fun = control_selection$gee_h_fun,
              y_rand = results_mi$ys_rand_pred[[o]],
              y_nons = results_mi$ys_nons_pred[[o]],
              N = pop_size,
              method_selection = method_selection,
              weights = case_weights
            )

            ## the mean must be taken on the design that carries `t_comp`
            svydesign_ <- stats::update(svydesign, t_comp = t_comp)
            svydesign_mean <- survey::svymean(~t_comp, svydesign_)
            var_prob <- as.vector(attr(svydesign_mean, "var"))

          } else {
            var_prob <- 0
          }

          var_total <- var_nonprob + var_prob
          se_nonprob <- sqrt(var_nonprob)
          se_prob <- sqrt(var_prob)
          SE_values[[o]] <- data.frame(prob = se_prob, nonprob = se_nonprob)
          z <- stats::qnorm(1 - control_inference$alpha / 2)
          # confidence interval based on the normal approximation
          confidence_interval[[o]] <- data.frame(lower_bound = mu_hat[o] - z * sqrt(var_total),
                                                 upper_bound = mu_hat[o] + z * sqrt(var_total))
          output[[o]] <- data.frame(mean = mu_hat[o], SE = sqrt(var_total))
        }
      }

      if (control_inference$var_method == "bootstrap") {

        boot_obj <- boot_dr(selection = selection,
                            outcome = outcome,
                            target = reformulate(outcomes[[1]]),
                            data = data,
                            svydesign = svydesign,
                            pop_totals = pop_totals,
                            pop_means = pop_means,
                            pop_size = pop_size,
                            method_selection = method_selection,
                            method_outcome = method_outcome,
                            family_outcome = family_outcome,
                            strata = strata,
                            case_weights = case_weights,
                            na_action = na_action,
                            control_selection = control_selection,
                            control_outcome = control_outcome,
                            control_inference = control_inference,
                            start_outcome = start_outcome,
                            start_selection = start_selection,
                            verbose = verbose,
                            pop_size_fixed = pop_size_fixed)

        var_total <- apply(boot_obj, 2, var)
        SE_values <- replicate(NROW(outcomes[[1]]), data.frame(nonprob = NA, prob = NA), simplify = FALSE)
        SE <- sqrt(var_total)
        output <- list(data.frame(mean = mu_hat, SE = SE))
        alpha <- control_inference$alpha
        z <- stats::qnorm(1 - alpha / 2)
        # confidence interval based on the normal approximation
        confidence_interval <- list(data.frame(lower_bound = mu_hat - z * SE,
                                               upper_bound = mu_hat + z * SE))
      }

    } else {
      for (o in seq_len(outcomes$l)) {
        confidence_interval[[o]] <- data.frame(lower_bound = NA, upper_bound = NA)
        SE_values[[o]] <- data.frame(nonprob = NA, prob = NA)
        output[[o]] <- data.frame(mean = mu_hat[o], SE = NA)
      }
    }


  }

  ## `boot_obj` stays NULL when no bootstrap was run (e.g. `se = FALSE`)
  boot_sample <- if (control_inference$var_method == "bootstrap" && isTRUE(control_inference$keep_boot)) {
    boot_obj
  } else {
    NULL
  }

  ## label bootstrap replicates by outcome when the dimensions agree
  if (is.matrix(boot_sample) && NCOL(boot_sample) == length(outcomes$f)) {
    colnames(boot_sample) <- outcomes$f
  }

  output <- do.call(rbind, output)
  confidence_interval <- do.call(rbind, confidence_interval)
  SE_values <- do.call(rbind, SE_values)
  rownames(output) <- rownames(confidence_interval) <- rownames(SE_values) <- outcomes$f

  if (bias_corr) {
    bias_corr_ys_rand_pred <- do.call("cbind", bias_corr_ys_rand_pred)
    bias_corr_ys_nons_pred <- do.call("cbind", bias_corr_ys_nons_pred)
    bias_corr_ys_resid <- do.call("cbind", bias_corr_ys_resid)
  }

  structure(
    list(
      data = data,
      X = results_mi$X,
      y = results_mi$y,
      R = results_ipw$R,
      ps_scores = if (bias_corr) bias_corr_ps else results_ipw$ps_scores,
      case_weights = results_ipw$case_weights,
      ipw_weights = if (bias_corr) bias_corr_ipw_weights else results_ipw$ipw_weights,
      control = list(
        control_selection = control_selection,
        control_outcome = control_outcome,
        control_inference = control_inference
      ),
      output = output,
      SE = SE_values,
      confidence_interval = confidence_interval,
      nonprob_size = results_mi$nonprob_size,
      prob_size = results_mi$prob_size,
      pop_size = pop_size,
      pop_size_fixed = pop_size_fixed,
      pop_totals = pop_totals,
      pop_means = pop_means,
      outcome = if (bias_corr) bias_corr_results_mi else results_mi$outcome,
      selection = if (bias_corr) bias_corr_results_ipw else results_ipw$selection,
      boot_sample = boot_sample,
      svydesign = if (is.null(pop_totals)) svydesign else NULL,
      ys_rand_pred = if (bias_corr) bias_corr_ys_rand_pred else results_mi$ys_rand_pred,
      ys_nons_pred = if (bias_corr) bias_corr_ys_nons_pred else results_mi$ys_nons_pred,
      ys_resid = if (bias_corr) bias_corr_ys_resid else results_mi$ys_resid
    ),
    class = "nonprob"
  )
}


# Internal function: joint estimating equations for the selection and the
# outcome model, evaluated at a stacked parameter vector.
#
# par              - stacked parameters; the first ncol(X) entries are the
#                    selection-model coefficients, the next ncol(X) entries
#                    the outcome-model coefficients
# R                - inclusion information (1 - R is used as the indicator
#                    of the other sample)
# X                - joint design matrix
# y                - target variable
# weights          - vector of combined weights
# method_selection - selection-model link: "logit", "probit" or "cloglog"
# family_outcome   - name of the family constructor of the outcome model
#
# Returns a vector of length 2 * ncol(X): the column sums of both equation
# blocks divided by NROW(R).
u_theta_beta_dr <- function(par,
                            R,
                            X,
                            y,
                            weights,
                            method_selection,
                            family_outcome) {

  ps_method <- switch(method_selection,
                      "logit" = method_ps("logit"),
                      "probit" = method_ps("probit"),
                      "cloglog" = method_ps("cloglog"))

  # split the stacked parameter vector
  k <- ncol(X)
  theta <- par[1:(k)]
  beta <- par[(k + 1):(2 * k)]

  # selection model: linear predictor and propensity scores
  lin_pred_sel <- unname(drop(X %*% theta))
  prop_score <- ps_method$make_link_inv(lin_pred_sel)

  # outcome model: fitted means, their derivative and residuals
  lin_pred_out <- X %*% beta
  fam <- get(family_outcome)()
  fitted_mu <- as.vector(fam$linkinv(lin_pred_out))
  if (family_outcome == "gaussian") {
    d_mu <- rep(1, NROW(lin_pred_out))
  } else {
    d_mu <- as.vector(fam$mu.eta(lin_pred_out))
  }
  resid_y <- y - fitted_mu

  n_obs <- NROW(R)
  R_other <- 1 - R

  ## this should be gee method dependent
  ## and take into account that population totals may be only available
  block_first <- X * R / prop_score * d_mu * weights - X * R_other * weights * d_mu
  block_second <- X * R * weights * as.vector(-ps_method$make_link_inv_rev(lin_pred_sel)) * resid_y

  c(colSums(block_first), colSums(block_second)) / n_obs
}