R/alternated_procedure.R
In PLUCR: Policy Learning Under Constraint

Documented in Optimization_Estimation update_mu update_mu_XA update_nu update_nu_XA

#' Update mu at fixed observations from precomputed psi columns
#'
#' Adds a bias correction to logit-scale baseline predictions and maps the
#' result back through \code{expit()}. The correction is the matrix product of
#' \code{psi_collection} and \code{epsilon1}, multiplied elementwise by
#' \code{H_XA}.
#'
#' @param offset_mu_XA A numeric vector of logit-scale baseline mu0 predictions.
#' @param epsilon1 A numeric vector (or one-column matrix) of GLM coefficients,
#'   one per column of \code{psi_collection}.
#' @param psi_collection A matrix whose columns are optimal \code{psi} solutions.
#' @param H_XA A numeric vector of inverse-propensity weights, typically from
#'   \code{HX()}.
#'
#' @return The updated mu predictions on the `[0,1]` scale, as returned by
#'   \code{expit()} (one value per row of \code{psi_collection}).
#'
#' @export
update_mu_XA <- function(offset_mu_XA, epsilon1, psi_collection, H_XA) {
  # Weighted linear combination of the psi columns (logit scale).
  correction <- H_XA * (psi_collection %*% epsilon1)
  expit(offset_mu_XA + correction)
}

#' Update nu at fixed observations from precomputed sigma(psi) columns
#'
#' Adds a bias correction to logit-scale baseline predictions and maps the
#' result back through \code{expit()}. The correction is the matrix product of
#' \code{sigma_psi_collection} and \code{epsilon2}, multiplied elementwise by
#' \code{H_XA}.
#'
#' @param offset_nu_XA A numeric vector of logit-scale baseline nu0 predictions.
#' @param epsilon2 A numeric vector (or one-column matrix) of GLM coefficients,
#'   one per column of \code{sigma_psi_collection}.
#' @param sigma_psi_collection A matrix whose columns are optimal \code{psi}
#'   solutions composed by sigma.
#' @param H_XA A numeric vector of inverse-propensity weights, typically from
#'   \code{HX()}.
#'
#' @return The updated nu predictions on the `[0,1]` scale, as returned by
#'   \code{expit()} (one value per row of \code{sigma_psi_collection}).
#'
#' @export
update_nu_XA <- function(offset_nu_XA, epsilon2, sigma_psi_collection, H_XA) {
  # Weighted linear combination of the sigma(psi) columns (logit scale).
  correction <- H_XA * (sigma_psi_collection %*% epsilon2)
  expit(offset_nu_XA + correction)
}

#' Update mu via augmented covariate adjustment
#'
#' Rebuilds every previous solution \code{psi} from \code{theta_collection},
#' evaluates it at \code{X}, and adds the resulting bias correction (scaled by
#' \code{epsilon1} and weighted by \code{HX(A, X, prop_score)}) to the
#' logit of \code{mu0(A, X)}. The sum is mapped back through \code{expit()}.
#'
#' @param A A binary vector or matrix of length n indicating treatment assignment (0 or 1).
#' @param X A matrix of covariates of size n x d (input data in `[0,1]`).
#' @param mu0 A fold-specific function predicting primary outcome (Y) given treatment (A) and covariates (X).
#' @param epsilon1 A numeric vector of GLM coefficients, one per element of \code{theta_collection}.
#' @param theta_collection A list of the optimal \code{theta} enabling the reconstruction of optimal \code{psi} functions.
#' @param prop_score A function that estimates the propensity score given treatment (A) and covariates (X).
#'
#' @return The updated mu predictions on the `[0,1]` scale, as returned by
#'   \code{expit()}.
#'
#' @export
update_mu <- function(A, X, mu0, epsilon1, theta_collection, prop_score) {
  weights <- HX(A, X, prop_score)

  # One column per stored theta: psi_theta evaluated at X.
  psi_columns <- lapply(theta_collection, function(theta) {
    psi <- make_psi(theta)
    psi(X)
  })
  psi_collection <- do.call(cbind, psi_columns)

  baseline_logit <- logit(mu0(A, X))
  expit(baseline_logit + weights * (psi_collection %*% epsilon1))
}

#' Update nu via augmented covariate adjustment
#'
#' Rebuilds every previous solution \code{psi} from \code{theta_collection},
#' evaluates it at \code{X}, and passes it through \code{sigma_beta()}. The
#' resulting bias correction (scaled by \code{epsilon2} and weighted by
#' \code{HX(A, X, prop_score)}) is added to the logit of \code{nu0(A, X)}, and
#' the sum is mapped back through \code{expit()}.
#'
#' @param A A binary vector or matrix of length n indicating treatment assignment (0 or 1).
#' @param X A matrix of covariates of size n x d (input data in `[0,1]`).
#' @param nu0 A fold-specific function predicting adverse event outcome (Xi) given treatment (A) and covariates (X).
#' @param epsilon2 A numeric vector of GLM coefficients, one per element of \code{theta_collection}.
#' @param theta_collection A list of the optimal \code{theta} enabling the reconstruction of optimal \code{sigma_beta} applied to \code{psi} functions.
#' @param prop_score A function that estimates the propensity score given treatment (A) and covariates (X).
#' @param beta A non-negative numeric scalar controlling the sharpness of the probability function (0.05 by default).
#' @param centered A logical value indicating whether to apply centering in \code{sigma_beta} (FALSE by default).
#'
#' @return The updated nu predictions on the `[0,1]` scale, as returned by
#'   \code{expit()}.
#'
#' @export
update_nu <- function(A, X, nu0, epsilon2, theta_collection, prop_score,
                      beta = 0.05, centered = FALSE) {
  weights <- HX(A, X, prop_score)

  # First pass: psi_theta(X) for every stored theta.
  psi_values <- lapply(theta_collection, function(theta) {
    make_psi(theta)(X)
  })
  # Second pass: sigma_beta applied to each psi evaluation, one column each.
  sigma_columns <- lapply(psi_values, function(psi_x) {
    sigma_beta(psi_x, beta, centered)
  })
  sigma_psi_collection <- do.call(cbind, sigma_columns)

  baseline_logit <- logit(nu0(A, X))
  expit(baseline_logit + weights * (sigma_psi_collection %*% epsilon2))
}

#' Iterative optimization procedure
#'
#' Alternates between solving the constrained policy problem with \code{FW()}
#' and correcting the outcome models \code{mu0} and \code{nu0} along the
#' solutions found so far. At every iteration the current solution \code{psi}
#' (and \code{sigma_beta(psi)}), weighted by \code{HX(A, X, prop_score)}, is
#' added as a new covariate to two offset logistic regressions. The fitted
#' coefficients define corrected treatment contrasts, on which \code{FW()} is
#' run again. The procedure stops when two consecutive solutions are close
#' (RMSE at most \code{tol}), when \code{max_iter} iterations have been
#' performed, or when a fitted coefficient is unusable (see Details).
#'
#' @param mu0 A fold-specific function predicting primary outcome (Y) given treatment (A) and covariates (X).
#' @param nu0 A fold-specific function predicting adverse event outcome (Xi) given treatment (A) and covariates (X).
#' @param prop_score A function that estimates the propensity score given treatment (A) and covariates (X).
#' @param X A matrix of covariates of size n x d (input data in `[0,1]`).
#' @param A A binary vector or matrix of length n indicating treatment assignment (0 or 1).
#' @param Y A numeric vector or matrix of length n representing primary outcomes (in `[0,1]`).
#' @param Xi A numeric vector or matrix of length n indicating adverse events (0 or 1).
#' @param lambda A non-negative numeric scalar controlling the penalty for violating the constraint.
#' @param alpha A numeric scalar representing the constraint tolerance (0.1 by default).
#' @param precision A numeric scalar defining the desired convergence precision (0.05 by default). The number of Frank-Wolfe iterations (K) is inversely proportional to this value, calculated as 1/precision.
#' @param beta A non-negative numeric scalar controlling the sharpness of the probability function (0.05 by default).
#' @param centered A logical value indicating whether to apply centering in \code{sigma_beta} (FALSE by default).
#' @param tol A numeric scalar used as an early stopping criterion based on the RMSE between consecutive solutions (0.025 by default). Validated to lie in `[0.01, 0.1]`.
#' @param max_iter An integer scalar specifying the maximum number of iterations (5 by default). Validated to lie in `[2, 10]`.
#'
#' @return A list describing the last successfully completed correction step:
#' \item{iter}{The number of completed iterations (0 if the first iteration was aborted).}
#' \item{offset_mu}{Initial logit-transformed outcome predictions.}
#' \item{offset_nu}{Initial logit-transformed auxiliary predictions.}
#' \item{psi_collection}{Matrix of covariate projections across iterations.}
#' \item{sigma_psi_collection}{Matrix of transformed projections across iterations.}
#' \item{epsilon1}{GLM coefficients from the outcome model.}
#' \item{epsilon2}{GLM coefficients from the auxiliary model.}
#' \item{theta_collection}{List of parameter vectors from each iteration of the functional weight estimation.}
#' \item{correction_term_mu_norm}{One-row matrix with, per iteration, the root mean square of the logit-scale correction applied to mu.}
#' \item{correction_term_nu_norm}{One-row matrix with, per iteration, the root mean square of the logit-scale correction applied to nu.}
#' \item{term1}{Matrix with one column per iteration: \code{H * (-2 * psi * (Y - updated mu))}.}
#' \item{term2}{Matrix with one column per iteration: \code{H * (lambda * sigma_beta(psi) * (Xi - updated nu))}.}
#' \item{last_theta}{The parameter vector returned by the last call to \code{FW()}.}
#' \item{reason}{A character string describing why the procedure stopped.}
#'
#' @details
#' Nothing is written to disk; all intermediate quantities are returned in the
#' output list. If a fitted coefficient exceeds 10 in absolute value, or is
#' \code{NA} (e.g. an aliased covariate in the GLM), a warning is raised and
#' the procedure stops early. In that case the returned list describes the
#' previous iteration; if this happens during the first iteration, \code{iter}
#' is 0 and the iteration-level components are \code{NULL}.
#' @export
Optimization_Estimation <- function(mu0, nu0, prop_score, X, A, Y, Xi, lambda,
                                    alpha = 0.1, precision = 0.05,
                                    beta = 0.05, centered = FALSE,
                                    tol = 2.5 * 1e-2, max_iter = 5) {
  tol <- R.utils::Arguments$getNumerics(tol, c(0.01, 0.1))
  max_iter <- R.utils::Arguments$getIntegers(max_iter, c(2, 10))

  # Uncorrected treatment contrasts, used for the initial FW() solve only.
  Delta_mu <- function(X) {
    mu0(rep(1, nrow(X)), X) - mu0(rep(0, nrow(X)), X)
  }
  Delta_nu <- function(X) {
    nu0(rep(1, nrow(X)), X) - nu0(rep(0, nrow(X)), X)
  }
  reason <- ""
  H <- HX(A, X, prop_score)

  theta <- FW(X, delta_Mu = Delta_mu, delta_Nu = Delta_nu,
              lambda = lambda, alpha = alpha, beta = beta,
              centered = centered, precision = precision, verbose = TRUE)
  psi <- make_psi(theta)
  psi_X <- psi(X)
  sigma_psi_X <- sigma_beta(psi_X, beta, centered)

  # Offsets and response-only data frames for the two offset logistic
  # regressions; one covariate column is appended per iteration.
  offset_mu <- stats::qlogis(mu0(A, X))
  df_mu <- tibble::tibble(Y = Y)

  offset_nu <- stats::qlogis(nu0(A, X))
  df_nu <- tibble::tibble(xi = Xi)

  correction_term_mu_norm <- NULL
  correction_term_nu_norm <- NULL
  term1 <- NULL
  term2 <- NULL
  psi_collection <- NULL
  sigma_psi_collection <- NULL
  theta_collection <- list()

  # Defined up front so that an early `break` in the very first iteration still
  # returns a well-formed list instead of failing on an undefined `out`.
  out <- list(
    iter = 0,
    offset_mu = offset_mu,
    offset_nu = offset_nu,
    psi_collection = NULL,
    sigma_psi_collection = NULL,
    epsilon1 = NULL,
    epsilon2 = NULL,
    theta_collection = list(),
    correction_term_mu_norm = NULL,
    correction_term_nu_norm = NULL,
    term1 = NULL,
    term2 = NULL
  )

  go_on <- TRUE
  k <- 0
  while (go_on) {
    k <- k + 1
    varname <- paste0("newcov.", k)
    df_mu[[varname]] <- H * as.vector(psi_X)
    df_nu[[varname]] <- H * as.vector(sigma_psi_X)
    psi_collection <- cbind(psi_collection, as.vector(psi_X))
    # A correlation-based early-stopping rule (stop when the new sigma_psi_X
    # has |cor| > 0.90 with a previous column) used to sit here behind
    # `if (FALSE)`; the unreachable code has been removed.
    sigma_psi_collection <- cbind(sigma_psi_collection, as.vector(sigma_psi_X))
    theta_collection[[k]] <- theta

    # No-intercept logistic fits of the responses on all correction
    # covariates accumulated so far, with the initial predictions as offset.
    mu_update_obj <- stats::glm(Y ~ -1 + ., offset = offset_mu, data = df_mu,
                                family = stats::binomial())
    nu_update_obj <- stats::glm(xi ~ -1 + ., offset = offset_nu, data = df_nu,
                                family = stats::binomial())
    epsilon1 <- as.matrix(as.numeric(mu_update_obj$coefficients))
    epsilon2 <- as.matrix(as.numeric(nu_update_obj$coefficients))
    epsilons <- c(epsilon1, epsilon2)

    # `na.rm = TRUE` keeps the condition a proper TRUE/FALSE when glm() returns
    # NA for some coefficient.
    if (any(abs(epsilons) > 10, na.rm = TRUE)) {
      reason <- "Detected large component of epsilon1 or epsilon2"
      warning(glue::glue("Iteration {k}: detected large component of epsilon1 or epsilon2."))
      break
    }
    # NA coefficients would propagate into every downstream quantity, so stop
    # with an explicit reason instead.
    if (anyNA(epsilons)) {
      reason <- "Detected NA component of epsilon1 or epsilon2"
      warning(glue::glue("Iteration {k}: detected NA component of epsilon1 or epsilon2."))
      break
    }

    # Root mean square of the logit-scale corrections at this iteration.
    correction_term_mu_norm <- cbind(
      correction_term_mu_norm,
      sqrt(mean((H * (psi_collection %*% epsilon1))^2))
    )
    correction_term_nu_norm <- cbind(
      correction_term_nu_norm,
      sqrt(mean((H * (sigma_psi_collection %*% epsilon2))^2))
    )

    mu_updated <- update_mu_XA(offset_mu, epsilon1, psi_collection, H)
    nu_updated <- update_nu_XA(offset_nu, epsilon2, sigma_psi_collection, H)
    term1 <- cbind(term1, H * (-2 * psi_X * (df_mu$Y - mu_updated)))
    term2 <- cbind(term2, H * (lambda * sigma_psi_X * (df_nu$xi - nu_updated)))

    out <- list(
      iter = k,
      offset_mu = offset_mu,
      offset_nu = offset_nu,
      psi_collection = psi_collection,
      sigma_psi_collection = sigma_psi_collection,
      epsilon1 = epsilon1,
      epsilon2 = epsilon2,
      theta_collection = theta_collection,
      correction_term_mu_norm = correction_term_mu_norm,
      correction_term_nu_norm = correction_term_nu_norm,
      term1 = term1,
      term2 = term2
    )

    # Corrected treatment contrasts for the next FW() solve.
    # NOTE(review): these closures reuse `psi_collection` and
    # `sigma_psi_collection` evaluated at the X of the enclosing call rather
    # than at their own argument, so they are only valid when FW() evaluates
    # them at that same X -- presumably the case; confirm against FW().
    Delta_mu <- function(X) {
      n_obs <- nrow(X)
      treated <- rep(1, n_obs)
      control <- rep(0, n_obs)
      update_mu_XA(stats::qlogis(mu0(treated, X)), epsilon1,
                   psi_collection, HX(treated, X, prop_score)) -
        update_mu_XA(stats::qlogis(mu0(control, X)), epsilon1,
                     psi_collection, HX(control, X, prop_score))
    }
    Delta_nu <- function(X) {
      n_obs <- nrow(X)
      treated <- rep(1, n_obs)
      control <- rep(0, n_obs)
      update_nu_XA(stats::qlogis(nu0(treated, X)), epsilon2,
                   sigma_psi_collection, HX(treated, X, prop_score)) -
        update_nu_XA(stats::qlogis(nu0(control, X)), epsilon2,
                     sigma_psi_collection, HX(control, X, prop_score))
    }

    theta <- FW(X, delta_Mu = Delta_mu, delta_Nu = Delta_nu,
                lambda = lambda, alpha = alpha, beta = beta,
                centered = centered, precision = precision, verbose = TRUE)
    psi <- make_psi(theta)
    new_psi <- psi(X)
    sigma_psi_X <- sigma_beta(new_psi, beta, centered)

    # Scalar condition: continue only while iterations remain and consecutive
    # solutions still differ by more than `tol` in RMSE.
    go_on <- (k < max_iter) && (sqrt(mean((psi_X - new_psi)^2)) > tol)

    psi_X <- new_psi
  }

  # No early break: the loop ended either on the iteration cap or on the RMSE
  # criterion (the cap takes precedence when both hold).
  if (reason == "") {
    if (k >= max_iter) {
      reason <- "Maximum iterations reached"
    } else {
      reason <- "RMSE of consecutive solutions < tol"
    }
  }
  out$last_theta <- theta
  out$reason <- reason
  out
}

Any scripts or data that you put into this service are public.

PLUCR documentation built on March 30, 2026, 5:08 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

PLUCR
Policy Learning Under Constraint

R/alternated_procedure.R
In PLUCR: Policy Learning Under Constraint

Defines functions Optimization_Estimation update_nu update_mu update_nu_XA update_mu_XA

Documented in Optimization_Estimation update_mu update_mu_XA update_nu update_nu_XA

Try the PLUCR package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

PLUCR Policy Learning Under Constraint

R/alternated_procedure.R In PLUCR: Policy Learning Under Constraint

Defines functions Optimization_Estimation update_nu update_mu update_nu_XA update_mu_XA

Documented in Optimization_Estimation update_mu update_mu_XA update_nu update_nu_XA

Try the PLUCR package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

PLUCR
Policy Learning Under Constraint

R/alternated_procedure.R
In PLUCR: Policy Learning Under Constraint