R/np.condistribution.proper.R

Defines functions .np_condist_finalize_proper_object .np_condist_apply_proper .np_condist_apply_proper_grid .np_condist_project_values_with_plan .np_condist_prepare_proper_plan .np_condist_project_bounded_isotonic .np_condist_weighted_pava .np_condist_make_reason_info .np_condist_validate_proper_args .np_condist_normalize_proper_control .np_condist_proper_reason_message .np_condist_proper_shadow_enabled

.np_condist_proper_shadow_enabled <- function() {
  isTRUE(getOption("np.condist.proper.shadow", FALSE))
}

.np_condist_proper_reason_message <- function(reason, where = "npcdist()") {
  switch(
    as.character(reason),
    not_requested = "proper-distribution repair was not requested",
    already_proper = "proper=TRUE was requested, but the estimator is already proper by construction",
    no_eval_grid = "proper=TRUE requires explicit evaluation data that define a full y-grid for each fixed x; paired row-wise evaluation is insufficient",
    scope_not_selected = "proper=TRUE was requested, but 'proper.control$apply' does not target the values returned by this object",
    slice_disabled = "proper=TRUE slice repair is disabled by internal dispatcher controls",
    slice_context_missing = "proper=TRUE slice repair requires explicit evaluation and training data context",
    slice_invalid_master_grid = "proper=TRUE slice repair could not construct a valid internal y-grid",
    slice_eval_failed = "proper=TRUE slice repair failed while evaluating the internal explicit-grid oracle",
    y_not_univariate_continuous = "proper=TRUE currently supports only univariate continuous y",
    gradients_unsupported = "proper=TRUE is currently unsupported when gradients=TRUE",
    x_slices_not_repeated = "proper=TRUE requires repeated fixed-x slices in the evaluation data",
    y_grid_not_common = "proper=TRUE requires every fixed-x slice to share a common ordered y-grid",
    y_grid_not_ordered = "proper=TRUE requires at least two strictly increasing y-grid points in each fixed-x slice",
    invalid_quadrature = "proper=TRUE could not construct valid grid weights from the evaluation y-grid",
    repair_disabled_shadow_mode = sprintf("proper=TRUE repair is disabled in internal shadow-validation mode in %s", where),
    sprintf("proper=TRUE is unsupported in %s for reason '%s'", where, as.character(reason))
  )
}

.np_condist_normalize_proper_control <- function(proper.control) {
  if (is.null(proper.control))
    proper.control <- list()

  if (!is.list(proper.control))
    stop("'proper.control' must be a list")

  ctrl <- list(
    tol = 1e-10,
    grid.check = TRUE,
    store.raw = TRUE,
    fail.on.unsupported = FALSE,
    mode = "grid",
    apply = "evaluation",
    slice.grid.size = 101L,
    slice.extend.factor = 0.1
  )

  known <- names(ctrl)
  if (length(proper.control)) {
    extra <- setdiff(names(proper.control), known)
    if (length(extra))
      stop(sprintf("unsupported entries in 'proper.control': %s",
                   paste(shQuote(extra), collapse = ", ")))
    ctrl[names(proper.control)] <- proper.control
  }

  ctrl$tol <- npValidatePositiveFiniteNumeric(ctrl$tol, "proper.control$tol")
  ctrl$grid.check <- npValidateScalarLogical(ctrl$grid.check, "proper.control$grid.check")
  ctrl$store.raw <- npValidateScalarLogical(ctrl$store.raw, "proper.control$store.raw")
  ctrl$fail.on.unsupported <- npValidateScalarLogical(
    ctrl$fail.on.unsupported,
    "proper.control$fail.on.unsupported"
  )
  ctrl$mode <- match.arg(as.character(ctrl$mode)[1L], c("grid", "slice"))
  ctrl$apply <- match.arg(as.character(ctrl$apply)[1L], c("evaluation", "fitted", "both"))
  ctrl$`slice.grid.size` <- npValidatePositiveInteger(
    ctrl$`slice.grid.size`,
    "proper.control$slice.grid.size"
  )
  ctrl$`slice.extend.factor` <- .np_condist_validate_nonnegative_finite_numeric(
    ctrl$`slice.extend.factor`,
    "proper.control$slice.extend.factor"
  )

  ctrl
}

.np_condist_validate_proper_args <- function(proper = FALSE,
                                             proper.method = c("isotonic"),
                                             proper.control = list()) {
  proper <- npValidateScalarLogical(proper, "proper")
  proper.method <- match.arg(as.character(proper.method)[1L], c("isotonic"))
  proper.control <- .np_condist_normalize_proper_control(proper.control)

  list(
    proper.requested = proper,
    proper.method = proper.method,
    proper.control = proper.control
  )
}

.np_condist_make_reason_info <- function(reason,
                                         supported = FALSE,
                                         slice.count = 0L,
                                         grid.common = FALSE,
                                         lower.bound = 0,
                                         upper.bound = 1,
                                         monotone.violations.raw = NULL,
                                         range.raw = NULL,
                                         projection.distance.l2 = NULL) {
  list(
    supported = supported,
    reason = as.character(reason)[1L],
    slice.count = as.integer(slice.count),
    grid.common = isTRUE(grid.common),
    lower.bound = lower.bound,
    upper.bound = upper.bound,
    monotone.violations.raw = monotone.violations.raw,
    range.raw = range.raw,
    projection.distance.l2 = projection.distance.l2
  )
}

.np_condist_weighted_pava <- function(f, w, tol = 1e-10) {
  f <- as.double(f)
  w <- as.double(w)

  if (length(f) != length(w))
    stop("length mismatch between distribution values and grid weights")
  if (any(!is.finite(f)))
    stop("distribution values must be finite")
  if (any(!is.finite(w)) || any(w <= 0))
    stop("grid weights must be finite and strictly positive")
  if (!is.finite(tol) || tol <= 0)
    stop("projection tolerance must be positive and finite")

  block.start <- seq_along(f)
  block.end <- seq_along(f)
  block.weight <- w
  block.value <- f
  nblock <- length(f)

  i <- 1L
  while (i < nblock) {
    if (block.value[i] <= block.value[i + 1L] + tol) {
      i <- i + 1L
      next
    }

    new.weight <- block.weight[i] + block.weight[i + 1L]
    new.value <- (block.weight[i] * block.value[i] +
                    block.weight[i + 1L] * block.value[i + 1L]) / new.weight

    block.end[i] <- block.end[i + 1L]
    block.weight[i] <- new.weight
    block.value[i] <- new.value

    if (i + 1L < nblock) {
      keep <- seq.int(i + 2L, nblock)
      block.start[(i + 1L):(nblock - 1L)] <- block.start[keep]
      block.end[(i + 1L):(nblock - 1L)] <- block.end[keep]
      block.weight[(i + 1L):(nblock - 1L)] <- block.weight[keep]
      block.value[(i + 1L):(nblock - 1L)] <- block.value[keep]
    }

    nblock <- nblock - 1L
    if (i > 1L)
      i <- i - 1L
  }

  fitted <- numeric(length(f))
  for (j in seq_len(nblock))
    fitted[block.start[j]:block.end[j]] <- block.value[j]

  fitted
}

.np_condist_project_bounded_isotonic <- function(f,
                                                 w,
                                                 lower = 0,
                                                 upper = 1,
                                                 tol = 1e-10) {
  f <- as.double(f)
  w <- as.double(w)

  if (!is.finite(lower) || !is.finite(upper) || lower > upper)
    stop("invalid lower/upper bounds for isotonic projection")

  big.weight <- max(1, sum(w)) * 1e12
  aug.fit <- .np_condist_weighted_pava(
    f = c(lower, f, upper),
    w = c(big.weight, w, big.weight),
    tol = tol
  )

  out <- aug.fit[-c(1L, length(aug.fit))]
  out <- pmin(pmax(out, lower), upper)

  if (any(diff(out) < -10 * tol))
    stop("bounded isotonic projection failed monotonicity check")

  out
}

.np_condist_prepare_proper_plan <- function(object, proper.control = list()) {
  proper.control <- .np_condist_normalize_proper_control(proper.control)

  grid <- .np_condens_detect_proper_grid(object = object, tol = proper.control$tol)
  if (!isTRUE(grid$supported)) {
    info <- .np_condist_make_reason_info(
      reason = grid$reason,
      supported = FALSE,
      slice.count = 0L,
      grid.common = FALSE
    )
    return(list(
      supported = FALSE,
      reason = grid$reason,
      proper.info = info
    ))
  }

  weights <- tryCatch(
    .np_condens_trapezoid_weights(grid$y.grid, tol = proper.control$tol),
    error = function(e) e
  )
  if (inherits(weights, "error")) {
    info <- .np_condist_make_reason_info(
      reason = "invalid_quadrature",
      supported = FALSE,
      slice.count = length(grid$slices),
      grid.common = TRUE
    )
    return(list(
      supported = FALSE,
      reason = "invalid_quadrature",
      proper.info = info
    ))
  }

  list(
    supported = TRUE,
    slices = grid$slices,
    weights = weights,
    y.grid = grid$y.grid,
    proper.control = proper.control
  )
}

.np_condist_project_values_with_plan <- function(values,
                                                 plan,
                                                 progress.label = NULL) {
  if (!isTRUE(plan$supported))
    stop("proper projection plan is not supported")

  is.vector.input <- is.null(dim(values))
  values.mat <- if (is.vector.input) {
    matrix(as.double(values), nrow = 1L)
  } else {
    data.matrix(values)
  }

  if (ncol(values.mat) != sum(lengths(plan$slices)))
    stop("value length mismatch for proper distribution projection")

  out <- values.mat
  progress <- NULL
  if (!is.vector.input && !is.null(progress.label) && nrow(values.mat) > 1L) {
    progress <- .np_plot_stage_progress_begin(
      total = nrow(values.mat),
      label = as.character(progress.label)[1L]
    )
    on.exit(.np_plot_progress_end(progress), add = TRUE)
  }
  for (row in seq_len(nrow(values.mat))) {
    for (idx in plan$slices) {
      out[row, idx] <- .np_condist_project_bounded_isotonic(
        f = values.mat[row, idx],
        w = plan$weights,
        lower = 0,
        upper = 1,
        tol = plan$proper.control$tol
      )
    }
    if (!is.null(progress))
      progress <- .np_plot_progress_tick(state = progress, done = row)
  }

  if (is.vector.input) as.vector(out[1L, ]) else out
}

.np_condist_apply_proper_grid <- function(object,
                                          proper.method = "isotonic",
                                          proper.control = list()) {
  proper.method <- match.arg(as.character(proper.method)[1L], c("isotonic"))
  proper.control <- .np_condist_normalize_proper_control(proper.control)

  plan <- .np_condist_prepare_proper_plan(
    object = object,
    proper.control = proper.control
  )
  if (!isTRUE(plan$supported)) {
    return(list(
      applied = FALSE,
      reason = plan$reason,
      proper.info = plan$proper.info
    ))
  }

  raw <- as.double(object$condist)
  repaired <- .np_condist_project_values_with_plan(raw, plan)
  monotone.violations.raw <- integer(length(plan$slices))
  range.raw <- matrix(NA_real_, nrow = length(plan$slices), ncol = 2L,
                      dimnames = list(NULL, c("min", "max")))
  projection.distance <- numeric(length(plan$slices))

  for (i in seq_along(plan$slices)) {
    idx <- plan$slices[[i]]
    f.slice <- raw[idx]
    g.slice <- repaired[idx]
    monotone.violations.raw[i] <- sum(diff(f.slice) < -proper.control$tol)
    range.raw[i, ] <- c(min(f.slice), max(f.slice))
    projection.distance[i] <- sqrt(sum(plan$weights * (g.slice - f.slice)^2))
  }

  info <- .np_condist_make_reason_info(
    reason = "applied",
    supported = TRUE,
    slice.count = length(plan$slices),
    grid.common = TRUE,
    monotone.violations.raw = monotone.violations.raw,
    range.raw = range.raw,
    projection.distance.l2 = projection.distance
  )

  list(
    applied = TRUE,
    condist = repaired,
    condist.raw = if (isTRUE(proper.control$store.raw)) raw else NULL,
    proper.info = info
  )
}

.np_condist_apply_proper <- function(object,
                                     proper.method = "isotonic",
                                     proper.control = list(),
                                     slice.context = NULL) {
  proper.method <- match.arg(as.character(proper.method)[1L], c("isotonic"))
  proper.control <- .np_condist_normalize_proper_control(proper.control)

  if (!isTRUE(object$trainiseval) && identical(proper.control$apply, "fitted")) {
    info <- .np_condist_make_reason_info(
      reason = "scope_not_selected",
      supported = TRUE,
      slice.count = 0L,
      grid.common = FALSE
    )
    return(list(applied = FALSE, reason = "scope_not_selected", proper.info = info))
  }

  grid.out <- .np_condist_apply_proper_grid(
    object = object,
    proper.method = proper.method,
    proper.control = proper.control
  )
  if (isTRUE(grid.out$applied))
    return(grid.out)

  if (!identical(proper.control$mode, "slice"))
    return(grid.out)

  .np_condist_apply_proper_slice(
    object = object,
    proper.method = proper.method,
    proper.control = proper.control,
    slice.context = slice.context,
    grid.out = grid.out
  )
}

.np_condist_finalize_proper_object <- function(object,
                                               proper = FALSE,
                                               proper.method = c("isotonic"),
                                               proper.control = list(),
                                               slice.context = NULL,
                                               where = "npcdist()") {
  args <- .np_condist_validate_proper_args(
    proper = proper,
    proper.method = proper.method,
    proper.control = proper.control
  )

  object$proper.requested <- args$proper.requested
  object$proper.applied <- FALSE
  object$proper.method <- if (isTRUE(args$proper.requested)) args$proper.method else NULL
  object$condist.raw <- NULL
  object$proper.info <- .np_condist_make_reason_info(
    reason = if (isTRUE(args$proper.requested)) "pending" else "not_requested",
    supported = FALSE
  )

  if (!isTRUE(args$proper.requested))
    return(object)

  if (.np_condist_is_already_proper_by_design(object$bws)) {
    object$proper.info <- .np_condist_make_reason_info(
      reason = "already_proper",
      supported = TRUE
    )
    return(object)
  }

  if (.np_condist_proper_shadow_enabled()) {
    object$proper.info <- .np_condist_make_reason_info(
      reason = "repair_disabled_shadow_mode",
      supported = FALSE
    )
    return(object)
  }

  proper.out <- .np_condist_apply_proper(
    object = object,
    proper.method = args$proper.method,
    proper.control = args$proper.control,
    slice.context = slice.context
  )

  if (!isTRUE(proper.out$applied)) {
    object$proper.info <- proper.out$proper.info
    if (isTRUE(args$proper.control$fail.on.unsupported) &&
        !isTRUE(proper.out$proper.info$supported)) {
      stop(.np_condist_proper_reason_message(
        reason = proper.out$reason,
        where = where
      ), call. = FALSE)
    }
    return(object)
  }

  object$condist <- proper.out$condist
  object$proper.applied <- TRUE
  object$proper.info <- proper.out$proper.info
  if (!is.null(proper.out$condist.raw))
    object$condist.raw <- proper.out$condist.raw

  object
}

Try the np package in your browser

Any scripts or data that you put into this service are public.

np documentation built on May 3, 2026, 1:07 a.m.