# Nothing
#' @title PipeOpOOR_B
#'
#' @name PipeOpOOR_B
#'
#' @description
#' Impute features by out-of-range (OOR) imputation in approach B: the replacement value is
#' determined independently during the training and the prediction phase, each time from the
#' data that is being imputed. The trained imputer is always `NULL`.
#'
#' Missing values of `factor`, `ordered` and `character` features are replaced by `".MISSING"`
#' (for `factor` and `ordered` features this value is appended to the levels).
#' Missing values of `numeric` and `integer` features are replaced by
#' `min(x) - (offset + multiplier * (max(x) - min(x)))` if `min` is `TRUE`, and by
#' `max(x) + (offset + multiplier * (max(x) - min(x)))` otherwise; for `integer` features the
#' value is rounded. If such a feature has no observed value at all, both the minimum and the
#' maximum are taken to be 0, so the replacement is `-offset` or `+offset`.
#'
#' @section Input and Output Channels:
#' Input and output channels are inherited from \code{\link{PipeOpImpute}}.
#'
#' @section Parameters:
#' The parameters include those inherited from [`PipeOpImpute`], as well as: \cr
#' \itemize{
#' \item \code{id} :: \code{character(1)}\cr
#' Identifier of resulting object, default `"impute_oor_B"`.
#' \item \code{min} :: \code{logical(1)}\cr
#' Whether the replacement for `numeric` / `integer` features lies below the observed minimum
#' (`TRUE`) or above the observed maximum (`FALSE`). Initialized to `TRUE`.
#' \item \code{offset} :: \code{numeric(1)}\cr
#' Non-negative constant distance between the observed extreme and the replacement.
#' Initialized to `1`.
#' \item \code{multiplier} :: \code{numeric(1)}\cr
#' Non-negative factor applied to the observed range and added to `offset`.
#' Initialized to `1`.
#' }
#'
#'
#' @examples
#' {
#'
#' # Using debug learner for example purpose
#'
#' graph <- PipeOpOOR_B$new() %>>% LearnerClassifDebug$new()
#' graph_learner <- GraphLearner$new(graph)
#'
#' # Task with NA
#' set.seed(1)
#' resample(tsk("pima"), graph_learner, rsmp("cv", folds = 3))
#' }
#' @export
PipeOpOOR_B = R6::R6Class("OOR_B_imputation",
  inherit = PipeOpImpute,
  public = list(
    initialize = function(id = "impute_oor_B", param_vals = list()) {
      ps = ParamSet$new(params = list(
        ParamLgl$new("min", tags = c("train", "predict")),
        ParamDbl$new("offset", lower = 0, tags = c("train", "predict")),
        ParamDbl$new("multiplier", lower = 0, tags = c("train", "predict"))
      ))
      ps$values = list(min = TRUE, offset = 1, multiplier = 1)
      # this is one of the few imputers that handles 'character' features!
      super$initialize(
        id,
        param_set = ps,
        param_vals = param_vals,
        feature_types = c("character", "factor", "integer", "numeric", "ordered")
      )
    }
  ),
  private = list(
    # Nothing is learned during training: in approach B the replacement value is
    # recomputed inside `.impute()` from whatever data is passed to it.
    .train_imputer = function(feature, type, context) {
      NULL
    },

    # Replace the missing entries of `feature` by an out-of-range value derived
    # from `feature` itself. `model` and `context` are part of the signature but
    # are not used.
    .impute = function(feature, type, model, context) {
      replacement = private$.oor_value(feature, type)
      if (type %in% c("factor", "ordered")) {
        # the replacement must be a level before it can be assigned
        levels(feature) = c(levels(feature), as.character(replacement))
      }
      feature[is.na(feature)] = replacement
      feature
    },

    # Compute the single replacement value for `feature` of the given `type`.
    .oor_value = function(feature, type) {
      if (type %in% c("factor", "ordered", "character")) {
        return(".MISSING") # early exit
      }
      pv = self$param_set$values
      observed = feature[!is.na(feature)]
      if (length(observed) == 0L) {
        # No observed value: min()/max() would warn and return +/-Inf, which
        # turns the result into Inf, NaN or NA_integer_. Anchor at 0 instead.
        lower = 0
        upper = 0
      } else {
        lower = min(observed)
        upper = max(observed)
      }
      distance = pv$offset + pv$multiplier * (upper - lower)
      oor = if (pv$min) lower - distance else upper + distance
      if (type == "integer") {
        oor = as.integer(round(oor))
      }
      oor
    }
  )
)
# Any scripts or data that you put into this service are public.
# Add the following code to your website.
# For more information on customizing the embed code, read Embedding Snippets.