R/learner_LiblineaR_classif_liblinear.R

#' @title LiblineaR Classification Learner
#' @author be-marc
#' @name mlr_learners_classif.liblinear
#'
#' @description
#' L2 regularized support vector classification.
#' Calls [LiblineaR::LiblineaR()] from \CRANpkg{LiblineaR}.
#'
#' @template learner
#' @templateVar id classif.liblinear
#'
#' @details Type of SVC depends on `type` argument:
#'
#' * `0` – L2-regularized logistic regression (primal)
#' * `1` - L2-regularized L2-loss support vector classification (dual)
#' * `3` - L2-regularized L1-loss support vector classification (dual)
#' * `2` – L2-regularized L2-loss support vector classification (primal)
#' * `4` – Support vector classification by Crammer and Singer
#' * `5` - L1-regularized L2-loss support vector classification
#' * `6` - L1-regularized logistic regression
#' * `7` - L2-regularized logistic regression (dual)
#'
#' If number of records > number of features, `type = 2` is faster than `type = 1`
#' (Hsu et al. 2003).
#'
#' Note that probabilistic predictions are only available for types `0`, `6`, and `7`.
#' The default `epsilon` value depends on the `type` parameter, see [LiblineaR::LiblineaR].
#'
#' @references
#' `r format_bib("fan2008liblinear")`
#'
#' @export
#' @template seealso_learner
#' @template example
LearnerClassifLiblineaR = R6Class("LearnerClassifLiblineaR", # nolint
  inherit = LearnerClassif,
  public = list(

    #' @description
    #' Creates a new instance of this [R6][R6::R6Class] class.
    initialize = function() {

      ps = ps(
        type = p_int(default = 0, lower = 0, upper = 7, tags = "train"),
        cost = p_dbl(default = 1, lower = 0, tags = "train"),
        epsilon = p_dbl(lower = 0, tags = "train"),
        bias = p_dbl(default = 1, tags = "train"),
        cross = p_int(default = 0L, lower = 0L, tags = "train"),
        verbose = p_lgl(default = FALSE, tags = "train"),
        wi = p_uty(default = NULL, tags = "train"),
        findC = p_lgl(default = FALSE, tags = "train"),
        useInitC = p_lgl(default = TRUE, tags = "train")
      )

      # 50 is an arbitrary choice here
      ps$add_dep("findC", "cross", CondAnyOf$new(seq(2:50)))
      ps$add_dep("useInitC", "findC", CondEqual$new(TRUE))

      super$initialize(
        id = "classif.liblinear",
        packages = c("mlr3extralearners", "LiblineaR"),
        feature_types = "numeric",
        predict_types = c("response", "prob"),
        param_set = ps,
        properties = c("twoclass", "multiclass"),
        man = "mlr3extralearners::mlr_learners_classif.liblinear",
        label = "Support Vector Machine"
      )
    }
  ),
  private = list(
    .train = function(task) {
      pars = self$param_set$get_values(tags = "train")
      data = task$data()
      train = task$data(cols = task$feature_names)
      target = task$truth()

      type = ifelse(is.null(pars$type), 0, pars$type)
      pars = pars[names(pars) != "type"]

      invoke(LiblineaR::LiblineaR, data = train, target = target, type = type, .args = pars)
    },

    .predict = function(task) {
      newdata = ordered_features(task, self)
      pars = self$param_set$get_values(tags = "predict")

      type = ifelse(is.null(self$param_set$values$type), 0, self$param_set$values$type)

      if (type %nin% c(0, 6, 7) && self$predict_type == "prob") {
        stop("'prob' predict_type only possible if `type` is `0`, `6`, or `7`.")
      }

      if (self$predict_type == "prob") {
        pred = invoke(predict, self$model, newx = newdata, proba = TRUE, .args = pars)
        return(list(prob = pred$probabilities))
      } else {
        pred = invoke(predict, self$model, newx = newdata, .args = pars)
        return(list(response = pred$predictions))
      }
    }
  )
)

.extralrns_dict$add("classif.liblinear", LearnerClassifLiblineaR)
mlr-org/mlr3extralearners documentation built on May 23, 2024, 2:09 p.m.