getDefaultParSetValues = function() {
nonevallist = function(...) {
as.list(match.call(expand.dots = FALSE)$...)
}
par.sets = nonevallist(
## following are set nearly accroding to caret random search spaces
# adabag boosting: AdaBoost.M1
.boosting = makeParamSet(
makeDiscreteParam(id = "coeflearn", default = "Breiman", values = c("Breiman", "Freund", "Zhu")),
makeNumericParam(id = "mfinal", default = log2(100L/10), lower = log2(1/10), upper = log2(1000/10), trafo = function(x) floor(2^x * 10)),
makeIntegerParam(id = "maxdepth", default = 30L, lower = 1L, upper = 30L)
),
# C50: C5.0
.C50 = makeParamSet(
makeIntegerParam(id = "trials", lower = 1L, default = 1L, upper = 100L),
makeLogicalParam(id = "winnow", default = FALSE)
),
# Regularized Random Forest (more like RFFglobal in caret)
.RRF = makeParamSet(
makeIntegerParam(id = "mtry", lower = 1L, default = expression(floor(p/3)), upper = expression(p)),
makeNumericParam(id = "coefReg", default = 0.8, lower = 0, upper = 1),
keys = "p"
),
# ada
.ada = makeParamSet(
makeNumericParam(id = "iter", default = log2(50/10), lower = log2(1/10), upper = log2(1000/10), trafo = function(x) floor(2^x * 10)),
makeIntegerParam(id = "maxdepth", default = 10L, lower = 1L, upper = 10L), # mlr recommends 30 as default
makeNumericParam(id = "nu", default = 0.1, lower = 0.001, upper = 0.5)
),
# blackboost
.blackboost = makeParamSet(
makeIntegerParam(id = "maxdepth", default = 2L, lower = 1L, upper = 10L),
makeNumericParam(id = "mstop", default = log2(100/10), lower = log2(1/10), upper = log2(1000/10), trafo = function(x) floor(2^x * 10))
),
# extraTrees
classif.extraTrees = makeParamSet(
makeIntegerParam(id = "mtry", lower = 1L, upper = expression(p), default = expression(floor(sqrt(p)))),
makeIntegerParam(id = "numRandomCuts", default = 1L, lower = 1L, upper = 25L),
keys = "p"
),
regr.extraTrees = makeParamSet(
makeIntegerParam(id = "mtry", lower = 1L, upper = expression(p), default = expression(max(floor(p/3), 1))),
makeIntegerParam(id = "numRandomCuts", default = 1L, lower = 1L, upper = 25L),
keys = "p"
),
# For ksvm caret uses kernlab::sigest() +- 0.75
.ksvm = makeParamSet(
makeNumericParam(id = "C", upper = 10, lower = -5, trafo = function(x) 2^x, default = log2(1)),
makeNumericParam(id = "sigma", upper = 15, lower = -15, trafo = function(x) 2^x, default = expression(kernlab::sigest(as.matrix(getTaskData(task, target.extra = TRUE)[["data"]])), scaled = TRUE)),
keys = "task"
),
# glmboost
.glmboost = makeParamSet(
makeNumericParam(id = "mstop", default = log2(100/10), lower = log2(1/10), upper = log2(1000/10), trafo = function(x) floor(2^x * 10)),
makeNumericParam("nu", lower = 0, upper = 1, default = 0.1)
),
# gbm - shrinkage in caret : 0.6 (high numbres produce NAs for small data.sets)
.gbm = makeParamSet(
makeNumericParam(id = "n.trees", lower = log2(10/10), upper = log2(1000/10), trafo = function(x) round(2^x * 10), default = log2(500/10)),
makeIntegerParam(id = "interaction.depth", default = 1L, lower = 1L, upper = 10L),
makeNumericParam(id = "shrinkage", default = 0.001, lower = 0.001, upper = 0.6),
makeIntegerParam(id = "n.minobsinnode", default = 10L, lower = 5L, upper = 25L)
),
# rpart - caret does an initial fit here, we diverge completely
.rpart = makeParamSet(
makeNumericParam(id = "cp", default = log2(0.01), lower = -10, upper = 0, trafo = function(x) 2^x),
makeIntegerParam(id = "maxdepth", default = 30L, lower = 3L, upper = 30L),
makeIntegerParam(id = "minbucket", default = 7L, lower = 5L, upper = 50L),
makeIntegerParam(id = "minsplit", default = 20L, lower = 5L, upper = 50L)
),
# nnet
.nnet = makeParamSet(
makeIntegerParam(id = "size", default = 3L, lower = 1L, upper = 20L),
makeNumericParam(id = "decay", default = 10^(-5), lower = -5, upper = 1, trafo = function(x) 10^x)
),
# glmnet - caret does an inital fit here (only for the grid search)
.glmnet = makeParamSet(
makeNumericParam(id = "alpha", default = 1, lower = 0, upper = 1),
makeNumericParam(id = "lambda", default = log2(1), lower = -10, upper = 3, trafo = function(x) 2^x)
),
# xgbTree (in mlr booster = gbtree) default
.xgboost = makeParamSet(
makeNumericParam(id = "nrounds", lower = log2(10/10), upper = log2(4000/10), trafo = function(x) round(2^x * 10), default = log2(10/10)),
makeIntegerParam(id = "max_depth", default = 6L, lower = 1L, upper = 10L),
makeNumericParam(id = "eta", default = 0.3, lower = 0.001, upper = 0.6),
makeNumericParam(id = "gamma", default = 0, lower = 0, upper = 10),
makeNumericParam(id = "colsample_bytree", default = 0.5, lower = 0.3, upper = 0.7),
makeNumericParam(id = "min_child_weight", default = 1, lower = 0, upper = 20),
makeNumericParam(id = "subsample", default = 1, lower = 0.25, upper = 1)
),
## not compared to caret
# random forest (only mtry in caret)
classif.randomForest = makeParamSet(
makeIntegerParam("nodesize", lower = 1, upper = 10, default = 1),
makeIntegerParam("mtry", lower = 1L, upper = expression(p), default = expression(floor(sqrt(p)))),
keys = "p"
),
regr.randomForest = makeParamSet(
makeIntegerParam("nodesize", lower = 1, upper = 10, default = 1),
makeIntegerParam(id = "mtry", lower = 1L, upper = expression(p), default = expression(max(floor(p/3), 1))),
keys = "p"
),
classif.ranger = makeParamSet(
makeIntegerParam("mtry", lower = 1L, upper = expression(p), default = expression(floor(sqrt(p)))),
makeIntegerParam("min.node.size", lower = 1, upper = 10, default = 1),
keys = "p"
),
regr.ranger = makeParamSet(
makeIntegerParam("mtry", lower = 1L, upper = expression(p), default = expression(max(floor(p/3), 1))),
makeIntegerParam("min.node.size", lower = 1, upper = 10, default = 5),
keys = "p"
),
## svm
.svm = makeParamSet(
makeNumericParam(id = "cost", upper = 15, lower = -15, trafo = function(x) 2^x, default = log2(1)),
makeNumericParam(id = "gamma", upper = 15, lower = -15, trafo = function(x) 2^x, default = expression(log2(1/p))),
keys = "p"
)
)
par.vals = nonevallist()
mkps = function(par.set, par.vals = NULL) {
list(par.set.call = par.set, par.vals.call = par.vals)
}
Map(mkps, par.set = par.sets, par.vals = par.vals[names(par.sets)])
}
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.