impute_missing: Missing values imputation wrapper

Description Usage Arguments Value Examples

View source: R/missingValues.R

Description

Missing values imputation wrapper

Usage

1
impute_missing(dataset, method, exclude = NULL, ...)

Arguments

dataset

we want to impute missing values on

method

selected method of missing values imputation

exclude

character. Vector of attributes to exclude from the missing values treatment

...

Further arguments for method

Value

The treated dataset (either with noisy instances replaced or erased)

Examples

 1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
library("smartdata")
data(africa, package = "Amelia")
data(nhanes, package = "mice")
data(ozone,  package = "missMDA")
data(vnf,    package = "missMDA")
data(orange, package = "missMDA")
data(sleep,  package = "VIM")

super_nhanes <- impute_missing(nhanes, "gibbs_sampling")
super_nhanes <- impute_missing(nhanes, "gibbs_sampling", exclude = "chl")
# Use a different method for every column
impute_methods <- c("pmm", "midastouch", "norm_nob", "norm_boot")
super_nhanes <- impute_missing(nhanes, "gibbs_sampling", imputation = impute_methods)
super_nhanes <- impute_missing(nhanes, "central_imputation")
super_africa <- impute_missing(africa, "knn_imputation")
# Execute knn imputation with non default value for k
super_africa <- impute_missing(africa, "knn_imputation", k = 5)
super_africa <- impute_missing(africa, "expect_maximization", exclude = "country")
super_africa <- impute_missing(africa, "rf_imputation", num_iterations = 15,
                               num_trees = 200, bootstrap = FALSE)
# Examples of calls to 'PCA imputation' with wholly numeric datasets

super_orange <- impute_missing(orange, "PCA_imputation", num_dimensions = 5,
                               imputation = "EM")
super_orange <- impute_missing(orange, "PCA_imputation", num_dimensions = 5,
                               imputation = "Regularized")

super_orange <- impute_missing(orange, "PCA_imputation", num_dimensions = 5,
                               imputation = "Regularized", random_init = TRUE)
# Examples of calls to 'MCA imputation' with wholly categorical datasets

super_vnf    <- impute_missing(vnf, "MCA_imputation", num_dimensions = 5,
                               imputation = "EM")
super_vnf    <- impute_missing(vnf, "MCA_imputation", num_dimensions = 5,
                               imputation = "Regularized")

super_vnf    <- impute_missing(vnf, "MCA_imputation", num_dimensions = 5,
                               imputation = "Regularized", random_init = TRUE)
# Examples of calls to 'FAMD imputation' with hybrid datasets

super_ozone  <- impute_missing(ozone, "FAMD_imputation", num_dimensions = 5,
                               imputation = "EM", exclude = c("Ne12", "Vx15"))
super_ozone  <- impute_missing(ozone, "FAMD_imputation", num_dimensions = 5,
                               imputation = "Regularized")

super_ozone  <- impute_missing(ozone, "FAMD_imputation", num_dimensions = 5,
                               imputation = "Regularized", random_init = TRUE)

# Examples of hotdeck, iterative robust and reggresion imputations
super_sleep <- impute_missing(sleep, "hotdeck")
super_sleep <- impute_missing(sleep, "iterative_robust", initialization = "median",
                              num_iterations = 1000)
super_sleep <- impute_missing(sleep, "regression_imputation",
                              formula = Dream+NonD~BodyWgt+BrainWgt)

# Examples of adaptative shrinkage imputation
super_ozone <- impute_missing(ozone, "ATN", sigma = 2.2)
super_ozone <- impute_missing(ozone, "ATN", lambda = 0.025, gamma = 2.5)
super_ozone <- impute_missing(ozone, "ATN", tune = "SURE")

smartdata documentation built on Dec. 19, 2019, 1:08 a.m.