test-processing.R
In sperrorest: Perform Spatial Error Estimation and Variable Importance Assessment

library("rpart")
library("MASS")
# runfolds Sun May 21 22:58:39 2017 ------------------------------

test_that("runfolds works on missing factor levels in
          test data example", {
  skip("internal use")

  df <- readRDS("inst/testfiles/pathogen_data.rds")
  fo <- diplo01 ~ temp + p_sum + r_sum + elevation + slope + hail +
    age + ph + lithology + soil

  current_sample <- partition_kmeans(df, nfold = 4)[[1]]
  current_res <- current_sample

  runfolds(
    j = 1, data = df, current_sample = current_sample,
    formula = fo,
    model_args = list(family = "binomial"),
    model_fun = glm,
    importance = TRUE,
    imp_permutations = 2,
    imp_variables = c("lithology"),
    current_res = current_res,
    pred_args = list(type = "response"),
    response = "diplo01",
    coords = c("x", "y"), progress = 1,
    pooled_obs_train = c(),
    pooled_obs_test = c(),
    err_fun = err_default
  ) -> runfolds_single
  expect_equal(length(runfolds_single), 6)
})

test_that("runfolds works on glm example", {
  skip_on_cran()

  j <- 1 # running the first repetition of 'current_sample', normally we are
  # calling an apply call to seq_along nFolds of repetition
  # see also 'runreps()'
  data <- ecuador
  current_sample <- partition_cv(ecuador, nfold = 4)[[1]]
  current_res <- current_sample
  fo <- slides ~ dem + slope + hcurv + vcurv + log.carea + cslope

  runfolds(
    j = 1, data = ecuador, current_sample = current_sample,
    formula = fo,
    model_args = list(family = "binomial"),
    model_fun = glm,
    imp_permutations = 2,
    imp_variables = c(
      "dem", "slope", "hcurv", "vcurv", "log.carea",
      "cslope"
    ),
    importance = TRUE, current_res = current_res,
    pred_args = list(type = "response"), response = "slides",
    coords = c("x", "y"), progress = 1, pooled_obs_train = c(),
    pooled_obs_test = c(), err_fun = err_default
  ) -> runfolds_single
  expect_equal(length(runfolds_single), 9)
})

test_that("runfolds works on LDA example", {
  skip_on_cran()

  data <- ecuador
  current_sample <- partition_cv(maipo, nfold = 4)[[1]]
  current_res <- current_sample

  lda_predfun <- function(object, newdata, fac = NULL) {
    library(nnet)
    majority <- function(x) {
      levels(x)[which.is.max(table(x))]
    }

    majority_filter <- function(x, fac) {
      for (lev in levels(fac)) {
        x[fac == lev] <- majority(x[fac == lev])
      }
      x
    }
    pred <- predict(object, newdata = newdata)$class
    if (!is.null(fac)) pred <- majority_filter(pred, newdata[, fac])
    return(pred)
  }

  data("maipo", package = "sperrorest")
  predictors <- colnames(maipo)[5:ncol(maipo)]
  fo <- as.formula(paste("croptype ~", paste(predictors, collapse = "+")))

  runfolds_single <- runfolds(
    j = 1, data = maipo,
    current_sample = current_sample,
    formula = fo,
    model_fun = lda,
    pred_fun = lda_predfun,
    pred_args = list(fac = "field"),
    importance = FALSE,
    current_res = current_sample,
    response = "croptype",
    coords = c("x", "y"), progress = 1,
    pooled_obs_train = c(),
    pooled_obs_test = c(), err_fun = err_default
  )
  expect_equal(length(runfolds_single), 9)
})

test_that("runfolds works on rpart example", {
  skip_on_cran()

  data <- ecuador
  current_sample <- partition_cv(ecuador, nfold = 4)[[1]]
  current_res <- current_sample

  mypred_rpart <- function(object, newdata) predict(object, newdata)[, 2]
  ctrl <- rpart.control(cp = 0.005) # show the effects of overfitting

  # Non-spatial 5-repeated 10-fold cross-validation:
  mypred_rpart <- function(object, newdata) predict(object, newdata)[, 2]

  runfolds_single <- runfolds(
    j = 1, data = ecuador,
    current_sample = current_sample,
    formula = slides ~ dem + slope + hcurv +
      vcurv + log.carea + cslope,
    model_fun = rpart,
    imp_permutations = 2, pred_fun = mypred_rpart,
    model_args = list(control = ctrl),
    imp_variables = c(
      "dem", "slope", "hcurv",
      "vcurv", "log.carea", "cslope"
    ),
    importance = TRUE,
    current_res = current_res,
    response = "slides",
    coords = c("x", "y"), progress = 1,
    pooled_obs_train = c(),
    pooled_obs_test = c(), err_fun = err_default
  )
  expect_equal(length(runfolds_single), 9)
})

# runreps Sun May 21 23:07:03 2017 ------------------------------

test_that("runreps works on lda example", {
  skip_on_cran()

  j <- 1 # running the first repetition of 'current_sample', normally we are
  # calling an apply call to seq_along nFolds of repetition
  # see also 'runreps()'
  #### 2 repetitions, 4 folds
  current_sample <- partition_cv(maipo, nfold = 4)
  current_sample[[2]] <- partition_cv(maipo, nfold = 4)[[1]]
  current_res <- current_sample

  lda_predfun <- function(object, newdata, fac = NULL) {
    library(nnet)
    majority <- function(x) {
      levels(x)[which.is.max(table(x))]
    }

    majority_filter <- function(x, fac) {
      for (lev in levels(fac)) {
        x[fac == lev] <- majority(x[fac == lev])
      }
      x
    }

    pred <- predict(object, newdata = newdata)$class
    if (!is.null(fac)) pred <- majority_filter(pred, newdata[, fac])
    return(pred)
  }

  predictors <- colnames(maipo)[5:ncol(maipo)]
  fo <- as.formula(paste("croptype ~", paste(predictors, collapse = "+")))

  runreps_res <- lapply(current_sample, function(x) {
    runreps(
      current_sample = x, data = maipo,
      formula = fo, pred_fun = lda_predfun,
      model_fun = lda,
      do_gc = 1,
      importance = FALSE, current_res = current_res,
      pred_args = list(fac = "field"), response = "croptype",
      coords = c("x", "y"), progress = 1, pooled_obs_train = c(),
      pooled_obs_test = c(), err_fun = err_default
    )
  })
  expect_equal(length(runreps_res), 2)
})

test_that("runreps works on glm example", {
  skip("internal use")

  data <- ecuador
  imp_one_rep <- readRDS("inst/test-objects/imp_one_rep.rda")
  current_sample <- readRDS("inst/test-objects/resamp.rda")
  current_res <- readRDS("inst/test-objects/current_res.rda")

  runreps_res <- lapply(current_sample, function(x) {
    runreps(
      current_sample = X, data = ecuador,
      formula = slides ~ dem + slope + hcurv + vcurv + log.carea + cslope,
      model_args = list(family = "binomial"),
      model_fun = glm,
      imp_permutations = 2,
      do_gc = 1,
      imp_variables = c(
        "dem", "slope", "hcurv", "vcurv",
        "log.carea", "cslope"
      ),
      importance = TRUE, current_res = current_res,
      pred_args = list(type = "response"), response = "slides",
      coords = c("x", "y"), progress = 1, pooled_obs_train = c(),
      pooled_obs_test = c(), err_fun = err_default
    )
  })
})

test_that("runreps works on rpart example", {
  skip("internal use")

  data <- ecuador
  imp_one_rep <- readRDS("inst/test-objects/imp_one_rep.rda")
  current_sample <- readRDS("inst/test-objects/resamp.rda")
  current_res <- readRDS("inst/test-objects/current_res.rda")

  runreps_res <- lapply(current_sample, function(x) {
    runreps(
      current_sample = X, data = ecuador,
      formula = slides ~ dem + slope + hcurv + vcurv + log.carea + cslope,
      model_fun = rpart,
      imp_permutations = 2,
      pred_fun = mypred_rpart,
      model_args = list(control = ctrl),
      imp_variables = c(
        "dem", "slope", "hcurv", "vcurv",
        "log.carea", "cslope"
      ),
      importance = TRUE, current_res = current_res,
      response = "slides",
      coords = c("x", "y"), progress = 1, pooled_obs_train = c(),
      pooled_obs_test = c(), err_fun = err_default
    )
  })
})

test_that("runfolds works on missing factor levels in
          test data example", {
  skip("internal use")

  df <- readRDS("inst/testfiles/pathogen_data.rds")
  fo <- diplo01 ~ temp + p_sum + r_sum + elevation + slope + hail +
    age + ph + lithology + soil

  current_sample <- partition_kmeans(df, nfold = 5, repetition = 1:5)
  current_res <- current_sample

  runreps_res <- lapply(current_sample, function(x) {
    runreps(
      current_sample = x, do_gc = 1,
      formula = fo, data = df,
      model_args = list(family = "binomial"),
      model_fun = glm,
      importance = TRUE,
      imp_variables = c("elevation", "lithology"),
      imp_permutations = 2,
      current_res = current_res,
      pred_args = list(type = "response"), response = "diplo01",
      coords = c("x", "y"), progress = 1,
      pooled_obs_train = c(),
      pooled_obs_test = c(), err_fun = err_default
    )
  })
  expect_equal(length(runfolds_single), 6)
})

Any scripts or data that you put into this service are public.

sperrorest documentation built on Oct. 16, 2022, 5:05 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

sperrorest
Perform Spatial Error Estimation and Variable Importance Assessment

tests/testthat/test-processing.R
In sperrorest: Perform Spatial Error Estimation and Variable Importance Assessment

Try the sperrorest package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

sperrorest Perform Spatial Error Estimation and Variable Importance Assessment

tests/testthat/test-processing.R In sperrorest: Perform Spatial Error Estimation and Variable Importance Assessment

Try the sperrorest package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

sperrorest
Perform Spatial Error Estimation and Variable Importance Assessment

tests/testthat/test-processing.R
In sperrorest: Perform Spatial Error Estimation and Variable Importance Assessment