tests/testthat/test-simulate-suite.R

test_that("simulate_dataset adds leakage-specific columns", {
  sim_none <- bioLeak:::.simulate_dataset(
    n = 20, p = 5, prevalence = 0.5,
    mode = "subject_grouped", leakage = "none",
    rho = 0, signal_strength = 1
  )
  expect_false("leak_subj" %in% names(sim_none$data))

  sim_subj <- bioLeak:::.simulate_dataset(
    n = 20, p = 5, prevalence = 0.5,
    mode = "subject_grouped", leakage = "subject_overlap",
    rho = 0, signal_strength = 1
  )
  expect_true("leak_subj" %in% names(sim_subj$data))

  sim_batch <- bioLeak:::.simulate_dataset(
    n = 20, p = 5, prevalence = 0.5,
    mode = "batch_blocked", leakage = "batch_confounded",
    rho = 0, signal_strength = 1
  )
  expect_true("leak_batch" %in% names(sim_batch$data))

  sim_peek <- bioLeak:::.simulate_dataset(
    n = 20, p = 5, prevalence = 0.5,
    mode = "subject_grouped", leakage = "peek_norm",
    rho = 0, signal_strength = 1
  )
  expect_true("leak_global" %in% names(sim_peek$data))

  sim_future <- bioLeak:::.simulate_dataset(
    n = 20, p = 5, prevalence = 0.5,
    mode = "time_series", leakage = "lookahead",
    rho = 0, signal_strength = 1
  )
  expect_true("leak_future" %in% names(sim_future$data))
})

test_that("simulate_leakage_suite runs when required learners are available", {
  if (!requireNamespace("glmnet", quietly = TRUE)) {
    expect_error(simulate_leakage_suite(
      n = 80, p = 5, prevalence = 0.5,
      mode = "batch_blocked", learner = "glmnet",
      leakage = "none", rho = 0, K = 3, repeats = 1,
      B = 2, seeds = 1, parallel = FALSE, signal_strength = 1
    ), "glmnet")
  } else {
    res <- simulate_leakage_suite(
      n = 80, p = 5, prevalence = 0.5,
      mode = "batch_blocked", learner = "glmnet",
      leakage = "none", rho = 0, K = 3, repeats = 1,
      B = 2, seeds = 1, parallel = FALSE, signal_strength = 1
    )
    expect_true(inherits(res, "LeakSimResults"))
    expect_true(all(c("seed", "metric_obs", "gap", "p_value", "leakage", "mode") %in% names(res)))
  }
})

# test_that("simulate_leakage_suite accepts preprocess overrides", {
#   skip_if_not_installed("glmnet")
#   res <- simulate_leakage_suite(
#     n = 80, p = 4, prevalence = 0.5,
#     mode = "subject_grouped", learner = "glmnet",
#     leakage = "peek_norm",
#     preprocess = list(normalize = list(method = "none")),
#     rho = 0, K = 3, repeats = 1,
#     B = 2, seeds = 1, parallel = FALSE, signal_strength = 1
#   )
#   expect_true(inherits(res, "LeakSimResults"))
# })

Try the bioLeak package in your browser

Any scripts or data that you put into this service are public.

bioLeak documentation built on March 6, 2026, 1:06 a.m.