tests/testthat/test-simulation_helpers.R

context("test-simulation_helpers")

# Define variables
set.seed(1991)
u <- sample(1e6, 1)
n <- sample(1:1e3, 1)
p <- sample(1:50, 1)
tail_index <- sample(1:10, 1)
prob_connect <- runif(1)

# Run tests
test_that("pick elements works", {

  # vec has length 0
  expect_equal(pick_elements(vec = numeric(0), prob = 0), numeric(0))
  expect_equal(pick_elements(vec = numeric(0), prob = 1), numeric(0))
  expect_equal(pick_elements(vec = numeric(0), prob = 0.3), numeric(0))

  # vec has length 1
  set.seed(u)
  vec <- c(1)
  proba <- 0.3
  r <- rbinom(n = length(vec), size = 1, proba)
  picked <- vec[r == 1]
  expect_equal(pick_elements(vec = vec, prob = 0), numeric(0))
  expect_equal(pick_elements(vec = vec, prob = 1), c(1))
  set.seed(u)
  expect_equal(pick_elements(vec = vec, prob = proba), picked)

  # vec has length > 1
  set.seed(u)
  vec <- c(4, 0, 3, 1)
  proba <- 0.3
  r <- rbinom(n = length(vec), size = 1, proba)
  picked <- vec[r == 1]
  expect_equal(pick_elements(vec = vec, prob = 0), numeric(0))
  expect_equal(pick_elements(vec = vec, prob = 1), vec)
  set.seed(u)
  expect_equal(pick_elements(vec = vec, prob = proba), picked)

})

test_that("inverse mirror uniform works", {
  lb <- runif(1)
  ub <- lb + runif(1)
  expect_equal(inverse_mirror_uniform(prob = 0, min = lb, max = ub), -ub)
  expect_equal(inverse_mirror_uniform(prob = 1, min = lb, max = ub), ub)
  expect_equal(inverse_mirror_uniform(prob = 1 / 2, min = lb, max = ub), lb)
  expect_equal(inverse_mirror_uniform(prob = 1 / 4, min = lb, max = ub),
               2 * 1 / 4 * (ub - lb) - ub)
  expect_equal(inverse_mirror_uniform(prob = 3 / 4, min = lb, max = ub),
               (2 * 3 / 4 - 1) * (ub - lb) + lb)

  expect_error(inverse_mirror_uniform(prob = runif(1), min = ub, max = lb))
  expect_error(inverse_mirror_uniform(prob = runif(1), min = -ub, max = lb))
  expect_error(inverse_mirror_uniform(prob = runif(1), min = ub, max = -lb))
  expect_error(inverse_mirror_uniform(prob = runif(1), min = -ub, max = -lb))
  expect_error(inverse_mirror_uniform(prob = 1.2, min = lb, max = ub))

})

test_that("sample uniform works", {
  n <- 7
  lb <- runif(1)
  ub <- lb + runif(1)

  # mirror == FALSE
  set.seed(u)
  r <- runif(n, min = lb, max = ub)
  set.seed(u)
  expect_equal(sample_uniform(n = n, min = lb, max = ub), r)

  set.seed(u)
  r <- runif(n, min = -ub, max = -lb)
  set.seed(u)
  expect_equal(sample_uniform(n = n, min = -ub, max = -lb), r)

  expect_error(sample_uniform(n = n, min = ub, max = lb))

  # mirror == TRUE
  set.seed(u)
  r <- sapply(runif(n), inverse_mirror_uniform, min = lb, max = ub)
  set.seed(u)
  expect_equal(sample_uniform(n = n, min = lb, max = ub, mirror = TRUE), r)

  expect_error(sample_uniform(n = n, min = -ub, max = -lb, mirror = TRUE))
  expect_error(sample_uniform(n = n, min = -ub, max =  lb, mirror = TRUE))
  expect_error(sample_uniform(n = n, min =  ub, max = -lb, mirror = TRUE))
  expect_error(sample_uniform(n = n, min = ub, max = lb, mirror = TRUE))

})

test_that("random dag works", {
  # caus_order has length 0
  expect_error(random_dag(p = 0, prob = 0, caus_order = numeric(0)))
  expect_error(random_dag(p = 0, prob = 1, caus_order = numeric(0)))
  expect_error(random_dag(p = 0, prob = 0.4, caus_order = numeric(0)))

  # caus_order has length 1
  caus_order <- c(1)

  expect_equal(random_dag(p = 1, prob = 0, caus_order = caus_order),
               matrix(0))
  expect_equal(random_dag(p = 1, prob = 1, caus_order = caus_order),
               matrix(0))
  expect_equal(random_dag(p = 1, prob = 0.5, caus_order = caus_order),
               matrix(0))

  # caus_order has length > 1
  p <- 4
  caus_order <- sample(p)

  dag_empty <- matrix(0, nrow = length(caus_order), ncol = length(caus_order))
  expect_equal(random_dag(p = p, prob = 0, caus_order = caus_order),
               dag_empty)

  dag_full <-  caus_order_to_dag(caus_order)
  expect_equal(random_dag(p = p, prob = 1, caus_order = caus_order),
               dag_full)

  proba <- runif(1)
  dag <- matrix(0, nrow = length(caus_order), ncol = length(caus_order))

  set.seed(u)
  elms <- pick_elements(caus_order[2:p], proba)
  dag[caus_order[1], elms] <- 1
  elms <- pick_elements(caus_order[3:p], proba)
  dag[caus_order[2], elms] <- 1
  elms <- pick_elements(caus_order[4:p], proba)
  dag[caus_order[3], elms] <- 1

  set.seed(u)
  expect_equal(random_dag(p = p, prob = proba, caus_order = caus_order),
               dag)


  # mismatch between length of caus_order and p
  expect_error(random_dag(p = 1, prob = 0, caus_order = sample(p)))
  expect_error(random_dag(p = 1, prob = 1, caus_order = sample(p)))
  expect_error(random_dag(p = 1, prob = 0.4, caus_order = sample(p)))



})

test_that("random coefficients works", {
  lb <- runif(1)
  ub <- lb + runif(1)


  # DAG has one variable
  expect_equal(random_coeff(matrix(0), lb = lb, ub = ub,
                            two_intervals = FALSE), matrix(0))
  expect_equal(random_coeff(matrix(0), lb = lb, ub = ub,
                            two_intervals = TRUE), matrix(0))

  # DAG has > 1 variable
  p <- 7
  g <- random_dag(p = p, prob = runif(1))

  num_coeff <- sum(g)

  # two_intervals == TRUE
  g_coeff <- matrix(0, nrow = p, ncol = p)
  set.seed(u)
  g_coeff[g == 1] <- sample_uniform(n = num_coeff, min = lb, max = ub,
                                    mirror = TRUE)
  set.seed(u)
  expect_equal(random_coeff(g, lb = lb, ub = ub, two_intervals = TRUE),
               g_coeff)

  # two_intervals == FALSE
  g_coeff <- matrix(0, nrow = p, ncol = p)
  set.seed(u)
  g_coeff[g == 1] <- sample_uniform(n = num_coeff, min = lb, max = ub,
                                    mirror = FALSE)
  set.seed(u)
  expect_equal(random_coeff(g, lb = lb, ub = ub, two_intervals = FALSE),
               g_coeff)

  # not adjacency matrix
  expect_error(random_coeff(g * 0.1, lb = lb, ub = ub, two_intervals = FALSE))
  expect_error(random_coeff(g * 0.1, lb = lb, ub = ub, two_intervals = TRUE))

  # lb > ub
  expect_error(random_coeff(g, lb = ub, ub = lb, two_intervals = FALSE))
  expect_error(random_coeff(g, lb = ub, ub = lb, two_intervals = TRUE))

  # if two_intervals == TRUE, lb > 0 and ub > 0
  expect_error(random_coeff(g, lb = -ub, ub =  lb, two_intervals = TRUE))
  expect_error(random_coeff(g, lb =  ub, ub = -lb, two_intervals = TRUE))
  expect_error(random_coeff(g, lb = -ub, ub = -lb, two_intervals = TRUE))

})

test_that("add random confounders works", {

  ### p = 1
  p <- 1

  dag <- random_dag(p, prob_connect = runif(1))
  out <- add_random_confounders(dag, prob_confound = runif(1))

  # is the output the right size?
  expect_equal(NROW(out$dag_confounders), p + p * (p - 1) / 2)

  # are there zero confounders?
  expect_equal(length(out$pos_confounders), 0)

  ### p > 1
  p <- sample(2:20, 1)

  ## Proba confounder = 1
  prob_confound <- 1
  dag <- random_dag(p, prob_connect = runif(1))
  out <- add_random_confounders(dag, prob_confound = prob_confound)


  if (length(out$pos_confounders) == 1){

    # are the confounders affecting only 2 vars at a time?
    expect_equal(sum(out$dag_confounders[out$pos_confounders, ]), 2)

    # are the confounders actually source nodes?
    expect_equal(sum(out$dag_confounders[, out$pos_confounders]), 0)

  } else {

    # are the confounders affecting only 2 vars at a time?
    expect_equal(apply(out$dag_confounders[out$pos_confounders, ], 1, sum),
                 rep(2, length(out$pos_confounders)))

    # are the confounders actually source nodes?
    expect_equal(apply(out$dag_confounders[, out$pos_confounders], 2, sum),
                 rep(0, length(out$pos_confounders)))
  }


  ## Proba confounder = 0
  prob_confound <- 0
  dag <- random_dag(p, prob_connect = runif(1))
  out <- add_random_confounders(dag, prob_confound = prob_confound)

  # is the output the right size?
  expect_equal(NROW(out$dag_confounders), p)

  # are there zero confounders?
  expect_equal(length(out$pos_confounders), 0)

  # are the confounders affecting only 2 vars at a time?
  expect_equal(apply(out$dag_confounders[out$pos_confounders, ], 1, sum),
               rep(2, length(out$pos_confounders)))

  # are the confounders actually source nodes?
  expect_equal(apply(out$dag_confounders[, out$pos_confounders], 2, sum),
               rep(0, length(out$pos_confounders)))


  ## Proba confounder in (0, 1)
  prob_confound <- runif(1)
  dag <- random_dag(p, prob_connect = runif(1))
  out <- add_random_confounders(dag, prob_confound = prob_confound)

  # is the output the right size?
  expect_lte(NROW(out$dag_confounders), p + p * (p - 1) / 2)
  expect_gte(NROW(out$dag_confounders), p)

  if (length(out$pos_confounders) == 1){

    # are the confounders affecting only 2 vars at a time?
    expect_equal(sum(out$dag_confounders[out$pos_confounders, ]), 2)

    # are the confounders actually source nodes?
    expect_equal(sum(out$dag_confounders[, out$pos_confounders]), 0)

  } else {

    # are the confounders affecting only 2 vars at a time?
    expect_equal(apply(out$dag_confounders[out$pos_confounders, ], 1, sum),
                 rep(2, length(out$pos_confounders)))

    # are the confounders actually source nodes?
    expect_equal(apply(out$dag_confounders[, out$pos_confounders], 2, sum),
                 rep(0, length(out$pos_confounders)))
  }

  ## Error
  dag <- random_dag(5, prob_connect = 1)
  expect_error(add_random_confounders(dag * 0.1, runif(1)))

})

test_that("simulate noise works", {

  p <- sample(1:20, 1)

  ## check that size is correct
  # student_t
  sim <- simulate_noise(n, p, "student_t", tail_index)
  expect_equal(NROW(sim), n)
  expect_equal(NCOL(sim), p)

  # gaussian
  sim <- simulate_noise(n, p, "gaussian", tail_index)
  expect_equal(NROW(sim), n)
  expect_equal(NCOL(sim), p)

  # log_norm
  sim <- simulate_noise(n, p, "log_normal", tail_index)
  expect_equal(NROW(sim), n)
  expect_equal(NCOL(sim), p)

  ## Error
  expect_error(simulate_noise(n, p, "blahblah", tail_index))
  expect_error(simulate_noise(1, 2, tail_index = 1.5))
  expect_error(simulate_noise(2, 1, tail_index = 1.5))
  expect_error(simulate_noise(1, 1, tail_index = 1.5))
})

test_that("uniform margin works", {
  p <- sample(0:10)
  v <- rnorm(p)
  expect_equal(uniform_margin(v), rank(v) / length(v))
})

test_that("broken hockeystick works", {
  n <- sample(0:10, 1)
  v <- rnorm(n)

  v_temp <- v
  r <- rank(v_temp, ties.method = "first")
  q_low <- runif(1)
  q_high <- runif(1)
  v_temp[r > floor(n * q_low) & r <= ceiling(n * q_high)] <- 0

  expect_equal(broken_hockeystick(v, q_low, q_high), v_temp)
})

test_that("nonlinear scm works", {
  dag <- random_dag(3, prob_connect = 1, caus_order = 1:3)
  adj_mat <- random_coeff(dag)
  noise <- simulate_noise(n, 3, distr = "student_t", tail_index = tail_index)
  X <- matrix(0, nrow = n, ncol = 3)
  X[, 1] <- noise[, 1]
  X[, 2] <- adj_mat[1, 2] * broken_hockeystick(X[, 1]) + noise[, 2]
  X[, 3] <- adj_mat[1, 3] * broken_hockeystick(X[, 1]) +
    adj_mat[2, 3] * broken_hockeystick(X[, 2]) + noise[, 3]
  expect_equal(nonlinear_scm(adj_mat, noise), X)
})
nicolagnecco/causalXtreme documentation built on April 21, 2024, 4:22 a.m.