inst/tinytest/test-pkg-mgcv.R

source("helpers.R")
# if (!EXPENSIVE) exit_file("EXPENSIVE")
using("marginaleffects")


requiet("mgcv")
requiet("emmeans")
requiet("tibble")
requiet("tsModel")


# marginaleffects vs. emtrends
set.seed(2)
void <- capture.output(dat <- gamSim(1, n = 400, dist = "normal", scale = 2))
void <- capture.output(dat2 <- gamSim(1, n = 2000, dist = "poisson", scale = .1))
dat <- dat
dat2 <- dat2
m1 <- mgcv::gam(y ~ s(x0) + s(x1) + s(x2) + s(x3), data = dat)
m2 <- mgcv::gam(y ~ te(x0, x1, k = 7) + s(x2) + s(x3), data = dat, method = "REML")
m3 <- mgcv::gam(y ~ s(x0) + s(x1) + s(x2) + s(x3) + ti(x1, x2, k = 6), data = dat, method = "REML")
m4 <- mgcv::gam(y ~ s(x0, x1, k = 40) + s(x2) + s(x3), data = dat, method = "REML")
m5 <- mgcv::gam(y ~ s(x0) + s(x1) + s(x2) + s(x3), data = dat, method = "REML", select = TRUE)
m6 <- mgcv::gam(y ~ s(x0) + s(x1) + s(x2) + s(x3), sp = c(0.01, -1, -1, -1), data = dat)
m7 <- mgcv::gam(y ~ s(x0, sp = .01) + s(x1) + s(x2) + s(x3), data = dat)
m8 <- mgcv::gam(y ~ s(x0) + s(x1) + s(x2) + s(x3), min.sp = c(0.001, 0.01, 0, 10), data = dat)
m9 <- mgcv::gam(y ~ s(x0, bs = "cr") + s(x1, bs = "cr") + s(x2, bs = "cr") +
      s(x3, bs = "cr"), family = poisson, data = dat2, method = "REML")
expect_slopes(m1)
expect_slopes(m2)
expect_slopes(m3)
expect_slopes(m4)
expect_slopes(m5)
expect_slopes(m6)
expect_slopes(m7)
expect_slopes(m8)
expect_slopes(m9)


# emtrends
mfx <- slopes(m1,
    variables = "x1",
    newdata = datagrid(
        x1 = 0,
        x2 = 0,
        x3 = 0),
    type = "link")

# TODO: emmeans no longer seems to work
# em <- emtrends(m1, specs = ~x1, var = "x1", at = list(x1 = 0, x2 = 0, x3 = 0))
# em <- tidy(em)
# expect_equivalent(mfx$estimate, em$x1.trend)
# expect_equivalent(mfx$std.error, em$std.error, tolerance = .0001)


# predictions: no validity
set.seed(2)
void <- capture.output(dat <- gamSim(1, n = 400, dist = "normal", scale = 2))
dat <- dat
mod <- mgcv::gam(y ~ s(x0) + s(x1) + s(x2) + s(x3), data = dat)
pred1 <- predictions(mod)
pred2 <- predictions(mod, newdata = head(dat))
expect_predictions(pred1, n_row = nrow(dat))
expect_predictions(pred2, n_row = 6)

# Issue #364: predictions confidence intervals for binomial models
void <- capture.output(
    dat <- suppressMessages(gamSim(1, n = 400, dist = "binary", scale = .33)))
m <- bam(
    y ~ s(x0) + s(x1) + s(x2) + s(x3),
    family = binomial,
    data = dat,
    method = "REML"
)
p <- predictions(m)
expect_true("conf.low" %in% colnames(p))
expect_true("conf.high" %in% colnames(p))


# Issue #363: matrix column in predictors
test1 <- function(x, z, sx = 0.3, sz = 0.4) {
    x <- x * 20
    (pi**sx * sz) * (1.2 * exp(-(x - 0.2)^2 / sx^2 - (z - 0.3)^2 / sz^2) +
        0.8 * exp(-(x - 0.7)^2 / sx^2 - (z - 0.8)^2 / sz^2))
}
n <- 500
x <- runif(n) / 20
z <- runif(n)
f <- test1(x, z)
y <- f + rnorm(n) * 0.2
df <- tibble::tibble(y, x, z)
df <- poorman::mutate(
    df,
    x_lags = tsModel::Lag(x, 0:10),
    L = matrix(0:10, nrow = 1))
b <- mgcv::gam(y ~ s(z) + te(x_lags, L), data = df)
mfx <- suppressWarnings(slopes(b))
cmp <- suppressWarnings(comparisons(b))
pre <- predictions(b)
expect_inherits(pre, "predictions")
expect_inherits(mfx, "marginaleffects")
expect_inherits(cmp, "comparisons")
# only one regressor since others are matrix columns
expect_true(all(mfx$term == "z"))
expect_true(all(cmp$term == "z"))

expect_error(suppressWarnings(slopes(b, variables = "L")), pattern = "no valid")
expect_error(suppressWarnings(comparisons(b, variables = "L")), pattern = "no valid")
expect_warning(plot_predictions(b, condition = "z"), pattern = "Matrix columns")
expect_warning(plot_slopes(b, variables = "L", condition = "z"), pattern = "Matrix columns")


# Issue #365: exclude argument changes predictions
void <- capture.output(
    dat <- gamSim(1, n = 400, dist = "normal", scale = 2)
)
b <- bam(y ~ s(x0) + s(x1) + s(x2) + s(x3), data = dat)
p1 <- predictions(b)
p2 <- predictions(b, exclude = "s(x3)")
expect_true(all(p1$estimate != p2$estimate))


# exclude a smooth
requiet("itsadug")
set.seed(1024)
data(simdat)
simdat$Subject <- as.factor(simdat$Subject)
model <- bam(Y ~ Group + s(Time, by = Group) + s(Subject, bs = "re"), data = simdat)
nd <- datagrid(
    model = model,
    Subject = "a01",
    Group = "Adults")

expect_equivalent(
    predictions(model, newdata = nd)$estimate,
    predict(model, newdata = nd)[1])

expect_equivalent(
    predictions(model, newdata = nd, exclude = "s(Subject)")$estimate,
    predict(model, newdata = nd, exclude = "s(Subject)")[1])


mfx <- slopes(model, newdata = "mean", variables = "Time", type = "link")
emt <- suppressMessages(data.frame(
    emtrends(model, ~Time, "Time", at = list(Time = 1000, Subject = "a01", Group = "Adults"))))
expect_equivalent(mfx$estimate, emt$Time.trend, tolerance = 1e-2)
expect_equivalent(mfx$std.error, emt$SE, tolerance = 1e-3)

# Issue #545
p <- plot_slopes(model, variables = "Time", condition = "Time", draw = FALSE)
expect_true(nrow(p) > 1)



# Issue #844
df <- transform(mtcars, gear = as.integer(gear))

mod <- gam(
    gear ~ s(hp) + cyl,
    data = df,
    family = ocat(R = 5)
)

pre <- avg_predictions(model = mod)
slo <- avg_slopes(mod)
cmp <- comparisons(mod)
expect_inherits(pre, "predictions")
expect_inherits(slo, "slopes")
expect_inherits(cmp, "comparisons")




# Issue #931
simdat$Subject <- as.factor(simdat$Subject)
model <- bam(Y ~ Group + s(Time, by = Group) + s(Subject, bs = "re"),
             data = simdat)

low = function(hi, lo, x) {
    dydx <- (hi - lo) / 1e-6
    dydx_min <- min(dydx)
    x[dydx == dydx_min][1]
}
cmp <- comparisons(model,
  variables = list("Time" = 1e-6),
  vcov = FALSE,
  by = "Group",
  comparison = low
)
expect_inherits(cmp, "comparisons")
expect_equal(nrow(cmp), 2)

rm(list = ls())

Try the marginaleffects package in your browser

Any scripts or data that you put into this service are public.

marginaleffects documentation built on Oct. 20, 2023, 1:07 a.m.