vignettes/UsingSpikeSlabGAM.R
In spikeSlabGAM: Bayesian Variable Selection and Model Choice for Generalized Additive Mixed Models

## ----setup, include=FALSE-------------------------------------------
#use 2 cores on CRAN, potentially more if not:
use_cores <- ifelse(
  identical(Sys.getenv("NOT_CRAN"), "true"), #s. testhat::on_cran
  2,
  max(1, parallel::detectCores() - 2)
)
options(prompt = "R> ", continue = "+  ", width = 70, #JSS style
        useFancyQuotes = FALSE, digits=5, 
        mc.cores = use_cores)
clrs <- c("#E41A1C", "#377EB8", "#4DAF4A", "#984EA3", "#FF7F00", "#FFFF33",
          "#A65628", "#F781BF", "#999999")
knitr::opts_chunk$set(
  cache = TRUE,
  fig.path='UsingSpikeSlabGAM',
  dev='pdf'
)

library("spikeSlabGAM")
library("mboost")
library("ggplot2")
library("gtable")


## ----mkData, echo=T, results='hide'---------------------------------
set.seed(1312424)
n <- 200
snr <- 3

sm1 <- runif(n)
fsm1 <- dbeta(sm1, 7, 3)/2

sm2 <- runif(n, 0, 1)
f <- gl(3, n/3)
ff <- as.numeric(f)/2
fsm2f <- ff + ff * sm2 +
  ((f == 1) * -dbeta(sm2, 6, 4) + (f == 2) * dbeta(sm2, 6, 9) +
     (f == 3) * dbeta(sm2, 9, 6))/2

lin <- matrix(rnorm(n * 3), n, 3)
colnames(lin) <- paste("lin", 1:3, sep = "")

noise1 <- sm1 + rnorm(n)
noise2 <- runif(n)
noise3 <- runif(n)
noise4 <- sample(gl(4, n/4))

eta <- drop(fsm1 + fsm2f + lin %*% c(.1, .2, .3))
y <- eta + sd(eta)/snr * rt(n, df = 5)
d <- data.frame(y, sm1, sm2, f, lin, noise1, noise2, noise3, noise4)


## ----defForm1-------------------------------------------------------
f1 <- y ~ (sm1 + sm2 + f + lin1)^2 + lin2 +lin3 + noise1 + noise2 + noise3 + noise4


## ----fit1, cache=T, results='hide'----------------------------------
m <- spikeSlabGAM(formula = f1, data = d)


## ----summary1.1Fake, echo=T, eval=FALSE-----------------------------
## summary(m)


## ----summary1.1Prep, echo=FALSE, results='hide'---------------------
summ <- summary(m)


## ----summary1.1, echo=FALSE-----------------------------------------
print(summ, printModels=F)


## ----summary1.2, echo=F---------------------------------------------
#this is just ctrl-c-v from summary.spikeSlabGAM s.t. we don't get too much
#redundant info about model formula etc. roughly the same as: print(sum,
#printPGamma=F, printModels=T)
cat("\nPosterior model probabilities (inclusion threshold =",summ$thresh,"):\n")
modelTable <- {
  #make ("x","")-vectors out of model names
  models <- sapply(names(summ$modelTable), function(x){
    sapply(strsplit(gsub("1", "x", x),""),
           function(y) gsub("0", "", y))
  })
  models <- rbind(round(summ$modelTable,3), models,
                  round(cumsum(summ$modelTable), 3))
  rownames(models) <- c("prob.:",
                        names(summ$predvars[!grepl("u(", names(summ$predvars),
                                                   fixed=TRUE)]),
                        "cumulative:")
  models <- data.frame(models)
  showModels <- 8
  models <- models[,1:showModels, drop=F]
  colnames(models) <- 1:NCOL(models)
  models
}
print(modelTable)


## ----plotm1Fake, echo=TRUE, eval=FALSE------------------------------
## plot(m)


## ----plotm1prep, echo=FALSE, cache=TRUE, results='hide', fig.show='hide'----
pl <- plot(m, nrow=4, ncol=3,
           ggElems=list(theme(legend.key.size = grid:::unit(0.01, "npc"),
                              legend.text = element_text(size = 7),
                              legend.title=element_text(size=8, hjust = 0),
                              axis.text.x = element_text(size=8),
                              axis.text.y = element_text(size=8, hjust=1),
                              plot.margin=grid:::unit(c(0.5, 0, 0, 0), "lines"))))


## ----plotm1, echo=FALSE, fig.width=6, cache=TRUE, external=TRUE-----
do.call(gridExtra:::grid.arrange, c(pl, nrow=4, ncol=3))


## ----plotm1sm1Fake, echo=TRUE, eval=FALSE---------------------------
## plot(m, labels = c("lin(sm1)", "sm(sm1)"), cumulative = FALSE)
## trueFsm1 <- data.frame(truth = fsm1 - mean(fsm1), sm1 = sm1)
## plot(m, labels = "sm(sm1)", ggElems = list(geom_line(aes(x = sm1, y = truth),
##                                                      data = trueFsm1, linetype = 2)))

## ----plotm1sm1Prep, echo=FALSE, cache=TRUE, results='hide', fig.show='hide'----
pSm11 <- plot(m, labels="sm(sm1)",
              ggElems=list(theme(axis.text.x = element_text(size=9),
                                 axis.text.y = element_text(size=9, hjust=1))))
pSm1Sep <-  plot(m, labels=c("lin(sm1)", "sm(sm1)"), cumulative=FALSE,
                 ggElems=list(theme(axis.text.x = element_text(size=9),
                                    axis.text.y = element_text(size=9, hjust=1))),
                 nrow=1, ncol=2) #,
# JSS version only:        ggElems=list(list(ylab("$\\eta$"))))


## ----plotm1sm1, echo=FALSE, fig.width=6, fig.height=2, cache=TRUE, external=TRUE----
trueFsm1 <- data.frame(truth=fsm1-mean(fsm1), sm1=sm1)
pSm1Cum <- pSm11[[1]] + geom_line(data=trueFsm1, aes(x=sm1, y=truth), lty=2)  +
  theme(axis.text.x = element_text(size=9),
        axis.text.y = element_text(size=9, hjust=1))# + ylab("$\\eta$")
gridExtra:::grid.arrange(pSm1Sep[[1]], pSm1Sep[[2]], pSm1Cum, nrow=1)


## ----plotm1sm2fFake, echo=TRUE, eval=FALSE--------------------------
## trueFsm2f <-data.frame(truth = fsm2f - mean(fsm2f), sm2 = sm2, f = f)
## plot(m, labels = "sm(sm2):fct(f)",
##      ggElems = list(geom_line(aes(x = sm2, y = truth, colour = f),
##                               data = trueFsm2f, linetype = 2)))


## ----plotm1sm2fprep, echo=FALSE, cache=TRUE, results='hide', fig.show='hide'----
trueFsm2f <-data.frame(truth=fsm2f-mean(fsm2f), sm2=sm2, f=f)
#JSS only: plot(m, labels="sm(sm2):fct(f)", ggElems=list(list(ylab("$\\eta$")), geom_line(aes(x=sm2, y=truth, colour=f), data=trueFsm2f, linetype=2)))
pl2 <- plot(m, labels="sm(sm2):fct(f)",
            ggElems=list(geom_line(aes(x=sm2, y=truth, colour=f), data=trueFsm2f,
                                   linetype=2)))


## ----plotm1sm2f, echo=FALSE, fig.width=6, fig.height=3, cache=TRUE, external=TRUE----
pl2[[1]]


## ----pimaDataPrep, echo=TRUE----------------------------------------
data("PimaIndiansDiabetes2", package = "mlbench")
pimaDiab <- na.omit(PimaIndiansDiabetes2[, -c(4, 5)])
pimaDiab <- within(pimaDiab,{
  diabetes <- 1*(diabetes == "pos")
})
set.seed(1109712439)
testInd <- sample(1:nrow(pimaDiab), 200)
pimaDiabTrain <- pimaDiab[-testInd,]


## ----pimaM0, echo=TRUE, cache=TRUE, results='hide'------------------
mcmc <- list(nChains = 8, chainLength = 1000, burnin = 500, thin = 5)
m0 <- spikeSlabGAM(
  diabetes ~ pregnant + glucose + pressure + mass + pedigree + age,
  family = "binomial", data = pimaDiabTrain, mcmc = mcmc)


## ----pimaM0Summary, echo=TRUE---------------------------------------
pr0 <- predict(m0, newdata = pimaDiab[testInd,])
print(summary(m0), printModels = FALSE)


## ----pimaB0, echo=TRUE, cache=TRUE, results='hide'------------------
b <- gamboost(
  as.factor(diabetes) ~ pregnant + glucose + pressure + mass + pedigree + age,
  family = Binomial(), data = pimaDiabTrain)[300]
aic <- AIC(b, method = "classical")
prB <- predict(b[mstop(aic)], newdata = pimaDiab[testInd,])


## ----pimaB0Sum, echo=TRUE-------------------------------------------
summary(b[mstop(aic)])$selprob


## ----pimaM0Pred-----------------------------------------------------
dev <- function(y, p){
  -2*sum(dbinom(x = y, size = 1, prob = p, log = T))
}
c(spikeSlabGAM = dev(pimaDiab[testInd, "diabetes"], pr0),
  gamboost   = dev(pimaDiab[testInd, "diabetes"], plogis(prB)))


## ----pimaM1, echo=TRUE, cache=TRUE, results='hide'------------------
hyper1 <- list(gamma = c(v0 = 0.005))
m1 <- spikeSlabGAM(
  diabetes ~ pregnant + glucose + pressure + mass + pedigree + age,
  family = "binomial", data = pimaDiabTrain, mcmc = mcmc,
  hyperparameters = hyper1)
pr1 <- predict(m1, newdata = pimaDiab[testInd, ])


## ----pimaM1Sum, echo=T----------------------------------------------
print(summary(m1), printModels = FALSE)
(dev(pimaDiab[testInd, "diabetes"], pr1))


## ----sessionInfo----------------------------------------------------
sessionInfo()

Any scripts or data that you put into this service are public.

spikeSlabGAM documentation built on June 10, 2022, 5:10 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

spikeSlabGAM
Bayesian Variable Selection and Model Choice for Generalized Additive Mixed Models

vignettes/UsingSpikeSlabGAM.R
In spikeSlabGAM: Bayesian Variable Selection and Model Choice for Generalized Additive Mixed Models

Try the spikeSlabGAM package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

spikeSlabGAM Bayesian Variable Selection and Model Choice for Generalized Additive Mixed Models

vignettes/UsingSpikeSlabGAM.R In spikeSlabGAM: Bayesian Variable Selection and Model Choice for Generalized Additive Mixed Models

Try the spikeSlabGAM package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

spikeSlabGAM
Bayesian Variable Selection and Model Choice for Generalized Additive Mixed Models

vignettes/UsingSpikeSlabGAM.R
In spikeSlabGAM: Bayesian Variable Selection and Model Choice for Generalized Additive Mixed Models