In bips-hb/DataTrainCausalLearning: Practicals for the Data Train Course "Causal learning" 2021 (V Didelez)

# Global knitr chunk defaults applied to every chunk of this practical.
knitr::opts_chunk$set(
  fig.width = 6,    # figure width passed to knitr
  collapse = TRUE,  # merge source and output into one block
  eval = TRUE,      # run the code in each chunk
  echo = TRUE       # show the code in the rendered document
)

Make use of the DAGitty package

Enter the following DAG into R: dagitty.net/ms0VVMy

library(dagitty)

# Specify the DAG in dagitty syntax: `current.smoking` is marked as the
# exposure and `ESRD` as the outcome; every `a -> b` line is a directed edge.
g <- dagitty("dag {
              ESRD [outcome]
              current.smoking [exposure]
              baseline.covariates -> earlier.smoking
              baseline.covariates -> prior.disease
              baseline.covariates -> ESRD
              current.smoking -> ESRD
              earlier.smoking -> current.smoking
              earlier.smoking -> prior.disease
              prior.disease -> current.smoking
              prior.disease -> ESRD
              }")

# Lay the graph out first, then draw it.
g_layout <- graphLayout(g)
plot(g_layout)

Making 'earlier smoking' unobserved

# Work on a copy so that the fully observed graph `g` stays available, then
# declare `earlier.smoking` as a latent (unobserved) variable in the copy.
g.unob <- g
latents(g.unob) <- "earlier.smoking"

List adjustment sets

# Minimal adjustment sets for the total effect of the exposure on the outcome,
# first for the fully observed graph ...
print(adjustmentSets(x = g, effect = "total", type = "minimal"))
# ... and then for the graph in which `earlier.smoking` is latent.
print(adjustmentSets(x = g.unob, effect = "total", type = "minimal"))

List testable implications

# Print the conditional independencies implied by each graph: the fully
# observed one first, then the one with `earlier.smoking` latent.
for (graph in list(g, g.unob)) {
  print(impliedConditionalIndependencies(graph))
}

List total effects that are identifiable by regression

# For every ordered pair (node, proper descendant) in the graph with the latent
# variable, report the adjustment sets found for that pair, if there are any.
for (from_node in names(g.unob)) {
  # descendants() includes the node itself, so drop it.
  proper_descendants <- setdiff(
    dagitty::descendants(g.unob, from_node),
    from_node
  )
  for (to_node in proper_descendants) {
    sets <- adjustmentSets(g.unob, from_node, to_node)
    if (length(sets) == 0) {
      # No adjustment set was returned for this pair: nothing to report.
      next
    }
    cat("The total effect of ", from_node, " on ", to_node,
        " is identifiable controlling for:\n", sep = "")
    print(sets, prefix = " * ")
  }
}

List all back-door paths

## show all paths between exposure and outcome (causal and back-door alike)
(pfad <- paths(g.unob, from = "current.smoking", to = "ESRD"))

# A back-door path is a path whose first edge points INTO the exposure.
# The list above also contains the causal path `current.smoking -> ESRD`,
# so counting `pfad$open` directly would overstate the number of open
# back-door paths.
# NOTE(review): assumes dagitty renders each path as "node edge node ..."
# separated by single spaces, so the second token is the first edge -- confirm.
# Node names in this graph contain no spaces.
first_edge <- vapply(
  strsplit(pfad$paths, " ", fixed = TRUE),
  function(tokens) tokens[2],
  character(1)
)
is_backdoor <- first_edge %in% c("<-", "<->")

## show back-door paths only
pfad$paths[is_backdoor]

# number of open back-door paths
sum(pfad$open[is_backdoor])

Insert new node

# Same DAG as before, extended by a latent node `unknown` that points into both
# `prior.disease` and `ESRD`.
g2 <- dagitty("dag {
              ESRD [outcome]
              current.smoking [exposure]
              unknown [latent]
              baseline.covariates -> earlier.smoking
              baseline.covariates -> prior.disease
              baseline.covariates -> ESRD
              current.smoking -> ESRD
              earlier.smoking -> current.smoking
              earlier.smoking -> prior.disease
              prior.disease -> current.smoking
              prior.disease -> ESRD
              prior.disease <- unknown -> ESRD
              }")

# Lay the extended graph out, then draw it.
g2_layout <- graphLayout(g2)
plot(g2_layout)

# Adjustment sets for the exposure/outcome pair declared inside the graph.
print(adjustmentSets(g2))

Simulated data examples

library(gRbase)

Example 1

# DAG for Example 1, given as gRbase formulas, then plotted.
dag_example1 <- dag(~X1, ~L, ~X2 * X1 * L, ~Y * L)
plot(dag_example1)

# Example 1: simulate N observations and compare three regressions of y.
N <- 1000

# x1: binary, drawn uniformly from {0, 1}.
# (`TRUE` rather than `T`: `T` is an ordinary variable and can be reassigned.)
x1 <- sample(c(1, 0), N, replace = TRUE)

# l: normal with mean 1 and standard deviation 2.
l <- rnorm(N, 1, 2)

# x2: binary, with a logistic success probability driven by x1 * l.
p <- 1 / (1 + exp(-1.5 * x1 * l + 2))
x2 <- rbinom(N, 1, p)

# y depends on l only, plus normal noise with mean 2 (sd 1 by default);
# neither x1 nor x2 enters its equation.
y <- 0.5 * l + rnorm(N, 2)

# Coefficient tables: x1 alone, then adding x2, then also adding l.
summary(lm(y ~ x1))$coefficients

summary(lm(y ~ x1 + x2))$coefficients

summary(lm(y ~ x1 + x2 + l))$coefficients

Example 2

# DAG for Example 2, given as gRbase formulas, then plotted.
dag_example2 <- dag(~X1, ~U, ~L * X1 * U, ~X2 * X1 * L, ~Y * L * U * X1 * X2)
plot(dag_example2)

# Example 2: simulate N observations in which u enters both l and y.
N <- 1000

# x1: binary, drawn uniformly from {0, 1}.
# (`TRUE` rather than `T`: `T` is an ordinary variable and can be reassigned.)
x1 <- sample(c(1, 0), N, replace = TRUE)

# u: normal with mean 2 (sd 1 by default); it is left out of every regression
# below.
u <- rnorm(N, 2)

# l depends on x1 and u, plus normal noise with mean 1 and sd 2.
l <- 2 * x1 - u + rnorm(N, 1, 2)

# x2: binary, with a logistic success probability driven by x1 and l.
p <- 1 / (1 + exp(-3 * x1 + l))
x2 <- rbinom(N, 1, p)

# y: sum of u, x1, l and x2 plus standard normal noise.
y <- u + x1 + l + x2 + rnorm(N)

# Coefficient tables without and with l as a covariate.
summary(lm(y ~ x1 + x2))$coefficients

summary(lm(y ~ x1 + x2 + l))$coefficients

Randomising $X_2$

# Replace x2 by a draw that does not depend on x1 or l (uniform on {0, 1}).
# (`TRUE` rather than `T`: `T` is an ordinary variable and can be reassigned.)
x2_new <- sample(c(1, 0), N, replace = TRUE)

# Regenerate the outcome with the same u, x1 and l but the randomised x2.
y_new <- u + x1 + l + x2_new + rnorm(N)

# Coefficient table for the regression on x1 and the randomised x2.
summary(lm(y_new ~ x1 + x2_new))$coefficients

Inverse probability weights

# Logistic regression of x2 on x1 and l; its fitted values are the estimated
# probabilities that x2 equals 1.
log_model <- glm(x2 ~ x1 + l, family = binomial(link = "logit"))
p_hat <- predict(log_model, type = "response")

# Estimated probability of the x2 value each unit actually has:
# p_hat where x2 is 1, and 1 - p_hat where x2 is 0.
prob_observed <- x2 * p_hat + (1 - x2) * (1 - p_hat)

# The weight is the inverse of that probability.
w <- prob_observed^(-1)

# Weighted regression of y on x1 and x2.
ipw_fit <- lm(y ~ x1 + x2, weights = w)
summary(ipw_fit)$coefficients

bips-hb/DataTrainCausalLearning documentation built on Dec. 5, 2023, 8:32 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

bips-hb/DataTrainCausalLearning
Practicals for the Data Train Course "Causal learning" 2021 (V Didelez)

In bips-hb/DataTrainCausalLearning: Practicals for the Data Train Course "Causal learning" 2021 (V Didelez)

Make use of the DAGitty package

Making 'earlier smoking' unobserved

List adjustment sets

List testable implications

List total effects that are identifiable by regression

List all back-door paths

Insert new node

Simulated data examples

Example 1

Example 2

Randomising $X_2$

Inverse probability weights

R Package Documentation

Browse R Packages

We want your feedback!

bips-hb/DataTrainCausalLearning Practicals for the Data Train Course "Causal learning" 2021 (V Didelez)

In bips-hb/DataTrainCausalLearning: Practicals for the Data Train Course "Causal learning" 2021 (V Didelez)

Make use of the DAGitty package

Making 'earlier smoking' unobserved

List adjustment sets

List testable implications

List total effects that are identifiable by regression

List all back-door paths

Insert new node

Simulated data examples

Example 1

Example 2

Randomising $X_2$

Inverse probability weights

R Package Documentation

Browse R Packages

We want your feedback!

bips-hb/DataTrainCausalLearning
Practicals for the Data Train Course "Causal learning" 2021 (V Didelez)