intro-to-penppml.R
In penppml: Penalized Poisson Pseudo Maximum Likelihood Regression

## ---- include = FALSE---------------------------------------------------------
knitr::opts_chunk$set(
  collapse = TRUE,
  comment = "#>"
)

## ----setup 1, eval = FALSE----------------------------------------------------
#  install.packages("penppml")

## ---- eval=FALSE--------------------------------------------------------------
#  library(penppml)

## ---- hide=TRUE, eval=FALSE---------------------------------------------------
#  devtools::load_all()

## ----filter trade data, eval=FALSE--------------------------------------------
#  selected <- countries$iso[countries$region %in% c("Americas")]
#  trade2 <- trade[(trade$exp %in% selected) & (trade$imp %in% selected), -(5:6)] # We remove columns 5 and
#  # 6 because these variables are not needed in our regressions.

## ----try hdfeppml, eval=FALSE-------------------------------------------------
#  reg1 <- hdfeppml(data = trade2,
#                   dep = "export",
#                   fixed = list(c("exp", "time"),
#                                c("imp", "time"),
#                                c("exp", "imp")))

## ----hdfeppml results, results = FALSE, eval=FALSE----------------------------
#  results <- data.frame(prov = rownames(reg1$coefficients), b = reg1$coefficients, se = 0)
#  results$se[!is.na(reg1$coefficients)] <- reg1$se
#  results

## ----try hdfeppml2, eval=FALSE------------------------------------------------
#  reg1_indep <- hdfeppml(data = trade2, indep=5:7,
#                   dep = "export",
#                   fixed = list(c("exp", "time"),
#                                c("imp", "time"),
#                                c("exp", "imp")))

## ----try mlfitpenppml lasso, results = FALSE, eval=FALSE----------------------
#  lambdas <- c(0.05, 0.025, 0.01, 0.0075, 0.005, 0.0025, 0.001, 0.00075, 0.0005, 0.00025, 0.0001, 0)
#  
#  reg2 <- mlfitppml(data = trade2,
#                    dep = "export",
#                    fixed = list(c("exp", "time"),
#                                c("imp", "time"),
#                                c("exp", "imp")),
#                    penalty = "lasso",
#                    lambdas = lambdas)

## ----try penhdfeppml, results = FALSE, eval=FALSE-----------------------------
#  reg3 <- penhdfeppml(data = trade2,
#                    dep = "export",
#                    fixed = list(c("exp", "time"),
#                                c("imp", "time"),
#                                c("exp", "imp")),
#                    penalty = "lasso",
#                    lambda = 0.005)

## ----try mlfitpenppml ridge, results = FALSE, eval=FALSE----------------------
#  lambdas <- seq(0.0001, 0, length.out = 10)
#  
#  reg4 <- mlfitppml(data = trade2,
#                    dep = "export",
#                    fixed = list(c("exp", "time"),
#                                c("imp", "time"),
#                                c("exp", "imp")),
#                    penalty = "ridge",
#                    lambdas = lambdas)

## ----split data set by agreement, eval = FALSE--------------------------------
#  id <- unique(trade[(trade$exp %in% selected) & (trade$imp %in% selected), 5])
#  nfolds <- 20
#  unique_ids <- data.frame(id = id, fold = sample(1:nfolds, size = length(id), replace = TRUE))
#  
#  cross_ids <- merge(trade[(trade$exp %in% selected) & (trade$imp %in% selected), 5, drop = FALSE],
#                     unique_ids, by = "id", all.x = TRUE)

## ----try cross validation, eval = FALSE---------------------------------------
#  reg5 <- mlfitppml(data = trade2,
#                    dep = "export",
#                    fixed = list(c("exp", "time"),
#                                c("imp", "time"),
#                                c("exp", "imp")),
#                    penalty = "lasso",
#                    lambdas = c(seq(0.5, 0.1, by = -0.1), 0.05, 0.01, 0.005, 0.001, 0.0005, 0.0001, 0),
#                    xval = TRUE,
#                    IDs =  cross_ids$fold)

## ----xval results, eval = FALSE-----------------------------------------------
#  reg5$rmse

## ----try plugin lasso, results = FALSE, eval=FALSE----------------------------
#  reg6 <- mlfitppml(data = trade2,
#                    dep = "export",
#                    fixed = list(c("exp", "time"),
#                                c("imp", "time"),
#                                c("exp", "imp")),
#                    penalty = "lasso",
#                    method = "plugin",
#                    cluster = c("exp", "imp"))

## ----plugin results, results = FALSE, eval=FALSE------------------------------
#  results <- data.frame(prov = rownames(reg6$beta), b_pre = reg6$beta_pre, b = reg6$beta, se = 0)
#  results$se <- reg6$ses[1,]
#  results

## ----try plugin lasso gamma, results = FALSE, eval=FALSE----------------------
#  reg6_gamma <- mlfitppml(data = trade2,
#                    dep = "export",
#                    fixed = list(c("exp", "time"),
#                                c("imp", "time"),
#                                c("exp", "imp")),
#                    penalty = "lasso",
#                    method = "plugin",
#                    cluster = c("exp", "imp"), gamma_val=0.3)
#  rownames(reg6$beta)[which(reg6_gamma$beta != 0)]

## ----plugin results gamma, results = FALSE, eval=FALSE------------------------
#  results_gamma <- data.frame(prov = rownames(reg6_gamma$beta), b_pre = reg6_gamma$beta_pre, b = reg6_gamma$beta, se = 0)
#  results_gamma$se <- reg6_gamma$ses[1,]
#  results_gamma

## ----try iceberg,  results = FALSE, eval = FALSE------------------------------
#  iceberg_results <- iceberg(data = trade2[, -(1:4)],
#                             dep = results$prov[results$b != 0],
#                             selectobs = (trade2$time == "2016"))

## ----iceberg correlations, results = FALSE, eval = FALSE----------------------
#  provcorr <- cor(trade2[, results$prov])
#  (provcorr <- provcorr[, results$prov[results$b != 0]])

## ---- message=FALSE, warning=FALSE, results=FALSE, eval=FALSE-----------------
#  trade3 <- trade[(trade$exp %in% selected) & (trade$imp %in% selected), ] # Now, we need id and agreement variable
#  # Let's cluster by agreement
#  trade3$alt_id <- trade3$id # ID refers to agreement ID
#  trade3$alt_id[is.na(trade3$alt_id)] <- 0 # We set this to zero when the ID is missing, interpreting this as the country pair not being part of any agreement.
#  
#  # Create pair ID
#  v1 <- do.call(paste, as.data.frame(t(apply(trade3[1:2], 1, sort))))
#  trade3$pair <-  match(v1, unique(v1))
#  trade3$pair <- trade3$pair + 500
#  
#  
#  # Create maximal ID from the preexisting ID-variable inside each pair
#  trade3 <- within(trade3, {alt_id2 = ave(alt_id,pair,FUN=max)} ) # This creates the maximum of the ID for each pair. This adjusts for the fact that some pairs might have been part of different agreements and we want to take get a unique agreement ID for each pair.
#  
#  trade3$alt_id2[trade3$alt_id2==0] <- trade3$pair[trade3$alt_id2==0]
#  unique(trade3$alt_id2) # This cluster variable collects pairs for pairs that are in agreement, uses the pair ID for those that are not.
#  # Thus, it allows errors to be clustered within agreements.
#  alt_id2 <- factor(trade3$alt_id2)
#  trade3$clus <- alt_id2 #Add the ID to the data

## ----try bootstrap lasso, warning=FALSE, message=FALSE, results = FALSE, eval=FALSE----
#  set.seed(123)
#  bs1 <- bootstrap(data=trade3, dep="export", cluster_id="clus", fixed=list(c("exp", "time"), c("imp", "time"), c("exp", "imp")), indep=7:22, bootreps=10, colcheck_x = TRUE, colcheck_x_fes = TRUE, boot_threshold = 0.01, post=TRUE, gamma_val=0.01, verbose=FALSE)

Any scripts or data that you put into this service are public.

penppml documentation built on Sept. 8, 2023, 5:58 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

penppml
Penalized Poisson Pseudo Maximum Likelihood Regression

inst/doc/intro-to-penppml.R
In penppml: Penalized Poisson Pseudo Maximum Likelihood Regression

Try the penppml package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

penppml Penalized Poisson Pseudo Maximum Likelihood Regression

inst/doc/intro-to-penppml.R In penppml: Penalized Poisson Pseudo Maximum Likelihood Regression

Try the penppml package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

penppml
Penalized Poisson Pseudo Maximum Likelihood Regression

inst/doc/intro-to-penppml.R
In penppml: Penalized Poisson Pseudo Maximum Likelihood Regression