inst/scripts/synthetic_benchmark/resources/method_definitions/pareg_network_cv.R

# prepare environment
source(snakemake@params$setup_code_fname)

devtools::load_all("../..")

# run model
future::plan(future::multisession, workers = snakemake@threads)
fit <- pareg::pareg(
  study$df %>% select(gene, pvalue),
  df_terms,
  term_network = term_similarities_sub,
  cv = TRUE
)
future::plan(future::sequential) # shut down workers

df <- fit %>%
  as.data.frame() %>%
  mutate(method = "pareg_network_cv", enrichment = abs(enrichment))

df %>%
  arrange(desc(abs(enrichment))) %>%
  head()

# misc
fname_model <- file.path(dirname(snakemake@output$fname), "model")
fit$obj$fit$model$save(fname_model)
fit$obj$model <- fname_model
saveRDS(fit, file.path(dirname(snakemake@output$fname), "fit.rds"))

df_loss <- do.call(rbind, fit$obj$fit$loss_hist) %>%
  as_tibble() %>%
  unnest(everything()) %>%
  mutate(iteration = seq_along(fit$obj$fit$loss_hist))
df_loss %>%
  write_csv(file.path(dirname(snakemake@output$fname), "loss.csv"))

df_loss %>%
  pivot_longer(-iteration) %>%
  ggplot(aes(x = iteration, y = value, color = name)) +
    geom_line() +
    # geom_point() +
    theme_minimal()
ggsave(
  file.path(dirname(snakemake@output$fname), "loss.pdf"),
  width = 8,
  height = 6
)

ggplot(fit$obj$loss_grid, aes(x = lambda, y = psigx, fill = loss)) +
  geom_tile() +
  geom_text(aes(label = round(loss, 2)), color = "white", size = 1) +
  theme_minimal()
ggsave(
  file.path(dirname(snakemake@output$fname), "loss_grid.pdf"),
  width = 8,
  height = 6
)

data.frame(
  pseudo_r_squared = fit$obj$fit$pseudo_r_squared,
  mse = fit$obj$fit$mse
) %>%
  write_csv(file.path(dirname(snakemake@output$fname), "extra_stats.csv"))

# save result
df %>%
  write_csv(snakemake@output$fname)
cbg-ethz/pareg documentation built on July 20, 2023, 7:30 p.m.