R/feather_file_creator-tcga_build_driver_results_files.R

Defines functions tcag_build_driver_results_files

tcag_build_driver_results_files <- function() {

  # Builds the TCGA driver results table from three Synapse inputs and stores
  # it on Synapse as "driver_results.feather" under "syn22126168".
  # Takes no arguments; the value of the store call is returned.
  # NOTE(review): the function name is spelled "tcag" while the file name says
  # "tcga"; the name is left unchanged so existing callers keep working.

  # Reads the inputs and returns the assembled driver results table.
  assemble_driver_results <- function() {

    # Gene lookup. It is only used as an inner-join key on "hgnc" below, so
    # rows whose hgnc is absent from this table are dropped.
    gene_lookup <- dplyr::select(
      synapse_read_all_feather_files("syn22125640"),
      "hgnc",
      "entrez"
    )

    # Mapping from old tag names to new tag names; incomplete rows are removed.
    tag_lookup <- tidyr::drop_na(
      dplyr::select(
        iatlas.data::synapse_feather_id_to_tbl("syn23545011"),
        "tag" = "old_name",
        "new_tag" = "name"
      )
    )

    # Raw driver results, restricted and renamed to the columns used here.
    raw_results <- dplyr::select(
      synapse_rds_id_tbl("syn22126068"),
      "label",
      "feature" = "metric",
      "tag" = "group2",
      "fold_change",
      "log10_p_value" = "log10_pvalue",
      "log10_fold_change",
      "p_value" = "pvalue",
      "n_wt",
      "n_mut"
    )

    # Derive "hgnc" and "mutation_code" from the label.
    # NOTE(review): presumably driver_results_label_to_hgnc() yields either
    # "<hgnc>" or "<hgnc> <code>" -- confirm against iatlas.data.
    split_labels <- raw_results %>%
      dplyr::mutate(
        gene_mutation = iatlas.data::driver_results_label_to_hgnc(.data$label)
      ) %>%
      tidyr::separate(
        col = "gene_mutation",
        into = c("hgnc", "mutation_code"),
        sep = "\\s",
        remove = TRUE
      )

    # A missing mutation code becomes "(NS)" before the "hgnc:code" mutation
    # name is built; dots in feature names are replaced by underscores.
    with_mutation <- split_labels %>%
      dplyr::mutate(
        "mutation_code" = ifelse(
          is.na(.data$mutation_code),
          "(NS)",
          .data$mutation_code
        )
      ) %>%
      dplyr::mutate(
        "mutation" = stringr::str_c(.data$hgnc, ":", .data$mutation_code),
        "feature" = stringr::str_replace_all(.data$feature, "[\\.]", "_"),
        "dataset" = "TCGA"
      )

    # Keep rows whose gene is in the lookup, drop the helper columns, put the
    # identifying columns first and remove duplicate rows.
    gene_filtered <- with_mutation %>%
      dplyr::inner_join(gene_lookup, by = "hgnc") %>%
      dplyr::select(-c("hgnc", "label", "entrez",  "mutation_code")) %>%
      dplyr::select(
        "mutation",
        "feature",
        "tag",
        "dataset",
        dplyr::everything()
      ) %>%
      dplyr::distinct()

    # Swap the old tag name for the new one; rows without a mapping are
    # dropped by the inner join.
    gene_filtered %>%
      dplyr::inner_join(tag_lookup, by = "tag") %>%
      dplyr::select(-"tag") %>%
      dplyr::rename("tag" = "new_tag")
  }

  iatlas.data::synapse_store_feather_file(
    assemble_driver_results(),
    "driver_results.feather",
    "syn22126168"
  )

}
CRI-iAtlas/iatlas-feather-files documentation built on Sept. 1, 2021, 6:57 p.m.