inst/scripts/ontomap_update.R

## read in
onto <- readr::read_tsv("inst/extdata/ontomap.tsv")

## modification
onto <- as.data.frame(onto)
onto[onto$DataType == "macrophage_differentiation_protein", "DataType"] <-
    "macrophage_differentiation"

## output checking
stopifnot(
    identical(length(unique(onto[["DataType"]])), 4L)
)

## writing
write.table(
    x = onto, file = "inst/extdata/ontomap.tsv",
    quote = FALSE, sep = "\t", row.names = FALSE
)

## reading ontology terms from kelly ontomap based on an ontomap old version
cellontokelly <- as.data.frame(
    readr::read_tsv("~/Downloads/Cell type ontology - Sheet2.tsv")
)
onto <- as.data.frame(
    readr::read_tsv("inst/extdata/ontomap.tsv")
)

## removing repetitive rows for seqFISH/scRNAseq celltypes
## aligning with newer version of ontomap
cellontokelly <-
    cellontokelly[!cellontokelly$dataset_name=="mouse_visual_cortex_scRNAseq",]
ontokey <- paste0(onto$DataType,"_",onto$function_name)
ontokey <-
    gsub("SCoPE2", "protein_SCoPE2", gsub("scMultiome", "multiome", ontokey))
ontokey <- paste0(ontokey, "_", onto$original_cell_name)
kellykey <-
    paste0(cellontokelly$dataset_name, "_", cellontokelly$original_cell_name)
## reordering
cellontokelly <- cellontokelly[match(ontokey, kellykey),]

onto$ontology_ID <- cellontokelly$ontology_ID
onto$ontology_cell_name <- cellontokelly$ontology_cell_name

## writing
write.table(
    x = onto, file = "inst/extdata/ontomap.tsv",
    quote = FALSE, sep = "\t", row.names = FALSE
)


## adding celltypes for cord_blood citeseq
## 
load("cord_blood/v1.0.0/coldata_scRNAseq.rda")
cd <- coldata_scRNAseq
ct <- unique(cd$celltype)
ct <- ct[-which(is.na(ct))]

onto <- as.data.frame(
    readr::read_tsv("inst/extdata/ontomap.tsv")
)

cn <- colnames(onto)
ctcb <- data.frame("cord_blood", "CITEseq", "celltype", ct, NA, NA)
colnames(ctcb) <- cn
onton <- rbind.data.frame(onto, ctcb) 
write.table(
    x = onton, file = "inst/extdata/ontomap.tsv",
    quote = FALSE, sep = "\t", row.names = FALSE
)
waldronlab/SingleCellMultiModal documentation built on May 1, 2024, 5:29 a.m.