inst/extdata/BelderbosME_etal/preprocessing.R

#download the raw data from https://www.bbmt.org/article/S1083-8791(19)30566-X/fulltext#supplementaryMaterial

require(dplyr)
require(magrittr)

raw_belderbos_data <- readxl::read_excel("inst/sample_data/BelderbosME_etal/belderbosME_raw_data.xlsx", sheet = "C21")
colnames(raw_belderbos_data) <- gsub("BM", "sac_BM_", colnames(raw_belderbos_data))
colnames(raw_belderbos_data) <- gsub("Spleen", "sac_Spleen", colnames(raw_belderbos_data))
colnames(raw_belderbos_data) <- gsub("Liver", "sac_Liver", colnames(raw_belderbos_data))
raw_belderbos_data <- raw_belderbos_data[,!grepl("_sum", colnames(raw_belderbos_data))]
colnames(raw_belderbos_data) <- gsub("unsorted", "U", colnames(raw_belderbos_data))
colnames(raw_belderbos_data)[c(2:4, 29, 30)] <- paste0(colnames(raw_belderbos_data)[c(2:4, 29,30)], "_U")

raw_belderbos_data <- as.data.frame(raw_belderbos_data)
rownames(raw_belderbos_data) <- raw_belderbos_data$ID
raw_belderbos_data$ID <- NULL
raw_belderbos_data <- raw_belderbos_data[,colSums(raw_belderbos_data) > 100]

belderbos_metadata <- data.frame(SAMPLENAME = colnames(raw_belderbos_data),
                                 weeks = c(9,14,20,22,22,22,rep("sac", 17)),
                                 celltype = c(rep("bulk", 4), "B", "T", "bulk",
                                              "B", "T", "B", "T", "G", "bulk",
                                              "B", "T", "G", "bulk", "B", "T", "G",
                                              "bulk", "B", "bulk"),
                                 organ = c(rep("PB", 6), rep("BM_Front", 3),
                                           rep("BM_Left", 3), rep("BM_Right", 4),
                                           rep("BM_Spine", 4), rep("BM_Pelvis",2), "Spleen"))

write.table(file = "inst/sample_data/BelderbosME_etal/count_matrix_mouse_C21.txt", raw_belderbos_data,
            sep = '\t', quote = FALSE, row.names = TRUE, col.names = NA)

write.table(file = "inst/sample_data/BelderbosME_etal/metadata_mouse_C21.txt", belderbos_metadata,
            sep = '\t', quote = FALSE, row.names = FALSE)
d93espinoza/barcodetrackR documentation built on April 28, 2021, 1:58 p.m.