## code to prepare `cellhealth_metrics` dataset goes here
## code to prepare `cellhealth` dataset goes here
library(dplyr)
library(readr)
## -----------------------------------------------------------------------------
url <-
"https://github.com/broadinstitute/grit-benchmark/raw/main/1.calculate-metrics/cell-health/data/cell_health_merged_feature_select.csv.gz"
cellhealth <-
read_csv(
url,
col_types = cols(
.default = col_double(),
Metadata_Plate = col_character(),
Metadata_Well = col_character(),
Metadata_WellRow = col_character(),
Metadata_WellCol = col_character(),
Metadata_cell_line = col_character(),
Metadata_gene_name = col_character(),
Metadata_pert_name = col_character()
)
)
## -----------------------------------------------------------------------------
drop_group <-
data.frame(Metadata_gene_name = "EMPTY")
reference <-
data.frame(Metadata_gene_name = c("Chr2"))
all_same_cols_ref <-
c(
"Metadata_cell_line",
"Metadata_Plate"
)
all_same_cols_rep <-
c(
"Metadata_cell_line",
"Metadata_gene_name",
"Metadata_pert_name"
)
all_same_cols_rep_ref <-
c(
"Metadata_cell_line",
"Metadata_gene_name",
"Metadata_pert_name",
"Metadata_Plate"
)
any_different_cols_non_rep <-
c(
"Metadata_cell_line",
"Metadata_gene_name",
"Metadata_pert_name"
)
all_same_cols_non_rep <-
c(
"Metadata_cell_line",
"Metadata_Plate"
)
all_different_cols_non_rep <-
c("Metadata_gene_name")
all_same_cols_group <-
c(
"Metadata_cell_line",
"Metadata_gene_name"
)
any_different_cols_group <-
c(
"Metadata_cell_line",
"Metadata_gene_name",
"Metadata_pert_name"
)
annotation_cols <-
c(
"Metadata_cell_line",
"Metadata_gene_name",
"Metadata_pert_name"
)
## -----------------------------------------------------------------------------
sim_df <- matric::sim_calculate(cellhealth, method = "cosine")
collated_sim <-
matric::sim_collate(
sim_df,
reference = reference,
all_same_cols_rep = all_same_cols_rep,
all_same_cols_rep_ref = all_same_cols_rep_ref,
all_same_cols_ref = all_same_cols_ref,
any_different_cols_non_rep = any_different_cols_non_rep,
all_same_cols_non_rep = all_same_cols_non_rep,
all_different_cols_non_rep = all_different_cols_non_rep,
any_different_cols_group = any_different_cols_group,
all_same_cols_group = all_same_cols_group,
annotation_cols = annotation_cols,
drop_group = drop_group
)
index <- matric::sim_calculate(cellhealth, method = "cosine", lazy = TRUE)
# collated_sim_lazy <-
# matric::sim_collate(
# index,
# reference = reference,
# all_same_cols_rep = all_same_cols_rep,
# all_same_cols_rep_ref = all_same_cols_rep_ref,
# all_same_cols_ref = all_same_cols_ref,
# any_different_cols_non_rep = any_different_cols_non_rep,
# all_same_cols_non_rep = all_same_cols_non_rep,
# all_different_cols_non_rep = all_different_cols_non_rep,
# any_different_cols_group = any_different_cols_group,
# all_same_cols_group = all_same_cols_group,
# annotation_cols = annotation_cols,
# drop_group = drop_group
# )
#
# doParallel::registerDoParallel(cores = 8)
#
# collated_sim_lazy <- sim_calculate_ij(population = cellhealth,
# index = collated_sim_lazy,
# cores = 8)
## -----------------------------------------------------------------------------
cellhealthmetrics <-
matric::sim_metrics(collated_sim, "ref", calculate_grouped = TRUE)
usethis::use_data(cellhealthmetrics, overwrite = TRUE)
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.