## code to prepare `ptk_annotation` dataset goes here
library(tidyverse)
library(devtools)
# Loading Annotation ------------------------------------------------------
annotation <-
read_csv(
"data-raw/data/RegPhos_Annotation_human.csv",
col_types = cols(.default = col_character())
) |>
mutate(
Kinase = str_to_upper(Kinase),
Group = str_to_upper(Group),
Family = str_to_upper(Family),
Subfamily = str_to_upper(Subfamily),
Gene_Symbol = str_to_upper(Gene_Symbol)
)
non_human <- c("CK2A1-RS", "SGK424", "STLK6-RS")
annotation_clean <- annotation |>
select(Kinase, Group, Family, Subfamily, Gene_Symbol) |>
filter(!Kinase %in% non_human) |>
mutate(Gene_Symbol = if_else(is.na(Gene_Symbol), Kinase, Gene_Symbol))
# Processing UKA Mapping --------------------------------------------------
uka_map <-
read_csv("data-raw/data/uka_pep2kinase_PTK.csv",
col_types = cols(.default = col_character())) |>
select(ID, Kinase_UniprotName) |>
rename(Kinase = Kinase_UniprotName) |>
filter(!is.na(Kinase)) |>
unique()
uka_matched_by_kinase <- uka_map |>
left_join(annotation_clean, by = "Kinase") |>
filter(!is.na(Family), !is.na(Group))
uka_matched_by_family <- uka_map |>
rename(Family = Kinase) |>
left_join(annotation_clean, by = "Family") |>
filter(!is.na(Kinase), !is.na(Group))
uka_matched_by_subfamily <- uka_map |>
rename(Subfamily = Kinase) |>
left_join(annotation_clean, by = "Subfamily") |>
filter(!is.na(Kinase), !is.na(Group), !is.na(Family))
uka_matched_by_gene <- uka_map |>
rename(Gene_Symbol = Kinase) |>
left_join(annotation_clean, by = "Gene_Symbol") |>
filter(!is.na(Kinase), !is.na(Group), !is.na(Family))
# Processing KRSA Mapping -------------------------------------------------
krsa_map <-
read_tsv("data-raw/data/KRSA_Mapping_PTK_sep.tsv",
col_types = cols(.default = col_character())) |>
select(-db) |>
rename(Family = Kinases)
krsa_matched_by_family <- krsa_map |>
left_join(annotation_clean, by = "Family") |>
filter(!is.na(Kinase), !is.na(Group))
krsa_matched_by_kinase <- krsa_map |>
rename(Kinase = Family) |>
left_join(annotation_clean, by = "Kinase") |>
filter(!is.na(Family), !is.na(Group))
krsa_matched_by_subfamily <- krsa_map |>
rename(Subfamily = Family) |>
left_join(annotation_clean, by = "Subfamily") |>
filter(!is.na(Kinase), !is.na(Group), !is.na(Family))
krsa_matched_by_gene <- krsa_map |>
rename(Gene_Symbol = Family) |>
left_join(annotation_clean, by = "Gene_Symbol") |>
filter(!is.na(Kinase), !is.na(Group), !is.na(Family))
# Putting it all together -------------------------------------------------
ptk_annotation <- bind_rows(
krsa_matched_by_family,
krsa_matched_by_kinase,
krsa_matched_by_subfamily,
krsa_matched_by_gene,
uka_matched_by_family,
uka_matched_by_gene,
uka_matched_by_kinase,
uka_matched_by_subfamily
) |>
select(ID, Group, Family, Subfamily, Kinase, Gene_Symbol) |>
filter(!is.na(ID)) |>
unique() |>
write_csv("data-raw/data/PTK_Annotation.csv")
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.