# inst/data-raw/process/PMID27813705_Moin-2016/process.R

library(rvest)

# Import and extraction ----
# Scrape table T1 of PMC5413103 from the web, pull the ID and Ki67.PDG.prct
# columns for the two groups (`t1d` and `controls`), stack them, convert both
# columns to numeric and write the result as a tab-separated file.
tab1_url <- "https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5413103/table/T1/"
page_tables <- html_table(read_html(tab1_url))

# The table of interest is the second one parsed from the page.
stopifnot(length(page_tables) >= 2L)
tab1 <- page_tables[[2]]

# Out-of-range row indices on a data frame silently yield all-NA rows, so fail
# early if the scraped table is smaller than the hard-coded ranges below.
stopifnot(nrow(tab1) >= 25L, ncol(tab1) >= 12L)

# First group: rows 2-23, ID in column 1 and value in column 7.
# NOTE(review): row 1 is presumably a secondary header row -- confirm against
# the published table.
t1d <- tab1[2:23, c(1, 7)]
names(t1d) <- c("ID", "Ki67.PDG.prct")

# Second group: rows 2-25, ID in column 8 and value in column 12.
controls <- tab1[2:25, c(8, 12)]
names(controls) <- c("ID", "Ki67.PDG.prct")

dataset <- rbind(t1d, controls)

# Keep only the digits of each ID (drops footnote marks or other decoration).
dataset$ID <- gsub("[^0-9]", "", dataset$ID)

# Convert column by column. apply() would first coerce the data frame to a
# character matrix (formatting any numeric column to 7 significant digits) and
# return a matrix; lapply() keeps a data frame and full precision.
# Entries that are not valid numbers become NA (with a coercion warning).
dataset[] <- lapply(dataset, as.numeric)

write.table(
  dataset,
  "PMID27813705_1_Moin-2016.tsv",
  sep = "\t",
  row.names = FALSE,
  quote = FALSE
)
# avucoh/nPOD documentation built on April 1, 2020, 5:24 p.m.