# data-raw/DataComputing.R

library(Rd2roxygen)
library(tidyverse)

# MedicareProviders
# Fetch the upstream .rda directly into data/, then print the upstream Rd
# help page, converted to roxygen comments, to the console.
download.file(
  url = "https://github.com/DataComputing/DataComputing/raw/master/data/MedicareProviders.rda",
  destfile = "data/MedicareProviders.rda"
)
providers_rd <- parse_file("https://raw.githubusercontent.com/DataComputing/DataComputing/master/man/MedicareProviders.Rd")
providers_roxygen <- create_roxygen(providers_rd)
cat(providers_roxygen, sep = "\n")

# MedicareCharges
# The raw file is kept under data-raw/ because the packaged version is the
# aggregated table built below, not the upstream object.
download.file(
  url = "https://github.com/DataComputing/DataComputing/raw/master/data/MedicareCharges.rda",
  destfile = "data-raw/MedicareCharges.RData"
)
load(file = "data-raw/MedicareCharges.RData")

# Attach provider details to every charge record (matched on idProvider),
# then collapse to one row per (drg, stateProvider) combination.
charges_with_provider <- inner_join(
  MedicareCharges,
  mdsr::MedicareProviders,
  by = "idProvider"
)
charges_by_drg_state <- group_by(charges_with_provider, drg, stateProvider)
MedicareCharges <- ungroup(
  summarize(
    charges_by_drg_state,
    num_charges = n(),
    mean_charge = mean(aveCharges, na.rm = TRUE)
  )
)
usethis::use_data(MedicareCharges, overwrite = TRUE)

# Print the upstream Rd help page as roxygen comments.
charges_rd <- parse_file("https://raw.githubusercontent.com/DataComputing/DataComputing/master/man/MedicareCharges.Rd")
cat(create_roxygen(charges_rd), sep = "\n")

# OrdwayBirds
# Download the upstream data, print its help page as roxygen comments, and
# store a tibble copy under the snake_case name `ordway_birds`.
download.file(
  url = "https://github.com/DataComputing/DataComputing/raw/master/data/OrdwayBirds.rda",
  destfile = "data/OrdwayBirds.rda"
)
ordway_rd <- parse_file("https://raw.githubusercontent.com/DataComputing/DataComputing/master/man/OrdwayBirds.Rd")
cat(create_roxygen(ordway_rd), sep = "\n")
load(file = "data/OrdwayBirds.rda")
ordway_birds <- as_tibble(OrdwayBirds)
usethis::use_data(ordway_birds, overwrite = TRUE)

# Minneapolis2013
# Download the upstream data and print its help page as roxygen comments.
minneapolis_rda <- "data/Minneapolis2013.rda"
download.file(
  url = "https://github.com/DataComputing/DataComputing/raw/master/data/Minneapolis2013.rda",
  destfile = minneapolis_rda
)
minneapolis_rd <- parse_file("https://raw.githubusercontent.com/DataComputing/DataComputing/master/man/Minneapolis2013.Rd")
cat(create_roxygen(minneapolis_rd), sep = "\n")
# Round-trip the object through load()/save() so the file on disk is
# rewritten with xz compression.
load(file = minneapolis_rda)
save(Minneapolis2013, file = minneapolis_rda, compress = "xz")

# WorldCities
# Download the upstream data, print its help page as roxygen comments, then
# reduce the city names to plain ASCII before saving as package data.
download.file("https://github.com/DataComputing/DataComputing/raw/master/data/WorldCities.rda", "data/WorldCities.rda")
cat(create_roxygen(parse_file("https://raw.githubusercontent.com/DataComputing/DataComputing/master/man/WorldCities.Rd")), sep = "\n")
load("data/WorldCities.rda")
# showNonASCII() belongs to the tools package, which is not attached by
# default (nor by the library() calls at the top of this script), so it must
# be called with an explicit namespace.
tools::showNonASCII(WorldCities$name)
x <- WorldCities$name
Encoding(x) <- "latin1"
# sub = "" drops every byte that has no ASCII equivalent, so accented
# characters are removed rather than transliterated.
y <- iconv(x, from = "latin1", to = "ASCII", sub = "")
# Sanity check: nothing should be reported after the conversion.
tools::showNonASCII(y)
# Alternative that transliterates instead of dropping characters:
# z <- stringi::stri_trans_general(WorldCities$name, "latin-ascii")
# tools::showNonASCII(z)
WorldCities$name <- y
WorldCities <- as_tibble(WorldCities)
usethis::use_data(WorldCities, overwrite = TRUE)

# NCI60 -- 5 MB file so put it in a different place
# The full download stays under data-raw/; only the first rows returned by
# head() are saved under data/ as `NCI60_tiny`, with xz compression.
nci60_raw_path <- "data-raw/NCI60.rda"
download.file(
  url = "https://github.com/DataComputing/DataComputing/raw/master/data/NCI60.rda",
  destfile = nci60_raw_path
)
load(file = nci60_raw_path)
NCI60_tiny <- head(NCI60)
save(NCI60_tiny, file = "data/NCI60_tiny.rda", compress = "xz")
# Print the upstream Rd help page as roxygen comments.
nci60_rd <- parse_file("https://raw.githubusercontent.com/DataComputing/DataComputing/master/man/NCI60.Rd")
cat(create_roxygen(nci60_rd), sep = "\n")
# mdsr-book/mdsr documentation built on May 1, 2024, 9:22 a.m.