# data-raw/DATASET.R

## Code to prepare the `initiations` dataset.
library(readr)
library(dplyr)
library(lubridate)
# Load the raw initiations extract. Every column is read as text so that all
# type conversion happens explicitly in the pipeline below.
inits_data <- read_csv(
  here::here("data-raw", "initiations.csv"),
  col_types = cols(.default = col_character())
)

inits_data <- inits_data %>%
  # Lower-case every column name before selecting columns by name.
  rename_with(stringr::str_to_lower) %>%
  # Timestamps: columns whose name ends in "date" or starts with "bond_date".
  # NOTE(review): an earlier, commented-out version of this script parsed
  # incident_begin_date with ymd() rather than mdy_hms() -- confirm that the
  # column really is in month-day-year hh:mm:ss format.
  mutate(across(ends_with("date") | starts_with("bond_date"), mdy_hms)) %>%
  # Flags: the strings "true"/"false" become logicals; any other value
  # (including missing) becomes NA.
  mutate(across(
    contains("flag"),
    ~ case_when(
      .x == "true" ~ TRUE,
      .x == "false" ~ FALSE
    )
  )) %>%
  # Amounts, ages and counts: extract the number from the text.
  mutate(across(
    contains("bond_amount") | starts_with("age_at") | contains("charge_count"),
    parse_number
  )) %>%
  # The source column name is misspelled ("electroinic"); correct it.
  rename(
    bond_electronic_monitor_flag_current =
      bond_electroinic_monitor_flag_current
  )

# Tidy the race labels: title-case each value, then relabel any value that
# begins with "Hispanic".
inits_data <- inits_data %>%
  mutate(
    race = stringr::str_replace_all(
      stringr::str_to_title(race),
      "^Hispanic",
      "White/Black [Hispanic Or Latino]"
    )
  )

# Publish the cleaned table under its final name. use_data() takes the object
# as a bare symbol, so the object must be called `initiations` at this point
# (presumably the saved file is named after the symbol -- see the usethis
# documentation). overwrite = TRUE is passed so that re-running this script
# replaces a previously saved copy.
initiations <- inits_data
usethis::use_data(initiations, overwrite = TRUE)
# phillydao/deidentify documentation built on Feb. 4, 2021, 2:31 p.m.