R/read.R

Defines functions: col_spec, convert_to_col_type, check_input_file, read_stats19, normalize_collision_reference, sanitize_duckdb_where, read_casualties, read_vehicles, read_collisions

Documented in: check_input_file, read_casualties, read_collisions, read_vehicles

#' Read in STATS19 road safety data from .csv files downloaded.
#'
#' @section Details:
#' This is a wrapper function to access and load STATS19 data in a
#' user-friendly way. The function returns a data frame, in which each record
#' is a reported incident in the STATS19 data.
#'
#' @param filename Character string of the filename of the .csv to read, if this is given, type and
#' years determine whether there is a target to read, otherwise disk scan would be needed.
#' @param data_dir Where sets of downloaded data would be found.
#' @param year Single year for which data are to be read
#' @param format Switch to return raw read from file, default is `TRUE`.
#' @param silent Boolean. If `FALSE` (default value), display useful progress
#'   messages on the screen.
#'
#' @export
#' @examples
#' \donttest{
#' if(curl::has_internet()) {
#' dl_stats19(year = 2024, type = "collision")
#' ac = read_collisions(year = 2024)
#' }
#' }
read_collisions = function(year = NULL,
                          filename = "",
                          data_dir = get_data_directory(),
                          format = TRUE,
                          silent = FALSE) {
  # Delegate to the shared reader with the collision table selected.
  read_stats19(
    type = "collision",
    year = year,
    filename = filename,
    data_dir = data_dir,
    format = format,
    silent = silent
  )
}

#' Read in STATS19 road safety data from .csv files downloaded.
#'
#' @inheritParams read_collisions
#' @export
read_vehicles = function(year = NULL,
                         filename = "",
                         data_dir = get_data_directory(),
                         format = TRUE,
                         silent = TRUE) {
  # `silent` is exposed for consistency with read_collisions(). It defaults
  # to TRUE (not FALSE) to preserve the previous behavior, where no `silent`
  # argument was passed and read_stats19()'s own default (TRUE) applied.
  read_stats19(year = year, filename = filename, data_dir = data_dir,
               format = format, silent = silent, type = "vehicle")
}

#' Read in STATS19 road safety data from .csv files downloaded.
#'
#' @inheritParams read_collisions
#' @export
read_casualties = function(year = NULL,
                           filename = "",
                           data_dir = get_data_directory(),
                           format = TRUE,
                           silent = TRUE) {
  # `silent` is exposed for consistency with read_collisions(). It defaults
  # to TRUE (not FALSE) to preserve the previous behavior, where no `silent`
  # argument was passed and read_stats19()'s own default (TRUE) applied.
  read_stats19(year = year, filename = filename, data_dir = data_dir,
               format = format, silent = silent, type = "cas")
}

# Internal helper to make numeric DuckDB predicates work with all_varchar=TRUE.
#
# The CSV files are read with every column as VARCHAR, so numeric comparisons
# on the OSGR coordinate columns would compare as text. Wrap those columns in
# TRY_CAST(... AS DOUBLE) so the predicate compares numerically, with
# malformed values becoming NULL instead of raising an error.
#
# @param where A single SQL WHERE-clause string; NULL, "" and zero-length
#   inputs are returned unchanged.
# @return The predicate with coordinate columns cast to DOUBLE.
sanitize_duckdb_where = function(where) {
  # length(where) == 0 must be checked explicitly: !nzchar(character(0)) has
  # length 0, and a zero-length operand makes `||` error.
  if (is.null(where) || length(where) == 0 || !nzchar(where)) {
    return(where)
  }

  wrap_try_cast = function(sql, column) {
    # Skip columns the caller has already cast explicitly.
    already_cast = grepl(
      paste0("TRY_CAST\\s*\\(\\s*", column, "\\s+AS\\s+DOUBLE\\s*\\)"),
      sql,
      ignore.case = TRUE,
      perl = TRUE
    )
    if (already_cast) {
      return(sql)
    }

    # \b word boundaries avoid touching identifiers that merely contain the
    # column name as a substring.
    gsub(
      pattern = paste0("\\b", column, "\\b"),
      replacement = paste0("TRY_CAST(", column, " AS DOUBLE)"),
      x = sql,
      ignore.case = TRUE,
      perl = TRUE
    )
  }

  where = wrap_try_cast(where, "location_easting_osgr")
  where = wrap_try_cast(where, "location_northing_osgr")
  where
}

# Internal helper to normalize legacy collision reference fields early.
#
# Ensures a single canonical `collision_reference` column: if absent, the
# first legacy alias present is promoted to that name; then any remaining
# alias columns are used to fill NA/"" gaps and are dropped. Previously, when
# the canonical column was absent, only the first alias was renamed and the
# other alias columns were left behind un-merged.
#
# @param x A data frame (possibly containing legacy reference columns).
# @return `x` with exactly one `collision_reference` column and no aliases.
normalize_collision_reference = function(x) {
  reference_aliases = c("collision_ref_no", "accident_reference", "accident_ref_no")

  # Promote the first alias found when the canonical column is missing.
  if (!"collision_reference" %in% names(x)) {
    src = intersect(reference_aliases, names(x))
    if (length(src) == 0) {
      return(x)
    }
    names(x)[names(x) == src[[1]]] = "collision_reference"
  }

  # Fill remaining gaps from any leftover alias columns, then drop them.
  # missing_idx is recomputed per alias so later aliases only fill rows that
  # are still empty.
  for (old_name in intersect(reference_aliases, names(x))) {
    missing_idx = is.na(x$collision_reference) | x$collision_reference == ""
    x$collision_reference[missing_idx] = x[[old_name]][missing_idx]
    x[[old_name]] = NULL
  }
  x
}

# Internal helper to handle all stats19 reading.
#
# @param year Single year (or vector) to read; NULL reads all files found.
#   Sentinel values 5 / "5 years" / 1979 skip the final year filter so that
#   full-history reads are not truncated.
# @param filename Optional explicit file name(s); NULL or "" triggers a disk
#   scan via find_file_name().
# @param data_dir Directory in which the downloaded .csv files live.
# @param format If TRUE, apply the type-specific format_* function.
# @param silent If TRUE, suppress per-file progress messages (readr engine).
# @param type One of "collision", "vehicle", "cas" (prefix-matched below).
# @param engine "readr" (default) or "duckdb" for faster reads of big files.
# @param where Optional SQL WHERE clause, used by the duckdb engine only.
# @return A tibble of records, or NULL if no files are found on disk.
read_stats19 = function(year = NULL,
                        filename = "",
                        data_dir = get_data_directory(),
                        format = TRUE,
                        silent = TRUE,
                        type = "collision",
                        engine = "readr",
                        where = NULL) {
  fnames = filename
  # is.null() must be tested FIRST: `filename == ""` on a NULL filename has
  # length 0, and `||` errors on a zero-length operand. identical() also
  # avoids an error if a caller passes a vector of filenames.
  if (is.null(filename) || identical(filename, "")) {
    fnames = find_file_name(years = year, type = type)
  }
  
  if (length(fnames) == 0) {
    message("No files found.")
    return(NULL)
  }

  paths = file.path(data_dir, fnames)
  existing_paths = paths[file.exists(paths)]
  
  if (length(existing_paths) == 0) {
    message("Files not found on disk.")
    return(NULL)
  }

  # duckdb is optional: fall back to readr when it is not installed.
  if (engine == "duckdb") {
    if (!requireNamespace("duckdb", quietly = TRUE) || !requireNamespace("DBI", quietly = TRUE)) {
      warning("duckdb and DBI packages are required for engine = 'duckdb'. Falling back to readr.")
      engine = "readr"
    }
  }

  if (engine == "duckdb") {
    con = DBI::dbConnect(duckdb::duckdb(), dbdir = ":memory:")
    on.exit(DBI::dbDisconnect(con, shutdown = TRUE), add = TRUE)
    
    # Create views for each file and union them
    view_names = paste0("v", seq_along(existing_paths))
    for (i in seq_along(existing_paths)) {
      p = existing_paths[i]
      v = view_names[i]
      
      # Using read_csv_auto which is very fast and handles many edge cases
      # We read as VARCHAR initially to be safe with STATS19's weird types and -1 for NA
      # We use SELECT * to ensure we get all columns (indices, coordinates, etc.)
      query = glue::glue("CREATE VIEW {v} AS SELECT * FROM read_csv_auto('{p}', all_varchar=TRUE)")
      DBI::dbExecute(con, query)
    }
    
    # UNION ALL BY NAME aligns columns across files whose headers differ.
    union_query = paste0("SELECT * FROM ", paste(view_names, collapse = " UNION ALL BY NAME SELECT * FROM "))
    
    # Build WHERE clauses
    where_clauses = character(0)
    
    # 1. Filter by year in SQL if requested (sentinels skip the filter, see above)
    if (!is.null(year) && !identical(year, 5) && !identical(year, "5 years") && !identical(year, 1979) && !identical(year, 1979L)) {
      # Get all columns from all views to find all potential year columns
      all_cols = unique(unlist(lapply(view_names, function(v) DBI::dbListFields(con, v))))
      year_cols = intersect(all_cols, c("accident_year", "collision_year", "Accident_Year", "Collision_Year"))
      if (length(year_cols) > 0) {
        # Quote years: columns are VARCHAR because of all_varchar=TRUE.
        year_str = paste0("'", year, "'", collapse = ", ")
        # Build OR condition for all found year columns
        year_cond = paste0("(", paste0(year_cols, " IN (", year_str, ")", collapse = " OR "), ")")
        where_clauses = c(where_clauses, year_cond)
      }
    }
    
    # 2. Add arbitrary WHERE clause (e.g. spatial bounding box)
    if (!is.null(where)) {
      where = sanitize_duckdb_where(where)
      where_clauses = c(where_clauses, where)
    }
    
    if (length(where_clauses) > 0) {
      union_query = paste0("SELECT * FROM (", union_query, ") WHERE ", paste(where_clauses, collapse = " AND "))
    }
    
    x = DBI::dbGetQuery(con, union_query)
    x = tibble::as_tibble(x)
  } else {
    if (any(grepl("1979-latest", existing_paths))) {
      warning("Reading the large 1979-latest file with 'readr' can be slow. Consider using engine = 'duckdb' for better performance.", call. = FALSE)
    }
    read_one = function(p) {
      if (isFALSE(silent)) message("Reading in: ", p)
      # STATS19 encodes missing values as -1 in addition to blanks.
      readr::read_csv(p, col_types = col_spec(p), na = c("", "NA", "-1"), show_col_types = FALSE)
    }
    
    # Read and bind
    x_list = lapply(existing_paths, read_one)
    x = dplyr::bind_rows(x_list)
  }
  
  x = normalize_collision_reference(x)
  
  if(format) {
    format_fun = switch(tolower(substr(type, 1, 3)),
                        "col" = format_collisions,
                        "veh" = format_vehicles,
                        "cas" = format_casualties)
    x = format_fun(x)
  }
  
  # Ensure -1 is NA across all columns (safety net for Option 1)
  # Done AFTER formatting to allow schema to map -1 to labels first if needed
  x[] = lapply(x, function(col) {
    if(is.character(col)) {
      col[col == "-1"] = NA_character_
    } else if(is.numeric(col)) {
      col[col == -1] = NA
    }
    col
  })
  x = tibble::as_tibble(x)
  
  # Filter by year if requested
  # Note: we don't filter if year is 1979 to maintain compatibility with full history fetching
  if (!is.null(year) && !identical(year, 5) && !identical(year, "5 years") && !identical(year, 1979) && !identical(year, 1979L)) {
    year_col = intersect(names(x), c("accident_year", "collision_year"))
    if (length(year_col) > 0) {
      x = x[x[[year_col[1]]] %in% year, ]
    }
  }
  
  x
}

#' Local helper to be reused.
#' @param filename Character string of the filename of the .csv to read.
#' @param type One of 'collision', 'casualty', 'Vehicle'.
#' @param data_dir Where sets of downloaded data would be found.
#' @param year Single year for which data are to be read.
check_input_file = function(filename = NULL,
                            type = NULL,
                            data_dir = NULL,
                            year = NULL) {
  # Resolve the requested file to a single on-disk path.
  path = locate_one_file(
    type = type,
    filename = filename,
    data_dir = data_dir,
    year = year
  )
  # locate_one_file() signals ambiguity via this sentinel string.
  if (identical(path, "More than one csv file found.")) {
    stop("Multiple files with the same name found.", call. = FALSE)
  }

  # The path is usable only if it exists and is a .csv file.
  is_valid = !is.null(path) && length(path) > 0 &&
    endsWith(path, ".csv") && file.exists(path)
  if (!is_valid) {
    message(path, " not found")
    message("Try running dl_stats19(), change arguments or try later.")
    return(NULL)
  }
  path
}

# possibly in utils
# Convert the 'type' column to readr's col_type format.
# Unknown type strings fall back to readr::col_guess().
convert_to_col_type = function(type) {
  # Map schema type names to the matching readr collector constructors.
  makers = list(
    character = readr::col_character,
    numeric = readr::col_double,
    integer = readr::col_integer,
    logical = readr::col_logical,
    date = readr::col_date,
    datetime = readr::col_datetime
  )
  maker = makers[[type]]
  if (is.null(maker)) {
    readr::col_guess()
  } else {
    maker()
  }
}

# Build a readr column specification for a STATS19 csv file.
#
# With a path, the file's header is read so the spec's names and ORDER match
# the file exactly; without one, a spec covering every known schema variable
# is returned. Variables not found in stats19::stats19_variables are guessed.
#
# @param path Optional path to a .csv file; NULL uses the full schema.
# @return A readr::cols() specification.
col_spec = function(path = NULL) {
  # Hoist the schema lookup table; type_for centralizes the variable->type
  # mapping that was previously duplicated in both branches.
  vars = stats19::stats19_variables
  type_for = function(v) {
    matched = vars$type[vars$variable == v]
    if (length(matched) > 0) {
      convert_to_col_type(matched[[1]])
    } else {
      readr::col_guess()
    }
  }

  if (is.null(path)) {
    # Fallback to all known variables if no path. lapply (not sapply) keeps
    # the result a list of collector objects unconditionally.
    unique_vars = unique(vars$variable)
    specs = lapply(unique_vars, type_for)
    return(do.call(readr::cols, stats::setNames(specs, unique_vars)))
  }

  # Read only the header to get column names and ORDER
  header = names(readr::read_csv(path, n_max = 0, show_col_types = FALSE))
  header_clean = format_column_names(header)

  # Map cleaned header names to their types from the schema
  col_types_list = lapply(header_clean, type_for)

  # Create the cols object with the correct NAMES and ORDER matching the file
  do.call(readr::cols, stats::setNames(col_types_list, header))
}

Try the stats19 package in your browser

Any scripts or data that you put into this service are public.

stats19 documentation built on March 18, 2026, 5:08 p.m.