Nothing
#' Extract OSM into OSRM Graph Files
#'
#' @description
#' `r lifecycle::badge("stable")`
#'
#' Run the `osrm-extract` tool to preprocess an OSM file
#' (`.osm`, `.osm.bz2`, or `.osm.pbf`) into the base `.osrm` graph files
#' using a specified Lua profile. After the tool has run, the function checks
#' that the companion `<base>.osrm.timestamp` file exists and raises an error
#' if it does not.
#'
#' @details
#' Argument validation (`verbosity`, `threads`, `small_component_size`) is
#' performed before any existing files are cleaned up, so a call with invalid
#' arguments never removes previously generated graph files.
#'
#' After a successful extraction a `dataset.meta.json` file recording the
#' profile name, the creation time (UTC) and the input file name is written
#' next to the graph files. Writing this file is best-effort: a failure to
#' write it is silently ignored and does not fail the extraction.
#'
#' @param input_osm A string. Path to the input OSM file
#'   (`.osm`, `.osm.bz2`, or `.osm.pbf`) or a directory containing exactly one
#'   OSM file with a supported extension. An `osrm_job` object is also
#'   accepted; its path is taken from the object and its `logs` are carried
#'   over into the returned job.
#' @param profile A string. Path to the OSRM Lua profile
#'   (e.g. returned by \code{osrm_find_profile("car.lua")}).
#' @param threads An integer. Number of threads for
#'   \code{-t/--threads}; default \code{8} (OSRM's default). Must be a single
#'   whole number.
#' @param overwrite A logical. If \code{FALSE} (default), stops when any
#'   existing `.osrm*` files matching the base name are found alongside
#'   \code{input_osm}. If \code{TRUE}, those files are removed with
#'   \code{osrm_cleanup()} before extraction proceeds.
#' @param verbosity A string. Log verbosity level passed to
#'   \code{-l/--verbosity} (one of
#'   \code{"NONE","ERROR","WARNING","INFO","DEBUG"}), default \code{"INFO"}.
#' @param data_version A string or \code{NULL}. Passed to
#'   \code{-d/--data_version}; default \code{NULL}, in which case the option
#'   is omitted.
#' @param small_component_size An integer. For
#'   \code{--small-component-size}; default \code{1000} (OSRM's default).
#'   Must be a single whole number.
#' @param with_osm_metadata A logical. If \code{TRUE}, adds
#'   \code{--with-osm-metadata}; default \code{FALSE}.
#' @param parse_conditional_restrictions A logical. If \code{TRUE}, adds
#'   \code{--parse-conditional-restrictions}; default \code{FALSE}.
#' @param location_dependent_data A string or \code{NULL}. Path to GeoJSON,
#'   passed to \code{--location-dependent-data}; default \code{NULL}, in which
#'   case the option is omitted.
#' @param disable_location_cache A logical. If \code{TRUE}, adds
#'   \code{--disable-location-cache}; default \code{FALSE}.
#' @param dump_nbg_graph A logical. If \code{TRUE}, adds
#'   \code{--dump-nbg-graph}; default \code{FALSE}.
#' @inheritParams osrm_prepare_graph
#'
#' @return An object of class \code{osrm_job} with the following elements:
#' \describe{
#'   \item{osrm_job_artifact}{The path to the generated `.osrm.timestamp`
#'     file.}
#'   \item{osrm_working_dir}{The directory containing all OSRM files.}
#'   \item{logs}{A list of logs: any logs carried over from an `osrm_job`
#'     input, followed by the \code{processx::run} result of this stage under
#'     the name \code{extract}.}
#' }
#'
#' @examples
#' \donttest{
#' if (identical(Sys.getenv("OSRM_EXAMPLES"), "true")) {
#'   # Install OSRM (temporary, session PATH)
#'   install_dir <- osrm_install(
#'     version = "latest",
#'     path_action = "session",
#'     quiet = TRUE
#'   )
#'
#'   # copy example OSM PBF into a temporary workspace to avoid polluting
#'   # pkg data
#'   pbf_path <- system.file("extdata/cur.osm.pbf", package = "osrm.backend")
#'   osrm_dir <- file.path(tempdir(), paste0("osrm-", Sys.getpid()))
#'   dir.create(osrm_dir, recursive = TRUE)
#'   tmp_pbf <- file.path(osrm_dir, "cur.osm.pbf")
#'   file.copy(from = pbf_path, to = tmp_pbf, overwrite = TRUE)
#'
#'   # Find the path to the profile first
#'   car_profile <- osrm_find_profile("car.lua")
#'
#'   # extract OSRM graph files
#'   result <- osrm_extract(
#'     input_osm = tmp_pbf,
#'     profile = car_profile,
#'     overwrite = TRUE,
#'     threads = 1L
#'   )
#'   # path to generated .osrm files (specifically, the .osrm.timestamp file)
#'   result$osrm_job_artifact
#'
#'   # Clean up binaries and workspace
#'   osrm_uninstall(
#'     dest_dir = install_dir,
#'     clear_path = TRUE,
#'     force = TRUE,
#'     quiet = TRUE
#'   )
#'   unlink(osrm_dir, recursive = TRUE)
#' }
#' }
#' @export
osrm_extract <- function(
  input_osm,
  profile = osrm_find_profile("car.lua"),
  threads = 8L,
  overwrite = FALSE,
  verbosity = c("INFO", "NONE", "ERROR", "WARNING", "DEBUG"),
  data_version = NULL,
  small_component_size = 1000L,
  with_osm_metadata = FALSE,
  parse_conditional_restrictions = FALSE,
  location_dependent_data = NULL,
  disable_location_cache = FALSE,
  dump_nbg_graph = FALSE,
  quiet = FALSE,
  verbose = FALSE,
  spinner = TRUE,
  echo_cmd = FALSE
) {
  if (!requireNamespace("processx", quietly = TRUE)) {
    stop("'processx' package is required for osrm_extract", call. = FALSE)
  }

  # --- Validate arguments before touching the filesystem ---
  # With overwrite = TRUE existing graph files get removed further down, so an
  # invalid argument must be rejected before that happens.
  verbosity <- match.arg(verbosity)

  # Render a count as a plain decimal string. as.character() would turn a
  # round double such as 100000 into "1e+05", which is not a valid CLI value.
  count_arg <- function(value, arg_name) {
    number <- suppressWarnings(as.numeric(value))
    is_whole <- length(number) == 1L &&
      is.finite(number) &&
      number == trunc(number)
    if (!is_whole) {
      stop("'", arg_name, "' must be a single whole number", call. = FALSE)
    }
    sprintf("%.0f", number)
  }
  threads_arg <- count_arg(threads, "threads")
  component_size_arg <- count_arg(
    small_component_size,
    "small_component_size"
  )

  # --- Resolve the input ---
  # Carry over logs from earlier stages when the input is an osrm_job object
  input_logs <- list()
  if (
    inherits(input_osm, "osrm_job") &&
      is.list(input_osm$logs) &&
      length(input_osm$logs) > 0
  ) {
    input_logs <- input_osm$logs
  }

  # Extract path from osrm_job object if needed
  input_osm <- get_osrm_path_from_input(input_osm)

  # Resolve input path (file or directory)
  input_osm <- resolve_osrm_path(
    input_osm,
    pattern = "\\.(osm|osm\\.bz2|osm\\.pbf)$",
    file_description = "OSM files (.osm, .osm.bz2, or .osm.pbf)"
  )

  # Strip the recognized extension to derive the base path
  osm_ext <- "\\.osm(\\.(pbf|bz2))?$"
  if (!grepl(osm_ext, input_osm, ignore.case = TRUE)) {
    stop(
      "'input_osm' must have extension .osm, .osm.bz2, or .osm.pbf",
      call. = FALSE
    )
  }
  base <- sub(osm_ext, "", input_osm, ignore.case = TRUE)

  # --- Check for existing .osrm* files of this base name ---
  # Literal, case-insensitive prefix match on "<base>.osrm". Building a regex
  # from the file name would misbehave on names containing metacharacters and
  # would also pick up unrelated files that merely share a prefix.
  siblings <- list.files(dirname(base))
  osrm_prefix <- tolower(paste0(basename(base), ".osrm"))
  existing <- siblings[startsWith(tolower(siblings), osrm_prefix)]

  if (length(existing) > 0) {
    if (!overwrite) {
      stop(
        "Found existing OSRM files: ",
        paste(existing, collapse = ", "),
        ".\nSet overwrite = TRUE to proceed.",
        call. = FALSE
      )
    }
    if (!quiet) {
      message("Existing OSRM files found. Cleaning up...")
    }
    osrm_cleanup(base, quiet = quiet)
  }

  # --- Build command arguments ---
  arguments <- c(
    input_osm,
    "-p",
    profile,
    "-l",
    verbosity,
    "-t",
    threads_arg,
    "--small-component-size",
    component_size_arg
  )
  if (!is.null(data_version)) {
    arguments <- c(arguments, "-d", data_version)
  }
  if (with_osm_metadata) {
    arguments <- c(arguments, "--with-osm-metadata")
  }
  if (parse_conditional_restrictions) {
    arguments <- c(arguments, "--parse-conditional-restrictions")
  }
  if (!is.null(location_dependent_data)) {
    arguments <- c(
      arguments,
      "--location-dependent-data",
      location_dependent_data
    )
  }
  if (disable_location_cache) {
    arguments <- c(arguments, "--disable-location-cache")
  }
  if (dump_nbg_graph) {
    arguments <- c(arguments, "--dump-nbg-graph")
  }

  # `quiet` overrides every other console-output switch
  show_echo <- !quiet && verbose
  show_spinner <- !quiet && spinner
  show_echo_cmd <- !quiet && echo_cmd

  # --- Run extraction ---
  logs <- processx::run(
    resolve_osrm_bin("osrm-extract"),
    args = arguments,
    echo = show_echo,
    spinner = show_spinner,
    echo_cmd = show_echo_cmd
  )

  # --- Verify timestamp file ---
  timestamp_file <- paste0(base, ".osrm.timestamp")
  if (!file.exists(timestamp_file)) {
    stop(
      "Extraction did not produce timestamp file: ",
      basename(timestamp_file),
      call. = FALSE
    )
  }

  # --- Write metadata ---
  # Determine profile name: "path/to/car.lua" -> "car"
  profile_name <- tools::file_path_sans_ext(basename(profile))
  meta_file <- file.path(dirname(base), "dataset.meta.json")
  meta_data <- list(
    profile = profile_name,
    created_at = format(Sys.time(), "%Y-%m-%dT%H:%M:%SZ", tz = "UTC"),
    input_osm = basename(input_osm)
  )
  # Best-effort: a metadata write failure must not fail a successful
  # extraction, so errors are deliberately swallowed here.
  try(
    jsonlite::write_json(
      meta_data,
      meta_file,
      auto_unbox = TRUE,
      pretty = TRUE
    ),
    silent = TRUE
  )

  # Accumulate logs from previous stages
  accumulated_logs <- c(input_logs, list(extract = logs))

  as_osrm_job(
    osrm_job_artifact = timestamp_file,
    osrm_working_dir = dirname(timestamp_file),
    logs = accumulated_logs
  )
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.