R/set_datetime.R
In corella: Prepare, Manipulate and Check Data to Comply with Darwin Core Standard

Documented in set_datetime

#' Set, create or modify columns with date and time information
#'
#' @description
#' This function helps format standard date/time columns in a `tibble` using
#' Darwin Core Standard. Users should make use of the
#' [lubridate package](https://lubridate.tidyverse.org/) to
#' format their dates so corella can read them correctly.
#'
#' In practice this is no different from using `mutate()`, but gives some
#' informative errors, and serves as a useful lookup for how date and time
#' fields are represented in the Darwin Core Standard.
#' @param .df A `data.frame` or `tibble` that the column should be appended to.
#' @param eventDate The date or date + time that the observation/event occurred.
#' @param year The year of the observation/event.
#' @param month The month of the observation/event.
#' @param day The day of the observation/event.
#' @param eventTime The time of the event. Use this term for Event data.
#' Date + time information for observations is accepted in `eventDate`.
#' @param .keep Control which columns from `.df` are retained in the output.
#' Note that unlike [dplyr::mutate()], which defaults to `"all"` this defaults to
#' `"unused"`; i.e. only keeps Darwin Core fields, and not those fields used to
#' generate them.
#' @param .messages (logical) Should informative messages be shown? Defaults to
#' `TRUE`.
#' @returns A `tibble` with the requested columns added/reformatted.
#' @details
#' Example values are:
#' * `eventDate` should be class `Date` or `POSIXct`. We suggest using the
#' lubridate package to define your date format using functions like
#' `ymd()`, `mdy()`, `dmy()`, or if including date + time, `ymd_hms()`,
#' `ymd_hm()`, or `ymd_h()`.
#' @examples
#' df <- tibble::tibble(
#'   name = c("Crinia Signifera", "Crinia Signifera", "Litoria peronii"),
#'   latitude = c(-35.27, -35.24, -35.83),
#'   longitude = c(149.33, 149.34, 149.34),
#'   date = c("2010-10-14", "2010-10-14", "2010-10-14"),
#'   time = c("10:08:12", "13:01:45", "14:02:33")
#' )
#'
#' # Use the lubridate package to format date + time information
#' # eventDate accepts date + time
#' df |>
#'   set_datetime(
#'     eventDate = lubridate::ymd_hms(paste(date, time))
#'   )
#'
#' @importFrom dplyr mutate
#' @importFrom rlang abort
#' @export
set_datetime <- function(
    .df,
    eventDate = NULL,
    year = NULL,
    month = NULL,
    day = NULL,
    eventTime = NULL,
    .keep = "unused",
    .messages = TRUE
){

  if(missing(.df)){
    abort(".df is missing, with no default.")
  }

  # Names of the Darwin Core arguments of this function.
  # `ls()` skips dot-prefixed names (`.df`, `.keep`, `.messages`) and returns
  # the remaining argument names sorted. It must be called before any other
  # local variable is created, otherwise those locals would be listed too.
  fn_args <- ls()

  # capture arguments as a list of quosures
  # NOTE: enquos() must be listed alphabetically so that each quosure lines up
  # with the sorted names held in `fn_args`
  fn_quos <- rlang::enquos(day, eventDate, eventTime, month, year)
  names(fn_quos) <- fn_args

  # find arguments that are NULL but exist already in `df`
  # then remove them before `mutate()`
  # otherwise, these DwC columns are deleted by `mutate(.keep = "unused")`
  fn_quo_is_null <- vapply(fn_quos, rlang::quo_is_null, logical(1))
  null_col_exists_in_df <- fn_quo_is_null & (names(fn_quos) %in% colnames(.df))
  fn_quos <- fn_quos[!null_col_exists_in_df]

  # Update df
  result <- .df |>
    mutate(!!!fn_quos,
           .keep = .keep)

  check_missing_all_args(fn_call = match.call(),
                         fn_args = fn_args,
                         user_cols = colnames(result))

  # inform user which columns will be checked
  matched_cols <- names(result)[names(result) %in% fn_args]

  if(isTRUE(.messages) && length(matched_cols) > 0) {
    col_progress_bar(cols = matched_cols)
  }

  # each check only acts when its column is present in `result`
  check_eventDate(result, level = "abort")
  check_year(result, level = "abort")
  check_month(result, level = "abort")
  check_day(result, level = "abort")
  check_eventTime(result, level = "abort")

  # other tests likely to be needed here
  result
}



#' Check eventDate
#'
#' Runs `check_is_date()` on the `eventDate` column of `.df` when that column
#' is present; does nothing otherwise.
#' @noRd
#' @importFrom lubridate parse_date_time
#' @keywords Internal
check_eventDate <- function(.df,
                            level = c("inform", "warn", "abort")
){
  level <- match.arg(level)

  # nothing to validate when the column is absent
  has_event_date <- any(colnames(.df) == "eventDate")
  if(!has_event_date){
    return(invisible(NULL))
  }

  # NOTE: an additional `check_is_time()` step and an informative message
  # about the UTC default / changing timezone were sketched here previously
  # but are currently disabled.
  event_date_col <- select(.df, "eventDate")
  check_is_date(event_date_col, level = level)
}


#' Check year
#'
#' When `.df` has a `year` column, passes it to `check_within_range()` with
#' bounds of 0 and the current calendar year; does nothing otherwise.
#' @noRd
#' @importFrom lubridate year
#' @importFrom lubridate today
#' @keywords Internal
check_year <- function(.df,
                       level = c("inform", "warn", "abort")
){
  level <- match.arg(level)

  # nothing to validate when the column is absent
  if(!any(colnames(.df) == "year")){
    return(invisible(NULL))
  }

  # upper bound is the year of today's date
  current_year <- as.numeric(lubridate::year(lubridate::today()))
  year_col <- select(.df, "year")

  check_within_range(year_col,
                     lower = 0,
                     upper = current_year,
                     level = level)
}

#' Check month
#'
#' When `.df` has a `month` column:
#' * numeric months (integer or double) are passed to `check_within_range()`
#'   with bounds 1 and 12;
#' * character months are compared against `month.abb` and, if none match,
#'   against `month.name`. If at least one value matches a set, a warning
#'   reports how many values (including `NA`) do not match that set.
#'
#' Columns of any other type are not checked.
#' @noRd
#' @importFrom lubridate year
#' @importFrom lubridate today
#' @keywords Internal
check_month <- function(.df,
                        level = c("inform", "warn", "abort")) {
  level <- match.arg(level)

  # nothing to validate when the column is absent
  if (!any(colnames(.df) == "month")) {
    return(invisible(NULL))
  }

  month_values <- .df[["month"]]

  # `is.numeric()` is TRUE for integer and double vectors, whereas
  # `inherits(x, "numeric")` is FALSE for integers and would let integer
  # months skip the range check altogether.
  if (is.numeric(month_values)) {
    .df |>
      select("month") |>
      check_within_range(
        lower = 1,
        upper = 12,
        level = level
      )
  } else if (is.character(month_values)) {
    # NOTE(review): `level` is not applied to the character checks below;
    # they always signal a warning.
    not_abbreviation <- is.na(match(month_values, month.abb))
    not_full_name <- is.na(match(month_values, month.name))

    if (any(!not_abbreviation)) {
      # Column looks like month abbreviations: report the ones that are not
      unmatched <- sum(not_abbreviation)
      if (unmatched > 0) {
        cli::cli_warn("{.field month} contains {unmatched} unrecognised month abbreviation{?s}.")
      }
    } else if (any(!not_full_name)) {
      # Column looks like full month names: report the ones that are not
      unmatched <- sum(not_full_name)
      if (unmatched > 0) {
        cli::cli_warn("{.field month} contains {unmatched} unrecognised month name{?s}.")
      }
    }
  }
}

#' Check day
#'
#' When `.df` has a `day` column, numeric values (integer or double) are
#' passed to `check_within_range()` with bounds 1 and 31. A non-numeric `day`
#' column aborts with an informative error.
#' @noRd
#' @importFrom lubridate year
#' @importFrom lubridate today
#' @keywords Internal
check_day <- function(.df,
                      level = c("inform", "warn", "abort")
){
  level <- match.arg(level)
  if(any(colnames(.df) == "day")){

    day <- .df |>
      select("day")

    # `is.numeric()` accepts both integer and double vectors.
    # `inherits(x, "numeric")` is FALSE for integers, which rejected integer
    # day-of-month values such as those suggested by the error message below.
    if(is.numeric(.df$day)) {
      day |>
        check_within_range(lower = 1,
                           upper = 31,
                           level = level
        )
    } else {
      # NOTE(review): this branch always aborts, regardless of `level`.
      bullets <- cli::cli_bullets(c(
        "{.field day} must be a numeric vector, not {class(.df$day)}.",
        i = "See {.code ?lubridate::mday()} to see how to convert a date to day of month."
      ))|>
        cli::cli_fmt()

      cli::cli_abort(bullets)

    }
  }
}



#' Check eventTime
#'
#' Runs `check_is_time()` on the `eventTime` column of `.df` when that column
#' is present; does nothing otherwise.
#' @noRd
#' @importFrom lubridate year
#' @importFrom lubridate today
#' @keywords Internal
check_eventTime <- function(.df,
                            level = c("inform", "warn", "abort")
){
  level <- match.arg(level)

  # nothing to validate when the column is absent
  has_event_time <- any(colnames(.df) == "eventTime")
  if(!has_event_time){
    return(invisible(NULL))
  }

  event_time_col <- select(.df, "eventTime")
  check_is_time(event_time_col, level = level)
}

Any scripts or data that you put into this service are public.

corella documentation built on April 4, 2025, 12:20 a.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

corella
Prepare, Manipulate and Check Data to Comply with Darwin Core Standard

R/set_datetime.R
In corella: Prepare, Manipulate and Check Data to Comply with Darwin Core Standard

Defines functions check_eventTime check_day check_month check_year check_eventDate set_datetime

Documented in set_datetime

Try the corella package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

corella Prepare, Manipulate and Check Data to Comply with Darwin Core Standard

R/set_datetime.R In corella: Prepare, Manipulate and Check Data to Comply with Darwin Core Standard

Defines functions check_eventTime check_day check_month check_year check_eventDate set_datetime

Documented in set_datetime

Try the corella package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

corella
Prepare, Manipulate and Check Data to Comply with Darwin Core Standard

R/set_datetime.R
In corella: Prepare, Manipulate and Check Data to Comply with Darwin Core Standard