R/compare_one_reserve_multi_event.R

Defines functions compare_one_reserve_multi_event

Documented in compare_one_reserve_multi_event

#' compare_one_reserve_multi_event
#'
#' @param var_in .xlsx with all required input variables defined (string).
#' @param data_path pathway to cdmo data folder (string).
#' @param storm_nm name of storm event (string).
#' @param storm_start YYYY-MM-DD HH:MM:SS (string).
#' @param storm_end YYYY-MM-DD HH:MM:SS (string).
#' @param reserve 3 digit reserve code (string).
#' @param keep_flags comma separated list of data quality flags that should be kept (string).
#' @param skip TRUE/FALSE. If TRUE, function will be skipped (string).
#' @param user_units User defined units. Set to "English" or "SI". Default CDMO data is in SI units. Not all parameters have common equivalent English units (e.g. concentrations), and therefore not all will be converted.
#'
#' @return tables are generated and saved in /output/wq/compare_one_reserve_multi_event/ and /output/met/compare_one_reserve_multi_event/
#' @export
#'
#' @examples
#'
#' \dontrun{
#' #StormVariables.xlsx is a template variable input file saved in data/
#' vars_in <- 'data/StormTrackVariables.xlsx'
#' single_storm_track(var_in = vars_in)
#' }
compare_one_reserve_multi_event <- function(var_in,
                                            data_path,
                                            storm_nm = NULL,
                                            storm_start = NULL,
                                            storm_end = NULL,
                                            reserve = NULL,
                                            keep_flags = NULL,
                                            skip = NULL,
                                            user_units = NULL) {

  # ----------------------------------------------------------------------------
  # Define global variables
  # ----------------------------------------------------------------------------
  NERR.Site.ID_ <- rlang::sym('NERR.Site.ID')
  Status_ <- rlang::sym('Status')
  Station.Type_ <- rlang::sym('Station.Type')

  station_ <- rlang::sym('station')
  event_ <- rlang::sym('event')
  parameter_ <- rlang::sym('parameter')
  result_ <- rlang::sym('result')


  # ----------------------------------------------------------------------------
  # Read in Data
  # ----------------------------------------------------------------------------

  #a.  Read in the variable input template, var_in

  input_Parameters <- openxlsx::read.xlsx(var_in, sheet = "stats_one_reserve")
  input_Master <- openxlsx::read.xlsx(var_in, sheet = "MASTER")



  if(is.null(storm_nm)) storm_nm <- unlist(strsplit(input_Parameters[1,2],", "))
  if(is.null(storm_start)) storm_start <- unlist(strsplit(input_Parameters[2,2],", "))
  if(is.null(storm_end)) storm_end <- unlist(strsplit(input_Parameters[3,2],", "))
  #if(is.null(wq_sites)) wq_sites <- unlist(strsplit(input_Parameters[5,2],", "))
  #if(is.null(wq_sites)) wq_sites <- if(is.na(input_Parameters[4,2])) {wq_stations$Station.Code} else {input_Parameters[4,2]}
  #if(is.null(met_sites)) met_sites <- unlist(strsplit(input_Parameters[6,2],", "))
  #if(is.null(met_sites)) met_sites <- if(is.na(input_Parameters[5,2])) {met_stations$Station.Code} else {input_Parameters[5,2]}
  if(is.null(reserve)) reserve <- if(is.na(input_Parameters[4,2])) {input_Master[1,2]} else {input_Parameters[4,2]}
  if(is.null(keep_flags)) keep_flags <- unlist(strsplit(input_Parameters[5,2],", "))
  if(is.null(skip)) skip <- input_Parameters[6,2]
  if(is.null(user_units)) user_units <- input_Parameters[7,2]
  if(is.null(data_path)) data_path <- 'data/cdmo'

  stations <- get('sampling_stations') %>%
    dplyr::filter(!! NERR.Site.ID_ == reserve) %>%
    dplyr::filter(!! Status_ == "Active")

  wq_sites <- stations %>%
    dplyr::filter(!! Station.Type_ == 1)
  wq_sites <- wq_sites$Station.Code

  met_sites <- stations %>%
    dplyr::filter(!! Station.Type_ == 0)
  met_sites <- met_sites$Station.Code

  ############## Tests #########################################################
  if(skip == "TRUE") {return(warning("skip set to 'TRUE', skipping compare_one_reserve_multi_event"))}


  ########## WATER QUALITY #####################################################

  # ----------------------------------------------
  # Load water quality data ----------------------
  # ----------------------------------------------

  ## load, clean, and filter data
  data_type <- 'wq'

  ls_par <- lapply(wq_sites, SWMPr::import_local, path = data_path)
  ls_par <- lapply(ls_par, SWMPr::qaqc, qaqc_keep = keep_flags)
  names(ls_par) <- wq_sites


  ## convert dataset to user defined units (if "SI", no conversion will take place)
  ls_par <- SWMPrStorm::convert_units(ls_par, user_units)

  ## filter timeframe
  evts <- data.frame()
  for(i in 1:length(storm_nm)) {

    evt <- lapply(ls_par, subset, subset = c(as.POSIXct(storm_start[i]), as.POSIXct(storm_end[i])))
    evt <- dplyr::bind_rows(evt, .id = 'station')
    evt$event <- storm_nm[i]

    evts <- dplyr::bind_rows(evts, evt)

  }


  dat <- evts %>% dplyr::relocate(!! event_)


  # combine data.frames into one and tidy
  dat_tidy <- tidyr::pivot_longer(dat, 4:length(names(dat)), names_to = 'parameter', values_to = 'result')

  # ----------------------------------------------
  # Multiple Event Comparison, Single Reserves ---
  # ----------------------------------------------


  summary <- dat_tidy %>%
    dplyr::group_by(!! event_, !! parameter_,!! station_) %>%
    tidyr::drop_na(!! result_) %>%
    dplyr::summarise(min = min(!! result_, na.rm = T)
              , max = max(!! result_, na.rm = T)
              , mean = mean(!! result_, na.rm = T)
              , median = stats::median(!! result_, na.rm = T))

  # add readable station names
  summary$station_name <- sapply(summary$station, SWMPrExtension::title_labeler)

  # # add factors for spatial filtering
  # summary$station_fac <- factor(summary$station, levels = wq_sites)
  #
  # # re-sort the table using factors
  # summary <- summary %>% arrange(., parameter, station_fac)

  # write table
  tbl_ttl <- paste('output/wq/data_one_reserve_multi_event_table/data_table_wq_', user_units, "_", reserve, '_multievent.csv', sep = '')
  utils::write.csv(summary, file = tbl_ttl, quote = F, row.names = F)


  ########## Meteorological #####################################################


  # ----------------------------------------------
  # Load meteorological data ----------------------
  # ----------------------------------------------

  ## load, clean, and filter data
  data_type <- 'met'

  ls_par <- lapply(met_sites, SWMPr::import_local, path = data_path)
  ls_par <- lapply(ls_par, SWMPr::qaqc, qaqc_keep = keep_flags)
  names(ls_par) <- met_sites

  ## convert dataset to user defined units (if "SI", no conversion will take place)
  ls_par <- SWMPrStorm::convert_units(ls_par, user_units)


  ## filter timeframes

  evts <- data.frame()
  for(i in 1:length(storm_nm)) {

    evt <- lapply(ls_par, subset, subset = c(as.POSIXct(storm_start[i]), as.POSIXct(storm_end[i])))
    evt <- dplyr::bind_rows(evt, .id = 'station')
    evt$event <- storm_nm[i]

    evts <- dplyr::bind_rows(evts, evt)

  }


  dat <- evts %>% dplyr::relocate(!! event_)

  # combine data.frames into one and tidy
  dat_tidy <- tidyr::pivot_longer(dat, 4:length(names(dat)), names_to = 'parameter', values_to = 'result')

  # ----------------------------------------------
  # Multiple Event Comparison, Single Reserve ---
  # ----------------------------------------------

  total_nalist <- c("atemp", "bp", "intensprcp", "maxwspd", "rh", "sdwdir", "wdir", "wspd")

  summary <- dat_tidy %>%
    dplyr::group_by(!! event_, !! parameter_, !! station_) %>%
    tidyr::drop_na(!! result_) %>%
    dplyr::summarise(min = min(!! result_, na.rm = T)
              , max = max(!! result_, na.rm = T)
              , mean = mean(!! result_, na.rm = T)
              , median = stats::median(!! result_, na.rm = T)
              , total = sum(!! result_, na.rm = T)) %>%
    dplyr::mutate(total = dplyr::case_when(!! parameter_ %in% total_nalist == FALSE ~ total))



  # add readable station names
  summary$station_name <- sapply(summary$station, SWMPrExtension::title_labeler)


  # write table
  tbl_ttl <- paste('output/met/data_one_reserve_multi_event_table/data_table_met_', user_units, "_", reserve, '_multievent.csv', sep = '')
  utils::write.csv(summary, file = tbl_ttl, quote = F, row.names = F)


}
LimnoTech/SWMPrStorm documentation built on June 14, 2022, 6:27 p.m.