R/read-planning-edf.R

Defines functions read_edf_sheet check_code_essai check_redem check_lim check_lim_limit read_planning_edf

Documented in read_planning_edf

#' @importFrom data.table as.data.table := setorderv %like%
#' @importFrom readxl read_excel
read_edf_sheet <- function(path, sheet) {
  data <- readxl::read_excel(path = path, sheet = sheet, skip = 5)
  data <- as.data.table(data)
  setnames(x = data, old = names(data), new = clean_names(names(data)))
  data <- data[, .SD, .SDcols = c("comb_", "groupe", "code_groupe", "pmd", "debut", "fin", "code_essai", "pmax", "pmin")]
  data <- data[, groupe := locf(groupe)]
  data <- data[, code_groupe := locf(code_groupe)]
  data <- data[, comb_ := locf(comb_)]
  data <- data[, pmd := locf(pmd)]
  data <- data[!is.na(debut)]

  
  # LIM/LIMIT
  # data <- data[, val_llim := check_lim_limit(x = code_essai), by = code_groupe]
  # data <- data[val_llim == TRUE]
  # data <- data[, val_llim := NULL]
  
  # keep only LIMIT for D units
  data <- data[!(comb_ == "D" & code_essai == "LIM")]


  # Delete REDEM
  # data <- data[!code_essai %like% "^REDEM.*"]

  # expand dates
  data <- data[, .id := seq_len(.N)]
  data <- data[rep(.id, n_hours(debut, fin))]
  data <- data[, datetime := seq.POSIXt(from = min(debut), to = max(fin), by = "hours"), by = list(.id)]
  data <- data[, datetime := as.POSIXct(round.POSIXt(datetime - 1, units = "hours"), tz = "Europe/Paris")]
  data <- data[format(datetime) != format(fin)]
  data <- data[, debut := NULL]
  data <- data[, fin := NULL]
  data <- data[, .id := NULL]
  
  
  # check code essai indispo
  data <- data[, val_indispo := check_code_essai(code_essai, "^INDISPO$", "INDISPO"), by = list(code_groupe, datetime)]
  data <- data[val_indispo == TRUE]
  data <- data[, val_indispo := NULL]

  # check code essai fortuit
  data <- data[, val_fortuit := check_code_essai(code_essai, "^F$", "^F$"), by = list(code_groupe, datetime)]
  data <- data[val_fortuit == TRUE]
  data <- data[, val_fortuit := NULL]

  # check code essai arret garanti prolonge
  data <- data[, val_agp := check_code_essai(code_essai, "^AGP$", "^AGP$"), by = list(code_groupe, datetime)]
  data <- data[val_agp == TRUE]
  data <- data[, val_agp := NULL]

  # check code essai AND
  data <- data[, val_and := check_code_essai(
    x = code_essai, code = "^AND$", possible.values = c("^AND")
  ), by = list(code_groupe, datetime)]
  data <- data[val_and == TRUE]
  data <- data[, val_and := NULL]
  
  
  
  # check code essai VP
  data <- data[, val_vp := check_code_essai(
    x = code_essai, code = "^VP$", possible.values = c("^VP", "^RVP.*")
  ), by = list(code_groupe, datetime)]
  data <- data[val_vp == TRUE]
  data <- data[, val_vp := NULL]
  
  # check code essai RVP
  data <- data[, val_rvp := check_redem(x = code_essai), by = list(code_groupe, datetime)]
  data <- data[val_rvp == TRUE]
  data <- data[, val_rvp := NULL]
  
  # check code essai RVD
  data <- data[, val_rvd := check_redem(x = code_essai, type = "RVD"), by = list(code_groupe, datetime)]
  data <- data[val_rvd == TRUE]
  data <- data[, val_rvd := NULL]
  
  # check code essai VA
  data <- data[, val_va := check_code_essai(
    x = code_essai, code = "^VA$", possible.values = c("^VA$")
  ), by = list(code_groupe, datetime)]
  data <- data[val_va == TRUE]
  data <- data[, val_va := NULL]
  
  # check code essai VD
  data <- data[, val_vd := check_code_essai(
    x = code_essai, code = "^VD$", possible.values = c("^VD", "^RVD.*")
  ), by = list(code_groupe, datetime)]
  data <- data[val_vd == TRUE]
  data <- data[, val_vd := NULL]
  
  # check code essai ASR
  data <- data[, val_asr := check_code_essai(
    x = code_essai, code = "^ASR$", possible.values = c("^ASR", "^RASR.*")
  ), by = list(code_groupe, datetime)]
  data <- data[val_asr == TRUE]
  data <- data[, val_asr := NULL]
  
  # check code essai DRTE
  data <- data[, val_drte := check_code_essai(
    x = code_essai, code = "^DRTE$", possible.values = c("^DRTE")
  ), by = list(code_groupe, datetime)]
  data <- data[val_drte == TRUE]
  data <- data[, val_drte := NULL]
  
  # check code essai MODUL
  data <- data[, val_modul := check_code_essai(
    x = code_essai, code = "^MODUL$", possible.values = c("^MODUL")
  ), by = list(code_groupe, datetime)]
  data <- data[val_modul == TRUE]
  data <- data[, val_modul := NULL]

  # check code essai EP NUC
  data <- data[, val_epnuc := check_code_essai(
    x = code_essai, code = "^EP NUC$", possible.values = c("EP NUC")
  ), by = list(code_groupe, datetime)]
  data <- data[val_epnuc == TRUE]
  data <- data[, val_epnuc := NULL]

  
  # Anything than LIM
  data <- data[, val_lim := check_lim(x = code_essai), by = list(code_groupe, datetime)]
  data <- data[val_lim == TRUE]
  data <- data[, val_lim := NULL]
  
  
  # date header
  dates_h <- readxl::read_excel(path = path, sheet = sheet, n_max = 5)[4, 4]
  dates_h <- unlist(dates_h, use.names = FALSE)
  dates_h <- stringr::str_extract_all(string = dates_h, pattern = "\\d{2}/\\d{2}/\\d{4}")[[1]]
  dates_h <- as.POSIXct(dates_h, format = "%d/%m/%Y")
  data <- data[datetime >= dates_h[1] &  datetime < dates_h[2] + 24 * 60 * 60]

  # dedup
  data <- unique(x = data, by = c("groupe", "code_groupe", "datetime"), fromLast = TRUE)
  setorderv(x = data, cols = c("groupe", "datetime"))
  return(data)
}

#' @importFrom stringr str_detect
check_code_essai <- function(x, code = "VP", possible.values = c("^VP", "^RVP.*")) {
  if (any(str_detect(string = x, pattern = code))) {
    lind <- lapply(X = possible.values, FUN = stringr::str_detect, string = x)
    Reduce(f = `|`, x = lind)
  } else {
    rep_len(x = TRUE, length.out = length(x))
  }
}

check_redem <- function(x, type = "RVP") {
  if (any(str_detect(string = x, pattern = "^REDEM")) & any(str_detect(string = x, pattern = paste0("^", type)))) {
    str_detect(string = x, pattern = paste0("^", type))
  } else {
    rep_len(x = TRUE, length.out = length(x))
  }
}


check_lim <- function(x) {
  if (all(x == "LIM")) {
    rep_len(x = TRUE, length.out = length(x))
  } else {
    x != "LIM"
  }
}


check_lim_limit <- function(x) {
  if ("LIM" %in% x & "LIMIT" %in% x) {
    x != "LIMIT"
  } else {
    rep_len(x = TRUE, length.out = length(x))
  }
}



#' Read EDF thermal file
#'
#' @param path Path to the Excel file. Can be left blank, designate an Excel
#' file or directory containing Excel files. If the path points to a directory,
#' the most recent Excel file is read. If the argument is not specified, a dialog
#' box will open to select a directory.
#'
#' @export
#' @return a \code{data.table}
#'
#' @importFrom data.table rbindlist
#' @importFrom readxl read_excel excel_sheets
read_planning_edf <- function(path) {
  if (missing(path)) {
    path <- choose_path()
  }
  path <- select_file(path, "Politique_S", fileext = "\\.xlsx$")
  sheets <- readxl::excel_sheets(path = path)
  res <- lapply(
    X = sheets,
    FUN = function(sheet) {
      dat <- read_edf_sheet(path = path, sheet = sheet)
      region <- unlist(readxl::read_excel(path = path, sheet = sheet, n_max = 5)[4, 1], use.names = FALSE)
      dat$region <- region
      return(dat)
    }
  )
  rbindlist(res)
}
rte-antares-rpackage/antaresWeeklyMargin documentation built on July 25, 2019, 8:23 p.m.