ccmisc: Some misc functions for working at CodeClan

Documented in find_notes open_notes

#' Locate files at given path
#'
#' Lists all notes (html), notebook (Rmd) and data (csv) files found
#' recursively below the \code{week_XX/day_Y} directory of the course repo at
#' \code{path}. Nothing is opened or read here; only file paths are returned.
#'
#' If \code{file_types} contains \code{'notes'}, html files are listed. If it
#' contains \code{'rmd'}, Rmarkdown notebooks are listed. If it contains
#' \code{'data'}, csv files are listed and each path is named after its
#' \code{\link{basename}} with the \code{.csv} extension removed and every run
#' of spaces and hyphens replaced by a single underscore.
#'
#' @param week Integer
#' @param day  Integer
#' @param file_types Character; Any or all of 'notes', 'rmd', or 'data'
#' @param path Character; Location of course repo
#' @param drop_dups Logical; Remove duplicated dataset names. Duplicates are
#'   detected on the final (normalised) dataset name and the first file found
#'   is kept.
#'
#' @return Named list of character vectors of file paths, with one element
#'   ('notes', 'rmd', 'data') per requested file type. The 'data' element is
#'   named by dataset name.
#' @export
#'
find_notes <- function(week, day, file_types = c('notes', 'data', 'rmd'),
                       path, drop_dups = TRUE) {

  # Only the week/day part goes through sprintf(); a literal '%' in `path`
  # must not be interpreted as a conversion specification.
  path <- file.path(path, sprintf('week_%02i/day_%i', week, day))

  files <- list()

  if ('notes' %in% file_types) {
    files$notes <- dir(path, '\\.html$', recursive = TRUE, full.names = TRUE)
  }

  if ('rmd' %in% file_types) {
    files$rmd <- dir(path, '\\.Rmd$', recursive = TRUE, full.names = TRUE)
  }

  if ('data' %in% file_types) {
    data_files <- dir(path, '\\.csv$', recursive = TRUE, full.names = TRUE)

    # Build the final dataset names first ...
    data_names <- sub('\\.csv$', '', basename(data_files))
    data_names <- gsub('[ -]+', '_', data_names)

    # ... so that duplicates are detected on the name that is actually used
    # (e.g. 'my-data.csv' and 'my data.csv' both become 'my_data').
    if (drop_dups) {
      keep <- !duplicated(data_names)
      data_files <- data_files[keep]
      data_names <- data_names[keep]
    }

    files$data <- stats::setNames(data_files, data_names)
  }

  files
}

#' Opens notes files
#'
#' Looks up the files for the given week and day with \code{find_notes()},
#' reads every csv file found into the global environment and opens every
#' html / Rmd file found with \code{\link[utils]{browseURL}}. If two or more
#' datasets end up with the same name, only the last one read will be
#' available.
#'
#' When \code{file_types} is not supplied, only 'notes' and 'data' are used;
#' Rmd notebooks are opened only when 'rmd' is requested explicitly.
#'
#' @param clean_names Logical; Pass dataset columns names through
#'   \code{\link[janitor]{clean_names}}
#' @inheritParams find_notes
#'
#' @return Character; names of datasets attached (\code{character(0)} when no
#'   data was requested or found). The \code{week_XX/day_Y/} directory that
#'   was searched is attached as attribute \code{path}.
#' @export
#'
open_notes <- function(week, day, file_types = c('notes', 'data', 'rmd'),
                       path = '/Users/user/Documents/GitHub/data_rewrite2',
                       clean_names = TRUE, drop_dups = TRUE) {

  file_types_arg <- match.arg(file_types, several.ok = TRUE)
  # Rmd notebooks are opt-in: the default call only handles notes and data.
  if (missing(file_types)) {
    file_types_arg <- c('notes', 'data')
  }

  notes <- find_notes(week, day, file_types_arg, path, drop_dups)

  # Read each dataset and bind it in the global environment under its
  # dataset name. A plain loop avoids mapply() trying to simplify a list of
  # data frames that is thrown away anyway.
  datasets <- notes$data
  dataset_names <- names(datasets)
  for (i in seq_along(datasets)) {
    dat <- suppressMessages({
      raw <- readr::read_csv(datasets[[i]])
      if (clean_names) janitor::clean_names(raw) else raw
    })
    assign(dataset_names[i], dat, envir = .GlobalEnv)
  }

  # Everything that is not data (html notes, Rmd notebooks) is opened.
  to_open <- unlist(notes[names(notes) != 'data'], use.names = FALSE)
  for (f in to_open) {
    utils::browseURL(f)
  }

  # names() is NULL when no data was requested; structure(NULL, ...) is
  # deprecated and would not return a character vector.
  if (is.null(dataset_names)) {
    dataset_names <- character(0)
  }

  # Derive the day directory from the inputs rather than from the first notes
  # file, so it is also correct when no notes were requested or found and for
  # two-digit days.
  day_dir <- paste0(file.path(path, sprintf('week_%02i/day_%i', week, day)), '/')

  structure(dataset_names, path = day_dir)
}


#' Rename object in global environment
#'
#' Rebinds the objects named \code{obj_names} under the new names given in
#' \code{names} inside \code{where}, removes the old bindings and prints an
#' \code{old ...> new} summary line per object. Old and new names may overlap
#' (e.g. swapping two objects); all values are fetched before any binding is
#' changed.
#'
#' @param obj_names Character; names of object to rename
#' @param names Character; New names for objects. Must have the same length
#'   as \code{obj_names} and contain no duplicates.
#' @param where Environment or character; anything accepted by
#'   \code{\link{as.environment}}
#'
#' @return NULL
#' @export
#'
#' @examples
#'
#' \dontrun{
#' ccmisc::open_notes(6, 3, 'data')
#'
#' rename_obj(c('telecomms_churn', 'telecomms_churn_200_sample'),
#'         c('telco', 'telco_200'))
#' }
#'
rename_obj <- function (obj_names, names, where = .GlobalEnv) {
  if (!is.character(obj_names) || !is.character(names)) {
    stop("'obj_names' and 'names' must be character vectors", call. = FALSE)
  }
  if (length(obj_names) != length(names)) {
    stop("'obj_names' and 'names' must have the same length", call. = FALSE)
  }
  if (anyDuplicated(names) > 0L) {
    stop("'names' must not contain duplicates", call. = FALSE)
  }

  # Nothing to rename; also avoids max() on an empty vector below.
  if (length(obj_names) == 0L) {
    return(invisible())
  }

  # Accept an environment as well as a search-path name such as 'package:x'.
  env <- as.environment(where)

  # Fetch every value up front; mget() errors before anything is modified if
  # one of the objects does not exist.
  obj <- mget(obj_names, envir = env)
  names(obj) <- names

  lens <- nchar(obj_names)
  pad <- paste0(' ', strrep('.', max(lens) - lens), '> ')

  # Remove the old bindings BEFORE creating the new ones: doing it the other
  # way round deletes any new binding whose name is also an old name.
  rm(list = unique(obj_names), envir = env)
  list2env(obj, envir = env)

  cli::cat_line(
    cli::col_grey(obj_names, pad),
    cli::col_green(names)
  )

  invisible()
}