# medusa: Automating SIOP Membership Analytics

# Documented in step_interests

#' Clean the primary interest-area columns (up to three per member)
#'
#' Renames the three "Interest Area" choice columns to `int_1`, `int_2` and
#' `int_3`, removes the first parenthetical qualifier from each value, and
#' keeps only the first interest when a cell lists several separated by
#' commas.
#'
#' @param df Data frame read from the raw xlsx demographics file. It must
#'   contain the columns `Interest Area (first choice)`,
#'   `Interest Area (second choice)` and `Interest Area (third choice)`.
#'
#' @return `df` with the three interest columns renamed to `int_1`, `int_2`
#'   and `int_3` and their values cleaned. Note that the cleaning is applied
#'   to every column whose name starts with `int_`.
#' @export
#'
#' @examples
#' \dontrun{
#' step_interests(df)
#' }
step_interests <- function(df) {
  df %>%
    rename(
      int_1 = `Interest Area (first choice)`,
      int_2 = `Interest Area (second choice)`,
      int_3 = `Interest Area (third choice)`
    ) %>%
    # Drop the first " (...)" qualifier, e.g. "Topic (e.g., a, b)" -> "Topic".
    mutate(across(
      starts_with("int_"),
      ~ str_replace(.x, " \\s*\\([^\\)]+\\)", "")
    )) %>%
    # Keep a single interest per cell: cut at the FIRST comma. A greedy
    # "(.*),.*" would cut at the last comma and leave "A, B" from "A, B, C".
    mutate(across(starts_with("int_"), ~ sub(",.*", "", .x)))

  # The rest of this code was developed for a pivot_longer configuration,
  # but the three interest areas are appended to the primary cleaned output
  # file instead.

  # pivot_longer(cols = -SID, names_to = "Rank") %>%
  #   mutate(Rank = as.double(str_replace(Rank, "Interest_", ""))) %>%
  #   rename('Interest' = value) %>%
  #   filter(Interest != 'NA')
}