R/get_all_invalids.R

Defines functions get_all_invalids

Documented in get_all_invalids

#' Combine Every Invalid Summary
#'
#' Runs each of the functions whose name ends in `_invalid` on `data`, keeps
#' the second element of each result, and full-joins those summaries on
#' `C_Biosense_Facility_ID`. The joined table is then reshaped: every column
#' after the first is split on the period in its name into a field and a
#' measure, and the fields are spread back out as columns. All invalid checks
#' are done at the patient-visit level: if *one* message in a patient visit is
#' found to be invalid, the whole patient visit is returned as invalid.
#'
#' @param data The raw data from BioSense on which you will do the invalid checks.
#' @return A classic data frame that contains the combined results from all
#'   of the `_invalid` functions, with `"NaN"` entries replaced by `NA`.
#' @import dplyr
#' @import tidyr
#' @export
get_all_invalids <- function(data) {

  # the checks to run, in the order their summaries get joined
  checks <- list(
    admit_source_invalid, age_invalid, any_e_invalid,
    blood_pressure_invalid, cc_ar_invalid, country_invalid,
    death_invalid, diagnosis_type_invalid,
    discharge_disposition_invalid, ethnicity_invalid,
    facility_type_invalid, fpid_mrn_invalid,
    gender_invalid, height_invalid, patient_class_invalid,
    pulseox_invalid, race_invalid, smoking_status_invalid,
    state_invalid, temperature_invalid, weight_invalid,
    zip_invalid
  )

  # run every check and keep only the second element of what it returns
  per_check <- lapply(checks, function(check) check(data)[[2]])

  # fold the summaries left to right into one wide table, keyed by facility id
  joined <- Reduce(
    function(acc, nxt) full_join(acc, nxt, by = "C_Biosense_Facility_ID"),
    per_check
  )

  # go long on everything after the first column
  # (the first column is expected to be the facility id)
  long <- gather(joined, key, value, 2:ncol(joined))

  # column names look like "<Field>.<Measure>"; split them at the period
  split_keys <- separate(long, key, into = c("Field", "Measure"), sep = "\\.")

  # one column per field again
  wide <- spread(split_keys, Field, value)

  # classic data frame, for writing to xlsx
  result <- as.data.frame(wide)

  # swap nan for na
  result[result == "NaN"] <- NA

  result
}
markhwhiteii/biosensequality documentation built on May 14, 2019, 7:43 a.m.