Nothing
#' @title Return or remove variables or observations that are completely missing
#' @name remove_empty
#' @rdname remove_empty
#'
#' @description
#'
#' These functions check which rows or columns of a data frame contain only
#' missing values, i.e. which observations or variables are completely
#' missing, and either (1) return their indices; or (2) remove them
#' from the data frame.
#'
#' @param x A data frame.
#'
#' @return
#'
#' - For `empty_columns()` and `empty_rows()`, a numeric (named) vector with the
#' column or row indices of those variables or observations that contain only
#' missing values.
#'
#' - For `remove_empty_columns()` and `remove_empty_rows()`, a data frame with
#' "empty" columns or rows removed, respectively.
#'
#' - For `remove_empty()`, **both** empty rows and columns will be removed.
#'
#' @details For character vectors, empty string values (i.e. `""`) are also
#' considered as missing values. Thus, if a character vector only contains `NA`
#' and `""`, it is considered an empty variable and will be removed. The same
#' applies to observations (rows) that only contain `NA` or `""`.
#'
#' @examples
#' tmp <- data.frame(
#' a = c(1, 2, 3, NA, 5),
#' b = c(1, NA, 3, NA, 5),
#' c = c(NA, NA, NA, NA, NA),
#' d = c(1, NA, 3, NA, 5)
#' )
#'
#' tmp
#'
#' # indices of empty columns or rows
#' empty_columns(tmp)
#' empty_rows(tmp)
#'
#' # remove empty columns or rows
#' remove_empty_columns(tmp)
#' remove_empty_rows(tmp)
#'
#' # remove empty columns and rows
#' remove_empty(tmp)
#'
#' # also remove "empty" character vectors
#' tmp <- data.frame(
#' a = c(1, 2, 3, NA, 5),
#' b = c(1, NA, 3, NA, 5),
#' c = c("", "", "", "", ""),
#' stringsAsFactors = FALSE
#' )
#' empty_columns(tmp)
#'
#' @export
empty_columns <- function(x) {
  # Only tabular input (matrix or data frame) with at least two columns is
  # inspected; anything else yields an empty numeric vector.
  if ((!is.matrix(x) && !is.data.frame(x)) || ncol(x) < 2) {
    return(vector("numeric"))
  }

  # columns in which every single value is NA
  all_na <- colSums(is.na(x)) == nrow(x)

  if (is.matrix(x)) {
    # A matrix has to be checked column-wise through its dimensions:
    # iterating over it with vapply() would visit single cells instead of
    # columns, and the recycled result would yield indices beyond ncol(x).
    all_empty <- if (is.character(x)) {
      # `TRUE | NA` is TRUE, so NA cells count as empty and no NA reaches
      # colSums()
      colSums(is.na(x) | x == "") == nrow(x)
    } else {
      # only character data can contain empty strings
      rep(FALSE, ncol(x))
    }
  } else {
    # character or factor columns whose non-missing values are all ""
    all_empty <- vapply(x, function(i) {
      (is.character(i) || is.factor(i)) &&
        !any(nzchar(as.character(i[!is.na(i)])))
    }, FUN.VALUE = logical(1L))
  }

  # positions (named, if column names exist) of all empty columns
  which(all_na | all_empty)
}
#' @rdname remove_empty
#' @export
empty_rows <- function(x) {
  # Guard: only matrices or data frames with at least two rows are inspected;
  # everything else yields an empty numeric vector.
  is_tabular <- is.matrix(x) || is.data.frame(x)
  if (!is_tabular || nrow(x) < 2) {
    return(vector("numeric"))
  }

  # A cell counts as blank when it is NA or an empty string. `TRUE | NA` is
  # TRUE, so NA cells never propagate NA into the row sums.
  blank_cells <- is.na(x) | x == "" # nolint

  # rows in which every cell is blank
  which(rowSums(blank_cells) == ncol(x))
}
#' @rdname remove_empty
#' @export
remove_empty_columns <- function(x) {
  # indices of the columns reported as empty
  ec <- empty_columns(x)
  # Only subset when something was found: a zero-length negative index would
  # select no columns at all and return an empty object.
  if (length(ec) > 0) {
    x <- if (is.matrix(x)) {
      # single-index subsetting of a matrix removes cells, not columns, so
      # columns are addressed explicitly; drop = FALSE keeps the result a
      # matrix even when one column remains
      x[, -ec, drop = FALSE]
    } else {
      x[-ec]
    }
  }
  x
}
#' @rdname remove_empty
#' @export
remove_empty_rows <- function(x) {
  # indices of the rows reported as empty
  er <- empty_rows(x)
  # Only subset when something was found: a zero-length negative index would
  # select no rows at all and return an empty data frame.
  if (length(er) > 0) {
    # remember the attributes so they can be passed to .replace_attrs() below
    attr_data <- attributes(x)
    # drop = FALSE keeps single-column input two-dimensional; without it the
    # result would collapse to a bare vector
    x <- x[-er, , drop = FALSE]
    # NOTE(review): .replace_attrs() is defined elsewhere; presumably it
    # restores attributes lost by the row subsetting - confirm
    x <- .replace_attrs(x, attr_data)
  }
  x
}
#' @rdname remove_empty
#' @export
remove_empty <- function(x) {
  # Empty rows are dropped first; empty columns are then determined on the
  # row-reduced data.
  remove_empty_columns(remove_empty_rows(x))
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.