Nothing
#' Count number of patients
#'
#' @description `r lifecycle::badge("stable")`
#'
#' The analyze function [analyze_num_patients()] creates a layout element to count total numbers of unique or
#' non-unique patients. The primary analysis variable `vars` is used to uniquely identify patients.
#'
#' The `count_by` variable can be used to identify non-unique patients such that the number of patients with a unique
#' combination of values in `vars` and `count_by` will be returned instead as the `nonunique` statistic. The `required`
#' variable can be used to specify a variable required to be non-missing for the record to be included in the counts.
#'
#' The summarize function [summarize_num_patients()] performs the same function as [analyze_num_patients()] except it
#' creates content rows, not data rows, to summarize the current table row/column context and operates on the level of
#' the latest row split or the root of the table if no row splits have occurred.
#'
#' @inheritParams argument_convention
#' @param required (`character` or `NULL`)\cr name of a variable that is required to be non-missing.
#' @param count_by (`character` or `NULL`)\cr name of a variable to be combined with `vars` when counting
#' `nonunique` records.
#' @param unique_count_suffix (`flag`)\cr whether the `"(n)"` suffix should be added to `unique_count` labels.
#' Defaults to `TRUE`.
#' @param .stats (`character`)\cr statistics to select for the table.
#'
#' Options are: ``r shQuote(get_stats("summarize_num_patients"), type = "sh")``
#'
#' @name summarize_num_patients
#' @order 1
NULL
#' @describeIn summarize_num_patients Statistics function which counts the number of
#' unique patients, the corresponding percentage taken with respect to the
#' total number of patients, and the number of non-unique patients.
#'
#' @param x (`character` or `factor`)\cr vector of patient IDs.
#'
#' @return
#' * `s_num_patients()` returns a named `list` of 3 statistics:
#' * `unique`: Vector of counts and percentages.
#' * `nonunique`: Vector of counts.
#' * `unique_count`: Counts.
#'
#' @examples
#' # Use the statistics function to count number of unique and nonunique patients.
#' s_num_patients(x = as.character(c(1, 1, 1, 2, 4, NA)), labelstr = "", .N_col = 6L)
#' s_num_patients(
#' x = as.character(c(1, 1, 1, 2, 4, NA)),
#' labelstr = "",
#' .N_col = 6L,
#' count_by = c(1, 1, 2, 1, 1, 1)
#' )
#'
#' @export
s_num_patients <- function(x,
labelstr,
.N_col, # nolint
...,
count_by = NULL,
unique_count_suffix = TRUE) {
checkmate::assert_string(labelstr)
checkmate::assert_count(.N_col)
checkmate::assert_multi_class(x, classes = c("factor", "character"))
checkmate::assert_flag(unique_count_suffix)
count1 <- n_available(unique(x))
count2 <- n_available(x)
if (!is.null(count_by)) {
checkmate::assert_vector(count_by, len = length(x))
count2 <- n_available(unique(interaction(x, count_by)))
}
out <- list(
unique = formatters::with_label(c(count1, ifelse(count1 == 0 && .N_col == 0, 0, count1 / .N_col)), labelstr),
nonunique = formatters::with_label(count2, labelstr),
unique_count = formatters::with_label(
count1, ifelse(unique_count_suffix, paste0(labelstr, if (nzchar(labelstr)) " ", "(n)"), labelstr)
)
)
out
}
#' @describeIn summarize_num_patients Statistics function which counts the number of unique patients
#' in a column (variable), the corresponding percentage taken with respect to the total number of
#' patients, and the number of non-unique patients in the column.
#'
#' @return
#' * `s_num_patients_content()` returns the same values as `s_num_patients()`.
#'
#' @examples
#' # Count number of unique and non-unique patients.
#'
#' df <- data.frame(
#' USUBJID = as.character(c(1, 2, 1, 4, NA)),
#' EVENT = as.character(c(10, 15, 10, 17, 8))
#' )
#' s_num_patients_content(df, .N_col = 5, .var = "USUBJID")
#'
#' df_by_event <- data.frame(
#' USUBJID = as.character(c(1, 2, 1, 4, NA)),
#' EVENT = c(10, 15, 10, 17, 8)
#' )
#' s_num_patients_content(df_by_event, .N_col = 5, .var = "USUBJID", count_by = "EVENT")
#'
#' @export
s_num_patients_content <- function(df,
labelstr = "",
.N_col, # nolint
.var,
...,
required = NULL,
count_by = NULL,
unique_count_suffix = TRUE) {
checkmate::assert_string(.var)
checkmate::assert_data_frame(df)
if (is.null(count_by)) {
assert_df_with_variables(df, list(id = .var))
} else {
assert_df_with_variables(df, list(id = .var, count_by = count_by))
}
if (!is.null(required)) {
checkmate::assert_string(required)
assert_df_with_variables(df, list(required = required))
df <- df[!is.na(df[[required]]), , drop = FALSE]
}
x <- df[[.var]]
y <- if (is.null(count_by)) NULL else df[[count_by]]
s_num_patients(
x = x,
labelstr = labelstr,
.N_col = .N_col,
count_by = y,
unique_count_suffix = unique_count_suffix
)
}
#' @describeIn summarize_num_patients Formatted analysis function which is used as `afun`
#' in `analyze_num_patients()` and as `cfun` in `summarize_num_patients()`.
#'
#' @return
#' * `a_num_patients()` returns the corresponding list with formatted [rtables::CellValue()].
#'
#' @keywords internal
a_num_patients <- function(df,
labelstr = "",
...,
.stats = NULL,
.stat_names = NULL,
.formats = NULL,
.labels = NULL,
.indent_mods = NULL) {
# Check for additional parameters to the statistics function
dots_extra_args <- list(...)
extra_afun_params <- retrieve_extra_afun_params(names(dots_extra_args$.additional_fun_parameters))
dots_extra_args$.additional_fun_parameters <- NULL
# Check for user-defined functions
default_and_custom_stats_list <- .split_std_from_custom_stats(.stats)
.stats <- default_and_custom_stats_list$all_stats
custom_stat_functions <- default_and_custom_stats_list$custom_stats
# Apply statistics function
x_stats <- .apply_stat_functions(
default_stat_fnc = s_num_patients_content,
custom_stat_fnc_list = custom_stat_functions,
args_list = c(
df = list(df),
labelstr = list(labelstr),
extra_afun_params,
dots_extra_args
)
)
# Fill in formatting defaults
.stats <- get_stats("summarize_num_patients", stats_in = .stats, custom_stats_in = names(custom_stat_functions))
.formats <- get_formats_from_stats(.stats, .formats)
.labels <- get_labels_from_stats(
.stats, .labels,
tern_defaults = c(lapply(x_stats, attr, "label")[nchar(lapply(x_stats, attr, "label")) > 0], tern_default_labels)
)
.indent_mods <- get_indents_from_stats(.stats, .indent_mods)
x_stats <- x_stats[.stats]
# Auto format handling
.formats <- apply_auto_formatting(.formats, x_stats, extra_afun_params$.df_row, extra_afun_params$.var)
# Get and check statistical names
.stat_names <- get_stat_names(x_stats, .stat_names)
in_rows(
.list = x_stats,
.formats = .formats,
.names = .labels %>% .unlist_keep_nulls(),
.stat_names = .stat_names,
.labels = .labels %>% .unlist_keep_nulls(),
.indent_mods = .indent_mods %>% .unlist_keep_nulls()
)
}
#' @describeIn summarize_num_patients Layout-creating function which can take statistics function arguments
#' and additional format arguments. This function is a wrapper for [rtables::summarize_row_groups()].
#'
#' @return
#' * `summarize_num_patients()` returns a layout object suitable for passing to further layouting functions,
#' or to [rtables::build_table()]. Adding this function to an `rtable` layout will add formatted rows containing
#' the statistics from `s_num_patients_content()` to the table layout.
#'
#' @examples
#' # summarize_num_patients
#' tbl <- basic_table() %>%
#' split_cols_by("ARM") %>%
#' split_rows_by("SEX") %>%
#' summarize_num_patients("USUBJID", .stats = "unique_count") %>%
#' build_table(df)
#'
#' tbl
#'
#' @export
#' @order 3
summarize_num_patients <- function(lyt,
var,
required = NULL,
count_by = NULL,
unique_count_suffix = TRUE,
na_str = default_na_str(),
riskdiff = FALSE,
...,
.stats = c("unique", "nonunique", "unique_count"),
.stat_names = NULL,
.formats = NULL,
.labels = list(
unique = "Number of patients with at least one event",
nonunique = "Number of events"
),
.indent_mods = 0L) {
checkmate::assert_flag(riskdiff)
afun <- if (isFALSE(riskdiff)) a_num_patients else afun_riskdiff
# Process standard extra arguments
extra_args <- list(".stats" = .stats)
if (!is.null(.stat_names)) extra_args[[".stat_names"]] <- .stat_names
if (!is.null(.formats)) extra_args[[".formats"]] <- .formats
if (!is.null(.labels)) extra_args[[".labels"]] <- .labels
if (is.null(.indent_mods)) {
indent_mod <- 0L
} else if (length(.indent_mods) == 1) {
indent_mod <- .indent_mods
} else {
indent_mod <- 0L
extra_args[[".indent_mods"]] <- .indent_mods
}
# Process additional arguments to the statistic function
extra_args <- c(
extra_args,
required = required, count_by = count_by, unique_count_suffix = unique_count_suffix,
if (!isFALSE(riskdiff)) list(afun = list("s_num_patients_content" = a_num_patients)),
...
)
# Append additional info from layout to the analysis function
extra_args[[".additional_fun_parameters"]] <- get_additional_afun_params(add_alt_df = FALSE)
formals(afun) <- c(formals(afun), extra_args[[".additional_fun_parameters"]])
summarize_row_groups(
lyt = lyt,
var = var,
cfun = afun,
na_str = na_str,
extra_args = extra_args,
indent_mod = indent_mod
)
}
#' @describeIn summarize_num_patients Layout-creating function which can take statistics function arguments
#' and additional format arguments. This function is a wrapper for [rtables::analyze()].
#'
#' @return
#' * `analyze_num_patients()` returns a layout object suitable for passing to further layouting functions,
#' or to [rtables::build_table()]. Adding this function to an `rtable` layout will add formatted rows containing
#' the statistics from `s_num_patients_content()` to the table layout.
#'
#' @details In general, functions that starts with `analyze*` are expected to
#' work like [rtables::analyze()], while functions that starts with `summarize*`
#' are based upon [rtables::summarize_row_groups()]. The latter provides a
#' value for each dividing split in the row and column space, but, being it
#' bound to the fundamental splits, it is repeated by design in every page
#' when pagination is involved.
#'
#' @note As opposed to [summarize_num_patients()], this function does not repeat the produced rows.
#'
#' @examples
#' df <- data.frame(
#' USUBJID = as.character(c(1, 2, 1, 4, NA, 6, 6, 8, 9)),
#' ARM = c("A", "A", "A", "A", "A", "B", "B", "B", "B"),
#' AGE = c(10, 15, 10, 17, 8, 11, 11, 19, 17),
#' SEX = c("M", "M", "M", "F", "F", "F", "M", "F", "M")
#' )
#'
#' # analyze_num_patients
#' tbl <- basic_table() %>%
#' split_cols_by("ARM") %>%
#' add_colcounts() %>%
#' analyze_num_patients("USUBJID", .stats = c("unique")) %>%
#' build_table(df)
#'
#' tbl
#'
#' @export
#' @order 2
analyze_num_patients <- function(lyt,
vars,
required = NULL,
count_by = NULL,
unique_count_suffix = TRUE,
na_str = default_na_str(),
nested = TRUE,
show_labels = c("default", "visible", "hidden"),
riskdiff = FALSE,
...,
.stats = c("unique", "nonunique", "unique_count"),
.stat_names = NULL,
.formats = NULL,
.labels = list(
unique = "Number of patients with at least one event",
nonunique = "Number of events"
),
.indent_mods = NULL) {
checkmate::assert_flag(riskdiff)
afun <- if (isFALSE(riskdiff)) a_num_patients else afun_riskdiff
# Process standard extra arguments
extra_args <- list(".stats" = .stats)
if (!is.null(.stat_names)) extra_args[[".stat_names"]] <- .stat_names
if (!is.null(.formats)) extra_args[[".formats"]] <- .formats
if (!is.null(.labels)) extra_args[[".labels"]] <- .labels
if (!is.null(.indent_mods)) extra_args[[".indent_mods"]] <- .indent_mods
# Process additional arguments to the statistic function
extra_args <- c(
extra_args,
required = required, count_by = count_by, unique_count_suffix = unique_count_suffix,
if (!isFALSE(riskdiff)) list(afun = list("s_num_patients_content" = a_num_patients)),
...
)
# Append additional info from layout to the analysis function
extra_args[[".additional_fun_parameters"]] <- get_additional_afun_params(add_alt_df = FALSE)
formals(afun) <- c(formals(afun), extra_args[[".additional_fun_parameters"]])
analyze(
lyt = lyt,
vars = vars,
afun = afun,
na_str = na_str,
nested = nested,
extra_args = extra_args,
show_labels = show_labels
)
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.