Nothing
#' Format columns of a data frame
#'
#' This function formats the columns of a data frame based on the column type (logical, date, numeric).
#' It allows various formatting options like significant digits, decimal points, and scientific notation.
#' It also includes custom formatting for date and boolean values.
#' If this function is applied several times to the same cell, the last transformation is retained and the previous calls are ignored, except for the `escape` argument which can be applied to previously transformed data.
#'
#' @param x A data frame or a vector to be formatted.
#' @param i Numeric vector or string.
#' - Numeric vector: Row indices where the styling should be applied. Can be a single value or a vector.
#' - String: Table components to format "caption", "colnames", "groupi" (row group labels), "~groupi" (non-group rows), "groupj" (column group labels), "notes".
#' - If both the `i` and `j` are omitted (default: NULL), formatting is applied to all table elements, including caption, notes, and group labels.
#' @param digits Number of significant digits or decimal places.
#' @param num_fmt The format for numeric values; one of 'significant', 'significant_cell', 'decimal', or 'scientific'.
#' @param num_zero Logical; if TRUE, trailing zeros are kept in "decimal" format (but not in "significant" format).
#' @param num_mark_big Character to use as a thousands separator.
#' @param num_mark_dec Decimal mark character. Default is the global option 'OutDec'.
#' @param num_suffix Logical; if TRUE display short numbers with `digits` significant digits and K (thousands), M (millions), B (billions), or T (trillions) suffixes.
#' @param date A string passed to the `format()` function, such as "%Y-%m-%d". See the "Details" section in `?strptime`
#' @param bool A function to format logical columns. Defaults to title case.
#' @param math Logical. If TRUE, wrap cell values in math mode `$..$`. This is useful for LaTeX output or with HTML MathJax `options(tinytable_html_mathjax=TRUE)`.
#' @param other A function to format columns of other types. Defaults to `as.character()`.
#' @param replace Logical, String or Named list of vectors
#' - TRUE: Replace `NA` and `NaN` by an empty string.
#' - FALSE: Print `NA` and `NaN` as strings.
#' - String: Replace `NA` and `NaN` entries by the user-supplied string.
#' - Named list: Replace matching elements of the vectors in the list by theirs names. Example:
#' - `list("-" = c(NA, NaN), "Tiny" = -Inf, "Massive" = Inf)`
#' @param escape Logical or "latex" or "html". If TRUE, escape special characters to display them as text in the format of the output of a `tt()` table.
#' - If `i` and `j` are both `NULL`, escape all cells, column names, caption, notes, and spanning labels created by `group_tt()`.
#' @param markdown Logical; if TRUE, render markdown syntax in cells. Ex: `_italicized text_` is properly italicized in HTML and LaTeX.
#' @param fn Function for custom formatting. Accepts a vector and returns a character vector of the same length.
#' @param quarto Logical. Enable Quarto data processing and wrap cell content in a `data-qmd` span (HTML) or `\QuartoMarkdownBase64{}` macro (LaTeX). See warnings in the Global Options section below.
#' @param sprintf String passed to the `?sprintf` function to format numbers or interpolate strings with a user-defined pattern (similar to the `glue` package, but using Base R).
#' @param linebreak NULL or a single string. If it is a string, replaces that string with appropriate line break sequences depending on the output format (HTML: `<br>`, LaTeX: `\\\\`, Typst: `\\ `). Markdown output is excluded from line break replacement.
#' @param output Apply formatting only if the `tt()` object is rendered in the specified format. One of "latex", "html", "typst", or "markdown". If `NULL` (default), apply formatting regardless of the output format.
#' @inheritParams tt
#' @inheritParams style_tt
#' @template global_options
#'
#' @return A data frame with formatted columns.
#' @export
#' @examples
#' dat <- data.frame(
#' a = rnorm(3, mean = 10000),
#' b = rnorm(3, 10000)
#' )
#' tab <- tt(dat)
#' format_tt(tab,
#' digits = 2,
#' num_mark_dec = ",",
#' num_mark_big = " "
#' )
#'
#' k <- tt(data.frame(x = c(0.000123456789, 12.4356789)))
#' format_tt(k, digits = 2, num_fmt = "significant_cell")
#'
#' dat <- data.frame(
#' a = c("Burger", "Halloumi", "Tofu", "Beans"),
#' b = c(1.43202, 201.399, 0.146188, 0.0031),
#' c = c(98938272783457, 7288839482, 29111727, 93945)
#' )
#' tt(dat) |>
#' format_tt(j = "a", sprintf = "Food: %s") |>
#' format_tt(j = 2, digits = 1, num_fmt = "decimal", num_zero = TRUE) |>
#' format_tt(j = "c", digits = 2, num_suffix = TRUE)
#'
#' y <- tt(data.frame(x = c(123456789.678, 12435.6789)))
#' format_tt(y, digits = 3, num_mark_big = " ")
#'
#' x <- tt(data.frame(Text = c("_italicized text_", "__bold text__")))
#' format_tt(x, markdown = TRUE)
#'
#' # Line breaks using linebreak argument
#' d <- data.frame(Text = "First line<br>Second line")
#' tt(d) |> format_tt(linebreak = "<br>")
#'
#' # Non-standard evaluation (NSE)
#' dat <- data.frame(
#' w = c(143002.2092, 201399.181, 100188.3883),
#' x = c(1.43402, 201.399, 0.134588),
#' y = as.Date(c(897, 232, 198), origin = "1970-01-01"),
#' z = c(TRUE, TRUE, FALSE)
#' )
#' tt(dat) |>
#' format_tt(i = w > 150000, j = w, digits = 0, num_mark_big = ",")
#'
#' tab <- data.frame(a = c(NA, 1, 2), b = c(3, NA, 5))
#' tt(tab) |> format_tt(replace = "-")
#'
#' dat <- data.frame(
#' "LaTeX" = c("Dollars $", "Percent %", "Underscore _"),
#' "HTML" = c("<br>", "<sup>4</sup>", "<emph>blah</emph>")
#' )
#' tt(dat) |> format_tt(escape = TRUE)
#'
format_tt <- function(
x,
i = NULL,
j = NULL,
digits = get_option("tinytable_format_digits", default = NULL),
num_fmt = get_option("tinytable_format_num_fmt", default = "significant"),
num_zero = get_option("tinytable_format_num_zero", default = FALSE),
num_suffix = get_option("tinytable_format_num_suffix", default = FALSE),
num_mark_big = get_option("tinytable_format_num_mark_big", default = ""),
num_mark_dec = get_option(
"tinytable_format_num_mark_dec",
default = getOption("OutDec", default = ".")
),
date = get_option("tinytable_format_date", default = NULL),
bool = get_option("tinytable_format_bool", default = NULL),
math = get_option("tinytable_format_math", default = FALSE),
other = get_option("tinytable_format_other", default = NULL),
replace = get_option("tinytable_format_replace", default = FALSE),
escape = get_option("tinytable_format_escape", default = FALSE),
markdown = get_option("tinytable_format_markdown", default = FALSE),
quarto = get_option("tinytable_format_quarto", default = FALSE),
fn = get_option("tinytable_format_fn", default = NULL),
sprintf = get_option("tinytable_format_sprintf", default = NULL),
linebreak = get_option("tinytable_format_linebreak", default = NULL),
output = get_option("tinytable_format_output", default = NULL)) {
assert_integerish(digits, len = 1, null.ok = TRUE)
assert_choice(
num_fmt,
c("significant", "significant_cell", "decimal", "scientific")
)
assert_flag(num_zero)
assert_string(num_mark_big)
assert_string(num_mark_dec)
assert_string(date, null.ok = TRUE)
assert_function(bool, null.ok = TRUE)
assert_function(identity, null.ok = TRUE)
assert_function(other, null.ok = TRUE)
assert_flag(markdown)
assert_flag(quarto)
assert_function(fn, null.ok = TRUE)
assert_choice(output, c("latex", "html", "typst", "markdown"), null.ok = TRUE)
assert_string(sprintf, null.ok = TRUE)
assert_string(linebreak, null.ok = TRUE)
replace <- sanitize_replace(replace)
sanity_num_mark(digits, num_mark_big, num_mark_dec)
out <- x
# non-standard evaluation before anything else
tmp <- nse_i_j(x, i_expr = substitute(i), j_expr = substitute(j), pf = parent.frame())
list2env(tmp, environment())
if (inherits(out, "tinytable")) {
cal <- call(
"format_tt_lazy",
i = i,
j = j,
digits = digits,
num_fmt = num_fmt,
num_zero = num_zero,
num_suffix = num_suffix,
num_mark_big = num_mark_big,
num_mark_dec = num_mark_dec,
replace = replace,
fn = fn,
sprintf = sprintf,
date_format = date,
bool = bool,
math = math,
escape = escape,
markdown = markdown,
quarto = quarto,
other = other,
linebreak = linebreak,
output = output
)
out@lazy_format <- c(out@lazy_format, list(cal))
} else {
out <- format_tt_lazy(
out,
i = i,
j = j,
digits = digits,
num_fmt = num_fmt,
num_zero = num_zero,
num_suffix = num_suffix,
num_mark_big = num_mark_big,
num_mark_dec = num_mark_dec,
replace = replace,
fn = fn,
sprintf = sprintf,
date_format = date,
bool = bool,
math = math,
other = other,
escape = escape,
quarto = quarto,
markdown = markdown,
linebreak = linebreak,
output = output
)
}
return(out)
}
format_tt_lazy <- function(
x,
i,
j,
digits,
num_fmt,
num_zero,
num_suffix,
num_mark_big,
num_mark_dec,
replace,
fn,
sprintf,
date_format,
bool,
math,
escape,
markdown,
quarto,
other,
linebreak,
output) {
if (inherits(x, "tbl_df")) {
assert_dependency("tibble")
x_is_tibble <- TRUE
x <- as.data.frame(x, check.names = FALSE)
} else {
x_is_tibble <- FALSE
}
if (inherits(x, "tinytable") && !is.null(output)) {
if (!identical(x@output, output)) {
return(x)
}
}
# important for tabulator
if (!is.null(bool) && inherits(x, "tinytable")) {
x@tabulator_format_bool <- TRUE
}
# Check if i contains component names (do this before processing tinytable objects)
if (identical(i, "groupi")) {
components <- "cells"
i <- x@group_index_i
} else if (identical(i, "~groupi")) {
components <- "cells"
i <- setdiff(seq_len(nrow(x)), x@group_index_i)
} else if (is.character(i)) {
components <- i # before wiping i
i <- NULL
} else if (!is.null(i) || !is.null(j)) {
components <- "cells"
} else {
components <- "all"
}
# format_tt() supports vectors
if (isTRUE(check_atomic_vector(x))) {
atomic_vector <- TRUE
if (is.factor(x)) {
x <- as.character(x)
}
ori <- out <- x <- data.frame(tinytable = x, stringsAsFactors = FALSE)
j <- 1
} else if (is.data.frame(x)) {
atomic_vector <- FALSE
ori <- out <- x
} else if (inherits(x, "tinytable")) {
atomic_vector <- FALSE
# if no other format_tt() call has been applied, we ctan have numeric values
out <- x@data_body
ori <- x@data
} else {
stop(
"`x` must be a `tinytable` object, a data frame, or an atomic vector.",
call. = FALSE
)
}
# In sanity_tt(), we fill in missing NULL `j` in the format-specific versions,
# because tabularray can do whole column styling. Here, we need to fill in
# NULL for all formats since this is applied before creating the table.
# nrow(out) because nrow(x) sometimes includes rows that will be added **in the lazy future** by group_tt()
i <- sanitize_i(i, x, lazy = FALSE, calling_function = "format_tt")
j <- sanitize_j(j, x, skip_tabulator_types = TRUE)
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_logical,
inherit_class = "logical",
bool_fn = bool
)
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_date,
inherit_class = "Date",
date_format = date_format
)
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_numeric,
num_suffix = num_suffix,
digits = digits,
num_mark_big = num_mark_big,
num_mark_dec = num_mark_dec,
num_zero = num_zero,
num_fmt = num_fmt,
inherit_class = is.numeric
)
is_other <- function(x) {
!is.numeric(x) && !inherits(x, "Date") && !is.logical(x)
}
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_other,
inherit_class = is_other,
other_fn = other
)
# after other formatting
if (!is.null(sprintf)) {
x <- apply_format(
x = x,
i = i,
j = j,
components = components,
format_fn = format_vector_sprintf,
sprintf_pattern = sprintf
)
}
# Custom functions overwrite all the other formatting, but is before markdown
# before escaping
if (is.function(fn)) {
if (!is.null(components)) {
# Use apply_format for component-specific formatting
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_custom,
components = components,
fn = fn
)
} else {
# Original behavior for cell-specific formatting
for (col in j) {
tmp <- tryCatch(
format_vector_custom(ori[i, col, drop = TRUE], fn),
error = function(e) NULL
)
out[i, col] <- if (length(tmp) > 0) tmp else out[i, col]
}
}
}
# close to last
if (isTRUE(math)) {
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_math,
components = components,
original_data = FALSE,
math = math
)
}
# linebreak before replace and escape
if (!is.null(linebreak)) {
if (inherits(x, "tinytable")) {
output_format <- x@output
} else {
output_format <- NULL
}
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_linebreak,
components = components,
original_data = FALSE,
linebreak = linebreak,
output = output_format
)
}
# replace before escape, otherwise overaggressive removal
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_replace,
components = components,
replace = replace,
original_data = FALSE
)
# escape latex characters
if (!isFALSE(escape)) {
if (isTRUE(escape == "latex")) {
o <- "latex"
} else if (isTRUE(escape == "html")) {
o <- "html"
} else if (isTRUE(escape == "typst")) {
o <- "typst"
} else if (inherits(x, "tinytable")) {
o <- x@output
} else {
o <- FALSE
}
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_escape,
components = components,
original_data = FALSE,
output = o
)
}
# markdown and quarto at the very end
if (isTRUE(markdown)) {
assert_dependency("litedown")
x <- apply_format(
x = x,
i = i,
j = j,
format_fn = format_vector_markdown,
components = components,
original_data = FALSE,
output_format = x@output
)
}
if (isTRUE(quarto)) {
for (col in j) {
x <- format_vector_quarto(i = i, col = col, x = x)
}
}
# output
if (isTRUE(atomic_vector)) {
x <- x[[1]]
}
if (!inherits(x, "tinytable") && x_is_tibble) {
x <- tibble::as_tibble(x)
}
return(x)
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.