R/shards_lazy.R

Defines functions `[[.shard_descriptor_lazy` `[.shard_descriptor_lazy` length.shard_descriptor_lazy print.shard_descriptor_lazy .lazy_shard_at shards_lazy

Documented in length.shard_descriptor_lazy print.shard_descriptor_lazy

# Lazy shard descriptor for contiguous shards.
#
# Used by shm_queue dispatch mode to avoid materializing a giant list of shard
# descriptors on the master.

shards_lazy <- function(n, block_size) {
  n <- as.integer(n)
  block_size <- as.integer(block_size)
  if (is.na(n) || n < 1L) stop("n must be >= 1", call. = FALSE)
  if (is.na(block_size) || block_size < 1L) stop("block_size must be >= 1", call. = FALSE)

  num_shards <- as.integer(ceiling(n / block_size))

  structure(
    list(
      n = n,
      block_size = block_size,
      strategy = "contiguous_lazy",
      num_shards = num_shards
    ),
    class = c("shard_descriptor_lazy", "shard_descriptor")
  )
}

.lazy_shard_at <- function(x, i) {
  i <- as.integer(i)
  if (is.na(i) || i < 1L || i > x$num_shards) stop("shard index out of range", call. = FALSE)
  start <- (i - 1L) * x$block_size + 1L
  end <- min(i * x$block_size, x$n)
  list(id = i, start = start, end = end, idx = start:end, len = end - start + 1L)
}

#' Print a shard_descriptor_lazy Object
#'
#' @param x A \code{shard_descriptor_lazy} object.
#' @param ... Further arguments (ignored).
#' @return The input \code{x}, invisibly.
#' @examples
#' sh <- shards(100, block_size = 25)
#' print(sh)
#' @export
print.shard_descriptor_lazy <- function(x, ...) {
  cat("shard descriptor (lazy)\n")
  cat("  Items:", format(x$n, big.mark = ","), "\n")
  cat("  Block size:", format(x$block_size, big.mark = ","), "\n")
  cat("  Strategy:", x$strategy, "\n")
  cat("  Shards:", x$num_shards, "\n")
  invisible(x)
}

#' Length of a shard_descriptor_lazy Object
#'
#' @param x A \code{shard_descriptor_lazy} object.
#' @return An integer scalar giving the number of shards.
#' @examples
#' sh <- shards(100, block_size = 25)
#' length(sh)
#' @export
length.shard_descriptor_lazy <- function(x) {
  x$num_shards
}

#' Subset a shard_descriptor_lazy Object
#'
#' @param x A \code{shard_descriptor_lazy} object.
#' @param i Index or indices.
#' @return A subset of the object.
#' @examples
#' sh <- shards(100, block_size = 25)
#' sh[1:2]
#' @export
`[.shard_descriptor_lazy` <- function(x, i) {
  lapply(i, function(j) .lazy_shard_at(x, j))
}

#' Extract a Single Shard from a shard_descriptor_lazy Object
#'
#' @param x A \code{shard_descriptor_lazy} object.
#' @param i Index.
#' @return A subset of the object.
#' @examples
#' sh <- shards(100, block_size = 25)
#' sh[[1]]
#' @export
`[[.shard_descriptor_lazy` <- function(x, i) {
  .lazy_shard_at(x, i)
}

Try the shard package in your browser

Any scripts or data that you put into this service are public.

shard documentation built on April 3, 2026, 9:08 a.m.