R/ranges-bind.R

Defines functions .set_id_var .check_id_var .bind_rng all_integer_ranges all_genomic_ranges bind_ranges interweave

Documented in bind_ranges interweave

#' Interweave a pair of Ranges objects together
#'
#' @param left,right Ranges objects.
#' @param .id When supplied a new column that represents the origin column
#' and is linked to each row of the resulting Ranges object.
#'
#' @details The output of `interweave()` takes pairs of Ranges
#' objects and combines them into a single  Ranges object. If an .id
#' argument is supplied, an origin column with name .id is created indicated which side
#' the resulting Range comes from (eit)
#'
#' @examples
#'gr <- as_granges(data.frame(start = 10:15,
#'                             width = 5,
#'                             seqnames = "seq1",
#'                             strand = c("+", "+", "-", "-", "+", "*")))
#' interweave(flank_left(gr, width = 5L), flank_right(gr, width = 5L))
#' interweave(flank_left(gr, width = 5L), flank_right(gr, width = 5L), .id = "origin")
#' @importFrom S4Vectors zipup Pairs
#' @return a Ranges object
#' @export
#' @rdname ranges-interweave
interweave <- function(left, right, .id = NULL) {
  if (!is.null(.id)) {
    stopifnot(is.character(.id) & length(.id) == 1L)
    mcols(left)[[.id]] <- "left"
    mcols(right)[[.id]] <- "right"
  }
  unlist(zipup(Pairs(left, right)))
}


#' Combine Ranges by concatentating them together
#'
#' @param ... Ranges objects to combine. Each argument can be a Ranges object,
#' or a list of Ranges objects.
#' @param .id Ranges object identifier. When .id is supplied a new column
#' is created that links each row to the original Range object. The contents
#' of the column correspond to the named arguments or the names of the list
#' supplied.
#'
#' @note Currently GRangesList or IRangesList objects are not supported.
#' @return a concatenated Ranges object
#' @importFrom rlang dots_values have_name
#' @rdname ranges-bind
#' @examples
#'gr <- as_granges(data.frame(start = 10:15,
#'                             width = 5,
#'                             seqnames = "seq1"))
#'gr2 <- as_granges(data.frame(start = 11:14,
#'                             width = 1:4,
#'                             seqnames = "seq2"))
#'bind_ranges(gr, gr2)
#'
#'bind_ranges(a = gr, b = gr2, .id = "origin")
#'
#'bind_ranges(gr, list(gr, gr2), gr2)
#'
#'bind_ranges(list(a = gr, b = gr2), c = gr, .id = "origin")
#'
#' @export
#' @importFrom methods as
bind_ranges <- function(..., .id = NULL) {
  x <- unlist(rlang::dots_values(...), recursive = TRUE)
  .bind_rng(x, .id)
}

all_genomic_ranges <- function(x) {
  all(vapply(x, function(x) is(x, "GenomicRanges"), logical(1)))
}

all_integer_ranges <- function(x) {
  all(vapply(x, function(x) is(x, "IntegerRanges"), logical(1)))
}

.bind_rng <- function(x, .id = NULL) {
  if (!(all_genomic_ranges(x) | all_integer_ranges(x))) {
    stop("Cannot bind objects of different classes together, ... must be
         all Ranges objects.", 
         call. = FALSE)
  }
  x <- as(x, "List")
  x <- .check_id_var(x, .id)
  x <- .set_id_var(x, .id)
  x
}

# .check_ranges_list <- function(x, .id = NULL) {
#   if (is(x, "RangesList")) return(unlist(x, recursive = TRUE), .id))
#   x
# }

.check_id_var <- function(x, .id = NULL) {
  if (!is.null(.id)) {
    stopifnot(is.character(.id) & length(.id) == 1L)
    any_empty <-  vapply(x, function(x) length(x) == 0, logical(1))
    any_noname <- rlang::have_name(x)
    if (!all(any_empty | any_noname)) {
      x <- Filter(length, x)
      names(x) <- seq_along(x)
    }
  }
  x
}

.set_id_var <- function(x, .id = NULL) {
  res <- suppressWarnings(unlist(x, use.names = FALSE))
  if (!is.null(.id)) {
    mcols(res)[[.id]] <-  Rle(names(x), lengths(x))
  }
  res
}
sa-lee/plyranges documentation built on April 15, 2024, 12:25 p.m.