R/genomic_sequences.R

Defines functions get_sequences

Documented in get_sequences

#' Retrieve Sequences
#'
#' Retrieve sequences for expanded ranges
#'
#' @import tibble
#' @importFrom GenomicRanges GRanges
#' @importFrom Rsamtools FaFile
#' @importFrom Biostrings getSeq
#' @importFrom purrr set_names
#'
#' @param deep_obj dep_tss object
#' @param assembly Path to genome assembly
#'
#' @rdname get_sequences-function
#'
#' @export

get_sequences <- function(deep_obj, assembly) {
        
	## Load the genome assembly.
	genome <- FaFile(assembly)

	## Retrieve the sequences used for genomic encoding.
	genomic_ranges <- deep_obj@ranges$sequence
        genomic_seqs <- genomic_ranges %>%
		getSeq(genome, .) %>%
		as.character %>%
		set_names(NULL)

	genomic_ranges$genomic_seq <- genomic_seqs

	## Retrieve the sequences used for shape encoding.
	shape_ranges <- deep_obj@ranges$shape
	shape_seqs <- genomic_ranges %>%
		getSeq(genome, .) %>%
		as.character %>%
		set_names(NULL)

	shape_ranges$shape_seq <- shape_seqs

	## Return the deep tss object.
	deep_obj@ranges$sequence <- genomic_ranges
	deep_obj@ranges$shape <- shape_ranges

        return(deep_obj)
}
rpolicastro/deepTSSscrubbeR documentation built on March 20, 2020, 5:38 a.m.