R/getDupeSeq.R

Defines functions getDupeSeq

Documented in getDupeSeq

#' helper function for findDupes
#' 
#' @param duperow the row
#' 
#' @return  the sequence for that duplicated entry
#' @importFrom Rsamtools scanFaIndex FaFile
#' @importFrom Biostrings getSeq
#' @importFrom GenomeInfoDb seqnames
#' @export
getDupeSeq <- function(duperow) { 
  seqname <- duperow[1]
  fasta <- duperow[2]
  namedGr <- function(gr) { 
    names(gr) <- seqnames(gr)
    return(gr) 
  }
  faFile <- FaFile(fasta)
  gr <- namedGr(scanFaIndex(faFile))[seqname]
  as.character(getSeq(faFile, gr))
}
arcolombo/TxDbLite documentation built on July 10, 2020, 12:27 a.m.