R/get_selfhyb_subseq.R

Defines functions show_selfhyb_counts show_selfhyb_lengths get_selfhyb_subseq .buildEl

Documented in get_selfhyb_subseq show_selfhyb_counts show_selfhyb_lengths

.buildEl = function(s, r, minlen) {
    both = c(s, r)
    slen = nchar(s, type="chars")
    autoseqs = .Call(.longest_common_substring, both)
    if (all(nchar(autoseqs) < minlen))
        return(list())
    names(autoseqs) = autoseqs
    selfhybs = lapply(autoseqs,
      function(x) {
          locL = gregexpr(x, both, fixed=TRUE)
          starts = as.integer(locL[[1]]) # remove match.length attr
          mlen = attr(locL[[2]], "match.length")
          rcstarts = slen - (as.integer(locL[[2]]) + mlen - 1) + 1
          list(starts=starts, rcstarts=rcstarts)
          ## FIXME: add gap calculation here
      })
    ## FIXME: add base count/freq
    selfhybs
}

get_selfhyb_subseq = function(seq, minlen, type=c("RNA", "DNA")) {
    type = match.arg(type)
    revcompfun = switch(type,
      RNA=RNAStringSet,
      DNA=DNAStringSet,
      stop("type must be RNA or DNA"))
    rcSeq = reverseComplement(revcompfun(seq))
    rcSeq = as.character(rcSeq)
    ans = mapply(.buildEl, seq, rcSeq, minlen, USE.NAMES=FALSE)
    names(ans) = names(seq)
    ans
}

show_selfhyb_lengths = function(L) {
    lens = sapply(L, function(x) {
        if (length(x))
          nchar(names(x)[1], type="char")
        else
          0
    })
    table(lens, dnn="SHS length")
}

show_selfhyb_counts = function(L) {
    cnts = sapply(L, length)
    table(cnts, dnn="SHS counts")
}

Try the microRNA package in your browser

Any scripts or data that you put into this service are public.

microRNA documentation built on Nov. 8, 2020, 7:50 p.m.