# RNAseqFunctions: RNA sequencing functions for the Enge lab

#' nTopVar
#'
#' Facilitates gene selection using variance.
#'
#' Returns the index for the n genes (rows) with the maximum
#' variance in the counts object. Counts per million (CPM) should be used for
#' the calculation.
#'
#' @name nTopVar
#' @rdname nTopVar
#' @aliases nTopVar
#' @param cpm matrix; Matrix containing cpm values.
#' @param n Number of genes to select.
#' @param safe logical; Should input and output checks be on?
#' @return A numeric vector containing the indices of selected genes.
#' @author Jason T. Serviss
#' @keywords nTopVar
#'
NULL

#' @rdname nTopVar
#' @importFrom stats var
#' @importFrom matrixStats rowVars
#' @importFrom Rfast Order
#' @export

nTopVar <- function(cpm, n, safe = TRUE) {
  # Select the n rows (genes) of `cpm` with the highest variance.
  #
  # cpm:  matrix of cpm values, genes in rows.
  # n:    number of genes to select.
  # safe: when TRUE, run the package's input/output checks
  #       (.matrixCheckingAndCoercion, .checkNarg, .check0range; these helpers
  #       are not defined in this file).
  #
  # Returns the row indices of the selected genes, ordered from highest to
  # lowest variance.
  if (safe) {
    cpm <- .matrixCheckingAndCoercion(cpm)
    n <- .checkNarg(n, cpm)
  }

  # Per-row variance across all columns.
  row_var <- matrixStats::rowVars(cpm)
  if (safe) .check0range(row_var)

  # Row indices sorted by decreasing variance.
  ranked <- Order(row_var, descending = TRUE, stable = TRUE)

  # seq_len() rather than 1:n: 1:0 expands to c(1, 0) and would return one
  # gene when none was requested. Positions beyond the number of rows are
  # dropped so the result never contains NA indices (nothing validates n when
  # safe = FALSE).
  idx <- seq_len(n)
  ranked[idx[idx <= length(ranked)]]
}

#' nTopMax
#'
#' Facilitates gene selection prior to unsupervised clustering.
#'
#' Returns the index for the n genes (rows) with the maximum
#' expression in the cpm matrix. The per-gene maximum across all
#' columns is used for the calculation.
#'
#' @name nTopMax
#' @rdname nTopMax
#' @aliases nTopMax
#' @param cpm matrix; Matrix containing cpm values.
#' @param n integer; Number of genes to select.
#' @param safe logical; Should input and output checks be on?
#' @return A numeric vector containing the indices of selected genes.
#' @author Jason T. Serviss
#' @keywords nTopMax
#'
NULL

#' @rdname nTopMax
#' @importFrom matrixStats rowMaxs
#' @importFrom Rfast Order
#' @export

nTopMax <- function(cpm, n, safe = TRUE) {
  # Select the n rows (genes) of `cpm` with the highest maximum value.
  #
  # cpm:  matrix of cpm values, genes in rows.
  # n:    number of genes to select.
  # safe: when TRUE, run the package's input/output checks
  #       (.matrixCheckingAndCoercion, .checkNarg, .check0range; these helpers
  #       are not defined in this file).
  #
  # Returns the row indices of the selected genes, ordered from highest to
  # lowest row maximum.
  if (safe) {
    cpm <- .matrixCheckingAndCoercion(cpm)
    n <- .checkNarg(n, cpm)
  }

  # Per-row maximum across all columns.
  row_max <- matrixStats::rowMaxs(cpm)
  if (safe) .check0range(row_max)

  # Row indices sorted by decreasing maximum.
  ranked <- Order(row_max, descending = TRUE, stable = TRUE)

  # seq_len() rather than 1:n: 1:0 expands to c(1, 0) and would return one
  # gene when none was requested. Positions beyond the number of rows are
  # dropped so the result never contains NA indices (nothing validates n when
  # safe = FALSE).
  idx <- seq_len(n)
  ranked[idx[idx <= length(ranked)]]
}

#' nTopDeltaCV
#'
#' Selects informative genes by fitting a support-vector regression to the
#' coefficient of variation (CV) as a function of the mean, and selecting genes
#' having the greatest offset from the fitted curve; this would correspond to
#' genes with higher-than-expected variance. Adapted from the Linnarsson lab
#' Python implementation:
#' https://github.com/linnarsson-lab/cytograph/blob/master/cytograph/feature_selection.py.
#' Note that this displays a tendency to prioritize lowly expressed genes.
#'
#' @name nTopDeltaCV
#' @rdname nTopDeltaCV
#' @author Jason T. Serviss
#' @param cpm matrix; Matrix containing cpm values.
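#' @param n Number of genes to select.
#' @return A named numeric vector holding the scores (log2 CV minus the value
#'   fitted by the regression) of the top-ranked genes, sorted in decreasing
#'   order and named by the row names of \code{cpm}.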
#' @keywords nTopDeltaCV
#'
#'
#' @export
NULL

#' @importFrom e1071 svm
#' @importFrom matrixStats rowMeans2 rowSds
#' @importFrom stats predict

nTopDeltaCV <- function(cpm, n) {
  # Rank genes by how far their log2 coefficient of variation (CV) lies above
  # an SVM fit of log2 CV on log2 mean, and return the top n.
  #
  # cpm: matrix of cpm values, genes in rows.
  # n:   number of genes to select.
  #
  # Returns a named numeric vector of scores sorted in decreasing order, named
  # by rownames(cpm). It holds at most n entries; fewer when fewer genes pass
  # the mean > 0 and sd > 0 filter.
  cpm <- .matrixCheckingAndCoercion(cpm)
  n <- .checkNarg(n, cpm)

  # Rows with a positive total; used below to zero the score of all others.
  expressed <- matrixStats::rowSums2(cpm) > 0
  gene_mean <- matrixStats::rowMeans2(cpm)
  # Named gene_sd rather than sd so stats::sd is not masked inside the function.
  gene_sd <- matrixStats::rowSds(cpm)

  # CV and its log2 are only computed for rows with positive mean and sd.
  keep <- gene_mean > 0 & gene_sd > 0
  cv <- gene_sd[keep] / gene_mean[keep]

  log2_m <- log2(gene_mean[keep])
  log2_cv <- log2(cv)

  # gamma is scaled by the number of retained genes.
  svr_gamma <- 1000 / length(gene_mean[keep])
  modelsvm <- svm(log2_cv ~ log2_m, gamma = svr_gamma)

  # Offset of each gene from the fitted curve.
  score <- log2_cv - predict(modelsvm, log2_m)
  score <- score * expressed[keep]
  names(score) <- rownames(cpm)[keep]

  ranked <- sort(score, decreasing = TRUE)

  # n was checked against cpm, but only the filtered genes have a score.
  # Indexing with 1:n would pad the result with NA values (and NA names) when
  # n exceeds the number of scored genes, and 1:0 would return one gene.
  idx <- seq_len(n)
  ranked[idx[idx <= length(ranked)]]
}

martinenge/RNAseqFunctions documentation built on May 28, 2019, 3:10 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

martinenge/RNAseqFunctions
RNA sequencing functions for the Enge lab

R/featureSelectionFuns.R
In martinenge/RNAseqFunctions: RNA sequencing functions for the Enge lab

R Package Documentation

Browse R Packages

We want your feedback!

martinenge/RNAseqFunctions RNA sequencing functions for the Enge lab

R/featureSelectionFuns.R In martinenge/RNAseqFunctions: RNA sequencing functions for the Enge lab

R Package Documentation

Browse R Packages

We want your feedback!

martinenge/RNAseqFunctions
RNA sequencing functions for the Enge lab

R/featureSelectionFuns.R
In martinenge/RNAseqFunctions: RNA sequencing functions for the Enge lab