R/mrw.R
In diffusr: Network Diffusion Algorithms

# diffusr: network diffusion algorithms in R
#
# Copyright (C) 2016 Simon Dirmeier
#
# This file is part of diffusr.
#
# diffusr is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# diffusr is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with diffusr. If not, see <http://www.gnu.org/licenses/>.


#' Graph diffusion using a Markov random walk
#'
#' @description A Markov Random Walk takes an inital distribution \code{p0}
#' and calculates the stationary distribution of that.
#' The diffusion process is regulated by a restart probability \code{r} which
#' controls how often the MRW jumps back to the initial values.
#'
#' @export
#' @docType methods
#' @rdname random-walk-methods
#'
#' @param p0  an \code{n x p}-dimensional numeric non-negative vector/matrix
#'  representing the starting distribution of the Markov chain
#'  (does not need to sum to one).
#' @param graph  an (\code{n x n})-dimensional numeric non-negative adjacence
#' matrix representing the graph
#' @param r  a scalar between (0, 1). restart probability if a Markov random
#' walk with restart is desired
#' @param thresh  threshold for breaking the iterative computation of the
#'  stationary distribution. If the absolute difference of the distribution at
#'  time point $t-1$ and $t$ is less than \code{thresh}, then the algorithm stops.
#'  If \code{thresh} is not reached before \code{niter}, then the algorithm stops
#'  as well.
#' @param niter  maximal number of iterations for computation of the
#'  Markov chain. If \code{thresh} is not reached, then \code{niter} is used as
#' stop criterion.
#' @param do.analytical  boolean if the stationary distribution shall be
#'  computed solving the analytical solution or rather iteratively
#' @param correct.for.hubs if \code{TRUE} multiplies a correction factor to the
#'  nodes, such that the random walk gets not biased to nodes with high
#'  degree. In that case the original input matrix will be normalized as:
#'  \deqn{ P(j | i) =  1 /degree(i) *  min(1, degree(j)/degree(j))}
#'  \emph{Note that this will not consider edge weights.}
#'
#' @return  returns a list with the following elements
#'  \itemize{
#'   \item p.inf  the stationary distribution as numeric vector
#'   \item transition.matrix the column normalized transition matrix used for the random walk
#'  }
#'
#' @references
#' Tong, H., Faloutsos, C., & Pan, J. Y. (2006),
#' Fast random walk with restart and its applications.\cr \cr
#' Koehler, S., Bauer, S., Horn, D., & Robinson, P. N. (2008),
#' Walking the interactome for prioritization of candidate disease genes.
#' \emph{The American Journal of Human Genetics}\cr \cr
#'
#' @examples
#'  # count of nodes
#'  n <- 5
#'  # starting distribution (has to sum to one)
#'  p0    <- as.vector(rmultinom(1, 1, prob=rep(.2, n)))
#'  # adjacency matrix (either normalized or not)
#'  graph <- matrix(abs(rnorm(n*n)), n, n)
#'  # computation of stationary distribution
#'  pt    <- random.walk(p0, graph)
#'
setGeneric(
  "random.walk",
  function(p0, graph, r=.5,
           niter=1e4, thresh=1e-4, do.analytical=FALSE,
           correct.for.hubs=FALSE)
  {
    standardGeneric("random.walk")
  },
  package="diffusr"
)


#' @rdname random-walk-methods
#' @aliases random.walk,numeric,matrix-method
setMethod(
  "random.walk",
  signature = signature(p0="numeric", graph="matrix"),
  function(p0, graph, r=.5,
           niter=1e4, thresh=1e-4, do.analytical=FALSE,
           correct.for.hubs=FALSE)
  {
    p0 <- as.matrix(p0, ncol=1)
    random.walk(p0, graph, r, niter, thresh, do.analytical, correct.for.hubs)
  }
)

#' @rdname random-walk-methods
#' @aliases random.walk,matrix,matrix-method
setMethod(
  "random.walk",
  signature = signature(p0="matrix", graph="matrix"),
  function(p0, graph, r=.5,
           niter=1e4, thresh=1e-4, do.analytical=FALSE,
           correct.for.hubs=FALSE)
  {
    stopifnot(length(r) == 1)
    stopifnot(is.logical(correct.for.hubs))
    .check.restart(r)
    .check.starting.matrix(p0)
    .check.graph(graph, p0)

    if (any(diag(graph) != 0))
    {
      message("setting diag of graph to zero")
      diag(graph) <- 0
    }
    if (correct.for.hubs) graph <- hub.correction(graph)
    stoch.graph <- normalize.stochastic(graph)
    if(!.is.ergodic(stoch.graph))
      stop(paste("the provided graph has more than one component.",
                 "It is likely not ergodic."))

    l <- list(
       p.inf=mrwr_(normalize.stochastic(p0),
                   stoch.graph, r, thresh, niter, do.analytical),
       transition.matrix=stoch.graph)

    l
  }
)