R/EStep.R
In RMallow: Fit Multi-Modal Mallows' Models to Ranking Data

Documented in EStep

#' The Expectation step of the EM algorithm.
#' 
#' Assigns each ranking the probability that it belongs to each cluster, given
#' current parameters.
#' 
#' 
#' @param R Current cluster modal sequences.
#' @param r The data of partial or full rankings.
#' @param p The proportion of the data currently assigned to each cluster.
#' @param lambda The lambda parameters from Mallow's model for each cluster.
#' @param G Number of clusters, length(R).
#' @param N Number of rows in the data.
#' @param C Vector of normalizing coefficients for the clusters.
#' @param all.dists For efficiency, provide all of the Kendall distances
#' between each sequence and each cluster mode.
#' @return Matrix where output[i, j] represents the current probability that
#' subject "i" belongs to cluster "j".
#' @author Erik Gregory
#' @references 
#' "Mixtures of distance-based models for ranking data". Thomas 
#' Brendan Murphy & Donal Martin. 1 April 2002. Computational Statistics & 
#' Data Analysis 41 (2003) 645-655.
#' @keywords expectation maximization
EStep <-
function(R, r, p, lambda, G, N, C, all.dists = NULL) {
  # Update z for each subject.
  if(is.null(all.dists)) {
    all.dists <- AllKendall(r, do.call("rbind", R))
  }
  fs <- C*exp(t(-lambda*t(all.dists)))
  z <- t(p*t(fs))
  z <- z/rowSums(z)
  return(z)
}