R/api_compile.R
In jti: Junction Tree Inference

Documented in compile compile.cpt_list cpt_list cpt_list.data.frame cpt_list.list dim_names dim_names.charge dim_names.cpt_list dim_names.jt get_graph get_graph.charge get_graph.cpt_list get_triang_graph has_inconsistencies has_inconsistencies.charge has_inconsistencies.jt names.charge names.cpt_list names.jt pot_list pot_list.data.frame print.charge print.cpt_list

#' Conditional probability list
#'
#' A check and conversion of cpts to be used in the junction tree algorithm
#'
#' @param x Either a named list with cpts in form of array-like object(s)
#' where names must be the child node or a \code{data.frame}
#' @param g Either a directed acyclic graph (DAG) as an igraph object or a
#' decomposable graph as an igraph object. If \code{x} is a list,
#' \code{g} must be \code{NULL}. The procedure then deduce the graph
#' from the conditional probability tables.
#' @examples
#'
#' library(igraph)
#' el <- matrix(c(
#' "A", "T",
#' "T", "E",
#' "S", "L",
#' "S", "B",
#' "L", "E",
#' "E", "X",
#' "E", "D",
#' "B", "D"),
#'  nc = 2,
#'  byrow = TRUE
#' )
#' 
#' g <- igraph::graph_from_edgelist(el) 
#' cl <- cpt_list(asia, g)
#' 
#' print(cl)
#' dim_names(cl)
#' names(cl)
#' plot(get_graph(cl))
#' @export
cpt_list <- function(x, g = NULL) UseMethod("cpt_list")


#' @rdname cpt_list
#' @export
cpt_list.list <- function(x, g = NULL) { 

  if (!is_named_list(x)) {
    stop(
      "x must be a named list of cpts. ",
      "A name should be the name of the corresponding child node."
    )
  }

  if (!is.null(g)) stop("g must be 'NULL'")

  dim_names <- list()
  
  y <- lapply(seq_along(x), function(i) {
    spar <- sparta::as_sparta(x[[i]])
    child <- names(parents)[i]
    # This ensures, that the CPTs and dim_names have the same ordering of the lvls!
    dim_names <<- push(dim_names, attr(spar, "dim_names"))
    spar
  })

  names(y)  <- names(x)
  dim_names <- unlist(dim_names, FALSE)
  dim_names <- dim_names[unique(names(dim_names))]

  g <- graph_from_cpt_list(y)
  if (!igraph::is_dag(g)) stop("The cpts does not induce an acyclic graph.")

  structure(
    y,
    nodes     = names(x),
    dim_names = dim_names,
    parents   = parents_cpt_list(y),
    graph     = g,
    class     = c("bn", "cpt_list", "list")
  )
}


#' @rdname cpt_list
#' @export
cpt_list.data.frame <- function(x, g) {

  if (!igraph::is.igraph(g)) stop("g must be an igraph object")

  is_dag <- igraph::is_dag(g)
  if (!is_dag) {
    if (!igraph::is_chordal(g)$chordal) {
      stop("undirected graphs must be be decomposable", call. = FALSE)
    }
  }

  parents <- if (is_dag) {
    parents_igraph(g)
  } else {
    rip(as_adj_lst(igraph::as_adjacency_matrix(g, sparse = FALSE)), check = FALSE)$P 
  }

  dns  <- list()

  
  y <- lapply(seq_along(parents), function(i) {
    child <- names(parents)[i]
    pars  <- parents[[i]]
    spar <- sparta::as_sparta(x[, c(child, pars), drop = FALSE])    
    spar <- sparta::as_cpt(spar, pars)
    # This ensures, that the CPTs and dim_names have the same ordering of the lvls!
    dns <<- push(dns, sparta::dim_names(spar))
    spar
  })

  dns <- unlist(dns, FALSE)
  dns <- dns[unique(names(dns))]
  
  structure(
    structure(y, names = names(parents)),
    nodes     = names(parents),
    dim_names = dns,
    parents   = parents,
    graph     = g,
    class     = c(ifelse(is_dag, "bn", "mrf"), "cpt_list", "list")
  )
}

#' A check and extraction of clique potentials from a Markov random field
#' to be used in the junction tree algorithm
#'
#' @param x Character \code{data.frame}
#' @param g A decomposable Markov random field as an igraph object.
#' @examples
#'
#' # Typically one would use the ess package:
#' # library(ess)
#' # g  <- ess::fit_graph(derma)
#' # pl <- pot_list(derma, ess::as_igraph(g))
#' # pl
#'
#' # Another example
#' g <- igraph::sample_gnm(ncol(asia), 12)
#' while(!igraph::is.chordal(g)$chordal) g <- igraph::sample_gnm(ncol(asia), 12, FALSE)
#' igraph::V(g)$name <- colnames(asia)
#' plot(g)
#' pot_list(asia, g)
#' 
#' @export
pot_list <- function(x, g) UseMethod("pot_list")

#' @rdname pot_list
#' @export
pot_list.data.frame <- function(x, g) cpt_list(x, g)


#' Compile information
#'
#' Compiled objects are used as building blocks for junction tree inference
#'
#' @param x An object returned from \code{cpt_list} (baeysian network) or
#' \code{pot_list} (decomposable markov random field)
#' @param evidence A named vector. The names are the variabes and the elements
#' are the evidence.
#' @param root_node A node for which we require it to live in the root
#' clique (the first clique).
#' @param joint_vars A vector of variables for which we require them
#' to be in the same clique. Edges between all these variables are added
#' to the moralized graph.
#' @param tri The optimization strategy used for triangulation if x originates
#' from a Baeysian network. One of
#'  * 'min_fill'
#'  * 'min_rfill'
#'  * 'min_sp'
#'  * 'min_ssp'
#'  * 'min_lsp'
#'  * 'min_lssp'
#'  * 'min_elsp'
#'  * 'min_elssp'
#'  * 'min_nei'
#'  * 'minimal'
#'  * 'alpha'
#' @param pmf_evidence A named vector of frequencies of the expected
#' missingness of a variable. Variables with frequencies of 1 can be
#' neglected; these are inferrred. A value of 0.25 means, that the
#' given variable is expected to be missing (it is not a evidence node)
#' in one fourth of the future cases. Relevant for \code{tri} methods
#' 'min_elsp' and 'min_elssp'.
#' @param alpha Character vector. A permutation of the nodes
#' in the graph. It specifies a user-supplied eliminination ordering for
#' triangulation of the moral graph.
#' @param initialize_cpts \code{TRUE} if the CPTs should be initialized,
#' i.e. multiplied together to form the clique potentials. If FALSE,
#' the \code{compile}d object will save the triangulation and other
#' information that needs only bee computed once. Herafter, it is
#' possible to enter evidence into the CPTs, using \code{set_evidence},
#' saving a lot of computations. 
#'
#' @md
#' 
#' @details The Junction Tree Algorithm performs both a forward and inward
#' message pass (collect and distribute). However, when the forward
#' phase is finished, the root clique potential is guaranteed to be the
#' joint pmf over the variables involved in the root clique. Thus, if
#' it is known in advance that a specific variable is of interest, the
#' algortihm can be terminated after the forward phase. Use the \code{root_node}
#' to specify such a variable and specify \code{propagate = "collect"} in
#' the juntion tree algortihm function \code{jt}.
#'
#' Moreover, if interest is in some joint pmf for variables that end up
#' being in different cliques these variables must be specified in advance
#' using the \code{joint_vars} argument. The compilation step then
#' adds edges between all of these variables to ensure that at least one
#' clique contains all of them.
#'
#' Evidence can be entered either at compile stage
#' or after compilation. Hence, one can also combine
#' evidence from before compilation with evidence
#' after compilation. Before refers to entering
#' evidence in the 'compile' function and after
#' refers to entering evidence in the 'jt' function.
#'
#' Finally, one can either use a Bayesian network or a decomposable
#' Markov random field (use the \code{ess} package to fit these). Bayesian
#' networks must be constructed with \code{cpt_list} and decomposable MRFs
#' can be constructed with both \code{pot_list} and \code{cpt_list}. However,
#' \code{pot_list} is just an alias for \code{cpt_list} which handles both
#' cases internally.
#' 
#' @examples
#' cptl <- cpt_list(asia2)
#' cp1  <- compile(cptl, evidence = c(bronc = "yes"), joint_vars = c("bronc", "tub"))
#' print(cp1)
#' names(cp1)
#' dim_names(cp1)
#' plot(get_graph(cp1))
#' @export
compile <- function(x,
                    evidence        = NULL,
                    root_node       = "",
                    joint_vars      = NULL,
                    tri             = "min_fill",
                    pmf_evidence    = NULL,
                    alpha           = NULL,
                    initialize_cpts = TRUE
                    ) {
  UseMethod("compile")
}

#' @rdname compile
#' @export
compile.cpt_list <- function(x,
                             evidence        = NULL,
                             root_node       = "",
                             joint_vars      = NULL,
                             tri             = "min_fill",
                             pmf_evidence    = NULL,
                             alpha           = NULL,
                             initialize_cpts = TRUE
                             ) {
  
  check_params_compile(tri, pmf_evidence, alpha, names(x), root_node)

  g       <- attr(x, "graph")
  parents <- attr(x, "parents")

  gm      <- moralize_igraph(g, parents)
  if (!is.null(joint_vars)) gm <- add_joint_vars_igraph(gm, joint_vars)

  # Note here: if sparse = TRUE, the run time explodes! Wonder why...
  M  <- igraph::as_adjacency_matrix(gm, sparse = FALSE)

  tri_obj <- new_triang(tri, M, .map_int(dim_names(x), length), pmf_evidence, alpha)
  gmt     <- .triang(tri_obj)
  adj_lst <- as_adj_lst(gmt)
  cliques <- construct_cliques(adj_lst)

  # cliques_int is needed to construct the junction tree in new_jt -> new_schedule
  dimnames(gmt) <- lapply(dimnames(gmt), function(x) 1:nrow(gmt))
  adj_lst_int   <- as_adj_lst(gmt)
  # root_node_int <- ifelse(root_node != "", as.character(match(root_node, names(adj_lst))), "")
  cliques_int   <- lapply(rip(adj_lst_int)$C, as.integer)

  inc <- new.env()
  inc$inc <- FALSE

  if (!is.null(evidence)) {
    if (!valid_evidence(attr(x, "dim_names"), evidence)) {
      stop("Evidence is not on correct form", call. = FALSE)
    }
    # x looses its attributes in set_evidence
    att_ <- attributes(x)
    x    <- set_evidence_(x, evidence, inc)
    attributes(x) <- att_
  }
  
  charge  <- if (initialize_cpts) {
    new_charge(x, cliques, parents)
  } else {
    list(cpts = x, parents = parents)
  }
  
  schedule <- new_schedule(cliques, cliques_int, root_node, joint_vars)
  
  structure(
    list(charge = charge, cliques = cliques, schedule = schedule),
    root_node        = root_node,
    joint_vars       = joint_vars,
    dim_names        = attr(x, "dim_names"),
    evidence         = evidence,
    cliques_int      = cliques_int,
    inconsistencies  = inc$inc,
    graph            = g,
    triang_graph     = gmt,
    cpts_initialized = initialize_cpts,
    class            = c(ifelse(inherits(x, "bn"), "bn", "mrf"), "charge", "list")
  )
}

#' Various getters
#'
#' Getter methods for \code{cpt_list}, \code{pot_list}, \code{charge}
#' and \code{jt} objects
#' 
#' @param x \code{cpt_list}, \code{pot_list}, \code{charge} or \code{jt}

#' @rdname getters
#' @export
dim_names <- function(x) UseMethod("dim_names")

#' @rdname getters
#' @export
has_inconsistencies <- function(x) UseMethod("has_inconsistencies")

#' @rdname getters
#' @export
dim_names.cpt_list <- function(x) attr(x, "dim_names")

#' @rdname getters
#' @export
names.cpt_list <- function(x) attr(x, "nodes")

#' @rdname getters
#' @export
dim_names.charge <- function(x) attr(x, "dim_names")

#' @rdname getters
#' @export
names.charge <- function(x) names(attr(x, "dim_names"))

#' @rdname getters
#' @export
has_inconsistencies.charge <- function(x) attr(x, "inconsistencies")

#' @rdname getters
#' @export
dim_names.jt <- function(x) attr(x, "dim_names")

#' @rdname getters
#' @export
names.jt <- function(x) names(attr(x, "dim_names"))

#' @rdname getters
#' @export
has_inconsistencies.jt <- function(x) attr(x, "inconsistencies")


#' Get graph
#'
#' Retrieve the graph
#'
#' @param x \code{cpt_list} or a compiled object
#' @return A graph as an \code{igraph} object

#' @rdname get-graph
#' @export
get_graph <- function(x) UseMethod("get_graph")

#' @rdname get-graph
#' @export
get_graph.charge <- function(x) attr(x, "graph")

#' @rdname get-graph
#' @export
get_graph.cpt_list <- function(x) attr(x, "graph")


#' Get triangulated graph
#'
#' Retrieve the triangulated graph from
#'
#' @param x A compiled object
#' @return A triangulated graph as a neibor matrix

#' @rdname get-triang-graph
#' @export
get_triang_graph <- function(x) UseMethod("get_triang_graph")

get_triang_graph.charge <- function(x) x$triang_graph

#' A print method for cpt lists
#'
#' @param x A \code{cpt_list} object
#' @param ... For S3 compatability. Not used.
#' @seealso \code{\link{compile}}
#' @export
print.cpt_list <- function(x, ...) {
  cls <- paste0("<", paste0(class(x), collapse = ", "), ">")
  nn  <- length(names(x))
  cat(" List of CPTs",
    "\n -------------------------\n")

  for (child in names(x)) {
    parents <- setdiff(names(sparta::dim_names(x[[child]])), child)
    if (neq_empt_chr(parents)) {
      cat("  P(", child, "|" , paste(parents, collapse = ", "), ")\n")      
    } else {
      cat("  P(", child, ")\n")
    }
  }
  
  cat(paste0("\n  ", cls),
    "\n -------------------------\n"
  )
}

#' A print method for compiled objects
#'
#' @param x A compiled object
#' @param ... For S3 compatability. Not used.
#' @seealso \code{\link{jt}}
#' @export
print.charge <- function(x, ...) {

  cls <- paste0("<", paste0(class(x), collapse = ", "), ">")
  nn  <- length(names(x))
  clique_sizes <- .map_int(x$cliques, length)
  max_C <- max(clique_sizes)
  min_C <- min(clique_sizes)
  avg_C <- mean(clique_sizes)

  init  <- attr(x, "cpts_initialized")
  init_msg <- ifelse(init, " (cpts initialized)", " (cpts not initialized)")
  dashes   <- paste0("\n ------------------------------------", ifelse(init, "", "----"))
  
  cat(" Compiled network", init_msg,
    dashes,
    "\n  Nodes:", nn,
    "\n  Cliques:", length(x$cliques),
    "\n   - max:", max_C,
    "\n   - min:", min_C,
    "\n   - avg:", round(avg_C, 2)
  )

  e <- attr(x, "evidence")
  inc <- attr(x, "inconsistencies")
  if (!is.null(e)) {
    if (inc) cat("\n  Evidence: (inconsistencies)") else cat("\n  Evidence:")
    for (i in seq_along(e)) {
      cat(
        "\n   -", paste0(names(e[i]), ":"), unname(e[i])
      )
    }
  }

  cat(paste0("\n  ", cls), dashes, "\n") 
}


# --------------------------------------
# OBSOLETE CODE FOR MARKOV RANDOM FIELDS
# --------------------------------------

# #' A check and extraction of clique potentials from a Markov random field
# #' to be used in the junction tree algorithm
# #'
# #' @param x Character \code{data.frame}
# #' @param g A decomposable Markov random field as an igraph object.
# #' @examples
# #'
# #' # Typically one would use the ess package:
# #' # library(ess)
# #' # g  <- ess::fit_graph(derma)
# #' # pl <- pot_list(derma, ess::as_igraph(g))
# #' # pl
# #'
# #' # Another example
# #' g <- igraph::sample_gnm(ncol(asia), 12)
# #' while(!igraph::is.chordal(g)$chordal) g <- igraph::sample_gnm(ncol(asia), 12, FALSE)
# #' igraph::V(g)$name <- colnames(asia)
# #' plot(g)
# #' pot_list(asia, g)
# #' 
# #' @export
# pot_list <- function(x, g) UseMethod("pot_list")

# #' @rdname pot_list
# #' @export
# pot_list.data.frame <- function(x, g) {

#   if (!igraph::is.igraph(g)) stop("g must be an igraph object", call. = FALSE)
#   adj_lst <- as_adj_lst(igraph::as_adjacency_matrix(g, sparse = FALSE))

#   rip_ <- rip(adj_lst, check = TRUE)
#   cliques <- rip_$C
#   separators <- rip_$S
#   N <- nrow(x)

#   names(cliques) <- paste("C", 1:length(cliques), sep = "")
#   names(separators) <-paste("S", 1:length(separators), sep = "")
#   dns <- list()

#   clique_tabs <- lapply(seq_along(cliques), function(i) {
#     clique <- cliques[[i]]
#     spar <- sparta::as_sparta(x[, clique, drop = FALSE])
#     spar <- sparta::div(spar, N)
#     dns <<- push(dns, sparta::dim_names(spar))
#     spar
#   })

#   separator_tabs <- lapply(seq_along(separators), function(i) {
#     separator <- separators[[i]]
#     if (is.null(separator)) return(NULL)
#     spar <- sparta::as_sparta(x[, separator, drop = FALSE])
#     # NOTE: # Can be unstable for small values in spar?
#     # Maybe just deprecate this function all together and resort to cpt_list
#     spar <- sparta::div(spar, N)
#     sparta::div(1, spar)
#   })

#   clique_tabs[[1]] <- sparta::div(clique_tabs[[1]], N)

#   # Assign each sep to a clique
#   for (sep in separator_tabs) {
#     if (is.null(sep)) next
#     idx <- .map_lgl(clique_tabs, function(ct) all(names(sep) %in% names(ct)))
#     cl_idx <- which(idx)[1L]
#     clique_tabs[[cl_idx]] <- sparta::mult(clique_tabs[[cl_idx]], sep)
#   }

#   dns <- unlist(dns, FALSE)
#   dns <- dns[unique(names(dns))]
  
#   structure(
#     structure(clique_tabs, names = names(cliques)),
#     nodes     = colnames(x),
#     cliques   = cliques,
#     dim_names = dns,
#     graph     = g,
#     class     = c("pot_list", "list")
#   )
# }


# #' @rdname compile
# #' @export
# compile.pot_list <- function(x,
#                              evidence       = NULL,
#                              root_node      = "",
#                              joint_vars     = NULL,
#                              tri            = "min_fill",
#                              pmf_evidence   = NULL,
#                              alpha          = NULL
#                              ) {

#   check_params_compile(tri, pmf_evidence, alpha, names(x), root_node)
  
#   g       <- attr(x, "graph")
#   gmat    <- igraph::as_adjacency_matrix(g, sparse = FALSE)
#   adj_lst <- as_adj_lst(gmat)
#   cliques <- attr(x, "cliques")

#   # cliques_int is needed to construct the junction tree in new_jt -> new_schedule
#   dimnames(gmat) <- lapply(dimnames(gmat), function(x) 1:nrow(gmat))
#   adj_lst_int   <- as_adj_lst(gmat)
#   # root_node_int <- ifelse(root_node != "", as.character(match(root_node, names(adj_lst))), "")
#   cliques_int   <- lapply(rip(adj_lst_int)$C, as.integer)

#   inc <- new.env()
#   inc$inc <- FALSE
#   if (!is.null(evidence)) {
#     if (!valid_evidence(attr(x, "dim_names"), evidence)) {
#       stop("Evidence is not on correct form", call. = FALSE)
#     }
#     # x looses its attributes in set_evidence
#     att_ <- attributes(x)
#     x    <- set_evidence_(x, evidence, inc)
#     attributes(x) <- att_
#   }

#   charge  <- new_charge_pot(x)
#   structure(
#     list(charge   = charge, cliques = cliques),
#     root_node     = root_node,
#     joint_vars    = joint_vars,
#     dim_names     = attr(x, "dim_names"),
#     evidence      = evidence,
#     graph         = g,
#     cliques_int   = cliques_int,
#     inconsistencies = inc$inc,
#     class         = c("charge", "list")
#   )
# }