# R/SimulationHandler.R
# In epizootic: Spatially Explicit Population Models of Disease Transmission in Wildlife

#' R6 class representing a simulation handler.
#'
#' @description
#' [`R6::R6Class`] class to represent a handler for running multiple model
#' simulations and saving results. This simulation manager bears some
#' resemblance to the [`poems::SimulationManager`] in \code{poems}, but differs
#' in that it can handle multiple dispersal generators, uses a different engine
#' for parallelization, handles errors differently, and has a different default
#' data format (\code{.qs}).
#'
#' @importFrom foreach foreach
#' @importFrom foreach %dopar%
#' @importFrom doParallel registerDoParallel
#' @importFrom doParallel stopImplicitCluster
#' @importFrom qs qsave
#' @importFrom R6 R6Class
#' @export SimulationHandler

SimulationHandler <- R6Class("SimulationHandler",
  inherit = GenericManager,
  public = list(
    ## Attributes ##

    # object_generator [inherited]

    #' @field attached A list of dynamically attached attributes (name-value
    #' pairs).
    attached = list(),

    ## Methods ##

    # Inherited methods (from GenericClass & GenericManager) #
    #   new_clone(...)
    #   get_attribute(param)
    #   get_message_sample(status_message, sample_index)
    #   get_results_filename(sample_index)

    # Overwritten/overridden methods #

    #' @description
    #' Constructor. Stores the model template, makes sure a model simulator is
    #' present, and hands every remaining argument (e.g. \emph{sample_data},
    #' \emph{generators}, \emph{model_simulator}, \emph{parallel_cores},
    #' \emph{results_dir}, \emph{results_filename_attributes}) to the parent
    #' class initializer.
    #' @param model_template A SimulationModel (or inherited class) object with
    #'   parameters common to all simulations.
    #' @param ... Parameters listed individually.
    initialize = function(model_template = NULL, ...) {
      self$model_template <- model_template
      # A default simulator is only built when the caller did not pass one
      simulator_supplied <- "model_simulator" %in% names(list(...))
      if (!simulator_supplied) {
        self$model_simulator <- if (is.null(model_template)) {
          ModelSimulator$new()
        } else {
          ModelSimulator$new(simulation_function = model_template$simulation_function)
        }
      }
      super$initialize(...)
    },

    #' @description
    #' Summarizes the simulation log and writes it to a text file.
    #'
    #' Takes the list of per-sample log entries produced by the `run` method,
    #' works out which samples succeeded, which failed, and which carry
    #' warnings, and writes a plain-text summary (`simulation_log.txt`) to the
    #' results directory. Writing the file is best-effort: a failure to write
    #' is ignored and the summary is still returned.
    #'
    #' @param simulation_log A nested list of simulation log entries. An entry
    #'   without a `successful` element is converted to a failed entry whose
    #'   message is the character form of the original entry.
    #' @return A list containing the summary, indices of failed simulations,
    #'   indices of simulations with warnings, and the full log.
    #' @export
    log_simulation = function(simulation_log) {
      # Determine which simulations were successful and collect any warnings.
      # seq_along() (rather than 1:length()) keeps an empty log from being
      # indexed at positions 1 and 0.
      sample_count <- length(simulation_log)
      successful_array <- array(FALSE, sample_count)
      has_warnings <- logical(sample_count)
      for (i in seq_along(simulation_log)) {
        if (is.null(simulation_log[[i]]$successful)) {
          simulation_log[[i]] <- list(message = as.character(simulation_log[[i]]), successful = FALSE)
        }
        successful_array[i] <- simulation_log[[i]]$successful
        has_warnings[i] <- !is.null(simulation_log[[i]]$warnings)
      }
      # NULL (not integer(0)) when there are no warnings, as before
      warning_indices <- if (any(has_warnings)) which(has_warnings) else NULL

      # Add a summary and failure & warning indices to the log
      simulation_log <- list(
        summary = sprintf("%s of %s sample models ran and saved results successfully",
                          length(which(successful_array)), sample_count),
        failed_indices = which(!successful_array),
        warning_indices = warning_indices,
        full_log = simulation_log
      )
      if (length(warning_indices) > 0) {
        simulation_log$summary <- paste(simulation_log$summary, "with warnings")
      }

      # Write a log file (best-effort). The connection is closed after the
      # guarded block in every case, so a failed write cannot leak it.
      log_file <- file.path(self$results_dir, "simulation_log.txt")
      file_con <- NULL
      suppressWarnings(try({
        file_con <- file(log_file, "w")
        writeLines(c(simulation_log$summary), con = file_con)
        if (length(simulation_log$failed_indices) > 0) {
          writeLines(c("", paste(length(simulation_log$failed_indices), "failed runs/errors:")), con = file_con)
          for (i in simulation_log$failed_indices) {
            writeLines(c("", paste("Sample", i, ":"), simulation_log$full_log[[i]]$message), con = file_con)
            if (!is.null(simulation_log$full_log[[i]]$errors)) {
              writeLines(simulation_log$full_log[[i]]$errors, con = file_con)
            }
          }
        }
        if (length(warning_indices) > 0) {
          writeLines(c("", paste(length(warning_indices), "warnings:")), con = file_con)
          for (i in warning_indices) {
            writeLines(c("", paste("Sample", i, ":"), simulation_log$full_log[[i]]$message), con = file_con)
            writeLines(simulation_log$full_log[[i]]$warnings, con = file_con)
          }
        }
      }, silent = TRUE))
      if (!is.null(file_con)) {
        suppressWarnings(try(close(file_con), silent = TRUE))
      }
      simulation_log
    },

    #' @description
    #' Sets the model sample attributes via the sample data frame and the
    #' generators.
    #'
    #' The row of the sample data frame selected by `sample_index` is turned
    #' into a named list. Columns named in the model's attached
    #' `sample_model_names` are set on the model directly. Each generator with
    #' an entry in the model's attached `sample_generative_names` is then run
    #' and its output set on the model. Dispersal generators take their inputs
    #' from the model or the sample row and produce dispersal data; other
    #' generators receive inputs merged from the model attributes and the
    #' sample row (sample values take precedence).
    #'
    #' Aborts (via `cli_abort`) when a generator reports error messages or when
    #' a dispersal generator's requirements for dispersal data are not met.
    #'
    #' @param model [`poems::SimulationModel`] (or inherited class) object
    #'   (clone) to receive sample attributes.
    #' @param sample_index Index of sample from data frame.
    #' @keywords internal
    #' @export
    set_model_sample = function(model, sample_index) {
      sample_list <- as.list(self$sample_data[sample_index, ])
      names(sample_list) <- names(self$sample_data)

      if (!is.null(model$attached$sample_model_names)) {
        model$set_sample_attributes(params = sample_list[model$attached$sample_model_names])
      }

      # seq_along() makes both a NULL and an empty generator list a no-op
      for (i in seq_along(self$generators)) {
        generator <- self$generators[[i]]

        # Generators without a registered output name are skipped
        name <- model$attached$sample_generative_names[[i]]
        if (is.null(name)) {
          next
        }

        if (inherits(generator, "DispersalGenerator")) {
          inputs <- intersect(generator$inputs,
                              generator$get_attribute_aliases())

          # Inputs come from the model when the template knows any of them,
          # otherwise from the sample row
          if (any(names(self$model_template$get_attributes()) %in% inputs)) {
            generator$set_attributes(params = model$get_attributes()[inputs])
          } else if (any(names(self$sample_data) %in% inputs)) {
            generator$set_attributes(params = sample_list[inputs])
          }

          if (!generator$generative_requirements_satisfied()$dispersal_data) {
            # The name is read from the model being populated (the same
            # source the other branches use), not from self$nested_model
            cli_abort(
              c(
                "Errors produced when generating {name}.",
                "x" = "This generator requires {generator$inputs}."
              )
            )
          }

          generator$calculate_dispersals()
          if (length(generator$error_messages) > 0) {
            cli_abort(
              c(
                "Dispersal generator {name} produced errors:",
                "x" = "{generator$error_messages}"
              )
            )
          }
          suppressWarnings(model$set_sample_attributes(params = setNames(
            list(generator$dispersal_data), name
          )))
        } else {
          inputs <- unique(c(
            generator$inputs,
            generator$get_attribute_aliases(params = generator$inputs)
          ))
          # Initialize input_values as a named list with the same names as inputs
          input_values <- setNames(vector("list", length(inputs)), inputs)

          # Update values from the model attributes (fetched once)
          model_attributes <- model$get_attributes()
          matching_attributes <- intersect(names(input_values), names(model_attributes))
          input_values[matching_attributes] <- model_attributes[matching_attributes]

          # Update values from sample_list (overrides model attributes)
          matching_samples <- intersect(names(input_values), names(sample_list))
          input_values[matching_samples] <- sample_list[matching_samples]

          model$set_sample_attributes(params = generator$generate(input_values = input_values))
          if (length(generator$error_messages) > 0) {
            cli_abort(
              c(
                "Generator {generator$description} produced errors:",
                "x" = "{generator$error_messages}"
              )
            )
          }
        }
      }
    },


    #' @description Runs the multiple population simulations, stores the
    #' results, and creates a simulation log.
    #'
    #' After validating the handler (pending error messages, model template,
    #' sample data, simulator, results directory), a nested model is cloned
    #' from the template and the first sample is checked for completeness and
    #' consistency. One simulation is then run per row of the sample data via
    #' `foreach`/`doParallel`; each result is saved to the results directory
    #' (with `qsave` when the extension is ".qs", otherwise `saveRDS`).
    #' Finally the log is summarized and written by `log_simulation`.
    #'
    #' @param results_dir Results directory path where the simulation results
    #'   will be stored. When supplied it replaces the `results_dir` set on the
    #'   handler; when `NULL` (the default) the results directory must already
    #'   be set within the manager class object.
    #' @return The summarized simulation log returned by `log_simulation`: a
    #'   list with a summary, the indices of failed simulations, the indices of
    #'   simulations with warnings, and the full per-sample log.
    #' @export
    run = function(results_dir = NULL) {
      # Check for error messages
      if (!is.null(self$error_messages)) {
        error_messages <- self$error_messages
        self$error_messages <- NULL
        stop(error_messages, call. = FALSE)
      }

      # Check that model and sample data is present. NROW() additionally
      # rejects a data frame that has columns but no rows.
      if (is.null(self$model_template) ||
          length(self$sample_data) == 0 ||
          NROW(self$sample_data) == 0) {
        cli_abort(
          paste(
            "Simulations cannot run unless there is a `model_template`",
            "and a `sample_data` with at least one row."
          )
        )
      }

      # Check that model simulator/function is present
      if (is.null(self$model_simulator)) {
        stop("The model simulator has not been set", call. = FALSE)
      } else if (is.null(self$model_simulator$simulation_function)) {
        stop("The model simulator function has not been set", call. = FALSE)
      }

      # Honour the `results_dir` argument before validating the directory
      if (!is.null(results_dir)) {
        self$results_dir <- results_dir
      }

      # Check that the results directory is present and exists
      if (is.null(self$results_dir)) {
        stop("No output directory set for results", call. = FALSE)
      }
      if (!dir.exists(self$results_dir)) {
        stop(paste("Could not find results directory", self$results_dir),
             call. = FALSE)
      }
      if (is.null(self$results_ext)) {
        self$results_ext <- ".qs" # reinstate default
      }

      # Create a nested simulation (or descendant) model for cloning
      self$nested_model <- self$model_template$new_clone(template = self$model_template)

      # Allow extra attachments to be passed
      if ("nested_model" %in% names(self$attached)) {
        self$nested_model$attached <- self$attached$nested_model
      }

      # Sample data columns that match model attributes (or aliases) become
      # sample attributes of the nested model
      model_sample_columns <- which(names(self$sample_data) %in% self$nested_model$get_attribute_aliases())
      if (length(model_sample_columns) > 0) {
        self$nested_model$attached$sample_model_names <- names(self$sample_data)[model_sample_columns]
        self$nested_model$sample_attributes <- self$nested_model$attached$sample_model_names
      }

      # Register the output name(s) of every generator; dispersal generators
      # are numbered "dispersal1", "dispersal2", ... in list order
      if (!is.null(self$generators)) {
        self$nested_model$attached$sample_generative_names <- list()
        dispersal_count <- 0

        for (i in seq_along(self$generators)) {
          generator <- self$generators[[i]]

          if (inherits(generator, "DispersalGenerator")) {
            dispersal_count <- dispersal_count + 1
            dispersal_name <- paste0("dispersal", dispersal_count)
            self$nested_model$attached$sample_generative_names[[i]] <- dispersal_name
            self$nested_model$sample_attributes <- unique(c(
              self$nested_model$sample_attributes,
              dispersal_name
            ))
          } else {
            self$nested_model$attached$sample_generative_names[[i]] <- generator$outputs
            self$nested_model$sample_attributes <- unique(c(
              self$nested_model$sample_attributes,
              generator$outputs
            ))
          }
        }
      }

      # Check the completeness/consistency of the first sample only
      model <- self$nested_model$clone()
      self$set_model_sample(model, 1)
      if (length(model$error_messages) > 0) {
        stop(c(
          "Error(s) setting model sample attributes: ",
          model$error_messages
        ),
        call. = FALSE)
      }
      if (!model$is_complete()) {
        incomplete_message <- "Model attributes are incomplete"
        if (!model$is_consistent()) {
          incomplete_message <- paste0(incomplete_message, "/inconsistent")
        }
        incomplete_message <- paste0(incomplete_message,
                                     ": ",
                                     paste(model$incomplete_attributes(), collapse = ", "))
        stop(incomplete_message, call. = FALSE)
      }
      model <- NULL # release from memory

      doParallel::registerDoParallel(cores = self$parallel_cores)
      # Release the implicit cluster even if the loop or logging fails
      on.exit(doParallel::stopImplicitCluster(), add = TRUE)
      simulation_log <- foreach(
        i = seq_len(nrow(self$sample_data)),
        .packages = c("raster"),
        .errorhandling = c("pass")
      ) %dopar% {
        # Clone the model
        model <- self$nested_model$clone()

        # Set the model sample attributes
        self$set_model_sample(model, i)
        if (length(model$error_messages) > 0) {
          return(
            list(
              successful = FALSE,
              message = self$get_message_sample("Error(s) setting model %s sample attributes", i),
              errors = model$error_messages
            )
          )
        }

        # Create and run the simulator
        simulator <- self$model_simulator$new_clone(simulation_model = model, sample_id = i)
        simulator_run_status <- simulator$run()

        # Substitute sample details into the simulator run status message
        simulator_run_status$message <- self$get_message_sample(simulator_run_status$message, i)

        # Save results
        if (!is.null(simulator$results)) {
          results_file <- file.path(self$results_dir,
                                    paste0(self$get_results_filename(i), self$results_ext))
          save_attempt <- suppressWarnings(try(
            if (self$results_ext == ".qs") {
              qsave(simulator$results, results_file)
            } else {
              saveRDS(simulator$results, file = results_file)
            },
            silent = TRUE
          ))
          # The save must have completed without error AND left a file; a
          # stale file from an earlier run must not hide a failed save
          if (!inherits(save_attempt, "try-error") && file.exists(results_file)) {
            simulator_run_status$message <- paste0(simulator_run_status$message,
                                                   " and the results were saved")
          } else {
            simulator_run_status$successful <- FALSE
            simulator_run_status$message <- paste0(
              simulator_run_status$message,
              ", but the results could not be saved in ",
              results_file
            )
          }
        }

        simulator_run_status
      }

      # Summarize and write log to a file
      self$log_simulation(simulation_log)
    }

  ), # end public

  private = list(
    ## Attributes ##

    # Manager attributes: names of the attributes managed by this handler #
    .manager_attributes = c(
      "sample_data",
      "model_template",
      "nested_model",
      "generators",
      "model_simulator",
      "parallel_cores",
      "results_dir",
      "results_ext",
      "results_filename_attributes"
    ),

    # Backing fields declared here; the remaining ones are marked [inherited]
    #   .sample_data                   [inherited]
    .model_template = NULL,
    .nested_model = NULL,
    #   .generators                    [inherited]
    .model_simulator = NULL,
    #   .parallel_cores                [inherited]
    #   .results_dir                   [inherited]
    .results_ext = ".qs"
    #   .results_filename_attributes   [inherited]

    # Errors and warnings #
    #   .error_messages                [inherited]
    #   .warning_messages              [inherited]
  ), # end private

  active = list(

    #' @field sample_data A data frame of sampled parameters, one row per
    #' simulation/result.
    sample_data = function(value) { # inherited
      # Getter: no value supplied
      if (missing(value)) {
        return(super$sample_data)
      }
      # Setter: delegate to the parent binding
      super$sample_data <- value
    },

    #' @field model_template A [`poems::SimulationModel`] (or inherited class)
    #' object with parameters common to all simulations. Setting it also
    #' supplies the simulation function to an existing model simulator that
    #' does not have one yet.
    model_template = function(value) {
      if (missing(value)) {
        return(private$.model_template)
      }
      # Only NULL or SimulationModel-derived objects are accepted
      if (!is.null(value) && !inherits(value, "SimulationModel")) {
        cli_abort(c("`model_template` should be a `SimulationModel`
                      or inherited object.",
                    "x" = "`model_template` is {class(value)}."))
      }
      simulator_needs_function <- !is.null(value) &&
        !is.null(self$model_simulator) &&
        is.null(self$model_simulator$simulation_function)
      if (simulator_needs_function) {
        self$model_simulator$simulation_function <- value$simulation_function
      }
      private$.model_template <- value
    },

    #' @field nested_model A [`poems::SimulationModel`] (or inherited class)
    #' object with empty sample parameters and a nested model template common to
    #' all simulations. Only `NULL` or a `SimulationModel`-derived object may be
    #' assigned.
    nested_model = function(value) {
      if (missing(value)) {
        private$.nested_model
      } else {
        if (!is.null(value) && !inherits(value, "SimulationModel")) {
          # The message names `nested_model`, the attribute actually being set
          cli_abort(c("`nested_model` should be a `SimulationModel` or inherited object.",
                      "x" = "`nested_model` is {class(value)}."))
        } else {
          private$.nested_model <- value
        }
      }
    },

    #' @field generators A list of generator ([`poems::Generator`] or inherited
    #' class) objects used to generate simulation model values.
    generators = function(value) { # inherited
      # Getter: no value supplied
      if (missing(value)) {
        return(super$generators)
      }
      # Setter: delegate to the parent binding
      super$generators <- value
    },

    #' @field model_simulator A [`poems::ModelSimulator`] (or inherited class)
    #' object used to run the simulations.
    model_simulator = function(value) {
      if (missing(value)) {
        return(private$.model_simulator)
      }
      # Only NULL or ModelSimulator-derived objects are accepted
      if (!is.null(value) && !inherits(value, "ModelSimulator")) {
        cli_abort(c("`model_simulator` should be a `ModelSimulator`
                      or inherited object.",
                    "x" = "`model_simulator` is {class(value)}."))
      }
      private$.model_simulator <- value
    },

    #' @field parallel_cores Number of cores used to run the simulations in
    #' parallel.
    parallel_cores = function(value) { # inherited
      # Getter: no value supplied
      if (missing(value)) {
        return(super$parallel_cores)
      }
      # Setter: delegate to the parent binding
      super$parallel_cores <- value
    },

    #' @field results_dir Path of the directory where results are written.
    results_dir = function(value) { # inherited
      # Getter: no value supplied
      if (missing(value)) {
        return(super$results_dir)
      }
      # Setter: delegate to the parent binding
      super$results_dir <- value
    },

    #' @field results_ext Result file extension (default is .qs).
    results_ext = function(value) { # inherited
      # Getter: no value supplied
      if (missing(value)) {
        return(private$.results_ext)
      }
      # Setter: stored in this class's private field
      private$.results_ext <- value
    },

    #' @field results_filename_attributes A vector of: prefix (optional);
    #' attribute names (from the sample data frame); postfix (optional);
    #' used to construct the results filenames.
    results_filename_attributes = function(value) { # inherited
      # Getter: no value supplied
      if (missing(value)) {
        return(super$results_filename_attributes)
      }
      # Setter: delegate to the parent binding
      super$results_filename_attributes <- value
    },

    #' @field error_messages A vector of error messages encountered when
    #' setting model attributes.
    error_messages = function(value) { # inherited
      # Getter: no value supplied
      if (missing(value)) {
        return(super$error_messages)
      }
      # Setter: delegate to the parent binding
      super$error_messages <- value
    },

    #' @field warning_messages A vector of warning messages encountered when
    #' setting model attributes.
    warning_messages = function(value) { # inherited
      # Getter: no value supplied
      if (missing(value)) {
        return(super$warning_messages)
      }
      # Setter: delegate to the parent binding
      super$warning_messages <- value
    }

  ) # end active
)
# Any scripts or data that you put into this service are public.
# epizootic documentation built on Oct. 2, 2024, 5:07 p.m.
# rdrr.io home R language documentation Run R code online
# CRAN packages Bioconductor packages R-Forge packages GitHub packages
# Note that we can't provide technical support on individual packages. You should contact the package authors for that.
# epizootic
# Spatially Explicit Population Models of Disease Transmission in Wildlife

# R/SimulationHandler.R
# In epizootic: Spatially Explicit Population Models of Disease Transmission in Wildlife

# Try the epizootic package in your browser

# R Package Documentation

# Browse R Packages

# We want your feedback!

# epizootic Spatially Explicit Population Models of Disease Transmission in Wildlife

# R/SimulationHandler.R In epizootic: Spatially Explicit Population Models of Disease Transmission in Wildlife

# Try the epizootic package in your browser

# R Package Documentation

# Browse R Packages

# We want your feedback!

# epizootic
# Spatially Explicit Population Models of Disease Transmission in Wildlife

# R/SimulationHandler.R
# In epizootic: Spatially Explicit Population Models of Disease Transmission in Wildlife