datasim: Data Simulation Based on Models Formulas

#' @title Univariate factor effects
#'
#' @description
#' \code{fa} handles the evaluation of factor effects with two behaviours. It
#' evaluates the effects applied to the factor \code{x} if \code{size == NULL} or
#' simulates a factor \code{x} if \code{size} is provided.
#'
#' @details
#' Considering \eqn{x} the \eqn{n}-length factor under study with \eqn{k} levels and
#' \eqn{X} the associated \eqn{nxk} design matrix with dummy variables corresponding
#' to each level of the factor, the returning effect is
#' \deqn{Xb,}
#' where \eqn{b} is a \eqn{k}-length vector of regression coefficients.
#'
#' @param x A factor of length \eqn{n} to evaluate the effects. If \code{size !=
#' NULL}, \code{x} is the output of the function.
#' @param beta A numeric vector b of regression coefficients representing the effects
#' for each level of \code{x}.
#' @param levels A character vector of length \eqn{k} to name the \code{levels} of the
#' factor \code{x}.
#' @param size A numeric value \eqn{n} representing the number of units, it is used to
#' simulate the covariate \code{x}. In case \code{size == NULL}, \code{fa} evaluates
#' the effects.
#'
#' @return A simulated factor \eqn{x} in case \code{size} is provided; otherwise, a
#' \eqn{n}-length numeric vector of the evaluated effects.
#'
#' @author Erick A. Chacón-Montalván
#'
#' @examples
#' (x <- fa(beta = -1:1, size = 10))
#' fa(x, beta = -1:1)
#' fa(x, beta = 1:3)
#'
#' @export
fa <- function (x, beta, levels = 1:length(beta), size = NULL) {
  if (!is.null(size)) {
    output <- factor(sample(levels, size = size, replace = TRUE), levels = levels)
  } else {
    names(beta) <- levels(x)
    output <- as.numeric(beta[x])
  }
  return(output)
}

#' @title Univariate random effects
#'
#' @description
#' \code{function} description.
#'
#' @details
#' details.
#'
#' @param x factor vector to evaluate the random effect
#' @param sigma variance of the random effect
#' @param groups character vector to name the \code{levels} of \code{x} or a numeric
#' value indicating the number of groups of \code{x}
#' @param size numeric value to simulate the covariate \code{x}
#' @param q number of response varables to replicate
#' @param replace An optional argument to simulate an independent random effect with
#' one repetition (e.g. \code{mre(groups = 100, size = 100, replace = FALSE)})
#'
#' @return return.
#'
#' @author Erick A. Chacón-Montalván
#'
#' @examples
#'
#' (x <- re(groups = 5, size = 15))
#' re(x, sigma = 10)
#'
#' (x <- re(groups = 15, size = 15, replace = FALSE))
#' re(x, sigma = 1)
#'
#' (x <- re(groups = 2, size = 5, q = 2))
#' re(x, sigma = 10)
#'
#' (x <- 1:10)
#' re(x, sigma = 10)
#'
#' @export
re <- function (x, sigma, groups, size = NULL, q = 1, replace = TRUE) {
  if (!is.null(size)) {
    if (is.numeric(groups) & length(groups) == 1) {
      groups <- seq_len(groups)
      ngroups <- length(groups)
    }
    output <- rep(sample(groups, size = size, replace = replace), q) %>%
      factor(levels = groups)
  } else {
    if (!is.factor(x)) x <- factor(x)
    groups <- levels(x)
    beta <- rnorm(length(groups), 0, sigma)
    names(beta) <- groups
    output <- as.numeric(beta[x])
  }
  return(output)
}

exp_cor <- function (d, phi) {
  exp(-d/phi)
}

#' @title Simulate a Gaussian process
#'
#' @description
#' \code{gp} Simulate a spatial Gaussian process given a certain covariance function.
#'
#' @details
#' details.
#'
#' @param coords A list of coordinates
#' @param cor.model A character or function indicating the covariance function that
#' Should be used to compute the variance-covariance matrix
#' @param cor.params A list of the parameters required by the \code{cor.model} function.
#' @param sigma2 variance of the Gaussian process
#' @param size numeric value to simulate the covariate \code{x}
#' @param range Range of the coordinates of the Gaussian processes.
#' @param geom object of class ‘sf’ or ‘sfc’ to define the area where to simulate the
#' samples
#'
#' @return A vector of the realization of the Gaussian Process
#'
#' @author Erick A. Chacón-Montalván
#'
#' @examples
#'
#' (x <- gp(list(s1 = NA), size = 10))
#' (s1 <- x[[1]])
#' # Simulate and plot the realization of a Gaussian process
#' (y <- gp(list(s1), cor.model = "exp_cor", cor.params = list(phi = 0.05)))
#'
#' (x <- gp(list(s1 = NA, s2 = NA), size = 10))
#' (s1 <- x[[1]])
#' (s2 <- x[[2]])
#' # Simulate and plot the realization of a Gaussian process
#' (y <- gp(list(s1, s2), cor.model = "exp_cor", cor.params = list(phi = 0.05)))
#' plot(s1, s2, cex = y)
#' # Plot with ggplot
#' # ggplot(data.frame(s1, s2, y), aes(s1, s2, col = y)) +
#' #  geom_point(size = 3)
#'
#' (x <- gp(list(s1 = "none", s2 = NA), size = 10))
#' (s1 <- x[[1]])
#' (s2 <- s1)
#' # Simulate and plot the realization of a Gaussian process
#' (y <- gp(list(s1, s2), cor.model = "exp_cor", cor.params = list(phi = 0.05)))
#'
#' @importFrom stats dist rnorm runif
#' @importFrom purrr map
#' @importFrom sf st_dimension st_sample st_distance
#'
#' @export
gp <- function (coords, cor.model = "exp_cor", cor.params, sigma2 = 1, size = NULL, range = 1, geom = NULL) {
  if (!is.null(size)) {
    # simulate coordinates
    if (!is.null(geom) && sf::st_dimension(geom) == 2) {
      output <- sf::st_sample(geom, size = size)
      # convert coordinates to list if adequate
      if (exists("coords") && is.list(coords) && !inherits(coords, "sfc")) {
        if (all(purrr::map_lgl(coords, ~ is.logical(.) || is.numeric(.))) &&
            length(coords) == 2) {
          output <- sfc_as_coords(output)
        } else {
          stop("dimensions of coords and geom are incompatible")
        }
      }
    } else {
      ncoords <- purrr::map(coords, is.na) %>% do.call(sum, .)
      output <- replicate(ncoords, list(range * stats::runif(size)))
    }
  } else {
    # compute distance matrix
    if (!is.null(geom) && sf::st_dimension(geom) == 2) {
      if (!inherits(coords, "sfc")) coords <- coords_as_sfc(coords, geom)
      n <- length(coords)
      distance <- unclass(sf::st_distance(coords))
    } else {
      coords <- do.call(cbind, coords)
      n <- nrow(coords)
      distance <- as.matrix(dist(coords))
    }
    # simulate gp
    varcov <- sigma2 * do.call(cor.model, c(list(distance), cor.params))
    right <- chol(varcov)
    output <- as.numeric(crossprod(right, rnorm(n)))
  }
  return(output)
}

#' @importFrom sf st_as_sf st_crs st_geometry
coords_as_sfc <- function (coords, geom) {
  coords <- coords  %>%
    setNames(c("x", "y"))  %>%
    as.data.frame() %>%
    sf::st_as_sf(coords = c("x", "y"), crs = sf::st_crs(geom)) %>%
    sf::st_geometry()
  return(coords)
}

#' @importFrom sf st_coordinates
sfc_as_coords <- function (sfc) {
  sfc_list <- sfc %>%
    sf::st_coordinates() %>%
    as.data.frame() %>%
    as.list() %>%
    setNames(NULL)
  return(sfc_list)
}

ErickChacon/datasim documentation built on March 25, 2020, 7:53 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

ErickChacon/datasim
Data Simulation Based on Models Formulas

R/effects-uni.R
In ErickChacon/datasim: Data Simulation Based on Models Formulas

R Package Documentation

Browse R Packages

We want your feedback!

ErickChacon/datasim Data Simulation Based on Models Formulas

R/effects-uni.R In ErickChacon/datasim: Data Simulation Based on Models Formulas

R Package Documentation

Browse R Packages

We want your feedback!

ErickChacon/datasim
Data Simulation Based on Models Formulas

R/effects-uni.R
In ErickChacon/datasim: Data Simulation Based on Models Formulas