# ars: Adaptive Rejection Sampling

#' ARS class providing object with methods for communication with R6
#'
#' @docType class
#' @importFrom R6 R6Class
#' @export
#' @return Object of \code{\link{R6Class}} with methods to generate adaptive rejection sampling
#' @usage example <- ars$new(funx=dnorm, D=c(-Inf, Inf))
#' @param funx a function we want to sample from
#' @param D a vector of length 2 of numbers for bounds of function
#' @format \code{\link{R6Class}} object.
#' @examples
#' ex <- ars$new(dnorm, c(-Inf,Inf),mean=3, sd=1)
#' samples <- ex$sample(n=1000)
#' ex$plot_samples()
#' @field self$f Density function we want to sample from
#' @field self$var_max Upper bound on function we want to sample from
#' @field self$var_min Lower bound on function we want to sample from
#' @field private$h_prims A R6 namedVector that contains h'(x)
#' @field private$h_vals A R6 namedVector that contains h(x)
#' @field private$s_cdfs A R6 namedVector that contains each interval's CDF
#' @field private$u_vals A R6 namedVector that contains u(x)
#' @field private$x a vector of x values that are our sample values. Empty unless sample() run
#' @field private$y a vector of y values that begins to increase once sample() is run
#' @field private$z a vector of z values, or intersection points, that begins to increase once sample() is run
#' @section Public Methods:
#' \describe{
#'   \item{\code{sample(n, init_l, init_r, squeeze)}}{This method samples n points using adaptive rejection sampling. The user may pick two initializing points, init_l and init_r, which represent the points to start the search from. This is useful if -1 and 1 are far from the bulk of the density, e.g. a N(3000, 1) density. Setting squeeze = FALSE disables the squeezing test.}
#'   \item{\code{f(x)}}{This method calculates our funx observation at a given x }
#'   \item{\code{plot_sampdist()}}{This method plots our normalized envelope function }
#'   \item{\code{calc_sampdist()}}{This method calculates the sampling distribution from a uniform distribution}
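#'   \item{\code{plot_samples()}}{This method plots our samples in a histogram, with a blue line highlighting the median value}
#'   \item{\code{plot_u_l()}}{This method plots the upper and lower hulls over the range of the construction points}
#'   \item{\code{s(x)}}{This function evaluates the normalized envelope (sampling) density at x; it is set by calc_sampdist()}}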
#' @section Private Methods:
#' \describe{
#'   \item{\code{h(x)}}{This method calculates the log of our funx at a given point x}
#'   \item{\code{init_hprim()}}{This method initializes our hprim values}
#'   \item{\code{init_hval()}}{This method initializes our h values}
#'   \item{\code{init_scdf()}}{This method initializes our cdf under the upper hull}
#'   \item{\code{init_u()}}{This method initializes our upper hull values}
#'   \item{\code{init_y()}}{This method initializes our y values }
#'   \item{\code{l(p)}}{This method returns the value of the lower hull at a given point p}
#'   \item{\code{u(p)}}{This method returns the value of the upper hull at a given point p}
#'   \item{\code{samp_exph()}}{This method samples a point from the exponentiated upper hull, exp(u(x))}
#'   \item{\code{update(y, hy, hy_prim)}}{This method updates our private variables after an iteration}}
ars <- R6Class(
  "ars",
  lock_objects = FALSE,
  public = list(
    ### functions ###

    # Constructor: validates the target density and its support, then stores
    # the density (self$f), its logarithm (private$h) and the support bounds.
    #
    # funx: density function to sample from; evaluated as funx(x, ...).
    # D:    numeric vector of length 2 with the support bounds. The order does
    #       not matter because min(D) / max(D) are used.
    # ...:  additional arguments forwarded to funx on every evaluation.
    #
    # Stops on invalid input; warns when the density does not appear to
    # integrate to 1 over the support.
    initialize = function(funx, D = c(-Inf, Inf), ...) {
      # is.function() / is.numeric() instead of comparing class() to a string:
      # the string comparison rejected integer bounds such as c(0L, 1L).
      if (!is.function(funx)) {
        stop("funx must be a function")
      }
      if (!is.numeric(D)) {
        stop("D or dimensions must be number.")
      }
      if (length(D) != 2) {
        stop("Input dimension is not a length of 2")
      }
      if (anyNA(D)) {
        stop("D must not contain missing values")
      }

      var_min <- min(D)
      var_max <- max(D)

      # Reject a degenerate support before the density is evaluated on it.
      if (var_min == var_max) {
        stop("Input dimension must differ")
      }

      # Probe the density just inside each bound (small offset for
      # continuous variables).
      if (is.nan(funx(var_min + .Machine$double.eps, ...)) ||
          is.nan(funx(var_max - .Machine$double.eps, ...))) {
        stop("Function is not defined at bounds")
      }

      # Density with the extra arguments bound.
      f <- function(x) {
        funx(x, ...)
      }

      if (!check_positive(f, var_min, var_max)) {
        stop("Input function is not positive in the given support.")
      }

      # Normalization is only checked, never enforced.
      Int_f <- integrate(Vectorize(f), lower = var_min, upper = var_max)
      if (abs(Int_f$value - 1) > 10 * Int_f$abs.error) {
        warning("Input function might not be normalized.")
      }

      # set values
      self$f <- f

      # Log-density; the density is evaluated once per call.
      private$h <- function(x) {
        val <- f(x)
        if (val < 0) {
          stop("Input function is not positive in the given support.")
        }
        log(val)
      }

      self$var_min <- var_min
      self$var_max <- var_max
    },

    # Defines self$s, the normalized envelope density exp(u(x)) / integral of
    # exp(u) over the support. The integral is evaluated lazily, each time
    # self$s is called, so self$s always reflects the current upper hull.
    calc_sampdist = function() {
      exp_u <- function(x) {
        exp(private$u(x))
      }
      self$s <- function(x) {
        exp_u(x) / integrate(Vectorize(exp_u),
                             lower = self$var_min,
                             upper = self$var_max)$value
      }
    },

    # Main entry point: draws up to n points by adaptive rejection sampling.
    #
    # n:       number of samples requested.
    # init_l,
    # init_r:  starting values for the search of the initial construction
    #          points on an unbounded side of the support; useful when the
    #          density is far away from -1 / 1 (e.g. N(3000, 1)).
    # squeeze: set to FALSE to disable the squeezing test.
    #
    # Returns the numeric vector of accepted samples. At most 10 * n
    # candidates are drawn; if fewer than n were accepted by then, a warning
    # is raised and only the accepted samples are returned.
    sample = function(n = 1000, init_l = -1, init_r = 1, squeeze = TRUE) {
      # Number of starting (construction) points.
      start_npts <- 2

      # Starting points on unbounded sides come from init_y(); the remaining
      # ones are drawn at random inside the support.
      private$init_y(init_l, init_r)
      n_extra <- start_npts - length(private$y)
      if (self$var_min == -Inf && self$var_max == Inf) {
        extra <- rnorm(n_extra, mean = mean(private$y), sd = sd(private$y))
      } else if (self$var_min == -Inf) {
        extra <- -rexp(n_extra) + self$var_max
      } else if (self$var_max == Inf) {
        extra <- rexp(n_extra) + self$var_min
      } else {
        extra <- runif(n_extra, min = self$var_min, max = self$var_max)
      }
      private$y <- sort(c(private$y, extra))

      # Output buffer and counters.
      private$x <- vector(mode = "numeric", length = n)
      samp <- 0
      loop <- 0

      # Build the upper hull, its unnormalized cdf and the lower hull.
      private$init_scdf()
      private$construct()

      while (samp < n && loop < 10 * n) {
        # Count the iteration up front so that the `next` below cannot
        # bypass the iteration cap.
        loop <- loop + 1

        x_star <- private$samp_exph()
        u_star <- runif(1)

        # Squeezing test: accept without evaluating h when the candidate
        # already passes against the lower hull.
        if (squeeze &&
            u_star <= exp(private$l(x_star) - private$u(x_star))) {
          samp <- samp + 1
          private$x[samp] <- x_star
        } else {
          hxstar <- private$h(x_star)

          # Zero density at the candidate: it can neither be accepted nor
          # used as a construction point.
          if (hxstar == -Inf) {
            next
          }

          hxstar_prim <- calc_deriv(x_star, private$h,
                                    self$var_min, self$var_max)
          # Rejection test against the upper hull.
          if (u_star <= exp(hxstar - private$u(x_star))) {
            samp <- samp + 1
            private$x[samp] <- x_star
          }
          # h was evaluated, so refine the hulls with the new point.
          private$update(x_star, hxstar, hxstar_prim)
          private$construct()
        }
      }

      # Do not hand back the unfilled tail of the buffer as if it were data.
      if (samp < n) {
        warning(sprintf(
          "Only %d of %d requested samples were accepted within the iteration limit.",
          as.integer(samp), as.integer(n)
        ))
        private$x <- private$x[seq_len(samp)]
      }

      self$calc_sampdist()
      private$x
    },

    # Histogram of the stored samples with a blue vertical line at the
    # median (the median is used to ignore outliers).
    plot_samples = function() {
      ggplot2::ggplot() +
        ggplot2::geom_histogram(ggplot2::aes(x = private$x)) +
        ggplot2::geom_vline(xintercept = median(private$x), color = "blue") +
        ggplot2::theme_bw() +
        ggplot2::ggtitle("Sample distribution") +
        ggplot2::xlab("Samples")
    },

    # Line plot of the normalized envelope density self$s on 100 equally
    # spaced points between the smallest and largest construction point.
    plot_sampdist = function() {
      self$calc_sampdist()
      xs <- seq(private$y[1], private$y[length(private$y)],
                length.out = 100)
      ys <- sapply(xs, self$s)

      ggplot2::ggplot() +
        ggplot2::geom_line(ggplot2::aes(x = xs, y = ys)) +
        ggplot2::theme_bw() +
        ggplot2::ggtitle("S distribution") +
        ggplot2::xlab("x") +
        ggplot2::ylab("P(S(X)=x)")
    },

    # Line plot of the upper and lower hull on 100 equally spaced points
    # between the smallest and largest construction point.
    plot_u_l = function() {
      self$calc_sampdist()
      xs <- seq(private$y[1], private$y[length(private$y)],
                length.out = 100)
      ys_u <- sapply(xs, private$u)
      ys_l <- sapply(xs, private$l)

      ggplot2::ggplot() +
        ggplot2::geom_line(ggplot2::aes(x = xs, y = ys_l,
                                        colour = "lower hull")) +
        ggplot2::theme_bw() +
        ggplot2::geom_line(ggplot2::aes(x = xs, y = ys_u,
                                        colour = "upper hull")) +
        ggplot2::scale_colour_discrete("") +
        ggplot2::ggtitle("Upper and Lower Hull distribution") +
        ggplot2::xlab("x") +
        ggplot2::ylab("values")
    },
    # print = function(){
    #   #invisible(self)
    # },
    ### variables ###
    # density function
    f = NULL,
    # min and max value of the support of the function
    var_min = NA,
    var_max = NA,
    # sampling function
    s = NULL
  ),

  private = list(
    ### functions ###

    # Chooses the initial construction points on the unbounded sides of the
    # support and stores them in private$y (which is reset first).
    #
    # y_min, y_max: starting values of the search on the left / right side.
    #
    # On a side that is unbounded, the starting value is moved outwards by a
    # random multiple of |h| until h' has the required sign (positive on the
    # left, negative on the right). Stops after 1000 unsuccessful moves.
    init_y = function(y_min, y_max) {
      # (re)initialize sample points vector
      private$y <- vector(mode = "numeric")

      # if unbounded on the left: need a point with h' > 0
      if (self$var_min == -Inf) {
        iter <- 0
        repeat {
          slope <- calc_deriv(y_min,
                              private$h,
                              lower = self$var_min,
                              upper = self$var_max)
          if (slope > 0) {
            break
          }
          if (iter >= 1000) {
            stop("Unlucky. Have searched over 1,000 times to find a h prime larger than 0")
          }
          y_min <- y_min - runif(1) * abs(private$h(y_min))
          iter <- iter + 1
        }
        private$y <- c(private$y, y_min)
      }

      # if unbounded on the right: need a point with h' < 0
      if (self$var_max == Inf) {
        iter <- 0
        repeat {
          slope <- calc_deriv(y_max,
                              private$h,
                              lower = self$var_min,
                              upper = self$var_max)
          if (slope < 0) {
            break
          }
          if (iter >= 1000) {
            stop("Unlucky. Have searched over 1,000 times to find a h prime less than 0")
          }
          y_max <- y_max + runif(1) * abs(private$h(y_max))
          iter <- iter + 1
        }
        private$y <- c(private$y, y_max)
      }
    },

    # Evaluates h at every construction point and stores the result in
    # private$h_vals (keyed by the construction points). Called by init_u.
    init_hval = function() {
      values <- sapply(private$y, private$h)
      private$h_vals <- namedVector$new(names = private$y, values = values)
    },

    # Evaluates h' at every construction point and stores the result in
    # private$h_prims (keyed by the construction points). Called by init_u.
    init_hprim = function() {
      derivs <- sapply(
        private$y,
        FUN = calc_deriv,
        f = private$h,
        lower = self$var_min,
        upper = self$var_max
      )
      private$h_prims <- namedVector$new(names = private$y, values = derivs)
    },

    # Builds the initial upper hull from the construction points: computes
    # the tangent intersections z, checks log-concavity and stores
    # private$z, private$u_vals and private$u.
    init_u = function() {
      m <- length(private$y)
      if (m < 2) {
        stop("At least two starting points are required.")
      }
      y <- private$y
      # set h values
      private$init_hval()
      hy <- private$h_vals$values
      # set h derivatives
      private$init_hprim()
      hy_prim <- private$h_prims$values

      # Pair every construction point with its right neighbour.
      left <- seq_len(m - 1L)
      right <- left + 1L
      y_l <- y[left]
      y_r <- y[right]

      u_z <- calc_uz(y_l, y_r,
                     hy[left], hy[right],
                     hy_prim[left], hy_prim[right])

      # the case where hyprim_l = hyprim_r (no finite intersection).
      # The single-point fallback matches the two starting points that
      # sample() provides.
      if (any(is.nan(u_z$names) | is.infinite(u_z$names))) {
        u_z <- namedVector$new(mean(y), mean(hy))
      }
      # the case where it is not log-concave: every intersection must lie
      # strictly between its two construction points
      if (FALSE %in% ((u_z$names - y_l) > 0) ||
          FALSE %in% ((y_r - u_z$names) > 0)) {
        stop("Input function is not log-concave.")
      }

      u_pts <- c(y[1], u_z$names, y[m])
      u_vals <- c(hy[1], u_z$values, hy[m])
      # check concavity
      if (!check_interpolconcave(u_pts, u_vals)) {
        stop("Input function is not log-concave.")
      }
      # (re)initialize z
      private$z <- u_z$names
      # (re)initialize upper hull values
      private$u_vals <- namedVector$new(names = u_pts, values = u_vals)
      # (re)create upper hull function
      private$u <- create_upphull(u_pts, u_vals)
    },

    # Builds the upper hull (via init_u) and the unnormalized cdf pieces of
    # exp(u) on the intervals delimited by var_min, z and var_max.
    init_scdf = function() {
      private$init_u()
      u_pts <- private$u_vals$names
      u_vals <- private$u_vals$values
      # (re)initialize cdf
      cdf_pts <- c(self$var_min, private$z, self$var_max)
      private$s_cdfs <- integ_expinterpol(u_pts, u_vals, cdf_pts)
    },

    # Recreates the hull functions u and l from the stored point values.
    construct = function() {
      private$u <- create_upphull(private$u_vals$names,
                                  private$u_vals$values)
      private$l <- create_lowhull(private$h_vals$names,
                                  private$h_vals$values)
    },

    # essential function 1 of main function: sample a point from s.
    # Draws a uniform value on (0, total unnormalized mass), locates the
    # piece of the stored cdf it falls into and inverts the cdf of the
    # exponentiated linear segment on that piece.
    samp_exph = function() {
      # generate u
      rand <- runif(1, min = 0, max = sum(private$s_cdfs$values))
      # find the interval of x where F(x) = u
      cumm_cdfs <- cumsum(private$s_cdfs$values)
      interv <- findInterval(rand, cumm_cdfs)
      cdf <- cumm_cdfs[interv]

      u_pts <- private$u_vals$names
      u_vals <- private$u_vals$values
      cdf_pts <- private$s_cdfs$names

      # Segment of the upper hull on this piece: u(x) = a * x + b
      a <- (u_vals[interv + 1] - u_vals[interv]) /
        (u_pts[interv + 1] - u_pts[interv])
      b <- u_vals[interv] - a * u_pts[interv]

      # Solve (exp(a * x + b) - exp(a * x0 + b)) / a = rand - cdf for x,
      # with x0 = cdf_pts[interv].
      samp_pt <- (log(a * (rand - cdf) + exp(a * cdf_pts[interv] + b)) - b) / a

      # Flat segment (a == 0) or numerical breakdown: the envelope is
      # constant exp(b) on the piece, so the cdf is linear in x.
      if (is.nan(samp_pt) || is.infinite(samp_pt)) {
        samp_pt <- ((rand - cdf) + exp(b) * cdf_pts[interv]) / exp(b)
      }

      samp_pt
    },

    # essential function 2 of main function: update.
    # Inserts a new construction point and refreshes everything that depends
    # on it: z, u_vals, s_cdfs, then y, h_vals, h_prims and u.
    #
    # y:       new construction point.
    # hy:      h(y).
    # hy_prim: h'(y).
    #
    # Returns early, leaving all state unchanged, when a new tangent
    # intersection is NaN or infinite. Stops when the refreshed upper hull
    # is not concave.
    update = function(y, hy, hy_prim) {
      # 1. update z, u_vals, s_cdfs backwards
      l_y <- length(private$y)
      l_z <- length(private$z)

      # Number of existing construction points that are <= y.
      int <- findInterval(y, private$y)

      if (int == 0) {
        # New point lies to the left of every construction point.
        # calculate new z
        u_z <- calc_uz(y,
                       private$y[1],
                       hy,
                       private$h_vals$values[1],
                       hy_prim,
                       private$h_prims$values[1])
        quick_check <- is.nan(u_z$names) | is.infinite(u_z$names)
        if (any(quick_check)) return()

        z_new <- u_z$names
        uz_new <- u_z$values
        # check concavity on a copy before touching the stored state
        uvals_new <- private$u_vals$clone()
        uvals_new$delete_byname(private$y[1])
        uvals_new$add(c(y, z_new), c(hy, uz_new))
        uvals_new$sort_byname()

        if (!check_interpolconcave(uvals_new$names, uvals_new$values)) {
          stop("Input function is not log-concave.")
        }
        # calculate new cdf
        calc_pts <- c(y, z_new, private$z[1])
        calc_vals <- c(hy, uz_new, private$u_vals$values[2])
        interv_pts <- c(self$var_min, z_new, private$z[1])

        scdf_new <- integ_expinterpol(calc_pts, calc_vals, interv_pts)
        # update s_cdfs
        private$s_cdfs$delete_byname(private$z[1])
        private$s_cdfs$add(scdf_new$names, scdf_new$values)
        private$s_cdfs$sort_byname()
        # update u_vals
        private$u_vals$delete_byname(private$y[1])
        private$u_vals$add(c(y, z_new), c(hy, uz_new))
        private$u_vals$sort_byname()
        # update z
        private$z <- sort(c(private$z, z_new))
      } else if (int == l_y) {
        # New point lies to the right of every construction point.
        # calculate new z
        u_z <- calc_uz(private$y[l_y],
                       y,
                       private$h_vals$values[l_y],
                       hy,
                       private$h_prims$values[l_y],
                       hy_prim)

        quick_check <- is.nan(u_z$names) | is.infinite(u_z$names)
        if (any(quick_check)) return()

        z_new <- u_z$names
        uz_new <- u_z$values
        # check concavity on a copy before touching the stored state
        uvals_new <- private$u_vals$clone()
        uvals_new$delete_byname(private$y[l_y])
        uvals_new$add(c(z_new, y), c(uz_new, hy))
        uvals_new$sort_byname()
        if (!check_interpolconcave(uvals_new$names, uvals_new$values)) {
          stop("Input function is not log-concave.")
        }
        # calculate new cdf
        calc_pts <- c(private$z[l_z], z_new, y)
        calc_vals <- c(private$u_vals$values[l_z + 1], uz_new, hy)
        interv_pts <- c(private$z[l_z], z_new, self$var_max)

        scdf_new <- integ_expinterpol(calc_pts, calc_vals, interv_pts)
        # update s_cdf
        private$s_cdfs$delete_byname(self$var_max)
        private$s_cdfs$add(scdf_new$names, scdf_new$values)
        private$s_cdfs$sort_byname()
        # update u_vals
        private$u_vals$delete_byname(private$y[l_y])
        private$u_vals$add(c(z_new, y), c(uz_new, hy))
        private$u_vals$sort_byname()
        # update z
        private$z <- sort(c(private$z, z_new))
        # note: this could potentially merge with the previous situation
      } else {
        # New point lies between construction points int and int + 1: the
        # intersection between them is replaced by two new ones.
        # calculate z
        y_l <- c(private$y[int], y)
        y_r <- c(y, private$y[int + 1])

        hy_l <- c(private$h_vals$values[int], hy)
        hy_r <- c(hy, private$h_vals$values[int + 1])
        hyprim_l <- c(private$h_prims$values[int], hy_prim)
        hyprim_r <- c(hy_prim, private$h_prims$values[int + 1])

        u_z <- calc_uz(y_l, y_r, hy_l, hy_r, hyprim_l, hyprim_r)

        quick_check <- is.nan(u_z$names) | is.infinite(u_z$names)
        if (any(quick_check)) return()

        z_new <- u_z$names
        uz_new <- u_z$values

        # check concavity on a copy before touching the stored state
        uvals_new <- private$u_vals$clone()

        uvals_new$delete_byname(private$z[int])
        uvals_new$add(z_new, uz_new)
        uvals_new$sort_byname()
        if (!check_interpolconcave(uvals_new$names, uvals_new$values)) {
          stop("Input function is not log-concave.")
        }
        # calculate new cdf
        calc_pts <- c(private$u_vals$names[int],
                      z_new,
                      private$u_vals$names[int + 2])
        calc_vals <- c(private$u_vals$values[int],
                       uz_new,
                       private$u_vals$values[int + 2])

        interv_pts <- c(private$s_cdfs$names[int],
                        z_new,
                        private$s_cdfs$names[int + 2])
        scdf_new <- integ_expinterpol(calc_pts, calc_vals, interv_pts)
        # update s_cdf
        private$s_cdfs$delete_byname(private$s_cdfs$names[(int + 1):(int + 2)])
        private$s_cdfs$add(scdf_new$names, scdf_new$values)
        private$s_cdfs$sort_byname()
        # update u_vals
        private$u_vals$delete_byname(private$z[int])
        private$u_vals$add(z_new, uz_new)
        private$u_vals$sort_byname()
        # update z
        private$z <- private$z[-int]
        private$z <- sort(c(private$z, z_new))
      }

      # 2. update y, h_vals, h_prims
      # update y
      private$y <- c(private$y, y)
      private$y <- sort(private$y)
      # update h_vals
      private$h_vals$add(y, hy)
      private$h_vals$sort_byname()
      # update h_prims
      private$h_prims$add(y, hy_prim)
      private$h_prims$sort_byname()
      # recreate u
      private$u <- create_upphull(private$u_vals$names,
                                  private$u_vals$values)
    },

    ### variables ###
    # log of the input function
    h = NULL,
    # construction points
    y = c(),
    # values of sampled points
    h_vals = NULL,
    # derivatives of sampled points
    h_prims = NULL,
    # points of upper hull
    z = c(),
    # upper hull function
    u = NULL,
    # upper hull, stored pointwise (includes the value of all z points and
    # the first and last y points)
    u_vals = NULL,
    # cdf of each interval of exponential upper hull, unnormalized and
    # stored pointwise
    s_cdfs = NULL,
    # lower hull function
    l = NULL,
    # sampled points
    x = c()
  )
)