aws: Adaptive Weights Smoothing

Documented in aws.gaussian

#
#    R - function  aws  for likelihood  based  Adaptive Weights Smoothing (AWS)
#    for local constant Gaussian, Bernoulli, Exponential, Poisson, Weibull and
#    Volatility models
#
#    emphasizes the propagation-separation approach
#
#    Copyright (C) 2006 Weierstrass-Institut fuer
#                       Angewandte Analysis und Stochastik (WIAS)
#
#    Author:  Joerg Polzehl
#
#  This program is free software; you can redistribute it and/or modify
#  it under the terms of the GNU General Public License as published by
#  the Free Software Foundation; either version 2 of the License, or
#  (at your option) any later version.
#
#  This program is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#  GNU General Public License for more details.
#
#  You should have received a copy of the GNU General Public License
#  along with this program; if not, write to the Free Software
#  Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307,
#  USA.
#
#     default parameters:  see function setawsdefaults
#
aws.gaussian <- function(y,
           hmax = NULL,
           hpre = NULL,
           aws = TRUE,
           memory = FALSE,
           varmodel = "Constant",
           lkern = "Triangle",
           aggkern = "Uniform",
           scorr = 0,
           mask = NULL,
           ladjust = 1,
           wghts = NULL,
           u = NULL,
           varprop = .1,
           graph = FALSE,
           demo = FALSE)
  {
    #
    #    first check arguments and initialize
    #
    args <- match.call()
    dy <- dim(y)
    if (length(dy) > 3)
      stop("AWS for more than 3 dimensional grids is not implemented")
    if (!(varmodel %in% c("Constant", "Linear", "Quadratic")))
      stop("Model for variance not implemented")
    #
    #   set appropriate defaults
    #
    if (is.null(wghts))
      wghts <- c(1, 1, 1)
    wghts <-
      switch(length(dy), c(0, 0), c(wghts[1] / wghts[2], 0), wghts[1] / wghts[2:3])
    if (is.null(wghts))
      wghts <- c(0, 0)
    cpar <-
      setawsdefaults(dy,
                     mean(y),
                     "Gaussian",
                     lkern,
                     aggkern,
                     aws,
                     memory,
                     ladjust,
                     hmax,
                     1,
                     wghts)
    if (is.null(mask)) {
      if (length(dy) == 0)
        mask <- rep(TRUE, length(y))
      else
        mask <- array(TRUE, dy)
    } else {
# diagnostics only without mask
      u <- NULL
      graph <- demo <-  FALSE
    }
    dmask <- dim(mask)
    nvoxel <- sum(mask)
    position <- array(0,dmask)
    position[mask] <- 1:nvoxel
    if(!is.null(u)){
       if(!all(dim(u)==dmask))  u <- u[1]
    }
    lkern <- cpar$lkern
    lambda <-
      2.5 * cpar$lambda # Gaussian case + 25% for estimating variances
    maxvol <- cpar$maxvol
    k <- cpar$k
    kstar <- cpar$kstar
    cpar$tau1 <- cpar$tau1 * 2
    cpar$tau2 <- cpar$tau2 * 2
    hmax <- cpar$hmax
    shape <- cpar$shape
    if (lkern == 5) {
      #  assume  hmax was given in  FWHM  units (Gaussian kernel will be truncated at 4)
      hmax <- hmax * 0.42445 * 4
    }
    d <- cpar$d
    n <- length(y)
    #
    #   family dependent transformations
    #
    zfamily <- awsgfamily(y, scorr, d)
    sigma2 <- zfamily$sigma2
    h0 <- zfamily$h0
    rm(zfamily)
    if (lkern == 5) {
      #  assume  hmax was given in  FWHM  units (Gaussian kernel will be truncated at 4)
      hmax <- hmax * 0.42445 * 4
      hinit <- 0.42445 * 4
    }
    if (demo && !graph)
      graph <- TRUE
    # now check which procedure is appropriate
    ##  this is the version on a grid
    n <- length(y)
    n1 <- switch(d, n, dy[1], dy[1])
    n2 <- switch(d, 1, dy[2], dy[2])
    n3 <- switch(d, 1, 1, dy[3])
    if(d==1) dy[1] <- n
    #
    #    Initialize  for the iteration
    #
    #wghts<-(wghts[2:3]/wghts[1])
    y <- y[mask]
    tobj <- list(
      bi = rep(1, nvoxel),
      bi2 = rep(1, nvoxel),
      theta = y / shape
    )
    zobj <- list(ai = y, bi0 = rep(1, nvoxel))
    mae <- NULL
    lambda0 <-
      1e50 # that removes the stochstic term for the first step, initialization by kernel estimates
    #
    #   produce a presmoothed estimate to stabilze variance estimates
    #
    if (is.null(hpre))
      hpre <- 20 ^ (1 / d)
    dlw <- (2 * trunc(hpre / c(1, wghts)) + 1)[1:d]
    hobj <- .Fortran(C_caws,
      as.double(y),
      as.integer(position),
      as.integer(n1),
      as.integer(n2),
      as.integer(n3),
      as.double(hpre),
      as.double(1e40),
      double(nvoxel),
      bi = as.double(rep(1,nvoxel)),
      double(nvoxel),
      as.double(rep(1,nvoxel)),
      ai = as.double(rep(1,nvoxel)),
      as.integer(cpar$mcode),
      as.integer(lkern),
      as.double(0.25),
      double(prod(dlw)),
      as.double(wghts)
    )[c("bi", "ai")]
    hobj$theta <- hobj$ai / hobj$bi
    #
    #   iteratate until maximal bandwidth is reached
    #
    cat("Progress:")
    total <- cumsum(1.25 ^ (1:kstar)) / sum(1.25 ^ (1:kstar))
    while (k <= kstar) {
      hakt0 <- gethani(1, 10, lkern, 1.25 ^ (k - 1), wghts, 1e-4)
      hakt <- gethani(1, 10, lkern, 1.25 ^ k, wghts, 1e-4)
      cat("step", k, "hakt", hakt, "\n")
      if (lkern == 5) {
        #  assume  hmax was given in  FWHM  units (Gaussian kernel will be truncated at 4)
        hakt <- hakt * 0.42445 * 4
      }
      dlw <- (2 * trunc(hakt / c(1, wghts)) + 1)[1:d]
      if (scorr[1] >= 0.1)
        lambda0 <-
        lambda0 * Spatialvar.gauss(hakt0 / 0.42445 / 4, h0, d) / Spatialvar.gauss(hakt0 /
                                                                                    0.42445 / 4, 1e-5, d)
      # Correction for spatial correlation depends on h^{(k)}
      hakt0 <- hakt
      # heteroskedastic Gaussian case
      zobj <- .Fortran(C_cgaws,
        as.double(y),
        as.integer(position),
        as.double(sigma2),
        as.integer(n1),
        as.integer(n2),
        as.integer(n3),
        hakt = as.double(hakt),
        as.double(lambda0),
        as.double(tobj$theta),
        bi = as.double(tobj$bi),
        bi2 = double(nvoxel),
        bi0 = as.double(zobj$bi0),
        gi = double(nvoxel),
        gi2 = double(nvoxel),
        ai = as.double(zobj$ai),
        as.integer(lkern),
        as.double(0.25),
        double(prod(dlw)),
        as.double(wghts)
      )[c("bi", "bi0", "bi2", "ai", "gi", "gi2","hakt")]
      if (hakt > n1 / 2)
        zobj$bi0 <- rep(max(zobj$bi), nvoxel)
      tobj <- updtheta(zobj, tobj, cpar)
      tobj$gi <- zobj$gi
      tobj$gi2 <- zobj$gi2
      if (graph) {
        #
        #     Display intermediate results if graph == TRUE
        #
        if (d == 1) {
          oldpar <- par(
            mfrow = c(1, 2),
            mar = c(3, 3, 3, .2),
            mgp = c(2, 1, 0)
          )
          plot(y, ylim = range(y, tobj$theta), col = 3)
          if (!is.null(u))
            lines(u, col = 2)
          lines(tobj$theta, lwd = 2)
          title(paste("Reconstruction  h=", signif(hakt, 3)))
          plot(tobj$bi, type = "l", ylim = range(0, tobj$bi))
          lines(tobj$eta * max(tobj$bi), col = 2)
          title("Sum of weights and eta")
        }
        if (d == 2) {
          oldpar <- par(
            mfrow = c(2, 2),
            mar = c(1, 1, 3, .25),
            mgp = c(2, 1, 0)
          )
          image(array(y,dy),
                col = grey((0:255) / 255),
                xaxt = "n",
                yaxt = "n")
          title(paste(
            "Observed Image  min=",
            signif(min(y), 3),
            " max=",
            signif(max(y), 3)
          ))
          image(
            array(tobj$theta,dy),
            col = grey((0:255) / 255),
            xaxt = "n",
            yaxt = "n"
          )
          title(paste(
            "Reconstruction  h=",
            signif(hakt, 3),
            " min=",
            signif(min(tobj$theta), 3),
            " max=",
            signif(max(tobj$theta), 3)
          ))
          image(
            array(tobj$bi,dy),
            col = grey((0:255) / 255),
            xaxt = "n",
            yaxt = "n"
          )
          title(paste(
            "Sum of weights: min=",
            signif(min(tobj$bi), 3),
            " mean=",
            signif(mean(tobj$bi), 3),
            " max=",
            signif(max(tobj$bi), 3)
          ))
          }
        if (d == 3) {
          oldpar <- par(
            mfrow = c(2, 2),
            mar = c(1, 1, 3, .25),
            mgp = c(2, 1, 0)
          )
          image(array(y,dy)[, , n3 %/% 2 + 1],
                col = grey((0:255) / 255),
                xaxt = "n",
                yaxt = "n")
          title(paste(
            "Observed Image  min=",
            signif(min(y), 3),
            " max=",
            signif(max(y), 3)
          ))
          image(
            array(tobj$theta,dy)[, , n3 %/% 2 + 1],
            col = grey((0:255) / 255),
            xaxt = "n",
            yaxt = "n"
          )
          title(paste(
            "Reconstruction  h=",
            signif(hakt, 3),
            " min=",
            signif(min(tobj$theta), 3),
            " max=",
            signif(max(tobj$theta), 3)
          ))
          image(
            array(tobj$bi,dy)[, , n3 %/% 2 + 1],
            col = grey((0:255) / 255),
            xaxt = "n",
            yaxt = "n"
          )
          title(paste(
            "Sum of weights: min=",
            signif(min(tobj$bi), 3),
            " mean=",
            signif(mean(tobj$bi), 3),
            " max=",
            signif(max(tobj$bi), 3)
          ))
        }
        par(oldpar)
      }
      #
      #    Calculate MAE and MSE if true parameters are given in u
      #    this is for demonstration and testing for propagation (parameter adjustments)
      #    only.
      #
      if (!is.null(u)) {
        cat(
          "bandwidth: ",
          signif(hakt, 3),
          "eta==1",
          sum(tobj$eta == 1),
          "   MSE: ",
          signif(mean((tobj$theta - u) ^ 2), 3),
          "   MAE: ",
          signif(mean(abs(tobj$theta - u)), 3),
          " mean(bi)=",
          signif(mean(tobj$bi), 3),
          "\n"
        )
        mae <- c(mae, signif(mean(abs(tobj$theta - u)), 3))
      }
      if (demo)
        readline("Press return")
      #
      #   Prepare for next iteration
      #
      #
      #   Create new variance estimate
      #
      vobj <- awsgsigma2(y, hobj, tobj, varmodel, varprop)
      sigma2 <- vobj$sigma2inv
      coef <- vobj$coef
      x <- 1.25 ^ (k - 1)
      scorrfactor <- x / (3 ^ d * prod(scorr) * prod(h0) + x)
      lambda0 <- lambda * scorrfactor
      if (max(total) > 0) {
        cat(signif(total[k], 2) * 100, "% . ", sep = "")
      }
      k <- k + 1
      gc()
    }
    cat("\n")
    ###
    ###            end iterations now prepare results
    ###
    ###   component var contains an estimate of Var(tobj$theta) if aggkern="Uniform", or if qtau1=1
    ###
    vartheta <- array(0,dmask)
    vartheta[mask] <- tobj$bi2 / tobj$bi ^ 2
    vartheta <-
      vartheta / Spatialvar.gauss(hakt / 0.42445 / 4, h0 + 1e-5, d) * Spatialvar.gauss(hakt /
                                                                     0.42445 / 4, 1e-5, d)
    y0 <- theta <- sigma2 <- bi <- array(0,dmask)
    theta[mask] <- tobj$theta
    sigma2[mask] <- vobj$sigma2inv
    y0[mask] <- y
    bi[mask] <- tobj$bi
    awsobj(
      y0,
      theta,
      vartheta,
      hakt,
      1 / sigma2,
      lkern,
      lambda,
      ladjust,
      aws,
      memory,
      args,
      homogen = FALSE,
      earlystop = FALSE,
      family = "Gaussian",
      wghts = wghts,
      scorr = scorr,
      vcoef = coef,
      mae = mae,
      mask = mask,
      ni = bi
    )
  }
###########################################################################
#
#   Auxiliary functions
#
############################################################################
#
#   transformations for Gaussian case with variance modelling
#
############################################################################
awsgfamily <- function(y, scorr, d) {
  h0 <- numeric(d)
  if (scorr[1] > 0) {
    if (length(scorr) < d)
      scorr <- c(scorr, rep(0, d))[1:d]
    for (i in 1:d)
      h0[i] <- geth.gauss(scorr[i])
    cat("Corresponding bandwiths for specified correlation:",
        h0,
        "\n")
  }
  sigma2 <- IQRdiff(as.vector(y)) ^ 2
  if (scorr[1] > 0)
    sigma2 <- sigma2 * Varcor.gauss(h0)
  cat("Estimated variance: ", signif(sigma2, 4), "\n")
  sigma2 <- rep(sigma2, length(y))
  sigma2 <- 1 / sigma2 #  taking the invers yields simpler formulaes
  list(sigma2 = sigma2, h0 = h0)
}
############################################################################
#
#  estimate the inverse of the variances from squared residuals using a
#    constant, linear or quadratic variance model; the nonadaptive
#    estimate hobj is used to stabilize the result
#  expects only the voxels within the mask
#
############################################################################
awsgsigma2 <- function(y, hobj, tobj, varmodel, varprop) {
  if (is.null(dy <- dim(y)))
    dy <- length(y)
  if (is.null(dy))
    d <- 1
  else
    d <- length(dy)
  ind <- tobj$gi > 1
  residsq <-
    ((y - tobj$theta)[ind] * tobj$gi[ind] / (tobj$gi[ind] - pmin(.95*tobj$gi[ind],1)))^2
  theta <- tobj$theta[ind]
  if (varmodel == "Quadratic")
    theta2 <- theta ^ 2
  wght <- tobj$gi[ind] - 1
  coef <- switch(
    varmodel,
    Constant = coefficients(lm(residsq ~ 1, weights = wght ^
                                 2)),
    Linear = coefficients(lm(residsq ~ theta, weights = wght ^
                               2)),
    Quadratic = coefficients(lm(residsq ~ theta + theta2, weights =
                                  wght ^ 2))
  )
  gamma <- pmin(tobj$gi / hobj$bi, 1)
  theta <- gamma * tobj$theta + (1 - gamma) * hobj$theta
  #
  #    use smoother estimates to obtain more stable variance estimates
  #
  sigma2 <- switch(
    varmodel,
    Constant = array(coef, dy),
    Linear = coef[1] + coef[2] * theta,
    Quadratic = coef[1] + coef[2] * theta + coef[3] * theta ^
      2
  )
  #varquantile <- quantile(residsq,varprop)
  varquantile <- varprop * mean(sigma2)
  sigma2 <- pmax(sigma2, varquantile)
  cat(
    "Estimated mean variance",
    signif(mean(sigma2), 3),
    " Variance parameters:",
    signif(coef, 3),
    "\n"
  )
  list(sigma2inv = 1 / sigma2, coef = coef)
}