## rmx: Radius-Minimax Estimators
##
## Documented in rmx.norm

###############################################################################
## RMX estimator for normal location and scale
###############################################################################
## RMX estimator of mean and sd for a normal sample.
##
## Arguments:
##   x            numeric vector of observations.
##   eps.lower,
##   eps.upper    bounds of the interval of contamination amounts 'eps'; used
##                only when 'eps' is NULL. 'eps.upper' is then required.
##   eps          contamination amount; if given, the interval is ignored.
##                'eps = 0' returns mean and (ML-scaled) sd.
##   k            number of steps passed on to .kstep.norm.
##   initial.est  NULL (median and MAD are used) or numeric vector c(mean, sd).
##   fsCor        if TRUE the radius is passed through fsRadius.norm before the
##                multipliers are computed.
##   na.rm        if TRUE missing values are dropped before anything else, so
##                that the sample size (and hence the radius) is based on the
##                observed values only.
##   mad0         scale used as initial estimate when the MAD is exactly 0.
##
## Value: list of class "rmx" with components 'rmxEst' (named c(mean, sd)),
##   'rmxIF' (influence function object), 'initial.est', 'Infos' (character
##   matrix with columns "method" and "message") and 'n' (sample size used).
##
## Errors: stops if neither 'eps' nor 'eps.upper' is given, or if
##   'initial.est' is not a numeric vector of length 2 with positive sd.
rmx.norm <- function(x, eps.lower=0, eps.upper=NULL, eps=NULL, k = 3L, 
                     initial.est=NULL, fsCor = TRUE, na.rm = TRUE, mad0 = 1e-4){
    ## 'na.rm' used to be ignored, which let NAs inflate the sample size
    if(na.rm) x <- x[!is.na(x)]
    n <- length(x)
    sqrtn <- sqrt(n)
    
    ## radius r = sqrt(n)*eps, either given directly or chosen inside
    ## [rlo, rup] as the root of .getInterval.norm
    if(is.null(eps)){
        if(is.null(eps.upper))
            stop("either 'eps' or 'eps.upper' must be specified")
        rlo <- sqrtn*eps.lower
        rup <- sqrtn*eps.upper
        if(rlo > 10){
            r <- (rlo + rup)/2
        }else{
            r <- uniroot(.getInterval.norm, lower = rlo+1e-8, upper = rup, 
                         tol = .Machine$double.eps^0.25, rlo = rlo, rup = rup)$root
        }
    }else{
        r <- sqrtn*eps
    }
    ## keep the uncorrected radius for the messages and the inefficiency
    r.as <- r
    if(fsCor) r <- fsRadius.norm(r = r, n = n)
    
    if(n <= 2){
        warning("Sample size <= 2! => Median and MAD are used for estimation.")
        rmxEst <- c(median(x), mad(x))
        names(rmxEst) <- c("mean", "sd")
        Info.matrix <- matrix(c("rmx", "median and MAD"), ncol = 2, 
                              dimnames = list(NULL, c("method", "message")))
        
        IF <- .getMedMADIF(AM = rmxEst[1], SD = rmxEst[2], r = r)
        
        ## 'n' is included so that all return paths have the same components
        RMX <- list(rmxEst = rmxEst, rmxIF = IF, initial.est = NULL, 
                    Infos = Info.matrix, n = n)
        class(RMX) <- "rmx"
        return(RMX)
    }
    if(!is.null(eps)){
        if(eps == 0){
            rmxEst <- c(mean(x), sqrt((n-1)/n)*sd(x))
            names(rmxEst) <- c("mean", "sd")
            Info.matrix <- matrix(c("rmx", "mean and sd"), ncol = 2, 
                                  dimnames = list(NULL, c("method", "message")))
            
            IF <- .getMLIF.norm(mean = rmxEst[1], sd = rmxEst[2])
            IF$radius <- 0

            RMX <- list(rmxEst = rmxEst, rmxIF = IF, initial.est = NULL, 
                        Infos = Info.matrix, n = n)
            class(RMX) <- "rmx"
            return(RMX)
        }
    }
    if(is.null(initial.est)){
        MEAN <- median(x, na.rm = TRUE)
        SD <- mad(x, center = MEAN, na.rm = TRUE)
        if(SD == 0){
            warning("'mad(x) = 0' => cannot compute a valid initial estimate. 
                     To avoid division by zero 'mad0' is used. You could also 
                     specify a valid initial estimate for scale via 'initial.est'. 
                     Note that you have to provide an initial estimate for mean and sd.")
            SD <- mad0
        }
    }else{
        stopifnot(is.numeric(initial.est))
        if(length(initial.est) != 2)
            stop("'initial.est' needs to be a numeric vector of length 2 or NULL")
        MEAN <- initial.est[1]
        SD <- initial.est[2]
        if(SD <= 0)
            stop("initial estimate for sd <= 0 which is not valid")
    }
    
    ## multipliers A1, A2, a and clipping bound b at radius r, scaled by the
    ## initial sd; for r > 10 closed-form expressions with fixed constants are
    ## used instead of the interpolation helpers
    if(r > 10){
        b <- SD*1.618128043
        const <- 1.263094656
        A2 <- b^2*(1+r^2)/(1+const)
        A1 <- const*A2
        a <- c(0, -0.6277527697*A2/SD)
    }else{
        A1 <- SD^2*.getA1.norm(r)
        A2 <- SD^2*.getA2.norm(r)
        a <- SD*c(0, .geta.norm(r))
        b <- SD*.getb.norm(r)
    }
    rmxEst.all <- .kstep.norm(x = x, initial.est = c(MEAN, SD), 
                              A1 = A1, A2 = A2, a = a, b = b, k = k)
    
    info.dimnames <- list(NULL, c("method", "message"))
    if(!is.null(eps)){
        if(fsCor){
            eps.label <- "fs-corrected estimate for 'eps' ="
        }else{
            eps.label <- "asymptotic estimate for 'eps' ="
        }
        Info.matrix <- matrix(c("rmx", paste(eps.label, round(eps, 3))),
                              ncol = 2, dimnames = info.dimnames)
    }else{
        ## inefficiency reported in the info matrix, relative to the lower
        ## end of the radius interval
        if(rlo == 0){
            ineff <- (A1 + A2 - b^2*r.as^2)/(1.5*SD^2)
        }else{
            if(rlo > 10){
                ineff <- 1
            }else{
                A1lo <- SD^2*.getA1.norm(rlo)
                A2lo <- SD^2*.getA2.norm(rlo)
                ineff <- (A1 + A2 - b^2*(r.as^2 - rlo^2))/(A1lo + A2lo)
            }
        }
        if(fsCor){
            interval.label <- "fs-corrected rmx estimate for 'eps' in ["
            lf.label <- "least favorable (uncorrected) contamination: "
        }else{
            interval.label <- "rmx estimate for 'eps' in ["
            lf.label <- "least favorable contamination: "
        }
        ## without fs-correction r.as equals r, so r.as serves both cases
        Info.matrix <- matrix(c(rep("rmx", 3), 
                                paste0(interval.label, round(eps.lower, 3), ", ", 
                                       round(eps.upper, 3), "]"),
                                paste0(lf.label, 100*signif(r.as/sqrtn, 3), " %"),
                                paste0("maximum asymptotic MSE-inefficiency: ", 
                                       signif(ineff, 3))), 
                              ncol = 2, dimnames = info.dimnames)
    }
    IF <- .getRMXIF(r, rmxEst.all)
    
    rmxEst <- rmxEst.all$est
    names(rmxEst) <- c("mean", "sd")
    
    RMX <- list(rmxEst = rmxEst, rmxIF = IF, initial.est = c(MEAN, SD), 
                Infos = Info.matrix, n = n)
    class(RMX) <- "rmx"
    RMX
}
###############################################################################
## computation of radius-minimax IC
## using pre-computed results included in "sysdata.rda"
###############################################################################
## A1 at radius 'r': linear interpolation (stats::approx) of the stored values
## '.A1.norm' over the grid '.radius.gitter.norm'; 1 is returned for radii
## left of the grid.
.getA1.norm <- function(r){
    interpolated <- approx(x = .radius.gitter.norm, y = .A1.norm, 
                           xout = r, yleft = 1)
    interpolated$y
}
## A2 at radius 'r': linear interpolation (stats::approx) of the stored values
## '.A2.norm' over the grid '.radius.gitter.norm'; 0.5 is returned for radii
## left of the grid.
.getA2.norm <- function(r){
    interpolated <- approx(x = .radius.gitter.norm, y = .A2.norm, 
                           xout = r, yleft = 0.5)
    interpolated$y
}
## Centering value a at radius 'r': linear interpolation (stats::approx) of
## the stored values '.a.norm' over the grid '.radius.gitter.norm'; 0 is
## returned for radii left of the grid.
.geta.norm <- function(r){
    interpolated <- approx(x = .radius.gitter.norm, y = .a.norm, 
                           xout = r, yleft = 0)
    interpolated$y
}
## Clipping bound b at radius 'r': linear interpolation (stats::approx) of the
## stored values '.b.norm' over the grid '.radius.gitter.norm'; Inf is
## returned for radii left of the grid.
.getb.norm <- function(r){
    interpolated <- approx(x = .radius.gitter.norm, y = .b.norm, 
                           xout = r, yleft = Inf)
    interpolated$y
}
## Diagonal matrix built from the interpolated stored variances for mean and
## sd at radius 'r' ('.asVar.mean.norm', '.asVar.sd.norm' over the grid
## '.radius.gitter.norm'). Left of the grid the values 1.0 and 0.5 are used.
.getAsVar.norm.approx <- function(r){
    ## one interpolation on the shared radius grid
    lookup <- function(values, left){
        approx(x = .radius.gitter.norm, y = values, xout = r, yleft = left)$y
    }
    variances <- c(lookup(.asVar.mean.norm, 1.0), lookup(.asVar.sd.norm, 0.5))
    diag(variances)
}
## Objective function handed to uniroot() in rmx.norm: for a candidate radius
## 'r' it returns the difference between the ratio evaluated at the upper
## interval end 'rup' and the ratio evaluated at the lower end 'rlo'.
## For radii > 10 closed-form expressions with fixed constants replace the
## interpolation helpers; for 'rlo == 0' the denominator is 1.5.
.getInterval.norm <- function(r, rlo, rup){
    b.fixed <- 1.618128043
    ratio.fixed <- 1.263094656
    
    ## multipliers at the candidate radius
    if(r > 10){
        b <- b.fixed
        A2 <- b^2*(1+r^2)/(1+ratio.fixed)
        A1 <- ratio.fixed*A2
    }else{
        A1 <- .getA1.norm(r)
        A2 <- .getA2.norm(r)
        b <- .getb.norm(r)
    }
    
    ## shared numerator, evaluated at a reference radius r0
    numerator <- function(r0) A1 + A2 - b^2*(r^2 - r0^2)
    
    ## denominator belonging to the lower end
    if(rlo == 0){
        denom.lo <- 1.5
    }else{
        A1lo <- .getA1.norm(rlo)
        A2lo <- .getA2.norm(rlo)
        denom.lo <- A1lo + A2lo
    }
    
    ## denominator belonging to the upper end
    if(rup > 10){
        A2up <- b.fixed^2*(1+rup^2)/(1+ratio.fixed)
        A1up <- ratio.fixed*A2up
    }else{
        A1up <- .getA1.norm(rup)
        A2up <- .getA2.norm(rup)
    }
    denom.up <- A1up + A2up
    
    numerator(rup)/denom.up - numerator(rlo)/denom.lo
}

###############################################################################
## computation of k-step construction
###############################################################################
## One update step: adds to 'initial.est' (c(mean, sd)) the sample average of
## the clipped two-dimensional score. Each observation's score (u, v) is
## down-weighted by min(1, b/|(u, v)|); NAs are dropped when averaging.
.onestep.norm <- function(x, initial.est, A1, A2, a, b){
    loc <- initial.est[1]
    scl <- initial.est[2]
    
    ## unclipped components for mean (u) and sd (v)
    score.loc <- A1*(x-loc)/scl^2
    score.scl <- A2*(((x-loc)/scl)^2-1)/scl - a[2]
    
    ## weight that limits the Euclidean length of the score to b
    score.len <- sqrt(score.loc^2 + score.scl^2)
    clip <- pmin(1, b/score.len)
    
    correction <- vapply(list(score.loc*clip, score.scl*clip), mean, 
                         numeric(1), na.rm = TRUE)
    initial.est + correction
}
## k-step construction: applies .onestep.norm once and, for k > 1, k - 1 more
## times. Before every further step (and once more after the last one) the
## multipliers are rescaled from the previous sd to the current sd:
## A1 and A2 by the squared ratio, a and b by the ratio.
##
## Arguments:
##   x            observations.
##   initial.est  starting value c(mean, sd).
##   A1, A2, a, b multipliers matching the scale of 'initial.est'.
##   k            number of steps; values <= 1 give exactly one step.
##
## Value: list with the final estimate 'est' and the multipliers 'A1', 'A2',
##   'a', 'b' rescaled to the sd of 'est'.
.kstep.norm <- function(x, initial.est, A1, A2, a, b, k){
    est <- .onestep.norm(x = x, initial.est = initial.est, 
                         A1 = A1, A2 = A2, a = a, b = b)
    if(k > 1){
        for(i in 2:k){
            A1 <- est[2]^2*A1/initial.est[2]^2
            A2 <- est[2]^2*A2/initial.est[2]^2
            a <- est[2]*a/initial.est[2]
            b <- est[2]*b/initial.est[2]
            initial.est <- est
            est <- .onestep.norm(x = x, initial.est = est,
                                 A1 = A1, A2 = A2, a = a, b = b)
        }
    }
    ## bring the multipliers to the scale of the final estimate
    A1 <- est[2]^2*A1/initial.est[2]^2
    A2 <- est[2]^2*A2/initial.est[2]^2
    a <- est[2]*a/initial.est[2]
    b <- est[2]*b/initial.est[2]
    
    list(est = est, A1 = A1, A2 = A2, a = a, b = b)
}
## Influence-function object (class "optIF") used when median and MAD serve
## as estimates (see the small-sample branch of rmx.norm).
##
## Arguments:
##   AM  location estimate.
##   SD  scale estimate.
##   r   radius stored in the result and used for asMSE and asBias.
##
## Value: list of class "optIF" with components model, modelName, parameter,
##   A, a, b, IFun (function of x returning a two-column matrix), range
##   (function(alpha, n) returning an equally spaced grid between the alpha/2
##   and 1 - alpha/2 normal quantiles), asMSE, asVar, asBias and radius.
.getMedMADIF <- function(AM, SD, r){
    ## bound of the sign-type IF component for the location
    b1 <- SD*sqrt(pi/2)
    A1 <- 1
    a1 <- 0
    
    ## bound and centering of the sign-type IF component for the scale
    b2 <- SD/(4*qnorm(0.75)*dnorm(qnorm(0.75)))
    A2 <- 1
    a2 <- (qnorm(0.75)^2 - 1)/SD
    A <- c(A1, A2)
    a <- c(a1, a2)
    b <- sqrt(b1^2 + b2^2)
    
    V1 <- b1^2
    V2 <- b2^2
    asVar <- diag(c(V1, V2))
    rownames(asVar) <- c("mean", "sd")
    colnames(asVar) <- c("mean", "sd")
    
    mse <- b1^2*(1+r^2) + b2^2*(1+r^2)
    names(mse) <- NULL
    ## asBias is the bias itself (not its square), so that
    ## asMSE = trace(asVar) + asBias^2 as in .getRMXIF
    bias <- r*sqrt(b1^2 + b2^2)
    names(bias) <- NULL
    
    param <- c(AM, SD)
    names(param) <- c("mean", "sd")
    IFun <- function(x){}
    body(IFun) <- substitute({ 
        z <- (x-AM)/sigma
        y1 <- b1*sign(z)
        y2 <- b2*sign((z^2 - 1)/sigma - a2)
        Y <- cbind(y1, y2)
        colnames(Y) <- c("IF for mean", "IF for sd")  
        Y
    }, list(AM = AM, sigma = SD, a2 = a2, b1 = b1, b2 = b2))
    range <- function(alpha, n = 501){} 
    ## substitute the estimates AM and SD; the former 'mean'/'sd' resolved to
    ## the base functions and made every call of range() fail
    body(range) <- substitute({
        rg <- qnorm(c(alpha/2, 1-alpha/2), mean = AM, sd = sigma)
        seq(from = rg[1], to = rg[2], length.out = n)
    }, list(AM = AM, sigma = SD))
    
    IF <- list(model = "norm", modelName = "normal location and scale", 
               parameter = param, A = A, a = a, b = b, IFun = IFun,
               range = range, asMSE = mse, asVar = asVar, asBias = bias,
               radius = r)
    class(IF) <- "optIF"
    IF
}
## Influence-function object (class "optIF") for the RMX estimate.
##
## Arguments:
##   r           radius; stored in the result and used to look up the
##               variances via .getAsVar.norm.approx.
##   rmxEst.all  list as returned by .kstep.norm (components est, A1, A2, a, b).
##
## Value: list of class "optIF" with components model, modelName, parameter,
##   A (diagonal matrix of A1, A2), a, b, IFun (function of x returning a
##   two-column matrix of the clipped IF), range (function(alpha, n) returning
##   an equally spaced grid between the alpha/2 and 1 - alpha/2 normal
##   quantiles), asMSE, asVar, asBias and radius.
.getRMXIF <- function(r, rmxEst.all){
    rmxEst <- rmxEst.all$est
    names(rmxEst) <- c("mean", "sd")
    A1 <- rmxEst.all$A1 
    A2 <- rmxEst.all$A2
    A <- diag(c(A1, A2))
    a <- rmxEst.all$a 
    b <- rmxEst.all$b
    ## multipliers divided by the squared sd estimate
    a1 <- A1/rmxEst[2]^2
    a3 <- A2/rmxEst[2]^2
    
    asVar <- rmxEst[2]^2*.getAsVar.norm.approx(r)
    rownames(asVar) <- c("mean", "sd")
    colnames(asVar) <- c("mean", "sd")
    mse <- rmxEst[2]^2*(a1 + a3)
    names(mse) <- NULL
    ## bias = sqrt(MSE - trace of variance); the difference is clamped at 0
    ## because rounding/interpolation error can push it marginally below
    ## zero, which would give NaN plus a warning
    bias <- sqrt(max(0, mse - sum(diag(asVar))))
    names(bias) <- NULL
    param <- rmxEst
    IFun <- function(x){}
    body(IFun) <- substitute({ 
        z <- (x-AM)/sigma
        hvkt <- sqrt(a1^2*z^2/sigma^2 + (a3*(z^2-1)/sigma - a2)^2)
        ind1 <- (hvkt < b)
        w <- ind1 + (1-ind1)*b/hvkt 
        Y <- cbind(a1*z/sigma, a3*(z^2-1)/sigma-a2)
        res <- Y*w
        colnames(res) <- c("IF for mean", "IF for sd")  
        res 
    }, list(AM = rmxEst[1], sigma = rmxEst[2], 
            a1 = A[1,1], a2 = a[2], a3 = A[2,2], b = b))
    range <- function(alpha, n = 501){} 
    body(range) <- substitute({
        rg <- qnorm(c(alpha/2, 1-alpha/2), mean = AM, sd = sigma)
        seq(from = rg[1], to = rg[2], length.out = n)
    }, list(AM = rmxEst[1], sigma = rmxEst[2]))
    
    IF <- list(model = "norm", modelName = "normal location and scale", 
               parameter = param, A = A, a = a, b = b, IFun = IFun,
               range = range, asMSE = mse, asVar = asVar, asBias = bias,
               radius = r)
    class(IF) <- "optIF"
    IF
}