R/UCV.R

## Tue Apr 16 03:33:05 2013
## Original file Copyright 2013 A.C. Guidoum
## This file is part of the R package kedd.
## Arsalane Chouaib GUIDOUM <acguidoum@usthb.dz> and <starsalane@gmail.com> 
## Department of Probabilities-Statistics
## Faculty of Mathematics
## University of Science and Technology Houari Boumediene
## BP 32 El-Alia, U.S.T.H.B, Algeris
## Algeria
##############################################################################



## Unbiased Cross-Validation (UCV)


h.ucv <- function(x, ...)  UseMethod("h.ucv")

h.ucv.default <- function(x,deriv.order=0,lower=0.1*hos,upper=2*hos,tol=0.1 * lower,
                          kernel=c("gaussian","epanechnikov", "uniform",
                            "triangular","triweight","tricube", "biweight",
                            "cosine"),...)
   {
     if (!is.numeric(x) || length(dim(x)) >=1 || length(x) < 3L) 
           stop("argument 'x' must be numeric and need at least 3 data points") 
     if (any(deriv.order < 0 || deriv.order != round(deriv.order))) 
           stop("argument 'deriv.order' is non-negative integers")
     r <- deriv.order   
     if (missing(kernel)) kernel <- "gaussian"
     name <- deparse(substitute(x))
     x <- x[!is.na(x)]
     x <- sort(x)
     n <- length(x)
     if (kernel=="epanechnikov" && 2*r >= 3)    return(structure(list(x=x, data.name=name,n=n, kernel=kernel, deriv.order=r, h = NA ,min.ucv=NA),class="h.ucv"))
     else if (kernel=="uniform" && 2*r >= 1)    return(structure(list(x=x, data.name=name,n=n, kernel=kernel, deriv.order=r, h = NA ,min.ucv=NA),class="h.ucv"))
     else if (kernel=="triweight" && 2*r >= 7)  return(structure(list(x=x, data.name=name,n=n, kernel=kernel, deriv.order=r, h = NA ,min.ucv=NA),class="h.ucv"))
     else if (kernel=="biweight" && 2*r >= 5)   return(structure(list(x=x, data.name=name,n=n, kernel=kernel, deriv.order=r, h = NA ,min.ucv=NA),class="h.ucv"))
     else if (kernel=="triangular" && 2*r >= 2) return(structure(list(x=x, data.name=name,n=n, kernel=kernel, deriv.order=r, h = NA ,min.ucv=NA),class="h.ucv"))
     else if (kernel=="tricube" && 2*r >= 10)   return(structure(list(x=x, data.name=name,n=n, kernel=kernel, deriv.order=r, h = NA ,min.ucv=NA),class="h.ucv"))  
     hos <- ((243 *(2*r+1)*A3_kMr(kernel,r))/(35* A2_kM(kernel)^2))^(1/(2*r+5)) * sd(x,na.rm = TRUE) * n^(-1/(2*r+5))
     if (!is.numeric(upper)){ 
		stop("argument 'upper' must be numeric. Default 2*hos (Oversmoothing) boundary was used")
		upper= 2*hos
	}
	if (!is.numeric(lower)){
		stop("argument 'lower' must be numeric. Default 0.1*hos boundary was used")
		lower=0.1*hos
	}
	if (lower < 0 | lower >= upper){
      	stop("the boundaries must be positive and 'lower' must be smaller than 'upper'. Default boundaries were used")
		upper=2*hos
		lower=0.1*hos
	}
	R_Kr1 <- A3_kMr(kernel,r)
     fucv <- function(h)
              {
      D <- kernel_fun_der(kernel, outer(x,x,"-")/h,deriv.order=2*r)
      diag(D) <- 0
      D <- ((-1)^r / ((n-1)*h^(2*r+1)))* colSums(D)
      D1 <- mean(D)
	  D2 <- kernel_fun_conv(kernel,outer(x,x,"-")/h,deriv.order=r)
	  diag(D2) <- 0
	  D3 <- ((-1)^r / ((n-1)*h^(2*r+1)))* colSums(D2)
	  D4 <- mean(D3)
      (1/(n*h^(2*r+1)))* R_Kr1 + D4 - 2*D1
              }
     obj <- optimize(fucv , c(lower, upper),tol=tol)
     structure(list(x=x, data.name=name,n=n, kernel=kernel, deriv.order=r, h = obj$minimum , 
                   min.ucv=obj$objective),class="h.ucv")
}

###### 

print.h.ucv <- function(x, digits=NULL, ...)
              {
    class(x) <- "h.ucv"
    cat("\nCall:\t","\tUnbiased Cross-Validation","\n",
	   "\nDerivative order = ",x$deriv.order,
        "\nData: ",x$data.name," (",x$n," obs.);","\tKernel: ",x$kernel, 
	    "\nMin UCV = ",format(x$min.ucv,digits=digits),";","\tBandwidth 'h' = ",format(x$h,digits=digits), "\n\n",sep="")
    invisible(x)
}

######

plot.ucv <- function(f,seq.bws=NULL,main=NULL,sub = NULL, xlab=NULL, ylab=NULL,
                      type="l",las=1,lwd=1,...)
                    {
    class(f) <- "h.ucv"
    r <- f$deriv.order
    n <- f$n
    kernel <- f$kernel
    x <- sort(f$x)
    if (kernel=="epanechnikov" && 2*r >= 3)    stop(" 'epanechnikov kernel derivative = 0' for '2*order >= 3' ")
    else if (kernel=="uniform" && 2*r >= 1)    stop(" 'uniform kernel derivative = 0' for '2*order >= 1' ")
    else if (kernel=="triweight" && 2*r >= 7)  stop(" 'triweight kernel derivative = 0' for '2*order >= 7' ")
    else if (kernel=="biweight" && 2*r >= 5)   stop(" 'biweight kernel derivative = 0' for '2*order >= 5' ")
    else if (kernel=="triangular" && 2*r >= 2) stop(" 'triangular kernel derivative = 0' for '2*order >= 2' ")
    else if (kernel=="tricube" && 2*r >= 10)   stop(" 'tricube kernel derivative = 0' for '2*order >= 10' ")
    if(is.null(xlab)) xlab <- "Bandwidths"
    if(is.null(ylab)) ylab <-  bquote(UCV~(h[(.(r))]))                
    if(is.null(main)){ 
	     if(r !=0) {main <- "Unbiased Cross-Validation function for \nBandwidth Choice for Density Derivative"}else{
	                main <- "Unbiased Cross-Validation function for \nBandwidth Choice for Density Function"}
	                }
    if(is.null(sub)) sub <- paste("Kernel",kernel,";","Derivative order = ",r)					
    if(is.null(seq.bws)){
       hos <- ((243 *(2*r+1)*A3_kMr(kernel,r))/(35* A2_kM(kernel)^2))^(1/(2*r+5)) * sd(x,na.rm = TRUE) * n^(-1/(2*r+5))
       seq.bws <- seq(0.15*hos,2*hos,length=50)
                         }
	R_Kr1 <- A3_kMr(kernel,r)
     fucv <- function(h)
              {
      D <- kernel_fun_der(kernel, outer(x,x,"-")/h,deriv.order=2*r)
      diag(D) <- 0
      D <- ((-1)^r / ((n-1)*h^(2*r+1)))* colSums(D)
      D1 <- mean(D)
	  D2 <- kernel_fun_conv(kernel,outer(x,x,"-")/h,deriv.order=r)
	  diag(D2) <- 0
	  D3 <- ((-1)^r / ((n-1)*h^(2*r+1)))* colSums(D2)
	  D4 <- mean(D3)
      (1/(n*h^(2*r+1)))* R_Kr1 + D4 - 2*D1
              }
    D <- lapply(1:length(seq.bws), function(i) fucv(seq.bws[i]))
    Minf <- c(do.call("rbind",D))
    plot.default(seq.bws,Minf,type=type,las=las,lwd=lwd,xlab=xlab,ylab=ylab,
		         main=main,sub=sub,font.main=2,cex.main=0.9,font.sub=2,cex.sub=0.7,...)
    return(list(kernel=kernel,deriv.order=r,seq.bws=seq.bws, ucv=Minf)) 
}


plot.h.ucv <- function(x,seq.bws=NULL,...) plot.ucv(x,seq.bws,...)


#####

lines.ucv <- function(f,seq.bws=NULL,...)
                    {
    class(f) <- "h.ucv"
    r <- f$deriv.order
    n <- f$n
    kernel <- f$kernel
    x <- sort(f$x)
    if (kernel=="epanechnikov" && 2*r >= 3)    stop(" 'epanechnikov kernel derivative = 0' for '2*order >= 3' ")
    else if (kernel=="uniform" && 2*r >= 1)    stop(" 'uniform kernel derivative = 0' for '2*order >= 1' ")
    else if (kernel=="triweight" && 2*r >= 7)  stop(" 'triweight kernel derivative = 0' for '2*order >= 7' ")
    else if (kernel=="biweight" && 2*r >= 5)   stop(" 'biweight kernel derivative = 0' for '2*order >= 5' ")
    else if (kernel=="triangular" && 2*r >= 2) stop(" 'triangular kernel derivative = 0' for '2*order >= 2' ")
    else if (kernel=="tricube" && 2*r >= 10)   stop(" 'tricube kernel derivative = 0' for '2*order >= 10' ")
    if(is.null(seq.bws)){
       hos <- ((243 *(2*r+1)*A3_kMr(kernel,r))/(35* A2_kM(kernel)^2))^(1/(2*r+5)) * sd(x,na.rm = TRUE) * n^(-1/(2*r+5))
       seq.bws <- seq(0.15*hos,2*hos,length=50)
                         }
	R_Kr1 <- A3_kMr(kernel,r)
     fucv <- function(h)
              {
      D <- kernel_fun_der(kernel, outer(x,x,"-")/h,deriv.order=2*r)
      diag(D) <- 0
      D <- ((-1)^r / ((n-1)*h^(2*r+1)))* colSums(D)
      D1 <- mean(D)
	  D2 <- kernel_fun_conv(kernel,outer(x,x,"-")/h,deriv.order=r)
	  diag(D2) <- 0
	  D3 <- ((-1)^r / ((n-1)*h^(2*r+1)))* colSums(D2)
	  D4 <- mean(D3)
      (1/(n*h^(2*r+1)))* R_Kr1 + D4 - 2*D1
              }
    D <- lapply(1:length(seq.bws), function(i) fucv(seq.bws[i]))
    Minf <- c(do.call("rbind",D))
    lines.default(seq.bws,Minf,...)
    invisible(NULL)
}

lines.h.ucv <- function(x,seq.bws=NULL,...) lines.ucv(x,seq.bws,...) 

Try the kedd package in your browser

Any scripts or data that you put into this service are public.

kedd documentation built on May 2, 2019, 7:32 a.m.