inst/examples/matClust.R

## Fit a Matern cluster point process model
## to the `redwood` data from package spatstat

library(qle)
library(spatstat)

# set options
options(mc.cores=2L)
RNGkind("L'Ecuyer-CMRG")

# summary statistics: the estimated intensity followed by the
# (positive) values of the K-function at the distances `cond$rr`
simStat <- function(X,cond){
 x <- Kest(X,r=cond$rr,correction="best")
 x <- x[[attr(x,"valu")]]	# extract the recommended estimate
 x <- x[x>0]
 if(anyNA(x) || any(!is.finite(x))) {
  warning(.makeMessage("`NA`, `NaN` or `Inf` detected.","\n"))
  x <- x[is.finite(x)]		# drops NA, NaN and Inf alike
 }
 return(c(intensity(X),x))
}

# simulation function
simClust <- function(theta,cond){
 X <- rMatClust(theta["kappa"],theta["R"],theta["mu"],win=cond$win)	
 simStat(X,cond)
}
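
# a quick single run (a sketch, with hypothetical parameter values
# chosen within the bounds defined further below):
# simClust(c("kappa"=25,"R"=0.08,"mu"=3),
#          list(win=owin(c(0,2),c(0,2)), rr=seq(0,0.3,by=0.05)))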

# plot diagnostics 
plotGraphs <- function(par, nsim = 100) {
	# fit by minimum contrast
	fit0.mc <- kppm(redwood, ~1, "MatClust")
	# fit by QLE
	names(par)<-c("kappa","scale","mu")
	fit0.ql <- kppm(redwood,~1,"MatClust",
			improve.type="none",startpar=par[1:2],
			control=list(maxit=0),algorithm="SANN")
	# inject the QL estimate of `mu` into the fitted model object
	fit0.ql$Fit$mcfit$mu <- fit0.ql$mu <- fit0.ql$modelpar[3] <- par[3]
		
	# plotting
	oldpar <- par(no.readonly = TRUE)
	par(mfrow=c(3,2))	
	plot(envelope(fit0.mc, Kest, nsim = nsim), main="Minimum Contrast")
	plot(envelope(fit0.ql, Kest, nsim = nsim), main="QL estimation")
	plot(envelope(fit0.mc, Gest, nsim = nsim), main="Minimum Contrast")
	plot(envelope(fit0.ql, Gest, nsim = nsim), main="QL estimation")
	plot(envelope(fit0.mc, Fest, nsim = nsim), main="Minimum Contrast")
	plot(envelope(fit0.ql, Fest, nsim = nsim), main="QL estimation")
	par(oldpar)
	
	# statistics
	cat("Fitted by quasi-likelihood: \n\n")
	print(coef(summary(fit0.ql)))
	cat("\n\n")
	cat("Fitted by minimum contrast: \n\n")
	print(coef(summary(fit0.mc)))	
}

# load example data set (spatstat)
data(redwood)

# observation window
win <- owin(c(0, 2), c(0, 2))

# condition object: further options
# needed for the simulation function 
cond <- list(win=win,rr=seq(0,0.3,by=0.05)) 
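
# sanity check (a sketch): observed and simulated statistics must match
# in length and ordering; note that simStat() drops zero K-function values
# length(simStat(redwood,cond)) == length(simClust(c("kappa"=25,"R"=0.08,"mu"=3),cond))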

# quasi-likelihood estimation options
nsim <- 50				# simulation replications per design point
Nsample <- 12			# size of the initial design

# define parameter space
lb <- c("kappa"=20,"R"=0.01,"mu"=1)
ub <- c("kappa"=35,"R"=0.25,"mu"=5)

# general approach to initialize a (local) cluster object;
# makeCluster() and friends are provided by the parallel package
library(parallel)
cl <- makeCluster(4L)
clusterSetRNGStream(cl)
clusterCall(cl,fun=function(x) library("spatstat", character.only=TRUE))
clusterExport(cl=cl,varlist=c("simStat","searchMinimizer"), envir=environment())

# simulate design points and statistics
sim <- simQLdata(sim=simClust,cond=cond,nsim=nsim,
		method="randomLHS",lb=lb,ub=ub,N=Nsample,cl=cl)

# check simulations used
attr(sim,"nsim")

# generated random design
X <- attr(sim,"X")

# observed statistics (redwood data)
obs0 <- simStat(redwood,cond)
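
# by construction, the first component of the observed statistics
# is the estimated intensity of the redwood pattern (a sketch):
# all.equal(obs0[1], unname(intensity(redwood)))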

# set up the QL model with a kriging approximation of the
# covariance matrix and the bootstrapping option enabled
qsd <- getQLmodel(sim,lb,ub,obs0,		
		var.type="kriging",			# kriging variance matrix
		intrinsic=TRUE, Nb = 100,	# use bootstrap option, number of bootstrap samples
		verbose=TRUE)

#qsd <- getQLmodel(sim,lb,ub,obs0,
#		var.type="wcholMean",		# weighted average approximation of the variance matrix
#		intrinsic=TRUE, Nb = 100,	# use bootstrap option, number of bootstrap samples
#		verbose=TRUE)

# inspect the fitted covariance (kriging) models of the statistics
#qsd$covT
#qsd$covL

# cross-validation: fitting CV covariance models
cvm <- prefitCV(qsd, reduce=FALSE, cl=cl,verbose=TRUE)

# starting point for local search
x0 <- c("kappa"=22,"R"=0.08,"mu"=2.5)

# use the maximum of kriging and CV-based variances
attr(cvm,"type") <- "max"

# random sample
#Xc <- multiDimLHS(N=100,qsd$lower,qsd$upper,type="matrix")
#D <- quasiDeviance(Xc,qsd,cvm=cvm,verbose=TRUE)
#S <- t(sapply(D,"[[","score"))
#colMeans(S)

opts <- list("pl"=10,"xscale"=c(10,0.1,1),"ftol_abs"=1e-8,
		"score_tol"=1e-5,"restart"=0)
 
(QS0 <- qscoring(qsd,x0,opts=opts,cvm=cvm,verbose=TRUE))

D <- quasiDeviance(QS0$par,qsd,cvm=cvm,verbose=TRUE)[[1]]
D$value
#covarTx(qsd,theta=QS0$par,cvm=cvm)
#attr(D,"Sigma")

#print(QS0$Qnorm,digits=12)
#print(QS0$value,digits=12)
#quasiDeviance(QS0$par,qsd,cvm=cvm,verbose=TRUE)[[1]]

#debug(searchMinimizer)
#S0 <- searchMinimizer(x0, qsd,method=c("qscoring","bobyqa"),cvm=NULL,
#		restart=FALSE,verbose=TRUE)

# multistart version of finding a root;
# further arguments (...) are passed to searchMinimizer
method <- c("qscoring","bobyqa","cobyla")
S0 <- multiSearch(x0=x0,qsd=qsd,method=method,opts=opts,
		 check=FALSE,cvm=cvm,nstart=50,optInfo=TRUE,
		  multi.start=TRUE,cl=cl,pl=1,verbose=TRUE)
 
# best found root
(roots <- attr(S0,"roots"))
(id <- attr(roots,"id"))
stopifnot(!is.na(id))
attr(roots,"par")
RES <- attr(S0,"optRes")
length(RES)
attr(S0,"hasError")

# inspect a single restart and evaluate the
# quasi-deviance at its starting point
id <- 15
RES <- attr(S0,"optRes")[[id]]
x <- RES$start
QD <- quasiDeviance(x,qsd,cvm=cvm,verbose=TRUE)

(QSF <- qscoring(qsd,x0,opts=opts,cvm=cvm,verbose=TRUE))

(S2 <- searchMinimizer(x0,qsd,method="neldermead",
		 cvm=cvm,verbose=TRUE))

rbind(QSF$par,S2$par)
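# both methods start from the same point and should end up near the
# same root if the quasi-score surface is well-behaved around x0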

## inspect CV errors vs. kriging variances
# average CV errors: values close to zero indicate
# no significant bias in predicting the statistics
crossValTx(qsd, cvm, type = "acve")

# compare the magnitudes of the prediction errors:
# here the first statistic (the intensity) is more sensitive to
# leaving out a single sample point of the initial design
# than the other statistics are.
crossValTx(qsd, cvm, type = "mse")

# adequacy of the prediction models
crossValTx(qsd, cvm, type = "ascve")
# T2,T4,T5 -> the kriging variance underestimates the actual prediction error (measured by the CV error)
# T1,T3,T6,T7 -> the actual CV error falls short of the prediction error
# indicated by the kriging variance. Strategy: use the maximum of both error measures
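# this strategy is implemented above by `attr(cvm,"type") <- "max"`,
# which makes the quasi-deviance use the larger of both error measures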

# compute the kriging variance at the sample points i=1,...,n,
# leaving out the i-th sample point each time
crossValTx(qsd, cvm, type = "sigK")

## could compare these to the kriging variance:
# dx <- attr(qsd$qldata,"xdim")
# T <- qsd$qldata[(dx+1):(dx+length(qsd$covT))]
# varKM(qsd$covT,X,X,T)

# start the main estimation using the selection
# criterion `score` (see the vignette) and
# the maximum of CV errors and kriging variances
# in order to account for the prediction uncertainty
# of the sample means of the statistics

qs.opts <- list("xscale"=c(10,0.1,1),"ftol_abs"=1e-4,"score_tol"=1e-4)

# use multiple cores (mclapply) for computations other
# than simulating the model, i.e. 'use.cluster=FALSE'
# options(qle.multicore="lapply")

# start estimation
# nsim <- attr(qsd$qldata,"nsim")
# call object which adapts the number of simulations per candidate point:
# as long as the global phase is active, double `nsim` (capped at 1000)
Fnsim <- as.call(list(
	function(n) {
		if(status[["global"]] < 2L) {
		 min(2*n,1000)
		} else n
	}, quote(nsim)))
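
# evaluating the call by hand (a sketch: inside qle() a variable `status`
# reflecting the algorithm's current phase is presumably provided; here
# we mimic it in the global environment):
# status <- list("global"=1L)
# eval(Fnsim)	# -> 100, i.e. nsim is doubled while the global phase is active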

OPT <- qle(qsd, simClust, cond=cond,
		nsim=nsim,									
		fnsim=Fnsim,								# function call to increase number of simulations
		qscore.opts = qs.opts,
		global.opts = list("maxiter"=10,"maxeval" = 15,
				"weights"=c(50,10,5,1,0.1),
				"NmaxQI"=5,"nstart"=100,
				"xscale"=c(10,0.1,1)),
		local.opts = list("lam_max"=1e-2,
				          "nobs"=200,				# number of (bootstrap) observations for testing local minimizer
				          "nextSample"="score",		# sample criterion
				          "ftol_abs"=1e-2,			# lower bound on criterion value, triggers testing local minimizer if above
						  "weights"=c(0.55),		# constant weight factor
						  "eta"=c(0.025,0.075),	    # ignored, automatic adjustment of weights
						  "test"=FALSE),			# testing is enabled						  
		method = c("qscoring","bobyqa","direct"),		
		errType="max", iseed=297, cl=cl, pl=1,
		use.cluster = FALSE)						# cluster is only used for model simulation			

print(OPT,pl=10)

OPT$ctls				# controls and stopping conditions
OPT$cvm					# CV covariance models used
OPT$why					# reason(s) for termination
OPT$qsd$qldata[,1:3]	# final design points (parameter samples)

# extract information of parameter estimation
local <- OPT$final
info <- attr(OPT,"optInfo")
track <- attr(OPT,"tracklist")

# check results
OPT$value
local$score
(D <- quasiDeviance(OPT$par,OPT$qsd,cvm=OPT$cvm,W=info$W,theta=info$theta,verbose=TRUE)[[1]])
D$value
# check final Sigma
attr(D,"Sigma")
attr(local,"Sigma")

## extract Stest results ##
# (may be NULL here because local testing was disabled via `test`=FALSE above)
Stest <- track[[length(track)]]$Stest

# do a multisearch from different randomly chosen starting points
method <- c("qscoring","bobyqa","cobyla")
S0 <- multiSearch(OPT$par,OPT$qsd,method,opts,check=FALSE,
		cvm=OPT$cvm,nstart=50,optInfo=TRUE,
		 multi.start=TRUE,cl=cl,verbose=TRUE)

# best found root
(roots <- attr(S0,"roots"))
(id <- attr(roots,"id"))
stopifnot(!is.na(id))
attr(roots,"par")
attr(S0,"optRes")

# last message from local minimization
local$message
# history of roots
do.call(rbind,lapply(track,function(x) x$S0$score))

S0 <- searchMinimizer(OPT$par, OPT$qsd,
			method="qscoring",cvm=OPT$cvm,
			verbose=TRUE)

# quasi-scoring again for more precise results
QS <- qscoring(OPT$qsd,OPT$par,opts=opts,cvm=OPT$cvm,verbose=TRUE)

# compare the different estimates
#checkMultRoot(OPT)
checkMultRoot(OPT,par=rbind("QS"=QS$par,"S0"=S0$par))

# MC hypothesis testing
par0 <- OPT$par #+c(0.1,0.001,0.01)
obs0 <- OPT$qsd$obs

Stest <- qleTest(OPT,									# estimation results
		par0=par0,										# parameter to test
		obs0=obs0,										# alternative observed statistics
		sim=simClust, cond=cond, nsim=50,
		method=c("qscoring","bobyqa","direct"),			# possible restart methods
		opts=qs.opts, control=list("ftol_abs"=1e-6),	# minimization options
		multi.start=1L, cl=cl, cores=2L, verbose=TRUE)	# multi-start and parallel options
   
print(Stest)

# check
quasiDeviance(par0,OPT$qsd,cvm=OPT$cvm,W=info$W,theta=info$theta,verbose=TRUE)[[1]]

# extract minimization results
RES <- attr(Stest,"optRes")
fval <- sapply(RES,"[[","value")
summary(fval)
quantile(fval)
plot(ecdf(fval),lty=4)
roots <- do.call(rbind,lapply(RES,function(x) x$score))
colMeans(roots)
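# if `par0` is (approximately) a root of the quasi-score, these
# componentwise sample means should be close to zero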

# do not forget to shut down the cluster
stopCluster(cl)

# ------------------------- ONLY FOR THE VIGNETTE ---------------------------

## save results for vignette
#matclust <- list("qsd"=qsd,"cvm"=cvm,"OPT"=OPT,"Stest"=Stest)
#save(matclust,file="matclust.rda")

## plot and store envelopes
#pdf("Kfunc.pdf",width = 8, height = 10)
#plotGraphs(OPT$par,nsim=1000)
#dev.off()
