# R/var.components.R
# In RMark: R Code for Mark Analysis

#' Variance components estimation
#' 
#' Computes estimated effects, standard errors and process variance for a set
#' of estimates
#' 
#' Computes estimated effects, standard errors and process variance for a set
#' of estimates using the method of moments estimator described by Burnham and
#' White (2002). The \code{design} matrix specifies the manner in which the
#' estimates (\code{theta}) are combined.  The number of rows of the design
#' matrix must match the length of \code{theta}. 
#' 
#' If you select specific values
#' of theta, you must select the equivalent sub-matrix of the variance-covariance
#' matrix.  For instance, if the parameter indices are \code{$estimates[c(1:5,8)]}
#' then the appropriate definition of the vcv matrix would be vcv=vcv[c(1:5,8), c(1:5,8)], if
#' vcv is nxn for n estimates. Note that get.real will only return the vcv matrix of the unique 
#' reals so the dimensions of estimates and vcv will not always match as in the example below
#' where estimates has 21 rows but with the time model there are only 6 unique Phis so vcv is 6x6.
#' 
#' To get a mean estimate use a column matrix of 1's (e.g.,
#' \code{design=matrix(1,ncol=1,nrow=length(theta))}). The function returns a
#' list with the estimates of the coefficients for the design matrix
#' (\code{beta}) with one value per column in the design matrix and the
#' variance-covariance matrix (\code{vcv.beta}) for the \code{beta} estimates.
#' The process variance is returned as \code{sigmasq} and its square root as \code{sigma}.
#' 
#' @param theta vector of parameter estimates
#' @param design design matrix for combining parameter estimates
#' @param vcv estimated variance-covariance matrix for parameters
#' @param alpha sets 1-alpha confidence limits on sigmasq and on the shrinkage estimates
#' @param upper upper limit for process variance
#' @param LAPACK argument passed to call to \code{qr} for qr decomposition and
#' inversion
#' @return A list with the following elements \item{sigmasq}{process variance
#' estimate and confidence interval; estimate may be <0} \item{sigma}{sqrt of process variance; set to 0 if sigmasq<0} 
#' \item{beta}{dataframe with estimates and standard errors of betas
#' for design} \item{betarand}{dataframe of shrinkage estimates}
#'  \item{vcv.beta}{variance-covariance matrix for beta} \item{GTrace}{trace of matrix G}
#' @author Jeff Laake; Ben Augustine
#' @export
#' @import matrixcalc
#' @references BURNHAM, K. P. and G. C. WHITE. 2002. Evaluation of some random
#' effects methodology applicable to bird ringing data.  Journal of Applied
#' Statistics 29: 245-264.
#' @examples
#' \donttest{
#' # This example is excluded from testing to reduce package check time
#' data(dipper)
#' md=mark(dipper,model.parameters=list(Phi=list(formula=~time)),delete=TRUE)
#' md$results$AICc
#' zz=get.real(md,"Phi",vcv=TRUE)
#' z=zz$estimates$estimate[1:6]
#' vcv=zz$vcv.real
#' varc=var.components(z,design=matrix(rep(1,length(z)),ncol=1),vcv) 
#' df=md$design.data$Phi
#' shrinkest=data.frame(time=1:6,value=varc$betarand$estimate)
#' df=merge(df,shrinkest,by="time")
#' md=mark(dipper,model.parameters=list(Phi=list(formula=~time,
#'   fixed=list(index=df$par.index,value=df$value))),adjust=FALSE,delete=TRUE)
#' npar=md$results$npar+varc$GTrace
#' md$results$lnl+2*(npar + (npar*(npar+1))/(md$results$n-npar-1))
#' }
var.components=function (theta, design, vcv, alpha=0.05, upper=10*max(vcv), LAPACK = TRUE) 
{
	# Method of moments variance components estimator (Burnham and White 2002).
	#
	# Arguments:
	#   theta   vector of estimates
	#   design  design matrix with one row per theta; a plain vector is treated
	#           as a single-column design
	#   vcv     variance-covariance matrix of theta (length(theta) x length(theta))
	#   alpha   gives 1-alpha limits for sigmasq and for the shrinkage estimates
	#   upper   upper end of the search interval for the process variance; the
	#           default is evaluated lazily, i.e. at its first use below, after
	#           vcv has been reduced to the rows used in the design
	#   LAPACK  passed to qr() wherever a qr-based inverse is computed
	#
	# Value: list with sigmasq (estimate, lower, upper), sigma (sqrt of the
	# estimate after truncation at 0), beta (Estimate, SE), betarand (shrinkage
	# estimates with RMSE and limits), vcv.beta and GTrace (trace of G).

	# Accept a plain vector as a one-column design (e.g. rep(1,n) for a mean)
	if (!is.matrix(design)) 
		design = as.matrix(design)
	if (nrow(design) != length(theta)) 
		stop("Number of rows of design matrix must match length of theta vector")
	if (nrow(vcv) != length(theta)) 
		stop("Number of rows of vcv matrix must match length of theta vector")
	if (ncol(vcv) != length(theta)) 
		stop("Number of columns of vcv matrix must match length of theta vector")
	if (length(theta) <= ncol(design)) 
		stop("Length theta must exceed number of columns of design")
	#
	#  Reduce theta, design and vcv to the theta's that are used in the design
	#  (rows of the design that contain at least one non-zero value)
	#
	rn = which(apply(design, 1, function(x) any(as.numeric(x) != 0)))
	theta = theta[rn]
	design = design[rn, , drop = FALSE]
	# drop = FALSE keeps vcv a matrix even if a single row were to remain
	vcv = vcv[rn, rn, drop = FALSE]
	# The reduction may have removed rows, so re-check that there is at least
	# one degree of freedom left before attempting to solve for sigma
	if (length(theta) <= ncol(design)) 
		stop("Number of theta values with non-zero design rows must exceed number of columns of design")
	# This is equation (1) in B&W(2002); changed to use qr solution for inverse
	beta.hat = function(Dinv, X, theta) return(solve(qr(t(X) %*% 
								Dinv %*% X, LAPACK = LAPACK)) %*% (t(X) %*% Dinv %*% 
								theta))
	# This computes inverse of D = vcv + sigma*I; changed to use qr solution for inverse
	compute.Dinv = function(sigma, vcv) {
		K = nrow(vcv)
		sigmamat = matrix(0, nrow = K, ncol = K)
		diag(sigmamat) = sigma
		return(solve(qr(vcv + sigmamat, LAPACK = LAPACK)))
	}
	# This is equation (2) in B&W(2002): weighted residual sum of squares minus
	# its degrees of freedom; the process variance estimate is its root
	mom.sig = function(sigma, vcv, X, theta) {
		Dinv = compute.Dinv(sigma, vcv)
		beta = beta.hat(Dinv, X, theta)
		return(t(theta - X %*% beta) %*% Dinv %*% (theta - X %*% 
							beta) - (nrow(X) - length(beta)))
	}
	# Locate the minimum and maximum of mom.sig over (lower, upper); if they have
	# opposite signs they bracket the root that uniroot then solves for.
	lower = -(min(Re(eigen(vcv)$values)) + 1e-12)
	xlower = optimize(mom.sig, interval = c(lower, upper), vcv = vcv, theta = theta, X = design)
	xupper = optimize(mom.sig, interval = c(lower, upper), vcv = vcv, theta = theta, X = design, maximum = TRUE)
	if (xlower$objective * xupper$objective > 0) 
	{
		# No sign change found: retry once with both limits doubled.
		# NOTE(review): when the smallest eigenvalue of vcv is positive, doubling
		# lower moves it below minus that eigenvalue, where vcv + sigma*I is no
		# longer positive definite -- confirm that widening the lower limit is intended.
		lower = 2 * lower
		upper = 2 * upper
		xlower = optimize(mom.sig, interval = c(lower, upper), vcv = vcv, theta = theta, X = design)
		xupper = optimize(mom.sig, interval = c(lower, upper), vcv = vcv, theta = theta, X = design, maximum = TRUE)
	}
	if (xlower$objective * xupper$objective > 0) 
		stop("\nroot still could not be found with increased limits; try increasing upper limit by more than a factor of 2\n")
	# Bracket the root by the locations of the minimum and maximum of mom.sig
	lower = min(xlower$minimum, xupper$maximum)
	upper = max(xupper$maximum, xlower$minimum)
	soln = uniroot(mom.sig, lower = lower, upper = upper, vcv = vcv, theta = theta, X = design, tol = 1e-15)
	sigma = soln$root
	#Begin Augustine additions
	# Same moment equation with the degrees of freedom replaced by a chi-square
	# quantile; its roots give the confidence limits for the process variance
	mom.sigCI = function(sigma, vcv, X, theta, p) {
		Dinv = compute.Dinv(sigma, vcv)
		beta = beta.hat(Dinv, X, theta)
		return(t(theta - X %*% beta) %*% Dinv %*% (theta - X %*% 
							beta) - qchisq(p, nrow(X) - length(beta)))
	}
	# NOTE(review): both searches reuse the bracket found for the point estimate;
	# uniroot stops with an error if a limit lies outside it (e.g. the upper
	# confidence limit exceeds upper), in which case a larger upper is needed.
	solnL = uniroot(mom.sigCI, lower = lower, upper = upper, vcv = vcv, theta = theta, X = design, p = 1 - alpha/2, tol = 1e-15)
	solnU = uniroot(mom.sigCI, lower = lower, upper = upper, vcv = vcv, theta = theta, X = design, p = alpha/2, tol = 1e-15)
	sigmasq = c(sigma, solnL$root, solnU$root)
	names(sigmasq) = c("est.", "lower", "upper")
	#End Augustine additions
	# sigmasq keeps the untruncated estimate; everything below uses max(sigma,0)
	if (sigma < 0)
	{
		warning("\nEstimated process variance < 0; using 0 for shrinkage estimates\n")
		sigma = 0
	}
	# Compute final values of D inverse, beta and its v-c matrix and return those values
	Dinv = compute.Dinv(sigma, vcv)
	beta = beta.hat(Dinv, design, theta)
	#Begin Augustine additions; rearranged and slightly modified; moved CI code above 24 Aug 2012-jll
	# Matrix square root of Dinv from its eigen decomposition
	eig = eigen(Dinv)
	Dinvsqrt = eig$vectors %*% diag(sqrt(eig$values)) %*% qr.solve(eig$vectors)
	H = sqrt(sigma) * Dinvsqrt
	X = design
	A = X %*% qr.solve(t(X) %*% Dinv %*% X) %*% t(X)
	I = diag(1, length(theta))
	# G maps theta to the shrinkage estimates
	G = H + (I - H) %*% A %*% Dinv
	betarand = G %*% theta
	VCbetarand = G %*% vcv %*% t(G)
	# RMSE combines the variance of the shrinkage estimate with its squared
	# difference from the original estimate
	RMSE = sqrt(diag(VCbetarand) + (betarand - theta)^2)
	z = qnorm(1 - alpha/2, 0, 1)
	betarandL = betarand - z * RMSE
	betarandU = betarand + z * RMSE
	betarand = cbind(betarand, RMSE, betarandL, betarandU)
	colnames(betarand) = c("estimate", "RMSE", "lower", "upper")
	#end Augustine additions
	rownames(beta) = colnames(design)
	vcv.beta = solve(qr(t(design) %*% Dinv %*% design, LAPACK = LAPACK))
	rownames(vcv.beta) = colnames(design)
	colnames(vcv.beta) = colnames(design)
	beta = as.data.frame(beta)
	beta$se = sqrt(diag(vcv.beta))
	names(beta) = c("Estimate", "SE")
	# Trace of G computed with base R (sum of the diagonal)
	return(list(sigmasq = sigmasq, sigma = sqrt(sigma), beta = beta, betarand = as.data.frame(betarand), vcv.beta = vcv.beta, GTrace = sum(diag(G))))
}