Nothing
Sest_multireg <- function(X,...) UseMethod("Sest_multireg")
Sest_multireg.formula <- function(formula, data=NULL, ...)
{
# --------------------------------------------------------------------
# Returns response of formula in nice way
model.multiregresp<-function (data, type = "any")
{
if (attr(attr(data, "terms"), "response")) {
if (is.list(data) | is.data.frame(data)) {
v <- data[[1L]]
if (is.data.frame(data) && is.vector(v)) v <- data[,1L,drop=FALSE]
if (type == "numeric" && is.factor(v)) {
warning("using type=\"numeric\" with a factor response will be ignored")
}
else if (type == "numeric" | type == "double")
storage.mode(v) <- "double"
else if (type != "any")
stop("invalid response type")
if (is.matrix(v) && ncol(v) == 1L){
if (is.data.frame(data)) {v=data[,1L,drop=FALSE]}
else {dim(v) <- NULL}}
rows <- attr(data, "row.names")
if (nrows <- length(rows)) {
if (length(v) == nrows)
names(v) <- rows
else if (length(dd <- dim(v)) == 2L)
if (dd[1L] == nrows && !length((dn <- dimnames(v))[[1L]]))
dimnames(v) <- list(rows, dn[[2L]])
}
return(v)
}
else stop("invalid 'data' argument")
}
else return(NULL)
}
mt <- terms(formula, data = data)
if (attr(mt, "response") == 0L) stop("response is missing in formula")
mf <- match.call(expand.dots = FALSE)
mf$... <- NULL
mf[[1L]] <- as.name("model.frame")
mf <- eval.parent(mf)
miss <- attr(mf,"na.action")
Y <- model.multiregresp(mf)
Terms <- attr(mf, "terms")
X <- model.matrix(Terms, mf)
res <- Sest_multireg.default(X, Y, int = FALSE, ...)
res$terms <- Terms
cl <- match.call()
cl[[1L]] <- as.name("Sest_multireg")
res$call <- cl
res$xlevels <- .getXlevels(mt, mf)
if (!is.null(miss)) res$na.action <- miss
return(res)
}
Sest_multireg.default <- function(X, Y, int = TRUE, bdp=.5, control=Scontrol(...),na.action=na.omit, ...)
{
# fast S algorithm for multivariate regression estimation
# INPUT:
# Y : response matrix (n x m)
# X : covariates matrix (n x p), possibly including intercept column
# (X = as.matrix(rep(1,n)) in case of location estimation)
# nsamp : number of elemental starts, e.g. 20
# bdp : breakdown point (<= 0.5)
# OUTPUT:
# res$Beta : estimate of regression coefficients
# res$Gamma : estimate of shape matrix
# res$scale : estimate of scale
# res$Sigma : estimate of covariance matrix
# -------------------------------------------------------------------
IRLSstep <- function(X,Y,initialBeta, initialGamma, initialscale, k, c0, b, convTol)
{
#convTol <- 1e-10
n <- nrow(X)
p <- ncol(X)
m <- ncol(Y)
Beta <- initialBeta
Res <- Y-X%*%Beta
psres <- sqrt(mahalanobis(Res, rep(0,m), initialGamma))
if (initialscale > 0)
scale <- initialscale
else
scale <- median(psres)/.6745
iter <- 0
betadiff <- 1
while ( (betadiff > convTol) & (iter < k) ) {
iter <- iter + 1
scale <- sqrt(scale^2 * mean(rhobiweight(psres/scale,c0))/b)
w <- scaledpsibiweight(psres/scale,c0)
# wbig <- diag(w)
# newBeta <- solve(t(X)%*%wbig%*%X)%*%(t(X)%*%wbig%*%Y)
wbig <- matrix(rep(w,p),ncol=p)
wX <- X * wbig
# newBeta <- solve(t(wX) %*% X)%*%(t(wX) %*% Y)
newBeta <- solve(crossprod(wX, X), crossprod(wX, Y))
newGamma <- cov.wt(Res, wt=w, center=FALSE)$cov
newGamma <- det(newGamma)^(-1/m)*newGamma
Res <- Y-X%*%newBeta
betadiff <- sum((newBeta-Beta)^2)/sum(Beta^2) # use 'sum' as a kind of norm
Beta <- newBeta
psres <- sqrt(mahalanobis(Res, rep(0,m), newGamma))
}
return(list( Beta = newBeta, Gamma = newGamma, scale = scale ))
}
#--------------------------------------------------------------------------
scale1 <- function(u, b, c0, initialsc)
{
# from Kristel's fastSreg
if (initialsc==0)
initialsc = median(abs(u))/.6745
maxit <- 100
sc <- initialsc
i <- 0
eps <- 1e-10
err <- 1
while (( i < maxit ) & (err > eps)) {
sc2 <- sqrt( sc^2 * mean(rhobiweight(u/sc,c0)) / b)
err <- abs(sc2/sc - 1)
sc <- sc2
i <- i+1
}
return(sc)
}
#---------------------------------------------------------------------------------------
randomset <- function(tot,nel) {
ranset <- rep(0,nel)
for (j in 1:nel) {
num <- ceiling(runif(1)*tot)
if (j > 1) {
while (any(ranset==num))
num <- ceiling(runif(1)*tot)
}
ranset[j] <- num
}
return(ranset)
}
# --------------------------------------------------------------------
rhobiweight <- function(x,c)
{
# Computes Tukey's biweight rho function with constant c for all values in x
hulp <- x^2/2 - x^4/(2*c^2) + x^6/(6*c^4)
rho <- hulp*(abs(x)<c) + c^2/6*(abs(x)>=c)
return(rho)
}
# --------------------------------------------------------------------
psibiweight <- function(x,c)
{
# Computes Tukey's biweight psi function with constant c for all values in x
hulp <- x - 2*x^3/(c^2) + x^5/(c^4)
psi <- hulp*(abs(x)<c)
return(psi)
}
# --------------------------------------------------------------------
scaledpsibiweight <- function(x,c)
{
# Computes Tukey's biweight psi function with constant c for all values in x
hulp <- 1 - 2*x^2/(c^2) + x^4/(c^4)
psi <- hulp*(abs(x)<c)
return(psi)
}
# --------------------------------------------------------------------
vecop <- function(mat) {
# performs vec-operation (stacks colums of a matrix into column-vector)
nr <- nrow(mat)
nc <- ncol(mat)
vecmat <- rep(0,nr*nc)
for (col in 1:nc) {
startindex <- (col-1)*nr+1
vecmat[startindex:(startindex+nr-1)] <- mat[,col]
}
return(vecmat)
}
# --------------------------------------------------------------------
reconvec <- function(vec,ncol) {
# reconstructs vecop'd matrix
lcol <- length(vec)/ncol
rec <- matrix(0,lcol,ncol)
for (i in 1:ncol)
rec[,i] <- vec[((i-1)*lcol+1):(i*lcol)]
return(rec)
}
#------------------------------------------------------------------------------#
# function needed to determine constant in biweight #
#------------------------------------------------------------------------------#
# (taken from Claudia Becker's Sstart0 program)
"chi.int" <- function(p, a, c1)
return(exp(lgamma((p + a)
# partial expectation d in (0,c1) of d^a under chi-squared p
/2) - lgamma(p/2)) * 2^{a/2} * pchisq(c1^2, p + a))
"chi.int.p" <- function(p, a, c1)
return(exp(lgamma((p + a)/2) - lgamma(p/2)) * 2^{a/2} * dchisq(c1^2, p + a) * 2 * c1)
"chi.int2" <- function(p, a, c1)
return(exp(lgamma((p + a)
# partial expectation d in (c1,\infty) of d^a under chi-squared p
/2) - lgamma(p/2)) * 2^{a/2} * (1 - pchisq(c1^2, p + a)))
"chi.int2.p" <- function(p, a, c1)
return( - exp(lgamma((p + a)/2) - lgamma(p/2)) * 2^{a/2} * dchisq(c1^2, p + a) * 2 * c1)
"csolve.bw.asymp" <- function(p, r)
{
# find biweight c that gives a specified breakdown
c1 <- 9
iter <- 1
crit <- 100
eps <- 0.00001
while((crit > eps) & (iter < 100)) {
c1.old <- c1
fc <- erho.bw(p, c1) - (c1^2 * r)/6
fcp <- erho.bw.p(p, c1) - (c1 * r)/3
c1 <- c1 - fc/fcp
if(c1 < 0)
c1 <- c1.old/2
crit <- abs(fc)
iter <- iter + 1
}
return(c1)
}
"erho.bw" <- function(p, c1)
return(chi.int(p, # expectation of rho(d) under chi-squared p
2, c1)/2 - chi.int(p, 4, c1)/(2 * c1^2) + chi.int(p, 6, c1)/(6 * c1^4) + (
c1^2 * chi.int2(p, 0, c1))/6)
"erho.bw.p" <- function(p, c1)
return(chi.int.p(p, # derivative of erho.bw wrt c1
2, c1)/2 - chi.int.p(p, 4, c1)/(2 * c1^2) + (2 * chi.int(p, 4, c1))/(2 *
c1^3) + chi.int.p(p, 6, c1)/(6 * c1^4) - (4 * chi.int(p, 6, c1))/(
6 * c1^5) + (c1^2 * chi.int2.p(p, 0, c1))/6 + (2 * c1 * chi.int2(p,
0, c1))/6)
#--------------------------------------------------------------------------#
# end 'constant determining' #
#--------------------------------------------------------------------------#
# --------------------------------------------------------------------
# - main function -
# --------------------------------------------------------------------
#set.seed(10) # seed can be set, but be careful in simulations then...
Y <- as.matrix(Y)
ynam=colnames(Y)
q=ncol(na.action(Y))
if (q < 1L) stop("at least one response needed")
X <- as.matrix(X)
xnam=colnames(X)
if (nrow(Y) != nrow(X))stop("x and y must have the same number of observations")
YX=na.action(cbind(Y,X))
Y=YX[,1:q,drop=FALSE]
X=YX[,-(1:q),drop=FALSE]
n <- nrow(Y)
m <- ncol(Y)
p <- ncol(X)
if (p < 1L) stop("at least one predictor needed")
if (q < 1L) stop("at least one response needed")
if (n < (p+q)) stop("For robust multivariate regression the number of observations cannot be smaller than the
total number of variables")
interceptdetection <- apply(X==1, 2, all)
interceptind <- (1:p)[interceptdetection==TRUE]
if (!any(interceptdetection) & int){
X <- cbind(rep(1,n),X)
p <- p + 1
interceptind <-1
if (!is.null(xnam)) colnames(X)[1] <- "(intercept)"
}
if (is.null(ynam))
colnames(Y) <- paste("Y",1:q,sep="")
if (is.null(xnam)) {
colnames(X) <- paste("X",1:p,sep="")
if (interceptdetection || int){
colnames(X)[interceptind] <- "(intercept)"
colnames(X)[-interceptind] <- paste("X",1:(p-1),sep="")
}
}
nsamp <- control$nsamp
bestr <- control$bestr # number of best solutions to keep for further C-steps
k <- control$k # number of C-steps on elemental starts
convTol <- control$convTol
maxIt <- control$maxIt
loop <- 1
c0 <- csolve.bw.asymp(m,bdp)
b <- erho.bw(m, c0)
bestbetas <- matrix(0, p*m, bestr)
bestgammas <- matrix(0, m*m, bestr)
bestscales <- 1e20 * rep(1,bestr)
sworst <- 1e20
while (loop <= nsamp) {
# find a (p+m)-subset in general position.
rankR <- 0
itertest <- 0
while ((rankR < m) && (itertest<200)) {
ranset <- randomset(n,p+m)
Xj <- X[ranset,,drop=FALSE]
Yj <- Y[ranset,,drop=FALSE]
Bj <- solve(crossprod(Xj), crossprod(Xj,Yj))
Rj <- Yj - Xj %*% Bj
# qrXj <- qr(Xj)
qrRj <- qr(Rj)
rankR <- qrRj$rank
itertest <- itertest + 1
}
if (itertest==200) stop("too many degenerate subsamples")
Sj <- crossprod(Rj) /(p+m-1)
Gj <- det(Sj)^(-1/m) * Sj
# perform k steps of IRLS on elemental start
res <- IRLSstep(X, Y, Bj, Gj, 0, k, c0, b, convTol)
Betarw <- res$Beta
Gammarw <- res$Gamma
scalerw <- res$scale
psresrw <- sqrt(mahalanobis(Y-X%*%Betarw, rep(0,m), Gammarw))
if (loop > 1) {
# check whether new Beta and new Gamma belong to the top best Betas; if so keep
# Beta and Gamma with corresponding scale.
if (mean(rhobiweight(psresrw/sworst,c0)) < b) {
ss <- sort(bestscales, index.return=TRUE)
ind <- ss$ix[bestr]
bestscales[ind] <- scale1(psresrw, b, c0, scalerw)
bestbetas[,ind] <- vecop(Betarw)
bestgammas[,ind] <- vecop(Gammarw)
sworst <- max(bestscales)
}
}
else {
bestscales[bestr] <- scale1(psresrw, b, c0, scalerw)
bestbetas[,bestr] <- vecop(Betarw)
bestgammas[,bestr] <- vecop(Gammarw)
}
loop <- loop + 1
}
ibest <- which.min(bestscales)
superbestscale <- bestscales[ibest]
superbestbeta <- reconvec(bestbetas[,ibest],m)
superbestgamma <- reconvec(bestgammas[,ibest],m)
# perform C-steps on best 'bestr' solutions, until convergence (or maximum maxIt steps)
for (i in bestr:1) {
tmp <- IRLSstep(X, Y, reconvec(bestbetas[,i],m), reconvec(bestgammas[,i],m), bestscales[i], maxIt, c0, b, convTol)
if (tmp$scale < superbestscale) {
superbestscale <- tmp$scale;
superbestbeta <- tmp$Beta;
superbestgamma <- tmp$Gamma;
}
}
Fit <- X%*%superbestbeta
Res <- Y-Fit
method <- list(est="S", bdp=bdp)
psres <- sqrt(mahalanobis(Res, rep(0,m), superbestgamma))/superbestscale
w <- scaledpsibiweight(psres,c0)
outFlag <- (psres > sqrt(qchisq(.975, m)))
if(ncol(Res)==1) Res=t(Res)
if(ncol(Fit)==1) Fit=t(Fit)
z=list( #Beta = superbestbeta,
coefficients=superbestbeta,
residuals=Res,
fitted.values=Fit,
method=method,
control=control,
Gamma = superbestgamma, scale = superbestscale,
Sigma = superbestgamma*superbestscale^2,
df=n-(m*qr(X)$rank),X=X,Y=Y,
b=b, c=c0, weights=w, outFlag=outFlag)
class(z) <- c("FRBmultireg")
return(z)
}
Any scripts or data that you put into this service are public.
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.