# R/Sest_multireg.default.R
# In robflreg: Robust Functional Linear Regression

# Sest_multireg.default: S-estimator ("est = S") for multivariate regression
# of Y on X, built on the biweight rho function defined below.
#
# Outline of the computation:
#   1. X and Y are coerced to matrices, rows are filtered with `na.action`
#      (applied to cbind(Y, X)), and a column of ones is prepended to X when
#      `int` is TRUE and no all-ones column is already present.
#   2. The tuning constant c0 and the constant b are derived from `bdp` via
#      csolve.bw.asymp() / erho.bw().
#   3. `control$nsamp` random subsamples of size p + m are drawn; each start is
#      improved with `control$k` IRLS steps, and the `control$bestr` candidates
#      with the smallest scales are kept.
#   4. Every kept candidate is refined with up to `control$maxIt` IRLS steps
#      (tolerance `control$convTol`); the one with the smallest scale wins.
#
# Arguments:
#   X          predictors (anything as.matrix() accepts), one row per case.
#   Y          responses (anything as.matrix() accepts), one row per case.
#   int        logical; add an intercept column if X has no all-ones column.
#   bdp        value passed as `r` to csolve.bw.asymp() (stored in `method`).
#   control    list with elements nsamp, bestr, k, convTol, maxIt.
#   na.action  function applied to cbind(Y, X) to handle missing values.
#   ...        forwarded to Scontrol() by the default value of `control`.
#
# Value: a list with
#   coefficients, residuals, fitted.values, method (list(est, bdp)), control,
#   Gamma, scale, Sigma (= Gamma * scale^2), df (= n - m * rank(X)), X, Y,
#   b, c (= c0), weights, outFlag.
#   Note: when there is a single response, `residuals` and `fitted.values`
#   are returned transposed (1 x n); this is kept as in the original code.
#
# Errors are raised for: no predictors / responses, mismatching row counts,
# fewer observations than p + q (counted after the intercept is added),
# nsamp or bestr below 1, and 200 consecutive degenerate subsamples.
#
# NOTE(review): `ginv` and `Scontrol` are not defined in this file; they are
# presumably provided by MASS and by the package itself - confirm imports.
Sest_multireg.default <-
function(X, Y, int = TRUE, bdp = .5, control = Scontrol(...), na.action = na.omit, ...) {

  # ---- biweight helpers ------------------------------------------------------

  # Biweight rho: polynomial for |x| < c, constant c^2 / 6 otherwise.
  rhobiweight <- function(x, c) {
    inner <- x^2 / 2 - x^4 / (2 * c^2) + x^6 / (6 * c^4)
    inner * (abs(x) < c) + c^2 / 6 * (abs(x) >= c)
  }

  # Biweight weight function (1 - (x / c)^2)^2 in expanded form; zero for
  # |x| >= c.
  scaledpsibiweight <- function(x, c) {
    inner <- 1 - 2 * x^2 / (c^2) + x^4 / (c^4)
    inner * (abs(x) < c)
  }

  # ---- chi-square integrals used for the consistency constants --------------
  # NOTE(review): these look like truncated moments of a chi-distributed
  # variable with p degrees of freedom - confirm against the reference paper.

  # Lower part: uses pchisq(c1^2, p + a).
  chi.int <- function(p, a, c1) {
    exp(lgamma((p + a) / 2) - lgamma(p / 2)) * 2^(a / 2) * pchisq(c1^2, p + a)
  }

  # Same expression with pchisq replaced by dchisq(c1^2, p + a) * 2 * c1;
  # used as the derivative of chi.int with respect to c1 in erho.bw.p().
  chi.int.p <- function(p, a, c1) {
    exp(lgamma((p + a) / 2) - lgamma(p / 2)) * 2^(a / 2) *
      dchisq(c1^2, p + a) * 2 * c1
  }

  # Upper part: uses 1 - pchisq(c1^2, p + a).
  chi.int2 <- function(p, a, c1) {
    exp(lgamma((p + a) / 2) - lgamma(p / 2)) * 2^(a / 2) *
      (1 - pchisq(c1^2, p + a))
  }

  # Negative of chi.int.p; derivative counterpart of chi.int2.
  chi.int2.p <- function(p, a, c1) {
    -exp(lgamma((p + a) / 2) - lgamma(p / 2)) * 2^(a / 2) *
      dchisq(c1^2, p + a) * 2 * c1
  }

  # Combination of the integrals above mirroring the three polynomial terms
  # and the constant tail of rhobiweight().
  erho.bw <- function(p, c1) {
    chi.int(p, 2, c1) / 2 - chi.int(p, 4, c1) / (2 * c1^2) +
      chi.int(p, 6, c1) / (6 * c1^4) + (c1^2 * chi.int2(p, 0, c1)) / 6
  }

  # Term-by-term derivative of erho.bw() with respect to c1 (used as the
  # slope in the Newton step of csolve.bw.asymp()).
  erho.bw.p <- function(p, c1) {
    chi.int.p(p, 2, c1) / 2 - chi.int.p(p, 4, c1) / (2 * c1^2) +
      (2 * chi.int(p, 4, c1)) / (2 * c1^3) +
      chi.int.p(p, 6, c1) / (6 * c1^4) -
      (4 * chi.int(p, 6, c1)) / (6 * c1^5) +
      (c1^2 * chi.int2.p(p, 0, c1)) / 6 +
      (2 * c1 * chi.int2(p, 0, c1)) / 6
  }

  # Newton iteration (start 9, at most 99 steps, tolerance 1e-5 on |f|) for
  # the root c1 of erho.bw(p, c1) - c1^2 * r / 6. A negative iterate is
  # replaced by half of the previous value.
  csolve.bw.asymp <- function(p, r) {
    c1 <- 9
    iter <- 1
    crit <- 100
    eps <- 0.00001
    while (crit > eps && iter < 100) {
      c1.old <- c1
      fc <- erho.bw(p, c1) - (c1^2 * r) / 6
      fcp <- erho.bw.p(p, c1) - (c1 * r) / 3
      c1 <- c1 - fc / fcp
      if (c1 < 0) {
        c1 <- c1.old / 2
      }
      crit <- abs(fc)
      iter <- iter + 1
    }
    c1
  }

  # ---- estimation helpers ----------------------------------------------------

  # Up to k iteratively reweighted least squares steps starting from
  # (initialBeta, initialGamma). If initialscale is not positive, the scale is
  # started at median(psres) / .6745. Returns list(Beta, Gamma, scale).
  IRLSstep <- function(X, Y, initialBeta, initialGamma, initialscale, k, c0, b,
                       convTol) {
    m <- ncol(Y)

    # Start from the initial values so that a zero-iteration call (k = 0)
    # still returns a well-defined result.
    Beta <- initialBeta
    Gamma <- initialGamma
    Res <- Y - X %*% Beta
    psres <- sqrt(mahalanobis(Res, rep(0, m), Gamma))
    scale <- if (initialscale > 0) initialscale else median(psres) / .6745

    iter <- 0
    betadiff <- 1
    while (betadiff > convTol && iter < k) {
      iter <- iter + 1
      scale <- sqrt(scale^2 * mean(rhobiweight(psres / scale, c0)) / b)
      w <- scaledpsibiweight(psres / scale, c0)
      # w has one entry per row, so recycling weights every column of X.
      wX <- X * w
      newBeta <- ginv(crossprod(wX, X)) %*% crossprod(wX, Y)
      # The shape update deliberately uses the residuals of the previous Beta.
      Gamma <- cov.wt(Res, wt = w, center = FALSE)$cov
      Gamma <- det(Gamma)^(-1 / m) * Gamma   # rescale to determinant 1
      Res <- Y - X %*% newBeta
      # 'sum' of squares is used as a kind of norm for the relative change.
      betadiff <- sum((newBeta - Beta)^2) / sum(Beta^2)
      Beta <- newBeta
      psres <- sqrt(mahalanobis(Res, rep(0, m), Gamma))
    }
    list(Beta = Beta, Gamma = Gamma, scale = scale)
  }

  # Fixed-point iteration (at most 100 steps, relative tolerance 1e-10) for
  # the scale sc solving mean(rho(u / sc)) = b. initialsc == 0 requests the
  # start value median(|u|) / .6745.
  scale1 <- function(u, b, c0, initialsc) {
    if (initialsc == 0) {
      initialsc <- median(abs(u)) / .6745
    }
    maxit <- 100
    eps <- 1e-10
    sc <- initialsc
    i <- 0
    err <- 1
    while (i < maxit && err > eps) {
      sc2 <- sqrt(sc^2 * mean(rhobiweight(u / sc, c0)) / b)
      err <- abs(sc2 / sc - 1)
      sc <- sc2
      i <- i + 1
    }
    sc
  }

  # Draw nel distinct indices from 1..tot by rejection. The draw sequence is
  # kept exactly as in the original so seeded results stay reproducible.
  randomset <- function(tot, nel) {
    if (nel > tot) {
      # Without this guard the rejection loop below could never terminate.
      stop("cannot draw more distinct indices than there are observations")
    }
    ranset <- rep(0, nel)
    for (j in seq_len(nel)) {
      num <- ceiling(runif(1) * tot)
      while (any(ranset == num)) {
        num <- ceiling(runif(1) * tot)
      }
      ranset[j] <- num
    }
    ranset
  }

  # ---- input preparation -----------------------------------------------------

  Y <- as.matrix(Y)
  ynam <- colnames(Y)
  q <- ncol(na.action(Y))
  if (q < 1L) stop("at least one response needed")
  X <- as.matrix(X)
  xnam <- colnames(X)
  if (nrow(Y) != nrow(X)) stop("x and y must have the same number of observations")

  # Filter rows jointly so X and Y stay aligned.
  YX <- na.action(cbind(Y, X))
  Y <- YX[, seq_len(q), drop = FALSE]
  X <- YX[, -seq_len(q), drop = FALSE]
  n <- nrow(Y)
  m <- ncol(Y)
  p <- ncol(X)

  if (p < 1L) stop("at least one predictor needed")

  # Columns consisting only of ones count as an existing intercept.
  interceptdetection <- apply(X == 1, 2, all)
  interceptind <- seq_len(p)[interceptdetection]
  if (!any(interceptdetection) && int) {
    X <- cbind(rep(1, n), X)
    p <- p + 1
    interceptind <- 1
    if (!is.null(xnam)) colnames(X)[1] <- "(intercept)"
  }

  # Checked after the intercept has been added: subsamples have size p + m
  # with the final p, so fewer observations would make sampling impossible.
  if (n < (p + q)) stop("For robust multivariate regression the number of observations cannot be smaller than the total number of variables")

  if (is.null(ynam)) {
    colnames(Y) <- paste0("Y", seq_len(q))
  }
  if (is.null(xnam)) {
    colnames(X) <- paste0("X", seq_len(p))
    # Scalar test for "an intercept column exists" (detected or added).
    if (length(interceptind) > 0L) {
      colnames(X)[interceptind] <- "(intercept)"
      colnames(X)[-interceptind] <- paste0("X", seq_len(p - length(interceptind)))
    }
  }

  nsamp <- control$nsamp
  bestr <- control$bestr
  k <- control$k
  convTol <- control$convTol
  maxIt <- control$maxIt

  if (!isTRUE(nsamp >= 1) || !isTRUE(bestr >= 1)) {
    stop("control$nsamp and control$bestr must both be at least 1")
  }

  c0 <- csolve.bw.asymp(m, bdp)
  b <- erho.bw(m, c0)

  # ---- random starts ---------------------------------------------------------

  # Column i of bestbetas / bestgammas holds candidate i in column-major
  # (vec) form; 1e20 marks a slot that has not been filled yet.
  bestbetas <- matrix(0, p * m, bestr)
  bestgammas <- matrix(0, m * m, bestr)
  bestscales <- rep(1e20, bestr)
  filled <- rep(FALSE, bestr)
  sworst <- 1e20   # invariant: sworst == max(bestscales)

  loop <- 1
  while (loop <= nsamp) {
    # Redraw until the subsample residuals have full column rank.
    rankR <- 0
    itertest <- 0
    while (rankR < m && itertest < 200) {
      ranset <- randomset(n, p + m)
      Xj <- X[ranset, , drop = FALSE]
      Yj <- Y[ranset, , drop = FALSE]
      Bj <- ginv(crossprod(Xj)) %*% crossprod(Xj, Yj)
      Rj <- Yj - Xj %*% Bj
      rankR <- qr(Rj)$rank
      itertest <- itertest + 1
    }
    # Test the rank itself so a success on the 200th draw is not rejected.
    if (rankR < m) stop("too many degenerate subsamples")

    Sj <- crossprod(Rj) / (p + m - 1)
    Gj <- det(Sj)^(-1 / m) * Sj
    res <- IRLSstep(X, Y, Bj, Gj, 0, k, c0, b, convTol)

    Betarw <- res$Beta
    Gammarw <- res$Gamma
    scalerw <- res$scale
    psresrw <- sqrt(mahalanobis(Y - X %*% Betarw, rep(0, m), Gammarw))

    # The first candidate is always stored; later ones only when their scale
    # is below the current worst kept scale.
    if (loop == 1 || mean(rhobiweight(psresrw / sworst, c0)) < b) {
      # Replace the worst slot (the last one among ties).
      ind <- max(which(bestscales == sworst))
      bestscales[ind] <- scale1(psresrw, b, c0, scalerw)
      bestbetas[, ind] <- as.vector(Betarw)
      bestgammas[, ind] <- as.vector(Gammarw)
      filled[ind] <- TRUE
      # Refresh after every store, including the first one, so that
      # bestr == 1 does not keep comparing against the 1e20 placeholder.
      sworst <- max(bestscales)
    }
    loop <- loop + 1
  }

  # ---- refinement of the kept candidates ------------------------------------

  ibest <- which.min(bestscales)
  superbestscale <- bestscales[ibest]
  superbestbeta <- matrix(bestbetas[, ibest], ncol = m)
  superbestgamma <- matrix(bestgammas[, ibest], ncol = m)

  # Only slots that actually received a candidate are refined; unfilled slots
  # (possible when nsamp < bestr) hold a zero matrix that cannot be inverted.
  for (i in rev(which(filled))) {
    tmp <- IRLSstep(X, Y,
                    matrix(bestbetas[, i], ncol = m),
                    matrix(bestgammas[, i], ncol = m),
                    bestscales[i], maxIt, c0, b, convTol)
    if (tmp$scale < superbestscale) {
      superbestscale <- tmp$scale
      superbestbeta <- tmp$Beta
      superbestgamma <- tmp$Gamma
    }
  }

  # ---- result ----------------------------------------------------------------

  Fit <- X %*% superbestbeta
  Res <- Y - Fit
  method <- list(est = "S", bdp = bdp)
  psres <- sqrt(mahalanobis(Res, rep(0, m), superbestgamma)) / superbestscale
  w <- scaledpsibiweight(psres, c0)
  outFlag <- (psres > sqrt(qchisq(.975, m)))
  # Single-response results are returned as 1 x n matrices (kept from the
  # original implementation; callers may rely on it).
  if (ncol(Res) == 1) Res <- t(Res)
  if (ncol(Fit) == 1) Fit <- t(Fit)

  list(coefficients = superbestbeta,
       residuals = Res,
       fitted.values = Fit,
       method = method,
       control = control,
       Gamma = superbestgamma, scale = superbestscale,
       Sigma = superbestgamma * superbestscale^2,
       df = n - (m * qr(X)$rank), X = X, Y = Y,
       b = b, c = c0, weights = w, outFlag = outFlag)
}