R/mwirrls.R
In plsgenomics: PLS Analyses for Genomics

Documented in mwirrls

### mwirrls.R  (2006-01)
###
###    Local Weighted Iteratively Reweighted Ridge Least Squares (IRRLS)
###                      for categorical data
###
### Copyright 2006-01 Sophie Lambert-Lacroix and Julie Peyre
###
###
### This file is part of the `plsgenomics' library for R and related languages.
### It is made available under the terms of the GNU General Public
### License, version 2, or at your option, any later version,
### incorporated herein by reference.
### 
### This program is distributed in the hope that it will be
### useful, but WITHOUT ANY WARRANTY; without even the implied
### warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR
### PURPOSE.  See the GNU General Public License for more
### details.
### 
### You should have received a copy of the GNU General Public
### License along with this program; if not, write to the Free
### Software Foundation, Inc., 59 Temple Place - Suite 330, Boston,
### MA 02111-1307, USA

mwirrls <- function(Y, Z, Lambda = 0, NbrIterMax = 15, Threshold = 10^(-12),
                    WKernel)
{
##  Weighted Iteratively Reweighted Ridge Least Squares for categorical data:
##  Newton-Raphson iterations on a kernel-weighted, ridge-penalised
##  multinomial logit criterion.
##
##    IN
##########
##      c = NbrClass-1 (computed below as max(Y))
##  Z : Design matrix (cn) x c(p+1)
##          block data matrix
##  Y : Response Vector
##          vector ntrain, coded 0,1,...,c (rows with Y==0 get an all-zero
##          indicator block)
##  Lambda :  coefficient of the ridge penalty
##          real
##  NbrIterMax : Maximal number of iterations
##          positive integer
##  Threshold : Used for the stopping rule (upper bound on the Euclidean
##          norm of the penalised gradient).
##          real
##  WKernel : Kernel Weight
##          matrix cn x cn
##
##    OUT
############
##  list with the fields
##      Coefficients : regression coefficients w.r.t. the design matrix
##          (a one-column matrix; a plain vector of ones when the very
##          first linear system could not be solved).
##      Cvg : 1 if the gradient criterion was met or (quasi-)separation was
##          detected, otherwise 0.
##      Ybloc : block Response Vector ntrain*c

  nb_bloc <- max(Y)
  if (nb_bloc < 1) {
    stop("'Y' must contain at least one label >= 1", call. = FALSE)
  }
  n_col <- dim(Z)[2]
  n_obs <- length(Y)
  p <- n_col / nb_bloc - 1

  ## Indicator coding of the response: entry (i-1)*c + k is 1 iff Y[i] == k.
  Ybloc <- rep(0, n_obs * nb_bloc)
  for (cc in seq_len(nb_bloc)) {
    ff <- which(Y == cc)
    Ybloc[(ff - 1) * nb_bloc + cc] <- 1
  }

  ## Ridge penalty matrix: identity, except that columns 1, p+2, 2p+3, ...
  ## (the first column of each block of p+1 columns -- presumably the
  ## intercepts, to be confirmed against the code that builds Z) are not
  ## penalised.
  R <- diag(1, nrow = n_col)
  grid <- seq(from = 1, to = n_col, by = (p + 1))
  R[grid, grid] <- 0

  ## Weight block of one observation: diag(m) - m m'.
  ## diag() is called with an explicit 'nrow' because diag(m) on a length-one
  ## 'm' (two-class case, c == 1) would build an identity matrix of order
  ## as.integer(m), i.e. a 0 x 0 matrix, instead of the 1 x 1 matrix [m].
  bloc_weight <- function(m) {
    diag(m, nrow = length(m)) - m %*% t(m)
  }

  ## Positions in the stacked vectors that belong to observation kk.
  bloc_index <- function(kk) {
    nb_bloc * (kk - 1) + seq_len(nb_bloc)
  }

  ## Solve A x = b; NULL when the solve fails or yields non-finite values
  ## (both are treated as ill-conditioning by the caller).
  solve_step <- function(A, b) {
    sol <- try(solve(A, b), silent = TRUE)
    if (!is.matrix(sol) || !all(is.finite(sol))) {
      return(NULL)
    }
    sol
  }

  ## t(Z) %*% WKernel does not change across iterations.
  ZtK <- t(Z) %*% WKernel

  ##  THE NR ALGORITHM
  ##################################
  ##  1. Initialize the parameter

  mu <- (1 + 2 * Ybloc) / (nb_bloc + 3)
  Eta <- rep(0, length(mu))
  WNR <- matrix(0, length(mu), length(mu))

  for (kk in seq_len(n_obs)) {
    idx <- bloc_index(kk)
    Blocmu <- mu[idx]
    WNR[idx, idx] <- bloc_weight(Blocmu)
    ## Linear predictor relative to the reference class, whose probability
    ## is 1 - sum(Blocmu).
    Eta[idx] <- log(Blocmu) - log(1 - sum(Blocmu))
  }

  WT <- WKernel %*% WNR
  H <- t(Z) %*% WT %*% Z + Lambda * R
  step <- solve_step(H, ZtK %*% (WNR %*% Eta + (Ybloc - mu)))

  Separation <- 0
  if (is.null(step)) {
    ## The first system is ill-conditioned: skip the loop entirely.
    Gamma <- rep(1, n_col)
    StopRule <- 1
    NbrIter <- NbrIterMax + 1
    Cvg <- 0
  } else {
    StopRule <- 0
    NbrIter <- 0
  }

  ##  2. Newton-Raphson loop

  while (StopRule == 0) {
    ## Increment the iterations number
    NbrIter <- NbrIter + 1

    ## Update Gamma: the first solution is the estimate itself, later
    ## solutions are Newton increments.
    Gamma <- if (NbrIter == 1) step else Gamma + step

    ## Update Eta, capped at 700 so that exp() stays finite
    Eta <- Z %*% Gamma
    Eta[Eta > 700] <- 700

    ## Update mu and WNR
    for (kk in seq_len(n_obs)) {
      idx <- bloc_index(kk)
      exp_eta <- exp(Eta[idx])
      mu[idx] <- exp_eta / (1 + sum(exp_eta))
      WNR[idx, idx] <- bloc_weight(mu[idx])
    }

    ## Update total weight. Same order as in the initialisation, so that H is
    ## the Jacobian of the gradient below (t(Z) %*% WKernel %*% WNR %*% Z);
    ## identical to WNR %*% WKernel whenever the two matrices commute.
    WT <- WKernel %*% WNR
    ## Update gradient
    Gradient <- ZtK %*% (Ybloc - mu) - Lambda * R %*% Gamma
    ## Update H
    H <- t(Z) %*% WT %*% Z + Lambda * R
    step <- solve_step(H, Gradient)

    ## Compute the StopRule
    ## on the (quasi)-separation detection (for Lambda=0): every observation
    ## is assigned to its own class by the current linear predictor, the
    ## reference class 0 having predictor 0.
    if (Lambda == 0) {
      eta_mat <- cbind(0, matrix(Eta, nrow = n_obs, byrow = TRUE))
      predicted <- apply(eta_mat, 1, which.max) - 1
      Separation <- as.numeric(sum(predicted == Y) == n_obs)
    }
    ## on the conditioning of matrix
    Illcond <- as.numeric(is.null(step))
    ## on the convergence
    Cvg <- as.numeric(sqrt(sum(abs(Gradient)^2)) <= Threshold)
    StopRule <- max(Cvg, as.numeric(NbrIter >= NbrIterMax), Separation,
                    Illcond)
  }

  ##  CONCLUSION
  ###############

  list(Coefficients = Gamma, Cvg = max(Cvg, Separation), Ybloc = Ybloc)
}