setwd("~/scratch/kaiqiong.zhao/Projects/SOMNiBUS_SNP_selection/Rcpppackage/sparseSOMNiBUS/tests/testthat")
path_ref_data <- paste(paste(getwd(), "/data/", sep = ""), "datSnp5nsig1.RDS", sep = "")
#load("/scratch/kaiqiong.zhao/Projects/SOMNiBUS_RE_Simu/functions/BANK1data.RData")
#saveRDS(dat, path_ref_data )
dat = readRDS(path_ref_data)
n.snp <- ncol(dat)-4
# pre-set parameters
n.k = 5
numCovs = ncol(dat)-4
shrinkScale=1/2
lambda2 = 0.2
lambda1 = 10
source("~/scratch/kaiqiong.zhao/Projects/SOMNiBUS_SNP_selection/Rcpppackage/sparseSOMNiBUS/R/utils.R")
source("~/scratch/kaiqiong.zhao/Projects/SOMNiBUS_SNP_selection/Rcpppackage/sparseSOMNiBUS/R/sparseSmoothFit.R")
source("~/scratch/kaiqiong.zhao/Projects/SOMNiBUS_SNP_selection/Rcpppackage/sparseSOMNiBUS/R/oneUpdate.R")
source("~/scratch/kaiqiong.zhao/Projects/SOMNiBUS_SNP_selection/Rcpppackage/sparseSOMNiBUS/R/sparseSmoothPred.R")
source("~/scratch/kaiqiong.zhao/Projects/SOMNiBUS_SNP_selection/Rcpppackage/sparseSOMNiBUS/R/sparseSmoothFitPath.R")
source("~/scratch/kaiqiong.zhao/Projects/SOMNiBUS_SNP_selection/Rcpppackage/sparseSOMNiBUS/R/lambdaMax.R")
setwd("~/scratch/kaiqiong.zhao/Projects/SOMNiBUS_SNP_selection/Rcpppackage/sparseSOMNiBUS/src")
library(Rcpp)
sourceCpp("sparseOmegaCr.cpp")
# step 1: Spline Basis Set up
# calculate matrices: sparseOmega, smoothOmega1, basisMat0 (intercept), basisMat1 (for rest of covariates)
# These matrices are fixed for fixed n.k and Position
initOut = extractMats(dat=dat,n.k=n.k)
basisMat0 <- initOut$basisMat0
basisMat1 <- initOut$basisMat1
sparOmega <- initOut$sparOmega
smoOmega1 <- initOut$smoOmega1
designMat1 <- initOut$designMat1
#Hp <- (1-lambda2)* sparOmega + lambda2*smoOmega1
stepSize=2
#theta_m <- theta <- initTheta <- rep(0, n.k*(ncol(dat)-3))
shrinkScale=0.5
maxInt = 200
epsilon = 1E-6
printDetail = FALSE
accelrt = FALSE
iter = 4
sourceCpp("utils.cpp")
sourceCpp("updates.cpp")
theta <- rep(0, n.k*(numCovs+1))
theta <- rnorm(length(theta))
truncation= TRUE
#------------------------------------
# Test function fitProxGradCpp()
#-------------------------------------
sourceCpp("proxGradFit.cpp")
truncation= TRUE
theta <- rnorm(length(theta))
lambda1 = 5
lambda2 = 0.5
Hp <- (1-lambda2)* sparOmega + lambda2*smoOmega1
intfit = getStart(dat$Meth_Counts, dat$Total_Counts, designMat1, Hp, numCovs,basisMat0)
intfit$lambda_max
Hp <- (1-lambda2)* sparOmega + lambda2*smoOmega1
L = chol(Hp)
Hinv = chol2inv(L)
Linv = solve(L)
basisMat0_tilda <- basisMat0 %*% Linv # this tilde does depend on L-- H -- lambda2, should be calculated for each lambda2
designMat1_tilda <- lapply(designMat1, function(x){x%*%Linv})
see1 = fitProxGrad(theta, stepSize,lambda1, dat, basisMat0_tilda, n.k, Hp, maxInt = 10,
epsilon = 1E-6, printDetail = FALSE, shrinkScale,accelrt, numCovs, designMat1_tilda, basisMat1)
#---------- Compare accelrt and not accelrt -------#
lambda1 = 160
time0 = Sys.time()
fit_noaccelr = fitProxGrad(theta, stepSize,lambda1, dat, basisMat0_tilda, n.k, Hp, maxInt = 10^5,
epsilon = 1E-6, printDetail = FALSE, shrinkScale,accelrt, numCovs, designMat1_tilda, basisMat1)
plot(apply(fit_noaccelr$lossVals, 1, sum), ylim = c(65140, 65190))
print(Sys.time() -time0)
time0 = Sys.time()
fit_accelr = fitProxGrad(theta, stepSize,lambda1, dat, basisMat0_tilda, n.k, Hp, maxInt = 10^5,
epsilon = 1E-6, printDetail = FALSE, shrinkScale,accelrt=TRUE, numCovs, designMat1_tilda, basisMat1)
print(Sys.time() -time0)
points(apply(fit_accelr$lossVals, 1, sum), col = 2)
#---------------------------------------------------#
see2= fitProxGradCpp(theta, stepSize,lambda1, dat, basisMat0_tilda, n.k, Hp, maxInt = 10,
epsilon = 1E-6, shrinkScale,accelrt, numCovs, designMat1_tilda, truncation)
all.equal(see2$thetaEst, see1$thetaEst)
all.equal(see2$lossSum, as.numeric(see1$lossSum[length(see1$lossSum)]))
#all.equal(see1$pi_ij, see2$pi_ij)
all.equal(see1$thetaEstSep, see2$thetaEstSep)
all.equal(nrow(see1$Est.points), see2$Iter+2)
all.equal(see1$gNeg2loglik, see2$gNeg2loglik)
all.equal(see1$stepSizeVec[-(1)], see2$stepSizeVec[1:(length(see1$stepSizeVec)-1)])
all.equal(see1$lossVals[nrow(see1$lossVals),1], see2$neg2loglik)
#for( i in 1:(nrow(see1$Est.points)-1)){
# print( all.equal(see1$Est.points[i+1,], see2$thetaMat[i,]))
#}
#-------------------------------------#
# Add stopping rule objective functions are close
#-------------------------------------#
lambda1 = 200
fitsee= fitProxGradCpp(theta, stepSize,lambda1, dat, basisMat0_tilda, n.k, Hp, maxInt = 10^5,
epsilon = 1E-6, shrinkScale,accelrt, numCovs, designMat1_tilda, truncation)
fitsee$Iter
#--- requires significantly less iterations: (117 --- 606)
fitsee2= fitProxGrad(theta, stepSize,lambda1, dat, basisMat0_tilda, n.k, Hp, maxInt = 10^5,
epsilon = 1E-6, printDetail = FALSE, shrinkScale,accelrt, numCovs, designMat1_tilda, basisMat1)
nrow(fitsee2$Est.points)
ss = tail(fitsee2$lossVals[,1]+fitsee2$lossVals[,2])
(ss[-length(ss)]-ss[-1])/nrow(dat)
#-----------------------------------
test_that("Rcpp returns the save proximal gradient output as R function ", {
expect_equal(all.equal(see1$thetaEst, see2$thetaEst))
expect_equal(all.equal(see2$lossSum, as.numeric(see1$lossSum[length(see1$lossSum)])))
})
library(microbenchmark)
see = microbenchmark(R = {
fitProxGrad(theta, stepSize,lambda1, dat, basisMat0_tilda, n.k, Hp, maxInt = 10,
epsilon = 1E-6, printDetail = FALSE, shrinkScale,accelrt, numCovs, designMat1_tilda, basisMat1)
},
cpp= fitProxGradCpp(theta, stepSize,lambda1, dat, basisMat0_tilda, n.k, Hp, maxInt = 10,
epsilon = 1E-6, shrinkScale,accelrt, numCovs, designMat1_tilda, truncation)
, times = 10 )
library(ggplot2)
autoplot(see)
see
pdf("Prox_gradient_iterations.pdf", width=8, height = 5)
autoplot(see)+ggtitle("Computation time for iterative proximal gradient descent")
dev.off()
see
lambda1 = 0.5
see_out= fitProxGradCpp(theta, stepSize,lambda1, dat, basisMat0, n.k, Hp, maxInt = 10^5,
epsilon = 1E-10, shrinkScale,accelrt, numCovs, designMat1, basisMat1, truncation)
see1$thetaEstSep
see_out$thetaEst
#--------------
# test define lambda2 within 0, 1
#------------
sourceCpp("proxGradFit.cpp")
truncation= TRUE
theta <- rnorm(length(theta))
lambda2 = 0.5
Hp <- (1-lambda2)* sparOmega + lambda2*smoOmega1
startfit = getStart(dat$Meth_Counts, dat$Total_Counts, designMat1, Hp, numCovs, basisMat0)
startfit$lambda_max
lambda1 = 50
seeinit= fitProxGradCpp(theta, stepSize,lambda1=5, dat, basisMat0, n.k, Hp, maxInt = 10^5,
epsilon = 1E-20, shrinkScale,accelrt, numCovs, designMat1, basisMat1, truncation)
lambda1 = 3
see2= fitProxGradCpp(seeinit$thetaEst, stepSize,lambda1, dat, basisMat0, n.k, Hp, maxInt = 10^5,
epsilon = 1E-20, shrinkScale,accelrt, numCovs, designMat1, basisMat1, truncation)
#lambda1 = 4
#see2R= fitProxGrad(seeinit$thetaEst, stepSize,lambda1, dat, basisMat0, n.k, sparOmega, lambda2, smoOmega1, maxInt = 10^3,
# epsilon = 1E-20, printDetail = F, shrinkScale,accelrt, numCovs, designMat1, basisMat1)
#Hp <-sparOmega + lambda2*smoOmega1
#see21= fitProxGradCppold(theta, stepSize,lambda1, dat, basisMat0, n.k, sparOmega, lambda2, smoOmega1, maxInt = 10^5,
# epsilon = 1E-6, shrinkScale,accelrt, numCovs, designMat1, basisMat1, truncation)
#see2
#all.equal(see2, see21)
ssfit=see2
Hp <- (1-lambda2)* sparOmega + lambda2*smoOmega1
nk = n.k
optimcheck <- function(ssfit, lambda1, Hp, nk,eqDelta= 10^-5, uneqDelta=10^-5){
thetaSep <- ssfit$thetaEstSep[-1]
zeroCovs <- unlist(lapply( thetaSep, function(x){all(x==0)}))
indOptimRes <- rep(NA, length(zeroCovs))
zeroCovid <- which(zeroCovs)
nonzeroCovid <- which(!zeroCovs)
for(p in nonzeroCovid ){
ap = -ssfit$gNeg2loglik[(p*nk+1) :((p+1)*nk)]
# ap = 2* t(designMat1[[p]]) %*% (dat$Meth_Counts-dat$Total_Counts*ssfit$pi_ij)
top = Hp %*% thetaSep[[p]]
denom =sqrt(sum(top * thetaSep[[p]] ))
term2 = top/denom*lambda1
indOptimRes[p]=sqrt(sum((ap - term2)^2)) <=eqDelta
}
for(p in zeroCovid){
ap = -ssfit$gNeg2loglik[(p*nk+1) :((p+1)*nk)]
temp1 = Hp %*% ap
indOptimRes[p]= lambda1 -sqrt(sum(temp1*ap)) >= uneqDelta
}
return(indOptimRes)
}
optimcheck(see2, lambda1=10,Hp, nk = n.k, eqDelta = 1, uneqDelta = 10^-3)
Hp <- (1-lambda2)* sparOmega + lambda2*smoOmega1
optimcheck(see2,lambda1=lambda1, Hp, nk = n.k)
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.