####------------------- simulation testinfo -----------------------####
# devtools::load_all()
# library(doParallel)
library(doMPI)
library(MFCblockInfo)
####------------------- simulation design -------------------------####
# design.load.all <- readRDS("simulation/design_load_all_5-15_equal.rds")
design.load.all <- readRDS("design_load_all_5-15_equal.rds")
factor.blocksize <- 2:4
factor.keying <- "0" # c("0","12","23")
factor.int <- c("random", "ordered")
factor.load <- "acceptable"
factor.length <- "long"
factor.algorithm <- c("greedy-a","greedy-d","opt-t","mean-a","r2","loads","random")
factor.constraints <- "unconstrained" # c("unconstrained","constrained")
factor.target <- "weighted" # c("weighted","equal")
factor.ntraits <- "5"
#number of replications
R <- 200 #500
design.sim <- expand.grid("blocksize"=factor.blocksize, "keying"=factor.keying, "length"=factor.length, "intercepts"=factor.int,
"loads"=factor.load,
"constraints"=factor.constraints, "target"=factor.target, "ntraits"=factor.ntraits,
"rep"=1:R)
####-------------------- fixed conditions -------------------------####
#trait correlations (Big 5 from meta-analysis van der Linden et al.)
trait.cov.5 <- matrix(c(1,-.36,-.17,-.36,-.43,
-.36,1,.43,.26,.29,
-.17,.43,1,.21,.20,
-.36,.26,.21,1,.43,
-.43,.29,.20,.43,1),
nrow=5,ncol=5)
#combine both trait covariance matrices to a list
trait.cov.list <- list("5"=trait.cov.5)
int.range <- list("small"=c(-1,1), "large"=c(-2,2))
load.range <- list("good"=c(.65,.95), "acceptable"=c(.45,.95))
#create grid of traits if traits are not given
tr.levels <- c(-1,0,1)
tr.list <- vector("list", ncol(trait.cov.5))
for(tr in 1:length(tr.list)) tr.list[[tr]] <- tr.levels
traits.grid.5 <- expand.grid(tr.list)
#for 15 traits this is not feasible -> 3^15 = 4348907 trait levels
#draw random sample of 500 instead
set.seed(515)
traits.grid.15 <- mvtnorm::rmvnorm(n=500, sigma=diag(15)) # uncorrelated
#add all 0 as reference point
if(isFALSE(any(rowSums(traits.grid.15==0)==15))) traits.grid.15 <- rbind(traits.grid.15, rep(0,15))
traits.grid.list <- list("5"=traits.grid.5, "15"=traits.grid.15)
#reduce for testing
# traits.grid.list <- lapply(traits.grid.list, function(tl) rbind(tl[1:5,], rep(0, ncol(tl))))
traits.grid.list <- list("5" = matrix(1, 1, 5))
J <- 500 #Number of participants
####------------------ start simulation -------------------####
# cl <- makeCluster(10)
# registerDoParallel(cl)
cl <- startMPIcluster()
registerDoMPI(cl)
sinkWorkerOutput(paste0("worker_iter_post.out"))
# define chunkSize so that each cluster worker gets a single task chunk
chunkSize <- ceiling(R/getDoParWorkers())
mpiopts <- list(chunkSize=chunkSize)
# res <- foreach(d=1:nrow(design.sim), .packages=c("mvtnorm","numDeriv","devtools"), .combine=rbind) %dopar% {
#
res <- foreach (d=1:nrow(design.sim), .combine=rbind, .verbose=T, .packages=c("mvtnorm","numDeriv","devtools","lpSolveAPI","MFCblockInfo"),
.inorder=F, .errorhandling="remove", .options.mpi=mpiopts) %dopar% {
set.seed(1204+d)
####------------------- test design -----------------------####
#select design load according to test design condition
design.load <- design.load.all[[as.character(design.sim[d,"ntraits"])]][[as.character(design.sim[d,"blocksize"])]][["0"]]
#quadruple
design.load <- rbind(design.load, design.load, design.load, design.load)
nb <- design.sim[d,"blocksize"]
K <- nrow(design.load)/nb
blocks <- create.block.ind(K, nb)
#specifications for lp model
#final test length
K.final <- K/4
####------------------ simulate item parameters -------------------####
items <- sim.items(design.load=design.load, K=K, nb=nb,
load.range=load.range[[as.character(design.sim[d,"loads"])]],
int.range=int.range[["large"]])
if(as.character(design.sim[d, "intercepts"]) == "ordered") {
u.mean.size <- cut(items$u.mean, quantile(items$u.mean), include.lowest = TRUE, labels = FALSE)
items$u.mean <- items$u.mean[order(u.mean.size)]
}
####-------------------------------- traits and responses --------------------------####
trait.cov <- trait.cov.list[[as.character(design.sim[d,"ntraits"])]]
traits.grid <- traits.grid.list[[as.character(design.sim[d,"ntraits"])]]
# with B5 trait correlations, but sd = .5, mean = 1
traits <- rmvnorm(J, rep(0, ncol(traits.grid)), sigma = trait.cov, method="chol")
#weights for opt
weights.grid <- a.all <- 1
responses <- sim.responses(traits, items, design.load, K, nb, return.index=F)
####------------------- constraints -----------------------------------####
if(as.character(design.sim[d,"constraints"])=="constrained") {
#constraints on items per trait
traits.blocks <- create.traits.blocks(loads=design.load, which.blocks=1:K, nb=nb)
traits.blocks.ind <- do.call(cbind, (lapply(1:ncol(design.load), function(f, tb) apply(tb, 1, function(rw) ifelse(f %in% rw, 1, 0)), tb=traits.blocks)))
n.traits <- rep(K.final/ncol(design.load)*nb, ncol(design.load))
#constraints on item keying (comparisons between opposite-keyed items)
#at least 1/2 of pairwise comparisons between differently keyed items
#this makes 1/2, 3/4, 1 mixed keyed blocks for block sizes 2,3,4
loads.blocks <- t(apply(blocks, 1, function(b, dl) colSums(dl[b,]), dl=design.load))
block.mixed <- ifelse(rowSums(loads.blocks)==nb, 0, 1)
n.mixed <- design.sim[d,"blocksize"]/4*K.final
#at least 1 negatively keyed item per trait
traits.neg.ind <- apply(loads.blocks, 2, function(rw) ifelse(rw==-1, 1, 0))
n.neg <- rep(1, ncol(design.load))
#combine to constraint.list
constraint.list <- list("left"=cbind(traits.blocks.ind, block.mixed, traits.neg.ind),
"operator"=c(rep("=",ncol(traits.blocks.ind)), ">=", rep(">=",ncol(traits.neg.ind))),
"right"=c(n.traits, n.mixed, n.neg))
} else {
constraint.list <- NULL
}
####------------------- T-optimality --------------------------------####
load.mat <- items$loads * design.load
gamma.true <- create.design.mat(K=K, nb=nb) %*% items$u.mean
infos <- calc.info.block(lhb.mplus, traits=as.matrix(traits.grid), int=gamma.true, loads=load.mat, uni=diag(items$uni),
K=K, nb=nb)
#trace for each block (and grid point)
info.trace <- calc.info.trace(infos, prior = trait.cov)
####------------ MIP algorithm with T-optimality -----------------------####
ind.t.opt <- select.optimal(info.sum=info.trace, traits.grid=traits.grid, K=K, K.final=K.final,
constraint.list=constraint.list, weights.grid=weights.grid)$ind.opt
####---------------- block selection based on R^2 ----------------------####
#R^2 mean across persons and traits, weighted
means.r2 <- do.call(c, lapply(1:K, function(k, i, p) {
mean(rowMeans(calc.info.block.r2(i, wo.blocks=k, prior = p))*a.all)
},
i=infos, p = trait.cov))
means.r2 <- matrix(means.r2, 1, K)
ind.r2 <- select.optimal(info.sum=means.r2, traits.grid=matrix(0,1,1), K=K, K.final=K.final,
constraint.list=constraint.list)$ind.opt
#A-optimality mean across persons and traits, weighted
means.a <- calc.a.optimality(infos, prior = trait.cov, summed = FALSE)*a.all
means.a <- matrix(means.a, 1, K)
ind.a.mean <- select.optimal(info.sum=means.a, traits.grid=matrix(0,1,1), K=K, K.final=K.final,
constraint.list=constraint.list, direction = "min")$ind.opt
####-------------- greedy algorithm with A-optimality and D-optimality ----------------####
ind.a.opt <- select.greedy(infos, calc.a.optimality,
traits.grid, K, K.start=0, K.final, maximize=FALSE, weights.grid=weights.grid,
prior=trait.cov)
ind.d.opt <- select.greedy(infos, calc.d.optimality,
traits.grid, K, K.start=0, K.final, maximize=TRUE, weights.grid=weights.grid,
prior=trait.cov)
####---------------- item selection based on loadings ------------------####
loads.blocks <- t(apply(blocks, 1, function(b, dl) colSums(dl[b,]), dl=load.mat))
means.loads <- matrix(rowMeans(abs(loads.blocks)), 1, K)
ind.loads <- select.optimal(info.sum=means.loads, traits.grid=matrix(0,1,1), K=K, K.final=K.final,
constraint.list=constraint.list)$ind.opt
####---------------- random item selection ------------------####
ind.rand <- select.optimal(info.sum=matrix(runif(K, 0, 1), 1, K), traits.grid=matrix(0,1,1), K=K, K.final=K.final,
constraint.list=constraint.list)$ind.opt
####---------------- trait estimation and summary measures -------------####
results.list <- list("greedy-a"=ind.a.opt, "greedy-d"=ind.d.opt, "opt-t"=ind.t.opt,
"mean-a"=ind.a.mean, "r2"=ind.r2, "loads"=ind.loads, "random"=ind.rand)
testinfo <- colSums(infos[[1]], dims = 1) + solve(trait.cov)
res.r <- NULL
for (a in factor.algorithm) {
if(all(results.list[[as.character(a)]])) {
blocks.ind <- c(t(blocks[results.list[[as.character(a)]],]))
gamma.true <- create.design.mat(K=K.final, nb=nb) %*% items$u.mean[blocks.ind]
# estimate traits based on new questionnaire
estimates <- est.MAP(FUN=lhb.mplus, responses=responses$rankindices[,results.list[[as.character(a)]]],
int=gamma.true, loads=load.mat[blocks.ind,], uni=diag(items$uni)[blocks.ind,blocks.ind],
perms=permute(1:nb), nb=nb,
m.prior=rep(0,ncol(design.load)), s.prior=trait.cov, SE=FALSE)$traits
rec <- diag(cor(estimates, traits))
RMSE <- colMeans((estimates - traits)^2)
MAB <- colMeans(abs(estimates - traits))
sens <- colSums((estimates > 1) & (traits > 1)) / colSums(traits > 1) # sensitivity: correctly classified as > 1 among > 1
spec <- colSums((estimates < 1) & (traits < 1)) / colSums(traits < 1) # specificity: correctly classified as < 1 amont < 1
infos.a <- lapply(infos, function(i, ind) i[ind,,], ind = results.list[[as.character(a)]])
A <- calc.a.optimality(infos.a, prior = trait.cov)
D <- calc.d.optimality(infos.a, prior = trait.cov)
testinfo.a <- colSums(infos.a[[1]], dims = 1) + solve(trait.cov)
T.opt <- sum(diag(testinfo.a))
Frob <- norm(testinfo.a %*% solve(testinfo) - diag(ncol(testinfo)), type = "F")
res.r <- rbind(res.r,
data.frame(design.sim[d,], "trait"=1:ncol(design.load), "algorithm"=a,
rec, RMSE, MAB, sens, spec, A, D, T.opt, Frob))
} else {
res.r <- data.frame(design.sim[d,], "trait"=1:ncol(design.load), "algorithm"="opt",
rec=NA, RMSE=NA, MAB=NA, sens=NA, spec=NA, A=NA, D=NA, T.opt=NA, Frob=NA)
}
}
saveRDS(res.r, file=paste0("results_opt_grid1_posterior_poskeyed/results_opt_grid1_posterior_poskeyed_d",d,".rds"))
res.r
}
saveRDS(res, file="results_simulation_opt_grid1_posterior_poskeyed.rds")
# stopCluster(cl)
closeCluster(cl)
mpi.quit()
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.