inst/scripts/svy2lmesim2.R

library(lme4)
library(svylme)


library(parallel)
RNGkind("L'Ecuyer-CMRG")
mcreplicate<-function(n, expr,...){
    l<-mclapply(integer(n), eval.parent(substitute(function(...) expr)), mc.cores=6,mc.set.seed = TRUE, mc.preschedule=TRUE)
    simplify2array(l, higher = TRUE)
    }


set.seed(2023-6-20)

N1=400 
N2=400 
latitude<-1:N2
longitude<-1:N1
population<-expand.grid(lat=latitude,long=longitude)
population$PSU<-population$long
overlap=ceiling(N2*1/2)


cflmer<-function(model){
    a<-VarCorr(model)
    c(fixef(model), as.vector(unlist(a[1:2])), attr(a,"sc")^2, SE(model), c(0,0))
    }
cfsvy<-function(model){
    a<-coef(model, random=TRUE)
    c(coef(model), diag(a$varb),a$s2,SE(model),c(0,0))
    }

cfglm<-function(model){c(coef(model),c(0,0), SE(model), c(0,0))}

model_cluster<-function(population, overlap){
   population$cluster<-numeric(nrow(population))
   
   id<-ifelse(population$lat<=overlap, 
              population$long, 
              ((population$long+population$lat-overlap) %% N1)+1
   )
   population$cluster<-id
   population	
}


f<-function(overlap,REPS=1000){
    
    population<-model_cluster(population,overlap)
    population$x<- population$long %% 40
    population$z<-rnorm(400*400)
    population$u<-sort(rnorm(400))[population$cluster]
    population$y<- with(population, x+z + u+rnorm(400*400))    
    
    population$strata<-(population$long-1) %/% 40
    population$uid<-1:nrow(population)
    
    true<-cflmer(lmer(y~x+z+(1|cluster), population))
    
    rr<-mcreplicate(REPS, {
        
        stratsize<- c(20,5,4,3,2,2,3,4,5,20)
        names(stratsize)<-unique(population$strata)
        sstrat<-stratsample(population$strata[!duplicated(population$PSU)], stratsize)
        
        stage1psu<- population$PSU[!duplicated(population$PSU)][sstrat]
        stage1<- subset(population, PSU %in% stage1psu)
        
        
        stratsize2<-rep(c(20,8,20),c(1,66,1))
        names(stratsize2)<-unique(stage1$PSU)
        stage2<-stage1[stratsample(stage1$PSU, stratsize2),]
        
    
        stage2$fpc1<-400/10
        stage2$fpc2<-400
        des<-svydesign(id=~PSU+uid, fpc=~fpc1+fpc2, strata=~strata,data=stage2)
        pair<-svy2lme(y~x+z+(1|cluster), design=des,return.devfun=TRUE)
        jkdes<-as.svrepdesign(des)
        jkvar<-boot2lme(pair,jkdes)
        
        c(
            cfsvy(pair),
            ##cflmer(lmer(y~x+z+(1|cluster), population)),
            cflmer(lmer(y~x+z+(1|cluster), stage2)),
            cfglm(svyglm(y~x+z+(1|cluster), design=des)),
            rep(0,5),SE(jkvar,"beta"), SE(jkvar,"fullVar"), sqrt(vcov(jkvar,"s2"))
        )
    })

    list(
        overlap=overlap/N2,
        true=true,
        median=matrix(apply(rr, 1, median),byrow=TRUE,nrow=4),
        mad=matrix(apply(rr, 1, mad),byrow=TRUE,nrow=4)
    )
}


##results<- lapply(c(0.1,0.25,0.5,0.75,0.9,1)*N2, f)


results_0.25<-replicate(100, f(N2*1/4))
results_0.75<-replicate(100, f(N2*3/4))
save(results_0.25,results_0.75, file="~/svy2lmesim-crossed1.rda")


## summaries
## > round(rowMeans(sapply(results_0.75["median",],function(x) x[1,])),3)
## [1] -0.121  1.006  1.000  0.993  0.965  0.247  0.010  0.078
## > round(rowMeans(sapply(results_0.75["mad",],function(x) x[1,])),3)
## [1] 0.278 0.013 0.092 0.189 0.126 0.072 0.003 0.021
tslumley/svylme documentation built on Feb. 10, 2024, 11:01 p.m.