R/coupledMetropolis.R

#library('label.switching')
#library('doParallel')
#library('foreach')
#library('coda')

myDirichlet <- function(alpha){
	k <- length(alpha)
	theta <- rgamma(k, shape = alpha, rate = 1)
	return(theta/sum(theta))
}



toSolve <- function(a,n,p0){
	myVals <- exp(lgamma(2*a) - lgamma(a) + lgamma(a+n) - lgamma(2*a + n) + log(2))
	l <- abs(myVals - p0)
	return(a[which(l == min(l))][1])

}




complete.loglikelihood<-function(x,z,pars){
	g <- dim(pars)[1]
	n <- dim(x)[1]
	J <- dim(pars)[2]
	d <- dim(x)[2]
	logl <- rep(0, n)
	logpi <- log(pars[,J])
	z <- as.numeric(z)
	for (j in 1:d){
		logl <- logl + dbinom(x[,j], size = 1, prob = pars[,j][z], log = TRUE) 
	}
	logl <- logl + logpi[z]
	return(sum(logl))
}


gibbsBinMix <- function(alpha,beta,gamma,K,m,burn,data,thinning,z.true,outputDir){
	if (missing(K)) {stop(cat(paste("    [ERROR]: number of clusters (K) not provided."), "\n"))}
	if (missing(m)) {stop(cat(paste("    [ERROR]: number of MCMC iterations (m) not provided."), "\n"))}
	if (missing(thinning)) {thinning <- 5}
	if (K < 2) {
		stop(cat(paste("    [ERROR]: number of clusters (K) should be at least equal to 2."), "\n"))
	}
	d <- dim(data)[2]
	if (burn > m - 1) {
		stop(cat(paste("    [ERROR]: burn-in period (burn) not valid"), "\n"))
	}
	if (burn < 0) {
		stop(cat(paste("    [ERROR]: burn-in period (burn) not valid"), "\n"))
	}
	if (thinning > m) {
		stop(cat(paste("    [ERROR]: thinning not valid."), "\n"))
	}
	if (m < 1) {
		stop(cat(paste("    [ERROR]: mcmc iterations (m) not valid."), "\n"))
	}
	if (missing(alpha)) {alpha <- 1}
	if (missing(beta)) {beta <- 1}
	if (missing(gamma)) {gamma <- rep(1,K)}
	if (missing(data)) {stop(cat(paste("    [ERROR]: data is missing."), "\n"))}
	n <- dim(data)[1]
	x <- data

	dir.create(outputDir)
	setwd(outputDir)


	p <- myDirichlet(rep(1,K)) # initial values for cluster probabilities
	theta <- array(data = runif(K*d), dim = c(K,d)) # initial values for response probabilities
	z <- sample(K,n,replace=TRUE,prob = p)
	s <- l <- newL <- numeric(K)
	sx <- array(data = 0, dim = c(K,d))
	#output
	theta.file <- "theta.txt"
	z.file <- "z.txt"
	p.file <- "p.txt"
	conTheta = file(theta.file,open = "w")
	conZ = file(z.file,open = "w")
	conP = file(p.file,open = "w")

	for (iter in 1:m){
		#update cluster allocations (z)
		s <- rep(0,K)
		sx <- array(data = 0, dim = c(K,d))
		for(i in 1:n){
			for(k in 1:K){
				#l[k] <-  p[k]*prod((theta[k,]^x[i,])*((1-theta[k,])^(1-x[i,])))
				l[k] <-  log(p[k]) + sum(x[i,]*log(theta[k,]) + (1-x[i,])*log(1-theta[k,]))
			}
			for(k in 1:K){
				newL[k] <-  1/sum(exp(l - l[k]))
			}
			z[i] <- sample(K,1,prob = newL)
			#z[i] <- sample(K,1,prob = l)		
			s[z[i]] <- s[z[i]] + 1
			sx[z[i],] <- sx[z[i],] + x[i,]
		}
		p <- myDirichlet(gamma + s)
		for(k in 1:K){
			theta[k,] <- rbeta(d, shape1 = alpha + sx[k,], shape2 = beta + s[k] - sx[k,])
		}
		if((iter %% thinning == 0)&(iter > burn)){
			cat(theta,"\n",file=conTheta)
			cat(z,"\n",file=conZ)
			cat(p,"\n",file=conP)		
		}
		if(iter %% (m/100) == 0){
			cat(paste("Running Gibbs: ",100*round(iter/m,3),"% completed.",sep=""),"\n");
		}
	}
	close(conTheta)
	close(conP)
	close(conZ)
	cat(paste("Gibbs finished."),"\n")
	cat("\n")
	cat(paste("Dealing with Label Switching..."),"\n")
	tt <- read.table("theta.txt")
	m <- dim(tt)[1]
	d <- dim(x)[2]
	J <- d + 1
	mcmc <- array(data = NA, dim = c(m,K,J))
	for (j in 1:d){
		for(k in 1:K){
			mcmc[,k,j] <- tt[,(j-1)*K + k]
		}
	}
	tt <- read.table("p.txt")
	for(k in 1:K){
		mcmc[,k,J] <- tt[,k]
	}
	allocations <- as.matrix(read.table("z.txt",as.is = TRUE))
	m <- dim(mcmc)[1]
	iter <- 1
	ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,])
	maxLL <- ll
	maxIter <- iter
	for (iter in 1:m){
		ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,])
		if(ll > maxLL){maxLL <- ll;maxIter <- iter;cat(paste("Found new Complete MLE: ", ll,sep=""),"\n")}
	}
	# classification probs
	pMatrix <- array(data = NA, dim = c(m,n,K))
	for (iter in 1:m){
		p <- mcmc[iter,,J]
		theta <- array( mcmc[iter,,1:(J-1)],dim = c(K,J-1) )
		for(i in 1:n){
			for(k in 1:K){
				#pMatrix[iter,i,k] <-  p[k]*prod((theta[k,]^x[i,])*((1-theta[k,])^(1-x[i,])))
				l[k] <- log(p[k]) + sum(x[i,]*log(theta[k,]) + (1-x[i,])*log(1-theta[k,]))
			}
			#pMatrix[iter,i,] <- pMatrix[iter,i,]/sum(pMatrix[iter,i,])
			for(k in 1:K){
				pMatrix[iter,i,k] <- 1/sum(exp(l - l[k]))
				if(is.na(pMatrix[iter,i,k]) == TRUE){pMatrix[iter,i,k] = 0}
			}
		}
		if(iter %% 1000 == 0){cat(paste(" classification probs: ",100*round(iter/m,3),"% completed",sep=""),"\n");}
	}

	if(missing(z.true)==TRUE){
		ls <- label.switching( K = K, method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
					zpivot = allocations[maxIter,], z = allocations, complete = complete.loglikelihood, data = x,
					mcmc = mcmc,prapivot = mcmc[maxIter,,], p = pMatrix)
	}else{
		ls <- label.switching( K = K, method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
					zpivot = allocations[maxIter,], z = allocations, complete = complete.loglikelihood, data = x,
					mcmc = mcmc,p = pMatrix,groundTruth = z.true)
	}
	#reordering allocations
	allocationsECR <- allocationsKL <- allocationsECR.ITERATIVE1 <- allocations
	for (i in 1:m){
		myPerm <- order(ls$permutations$"ECR"[i,])
		allocationsECR[i,] <- myPerm[allocations[i,]]
		myPerm <- order(ls$permutations$"STEPHENS"[i,])
		allocationsKL[i,] <- myPerm[allocations[i,]]
		myPerm <- order(ls$permutations$"ECR-ITERATIVE-1"[i,])
		allocationsECR.ITERATIVE1[i,] <- myPerm[allocations[i,]]

	}
	write.table(allocationsECR, file = "z.ECR.txt")
	write.table(allocationsKL, file = "z.KL.txt")
	write.table(allocationsECR.ITERATIVE1, file = "z.ECR-ITERATIVE1.txt")



	reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR")$output
	tt <- read.table("theta.txt")
	write.table(reordered.mcmc, file = "reorderedMCMC-ECR.txt",col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
	reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR-ITERATIVE-1")$output
	write.table(reordered.mcmc, file = "reorderedMCMC-ECR-ITERATIVE1.txt",col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
	reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"STEPHENS")$output
	write.table(reordered.mcmc, file = "reorderedMCMC-STEPHENS.txt",col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
	write.table(mcmc, file = "rawMCMC.txt",col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
	write.table(file = "reorderedSingleBestClusterings.txt",t(ls$clusters[c(1,2,3),]),row.names = paste("z",1:n,sep="."))
	file.remove("p.txt")
	file.remove("theta.txt")
	cat(paste("raw MCMC parameters written to: \'rawMCMC.txt\' "),"\n")
	cat(paste("raw MCMC latent allocations written to: \'z.txt\' "),"\n")
	cat(paste("reordered MCMC output written to: "),"\n")
	cat(paste("     (Method 1):     \'reorderedMCMC-ECR.txt\'"),"\n")
	cat(paste("     (Method 2):     \'reorderedMCMC-ECR-ITERATIVE1.txt\'"),"\n")
	cat(paste("     (Method 3):     \'reorderedMCMC-STEPHENS.txt\'"),"\n")
	cat(paste("reordered single best clusterings written to: \'reorderedSingleBestClusterings.txt\' "),"\n")
	cat(paste("reordered MCMC latent allocations written to: "),"\n")
	cat(paste("     (Method 1):     \'z.ECR.txt\'"),"\n")
	cat(paste("     (Method 2):     \'z.KL.txt\'"),"\n")
	cat(paste("     (Method 3):     \'z.ECR-ITERATIVE1.txt\'"),"\n")
	setwd("../")

}



collapsedGibbsBinMix <- function(alpha,beta,gamma,K,m,burn,data,thinning,z.true,outputDir){
	if (missing(K)) {stop(cat(paste("    [ERROR]: number of clusters (K) not provided."), "\n"))}
	if (missing(m)) {stop(cat(paste("    [ERROR]: number of MCMC iterations (m) not provided."), "\n"))}
	if (missing(thinning)) {thinning <- 5}
	d <- dim(data)[2]
	if (burn > m - 1) {
		stop(cat(paste("    [ERROR]: burn-in period (burn) not valid"), "\n"))
	}
	if (burn < 0) {
		stop(cat(paste("    [ERROR]: burn-in period (burn) not valid"), "\n"))
	}
	if (thinning > m) {
		stop(cat(paste("    [ERROR]: thinning not valid."), "\n"))
	}
	if (m < 1) {
		stop(cat(paste("    [ERROR]: mcmc iterations (m) not valid."), "\n"))
	}
	if (missing(alpha)) {alpha <- 1}
	if (missing(beta)) {beta <- 1}
	if (missing(gamma)) {gamma <- rep(1,K)}
	if (missing(data)) {stop(cat(paste("    [ERROR]: data is missing."), "\n"))}
	d <- dim(data)[2]
	n <- dim(data)[1]
	x <- data

	dir.create(outputDir)
	setwd(outputDir)

	p <- myDirichlet(rep(1,K)) # initial values for cluster probabilities
	theta <- array(data = runif(K*d), dim = c(K,d)) # initial values for response probabilities
	z <- sample(K,n,replace=TRUE,prob = p)

	s <- l <- newL <- numeric(K)
	sx <- array(data = 0, dim = c(K,d))
	#output
	theta.file <- "theta.collapsed.txt"
	z.file <- "z.collapsed.txt"
	p.file <- "p.collapsed.txt"
	conTheta = file(theta.file,open = "w")
	conZ = file(z.file,open = "w")
	conP = file(p.file,open = "w")
#	initialization with standard Gibbs 
	for (iter in 1:100){
		s <- rep(0,K)
		sx <- array(data = 0, dim = c(K,d))
		for(i in 1:n){
			for(k in 1:K){
				l[k] <-  log(p[k]) + sum(x[i,]*log(theta[k,]) + (1-x[i,])*log(1-theta[k,]))
			}
			for(k in 1:K){
				newL[k] <-  1/sum(exp(l - l[k]))
			}
			z[i] <- sample(K,1,prob = newL)
			s[z[i]] <- s[z[i]] + 1
			sx[z[i],] <- sx[z[i],] + x[i,]
		}
		p <- myDirichlet(gamma + s)
		for(k in 1:K){
			theta[k,] <- rbeta(d, shape1 = alpha + sx[k,], shape2 = beta + s[k] - sx[k,])
		}
	}
#	collapsed sampler
	nMatrix <- array(data = 0, dim = c(n,K))
	sMatrix <- array(data = 0, dim = c(n,K,d))

	for (i in 1:n){
		nMatrix[i,] <- s
		sMatrix[i,,] <- sx
	}
	for (i in 1:n){
		nMatrix[i,z[i]] <- nMatrix[i,z[i]] - 1
		for (j in 1:d){
			sMatrix[i,z[i],j] <- sMatrix[i,z[i],j] - x[i,j]
		}
	}

	reallocationAcceptanceRatio <- 0
	reallocationAcceptanceRatio2 <- 0
	a1 <- a2 <- 1 #parameters of Beta for the reallocation proposal
	lar <- c()
	for(iter in 1:m){
		zOld <- z
		for(i in 1:n){
			nMatrix[i,1:K] <- s[1:K]
			sMatrix[i,1:K,] <- sx[1:K,]
			nMatrix[i,z[i]] <- s[z[i]] - 1
			sMatrix[i,z[i],] <- sx[z[i],] - x[i,]

			A1 <- which(x[i,] == 1)
			A0 <- which(x[i,] == 0)
			for(k in 1:K){
				newL[k] <- log(nMatrix[i,k] + gamma[k]) - d*log(alpha + beta + nMatrix[i,k])
				if(length(A1 > 0)){
					newL[k] <- newL[k] + sum(log(alpha + sMatrix[i,k,A1]))
				}
				if(length(A0 > 0)){
					newL[k] <- newL[k] + sum(log(beta + nMatrix[i,k] - sMatrix[i,k,A0]))
				}
			}
			newL[1:K] <- exp(newL[1:K])
			z[i] <- sample(K,1,prob = newL[1:K])
			#if( zOld[i] != z[i] ){
			sx[zOld[i],] <- sx[zOld[i],] - x[i,]
			sx[z[i],] <- sx[z[i],] + x[i,]
			s[zOld[i]] <- s[zOld[i]] - 1
			s[z[i]] <- s[z[i]] + 1
		}


#		reallocation proposal 1
		if (K > 1){
			myPair <- sample(K,2,replace = FALSE)
			propZ <- z
			set1 <- which(z == myPair[1])
			set2 <- which(z == myPair[2])
			myP <- rbeta(1,shape1 = gamma[myPair[1]],shape2 = gamma[myPair[2]])
			propZ[c(set1,set2)] <- myPair[sample(2,length(set1) + length(set2), replace = TRUE,prob = c(myP,1-myP) )]
			newSet1 <- which(propZ == myPair[1])
			newSet2 <- which(propZ == myPair[2])
			nNew <- c(length(newSet1),length(newSet2))
			nOld <- c(length(set1),length(set2))
			if(nOld[1] == 0){sOld1 <- rep(0,d)}else{sOld1 <- colSums(array(x[set1,],dim = c(nOld[1],d)))}
			if(nOld[2] == 0){sOld2 <- rep(0,d)}else{sOld2 <- colSums(array(x[set2,],dim = c(nOld[2],d)))}
			sOld <- rbind(sOld1,sOld2)
			if(nNew[1] == 0){sNew1 <- rep(0,d)}else{sNew1 <- colSums(array(x[newSet1,],dim = c(nNew[1],d)))}
			if(nNew[2] == 0){sNew2 <- rep(0,d)}else{sNew2 <- colSums(array(x[newSet2,],dim = c(nNew[2],d)))}
			sNew <- rbind(sNew1,sNew2)
			logAR <- 0
			for (i in 1:2){
				logAR <- logAR + d*(lgamma(alpha + beta + nOld[i]) - lgamma(alpha + beta + nNew[i]) ) + sum(lgamma(alpha + sNew[i,]) + lgamma(beta + nNew[i] - sNew[i,]) - lgamma(alpha + sOld[i,]) - lgamma(beta + nOld[i] - sOld[i,]))
			}
			if( log(runif(1)) < logAR ){
				reallocationAcceptanceRatio <- reallocationAcceptanceRatio + 1 
				z <- propZ
				s <- rep(0,K)
				sx <- array(data = 0, dim = c(K,d))
				for(i in 1:n){
					s[z[i]] <- s[z[i]] + 1
					sx[z[i],] <- sx[z[i],] + x[i,]
				}
				for(i in 1:n){
					nMatrix[i,] <- s
					sMatrix[i,,] <- sx
				}
				for (i in 1:n){
					nMatrix[i,z[i]] <- nMatrix[i,z[i]] - 1
					for (j in 1:d){
						sMatrix[i,z[i],j] <- sMatrix[i,z[i],j] - x[i,j]
					}
				}
			}
		}
#		end of reallocation proposal 1

#		reallocation proposal2
		if(K > 1){
			myPair <- sample(K,2,replace = FALSE)
			set1 <- which(z == myPair[1])
			set2 <- which(z == myPair[2])
			nOld <- c(length(set1),length(set2))
			propZ <- z
			if(nOld[1] > 0){
				randomSize <- 1 + floor(nOld[1]*runif(1))
				randomIndex <- set1[sample(nOld[1],randomSize,replace = FALSE)]
				propZ[randomIndex] <- rep(myPair[2],randomSize)
				newSet1 <- which(propZ == myPair[1])
				newSet2 <- which(propZ == myPair[2])
				nNew <- c(length(newSet1),length(newSet2))
				if(nOld[1] == 0){sOld1 <- rep(0,d)}else{sOld1 <- colSums(array(x[set1,],dim = c(nOld[1],d)))}
				if(nOld[2] == 0){sOld2 <- rep(0,d)}else{sOld2 <- colSums(array(x[set2,],dim = c(nOld[2],d)))}
				sOld <- rbind(sOld1,sOld2)
				if(nNew[1] == 0){sNew1 <- rep(0,d)}else{sNew1 <- colSums(array(x[newSet1,],dim = c(nNew[1],d)))}
				if(nNew[2] == 0){sNew2 <- rep(0,d)}else{sNew2 <- colSums(array(x[newSet2,],dim = c(nNew[2],d)))}
				sNew <- rbind(sNew1,sNew2)
				logAR <- log(nOld[1]) - log(nOld[2] + randomSize) -( lgamma(nOld[1] - randomSize + 1) + lgamma(nOld[2]+ randomSize + 1) - lgamma(nOld[2] + 1) - lgamma(nOld[1] + 1))
				for(i in 1:2){
					logAR <- logAR + d*(lgamma(alpha + beta + nOld[i]) - lgamma(alpha + beta + nNew[i]) ) + sum(lgamma(alpha + sNew[i,]) + lgamma(beta + nNew[i] - sNew[i,]) - lgamma(alpha + sOld[i,]) - lgamma(beta + nOld[i] - sOld[i,]))
				}
				logAR <- logAR + sum(lgamma(gamma[myPair] + nNew)) - sum(lgamma(gamma[myPair] + nOld)) 
				if( log(runif(1)) < logAR ){
					reallocationAcceptanceRatio2 <- reallocationAcceptanceRatio2 + 1 
					z <- propZ
					s <- rep(0,K)
					sx <- array(data = 0, dim = c(K,d))
					for(i in 1:n){
						s[z[i]] <- s[z[i]] + 1
						sx[z[i],] <- sx[z[i],] + x[i,]
					}
					for(i in 1:n){
						nMatrix[i,] <- s
						sMatrix[i,,] <- sx
					}
					for (i in 1:n){
						nMatrix[i,z[i]] <- nMatrix[i,z[i]] - 1
						for (j in 1:d){
							sMatrix[i,z[i],j] <- sMatrix[i,z[i],j] - x[i,j]
						}
					}
				}
			}
		}

#		end of reallocation proposal 2
		if((iter %% thinning == 0)&(iter > burn)){
			for(k in 1:K){
				myIndex <- which(z == k)
				s[k] <- length(myIndex)
				if(s[k] > 1){
					sx[k,] <- colSums(x[myIndex,])
				}else{
					if(s[k] == 1){
						sx[k,] <- x[myIndex,]
					}else{
						sx[k,] <- rep(0,d)
					}

				}
				theta[k,] <- rbeta(d, shape1 = alpha + sx[k,], shape2 = beta + s[k] - sx[k,])
			}
			p <- myDirichlet(gamma + s)
		
			cat(theta,"\n",file=conTheta)
			cat(z,"\n",file=conZ)
			cat(p,"\n",file=conP)		
		}
		if(iter %% (m/100) == 0){cat(paste("Running collapsed Gibbs: ",100*round(iter/m,3),"% completed. Reallocation proposal acceptance rates: ", 100*round(reallocationAcceptanceRatio/iter,3),"%, ",100*round(reallocationAcceptanceRatio2/iter,3),"%.",sep=""),"\n");
		#matplot(read.table("p.collapsed.txt"),type = "l",lty = 1)
	}


	}

	close(conTheta)
	close(conP)
	close(conZ)
	cat(paste("Collapsed Gibbs finished."),"\n")
	cat("\n")
	if(K > 1){
		cat(paste("Dealing with Label Switching..."),"\n")
		tt <- read.table("theta.collapsed.txt")
		m <- dim(tt)[1]
		d <- dim(x)[2]
		J <- d + 1
		mcmc <- array(data = NA, dim = c(m,K,J))
		for (j in 1:d){
			for(k in 1:K){
				mcmc[,k,j] <- tt[,(j-1)*K + k]
			}
		}
		tt <- read.table("p.collapsed.txt")
		for(k in 1:K){
			mcmc[,k,J] <- tt[,k]
		}
		allocations <- as.matrix(read.table("z.collapsed.txt",as.is = TRUE))
		m <- dim(mcmc)[1]
		iter <- 1
		ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,])
		maxLL <- ll
		maxIter <- iter
		for (iter in 1:m){
			ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,])
			if(ll > maxLL){maxLL <- ll;maxIter <- iter;cat(paste("Found new Complete MLE: ", ll,sep=""),"\n")}
		}
		# classification probs
		pMatrix <- array(data = NA, dim = c(m,n,K))
		for (iter in 1:m){
			p <- mcmc[iter,,J]
			theta <- array( mcmc[iter,,1:(J-1)],dim = c(K,J-1) )
			for(i in 1:n){
				for(k in 1:K){
					l[k] <- log(p[k]) + sum(x[i,]*log(theta[k,]) + (1-x[i,])*log(1-theta[k,]))
				}
				for(k in 1:K){
					pMatrix[iter,i,k] <- 1/sum(exp(l - l[k]))
					if(is.na(pMatrix[iter,i,k]) == TRUE){pMatrix[iter,i,k] = 0}
				}
			}
			if(iter %% 1000 == 0){cat(paste(" classification probs: ",100*round(iter/m,3),"% completed",sep=""),"\n");}
		}


		if(missing(z.true)==TRUE){
			ls <- label.switching( method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
						zpivot = allocations[maxIter,], z = allocations,K = K, complete = complete.loglikelihood, data = x,
						prapivot = mcmc[maxIter,,], mcmc = mcmc, p = pMatrix)
		}else{
			ls <- label.switching( method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
						zpivot = allocations[maxIter,], z = allocations,K = K, complete = complete.loglikelihood, data = x,
						prapivot = mcmc[maxIter,,], mcmc = mcmc, p = pMatrix,groundTruth = z.true)
		}
		reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR")$output

		tt <- read.table("theta.collapsed.txt")

		write.table(reordered.mcmc, file = "reorderedMCMC-ECR.collapsed.txt",col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
		reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR-ITERATIVE-1")$output
		write.table(reordered.mcmc, file = "reorderedMCMC-ECR-ITERATIVE1.collapsed.txt",col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
		reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"STEPHENS")$output
		write.table(reordered.mcmc, file = "reorderedMCMC-STEPHENS.collapsed.txt",col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
		write.table(mcmc, file = "rawMCMC.collapsed.txt",col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
		write.table(file = "reorderedSingleBestClusterings.collapsed.txt",t(ls$clusters[c(1,2,3),]),row.names = paste("z",1:n,sep="."))
		file.remove("p.collapsed.txt")
		file.remove("theta.collapsed.txt")
		cat(paste("raw MCMC parameters written to: \'rawMCMC.collapsed.txt\' "),"\n")
		cat(paste("raw MCMC latent allocations written to: \'z.collapsed.txt\' "),"\n")
		cat(paste("reordered MCMC output written to: "),"\n")
		cat(paste("     (Method 1):     \'reorderedMCMC-ECR.collapsed.txt\'"),"\n")
		cat(paste("     (Method 2):     \'reorderedMCMC-ECR-ITERATIVE1.collapsed.txt\'"),"\n")
		cat(paste("     (Method 3):     \'reorderedMCMC-STEPHENS.collapsed.txt\'"),"\n")
		cat(paste("reordered single best clusterings written to: \'reorderedSingleBestClusterings.collapsed.txt\' "),"\n")
	}
	setwd("../")
}


######################################################




allocationSamplerBinMix <- function(Kmax, alpha,beta,gamma,m,burn,data,thinning,z.true,ClusterPrior,ejectionAlpha,Kstart,outputDir,metropolisMoves,reorderModels,heat,zStart,LS, rsX, originalX, printProgress){
#	if(dir.exists(outputDir) == TRUE){
#		stop(cat(paste("    [ERROR]: directory exists, please provide different name."), "\n"))
#	}
	 #dir.create(outputDir)
	setwd(outputDir)
	cat(paste0("changing working directory to ",outputDir),"\n")
	if (missing(m)) {stop(cat(paste("    [ERROR]: number of MCMC iterations (m) not provided."), "\n"))}
	if (missing(thinning)) {thinning <- 5}
	if (missing(LS)) {LS <- TRUE}
	if (missing(printProgress)) { printProgress <- FALSE }
	if (missing(ejectionAlpha)) {ejectionAlpha <- 1}
	if (burn > m - 1) {
		stop(cat(paste("    [ERROR]: burn-in period (burn) not valid"), "\n"))
	}
	if (burn < 0) {
		stop(cat(paste("    [ERROR]: burn-in period (burn) not valid"), "\n"))
	}
	if (thinning > m) {
		stop(cat(paste("    [ERROR]: thinning not valid."), "\n"))
	}
	if (m < 1) {
		stop(cat(paste("    [ERROR]: mcmc iterations (m) not valid."), "\n"))
	}
	if (missing(alpha)) {alpha <- 1}
	if (missing(beta)) {beta <- 1}
	if (missing(data)) {stop(cat(paste("    [ERROR]: data is missing."), "\n"))}
	x <- data
	d <- dim(data)[2]
	n <- dim(data)[1]
	if (missing(Kmax)) {Kmax <- floor((d + 1)/2)}
	if (missing(gamma)) {gamma <- rep(1,Kmax)}
	if (length(table(gamma)) > 1){
		stop(cat(paste("    [ERROR]: Dirichlet prior parameters should be the same."), "\n"))
	}
	birthProbs <- rep(1,Kmax)
	birthProbs[2:(Kmax - 1)] <- rep(0.5,Kmax - 2)
	birthProbs[Kmax] <- 0
	deathProbs <- 1 - birthProbs

	# define uniform or truncated poisson(1) prior on K
	priorK <- numeric(Kmax)
	if (missing(ClusterPrior)) {stop(cat(paste("    [ERROR]: ClusterPrior not defined (uniform of poisson)."), "\n"))}
	if (missing(ejectionAlpha)) {stop(cat(paste("    [ERROR]: ejectionAlpha not defined (0 < a < 1)."), "\n"))}
	if (ejectionAlpha < 0) {stop(cat(paste("    [ERROR]: ejectionAlpha error (0 < a < 1)."), "\n"))}
	if (ejectionAlpha > 1) {stop(cat(paste("    [ERROR]: ejectionAlpha error (0 < a < 1)."), "\n"))}
	if(ClusterPrior == "uniform"){
		priorK <- rep(log(1/Kmax),Kmax)
	}
	if(ClusterPrior == "poisson"){
		denom <- log(ppois(Kmax, lambda = 1, lower.tail = TRUE) - dpois(0,lambda = 1))
		for (k in 1:Kmax){
			priorK[k] <- dpois(k,lambda = 1, log = TRUE) - denom 
		}
	}
	if(missing(Kstart)){
		Kstart <- 1
	}
	K <- Kstart
	p <- myDirichlet(rep(1,K)) # initial values for cluster probabilities
	theta <- array(data = runif(Kmax*d), dim = c(Kmax,d)) # initial values for response probabilities
	s <- l <- newL <- numeric(Kmax)
	sx <- array(data = 0, dim = c(Kmax,d))


	if(missing(zStart) == TRUE){
		cat(paste("Initializing..."),"\n")
		cat("\n")
		z <- sample(K,n,replace=TRUE,prob = p)
		cat(paste("Allocation sampler running..."),"\n")
		cat("\n")
	}else{
		z <- zStart
		s[1:K] <- rep(0,K)
		sx[1:K,] <- array(data = 0, dim = c(K,d))
		for(i in 1:n){
			s[z[i]] <- s[z[i]] + 1
			sx[z[i],] <- sx[z[i],] + x[i,]
		}

	}

	#output
	k.file <- "K.txt"
	theta.file <- "theta.varK.txt"
	z.file <- "z.varK.txt"
	p.file <- "p.varK.txt"
	conK = file(k.file,open = "w")
	conTheta = file(theta.file,open = "w")
	conZ = file(z.file,open = "w")
	conP = file(p.file,open = "w")
#	initialization with standard Gibbs 
	#print("here1")
	#par(mfrow = c(1,1))
	if(missing(zStart) == TRUE){
	for (iter in 1:5){
		s[1:K] <- rep(0,K)
		sx[1:K,] <- array(data = 0, dim = c(K,d))
		for(i in 1:n){
			for(k in 1:K){
				l[k] <-  log(p[k]) + sum(x[i,]*log(theta[k,]) + (1-x[i,])*log(1-theta[k,]))
			}
			for(k in 1:K){
				newL[k] <-  1/sum(exp(l[1:K] - l[k]))
			}
			if(is.nan(sum(newL[1:K]))==TRUE){newL[1:K]<-rep(1,K)}
			z[i] <- sample(K,1,prob = newL[1:K])
			s[z[i]] <- s[z[i]] + 1
			sx[z[i],] <- sx[z[i],] + x[i,]
		}
		p <- myDirichlet(heat*gamma[1:K] + heat*s[1:K] + 1 - heat)
		for(k in 1:K){
			theta[k,] <- rbeta(d, shape1 = heat*alpha + heat*sx[k,] + 1 - heat, shape2 = heat*beta + heat*s[k] - heat*sx[k,] + 1 - heat)
		}

		
	}
	}

#	collapsed sampler
	nMatrix <- array(data = 0, dim = c(n,Kmax))
	sMatrix <- array(data = 0, dim = c(n,Kmax,d))
	#print("here2")

	for (i in 1:n){
		nMatrix[i,1:K] <- s[1:K]
		sMatrix[i,1:K,] <- sx[1:K,]
	}
	for (i in 1:n){
		nMatrix[i,z[i]] <- nMatrix[i,z[i]] - 1
		for (j in 1:d){
			sMatrix[i,z[i],j] <- sMatrix[i,z[i],j] - x[i,j]
		}
	}


	
	reallocationAcceptanceRatio <- 0
	reallocationAcceptanceRatio2 <- 0
	reallocationAcceptanceRatio3 <- 0
	reallocationAcceptanceRatio4 <- 0
	a1 <- a2 <- 1 #parameters of Beta for the reallocation proposal
	pZERO <- ejectionAlpha
	constLGAMMA <- 2*lgamma(ejectionAlpha) - lgamma(2*ejectionAlpha)
	kValues <- c()
	#plot(c(1,m),c(0,1),type = "n")
	if(missing(metropolisMoves) == TRUE){metropolisMoves <- c('M1','M2','M3','M4')}
	lmm <- 1/length(metropolisMoves)
	if( printProgress == TRUE){
		cat(paste("    Reallocation proposal acceptance rates: Move 1, Move 2, Move 3, Move 4"),"\n")
	}                           

	for(iter in 1:m){
		zOld <- z
		sOld <- s
		sxOld <- sx
		if(K > 1){
			myPair <- sample(K,2,replace = FALSE)
			j1 <- myPair[1]
			j2 <- myPair[2]
			set1 <- which(z == j1)
			set2 <- which(z == j2)
			zOld[set1] = rep(j2,length(set1))
			zOld[set2] = rep(j1,length(set2))
			z <- zOld
			sOld[j1] <- s[j2]
			sOld[j2] <- s[j1]
			sxOld[j1,] <- sx[j2,]
			sxOld[j2,] <- sx[j1,]
			s <- sOld
			sx <- sxOld
		}
		for(i in 1:n){
			nMatrix[i,1:K] <- s[1:K]
			sMatrix[i,1:K,] <- sx[1:K,]
			nMatrix[i,z[i]] <- s[z[i]] - 1
			sMatrix[i,z[i],] <- sx[z[i],] - x[i,]

			A1 <- which(x[i,] == 1)
			A0 <- which(x[i,] == 0)
			for(k in 1:K){
				newL[k] <- heat*log(nMatrix[i,k] + gamma[k]) - heat*d*log(alpha + beta + nMatrix[i,k])
				if(length(A1 > 0)){
					newL[k] <- newL[k] + heat*sum(log(alpha + sMatrix[i,k,A1]))
				}
				if(length(A0 > 0)){
					newL[k] <- newL[k] + heat*sum(log(beta + nMatrix[i,k] - sMatrix[i,k,A0]))
				}
			}
			newL[1:K] <- exp(newL[1:K])
			if( max(newL[1:K]) == 0){newL[1:K] <- rep(1,K);cat("oops","\n")}
			z[i] <- sample(K,1,prob = newL[1:K])
			#if( zOld[i] != z[i] ){
			sx[zOld[i],] <- sx[zOld[i],] - x[i,]
			sx[z[i],] <- sx[z[i],] + x[i,]
			s[zOld[i]] <- s[zOld[i]] - 1
			s[z[i]] <- s[z[i]] + 1
			#nMatrix[,z[i]] <- s[z[i]] - 1
			#sMatrix[,z[i],] <- sx[z[i],] - x[i,]
				#nMatrix[,zOld[i]] <- nMatrix[,zOld[i]] - 1
				#nMatrix[,z[i]] <- nMatrix[,z[i]] + 1
				#myMat <- matrix(rep(x[i,],n),nrow = n,byrow=TRUE)
				#sMatrix[,zOld[i],] <- sMatrix[,zOld[i],] - myMat
				#sMatrix[,z[i],] <- sMatrix[,z[i],] + myMat
			#}
		}
	mNumber <- sample(metropolisMoves,1)
	#mNumber <- 5


		if(mNumber == 'M1'){
#		if(1 > 2){
#		reallocation proposal 1
		if (K > 1){
			myPair <- sample(K,2,replace = FALSE)
			propZ <- z
			set1 <- which(z == myPair[1])
			set2 <- which(z == myPair[2])
			myP <- rbeta(1,shape1 = gamma[myPair[1]],shape2 = gamma[myPair[2]])
			propZ[c(set1,set2)] <- myPair[sample(2,length(set1) + length(set2), replace = TRUE,prob = c(myP,1-myP) )]
			newSet1 <- which(propZ == myPair[1])
			newSet2 <- which(propZ == myPair[2])
			nNew <- c(length(newSet1),length(newSet2))
			nOld <- c(length(set1),length(set2))
			if(nOld[1] == 0){sOld1 <- rep(0,d)}else{sOld1 <- colSums(array(x[set1,],dim = c(nOld[1],d)))}
			if(nOld[2] == 0){sOld2 <- rep(0,d)}else{sOld2 <- colSums(array(x[set2,],dim = c(nOld[2],d)))}
			sOld <- rbind(sOld1,sOld2)
			if(nNew[1] == 0){sNew1 <- rep(0,d)}else{sNew1 <- colSums(array(x[newSet1,],dim = c(nNew[1],d)))}
			if(nNew[2] == 0){sNew2 <- rep(0,d)}else{sNew2 <- colSums(array(x[newSet2,],dim = c(nNew[2],d)))}
			sNew <- rbind(sNew1,sNew2)
			logAR <- 0
			for (i in 1:2){
				logAR <- logAR + d*(lgamma(alpha + beta + nOld[i]) - lgamma(alpha + beta + nNew[i]) ) + sum(lgamma(alpha + sNew[i,]) + lgamma(beta + nNew[i] - sNew[i,]) - lgamma(alpha + sOld[i,]) - lgamma(beta + nOld[i] - sOld[i,]))
			}
			if(is.finite(logAR)){
			if( log(runif(1)) < logAR ){
				reallocationAcceptanceRatio <- reallocationAcceptanceRatio + 1 
				z <- propZ
				s <- rep(0,K)
				sx <- array(data = 0, dim = c(K,d))
				for(k in 1:K){
					ind <- which(z == k)
					tmpV <- numeric(n)
					tmpM <- array(data = 0,dim = c(n,d))
					s[k] <- length(ind)
					if(s[k] > 0){
						tmpV[ind] <- rep(1,s[k])
						tmpM[ind,] <- x[ind,]
						sx[k,] <- colSums(array(x[ind,],dim = c(s[k],d)))
					}
					nMatrix[,k] <- rep(s[k],n) - tmpV
					sMatrix[,k,] <- matrix(sx[k,],nrow = n,ncol = d,byrow = TRUE) - tmpM
				}
			}
			}
		}
		}
#		end of reallocation proposal 1
		if(mNumber == 'M2'){
#		reallocation proposal2
		if(K > 1){
			myPair <- sample(K,2,replace = FALSE)
			set1 <- which(z == myPair[1])
			set2 <- which(z == myPair[2])
			nOld <- c(length(set1),length(set2))
			propZ <- z
			if(nOld[1] > 0){
				randomSize <- 1 + floor(nOld[1]*runif(1))
				randomIndex <- set1[sample(nOld[1],randomSize,replace = FALSE)]
				propZ[randomIndex] <- rep(myPair[2],randomSize)
				newSet1 <- which(propZ == myPair[1])
				newSet2 <- which(propZ == myPair[2])
				nNew <- c(length(newSet1),length(newSet2))
				if(nOld[1] == 0){sOld1 <- rep(0,d)}else{sOld1 <- colSums(array(x[set1,],dim = c(nOld[1],d)))}
				if(nOld[2] == 0){sOld2 <- rep(0,d)}else{sOld2 <- colSums(array(x[set2,],dim = c(nOld[2],d)))}
				sOld <- rbind(sOld1,sOld2)
				if(nNew[1] == 0){sNew1 <- rep(0,d)}else{sNew1 <- colSums(array(x[newSet1,],dim = c(nNew[1],d)))}
				if(nNew[2] == 0){sNew2 <- rep(0,d)}else{sNew2 <- colSums(array(x[newSet2,],dim = c(nNew[2],d)))}
				sNew <- rbind(sNew1,sNew2)
				logAR <- log(nOld[1]) - log(nOld[2] + randomSize) -( lgamma(nOld[1] - randomSize + 1) + lgamma(nOld[2]+ randomSize + 1) - lgamma(nOld[2] + 1) - lgamma(nOld[1] + 1))
				for(i in 1:2){
					logAR <- logAR + heat*d*(lgamma(alpha + beta + nOld[i]) - lgamma(alpha + beta + nNew[i]) ) + heat*sum(lgamma(alpha + sNew[i,]) + lgamma(beta + nNew[i] - sNew[i,]) - lgamma(alpha + sOld[i,]) - lgamma(beta + nOld[i] - sOld[i,]))
				}
				logAR <- logAR + heat*sum(lgamma(gamma[myPair] + nNew)) - heat*sum(lgamma(gamma[myPair] + nOld)) 
				if(is.finite(logAR)){
				if( log(runif(1)) < logAR ){
					reallocationAcceptanceRatio2 <- reallocationAcceptanceRatio2 + 1 
					z <- propZ
					s <- rep(0,K)
					sx <- array(data = 0, dim = c(K,d))
					for(k in 1:K){
						ind <- which(z == k)
						tmpV <- numeric(n)
						tmpM <- array(data = 0,dim = c(n,d))
						s[k] <- length(ind)
						if(s[k] > 0){
							tmpV[ind] <- rep(1,s[k])
							tmpM[ind,] <- x[ind,]
							sx[k,] <- colSums(array(x[ind,],dim = c(s[k],d)))
						}
						nMatrix[,k] <- rep(s[k],n) - tmpV
						sMatrix[,k,] <- matrix(sx[k,],nrow = n,ncol = d,byrow = TRUE) - tmpM
					}
				}
				}
			}
		}
		}
#		end of reallocation proposal 2
#		} #remove this
#		update the number of clusters
		if(mNumber == 'M3'){
		if ( runif(1) < birthProbs[K] ){
		# BIRTH MOVE
			birth = TRUE
			myPair <- c(sample(K,1),K + 1)
			# myPair[1]: ejecting component
			# myPair[2]: ejected component
			set1 <- which(z == myPair[1])
			nOld <- c(length(set1),0)
			ejectionAlpha <- toSolve(seq(0.0001,2,length = 500),nOld[1],pZERO);constLGAMMA <- 2*lgamma(ejectionAlpha) - lgamma(2*ejectionAlpha)
			propZ <- z
			myP <- rbeta(1,shape1 = ejectionAlpha,shape2 = ejectionAlpha)
			propZ[set1] <- myPair[sample(2,nOld[1], replace = TRUE,prob = c(1-myP,myP) )]
			newSet1 <- which(propZ == myPair[1])
			newSet2 <- which(propZ == myPair[2])
			nNew <- c(length(newSet1),length(newSet2))
			if(nOld[1] == 0){sOld1 <- rep(0,d)}else{sOld1 <- colSums(array(x[set1,],dim = c(nOld[1],d)))}
			if(nOld[2] == 0){sOld2 <- rep(0,d)}else{sOld2 <- colSums(array(x[set2,],dim = c(nOld[2],d)))}
			sOld <- rbind(sOld1,sOld2)
			if(nNew[1] == 0){sNew1 <- rep(0,d)}else{sNew1 <- colSums(array(x[newSet1,],dim = c(nNew[1],d)))}
			if(nNew[2] == 0){sNew2 <- rep(0,d)}else{sNew2 <- colSums(array(x[newSet2,],dim = c(nNew[2],d)))}
			sNew <- rbind(sNew1,sNew2)
			logAR <- log( (1 - birthProbs[K+1])/birthProbs[K] ) + constLGAMMA + lgamma(2*ejectionAlpha + nOld[1]) - lgamma(ejectionAlpha + nNew[1]) - lgamma(ejectionAlpha + nNew[2]) + heat*priorK[K+1] - heat*priorK[K]
			logAR <- logAR + heat*d*( lgamma(alpha + beta + nOld[1]) - lgamma(alpha + beta + nNew[1]) - lgamma(alpha + beta + nNew[2]) )
			logAR <- logAR + heat*sum( 
						  lgamma(alpha + sNew[1,]) + lgamma(beta + nNew[1] - sNew[1,]) 
						+ lgamma(alpha + sNew[2,]) + lgamma(beta + nNew[2] - sNew[2,]) 
						- lgamma(alpha + sOld[1,]) - lgamma(beta + nOld[1] - sOld[1,]) 
					)

#			for(i in 1:2){
#				logAR <- logAR + d*(lgamma(alpha + beta + nOld[i]) - lgamma(alpha + beta + nNew[i]) ) + sum(lgamma(alpha + sNew[i,]) + lgamma(beta + nNew[i] - sNew[i,]) - lgamma(alpha + sOld[i,]) - lgamma(beta + nOld[i] - sOld[i,]))
#			}
			logAR <- logAR + heat*sum(lgamma(gamma[myPair] + nNew)) - heat*sum(lgamma(gamma[myPair[1]] + nOld[1])) + heat*lgamma(sum(gamma[1:(K+1)])) - heat*lgamma(sum(gamma[1:K])) - heat*lgamma(sum(gamma[1:(K+1)]) + n) + heat*lgamma(sum(gamma[1:K]) + n) - heat*lgamma(gamma[K+1]) - heat*d*lbeta(alpha, beta)
		}else{
		# DEATH MOVE
			birth = FALSE
			myPair <- c(sample(K - 1,1),K)
			set1 <- which(z == myPair[1])
			set2 <- which(z == myPair[2])
			nOld <- c(length(set1),length(set2))
			propZ <- z
			propZ[c(set1,set2)] <- rep(myPair[1],sum(nOld))
			newSet1 <- which(propZ == myPair[1])
			nNew <- c(length(newSet1),0)
			ejectionAlpha <- toSolve(seq(0.0001,2,length = 500),nNew[1],pZERO);constLGAMMA <- 2*lgamma(ejectionAlpha) - lgamma(2*ejectionAlpha)
			if(nOld[1] == 0){sOld1 <- rep(0,d)}else{sOld1 <- colSums(array(x[set1,],dim = c(nOld[1],d)))}
			if(nOld[2] == 0){sOld2 <- rep(0,d)}else{sOld2 <- colSums(array(x[set2,],dim = c(nOld[2],d)))}
			sOld <- rbind(sOld1,sOld2)
			if(nNew[1] == 0){sNew1 <- rep(0,d)}else{sNew1 <- colSums(array(x[newSet1,],dim = c(nNew[1],d)))}
			sNew2 <- rep(0,d)
			sNew <- rbind(sNew1,sNew2)
			logAR <- - (log( (1 - birthProbs[K])/birthProbs[K - 1] ) + constLGAMMA + lgamma(2*ejectionAlpha + nNew[1]) - lgamma(ejectionAlpha + nOld[1]) - lgamma(ejectionAlpha + nOld[2]))+ heat*priorK[K - 1] - heat*priorK[K]


			logAR <- logAR + heat*d*( lgamma(alpha + beta + nOld[1]) + lgamma(alpha + beta + nOld[2]) - lgamma(alpha + beta + nNew[1]) )
			logAR <- logAR + heat*sum( 
						  lgamma(alpha + sNew[1,]) + lgamma(beta + nNew[1] - sNew[1,]) 
						- lgamma(alpha + sOld[1,]) - lgamma(beta + nOld[1] - sOld[1,]) 
						- lgamma(alpha + sOld[2,]) - lgamma(beta + nOld[2] - sOld[2,])
					 )


#			for(i in 1:2){
#				logAR <- logAR + d*(lgamma(alpha + beta + nOld[i]) - lgamma(alpha + beta + nNew[i]) ) + sum(lgamma(alpha + sNew[i,]) + lgamma(beta + nNew[i] - sNew[i,]) - lgamma(alpha + sOld[i,]) - lgamma(beta + nOld[i] - sOld[i,]))
#			}
			logAR <- logAR + heat*lgamma(gamma[myPair[1]] + nNew[1]) - heat*sum(lgamma(gamma[myPair] + nOld)) + heat*lgamma(sum(gamma[1:(K-1)])) - heat*lgamma(sum(gamma[1:K])) - heat*lgamma(sum(gamma[1:(K-1)]) + n) + heat*lgamma(sum(gamma[1:K]) + n) + heat*lgamma(gamma[K]) + heat*d*lbeta(alpha, beta)
			
		}
		if(is.finite(logAR)){
		if( log(runif(1)) < logAR ){
			reallocationAcceptanceRatio3 <- reallocationAcceptanceRatio3 + 1 
			z <- propZ
			if(birth == TRUE){K <- K + 1}else{K <- K - 1}
			s <- rep(0,K)
			sx <- array(data = 0, dim = c(K,d))
			for(k in 1:K){
				ind <- which(z == k)
				tmpV <- numeric(n)
				tmpM <- array(data = 0,dim = c(n,d))
				s[k] <- length(ind)
				if(s[k] > 0){
					tmpV[ind] <- rep(1,s[k])
					tmpM[ind,] <- x[ind,]
					sx[k,] <- colSums(array(x[ind,],dim = c(s[k],d)))
				}
				nMatrix[,k] <- rep(s[k],n) - tmpV
				sMatrix[,k,] <- matrix(sx[k,],nrow = n,ncol = d,byrow = TRUE) - tmpM
			}
		}
		}
		}
#		end of update for the number of clusters


		if(mNumber == 'M4'){
#	reallocation proposal from conditional probs

			if(K > 1){
			myPair <- sample(K,2,replace = FALSE)
			propZ <- z
			set1 <- which(z == myPair[1])
			set2 <- which(z == myPair[2])
			union12 <- c(set1,set2)
			processed <- c()
			notProcessed <- setdiff(union12,processed)
			n1New <- n2New <- 0
			s1New <- s2New <- numeric(d)
			n1 <- n2 <- 0
			s1 <- s2 <- numeric(d)
			j1 <- myPair[1]
			j2 <- myPair[2]
			alreadyInJ1 <- alreadyInJ2 <- c()
			proposalRatio <- 0
			checkCondition <- TRUE
			while ( length(notProcessed) > 0 ){
				i <- notProcessed[1]
				processed <- c(processed,i)
				# propose reallocation
				u <- log(gamma[j1] + n1New) - log(gamma[j2] + n2New) + sum( lgamma(alpha + x[i,] + s1New) + lgamma(beta + 1 + n1New - s1New - x[i,]) ) - d*sum(lgamma(alpha+beta+n1New+1)) + sum( lgamma(alpha + s2New) + lgamma(beta + n2New - s2New) ) - d*sum(lgamma(alpha+beta+n2New)) - sum( lgamma(alpha + s1New) + lgamma(beta + n1New - s1New) ) + d*sum(lgamma(alpha+beta+n1New)) - sum( lgamma(alpha + x[i,] + s2New) + lgamma(beta + 1 + n2New - s2New - x[i,]) ) + d*sum(lgamma(alpha+beta+n2New+1))
				u <- exp(u)
				proposalProbabities <- u/(1 + u)
				if( is.finite(proposalProbabities) == FALSE ){checkCondition <- FALSE; proposalProbabities <- 0.5}
				if( runif(1) < proposalProbabities ){ 
					propZ[i] <- j1
					proposalRatio <- proposalRatio - log(proposalProbabities) 
					n1New <- n1New + 1
					s1New <- s1New + x[i,]
				}else{ 
					propZ[i] <- j2
					proposalRatio <- proposalRatio - log(1 - proposalProbabities) 
					n2New <- n2New + 1
					s2New <- s2New + x[i,]
				}
				# compute inverse move
				u <- log(gamma[j1] + n1) - log(gamma[j2] + n2) + sum( lgamma(alpha + x[i,] + s1) + lgamma(beta + 1 + n1 - s1 - x[i,]) ) - d*sum(lgamma(alpha+beta+n1+1)) + sum( lgamma(alpha + s2) + lgamma(beta + n2 - s2) ) - d*sum(lgamma(alpha+beta+n2)) - sum( lgamma(alpha + s1) + lgamma(beta + n1 - s1) ) + d*sum(lgamma(alpha+beta+n1)) - sum( lgamma(alpha + x[i,] + s2) + lgamma(beta + 1 + n2 - s2 - x[i,]) ) + d*sum(lgamma(alpha+beta+n2+1))
				u <- exp(u)
				u <- u/(1 + u)
				if(z[i] == j1){ 
					proposalRatio <- proposalRatio + log(u) 
					n1 <- n1 + 1
					s1 <- s1 + x[i,]
				}else{ 
					proposalRatio <- proposalRatio + log(1 - u) 
					n2 <- n2 + 1
					s2 <- s2 + x[i,]
				}
				
				notProcessed <- setdiff(union12,processed)
			}

			newSet1 <- which(propZ == myPair[1])
			newSet2 <- which(propZ == myPair[2])
			nNew <- c(length(newSet1),length(newSet2))
			nOld <- c(length(set1),length(set2))
			if(nOld[1] == 0){sOld1 <- rep(0,d)}else{sOld1 <- colSums(array(x[set1,],dim = c(nOld[1],d)))}
			if(nOld[2] == 0){sOld2 <- rep(0,d)}else{sOld2 <- colSums(array(x[set2,],dim = c(nOld[2],d)))}
			sOld <- rbind(sOld1,sOld2)
			if(nNew[1] == 0){sNew1 <- rep(0,d)}else{sNew1 <- colSums(array(x[newSet1,],dim = c(nNew[1],d)))}
			if(nNew[2] == 0){sNew2 <- rep(0,d)}else{sNew2 <- colSums(array(x[newSet2,],dim = c(nNew[2],d)))}
			sNew <- rbind(sNew1,sNew2)
			logAR <- proposalRatio
			for (i in 1:2){
				logAR <- logAR + d*(lgamma(alpha + beta + nOld[i]) - lgamma(alpha + beta + nNew[i]) ) + sum(lgamma(alpha + sNew[i,]) + lgamma(beta + nNew[i] - sNew[i,]) - lgamma(alpha + sOld[i,]) - lgamma(beta + nOld[i] - sOld[i,]))
			}
			logAR <- logAR + sum(lgamma(gamma[myPair] + nNew)) - sum(lgamma(gamma[myPair] + nOld))
			if(is.finite(logAR)){ 
			if( (log(runif(1)) < logAR) && (checkCondition == TRUE) ){
				reallocationAcceptanceRatio4 <- reallocationAcceptanceRatio4 + 1 
				z <- propZ
				s <- rep(0,K)
				sx <- array(data = 0, dim = c(K,d))
				for(k in 1:K){
					ind <- which(z == k)
					tmpV <- numeric(n)
					tmpM <- array(data = 0,dim = c(n,d))
					s[k] <- length(ind)
					if(s[k] > 0){
						tmpV[ind] <- rep(1,s[k])
						tmpM[ind,] <- x[ind,]
						sx[k,] <- colSums(array(x[ind,],dim = c(s[k],d)))
					}
					nMatrix[,k] <- rep(s[k],n) - tmpV
					sMatrix[,k,] <- matrix(sx[k,],nrow = n,ncol = d,byrow = TRUE) - tmpM
				}
			}
			}
			}
#	end of reallocation proposal from conditional probs

			}







		if(iter %% thinning == 0){
			kValues <- c(kValues,K)
			if(iter > burn){
				cat(K,"\n",file=conK)
				cat(z,"\n",file=conZ)
				if (heat == 1){ #produce parameter values only for cold chain
					for(k in 1:K){
						myIndex <- which(z == k)
						s[k] <- length(myIndex)
						if(s[k] > 1){
							sx[k,] <- colSums(x[myIndex,])
						}else{
							if(s[k] == 1){
								sx[k,] <- x[myIndex,]
							}else{
								sx[k,] <- rep(0,d)
							}

						}
						theta[k,] <- rbeta(d, shape1 = alpha + sx[k,], shape2 = beta + s[k] - sx[k,])
					}
					# in case of missing values
					if( length(rsX) > 0){
						for(i in rsX){
							na.index <- which(is.na(originalX[i,]) == TRUE)
							x[i, na.index] <- rbinom(n = length(na.index), size = 1, prob = theta[z[i],na.index])
						}
						write.table(x,file = "currentX.txt", quote = FALSE, row.names = FALSE, col.names = FALSE)
					}
					p <- myDirichlet(gamma[1:K] + s[1:K])
					cat(theta,"\n",file=conTheta)
					cat(p,"\n",file=conP)
				}		
			}
		}
		if( printProgress == TRUE){
			if(iter %% (m/100) == 0){
				cat(paste("                             ",100*round(iter/m,3),"% completed. ", 
							100*round(lmm*reallocationAcceptanceRatio/iter,3),"%, ",
							100*round(lmm*reallocationAcceptanceRatio2/iter,3),"%, ",
							100*round(lmm*reallocationAcceptanceRatio4/iter,3),"%, ",
							100*round(lmm*reallocationAcceptanceRatio3/iter,3),"%",
				sep=""),"\n");}
		}
	}
	close(conK)
	close(conTheta)
	close(conP)
	close(conZ)
	cat(paste("Allocation Sampler finished."),"\n")
	cat("\n")
	#if(K < 1){
		if(LS == TRUE){
		kFile <- read.table("K.txt")[,1]
		cat("\n")
		print(table(kFile)/length(kFile))
		K <- as.numeric(names(table(kFile))[order(table(kFile),decreasing=TRUE)[1]])
		cat("\n")
		cat(paste("Most probable model: K = ",K," with P(K = ",K,") = ",max(table(kFile)/length(kFile)),sep=""),"\n")		
		cat("\n")
	if(missing(reorderModels)==TRUE){reorderModels <- 'onlyMAP'}
	if(reorderModels == 'onlyMAP'){kRange <- K}else{
		kRange <- as.numeric(names(table(kFile)/length(kFile)))
	}
	for ( K in kRange ){
		if (K > 1){
			cat(paste("Dealing with Label Switching for K =",K),"\n")
			tt <- read.table("theta.varK.txt")
			index <- which(kFile == K)
			d <- dim(x)[2]
			J <- d + 1
			m <- length(index)
			mcmc <- array(data = NA, dim = c(m,K,J))
			Kmax <- (dim(tt)/d)[2]
			for (j in 1:d){
				for(k in 1:K){
					mcmc[,k,j] <- tt[index,(j-1)*Kmax + k]
				}
			}
			conP = file(p.file,open = "r")
			i <- 0
			j <- 0
			while (length(oneLine <- readLines(conP, n = 1, warn = FALSE)) > 0) {
				i <- i + 1
				if(kFile[i] == K){
					j <- j + 1
					mcmc[j,,J] <- as.numeric(strsplit(oneLine,split = " ")[[1]])
				}
			}
			close(conP)
			allocations <- as.matrix(read.table("z.varK.txt",as.is = TRUE)[index,])
			iter <- 1
			ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,])
			maxLL <- ll
			maxIter <- iter
			for (iter in 1:m){
				ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,])
				if(ll > maxLL){maxLL <- ll;maxIter <- iter;cat(paste("Found new Complete MLE: ", ll,sep=""),"\n")}
			}
			# classification probs
			pMatrix <- array(data = NA, dim = c(m,n,K))
			l <- numeric(K)
			for (iter in 1:m){
				p <- mcmc[iter,,J]
				theta <- array( mcmc[iter,,1:(J-1)],dim = c(K,J-1) )
				for(i in 1:n){
					for(k in 1:K){
						l[k] <- log(p[k]) + sum(x[i,]*log(theta[k,]) + (1-x[i,])*log(1-theta[k,]))
					}
					for(k in 1:K){
						pMatrix[iter,i,k] <- 1/sum(exp(l - l[k]))
						if(is.na(pMatrix[iter,i,k]) == TRUE){pMatrix[iter,i,k] = 0}
					}
				}
				if(iter %% 1000 == 0){cat(paste(" classification probs: ",100*round(iter/m,3),"% completed",sep=""),"\n");}
			}


			if(missing(z.true)==TRUE){
				ls <- label.switching( method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
							zpivot = allocations[maxIter,], z = allocations,K = K, complete = complete.loglikelihood, data = x,
							prapivot = mcmc[maxIter,,], mcmc = mcmc, p = pMatrix)
			}else{
				ls <- label.switching( method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
							zpivot = allocations[maxIter,], z = allocations,K = K, complete = complete.loglikelihood, data = x,
							prapivot = mcmc[maxIter,,], mcmc = mcmc, p = pMatrix,groundTruth = z.true)
			}
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-ECR.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR-ITERATIVE-1")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-ECR-ITERATIVE1.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"STEPHENS")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-STEPHENS.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			write.table(mcmc, file = paste("rawMCMC.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			write.table(file = paste("reorderedSingleBestClusterings.mapK.",K,".txt",sep=""),t(ls$clusters[c(1,2,3),]),row.names = paste("z",1:n,sep="."))

			#reordering allocations
			allocationsECR <- allocationsKL <- allocationsECR.ITERATIVE1 <- allocations
			for (i in 1:m){
				myPerm <- order(ls$permutations$"ECR"[i,])
				allocationsECR[i,] <- myPerm[allocations[i,]]
				myPerm <- order(ls$permutations$"STEPHENS"[i,])
				allocationsKL[i,] <- myPerm[allocations[i,]]
				myPerm <- order(ls$permutations$"ECR-ITERATIVE-1"[i,])
				allocationsECR.ITERATIVE1[i,] <- myPerm[allocations[i,]]

			}
			write.table(allocationsECR, file = paste("z.ECR.mapK.",K,".txt",sep=""))
			write.table(allocationsKL, file = paste("z.KL.mapK.",K,".txt",sep=""))
			write.table(allocationsECR.ITERATIVE1, file = paste("z.ECR-ITERATIVE1.mapK.",K,".txt",sep=""))
			#file.remove("p.collapsed.txt")
			#file.remove("theta.collapsed.txt")
			cat(paste0("raw MCMC parameters for most probable K written to: \'rawMCMC.mapK.",K,".txt\' "),"\n")
			cat(paste0("raw MCMC latent allocations for most probable K written to: \'z.mapK.",K,".txt\' "),"\n")
			cat(paste0("reordered MCMC output written to: "),"\n")
			cat(paste0("     (Method 1):     \'reorderedMCMC-ECR.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 2):     \'reorderedMCMC-ECR-ITERATIVE1.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 3):     \'reorderedMCMC-STEPHENS.mapK.",K,".txt\'"),"\n")
			cat(paste0("reordered single best clusterings written to: \'reorderedSingleBestClusterings.mapK.",K,".txt\' "),"\n")
			cat(paste0("reordered MCMC latent allocations for most probable K written to: "),"\n")
			cat(paste0("     (Method 1):     \'z.ECR.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 2):     \'z.KL.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 3):     \'z.ECR-ITERATIVE1.mapK.",K,".txt\'"),"\n")

		}

	}
	}
	setwd("../")
	cat(paste0("back to working directory now."),"\n")
	return(kValues)
}

coupledMetropolis <- function(Kmax, nChains,heats,binaryData,outPrefix,ClusterPrior,m, alpha, beta, gamma, z.true, ejectionAlpha, burn){
	if(missing(nChains) == TRUE){stop(cat(paste("    [ERROR]: number of chains not provided."), "\n"))}
	if(missing(heats) == TRUE){
		heats <- seq(1,0.1,length = nChains)
		}else{
		if(heats[1] != 1){stop(cat(paste("    [ERROR]: `heats[1]` should be equal to one."), "\n"))}
	}
	if(length(heats) != nChains){
		stop(cat(paste("    [ERROR]: `length(heats)` should be equal to `nChains`."), "\n"))
	}
	if(missing(ClusterPrior) == TRUE){ClusterPrior <- 'poisson'}
	if (missing(alpha)) {alpha <- 1}
	if (missing(beta)) {beta <- 1}
	if (missing(binaryData)) {stop(cat(paste("    [ERROR]: data is missing."), "\n"))}
	if (missing(gamma)) {gamma <- rep(1,Kmax)}
	if (length(table(gamma)) > 1){
		stop(cat(paste("    [ERROR]: Dirichlet prior parameters should be the same."), "\n"))
	}
	d <- dim(binaryData)[2]; n <- dim(binaryData)[1]; priorK <- numeric(Kmax)
	if(ClusterPrior == "uniform"){
		priorK <- rep(log(1/Kmax),Kmax)
	}
	if(ClusterPrior == "poisson"){
		denom <- log(ppois(Kmax, lambda = 1, lower.tail = TRUE) - dpois(0,lambda = 1))
		for (k in 1:Kmax){
			priorK[k] <- dpois(k,lambda = 1, log = TRUE) - denom 
		}
	}
	if(missing(ejectionAlpha) == TRUE){ejectionAlpha <- 0.2}
	x <- binaryData
	rsX <- which(is.na(rowSums(x)) == TRUE)
	originalX <- x
	if(length(rsX) > 0){
		cat(paste("    [NOTE]: Found ",length(rsX) ," rows with missing values."), "\n")
		for(i in rsX){
			na.index <- which(is.na(x[i,]) == TRUE)
			x[i,na.index] <- rbinom(n = length(na.index), size = 1, prob = alpha/(alpha + beta))
		}
	}

	currentZ <- array(data = NA, dim = c(nChains,n))
	currentK <- numeric(nChains)
	# check if dir exists and stop in this case
	myCheck <- match(outPrefix,list.files())
	if(is.na(myCheck) == FALSE){
		stop(cat(paste("    [ERROR]: directory exists, please provide different name to outPrefix."), "\n"))
	}
	if( missing(z.true) ){
		z.true <- NULL
	}
	if(missing(burn)){burn = 0}
	if(burn > m - 1){
		stop(cat(paste("    [ERROR]: Burn-in period not valid: \'burn\' should be less than \'m\'."), "\n"))
	}
	

	if(nChains < 2){
		if(length(rsX) > 0){
			stop(cat(paste("    [ERROR]: At least two chains should be used."), "\n"))}
		cat(paste("            Only 1 chain? Well."),"\n")
		dir.create(outPrefix)
		myHeat <- 1
		asr <- allocationSamplerBinMix( alpha = alpha, beta = beta, gamma = gamma, m = 10*m, burn= 10*burn, data = x, 
					thinning = 10,Kmax = Kmax, ClusterPrior = ClusterPrior,ejectionAlpha = ejectionAlpha, 
					outputDir = outPrefix,Kstart = 1,heat=myHeat,metropolisMoves = c('M1','M2','M3','M4'),LS = FALSE, rsX = rsX, originalX = originalX)}
	else{

		registerDoParallel(cores = nChains)
		#registerDoMC(nChains)
		outputDirs <- paste0(outPrefix,1:nChains)
		temperatures <- heats
		myChain <- 1
		for(i in 1:nChains){
			cat(paste0("            Create temporary directory: \'",outPrefix,i,"\'."), "\n")
		}
		cat(paste0("    [NOTE]: screen output from multiple threads is redirected to \'",outPrefix,"-sampler.log\'."), "\n")
		sink(paste0(outPrefix,'-sampler.log'))
		foreach(myChain=1:nChains, .export=ls(envir=globalenv()) ) %dopar% {
			outDir <- outputDirs[myChain]
			dir.create(outDir)
			myHeat <- temperatures[myChain]
			asr <- allocationSamplerBinMix( alpha = alpha, beta = beta, gamma = gamma, m = 10, burn= 9, data = x, 
						thinning = 1,Kmax = Kmax, ClusterPrior = ClusterPrior,ejectionAlpha = ejectionAlpha, 
						outputDir = outDir,Kstart=1,heat=myHeat,metropolisMoves='M3',LS = FALSE, rsX = rsX, originalX = originalX)
		}

		ITERATIONS <- m
		sampledK <- array(data = 0, dim = c(ITERATIONS,nChains))
		dir.create(outPrefix)
		k.file <- paste0(outPrefix,"/K.txt")
		theta.file <- paste0(outPrefix,"/theta.varK.txt")
		z.file <- paste0(outPrefix,"/z.varK.txt")
		p.file <- paste0(outPrefix,"/p.varK.txt")
		x.file <- paste0(outPrefix,"/x.txt")
		conK = file(k.file,open = "w")
		conTheta = file(theta.file,open = "w")
		conZ = file(z.file,open = "w")
		conP = file(p.file,open = "w")
		if(length(rsX) > 0){
			# in case of missing values, the augmented data will be written to the file:
			conX <- file(x.file, open = "w")	
		}

		ar <- 0
		metMoves <- vector('list',length = nChains)
		metMoves[[1]] <- c('M1','M2','M3','M4')
		for(j in 2:nChains){metMoves[[j]] <- c('M2','M3')}
		localAR <- 0	#every 10 iterations
		for(iter in 1:ITERATIONS){
			if(length(rsX) > 0){
				x <- as.matrix(read.table(paste0(outPrefix,1,'/currentX.txt')))
			}

			for(myChain in 1:nChains){
				currentZ[myChain,] <- as.numeric(read.table(paste0(outPrefix,myChain,'/z.varK.txt'))[1,])
				currentK[myChain] <- read.table(paste0(outPrefix,myChain,'/K.txt'))[1,]
			}
			sampledK[iter,] <- currentK
			myPair <- sample(nChains,2,replace = FALSE)
			j1 <- myPair[1]
			j2 <- myPair[2]
			z1 <- currentZ[j1,]
			z2 <- currentZ[j2,]
			K1 <- currentK[j1]
			K2 <- currentK[j2]

			s1 <- rep(0,K1)
			sx1 <- array(data = 0, dim = c(K1,d))
			for(k in 1:K1){
				ind <- which(z1 == k)
				s1[k] <- length(ind)
				if(s1[k] > 0){
					sx1[k,] <- colSums(array(x[ind,],dim = c(s1[k],d)))
				}
			}
			s2 <- rep(0,K2)
			sx2 <- array(data = 0, dim = c(K2,d))
			for(k in 1:K2){
				ind <- which(z2 == k)
				s2[k] <- length(ind)
				if(s2[k] > 0){
					sx2[k,] <- colSums(array(x[ind,],dim = c(s2[k],d)))
				}
			}
			#compute log-posterior for 1st
			log.posterior <- priorK[K1] + sum(lgamma( gamma[1:K1] + s1 )) - d*sum(lgamma(alpha+beta+s1)) - lgamma(n + sum(gamma[1:K1]))
			for(k in 1:K1){
				log.posterior <- log.posterior + sum(lgamma(alpha + sx1[k,]) + lgamma(beta + s1[k] - sx1[k,]))
			}
			#prior constants1:
			log.posterior <- log.posterior + lgamma(sum(gamma[1:K1])) - sum(lgamma(gamma[1:K1])) - K1*d*lbeta(alpha, beta)
			logAR <- (temperatures[j2] - temperatures[j1])*log.posterior
			#compute log-posterior for 2nd
			log.posterior <- priorK[K2] + sum(lgamma( gamma[1:K2] + s2 )) - d*sum(lgamma(alpha+beta+s2)) - lgamma(n + sum(gamma[1:K2]))
			for(k in 1:K2){
				log.posterior <- log.posterior + sum(lgamma(alpha + sx2[k,]) + lgamma(beta + s2[k] - sx2[k,]))
			}
			#prior constants2:
			log.posterior <- log.posterior + lgamma(sum(gamma[1:K2])) - sum(lgamma(gamma[1:K2])) - K2*d*lbeta(alpha, beta)
			logAR <- logAR + (temperatures[j1] - temperatures[j2])*log.posterior
			#write(paste0('logAR = ',logAR),stderr())
			#cat(paste('logAR =',logAR),'\n')
			if( log(runif(1)) < logAR ){
				ar <- ar + 1
				localAR <- localAR + 1
				currentZ[j1,] <- z2
				currentZ[j2,] <- z1
				currentK[j1] <- K2
				currentK[j2] <- K1
				#cat(paste('switching.'),'\n')
			}
			myChain <- 1
			foreach(myChain=1:nChains, .export=ls(envir=globalenv()) ) %dopar% {
				outDir <- outputDirs[myChain]
				myHeat <- temperatures[myChain]
				Kstart <- currentK[myChain]
				zStart <- currentZ[myChain,]
				allocationSamplerBinMix( alpha = alpha, beta = beta, gamma = gamma, m = 10, burn= 9, data = x, 
							thinning = 1,Kmax = Kmax, ClusterPrior = ClusterPrior,ejectionAlpha = ejectionAlpha, 
							outputDir = outDir,Kstart=Kstart,zStart = zStart, heat=myHeat,
							metropolisMoves =  metMoves[[myChain]],LS = FALSE, rsX = rsX, originalX = originalX)
			}

			if(iter %% (m/100) == 0){
				matplot(sampledK[1:iter,],type = "l",lty = 1,lwd = 2, col = topo.colors(nChains))
				points(sampledK[1:iter,1], type = "b",col = topo.colors(nChains)[1])
				legend('topleft',paste0('f(z,K|data)^{',round(heats,3),'}'),lty = 1, lwd = 2, col = topo.colors(nChains))
				write(paste0(100*iter/m,'% completed. Chain switching acceptance rate: ',100*round(ar/iter,3),'%.'),stderr())
			}
			if(iter > burn){
				kk <- as.numeric(read.table(paste0(outPrefix,"1/K.txt"))[1,])
				cat(kk,"\n",file=conK)
				theta <- as.numeric(read.table(paste0(outPrefix,"1/theta.varK.txt"))[1,])
				cat(theta,"\n",file=conTheta)
				z <- as.numeric(read.table(paste0(outPrefix,"1/z.varK.txt"))[1,])
				cat(z,"\n",file=conZ)
				p <- as.numeric(read.table(paste0(outPrefix,"1/p.varK.txt"))[1,])
				cat(p,"\n",file=conP)
				if(length(rsX) > 0){cat(x,"\n",file=conX)}
			}
	
		}
		close(conK)
		close(conTheta)
		close(conP)
		close(conZ)
		if(nChains > 1){
			swapAcceptanceRate <- 100*round(ar/iter,3)
		}else{ swapAcceptanceRate <- 'NA' }
		if(length(rsX) > 0){
			close(conX)
		}
		write.table(sampledK, file = paste0(outPrefix,"/K.allChains.txt"), col.names = paste0('chain.',1:nChains),quote=FALSE,row.names = FALSE)
		for(k in 1:nChains){
			unlink(paste0(outPrefix,k), recursive=TRUE)
		}
		sink()
		stopImplicitCluster()
	}
	if(length(rsX) == 0){
		# x contains no missing values
		if(is.null(z.true) == TRUE){
			dealWithLabelSwitching(outDir = outPrefix, binaryData = binaryData)
		}else{
			dealWithLabelSwitching(outDir = outPrefix, binaryData = binaryData, z.true = z.true)
		}
	}else{
		# x contains missing values
		if(is.null(z.true) == TRUE){
			dealWithLabelSwitchingMissing(outDir = outPrefix, binaryData = binaryData)
		}else{
			dealWithLabelSwitchingMissing(outDir = outPrefix, binaryData = binaryData, z.true = z.true)
		}
	}

	# returning mcmc objects from coda package for the most probable number of clusters
	if(nChains > 1){
		kFile <- sampledK[(burn+1):ITERATIONS,1]
	}else{
		kFile <- read.table(paste0(outPrefix,"/K.txt"))
		ITERATIONS <- m
		swapAcceptanceRate <- 0
	}
	K <- as.numeric(names(table(kFile))[order(table(kFile),decreasing=TRUE)[1]])
	K.mcmc <- mcmc(kFile, start = 10*burn + 10, end = 10*ITERATIONS, thin = 10)
	if( K > 1 ){
		parameters.ecr.mcmc <- read.table(paste0(outPrefix,"/reorderedMCMC-ECR.mapK.",K,".txt"), header = TRUE)
		allocations.ecr.mcmc <- read.table(paste0(outPrefix,"/z.ECR.mapK.",K,".txt"), header = TRUE)
		clusterMembershipPerMethod <- read.table(paste0(outPrefix,"/reorderedSingleBestClusterings.mapK.",K,".txt"), header = TRUE)
		classificationProbabilities.ecr <- read.csv(paste0(outPrefix,"/classificationProbabilities.mapK.",K,".csv"))
	}else{
		parameters.ecr.mcmc <- read.table(paste0(outPrefix,"/MCMC.mapK.",K,".txt"), header = TRUE)
		allocations.ecr.mcmc <- rep(1, dim(parameters.ecr.mcmc)[1] )
		classificationProbabilities.ecr <- array(data = 1, dim = c(n,1))
		clusterMembershipPerMethod <- array(data = 1, dim = c(n,3)) 
		colnames(clusterMembershipPerMethod) <- c('ECR','STEPHENS','ECR-ITERATIVE-1')
	}
	parameters.ecr.mcmc <- mcmc( parameters.ecr.mcmc )
	allocations.ecr.mcmc <- mcmc( allocations.ecr.mcmc )
	colnames(classificationProbabilities.ecr) <- paste('cluster',1:K)
	bbm.output <- vector('list', length = 7)
	bbm.output[[1]] <- K.mcmc
	bbm.output[[2]] <- parameters.ecr.mcmc
	bbm.output[[3]] <- allocations.ecr.mcmc
	bbm.output[[4]] <- classificationProbabilities.ecr
	bbm.output[[5]] <- clusterMembershipPerMethod
	if(nChains > 1){
		sampledK <- array(sampledK, dim = c(ITERATIONS, nChains))
		colnames(sampledK) <- paste0("chain.", 1:nChains) 
		colnames(sampledK)[1] <- paste0(colnames(sampledK)[1],"_(target)")
	}else{
		sampledK <- asr
		write.table(sampledK, file = paste0(outPrefix,"/K.allChains.txt"), 
			col.names = 'chain.1',quote=FALSE,row.names = FALSE)
	}
	bbm.output[[6]] <- sampledK
	bbm.output[[7]] <- c(nChains, swapAcceptanceRate, m, burn)
	names(bbm.output) <- c('K.mcmc', 'parameters.ecr.mcmc', 'allocations.ecr.mcmc', 'classificationProbabilities.ecr', 'clusterMembershipPerMethod', 'K.allChains', 'chainInfo')
	class(bbm.output) <- c('list', 'bbm.object')
	return(bbm.output)
}



dealWithLabelSwitching <- function(outDir,reorderModels, binaryData,z.true){
	setwd(outDir)
	x <- binaryData
	kFile <- read.table("K.txt")[,1]
	theta.file <- "theta.varK.txt"
	z.file <- "z.varK.txt"
	p.file <- "p.varK.txt"
	cat("\n")
	print(table(kFile)/length(kFile))
	K <- as.numeric(names(table(kFile))[order(table(kFile),decreasing=TRUE)[1]])
	cat("\n")
	cat(paste("Most probable model: K = ",K," with P(K = ",K,") = ",max(table(kFile)/length(kFile)),sep=""),"\n")		
	cat("\n")
	if(missing(reorderModels)==TRUE){reorderModels <- 'onlyMAP'}
	if(reorderModels == 'onlyMAP'){kRange <- K}else{
		kRange <- as.numeric(names(table(kFile)/length(kFile)))
	}
	for ( K in kRange ){

		tt <- read.table("theta.varK.txt")
		index <- which(kFile == K)
		d <- dim(x)[2]
		n <- dim(x)[1]
		J <- d + 1
		m <- length(index)
		mcmc <- array(data = NA, dim = c(m,K,J))
		Kmax <- (dim(tt)/d)[2]
		for (j in 1:d){
			for(k in 1:K){
				mcmc[,k,j] <- tt[index,(j-1)*Kmax + k]
			}
		}
		conP = file(p.file,open = "r")
		i <- 0
		j <- 0
		while (length(oneLine <- readLines(conP, n = 1, warn = FALSE)) > 0) {
			i <- i + 1
			if(kFile[i] == K){
				j <- j + 1
				mcmc[j,,J] <- as.numeric(strsplit(oneLine,split = " ")[[1]])
			}
		}
		close(conP)
		if (K > 1){
			cat(paste("Dealing with Label Switching for K =",K),"\n")
			allocations <- as.matrix(read.table("z.varK.txt",as.is = TRUE)[index,])
			iter <- 1
			ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,])
			maxLL <- ll
			maxIter <- iter
			for (iter in 1:m){
				ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,])
				if(ll > maxLL){maxLL <- ll;maxIter <- iter;cat(paste("Found new Complete MLE: ", ll,sep=""),"\n")}
			}
			# classification probs
			ptm <- proc.time()
			pMatrix <- array(data = NA, dim = c(m,n,K))
			l <- array(data = 0, dim = c(n,K))
			for (iter in 1:m){
				LOG.P <- log(mcmc[iter,,J])
				LOG.THETA <- array(log(mcmc[iter,,1:(J-1)]),dim = c(K,J-1) )
				LOG.1_MINUS_THETA <- array(log(1 - mcmc[iter,,1:(J-1)]),dim = c(K,J-1) )
					for(k in 1:K){
						l[,k] <- LOG.P[k] + rowSums( x * matrix(LOG.THETA[k,], nrow = n, ncol = J - 1, byrow = TRUE) + (1-x)*matrix(LOG.1_MINUS_THETA[k,], nrow = n, ncol = J - 1, byrow = TRUE))
					}
					for(k in 1:K){
						pMatrix[iter,,k] <- apply(l,1,function(y){return(1/sum(exp(y - y[k])))} )
						ind <- which(is.na(pMatrix[iter,,k]) == TRUE) 
						nInd <- length(ind)
						if(nInd > 0){pMatrix[iter,ind,k] <- rep(0,nInd)}
					}
				
				if(iter %% 1000 == 0){cat(paste(" classification probs: ",100*round(iter/m,3),"% completed",sep=""),"\n");}
			}

			cat(paste0("proc.time for classification probabilities: ", round(as.numeric((proc.time() - ptm)[3]),2)),"\n")
			if(missing(z.true)==TRUE){
				ls <- label.switching( method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
							zpivot = allocations[maxIter,], z = allocations,K = K, complete = complete.loglikelihood, data = x,
							prapivot = mcmc[maxIter,,], mcmc = mcmc, p = pMatrix)
			}else{
				ls <- label.switching( method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
							zpivot = allocations[maxIter,], z = allocations,K = K, complete = complete.loglikelihood, data = x,
							prapivot = mcmc[maxIter,,], mcmc = mcmc, p = pMatrix,groundTruth = z.true)
			}
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-ECR.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR-ITERATIVE-1")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-ECR-ITERATIVE1.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"STEPHENS")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-STEPHENS.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			write.table(mcmc, file = paste("rawMCMC.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			write.table(file = paste("reorderedSingleBestClusterings.mapK.",K,".txt",sep=""),t(ls$clusters[c(1,2,3),]),row.names = paste("z",1:n,sep="."))

			#reordering allocations 
			allocationsECR <- allocationsKL <- allocationsECR.ITERATIVE1 <- allocations
			for (i in 1:m){
				myPerm <- order(ls$permutations$"ECR"[i,])
				allocationsECR[i,] <- myPerm[allocations[i,]]
				myPerm <- order(ls$permutations$"STEPHENS"[i,])
				allocationsKL[i,] <- myPerm[allocations[i,]]
				myPerm <- order(ls$permutations$"ECR-ITERATIVE-1"[i,])
				allocationsECR.ITERATIVE1[i,] <- myPerm[allocations[i,]]

			}
			MeanReorderedpMatrix <- array(data = 0, dim = c(n,K))    # define object that will contain the classification probs
			for (i in 1:m){
				myPerm <- ls$permutations$"ECR"[i,]   # this is the permutation of labels for iteration i according to ECR algorithm
				MeanReorderedpMatrix <- MeanReorderedpMatrix + pMatrix[i, ,myPerm]   # apply myPerm to the columns of pMatrix for given iteration and add the permuted matrix to MeanReorderedpMatrix
			}
			MeanReorderedpMatrix <- MeanReorderedpMatrix/m    # this is the final estimate of classification probabilities. 
			write.csv(MeanReorderedpMatrix, file = paste0("classificationProbabilities.mapK.",K,".csv"), row.names = FALSE)


			write.table(allocationsECR, file = paste("z.ECR.mapK.",K,".txt",sep=""))
			write.table(allocationsKL, file = paste("z.KL.mapK.",K,".txt",sep=""))
			write.table(allocationsECR.ITERATIVE1, file = paste("z.ECR-ITERATIVE1.mapK.",K,".txt",sep=""))
			#file.remove("p.collapsed.txt")
			#file.remove("theta.collapsed.txt")
			cat(paste0("raw MCMC parameters for most probable K written to: \'rawMCMC.mapK.",K,".txt\' "),"\n")
			cat(paste0("raw MCMC latent allocations for most probable K written to: \'z.mapK.",K,".txt\' "),"\n")
			cat(paste0("reordered MCMC output written to: "),"\n")
			cat(paste0("     (Method 1):     \'reorderedMCMC-ECR.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 2):     \'reorderedMCMC-ECR-ITERATIVE1.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 3):     \'reorderedMCMC-STEPHENS.mapK.",K,".txt\'"),"\n")
			cat(paste0("reordered single best clusterings written to: \'reorderedSingleBestClusterings.mapK.",K,".txt\' "),"\n")
			cat(paste0("reordered MCMC latent allocations for most probable K written to: "),"\n")
			cat(paste0("     (Method 1):     \'z.ECR.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 2):     \'z.KL.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 3):     \'z.ECR-ITERATIVE1.mapK.",K,".txt\'"),"\n")

		}else{
			cat(paste0('[NOTE]:    Most probable model corresponds to 1 cluster so the label-switching algorithms are not applied.',"\n"))
			write.table(mcmc, file = paste("MCMC.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			cat(paste0("MCMC output corresponding to most probable model (K = 1) written to: \'", paste("MCMC.mapK.",K,".txt",sep=""),"\'"),"\n")


		}

	}
	setwd("../")

}



dealWithLabelSwitchingMissing <- function(outDir,reorderModels, binaryData, z.true){
	setwd(outDir)
	x <- binaryData
	d <- dim(x)[2]
	n <- dim(x)[1]

	x.file <- "x.txt"
	kFile <- read.table("K.txt")[,1]
	theta.file <- "theta.varK.txt"
	z.file <- "z.varK.txt"
	p.file <- "p.varK.txt"
	cat("\n")
	print(table(kFile)/length(kFile))
	K <- as.numeric(names(table(kFile))[order(table(kFile),decreasing=TRUE)[1]])
	cat("\n")
	cat(paste("Most probable model: K = ",K," with P(K = ",K,") = ",max(table(kFile)/length(kFile)),sep=""),"\n")		
	cat("\n")
	if(missing(reorderModels)==TRUE){reorderModels <- 'onlyMAP'}
	if(reorderModels == 'onlyMAP'){kRange <- K}else{
		kRange <- as.numeric(names(table(kFile)/length(kFile)))
	}
	for ( K in kRange ){
		tt <- read.table("theta.varK.txt")
		index <- which(kFile == K)
		J <- d + 1
		m <- length(index)
		mcmc <- array(data = NA, dim = c(m,K,J))
		Kmax <- (dim(tt)/d)[2]
		for (j in 1:d){
			for(k in 1:K){
				mcmc[,k,j] <- tt[index,(j-1)*Kmax + k]
			}
		}
		conP = file(p.file,open = "r")
		i <- 0
		j <- 0
		while (length(oneLine <- readLines(conP, n = 1, warn = FALSE)) > 0) {
			i <- i + 1
			if(kFile[i] == K){
				j <- j + 1
				mcmc[j,,J] <- as.numeric(strsplit(oneLine,split = " ")[[1]])
			}
		}
		close(conP)
		if (K > 1){
			cat(paste("Dealing with Label Switching for K =",K),"\n")
			conX <- file(x.file, open = "r")
			allocations <- as.matrix(read.table("z.varK.txt",as.is = TRUE)[index,])
			pMatrix <- array(data = NA, dim = c(m,n,K))
			l <- array(data = 0, dim = c(n,K))
			ptm <- proc.time()
			iter <- 0	
			xEstimated <- array(data = 0, dim = c(n,d))		
			for(xLine in 1:length(kFile)){
				xC <- readLines(conX, n = 1, warn = FALSE)
				if( is.na(match(xLine,index)) == FALSE){
					x <- as.numeric(strsplit(xC,split = " ")[[1]])
					x <- matrix(x,nrow = n, ncol = d)
					xEstimated <- xEstimated + x
					iter <- iter + 1
#					cat(paste0("line = ",xLine, ", index = ",iter, ", rsX = ", sum(x)),"\n")
					# finding MLE
					ll <- complete.loglikelihood(x,allocations[iter,],mcmc[iter,,]) 
					if(iter == 1){ maxLL <- ll; maxIter <- iter }
					if(ll > maxLL){maxLL <- ll;maxIter <- iter;cat(paste("Found new Complete MLE: ", ll,sep=""),"\n")}
					# classification probs
					LOG.P <- log(mcmc[iter,,J])
					LOG.THETA <- array(log(mcmc[iter,,1:(J-1)]),dim = c(K,J-1) )
					LOG.1_MINUS_THETA <- array(log(1 - mcmc[iter,,1:(J-1)]),dim = c(K,J-1) )
					for(k in 1:K){
						l[,k] <- LOG.P[k] + rowSums( x * matrix(LOG.THETA[k,], nrow = n, ncol = J - 1, byrow = TRUE) + (1-x)*matrix(LOG.1_MINUS_THETA[k,], nrow = n, ncol = J - 1, byrow = TRUE))
					}
					for(k in 1:K){
						pMatrix[iter,,k] <- apply(l,1,function(y){return(1/sum(exp(y - y[k])))} )
						ind <- which(is.na(pMatrix[iter,,k]) == TRUE) 
						nInd <- length(ind)
						if(nInd > 0){pMatrix[iter,ind,k] <- rep(0,nInd)}
					}
					if(iter %% 100 == 0){cat(paste(" classification probs: ",100*round(iter/m,3),"% completed",sep=""),"\n");}

				}
			}
			xEstimated <- xEstimated/iter
			write.table(file = "xEstimated.txt", xEstimated, quote = FALSE)
			close(conX)
			cat(paste0("proc.time for classification probabilities: ", round(as.numeric((proc.time() - ptm)[3]),2)),"\n")
			cat(paste0("estimated missing data file written to: \'xEstimated.txt\'"),"\n")
			if(missing(z.true)==TRUE){
				ls <- label.switching( method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
							zpivot = allocations[maxIter,], z = allocations,K = K, complete = complete.loglikelihood, data = x,
							prapivot = mcmc[maxIter,,], mcmc = mcmc, p = pMatrix)
			}else{
				ls <- label.switching( method = c("STEPHENS","ECR","ECR-ITERATIVE-1"),
							zpivot = allocations[maxIter,], z = allocations,K = K, complete = complete.loglikelihood, data = x,
							prapivot = mcmc[maxIter,,], mcmc = mcmc, p = pMatrix,groundTruth = z.true)
			}
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-ECR.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"ECR-ITERATIVE-1")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-ECR-ITERATIVE1.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			reordered.mcmc<-permute.mcmc(mcmc,ls$permutations$"STEPHENS")$output
			write.table(reordered.mcmc, file = paste("reorderedMCMC-STEPHENS.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			write.table(mcmc, file = paste("rawMCMC.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			write.table(file = paste("reorderedSingleBestClusterings.mapK.",K,".txt",sep=""),t(ls$clusters[c(1,2,3),]),row.names = paste("z",1:n,sep="."))

			#reordering allocations 
			allocationsECR <- allocationsKL <- allocationsECR.ITERATIVE1 <- allocations
			for (i in 1:m){
				myPerm <- order(ls$permutations$"ECR"[i,])
				allocationsECR[i,] <- myPerm[allocations[i,]]
				myPerm <- order(ls$permutations$"STEPHENS"[i,])
				allocationsKL[i,] <- myPerm[allocations[i,]]
				myPerm <- order(ls$permutations$"ECR-ITERATIVE-1"[i,])
				allocationsECR.ITERATIVE1[i,] <- myPerm[allocations[i,]]

			}
			MeanReorderedpMatrix <- array(data = 0, dim = c(n,K))    # define object that will contain the classification probs
			for (i in 1:m){
				myPerm <- ls$permutations$"ECR"[i,]   # this is the permutation of labels for iteration i according to ECR algorithm
				MeanReorderedpMatrix <- MeanReorderedpMatrix + pMatrix[i, ,myPerm]   # apply myPerm to the columns of pMatrix for given iteration and add the permuted matrix to MeanReorderedpMatrix
			}
			MeanReorderedpMatrix <- MeanReorderedpMatrix/m    # this is the final estimate of classification probabilities. 
			write.csv(MeanReorderedpMatrix, file = paste0("classificationProbabilities.mapK.",K,".csv"), row.names = FALSE)


			write.table(allocationsECR, file = paste("z.ECR.mapK.",K,".txt",sep=""))
			write.table(allocationsKL, file = paste("z.KL.mapK.",K,".txt",sep=""))
			write.table(allocationsECR.ITERATIVE1, file = paste("z.ECR-ITERATIVE1.mapK.",K,".txt",sep=""))
			#file.remove("p.collapsed.txt")
			#file.remove("theta.collapsed.txt")
			cat(paste0("raw MCMC parameters for most probable K written to: \'rawMCMC.mapK.",K,".txt\' "),"\n")
			cat(paste0("raw MCMC latent allocations for most probable K written to: \'z.mapK.",K,".txt\' "),"\n")
			cat(paste0("reordered MCMC output written to: "),"\n")
			cat(paste0("     (Method 1):     \'reorderedMCMC-ECR.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 2):     \'reorderedMCMC-ECR-ITERATIVE1.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 3):     \'reorderedMCMC-STEPHENS.mapK.",K,".txt\'"),"\n")
			cat(paste0("reordered single best clusterings written to: \'reorderedSingleBestClusterings.mapK.",K,".txt\' "),"\n")
			cat(paste0("reordered MCMC latent allocations for most probable K written to: "),"\n")
			cat(paste0("     (Method 1):     \'z.ECR.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 2):     \'z.KL.mapK.",K,".txt\'"),"\n")
			cat(paste0("     (Method 3):     \'z.ECR-ITERATIVE1.mapK.",K,".txt\'"),"\n")

		}else{
			cat(paste0('[NOTE]:    Most probable model corresponds to 1 cluster so the label-switching algorithms are not applied.',"\n"))
			write.table(mcmc, file = paste("MCMC.mapK.",K,".txt",sep=""),col.names = c(paste(rep(paste(expression(theta),1:K,sep="."),d),rep(1:d,each=K),sep="-"),paste('p',1:K,sep=".")))
			cat(paste0("MCMC output corresponding to most probable model (K = 1) written to: \'", paste("MCMC.mapK.",K,".txt",sep=""),"\'"),"\n")


		}

	}
	setwd("../")

}

#' @export
print.bbm.object <- function(x, printSubset, ...){
	if( missing(printSubset) ){ printSubset = TRUE }
	if( 'bbm.object' %in% class(x) ){
		cat("\n")
		cat(paste0("* Run information:"),"\n")
		cat(paste0("      Number of parallel heated chains: ", x$chainInfo[1]),"\n")
		cat(paste0("      Swap acceptance rate: ", x$chainInfo[2],"%"),"\n")
		cat(paste0("      Total number of iterations: ", x$chainInfo[3]*10),"\n")
		cat(paste0("      Burn-in period: ", x$chainInfo[4]*10),"\n")
		cat(paste0("      Thinning: 10."),"\n")
		kFile <- x$K.mcmc
		cat("\n")
		cat(paste("* Estimated posterior distribution of the number of clusters:"),"\n")
		print(round(table(x$K.mcmc)/length(x$K.mcmc),3))		
		K <- as.numeric(names(table(kFile))[order(table(kFile),decreasing=TRUE)[1]])
		cat("\n")
		cat(paste("* Most probable model: K = ",K," with P(K = ",K,"|data) = ",round(max(table(kFile)/length(kFile)),3),sep=""),"\n")
		cat("\n")
		cat(paste0("* Estimated number of observations per cluster conditionally on K = ", K," (3 label switching algorithms):"),'\n')
		print(apply(x$clusterMembershipPerMethod,2,table))
		d <- (dim(x$parameters.ecr.mcmc)[2] - K)/K
		myMeans <- apply(x$parameters.ecr.mcmc,2,mean)
		cat('\n')
		if(printSubset == TRUE){
			if(d > 5){
				cat(paste0('* Posterior mean of probability of success per feature and cluster (ECR algorithm):'),'\n')
				pr <- c()
				for(k in 1:K){
					subS <- paste0("theta.",k,".",1:d)[1:5]
					pr <- cbind( pr, myMeans[subS])
				}
				colnames(pr) <- paste0("cluster_",1:K)
				rownames(pr) <- paste0("theta_",1:5)
				print(pr)
				cat(paste0('   <+ ',d-5,' more rows>'),'\n')
			}
		}else{
			cat(paste0('* Posterior mean of probability of success per feature and cluster (ECR algorithm):'),'\n')
			pr <- c()
			for(k in 1:K){
				subS <- paste0("theta.",k,".",1:d)
				pr <- cbind( pr, myMeans[subS])
			}
			colnames(pr) <- paste0("cluster_",1:K)
			rownames(pr) <- paste0("theta_",1:d)
			print(pr)			
		}
	}else{
		cat(paste("    The input is not in class `bbm.object`"),'\n')
	}
}

Try the BayesBinMix package in your browser

Any scripts or data that you put into this service are public.

BayesBinMix documentation built on May 2, 2019, 3:26 a.m.