# ordtpx: Estimation of Topic Models with Ordered Features using Multi-resolution analysis

#This is an R port of the original BMSMShrink function by Kolaczyk, with some modifications and improvements


#ash.repodir = scan(".ash.repodir.txt",what=character())
#source(file.path(ash.repodir,"/Rcode/bash.R"))
require(Rcpp)
require(inline)

# Interleave two vectors element by element: x[1], y[1], x[2], y[2], ...
# The inputs are stacked as the two rows of a matrix; reading that matrix
# back in column-major order gives the alternating sequence.
interleave <- function(x, y) {
  stacked <- rbind(x, y)
  as.vector(stacked)
}


# Circular right shift: the last element of x moves to the front and
# every other element moves one position to the right.
rshift <- function(x) {
  last <- length(x)
  c(x[last], x[-last])
}

# Circular left shift: the first element of x moves to the end and
# every other element moves one position to the left.
# An empty input is returned unchanged; indexing x[1] on an empty vector
# would otherwise append a spurious NA.
lshift <- function(x) {
  if (length(x) == 0) {
    return(x)
  }
  c(x[-1], x[1])
}


#The following produces both a TItable,
#and a "parent" table whose pairwise comparisons would be used to create a TI table
#So, for example, in the ith row, elements 1, 2 would be the parents of the
#first element in the (i+1)th row of the TI table
# INPUT: sig, an n vector of Poisson counts at n locations; n must be a
#        power of two (n = 1 is allowed and yields a table with no levels)
# OUTPUT: a list, with elements
# TItable - the usual TI table, (log2(n) + 1) x n, first row equal to sig
# parent - the parent values used to make the TI table, log2(n) x 2n
# An error is raised when n is not a power of two.
ParentTItable <- function(sig) {
  n <- length(sig)
  J <- round(log2(n))
  if (n < 1 || 2^J != n) {
    stop("length(sig) must be a power of two", call. = FALSE)
  }

# Create decomposition table of signal, using pairwise sums,
# keeping just the values that are *not* redundant under the
# shift-invariant scheme.  This is very similar to TI-tables
# in Donoho and Coifman's TI-denoising framework.
  dmat <- matrix(0, nrow = J + 1, ncol = n)
  dmat[1, ] <- sig
  dmat2 <- matrix(0, nrow = J, ncol = 2 * n) #the parent table

  # seq_len() keeps the loop empty when J is 0 (a length-1 signal);
  # 0:(J-1) would count down to -1 instead.
  for (D in seq_len(J) - 1) {
    nD <- 2^(J - D)      # block length at depth D
    twonD <- 2 * nD      # matching block length in the parent table
    odd <- seq(from = 1, to = nD - 1, by = 2)
    even <- odd + 1
    for (l in 0:(2^D - 1)) {
      ind <- (l * nD + 1):((l + 1) * nD)
      ind2 <- (l * twonD + 1):((l + 1) * twonD)
      x <- dmat[D + 1, ind]
      # circular right shift of the block (last element moves to the front)
      rx <- c(x[nD], x[-nD])
      # pairwise sums of the block, followed by those of its shifted copy
      dmat[D + 2, ind] <- c(x[odd] + x[even], rx[odd] + rx[even])
      dmat2[D + 1, ind2] <- c(x, rx)
    }
  }
  list(TItable = dmat, parent = dmat2)
}



#inc <- '#include <cmath>
#        NumericVector rshift(NumericVector x){
#          L=x.size;
#          double xx=x(L);
#          x.erase(L);
#          x.insert(x.begin(),xx);
#          return(x)
#        }
#        NumericVector lshift(NumericVector x){
#          double xx=x(1);
#          x.erase(1);
#          x.insert(x.end(),xx)
#          return(x)
#        }
#        '


#cxxParentTItable
#cxxParentTItable implements ParentTItable in C++, compiled when this file
#is sourced via inline::cxxfunction with the Rcpp plugin
# INPUT: sig, a numeric vector (the body reads it as one NumericVector);
#        its length n is assumed to be a power of two
# OUTPUT: a list with elements TItable ((J+1) x n) and parent (J x 2n),
#         where J = log2(n)
#src is a string containing the C++ code
src <- '
        NumericVector signal=sig;
        int n=(int) signal.size();
        int J=(int) log2((double)n);

        NumericMatrix parent(J,2*n);
        NumericMatrix TItable(J+1,n);
        TItable(0,_) = signal;
        for (int D=0; D<J; D++){
           // nD: block length at depth D; pD: number of blocks at depth D
           int nD=(int) pow(2., (double) (J-D)), pD=(int) pow(2.,(double) D);
           for (int l=0; l<pD; l++){
              // a, b: 1-based first column of block l in TItable and parent
              int a=l*nD+1, b=2*l*nD+1;
              // d holds table entries and must be double: declaring it int
              // truncates non-integer signal values on assignment
              double d;
              // copy the block into parent, and again shifted right by one
              for (int i=0; i<nD-1; i++){
                 d=TItable(D,a+i-1);
                 parent(D,b+i-1)=d;
                 parent(D,b+i+nD)=d;
              }
              //i=nD-1: the last element wraps to the front of the shifted copy
              d=TItable(D,a+nD-2);
              parent(D,b+nD-2)=d;
              parent(D,b+nD-1)=d;

              // next level: sums of adjacent pairs of the parent entries
              for (int i=0; i<nD; i++)
                TItable(D+1,a+i-1)=parent(D,b+2*i-1)+parent(D,b+2*i);
          }
        }
        return(List::create(Named("TItable")=TItable, Named("parent")=parent));
        '
cxxParentTItable <- cxxfunction(signature(sig="numeric"),
                                body=src,
                                plugin="Rcpp",
                                inc="#include <cmath>")


#This function computes the posterior means of the splitting proportion
#for pairs of child counts (x0, x1), elementwise over x0 and x1.
# mode 1: p and q are scalars; p is the weight of the branch whose
#         posterior mean is 0.5 and q is the single beta parameter
#         (p == 1 and p == 0 are handled in closed form)
# mode 2: p and q are equal-length vectors of mixture weights and beta
#         parameters; the result is a ratio of two mixture sums, each
#         evaluated on the log scale with the column maximum subtracted
# Returns a vector with one value per element of x0.
sfunc <- function(p, q, x0, x1, mode) {
  if (mode == 1) {
    total <- x0 + x1
    if (p == 1) {
      ss <- 0.5 * rep(1, length(x0))
    } else if (p == 0) {
      ss <- (x0 + q) / (total + 2 * q)
    } else {
      # Denominator of the first term of the sum.
      log_first <- log(1 - p) - log(p) + (total + 1) * log(2) +
        lbeta(x0 + q, x1 + q) - lbeta(q, q)
      first_den <- 2 + exp(log_first)

      # Denominator of the second term.
      log_second <- log(p) - log(1 - p) + lbeta(q, q) - total * log(2) -
        lbeta(x0 + q + 1, x1 + q)
      second_den <- exp(log_second) + (total + 2 * q) / (x0 + q)

      # Both numerators are 1.
      ss <- (1 / first_den) + (1 / second_den)
    }
  } else if (mode == 2) {
    ones_q <- rep(1, length(q))
    ones_x <- rep(1, length(x0))
    # Expand everything to (components x observations) grids.
    x0_grid <- ones_q %o% x0
    x1_grid <- ones_q %o% x1
    log_w <- log(p %o% ones_x)
    q_grid <- q %o% ones_x

    # Column-wise log(sum(exp(.))) with the column maximum factored out.
    col_logsumexp <- function(logterms) {
      peak <- apply(logterms, 2, max)
      log(colSums(exp(logterms - ones_q %o% peak))) + peak
    }

    log_num <- col_logsumexp(
      log_w + lbeta(x0_grid + q_grid + 1, x1_grid + q_grid) - lbeta(q_grid, q_grid)
    )
    log_den <- col_logsumexp(
      log_w + lbeta(x0_grid + q_grid, x1_grid + q_grid) - lbeta(q_grid, q_grid)
    )
    ss <- exp(log_num - log_den)
  }
  return(ss)
}

#This is similar to reverse.pwave used in cyclespin.smooth
# Rebuilds a shrunken estimate of the signal from a TI table.
# INPUT:
# dmat - TI table with log2(n)+1 rows and n columns (n a power of two)
# pp   - mixture weights per level: a vector indexed by level in mode 1,
#        a matrix with one row per level in mode 2
# qq   - beta parameter(s): a scalar in mode 1, a vector in mode 2
# mode - 1 or 2, passed through to sfunc
# OUTPUT: a vector of length n holding the estimate.
# A table with a single column has no levels to undo and its only row is
# returned as is.
reverse.pp <- function(dmat, pp, qq, mode) {
  n <- dim(dmat)[2]
  J <- round(log2(n))
  if (n < 1 || 2^J != n) {
    stop("dmat must have a power-of-two number of columns", call. = FALSE)
  }
  if (mode == 1) {
    qq <- rep(qq, J)
  } else if (mode == 2) {
    qq <- rep(1, J) %o% qq
  } else {
    stop("mode must be 1 or 2", call. = FALSE)
  }

  # Shrinkage factors at level D for the given left/right child counts.
  shrink_factor <- function(D, left, right) {
    if (mode == 1) {
      sfunc(pp[D], qq[D], left, right, 1)
    } else {
      sfunc(pp[D, ], qq[D, ], left, right, 2)
    }
  }

# Beginning with the total number of counts, working from coarse
# scales (i.e., deep depths) upwards, gradually build up the MSPB
# shrinkage estimate by multiplying by appropriate shrinkage factors
# at each level.
  est <- dmat[J + 1, ]
  # rev(seq_len(J)) is empty when J is 0, whereas J:1 would run D = 0, 1.
  for (D in rev(seq_len(J))) {
    nD <- 2^(J - D + 1)
    nDo2 <- nD / 2
    odd <- seq(1, nD - 1, 2)
    even <- seq(2, nD, 2)
    for (l in 0:(2^(D - 1) - 1)) {
# Set indexing so as to pick off blocks of size 2^(J-D+1)
# when shrinking estimates at depth D+1 down to finer
# scale at depth D.
      ind <- (l * nD + 1):((l + 1) * nD)
      xxD <- dmat[D, ind]
      estvec <- est[ind]

# In the first half of the vector of D+1-depth estimates,
# we can shrink using the D-depth counts in the order
# in which they appear.
      estl <- estvec[1:nDo2]
      ss <- shrink_factor(D, xxD[odd], xxD[even])
      nestl <- interleave(estl * ss, estl * (1 - ss))

# In the second half of the vector of D+1-depth counts,
# we right-shift the D-depth counts, compute the shrunken
# values, and left-shift these values back to the order
# of the above.
      estr <- estvec[(nDo2 + 1):nD]
      sxxD <- rshift(xxD)
      ss <- shrink_factor(D, sxxD[odd], sxxD[even])
      nestr <- lshift(interleave(estr * ss, estr * (1 - ss)))

# Combine the estimates from both halves of the D+1-depth
# counts, and store.
      est[ind] <- 0.5 * (nestl + nestr)
    }
  }
  est
}

#EM algorithm for estimating mixing proportions given TI table,
#parent TI table and beta parameters
# INPUT:
# tit   - TI table, (J+1) x n
# ptit  - parent table, J x 2n; its odd-numbered columns are used as the
#         first-child counts
# qq    - beta parameter: a scalar in mode 1, a vector of K values in mode 2
# mode  - 1: two-component mixture per level (a (1/2)^count term with
#            weight p and a beta term with weight 1-p);
#         2: K-component beta mixture per level
# maxit - maximum number of EM iterations
# tol   - stop once the largest squared change in the per-level
#         log-likelihood is no greater than tol
# OUTPUT: a list with elements
# p   - estimated weights, floored at 1e-8: a length-J vector in mode 1,
#       a J x K matrix in mode 2 (the initial weights if maxit is 0)
# lik - J x iterations matrix of per-level log-likelihoods, NULL if no
#       iteration was run
binash <- function(tit, ptit, qq, mode = 1, maxit = 2000, tol = 1e-5) {
  n <- dim(tit)[2]
  J <- dim(tit)[1] - 1
  # drop = FALSE keeps these as matrices when there is a single level
  # (J == 1); the row-wise code below needs matrix inputs.
  nt <- tit[-1, , drop = FALSE]
  ns <- ptit[, (1:(2 * n)) %% 2 == 1, drop = FALSE]
  nf <- nt - ns
  convcrit <- 10.0
  iter <- 0
  lik <- NULL
  likk <- 0
  if (mode == 1) {
    pip1 <- 0.5 * rep(1, J)
    p <- pip1
    while (convcrit > tol && iter < maxit) {
      lik.old <- likk
      w <- pip1
      # log of the two weighted component terms, one row per level
      pmat0 <- log(w) + nt * log(1 / 2)
      pmat1 <- log(1 - w) + lbeta(ns + qq, nf + qq) - lbeta(qq, qq)
      # subtract the elementwise maximum before exponentiating
      pm <- pmax(pmat0, pmat1)
      pmat0 <- pmat0 - pm
      pmat1 <- pmat1 - pm
      pmat <- exp(pmat0) / (exp(pmat0) + exp(pmat1))
      likk <- rowSums(log(exp(pmat0) + exp(pmat1)) + pm)
      lik <- cbind(lik, likk)
      pip1 <- pmax(rowMeans(pmat), 1e-8)
      p <- pip1
      convcrit <- max((likk - lik.old)^2)
      iter <- iter + 1
    }
  } else if (mode == 2) {
    K <- length(qq)
    pip1 <- 1 / K * matrix(1, nrow = J, ncol = K)
    p <- pip1
    qq <- qq %o% rep(1, n)
    rK <- rep(1, K)
    # per-level K x n tables of log component terms; these do not depend
    # on the weights, so they are computed once
    pmat_i <- lapply(seq_len(J), function(j) {
      lbeta(rK %o% ns[j, ] + qq, rK %o% nf[j, ] + qq) - lbeta(qq, qq)
    })
    while (convcrit > tol && iter < maxit) {
      w <- pip1
      lik.old <- likk
      for (j in seq_len(J)) {
        pp <- w[j, ] %o% rep(1, n)
        pmat <- log(pp) + pmat_i[[j]]
        pm <- apply(pmat, 2, max)
        pmat <- pmat - rK %o% pm
        pip1.norm <- exp(pmat) / (rK %o% colSums(exp(pmat)))
        pip1[j, ] <- rowMeans(pip1.norm)
        likk[j] <- sum(log(colSums(exp(pmat))) + pm)
      }
      lik <- cbind(lik, likk)
      pip1 <- pmax(pip1, 1e-8)
      p <- pip1
      convcrit <- max((likk - lik.old)^2)
      iter <- iter + 1
    }
  } else {
    stop("mode must be 1 or 2", call. = FALSE)
  }
  list(p = p, lik = lik)
}


# Choose a grid of standard deviations from estimates and their standard
# errors.
# INPUT:
# betahat   - vector of estimates
# sebetahat - vector of standard errors of betahat
# mult      - ratio between successive grid values; 0 requests the
#             two-point grid c(0, sigmaamax/2)
# OUTPUT: an increasing vector of standard deviations ending at sigmaamax
# Observations with a zero standard error are excluded from both vectors,
# so the remaining estimates stay aligned with their standard errors.
autoselect.mixsd <- function(betahat, sebetahat, mult) {
  keep <- sebetahat != 0 #To avoid exact measure causing (usually by mistake)
  if (length(betahat) == length(sebetahat)) {
    # apply the same exclusion to betahat; filtering only sebetahat would
    # misalign the elementwise comparisons below
    betahat <- betahat[keep]
  }
  sebetahat <- sebetahat[keep]
  sigmaamin <- min(sebetahat) / 10 #so that the minimum is small compared with measurement precision
  if (all(betahat^2 <= sebetahat^2)) {
    sigmaamax <- 8 * sigmaamin #to deal with the occasional odd case where this could happen; 8 is arbitrary
  } else {
    #this computes a rough largest value you'd want to use, based on idea
    #that sigmaamax^2 + sebetahat^2 should be at least betahat^2
    sigmaamax <- 2 * sqrt(max(betahat^2 - sebetahat^2))
  }
  if (mult == 0) {
    return(c(0, sigmaamax / 2))
  }
  npoint <- ceiling(log2(sigmaamax / sigmaamin) / log2(mult))
  mult^((-npoint):0) * sigmaamax
}

# Choose a grid of symmetric-beta parameters from observed proportions.
# INPUT:
# flow.prophat - vector of observed proportions
# z_level      - vector of totals the proportions were computed from
# mult         - grid ratio forwarded to autoselect.mixsd
# OUTPUT: the distinct values of alpha = 0.5 * (1/(4*sd^2) - 1) over the
# grid of sd values returned by autoselect.mixsd, capped at 10^7. This is
# the alpha at which a Beta(alpha, alpha) distribution has standard
# deviation sd. Values may be zero or negative; no filtering is done here.
autoselect.mixalpha <- function(flow.prophat, z_level, mult = sqrt(2)) {
  # binomial-style standard error of each proportion
  se_all <- sqrt(flow.prophat * (1 - flow.prophat) / z_level)

  # keep observations whose standard error is neither zero nor infinite
  # (which() also discards positions where the comparison is NA)
  usable <- which(se_all != 0 & se_all != Inf)

  sd_grid <- autoselect.mixsd(betahat = flow.prophat[usable],
                              sebetahat = se_all[usable],
                              mult = mult)

  alpha_grid <- 0.5 * ((1 / (4 * sd_grid^2)) - 1)
  alpha_grid[alpha_grid > 10^7] <- 10^7
  unique(alpha_grid)
}



#The main shrinkage function, as with the original BMSMShrink
#x is the signal; it is passed to cxxParentTItable, so its length is
#expected to be a power of two
#mode is forwarded to binash and reverse.pp: 1 for a mixture of a point mass
#and a single beta distn, or 2 for a mixture of multiple betas
#return.est: returns only the estimate if TRUE, and a list with the
#estimate (est), the estimated p's (p) and the beta grid (q) when FALSE
#gridmult: ratio between successive grid values, forwarded to
#autoselect.mixalpha
#pointmass: if TRUE, the value 10^10 is prepended to the grid of beta
#parameters
#The beta parameters q are not an argument: they are chosen from the data
#by autoselect.mixalpha, using the proportions formed from the
#odd- and even-indexed entries of x, keeping only positive values.
binshrink <- function(x, mode = 2, return.est = FALSE, gridmult = sqrt(2), pointmass = FALSE) {
  odd_counts <- x[c(TRUE, FALSE)]
  even_counts <- x[c(FALSE, TRUE)]

  # proportion of each adjacent pair's total that falls on the odd entry
  flow.prophat <- odd_counts / (odd_counts + even_counts)

  alpha_grid <- autoselect.mixalpha(flow.prophat = flow.prophat,
                                    z_level = (even_counts + odd_counts),
                                    mult = gridmult)
  alpha_grid <- alpha_grid[alpha_grid > 0]
  if (pointmass) {
    alpha_grid <- c(10^10, alpha_grid)
  }
  q <- alpha_grid

  # decomposition tables, mixture weights, then the reconstruction
  tables <- cxxParentTItable(x)
  tit <- tables$TItable
  ptit <- tables$parent
  pp <- binash(tit, ptit, q, mode)$p
  est <- reverse.pp(tit, pp, q, mode)

  if (return.est == TRUE) {
    return(est)
  }
  list(est = est, p = pp, q = q)
}

kkdey/ordtpx documentation built on May 20, 2019, 10:36 a.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

kkdey/ordtpx
Estimation of Topic Models with Ordered Features using Multi-resolution analysis

R/binshrink.R
In kkdey/ordtpx: Estimation of Topic Models with Ordered Features using Multi-resolution analysis

Defines functions interleave rshift lshift ParentTItable sfunc reverse.pp binash autoselect.mixsd autoselect.mixalpha binshrink

R Package Documentation

Browse R Packages

We want your feedback!

kkdey/ordtpx Estimation of Topic Models with Ordered Features using Multi-resolution analysis

R/binshrink.R In kkdey/ordtpx: Estimation of Topic Models with Ordered Features using Multi-resolution analysis

Defines functions interleave rshift lshift ParentTItable sfunc reverse.pp binash autoselect.mixsd autoselect.mixalpha binshrink

R Package Documentation

Browse R Packages

We want your feedback!

kkdey/ordtpx
Estimation of Topic Models with Ordered Features using Multi-resolution analysis

R/binshrink.R
In kkdey/ordtpx: Estimation of Topic Models with Ordered Features using Multi-resolution analysis