# R/mixcure.penal.profile.CI.nested.r

# Defines functions: vcov.mixcure, coef.mixcure, print.mixcure, mixcure.penal.profile.CI.nested

# Documented in mixcure.penal.profile.CI.nested

############################################################
### Function for profile likelihood confidence interval ####
#### of mixcure model penalized loglikelihoods         #####
############################################################
#### previously 'mixcure.penal.profile.CI.test.r' ##
####################################################

mixcure.penal.profile.CI.nested <- function(formula, data, init, pl, apct = 0.05, LRT.pval = F, iterlim = 200) {
  require(splines)
  require(survival)
  require(abind)
  require(R.utils)

  #########################################################################################
  mat.inv <- function(matx) {
    ## Inverse of a square matrix.
    ##
    ## matx   : a square numeric matrix (2x2 or larger).
    ## returns: the inverse of matx.
    ##
    ## The 2x2 case keeps the closed-form adjugate formula. For n > 2 the
    ## original implementation built the adjugate from n^2 cofactor
    ## determinants, which is both slow and numerically unstable; base
    ## solve() (LU decomposition) is used instead.
    ## NOTE: solve() stops with an error on an exactly singular matrix,
    ## where the cofactor version silently produced Inf/NaN entries.
    if (ncol(matx) == 2) {
      # closed-form 2x2 inverse: (1/det) * [d -b; -c a]
      detm <- det(matx)
      inv.matx <- (1/detm) * matrix(c(matx[2,2], -matx[2,1],
                                      -matx[1,2], matx[1,1]), nrow = 2)
    } else {
      # any n > 2 dimension square matrix
      inv.matx <- solve(matx)
    }

    return(inv.matx)
  }


  # Build the model frame (rows with missing values dropped) and pull the
  # survival response out of column 1; survt[,1] = time, survt[,2] = status.
  design.matrix <- model.frame(formula, data = data, na.action = na.omit);
  survt <- design.matrix[,1];

  # Expand to the numeric design matrix (intercept + dummy coding).
  design.matrix <- model.matrix(formula, data = design.matrix);

  # index ranges of coefficients of glm and cox models;
  # the same covariates appear in both parts, so the parameter vector is
  # laid out as c(cure-part coefs, survival-part coefs, shape).
  index.cure.v <- 1 : ncol(design.matrix);
  index.surv.v <- (ncol(design.matrix) + 1) : (2*length(index.cure.v))
  # index of alpha,the shape parameter
  index.gamma <- 2*length(index.cure.v)+1;

  # sample size after NA removal
  samp.s <- nrow(design.matrix)


  ####################################################
  ## nonlinear minimization algoritm to solve       ##
  ## penalized mixture cure loglikelihood functions ##
  ####################################################


  loglik.mixture <- function(p, survt, design.matrix, index.cure.var=index.cure.v, index.surv.var=index.surv.v, pl) {
    ## Negative log-likelihood of the Weibull mixture cure model, optionally
    ## Firth-penalized; returned NEGATED so that nlm() (a minimizer)
    ## maximizes the likelihood.
    ##
    ## p     : c(cure-part coefficients, survival-part coefficients, shape);
    ##         the shape position `index.gamma` comes from the enclosing scope.
    ## survt : survival response; survt[,1] = time, survt[,2] = status
    ##         (1 = event, 0 = censored).
    ## pl    : TRUE  -> penalized loglik (subtracts 0.5*log det(Fisher info)
    ##                  from the negated value);
    ##         FALSE -> plain loglik.

    #### parameter- and data-dependent quantities
    theta = 1/(1+exp(-design.matrix%*%p[index.cure.var]))
    eps = survt[,1]^(p[index.gamma])*exp(design.matrix%*%p[index.surv.var])
    eta = 1/((exp(eps)-1)*theta+1)
    delta = 1/(theta/(1-theta)*exp(eps)+1)
    kap= (1-eta)*(1-theta)*(theta + eta)
    # NOTE: the original also computed pi, lambda and phi here; none were
    # ever used and `pi` masked the base constant, so they were removed.

    # Weibull shape parameter on its original scale (no exp() transform);
    p.gamma <- p[index.gamma]

    # loglikelihood is defined as the negative of the actual loglikelihood
    # for feeding the nlm() minimizer;
    loglikelihood <- -sum( ( log(1-theta) + log(p.gamma)-log(survt[,1])
                             +log(eps)-eps )[survt[, 2] == 1] ) -
      sum( (log(theta + (1-theta)*exp(-eps)))[survt[, 2] == 0] );

    if (!pl) {
      loglik = loglikelihood
    } else {

      #### Fisher information assembled block-wise:
      #### A = cure x cure, B = cure x (surv, shape),
      #### D = (surv, shape) x (surv, shape).

      n.elema = length(index.cure.var)^2
      a.sub1 <- matrix(rep(0,n.elema), nrow = length(index.cure.var))
      a.sub2 <- matrix(rep(0,n.elema), nrow = length(index.cure.var))

      for (i in c(index.cure.var)) {
        for (j in c(index.cure.var)) {
          a.sub1[i,j] <- sum((design.matrix[,i]*design.matrix[,j]*theta*(1-theta))[survt[, 2] == 1])
          a.sub2[i,j] <- sum((design.matrix[,i]*design.matrix[,j]*kap)[survt[, 2] == 0])
        }
      }
      info.a = a.sub1 + a.sub2

      # design matrix augmented with log(t); the extra column corresponds
      # to the shape parameter.
      design.xt <- cbind(design.matrix, log(survt[,1]))
      n.elemb <- length(index.cure.var)*(length(index.cure.var)+1)
      b.sub <- matrix(rep(0,n.elemb), nrow = length(index.surv.var))

      for (i in c(index.cure.var)) {
        for (j in c(index.cure.var,length(index.surv.var)+1)) {
          b.sub[i,j] <- -sum((design.matrix[,i]*design.xt[,j]*eps*(1-delta)*delta)[survt[, 2] == 0]) #alternative expression for est
        }
      }
      info.b = b.sub  #Upper right block of fisher.info;

      n.elemd <- (length(index.surv.var)+1)^2
      d.sub1 <- matrix(rep(0,n.elemd), nrow = (length(index.surv.var)+1))
      d.sub2 <- matrix(rep(0,n.elemd), nrow = (length(index.surv.var)+1))
      for (i in c(index.cure.var,length(index.surv.var)+1)) {
        for (j in c(index.cure.var,length(index.surv.var)+1)) {
          d.sub1[i,j] <- sum((design.xt[,i]*design.xt[,j]*eps)[survt[, 2] == 1])
          d.sub2[i,j] <- sum((design.xt[,i]*design.xt[,j]*(eps*delta-eps^2*delta+eps^2*delta^2))[survt[, 2] == 0])
        }
      }
      # the (shape, shape) cell gets the extra d1/gamma^2 curvature term
      info.d = d.sub1 + d.sub2 +
        matrix(c(rep(0, (n.elemd-1)),sum(survt[, 2] == 1)/(p[index.gamma]^2)),nrow = (length(index.surv.var)+1))

      info.d.inv = mat.inv(info.d)

      # det(Fisher info) via the Schur complement of D:
      # det = det(A - B D^-1 B^T) * det(D).  (The full assembled fisher.info
      # matrix built by the original was never used and has been removed.)
      info.set0 = info.a-info.b%*%info.d.inv%*%t(info.b)
      det.info = det(info.set0)*det(info.d)

      loglik = loglikelihood - 0.5*log(det.info)
    }
    return(loglik)
  }

  ######END of loglik.mixture####################################


  # Parameter estimation under Ha (non-restricted likelihood)
  # maximize penalized or unpenalized loglikelihood by nlm;
  maximizer0 <- nlm(
    f = loglik.mixture, p = init, survt=survt, design.matrix=design.matrix,
    pl = pl,
    iterlim = iterlim, hessian=F);

  loglik <- -maximizer0$minimum  #in loglik function loglik was calculated as minus of actual loglik value




  #create CI for profile likelihood, this option only outputs estimates and PL under specified model;


  ## loglik function for testing parameters of cure or surv part ##
  ######################################################################
  # loglik.mixture.part <- function(p, survt, design.matrix1, design.matrix0,
  #                                 index.cure.var=index.cure.v,
  #                                 index.surv.var=index.surv.v, pl) {  #design.matrix1-surv, design.matrix0-cure
  #
  #   design.mtx.comb = cbind(design.matrix0,design.matrix1)
  #
  #   #parameter and variable dep parameters;
  #   theta = 1/(1+exp(-design.mtx.comb[,index.cure.var]%*%as.matrix(p[index.cure.var])))
  #   eps = survt[,1]^(p[index.gamma])*exp(design.mtx.comb[,index.surv.var]%*%as.matrix(p[index.surv.var]))
  #   eta = 1/((exp(eps)-1)*theta+1)
  #   delta = 1/(theta/(1-theta)*exp(eps)+1)
  #   #kap = theta*(1-theta)*(1-eta)-(1-theta)^2*eta*(1-eta)
  #   kap= (1-eta)*(1-theta)*(theta + eta)
  #   pi = exp(eps)*eps*eta^2
  #   lambda = (1-theta)^2*eta*(1-eta)*((2*eta-1)*(1-theta)+3)
  #   phi = theta*(1-theta)*((2*eta-1)*(1-theta)+theta)*pi
  #
  #   ####################################################################################################
  #   # Note: below constructs fisher info matrix; steps are divide into 4 blocks, 2 square blocks (A&D) #
  #   # on upper left and lower right, 2 identical transposed blocks (B) on upper right and lower left;  #
  #   # the idential B blocks are not identical in reduced models unless it's a global LRT, needs to be C#
  #   ####################################################################################################
  #
  #
  #   max.len = max(length(index.cure.var),length(index.surv.var))
  #   n.elema = max.len^2
  #   a.sub1 <- matrix(rep(0,n.elema), nrow = max.len)
  #   a.sub2 <- matrix(rep(0,n.elema), nrow = max.len)
  #
  #   for (i in c(index.cure.var)) {
  #     for (j in c(index.cure.var)) {
  #       a.sub1[i,j] <- sum((as.matrix(design.matrix0)[,i]*as.matrix(design.matrix0)[,j]*theta*(1-theta))[survt[, 2] == 1])
  #       a.sub2[i,j] <- sum((as.matrix(design.matrix0)[,i]*as.matrix(design.matrix0)[,j]*kap)[survt[, 2] == 0])
  #     }
  #   }
  #   info.a = (a.sub1 + a.sub2)[index.cure.var,index.cure.var]
  #
  #   ####### For error check of info.a############
  #   # for (i in c(1:max.len)) {
  #   #   for (j in c(1:max.len)) {
  #   #     a.sub1[i,j] <- sum((as.matrix(design.matrix0)[,i]*as.matrix(design.matrix0)[,j]*theta*(1-theta))[survt[, 2] == 1])
  #   #     a.sub2[i,j] <- sum((as.matrix(design.matrix0)[,i]*as.matrix(design.matrix0)[,j]*kap)[survt[, 2] == 0])
  #   #   }
  #   # }
  #   # info.a = (a.sub1 + a.sub2)[index.cure.var,index.cure.var]
  #
  #
  #      ##info matrix block B
  #   design.xt0 <- cbind(design.matrix0, log(survt[,1]))
  #   n.elemb <- max.len*(max.len+1)
  #   b.sub <- matrix(rep(0,n.elemb), nrow = max.len)
  #
  #   for (i in c(index.cure.var)) {
  #     for (j in c(1:length(index.surv.var), max.len+1)) {
  #      # b.sub[i,j] <- -sum((as.matrix(design.matrix1)[,i]*design.xt0[,j]*theta*(1-theta)*pi)[survt[, 2] == 0]) #alternative expression
  #      # b.sub[i,j] <- -sum((design.matrix1[,i]*design.xt0[,j]*eps*(1-eta)*eta*(1-theta))[survt[, 2] == 0])
  #       b.sub[i,j] <- -sum((as.matrix(design.matrix1)[,i]*design.xt0[,j]*eps*(1-delta)*delta)[survt[, 2] == 0]) #for est, PLCI
  #
  #       }
  #   }
  #   info.b = b.sub[index.cure.var,c(index.surv.var-max.len,index.gamma-max.len)]
  #
  #   ###### For error checking of info.b#########
  #   # for (i in c(1:max.len)) {
  #   #   for (j in c(1:max.len, max.len + 1)) {
  #   #     b.sub[i,j] <- -sum((as.matrix(design.matrix1)[,i]*design.xt0[,j]*theta*(1-theta)*pi)[survt[, 2] == 0])
  #   #   }
  #   # }
  #   # info.b = b.sub[index.cure.var,c(index.surv.var-max.len,index.gamma-max.len)]
  #
  # # ##info matrix block C
  #    design.xt1 <- cbind(design.matrix1, log(survt[,1]))
  # #   n.elemc <- max.len*(max.len+1)
  # #   c.sub <- matrix(rep(0,n.elemc), ncol = max.len)
  # #
  # #   for (i in c(index.cure.var)) {
  # #     for (j in c(1:length(index.surv.var), length(index.surv.var)+1)) {
  # #       c.sub[j,i] <- -sum((design.matrix1[,i]*design.xt1[,j]*delta*(1-delta)*eps)[survt[, 2] == 0])
  # #     }
  # #   }
  # #   info.c = c.sub[c(index.surv.var-max.len,index.gamma-max.len),index.cure.var]
  #
  #
  #    n.elemd <- (max.len+1)^2
  #   d.sub1 <- matrix(rep(0,n.elemd), nrow = (max.len+1))
  #   d.sub2 <- matrix(rep(0,n.elemd), nrow = (max.len+1))
  #
  #   for (i in c(index.surv.var-max.len, max.len +1)) {
  #     for (j in c(index.surv.var-max.len, max.len +1)) {
  #       d.sub1[i,j] <- sum((design.xt1[,i]*design.xt1[,j]*eps)[survt[, 2] == 1])
  #       d.sub2[i,j] <- sum((design.xt1[,i]*design.xt1[,j]*(eps*delta-eps^2*delta+eps^2*delta^2))[survt[, 2] == 0])
  #      # d.sub2[i,j] <- sum((design.xt1[,i]*design.xt1[,j]*(eps*delta^2))[survt[, 2] == 0])
  #     }
  #   }
  #   d.sub = d.sub1 + d.sub2 +
  #     matrix(c(rep(0, (n.elemd - 1)),sum(survt[, 2] == 1)/(p[index.gamma]^2)),
  #            nrow = (max.len + 1))
  #
  #   info.d = d.sub[c(index.surv.var-max.len,index.gamma-max.len),c(index.surv.var-max.len,index.gamma-max.len)]
  #
  #
  #   info.d.inv = mat.inv(info.d)
  #
  #   fisher.info = rbind(cbind(info.a,info.b),cbind(t(info.b),info.d))
  #   #hessian.mat = -fisher.info
  #
  #   # #info.set0 is (A-BD^-1B^T), dif than used in modified score;
  #   info.set0 = info.a-info.b%*%info.d.inv%*%t(info.b)
  #
  #   #determinant of hessian matrix;
  #   det.info = matrix.det(info.set0)*matrix.det(info.d)
  #   #det.info = matrix.det(fisher.info)
  #
  #   #calculate loglikelihood for the unpenalized;
  #   cure.par <- p[index.cure.var];
  #   surv.par <- p[index.surv.var];
  #   p.gamma <- p[index.gamma];  #use original shape parameter instead of exp();
  #
  #   # loglikelihood is defined as the negative of the actual loglikelihood for feeding nlm() minimizer;
  #   loglikelihood <- -sum( ( log(1-theta) + log(p.gamma)-log(survt[,1])
  #                            +log(eps)-eps )[survt[, 2] == 1] ) -
  #     sum( (log(theta + (1-theta)*exp(-eps)))[survt[, 2] == 0] );
  #
  #
  #   if (pl == FALSE)
  #   {
  #     loglik.part = loglikelihood
  #   }
  #   else if (pl == TRUE)
  #   {
  #
  #       loglik.part = loglikelihood - 0.5*log(det.info)
  #   }
  #
  #
  #   return(loglik.part)
  # }
  #

  #############################################################################################

  ## loglik function for constructing profile likelihood of cure or surv part ##
  loglik.mixture.profile <- function(p, survt, k=k, design.matrix1=design.matrix, design.matrix0=design.matrix, param.est, index.cure.var=index.cure.v, index.surv.var=index.surv.v, pl) {
    ## Negative (optionally penalized) profile log-likelihood with the k-th
    ## parameter FIXED at `param.est`; `p` holds the remaining parameters
    ## (one shorter than the full vector, hence the index.gamma-1 shifts).
    ## k <= #cure coefs -> a cure-part coefficient is profiled;
    ## k >  #cure coefs -> a survival-part coefficient is profiled.
    ## NOTE(review): the default `k = k` is a self-referential promise and
    ## errors if `k` is not supplied explicitly -- always pass k.

    design.mtx.comb = cbind(design.matrix0,design.matrix1)
    ik = k-length(index.cure.var);  # position of k within the survival part

    # cure-part probability; substitute the fixed value when a cure coef is profiled
    if (k > length(index.cure.v)) {
      theta = 1/(1+exp(-design.matrix[,index.cure.var]%*%as.matrix(p[index.cure.var])))
    } else {
      theta = 1/(1+exp(-design.matrix[,index.cure.var[-k]]%*%as.matrix(p[-c(index.surv.var-1,index.gamma-1)])-design.mtx.comb[,k]*param.est))
    }
    # Weibull cumulative-hazard term; substitute the fixed value when a surv coef is profiled
    if (k > length(index.cure.v)) {
      eps = survt[,1]^(p[index.gamma-1])*exp(design.mtx.comb[,index.surv.var[-ik]]%*%as.matrix(p[-c(index.cure.var,index.gamma-1)])+design.mtx.comb[,k]*param.est)
    } else {
      eps = survt[,1]^(p[index.gamma-1])*exp(design.mtx.comb[,index.surv.var]%*%as.matrix(p[index.surv.var-1]))
    }

    eta = 1/((exp(eps)-1)*theta+1)
    delta = 1/(theta/(1-theta)*exp(eps)+1)
    kap= (1-eta)*(1-theta)*(theta + eta)  # for est,PLCI
    # NOTE: unused pi/lambda/phi intermediates from the original were removed;
    # `pi` also masked the base constant.

    # Weibull shape on its original scale (no exp() transform);
    p.gamma <- p[index.gamma-1];

    # loglikelihood is defined as the negative of the actual loglikelihood
    # for feeding the nlm() minimizer;
    loglikelihood <- -sum( ( log(1-theta) + log(p.gamma)-log(survt[,1])
                             +log(eps)-eps )[survt[, 2] == 1] ) -
      sum( (log(theta + (1-theta)*exp(-eps)))[survt[, 2] == 0] );

    if (pl) {
      ################################################################################
      # Fisher info in blocks: A (cure x cure), B (cure x [surv, shape]) and         #
      # D ([surv, shape] x [surv, shape]); the penalty uses det via Schur complement.#
      ################################################################################
      max.len = max(length(index.cure.var),length(index.surv.var))
      n.elema = max.len^2
      a.sub1 <- matrix(rep(0,n.elema), nrow = max.len)
      a.sub2 <- matrix(rep(0,n.elema), nrow = max.len)

      for (i in c(index.cure.var)) {
        for (j in c(index.cure.var)) {
          a.sub1[i,j] <- sum((as.matrix(design.matrix0)[,i]*as.matrix(design.matrix0)[,j]*theta*(1-theta))[survt[, 2] == 1])
          a.sub2[i,j] <- sum((as.matrix(design.matrix0)[,i]*as.matrix(design.matrix0)[,j]*kap)[survt[, 2] == 0])
        }
      }
      info.a = (a.sub1 + a.sub2)

      ##info matrix block B
      design.xt0 <- cbind(design.matrix0, log(survt[,1]))
      n.elemb <- max.len*(max.len+1)
      b.sub <- matrix(rep(0,n.elemb), nrow = max.len)

      for (i in c(index.cure.var)) {
        for (j in c(1:length(index.surv.var), max.len+1)) {
          b.sub[i,j] <- -sum((as.matrix(design.matrix1)[,i]*design.xt0[,j]*eps*(1-delta)*delta)[survt[, 2] == 0])
        }
      }
      info.b = b.sub

      ###info matrix block D
      design.xt1 <- cbind(design.matrix1, log(survt[,1]))

      n.elemd <- (max.len+1)^2
      d.sub1 <- matrix(rep(0,n.elemd), nrow = (max.len+1))
      d.sub2 <- matrix(rep(0,n.elemd), nrow = (max.len+1))

      for (i in c(index.surv.var-max.len, max.len +1)) {
        for (j in c(index.surv.var-max.len, max.len +1)) {
          d.sub1[i,j] <- sum((design.xt1[,i]*design.xt1[,j]*eps)[survt[, 2] == 1])
          d.sub2[i,j] <- sum((design.xt1[,i]*design.xt1[,j]*(eps*delta-eps^2*delta+eps^2*delta^2))[survt[, 2] == 0])
        }
      }
      # extra d1/gamma^2 curvature in the (shape, shape) cell
      d.sub = d.sub1 + d.sub2 +
        matrix(c(rep(0, (n.elemd - 1)),sum(survt[, 2] == 1)/(p[index.gamma-1]^2)),
               nrow = (max.len + 1))

      info.d = d.sub

      info.d.inv = mat.inv(info.d)

      # Schur complement (A - B D^-1 B^T)
      info.set0 = info.a-info.b%*%info.d.inv%*%t(info.b)

      # BUG FIX: the original called matrix.det(), which is not defined in
      # base R or any package loaded by this file; base det() is used instead,
      # matching the sibling loglik.mixture() above.
      det.info = det(info.set0)*det(info.d)

      loglik.part = loglikelihood - 0.5*log(det.info)
    } else {
      loglik.part = loglikelihood
    }

    return(loglik.part)
  }


  #################################################################
  #### parameter estimation under H0 for individual parameter
  #### loglikelihood ratio test statistics for each cure part variable;

  # number of coefficients in each model part
  dim.v <- ncol(design.matrix)

  if (LRT.pval == T) {
    # Likelihood-ratio tests for each cure-part coefficient (intercept
    # skipped): refit with the k-th cure coefficient removed and compare
    # against the full-model loglik.
    # NOTE(review): this branch calls loglik.mixture.part(), whose definition
    # is commented out above -- as the file stands LRT.pval = TRUE cannot
    # run; confirm before enabling.
    ll.cure <- rep(0,dim.v)
    llr.cure <- rep(0,dim.v)
    pval.cure <- rep(0,dim.v)

    for (k in index.cure.v[-1]) {
      # mle under the reduced (null) model for cure parameter;
      maximizer <- nlm(
        f = loglik.mixture.part, p = init,
        survt = survt, design.matrix0 = design.matrix,
        design.matrix1=design.matrix,
        index.cure.var=index.cure.v[-k], pl=pl,
        iterlim = iterlim, hessian=F
      );
      loglik.part = -maximizer$minimum;
      dif.ll = -2*(loglik.part-loglik);  #loglik is ll under Ha;
      pval = pchisq(abs(dif.ll),df=1,lower.tail=FALSE);
      ll.cure[k]<- loglik.part
      llr.cure[k]<- dif.ll
      pval.cure[k]<- pval
      # NOTE(review): nlm() was called with hessian=F, so maximizer$hessian
      # is not returned here and det(maximizer$hessian) would fail -- verify
      # this ridge adjustment.
      if (det(maximizer$hessian) < 1e-05)
        diag(maximizer$hessian) <- diag(maximizer$hessian) + 1e-06
    }
  }
  ###################################
  # Profile likelihood CI endpoint  #
  ###################################

  # Note:
  # loglik     -- loglikelihood of all the parameters under MLE of full likelihood;
  # l.up       -- loglik corresponds to upper or lower CI bounds B0=B+delta or B0=B-delta;
  # tol        -- tolerance level for defining loglik difference of estimated and actual parameters are converged;
  # lambda     -- lambda quantity for profile likelhood calculation as referenced;
  # delta.up   -- delta quantity for upper endpoint of profile likelihood calculation as referenced;
  # delta.lo   -- delta quantity for lower endpoint of profile likelihood calculation as referenced;
  # l.temp/l0.b-- loglik of estimated endpoint parameter values under profile likelihood for the corresponding parameter;

  ######################################################
  ## By parameter upper or lower endpoint calculation ##
  ######################################################
  # apct=0.05

  # Target profile loglik at the CI boundary: a parameter value is an
  # endpoint when the profile loglik drops to the full-model loglik minus
  # half the chi-square(1) critical value at level apct.
  l.null = loglik - 0.5 * qchisq(1-apct,df=1,ncp = 0,lower.tail=T)
  ni = 1

  ######## Cure part variable CI endpoints ########
  #################################################

  # For each cure-part coefficient k: step the coefficient outward from its
  # MLE (lambda/delta increments built from the score and inverse hessian,
  # in the spirit of a Venzon-Moolgavkar search -- TODO confirm reference),
  # re-profile the remaining parameters with loglik.mixture.profile(), and
  # iterate until the profile loglik meets l.null within tolerance.
  upper.cure <- rep(0,dim.v)
  lower.cure <- rep(0,dim.v)
  for (k in index.cure.v) {

    ##################upper endpoint##########################
    tol = 0.1
    l.temp <- loglik

    n=ni+1

    #assign initial values to parameter estimates
    param.est.up <- maximizer0$estimate

    # outer loop: repeat score/hessian linearization + step until the profile
    # loglik at the candidate endpoint converges to l.null (max 25 rounds)
    converge <- FALSE; iter1 <- 1; EXIT1 <-FALSE; l0.b.up = 0;delta.up = 0
    while ((!converge| is.nan(l0.b.up)) & iter1 <= 25 & !EXIT1 & !is.nan(delta.up)) {

      # calculate log-lik, score and hessian under l0.b;
      # (iterlim = 1 means nlm is used only to evaluate f, gradient, hessian
      # at the current point, not to optimize)
      maximizer.temp <-  nlm(
        f = loglik.mixture, p = param.est.up, survt=survt, design.matrix=design.matrix,
        pl = pl, iterlim = 1, hessian=TRUE)
      score.temp = maximizer.temp$gradient
      hessian.temp = maximizer.temp$hessian
      # ridge the hessian when (near-)singular so solve() below succeeds
      if (det(hessian.temp) < 1e-05) diag(hessian.temp) <- diag(hessian.temp) + 1e-06

      #### Approach 1: lambda = (2*(l0.b-l.up+e*A^-1*U)/(e*A^-1*e))^0.5
      # l0.b.up <- -loglik.mixture(p=param.est.up, survt, design.matrix,
      #                            index.cure.var=index.cure.v, index.surv.var=index.surv.v, pl)
      l0.b.up <- -maximizer.temp$minimum
      inv.hessian.temp <- solve(hessian.temp)

      # if the quantity under the square root would be negative, fall back to
      # a score-only step; otherwise take the lambda from Approach 1
      if ((l0.b.up - l.null + score.temp %*% inv.hessian.temp %*% score.temp)/inv.hessian.temp[k,k]<0) {
        #   lambda <- (0.5*(l0.b.up - l.null) + (-inv.hessian.temp %*% score.temp)[k])/inv.hessian.temp[k,k]
        lambda <- (inv.hessian.temp %*% score.temp)[k]/inv.hessian.temp[k,k]
        #        lambda <- (-inv.hessian.temp %*% score.temp)[k])/inv.hessian.temp[k,k]
        #define increment for estimated value: delta=-A^-1(U-lambda*e)
        delta.up <- -inv.hessian.temp[k,k] %*% (score.temp[k] - lambda);
      } else{
        lambda <- (2*(l0.b.up - l.null + score.temp %*% inv.hessian.temp %*% score.temp)/inv.hessian.temp[k,k])^0.5
        #define increment for estimated value: delta=-A^-1(U-lambda*e)
        delta.up <- -inv.hessian.temp[k,k] %*% (score.temp[k] - lambda)};

      # maximizing loop for unpenalized estimates;
      #if (pl == F) {
      # inner loop: shrink the step until the profiled loglik at the trial
      # point stays inside the confidence region (max 100 halving rounds)
      inside <- FALSE; iter2 <- 1;
      while (!inside & iter2 <= 100 & !is.nan(delta.up)) {

        # add increment to stepwise parameter value;
        param.est.temp.up <- param.est.up
        param.est.temp.up[k] <- param.est.temp.up[k]+delta.up
        # if (k==2) {param.est.temp.up[1] <- -1;param.est.temp.up[9] <- 0.1}

        #compute loglikelihood function using updated parameter values;

        # re-profile the other parameters with the k-th held at the trial value
        maximizer.temp1 <- nlm( f = loglik.mixture.profile, p = param.est.temp.up[-k], survt=survt,
                                param.est = param.est.temp.up[k], k = k,
                                pl = pl, iterlim = iterlim, hessian=TRUE)
        l.temp.up = -maximizer.temp1$minimum

        #if (!is.nan(l.temp.up))

        #compare to see if updated l is still
        inside <- (l.temp.up > (l.null - 0.05)) #l.null - 0.05 for all others, 0.2 for k=3 of high rate H0
        #diff.up = l.temp.up - l.null
        #converge0 <- (abs(diff.up) <= tol)
        alevel.up <- pchisq(2*(l.temp-l.temp.up),df=1,ncp=0,lower.tail = T)
        #print(c(delta.up, alevel.up, n,l.temp.up,k,iter1,iter2))
        if (!inside) {delta.up <- delta.up/((n+1)/n);iter2 <- iter2 + 1}  #(n+0.1)/n for low rate H0;
        if (is.nan(delta.up)) {param.est.temp.up[k] <- NA}
      } #for iter2

      #}
      #Using converged increment for parameter to get corresponding score and variance expressions;
      # insert() is R.utils::insert -- splices the fixed k-th value back into
      # the profiled parameter vector
      param.est.up <- insert(maximizer.temp1$estimate, ats=k, values=param.est.temp.up[k])

      l0.b.up = l.temp.up

      diff.up = l0.b.up - l.null
      converge <- (abs(diff.up) <= tol)
      if ((!converge| is.nan(l0.b.up)) & !is.nan(delta.up)) {iter1 <- iter1 + 1; n = n + 1} else {EXIT1 = T;}
      if (is.nan(delta.up)==T) {param.est.up[k] <- NA}
    } #for iter1
    #} #for iter0
    upper.cure[k] <- param.est.up[k]


    ###############lower endpoint#####################
    # same scheme as the upper endpoint but stepping downward (negative lambda)

    n=ni
    #iter0 <- 1; converge = FALSE; l0.b.lo=0
    #while(l.temp > l.null & (!converge| is.nan(l0.b.lo)) & iter0<=30) {

    #assign initial values to parameter estimates
    param.est.lo <- maximizer0$estimate

    converge <- FALSE; iter1 <- 1; EXIT1 <-FALSE; l0.b.lo=0; delta.lo=0
    while ((!converge| is.nan(l0.b.lo)) & iter1 <= 25 & !EXIT1 & !is.nan(delta.lo)) {

      # calculate log-lik, score and hessian under l0.b;
      maximizer.temp <-  nlm(
        f = loglik.mixture, p = param.est.lo, survt=survt, design.matrix=design.matrix,
        pl = pl, iterlim = 1, hessian=TRUE)
      score.temp = maximizer.temp$gradient
      hessian.temp = maximizer.temp$hessian
      if (det(hessian.temp) < 1e-05) diag(hessian.temp) <- diag(hessian.temp) + 1e-06

      #### Approach 1: lambda = (2*(l0.b-l.null+e*A^-1*U)/(e*A^-1*e))^0.5
      # l0.b.lo <- -loglik.mixture(p=param.est.lo, survt, design.matrix,
      #                            index.cure.var=index.cure.v, index.surv.var=index.surv.v, pl)
      l0.b.lo <- -maximizer.temp$minimum
      inv.hessian.temp <- solve(hessian.temp)
      if ((l0.b.lo < l.null + 0.5 * score.temp %*% inv.hessian.temp %*% score.temp)|(l0.b.lo - l.null + score.temp %*% inv.hessian.temp %*% score.temp)/inv.hessian.temp[k,k]<0) {
        lambda <- ((-inv.hessian.temp %*% score.temp)[k])/inv.hessian.temp[k,k]
        #define increment for estimated value: delta=-A^-1(U-lambda*e)
      } else{
        lambda <- -(2*(l0.b.lo - l.null + score.temp %*% inv.hessian.temp %*% score.temp)/inv.hessian.temp[k,k])^0.5}
      #define increment for estimated value: delta=-A^-1(U-lambda*e)
      delta.lo <- -inv.hessian.temp[k,k] %*% (score.temp[k] - lambda);

      # maximizing loop for unpenalized estimates;
      #if (pl == F) {
      inside <- FALSE; iter2 <- 1;
      while (!inside & iter2 <= 100 & !is.nan(delta.lo)) {

        # add increment to stepwise parameter value;
        param.est.temp.lo <- param.est.lo
        param.est.temp.lo[k] <- param.est.temp.lo[k] + delta.lo
        # param.est.temp.lo[9] <- 0.1

        #compute loglikelihood function using lodated parameter values;
        maximizer.temp1 <- nlm( f = loglik.mixture.profile, p = param.est.temp.lo[-k], survt=survt,
                                param.est = param.est.temp.lo[k], k = k,
                                pl = pl, iterlim = iterlim, hessian=TRUE)
        l.temp.lo = -maximizer.temp1$minimum

        # NOTE(review): hard-coded special case for k==3 -- appears tuned to
        # one specific dataset/covariate (see the LuminalA comment below);
        # confirm this is intended for general use.
        if (k==3) {dt.lo=0.1} else {dt.lo=0.5}
        inside <- (l.temp.lo > l.null - 0.1)
        # diff.lo = l.temp.lo - l.null
        # converge0 <- (abs(diff.lo) <= tol)
        alevel.lo <- pchisq(2*(l.temp-l.temp.lo),df=1,ncp=0,lower.tail = T)
        #print(c(delta.lo, alevel.lo, n,l.temp.lo,k,iter1,iter2))
        if (!inside) {delta.lo <- delta.lo/((n+dt.lo)/n);iter2 <- iter2 + 1} #for variables other than LuminalA (n+0.5)/n;
        if (is.nan(delta.lo)) {param.est.temp.lo[k] <- NA}

      } # for iter2;
      param.est.lo <- insert(maximizer.temp1$estimate, ats=k, values=param.est.temp.lo[k])
      l0.b.lo = l.temp.lo

      diff.lo = l0.b.lo - l.null
      converge <- (abs(diff.lo) <= tol)
      if ((!converge | is.nan(l0.b.lo)) & !is.nan(delta.lo)) {iter1 <- iter1 + 1; n = n + 2} else {EXIT1 = T}
      if (is.nan(delta.lo)==T) {param.est.lo[k] <- NA}

    } #for iter1

    lower.cure[k] <- param.est.lo[k]

  }



  ### loglikelihood calculation for each surv part variable;


  if (LRT.pval == T) {
    # Likelihood-ratio tests for each survival-part coefficient (intercept
    # skipped); `is` is the coefficient's position within the survival part.
    # NOTE(review): like the cure-part LRT block, this calls
    # loglik.mixture.part(), which is commented out above -- LRT.pval = TRUE
    # cannot run as the file stands; confirm before enabling.
    ll.surv <- rep(0,ncol(design.matrix))
    llr.surv <- rep(0,ncol(design.matrix))
    pval.surv <- rep(0,ncol(design.matrix))

    for (k in index.surv.v[-1]) {
      # mle under the reduced (null) model for surv parameter;
      is=k-length(index.cure.v)
      maximizer <- nlm(
        f = loglik.mixture.part, p = init,
        survt = survt, design.matrix1 = design.matrix,
        design.matrix0=design.matrix,
        index.surv.var=index.surv.v[-is], pl=pl,
        iterlim = iterlim, hessian=FALSE
      );

      # LRT statistic: -2 * (reduced loglik - full loglik), df = 1
      loglik.part = -maximizer$minimum;
      dif.ll = -2*(loglik.part-loglik);
      pval = pchisq(abs(dif.ll),df=1,lower.tail=FALSE);
      ll.surv[is]<- loglik.part
      llr.surv[is]<-dif.ll
      pval.surv[is]<-pval
    }
  }

  ######## Surv part variable CI endpoints ########
  #################################################

  upper.surv <- rep(0,dim.v)
  lower.surv <- rep(0,dim.v)
  for (k in index.surv.v) {

    is=k-length(index.cure.v)
    ##################upper endpoint##########################
    l.temp <- loglik
    tol = 0.2

    n=ni
    # iter0 <- 1; converge = FALSE;l0.b.up = 0;
    # while(l.temp > l.null & (!converge| is.nan(l0.b.up)) & iter0<=30) {

    #assign initial values to parameter estimates
    param.est.up <- maximizer0$estimate

    converge <- FALSE; iter1 <- 1; EXIT1 <-FALSE; l0.b.up = 0;delta.up = 0
    while ((!converge| is.nan(l0.b.up)) & iter1 <= 25 & !EXIT1 & !is.nan(delta.up)) {

      # calculate log-lik, score and hessian under l0.b;
      maximizer.temp <-  nlm(
        f = loglik.mixture, p = param.est.up, survt=survt, design.matrix=design.matrix,
        pl = pl, iterlim = 1, hessian=TRUE)
      score.temp = maximizer.temp$gradient
      hessian.temp = maximizer.temp$hessian
      if (det(hessian.temp) < 1e-05) diag(hessian.temp) <- diag(hessian.temp) + 1e-06

      #### Approach 1: lambda = (2*(l0.b-l.up+e*A^-1*U)/(e*A^-1*e))^0.5
      # l0.b.up <- -loglik.mixture(p=param.est.up, survt, design.matrix,
      #                            index.cure.var=index.cure.v, index.surv.var=index.surv.v, pl)
      l0.b.up <- -maximizer.temp$minimum
      inv.hessian.temp <- solve(hessian.temp)
      if ((l0.b.up - l.null + score.temp %*% inv.hessian.temp %*% score.temp)/inv.hessian.temp[k,k]<0) {
        #   lambda <- (0.5*(l0.b.up - l.null) + (-inv.hessian.temp %*% score.temp)[k])/inv.hessian.temp[k,k]
        lambda <- (inv.hessian.temp %*% score.temp)[k]/inv.hessian.temp[k,k]
        #define increment for estimated value: delta=-A^-1(U-lambda*e)
        delta.up <- -inv.hessian.temp[k,k] %*% (score.temp[k] - lambda);
      } else{
        lambda <- (2*(l0.b.up - l.null + score.temp %*% inv.hessian.temp %*% score.temp)/inv.hessian.temp[k,k])^0.5
        #define increment for estimated value: delta=-A^-1(U-lambda*e)
        delta.up <- -inv.hessian.temp[k,k] %*% (score.temp[k] - lambda)};

      # maximizing loop for unpenalized estimates;
      #if (pl == F) {
      inside <- FALSE; iter2 <- 1;
      while (!inside & iter2 <= 100 & !is.nan(delta.up)) {

        # add increment to stepwise parameter value;
        param.est.temp.up <- param.est.up
        param.est.temp.up[k] <- param.est.temp.up[k]+delta.up

        #compute loglikelihood function using updated parameter values;

        maximizer.temp1 <- nlm( f = loglik.mixture.profile, p = param.est.temp.up[-k], survt=survt,
                                param.est = param.est.temp.up[k], k = k,
                                pl = pl, iterlim = iterlim, hessian=TRUE)
        l.temp.up = -maximizer.temp1$minimum

        #if (!is.nan(l.temp.up))

        #compare to see if updated l is still
        inside <- (l.temp.up > (l.null - 0.2))
        #diff.up = l.temp.up - l.null
        #converge0 <- (abs(diff.up) <= tol)
        alevel.up <- pchisq(2*(l.temp-l.temp.up),df=1,ncp=0,lower.tail = T)
        #print(c(delta.up, alevel.up, n,l.temp.up,k,iter1,iter2))
        if (!inside) {delta.up <- delta.up/((n+1)/n);iter2 <- iter2 + 1}
        if (is.nan(delta.up)) {param.est.temp.up[k] <- NA}
      } #for iter2

      #}
      #Using converged increment for parameter to get corresponding score and variance expressions;
      param.est.up <- insert(maximizer.temp1$estimate, ats=k, values=param.est.temp.up[k])
      l0.b.up = l.temp.up

      diff.up = l0.b.up - l.null
      converge <- (abs(diff.up) <= tol)
      if ((!converge| is.nan(l0.b.up)) & !is.nan(delta.up)) {iter1 <- iter1 + 1; n = n + 1} else {EXIT1 = T;}
      if (is.nan(delta.up)==T) {param.est.up[k] <- NA}
    } #for iter1

    upper.surv[is] <- param.est.up[k]


    ###############lower endpoint#####################
    n=ni
    #iter0 <- 1; converge = FALSE; l0.b.lo=0
    #while(l.temp > l.null & (!converge| is.nan(l0.b.lo)) & iter0<=30) {

    #assign initial values to parameter estimates
    param.est.lo <- maximizer0$estimate

    converge <- FALSE; iter1 <- 1; EXIT1 <-FALSE; l0.b.lo=0; delta.lo=0
    while ((!converge| is.nan(l0.b.lo)) & iter1 <= 25 & !EXIT1 & !is.nan(delta.lo)) {

      # calculate log-lik, score and hessian under l0.b;
      maximizer.temp <-  nlm(
        f = loglik.mixture, p = param.est.lo, survt=survt, design.matrix=design.matrix,
        pl = pl, iterlim = 1, hessian=TRUE)
      score.temp = maximizer.temp$gradient
      hessian.temp = maximizer.temp$hessian
      if (det(hessian.temp) < 1e-05) diag(hessian.temp) <- diag(hessian.temp) + 1e-06

      #### Approach 1: lambda = (2*(l0.b-l.null+e*A^-1*U)/(e*A^-1*e))^0.5
      # l0.b.lo <- -loglik.mixture(p=param.est.lo, survt, design.matrix,
      #                            index.cure.var=index.cure.v, index.surv.var=index.surv.v, pl)
      l0.b.lo <- -maximizer.temp$minimum
      inv.hessian.temp <- solve(hessian.temp)
      if (l0.b.lo < l.null + 0.5 * score.temp %*% inv.hessian.temp %*% score.temp) {
        lambda <- ((-inv.hessian.temp %*% score.temp)[k])/inv.hessian.temp[k,k]
        #define increment for estimated value: delta=-A^-1(U-lambda*e)
        delta.lo <- -inv.hessian.temp[k,k] %*% (score.temp[k] - lambda);
      } else{
        lambda <- -(2*(l0.b.lo - l.null + score.temp %*% inv.hessian.temp %*% score.temp)/abs(inv.hessian.temp[k,k]))^0.5
        #define increment for estimated value: delta=-A^-1(U-lambda*e)
        delta.lo <- -inv.hessian.temp[k,k] %*% (score.temp[k] - lambda)
      };

      # maximizing loop for unpenalized estimates;
      #if (pl == F) {
      inside <- FALSE; iter2 <- 1;
      while (!inside & iter2 <= 100 & !is.nan(delta.lo)) {

        # add increment to stepwise parameter value;
        param.est.temp.lo <- param.est.lo
        param.est.temp.lo[k] <- param.est.temp.lo[k] + delta.lo

        #compute loglikelihood function using updated parameter values;
        maximizer.temp1 <- nlm( f = loglik.mixture.profile, p = param.est.temp.lo[-k], survt=survt,
                                param.est = param.est.temp.lo[k], k = k,
                                pl = pl, iterlim = iterlim, hessian=TRUE)
        l.temp.lo = -maximizer.temp1$minimum


        inside <- (l.temp.lo > l.null - 0.2)
        # diff.lo = l.temp.lo - l.null
        # converge0 <- (abs(diff.lo) <= tol)
        alevel.lo <- pchisq(2*(l.temp-l.temp.lo),df=1,ncp=0,lower.tail = T)
        #print(c(delta.lo, alevel.lo, n,l.temp.lo,k,iter1,iter2))
        if (!inside) {delta.lo <- delta.lo/((n+0.1)/n);iter2 <- iter2 + 1}
        if (is.nan(delta.lo)) {param.est.temp.lo[k] <- NA}

      } # for iter2;

      #}
      #Using converged increment for parameter to get corresponding score and variance expressions;
      param.est.lo <- insert(maximizer.temp1$estimate, ats=k, values=param.est.temp.lo[k])
      l0.b.lo = l.temp.lo

      diff.lo = l0.b.lo - l.null
      converge <- (abs(diff.lo) <= tol)
      if ((!converge | is.nan(l0.b.lo)) & !is.nan(delta.lo)) {iter1 <- iter1 + 1; n = n + 1} else {EXIT1 = T}
      if (is.nan(delta.lo)==T) {param.est.lo[k] <- NA}
    } #for iter1

    lower.surv[is] <- param.est.lo[k]
  }


  coef.table.cure <- cbind(
    'coef'        = maximizer0$estimate[index.cure.v],
    'exp(coef)'   = exp(maximizer0$estimate[index.cure.v]),
    # 'LL.cure' = ll.cure,
    # 'LLR'         = llr.cure,
    # 'Pr(>chisq)'  = pval.cure,
    'LCI.95%' = lower.cure,
    'UCI.95%' = upper.cure
  );
  rownames(coef.table.cure) <- colnames(design.matrix);

  coef.table.surv <- cbind(
    'coef'        = maximizer0$estimate[index.surv.v],
    'exp(coef)'   = exp(maximizer0$estimate[index.surv.v]),
    # 'LL.surv' = ll.surv,
    # 'LLR'         = llr.surv,
    # 'Pr(>chisq)'  = pval.surv,
    'LCI.95%' = lower.surv,
    'UCI.95%' = upper.surv
  );
  rownames(coef.table.surv) <- colnames(design.matrix);

  coef.table.alpha <- 0;


  #run.time = proc.time() - init.time


  #######################################
  ## Output tables from either method; ##
  #######################################


  out <- list(
    coefficients = list(
      cure = coef.table.cure,
      surv = coef.table.surv,
      alpha = coef.table.alpha
    )
  );
  class(out) <- c('mixcure.plci', 'list');

  return(out);

}


#### print.mixcure #############################################################
# DESCRIPTION
#   To print a mixcure object.
# INPUT
#   object : a mixcure object, which is an outcome of function mixcure.
#   digits : number of digits for printing, passed to print.default.
#   ...    : other parameters passed to print.default.
# OUTPUT
#   NULL.

print.mixcure <- function(object, digits = 3, ...) {
  # Print the cure, survival, and alpha coefficient tables of a mixcure
  # object, each under a labelled separator banner.
  #
  # object : a mixcure object (a list whose 'coefficients' element holds the
  #          'cure', 'surv' and 'alpha' tables), as returned by
  #          mixcure.penal.profile.CI.nested.
  # digits : number of digits for printing, passed to print.default.
  # ...    : other parameters passed to print.default.
  #
  # Returns 'object' invisibly, per the standard R print-method convention
  # (the original returned a visible NULL, which is non-idiomatic for print
  # methods and prevents chaining).
  sep.line.cure  <- paste(c(rep('-', 37), ' CURE ',     rep('-', 37)), collapse = '')
  sep.line.surv  <- paste(c(rep('-', 37), ' SURVIVAL ', rep('-', 37)), collapse = '')
  sep.line.alpha <- paste(c(rep('-', 36), ' ALPHA ',    rep('-', 36)), collapse = '')

  # Banners go through message() (stderr) so only the tables land on stdout.
  message(sep.line.cure)
  print.default(object$coefficients$cure, digits = digits, ...)

  message(sep.line.surv)
  print.default(object$coefficients$surv, digits = digits, ...)

  message(sep.line.alpha)
  print.default(object$coefficients$alpha, digits = digits, ...)

  invisible(object)
}


#### coef.mixcure ##############################################################
coef.mixcure <- function(object) {
  # Extract the named vector of coefficient estimates from a mixcure object.
  #
  # object : a mixcure object with coefficient tables in
  #          object$coefficients$cure / $surv / $alpha.
  #
  # Returns a named numeric vector: cure-part coefficients prefixed "cure.",
  # survival-part coefficients prefixed "surv.", followed by the alpha
  # coefficient(s) when an alpha table is available.
  #
  # Fixes two defects of the original:
  #  * mixcure.penal.profile.CI.nested stores alpha as the scalar 0 (no
  #    table); indexing a scalar with [, 'coef'] errors with "incorrect
  #    number of dimensions", so alpha is included only when it is a matrix
  #    carrying a 'coef' column.
  #  * paste() with its default sep = " " produced names like "cure. x";
  #    paste0() yields the intended "cure.x".
  cure.tab  <- object$coefficients$cure
  surv.tab  <- object$coefficients$surv
  alpha.tab <- object$coefficients$alpha

  coefs <- c(cure.tab[, 'coef'], surv.tab[, 'coef'])
  names(coefs) <- c(paste0('cure.', rownames(cure.tab)),
                    paste0('surv.', rownames(surv.tab)))

  if (is.matrix(alpha.tab) && 'coef' %in% colnames(alpha.tab)) {
    alpha.coefs <- alpha.tab[, 'coef']
    # Single-row subsetting drops names; restore them from the rownames.
    names(alpha.coefs) <- rownames(alpha.tab)
    coefs <- c(coefs, alpha.coefs)
  }

  return(coefs)
}


vcov.mixcure <- function(object) {
  # Accessor for the covariance matrix stored in a mixcure fit.
  #
  # object : a mixcure object.
  #
  # Returns the 'cov' component of the object, or NULL when no covariance
  # matrix was stored.
  object$cov
}
# ChangchangXu-LTRI/Mixcure documentation built on April 22, 2022, 3:33 p.m.