R/backaddfor.cind.R

Defines functions backaddfor.cind

backaddfor.cind <-
  function(formula, cat.var, data, range = NULL, k = 1, l.s.points = 100, eps = 0.001, repmax = 50, min.p.cat = 1, randnodes = FALSE){

    Y <- data[,all.vars(formula)[1]]
    if(is.null(range)) {
      X <- data[[cat.var]]
    } else{
      X <- data[[cat.var]][data[[cat.var]] >= range[1] & data[[cat.var]] <= range[2]]
    }
    var.names <- c(all.vars(formula), cat.var)

    # range is a vector such as: range=c(a,b)

    # Initial nodes
    cuts <- seq(stats::quantile(X, 0.05), stats::quantile(X, 0.95), length = k+2)[-c(1,k+2)]
    cuts0 <- c(min(X)-0.001, cuts, max(X)+0.001)
    cind.matrix <- matrix(ncol = 2, nrow = length(cuts0))
    colnames(cind.matrix)<- c("points","c-index")
    data$x.cut <- cut(X, breaks = cuts0, include.lowest=TRUE, right=TRUE)
    formula.n <- stats::update(formula, stats::as.formula(". ~ . + x.cut"))
    # fit <- gam(formula.n, family = "binomial", data = data)
    fit <- try(rms::cph(formula.n, data = data))
    # auc0 <- roc(Y, predict(fit), quiet=TRUE)$auc
    cind0 <- cindex.categorization(fit$linear.predictors, survival::Surv(data[,var.names[1]],data[,var.names[2]]))
    # cind0 <- cindex.categorization(fit$linear.predictors, Surv(data[,all.vars(formula.n)[1]], data[,all.vars(formula.n)[2]]))

    # Random nodes
    if(randnodes == TRUE){
      for(rep in 1:5) {
        cind1 = 0
        cuts1 = cuts0
        cuts1[2:(k+1)] <- sample(X,k)
        cuts1 <- sort(cuts1)
        if(length(unique(cuts1)) == length(cuts1)) {
          data$x.cut=cut(X, breaks = cuts1, include.lowest=TRUE, right=TRUE)
          if (min(table(data$x.cut)) >= min.p.cat) {
            fit <- try(rms::cph(formula.n, data = data))
            cind1 <- cindex.categorization(fit$linear.predictors, survival::Surv(data[,var.names[1]],data[,var.names[2]]))}
          if (cind1 > cind0) {
            cind0=cind1; cuts0=cuts1; cuts0=sort(cuts0)}}}
    }

    # Sequential search setup
    caux <- seq(min(X), max(X), length.out = l.s.points + 2)[-c(1, l.s.points + 2)]
    nrep <- 0
    cind_old <- 0
    continue <- TRUE

    # Sequential search
    while (continue) {
      nrep = nrep+1
      for (j in 2:(k+1)) {
        for (ifino in 1:l.s.points) {
          cind1 = 0
          cuts1 = cuts0
          cuts1[j] = caux[ifino]
          cuts1 = sort(cuts1)
          if(length(cuts1) > length(unique(cuts1))) {auc1=0}
          else {
            data$x.cut <- cut(X, breaks = cuts1, include.lowest=TRUE, right=TRUE)
            fit <- try(rms::cph(formula.n, data = data))
            # if (min(table(data$x.cut)) >= min.p.cat) {
            if(length(class(fit)) > 1){
              cind1 <- cindex.categorization(fit$linear.predictors, survival::Surv(data[,var.names[1]],data[,var.names[2]]))
            } else {cind1 <- NA}
          }
          if (cind1 > cind0) {cind0=cind1; cuts0=cuts1; cuts0=sort(cuts0)}
        }
      }

      if (nrep > 1 & abs((cind0-cind_old)/cind_old) < eps) {continue=FALSE}
      if (nrep > repmax) {continue = FALSE}
      cind_old = cind0}

    data$x.cut <- cut(X, breaks = cuts0, include.lowest=TRUE, right=TRUE)
    fit <- try(rms::cph(formula.n, data = data))
    list(cuts = cuts0[-c(1,k+2)], cind = cind0)
    # list(cuts = cuts0[-c(1,k+2)], cind = cind0, pred = predict(fit, type = "response"))
  }

Try the CatPredi package in your browser

Any scripts or data that you put into this service are public.

CatPredi documentation built on May 8, 2026, 9:07 a.m.