R/kmPlot.default.R
In GofCens: Goodness-of-Fit Methods for Right-Censored Data

Documented in kmPlot.default

kmPlot.default <- function(times, cens = rep(1, length(times)),
                           distr = "all6", colour = c("black","blue","cornflowerblue"),
                           betaLimits = c(0, 1),
                           igumb = c(10, 10), ggp = FALSE, m = NULL,
                           prnt = FALSE, degs = 3, print.AIC = TRUE,
                           print.BIC = TRUE, ...) {
  if (!is.numeric(times)) {
    stop("Variable times must be numeric!")
  }
  if (any(times <= 0)) {
    stop("Times must be strictly positive!")
  }
  if (any(!cens %in% 0:1)) {
    stop("Status indicator must be either 0 or 1!")
  }
  if (!is.logical(ggp) || !is.logical(prnt)) {
    stop("ggp and prnt must be logicals!")
  }
  if (length(distr) == 1 && distr == "all6") {
    distributions <- c("weibull", "loglogistic", "lognormal", "gumbel",
                       "logistic", "normal")
  } else {
    distributions <- match.arg(distr, c("exponential", "weibull", "loglogistic",
                                        "lognormal", "gumbel", "logistic",
                                        "normal", "beta"), several.ok = TRUE)
  }
  if ("beta" %in% distributions && any(times < betaLimits[1] |
                                       times > betaLimits[2])) {
    warning("Beta distribution is ignored because of out-of-bounds values.
  Try with 'betaLimits = c(", pmax(0, min(times) - 1), ", ",
            ceiling(max(times) + 1), ")'.",
            immediate. = TRUE)
    cat("\n")
    distributions <- distributions[distributions != "beta"]
  }
  if (length(distributions) == 0) {
    stop("No distribution to be fitted!")
  }
  bool_complete <- all(cens==1)
  dd <- data.frame(left = as.vector(times), right = ifelse(cens == 1, times, NA))
  survKM <- survfit(Surv(times, cens) ~ 1)
  mxtime <- max(survKM$time)
  sqtime <- seq(0, mxtime, length.out = 1001)
  genlis <- vector("list", length(distributions))
  names(genlis) <- distributions
  for (v in c("params", "se", "aic", "bic", "srvline", "titl")) {
    assign(v, genlis)
  }
  if ("exponential" %in% distributions) {
    tryCatch({
      if (bool_complete) {
        fitExpo <- fitdist(dd$left, "exp")
        muu <- unname(fitExpo$estimate)
        params$exponential <- 1 / muu
        names(params$exponential) <- "scale"
        se$exponential <- sqrt(fitExpo$vcov[1])*(1/muu)^2
        names(se$exponential) <- "scale (se)"
        aic$exponential <- fitExpo$aic
        bic$exponential <- fitExpo$bic
        srvline$exponential <- 1 - pexp(sqtime, muu)
        titl$exponential <- "Exponential"
      } else {
        fitExpo <- survreg(Surv(times, cens) ~ 1, dist = "exponential")
        muu <- unname(coefficients(fitExpo))
        params$exponential <- 1 / exp(-muu)
        names(params$exponential) <- "scale"
        se$exponential <- sqrt(fitExpo$var[1])*exp(muu)
        names(se$exponential) <- "scale (se)"
        aic$exponential <- 2 - 2*fitExpo$loglik[1]
        bic$exponential <- log(length(times)) - 2*fitExpo$loglik[1]
        srvline$exponential <- 1 - pexp(sqtime, exp(-muu))
        titl$exponential <- "Exponential"
      }
    }, error = function(e) e)
  }
  if ("gumbel" %in% distributions) {
    tryCatch({
      if (bool_complete) {
        fitGumb <- try(suppressMessages(fitdist(dd$left, "gumbel",
                                                start = list(alpha = igumb[1],
                                                             scale = igumb[2]))))
        if (is(fitGumb, "try-error")) {
          stop("Function failed to estimate the parameters.\n
            Try with other initial values.")
        }
      } else {
        fitGumb <- try(suppressMessages(fitdistcens(dd, "gumbel",
                                                    start = list(alpha = igumb[1],
                                                                 scale = igumb[2]))))
        if (is(fitGumb, "try-error")) {
          stop("Function failed to estimate the parameters.\n
          Try with other initial values.")
        }
      }
      locGumb <- fitGumb$estimate[1]
      scaleGumb <- fitGumb$estimate[2]
      params$gumbel <- c(locGumb, scaleGumb)
      names(params$gumbel) <- c("location", "scale")
      locGumbSE <- fitGumb$sd[1]
      scaleGumbSE <- fitGumb$sd[2]
      se$gumbel <- c(locGumbSE, scaleGumbSE)
      names(se$gumbel) <- c("location (se)", "scale (se)")
      aic$gumbel <- fitGumb$aic
      bic$gumbel <- fitGumb$bic
      srvline$gumbel <- 1 - pgumbel(sqtime, locGumb, scaleGumb)
      titl$gumbel <- "Gumbel"
    }, error = function(e) {warning("Problem fitting Gumbel distribution, try other initial values.", immediate. = TRUE)})
  }
  if ("weibull" %in% distributions) {
    tryCatch({
      if (bool_complete) {
        fitWei <- fitdist(dd$left, "weibull")
      } else {
        fitWei <- fitdistcens(dd, "weibull")
      }
      shapeWei <- fitWei$estimate[1]
      scaleWei <- fitWei$estimate[2]
      params$weibull <- c(shapeWei, scaleWei)
      shapeWeiSE <- fitWei$sd[1]
      scaleWeiSE <- fitWei$sd[2]
      se$weibull <- c(shapeWeiSE, scaleWeiSE)
      names(se$weibull) <- c("shape (se)", "scale (se)")
      aic$weibull <- fitWei$aic
      bic$weibull <- fitWei$bic
      srvline$weibull <- 1 - pweibull(sqtime, shapeWei, scaleWei)
      titl$weibull <- "Weibull"
    }, error = function(e) e)
  }
  if ("normal" %in% distributions) {
    tryCatch({
      if (bool_complete) {
        fitNorm <- fitdist(dd$left, "norm")
      } else {
        fitNorm <- fitdistcens(dd, "norm")
      }
      locNorm <- fitNorm$estimate[1]
      scaleNorm <- fitNorm$estimate[2]
      params$normal <- fitNorm$estimate
      names(params$normal) <- c("location", "scale")
      locNormSE <- fitNorm$sd[1]
      scaleNormSE <- fitNorm$sd[2]
      se$normal <- c(locNormSE, scaleNormSE)
      names(se$normal) <- c("location (se)", "scale (se)")
      aic$normal <- fitNorm$aic
      bic$normal <- fitNorm$bic
      srvline$normal <- 1 - pnorm(sqtime, locNorm, scaleNorm)
      titl$normal <- "Normal"
    }, error = function(e) e)
  }
  if ("logistic" %in% distributions) {
    tryCatch({
      if (bool_complete) {
        fitLog <- fitdist(dd$left, "logis")
      } else {
        fitLog <- fitdistcens(dd, "logis")
      }
      locLogis <- fitLog$estimate[1]
      scaleLogis <- fitLog$estimate[2]
      params$logistic <- fitLog$estimate
      locLogisSE <- fitLog$sd[1]
      scaleLogisSE <- fitLog$sd[2]
      se$logistic <- fitLog$sd
      names(se$logistic) <- c("location (se)", "scale (se)")
      aic$logistic <- fitLog$aic
      bic$logistic <- fitLog$bic
      srvline$logistic <- 1 - plogis(sqtime, locLogis, scaleLogis)
      titl$logistic <- "Logistic"
    }, error = function(e) e)
  }
  if ("lognormal" %in% distributions) {
    tryCatch({
      if (bool_complete) {
        fitLnorm <- fitdist(dd$left, "lnorm")
      } else {
        fitLnorm <- fitdistcens(dd, "lnorm")
      }
      locLnorm <- fitLnorm$estimate[1]
      scaleLnorm <- fitLnorm$estimate[2]
      params$lognormal <- c(locLnorm, scaleLnorm)
      names(params$lognormal) <- c("location", "scale")
      locLnormSE <- fitLnorm$sd[1]
      scaleLnormSE <- fitLnorm$sd[2]
      se$lognormal <- c(locLnormSE, scaleLnormSE)
      names(se$lognormal) <- c("location (se)", "scale (se)")
      aic$lognormal <- fitLnorm$aic
      bic$lognormal <- fitLnorm$bic
      srvline$lognormal <- 1 - plnorm(sqtime, locLnorm, scaleLnorm)
      titl$lognormal <- "Lognormal"
    }, error = function(e) e)
  }
  if ("loglogistic" %in% distributions) {
    tryCatch({
      if (bool_complete) {
        fitLoglog <- fitdist(dd$left, "llogis")
        shapeLoglogis <- unname(coefficients(fitLoglog))[1]
        scaleLoglogis <- unname(coefficients(fitLoglog))[2]
        params$loglogistic <- c(shapeLoglogis, scaleLoglogis)
        names(params$loglogistic) <- c("shape", "scale")
        shapeLoglogisSE <- sqrt(fitLoglog$vcov[1,1])
        scaleLoglogisSE <- sqrt(fitLoglog$vcov[2,2])
        se$loglogistic <- c(shapeLoglogisSE, scaleLoglogisSE)
        names(se$loglogistic) <- c("shape (se)", "scale (se)")
        aic$loglogistic <- fitLoglog$aic
        bic$loglogistic <- fitLoglog$bic
        srvline$loglogistic <- 1 - pllogis(sqtime, shapeLoglogis, scale = scaleLoglogis)
        titl$loglogistic <- "Log-logistic"
      } else {
        fitLoglog <- survreg(Surv(times, cens) ~ 1, dist = "loglogistic")
        shapeLoglogis <- 1 / exp(unname(fitLoglog$icoef)[2])
        scaleLoglogis <- exp(unname(fitLoglog$icoef)[1])
        params$loglogistic <- c(shapeLoglogis, scaleLoglogis)
        names(params$loglogistic) <- c("shape", "scale")
        shapeLoglogisSE <- sqrt(fitLoglog$var[4])*exp(-unname(fitLoglog$icoef)[2])
        scaleLoglogisSE <- sqrt(fitLoglog$var[1])*exp(unname(fitLoglog$icoef)[1])
        se$loglogistic <- c(shapeLoglogisSE, scaleLoglogisSE)
        names(se$loglogistic) <- c("shape (se)", "scale (se)")
        aic$loglogistic <- 2*2 - 2*fitLoglog$loglik[1]
        bic$loglogistic <- log(length(times))*2 - 2*fitLoglog$loglik[1]
        srvline$loglogistic <- 1 - pllogis(sqtime, shapeLoglogis, scale = scaleLoglogis)
        titl$loglogistic <- "Log-logistic"
      }
    }, error = function(e) e)
  }
  if ("beta" %in% distributions) {
    tryCatch({
      aBeta <- betaLimits[1]
      bBeta <- betaLimits[2]
      if (bool_complete) {
        fitBeta <- fitdist((dd$left - aBeta) / (bBeta - aBeta), "beta")
      } else {
        fitBeta <- fitdistcens((dd - aBeta) / (bBeta - aBeta), "beta")
      }
      shape1Beta <- fitBeta$estimate[1]
      shape2Beta <- fitBeta$estimate[2]
      params$beta <- list(parameters = c(shape1Beta, shape2Beta),
                          domain = betaLimits)
      shape1BetaSE <- fitBeta$sd[1]
      shape2BetaSE <- fitBeta$sd[2]
      se$beta <- c(shape1BetaSE, shape2BetaSE)
      names(se$beta) <- c("shape1 (se)", "shape2 (se)")
      aic$beta <- fitBeta$aic
      bic$beta <- fitBeta$bic
      srvline$beta <- 1 - pbeta((sqtime - aBeta)/(bBeta - aBeta), shape1Beta,
                                shape2Beta)
      titl$beta <- "Beta"
    }, error = function(e) e)
  }
  output <- list(times = times, cens = cens, distributions = distributions,
                 params = params, se = se, aic = aic, bic = bic, survKM = survKM,
                 sqtime = sqtime, srvline = srvline, titl = titl,
                 colour = colour, ggp = ggp, m = m, prnt = prnt, degs = degs,
                 print.AIC = print.AIC, print.BIC = print.BIC)
  class(output) <- "kmPlot"
  print(output)
  plot(output)
}