R/preprocess.R

Defines functions cut_dat

Documented in cut_dat

cut_dat <- function(cut, data, var_randT=NULL, var_followT=NULL, var_followT_abs=NULL, var_censor=NULL,
                    var_event=NULL, var_censor_reason='status_at_end'){
  var <- c(var_followT, var_followT_abs, var_censor, var_event)
  if (!is.null(var)){
    notin <- var[!(var %in% colnames(data))]
    if (length(notin)!=0){
      stop(paste0('Variable ',notin, ' is/are not in the column names of the dataset.'))
    }
  }
  if (!(var_censor_reason %in% colnames(data))){
    warning(paste0('Censor reason variable ',var_censor_reason, ' is not in the column names of the dataset. We will create this variable.'))
    data[,var_censor_reason] <- NA
  }
  # cut is the absolute time from the beginning of the trial
  var_randT_missing <- FALSE
  if (is.null(var_randT)){
    var_randT <- paste0(sample(LETTERS, 64, replace = T), collapse = '')
    data[,var_randT] <- 0
    var_randT_missing <- TRUE
    warning('\'var_randT\' is missing. Treat all subjects randomized at time=0.')
  }
  train <- data[data[var_randT] <= cut,,drop=F]
  if (!is.null(var_censor_reason)){
    if (!is.null(var_followT)){
      followT_abs <- train[var_randT]+train[var_followT]
      train[var_censor_reason][followT_abs > cut] <- 'cut'
    }else if (!is.null(var_followT_abs)){
      train[var_censor_reason][train[var_followT_abs] > cut] <- 'cut'
    }else{
      stop('\'var_followT\' or \'var_followT_abs\' must be provided to update var_censor_reason.')
    }
  }
  if (!is.null(var_censor)){
    if (!is.null(var_followT)){
      followT_abs <- train[var_randT]+train[var_followT]
      train[var_censor][followT_abs > cut] <- 1
    }else if (!is.null(var_followT_abs)){
      train[var_censor][train[var_followT_abs] > cut] <- 1
    }else{
      stop('\'var_followT\' or \'var_followT_abs\' must be provided to update var_censor')
    }
  }
  if (!is.null(var_event)){
    if (!is.null(var_followT)){
      followT_abs <- train[var_randT]+train[var_followT]
      train[var_event][followT_abs > cut] <- 0
    }else if (!is.null(var_followT_abs)){
      train[var_event][train[var_followT_abs] > cut] <- 0
    }else{
      stop('\'var_followT\' or \'var_followT_abs\' must be provided to update var_event.')
    }
  }
  if (!is.null(var_followT_abs)){
    train[var_followT_abs][train[var_followT_abs] > cut] <- cut
  }
  if (!is.null(var_followT)){
    followT_abs <- train[var_randT]+train[var_followT]
    followT_abs[followT_abs > cut] <- cut
    train[var_followT] <- followT_abs-train[var_randT]
  }
  if (var_randT_missing){
    train <- train[, !(colnames(train)==var_randT)]
  }
  return(train)
}

# tran_censor <- function(dat){
#   dat$event <- ifelse(dat$censor_reason=='censored', 1, 0)
#   dat$event[is.na(dat$event)] <- 0
#   return(dat)
# }

Try the PWEXP package in your browser

Any scripts or data that you put into this service are public.

PWEXP documentation built on May 29, 2024, 2:19 a.m.