In cwilso6/RMKL: Multiple Kernel Learning for Classification, Regression Problems, and Survival Settings

We will be mimicking example 1, two factors with a linear relationship with the hazard function $h(X) = X_1 + 2 X_2$, from 'Fenchel duality of Cox partial likelihood and its application in survival kernel learning', Wilson et al. (2020). Here is a quick example of how to run the code. The concordances for random survival forest, gradient boosting, and MKCox are printed; note that they are comparable. All of the machine learning methods are able to capture the linear relationship between the features and the hazard function, as shown in the scatterplots.

Loading data and plotting data

library(RMKL)
library(ggplot2)
library(survival)
library(gbm)
library(randomForestSRC)
library(kernlab)
# Load the example survival data set (presumably provided by RMKL) and
# preview its first rows.
data(Surv_data)
head(Surv_data)

# Scatterplot of the two features, coloured by the f.true column.
ggplot(data = Surv_data, mapping = aes(x = x1, y = x2, color = f.true)) +
  geom_point() +
  scale_color_gradient(low = "blue", high = "yellow") +
  labs(
    title = "True",
    x = expression(x[1]),
    y = expression(x[2]),
    color = "value"
  ) +
  theme_bw() +
  theme(
    legend.position = "right",
    plot.title = element_text(hjust = 0.5)
  )

Cox model

# Fit a Cox proportional hazards model on both features. The formula uses
# bare column names together with `data =` so that step() and predict() can
# re-evaluate the model terms against a data frame; with `Surv_data$x1` style
# terms the `newdata` passed to predict() cannot supply the covariates.
fit <- coxph(
  Surv(time, status) ~ x1 + x2,
  data = Surv_data,
  method = "breslow"
)

# Stepwise selection with a log(n) penalty per parameter. The result is kept
# for inspection only: the prediction and concordance below use `fit`.
fit2 <- step(fit, direction = "both", k = log(nrow(Surv_data)))

# Predictions from the full model for every row of the data.
cox_pred <- predict(fit, newdata = Surv_data[, c("x1", "x2")])
summary(fit)$concordance[1]
Surv_data$Cox <- cox_pred

ggplot(Surv_data, aes(x = x1, y = x2, color = Cox)) +
  geom_point() +
  scale_color_gradient(low = "blue", high = "yellow") +
  labs(
    x = expression(x[1]),
    y = expression(x[2]),
    color = "value",
    title = "Cox"
  ) +
  theme_bw() +
  theme(plot.title = element_text(hjust = 0.5), legend.position = "right")

Gradient Boosting

# Boosted Cox model on the two features.
gbm1 <- gbm(
  Surv(time, status) ~ x1 + x2, # formula
  data = Surv_data,             # dataset
  distribution = "coxph",
  n.trees = 1000,               # number of trees
  shrinkage = 0.005,            # learning rate, 0.001 to 0.1 usually work
  interaction.depth = 1,        # 1: additive model, 2: two-way interactions
  bag.fraction = 0.5,           # subsampling fraction, 0.5 is probably best
  train.fraction = 0.8,         # first train.fraction * N rows used for training
  cv.folds = 5,                 # do 5-fold cross-validation
  verbose = FALSE               # do not print progress
)
summary(gbm1)

# Number of trees selected from the cross-validation results.
best.iter <- gbm.perf(gbm1, method = "cv")

# Predict every row using the selected number of trees (passed by name so the
# call does not depend on argument position).
gpred2 <- predict(gbm1, Surv_data, n.trees = best.iter)
Surv_data$GBM <- gpred2

ggplot(Surv_data, aes(x = x1, y = x2, color = GBM)) +
  geom_point() +
  scale_color_gradient(low = "blue", high = "yellow") +
  labs(
    x = expression(x[1]),
    y = expression(x[2]),
    color = "value",
    title = "GBCox"
  ) +
  theme_bw() +
  theme(
    plot.title = element_text(hjust = 0.5),
    axis.title.y = element_text(angle = 0, vjust = 0.5),
    legend.position = "bottom"
  )

# Concordance of the boosted predictions; the element name is spelled out
# rather than relying on partial matching of `$con`.
# NOTE(review): survConcordance() is marked deprecated in recent survival
# releases in favour of concordance() -- confirm before migrating.
gbm.con <- survConcordance(Surv(time, status) ~ GBM, Surv_data)$concordance
gbm.con

Random Survival Forest

# Random survival forest on the two features.
modrf <- rfsrc(Surv(time, status) ~ x1 + x2, data = Surv_data, nsplit = 10)

# Out-of-bag predictions for every row of the data.
prerf <- predict(modrf, Surv_data, outcome = "test")$predicted.oob
Surv_data$RSF <- prerf

ggplot(Surv_data, aes(x = x1, y = x2, color = RSF)) +
  geom_point() +
  scale_color_gradient(low = "blue", high = "yellow") +
  labs(
    x = expression(x[1]),
    y = expression(x[2]),
    color = "value",
    title = "RSF"
  ) +
  theme_bw() +
  theme(
    plot.title = element_text(hjust = 0.5),
    axis.title.y = element_text(angle = 0, vjust = 0.5),
    legend.position = "bottom"
  )

# Concordance of the forest predictions; the element name is spelled out
# rather than relying on partial matching of `$con`.
RSF.con <- survConcordance(Surv(time, status) ~ RSF, Surv_data)$concordance
RSF.con

Run ELM model

# Extreme learning machine Cox model on the two features.
# NOTE(review): ELMCox() does not appear to come from any package attached
# above; presumably it is provided by SurvELM -- confirm and attach that
# package before running this chunk.
modelm <- ELMCox(Surv_data[, 1:2], Surv(Surv_data$time, Surv_data$status))
ypreelm <- predict(modelm, Surv_data[, 1:2])
Surv_data$ELM <- ypreelm

# Concordance of the ELM predictions (element name spelled out instead of
# relying on partial matching of `$con`).
survConcordance(Surv(time, status) ~ ELM, data = Surv_data)$concordance

ggplot(Surv_data, aes(x = x1, y = x2, color = ELM)) +
  geom_point() +
  scale_color_gradient(low = "blue", high = "yellow") +
  labs(
    x = expression(x[1]),
    y = expression(x[2]),
    color = "value",
    title = "ELM"
  ) +
  theme_bw() +
  theme(
    plot.title = element_text(hjust = 0.5),
    axis.title.y = element_text(angle = 0, vjust = 0.5),
    legend.position = "bottom"
  )

#MKCox
```r
# Getting survival times in ascending order
ordtr <- order(Surv_data$time)
Surv_data_ordered <- Surv_data[ordtr, ]

xx <- Surv_data_ordered[, 1:2]
del <- Surv_data_ordered$status
yy <- Surv_data_ordered$time

# Drop any leading censored rows so the earliest retained time is an event.
# `del == 1` works for both logical and 0/1 numeric status, whereas
# which(del) fails on a numeric vector.
first1 <- which(del == 1)[1]
if (is.na(first1)) {
  stop("Surv_data contains no observed events", call. = FALSE)
}
if (first1 > 1) {
  keep <- seq.int(first1, length(yy))
  xx <- xx[keep, ]
  yy <- yy[keep]
  del <- del[keep]
}
nn <- length(yy)

# Starting value passed as `rho`; it must have one entry per retained
# (ordered) training row, so it is built from `del` and `nn`.
rho0 <- 0.001 * (del - seq(0, 10, length.out = nn))

# Training kernels (radial and linear) computed on the ordered rows.
klist <- list(
  kernelMatrix(rbfdot(1), as.matrix(xx)),
  kernelMatrix(vanilladot(), as.matrix(xx))
)
# Cross kernels between the ordered training rows and every row of Surv_data
# in its original order, so predictions line up with Surv_data.
ktlist <- list(
  kernelMatrix(rbfdot(1), as.matrix(xx), as.matrix(Surv_data[, 1:2])),
  kernelMatrix(vanilladot(), as.matrix(xx), as.matrix(Surv_data[, 1:2]))
)
# Stack each list of matrices into a 3-d array, one slice per kernel.
kk <- simplify2array(klist)
kkk <- simplify2array(ktlist)

# Fit on the ordered times/status so that y, del, rho and the rows of K all
# refer to the same observations in the same order.
modmkl <- SurvMKL(
  y = yy, del = del, K = kk, rho = rho0,
  C = 0.005, lambda = 0.5, maxiter = 500, cri = 0.01
)
mkl <- predict_Surv(modmkl, kkk)
Surv_data$MKCox <- mkl

ggplot(Surv_data, aes(x = x1, y = x2, color = MKCox)) +
  geom_point() +
  scale_color_gradient(low = "blue", high = "yellow") +
  labs(
    x = expression(x[1]),
    y = expression(x[2]),
    color = "value",
    title = "MKCox"
  ) +
  theme_bw() +
  theme(
    plot.title = element_text(hjust = 0.5),
    axis.title.y = element_text(angle = 0, vjust = 0.5),
    legend.position = "bottom"
  )

# Concordance of the MKCox predictions (element name spelled out instead of
# relying on partial matching of `$con`).
MKCox.con <- survConcordance(Surv(time, status) ~ MKCox, Surv_data)$concordance
MKCox.con

cwilso6/RMKL documentation built on May 18, 2021, 9:58 a.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

cwilso6/RMKL
Multiple Kernel Learning for Classification, Regression Problems, and Survival Settings

In cwilso6/RMKL: Multiple Kernel Learning for Classification, Regression Problems, and Survival Settings

Loading data and plotting data

Cox model

Gradient Boosting

Random Survival Forest

Run ELM model

R Package Documentation

Browse R Packages

We want your feedback!

cwilso6/RMKL Multiple Kernel Learning for Classification, Regression Problems, and Survival Settings

In cwilso6/RMKL: Multiple Kernel Learning for Classification, Regression Problems, and Survival Settings

Loading data and plotting data

Cox model

Gradient Boosting

Random Survival Forest

Run ELM model

R Package Documentation

Browse R Packages

We want your feedback!

cwilso6/RMKL
Multiple Kernel Learning for Classification, Regression Problems, and Survival Settings