# inst/data_scripts/khan-2001/2-clean.r

# Clean the Khan data set shipped with the 'pamr' package.
#
# After this script runs, `khan` is a list with two elements:
#   x - numeric matrix with one row per sample and one column per gene;
#       columns are named from the first column of the raw table
#   y - factor of class labels, one per sample
# `gene_names`, `x` and `y` are also left in the calling environment.

library("pamr")
data("khan")

# The first two columns of the raw Khan table hold meta data that is not
# directly useful for classification. We keep the first column for naming the
# genes and drop both columns from the measurements.
gene_names <- khan[, 1]

# Transpose so that samples run along the rows. Because the raw columns mix
# labels and measurements, the transposed matrix is not numeric yet.
khan <- t(khan[, -(1:2)])
dimnames(khan) <- NULL

# After transposing, the first column (the first row of the raw table) is
# used as the class label of each sample.
y <- factor(as.vector(khan[, 1]))

# The remaining columns are the measurements. `drop = FALSE` keeps the matrix
# shape even if only a single sample or gene remains.
x <- khan[, -1, drop = FALSE]

# Convert the entries to doubles; `storage.mode<-` preserves `dim`.
storage.mode(x) <- "double"

# Skip the first entry of `gene_names`: it belongs to the class-label row
# extracted above, not to a gene.
colnames(x) <- as.character(gene_names[-1])

khan <- list(x = x, y = y)
# ramhiser/datamicroarray documentation built on May 26, 2019, 10:07 p.m.