# R/train_dnn.R
# In deeplearning: An Implementation of Deep Neural Network for Regression and Classification

#' Train a deep neural network
#'
#' This function trains a deep neural network
#'
#' @param darch a darch instance
#' @param input input data for training
#' @param target target data for training
#' @param input_valid input data for validation
#' @param target_valid target data for validation
#' @param ... additional input
#' @param learn_rate_weight learning rate for the weight matrices
#' @param learn_rate_bias learning rate for the biases
#' @param learn_rate_gamma learning rate for the gamma
#' @param batch_size batch size during training
#' @param batch_normalization logical value that determines whether to turn on
#'  batch normalization during training. Recommended value: TRUE
#' @param dropout_input dropout ratio at input layer. Recommended value: 0.2
#' @param dropout_hidden dropout ratio at hidden layers. Recommended value: 0.5
#' @param momentum_initial momentum ratio during training. Recommended value: 0.6
#' @param momentum_final final momentum during training. Recommended value: 0.9
#' @param momentum_switch the epoch after which the final momentum ratio is used during training
#' @param num_epochs number of iterations of the training
#' @param error_function error function to minimize during training
#' @param report_classification_error logical value. T to report the classification error
#'  during training
#'
#' @importFrom darch createDataSet validateDataSet getEpochs
#' @importFrom stats predict
#'
#' @examples
#' # Example of Regression
#'
#' input <- matrix(runif(1000), 500, 2)
#' input_valid <- matrix(runif(100), 50, 2)
#' target <- rowSums(input + input^2)
#' target_valid <- rowSums(input_valid + input_valid^2)
#' # create a new deep neural network for regression
#' dnn_regression <- new_dnn(
#'  c(2, 50, 50, 20, 1),  # The layer structure of the deep neural network.
#'  # The first element is the number of input variables.
#'  # The last element is the number of output variables.
#'  hidden_layer_default = rectified_linear_unit_function,
#'  # for hidden layers, use rectified_linear_unit_function
#'  output_layer_default = linearUnitDerivative
#'  # for regression, use linearUnitDerivative function
#')
#'
#'  dnn_regression <- train_dnn(
#'  dnn_regression,
#'
#'  # training data
#'  input, # input variable for training
#'  target, # target variable for training
#'  input_valid, # input variable for validation
#'  target_valid, # target variable for validation
#'
#'  # training parameters
#'  learn_rate_weight = exp(-8) * 10,
#'  # learning rate for weights, higher if use dropout
#'  learn_rate_bias = exp(-8) * 10,
#'  # learning rate for biases, higher if using dropout
#'  learn_rate_gamma = exp(-8) * 10,
#'  # learning rate for the gamma factor used
#'  batch_size = 10,
#'  # number of observations in a batch during training.
#'  # Higher for faster training. Lower for faster convergence
#'  batch_normalization = TRUE,
#'  # logical value, T to use batch normalization
#'  dropout_input = 0.2,
#'   # dropout ratio in input.
#'  dropout_hidden = 0.5,
#'  # dropout ratio in hidden layers
#'  momentum_initial = 0.6,
#'  # initial momentum in Stochastic Gradient Descent training
#'  momentum_final = 0.9,
#'  # final momentum in Stochastic Gradient Descent training
#'  momentum_switch = 100,
#'  # after which the momentum is switched from initial to final momentum
#'  num_epochs = 5,
#'   # number of iterations in training
#'   # increase the number of epochs to 100 for better model fit
#'
#'
#'  # Error function
#'  error_function = meanSquareErr,
#'  # error function to minimize during training. For regression, use meanSquareErr
#'  report_classification_error = FALSE
#'  # whether to print classification error during training
#')
#'
#'
#' # the prediction by dnn_regression
#' pred <- predict(dnn_regression)
#'
#' # calculate the r-squared of the prediction
#' rsq(dnn_regression)
#'
#'
#' # calculate the r-squared of the prediction in validation
#' rsq(dnn_regression, input = input_valid, target = target_valid)
#'
#' # print the layer weights
#' # this function can print heatmap, histogram, or a surface
#' print_weight(dnn_regression, 1, type = "heatmap")
#'
#' print_weight(dnn_regression, 2, type = "surface")
#'
#' print_weight(dnn_regression, 3, type = "histogram")
#'
#'
#' # Examples of classification
#'
#'input <- matrix(runif(1000), 500, 2)
#'input_valid <- matrix(runif(100), 50, 2)
#'target <- (cos(rowSums(input + input^2)) > 0.5) * 1
#'target_valid <- (cos(rowSums(input_valid + input_valid^2)) > 0.5) * 1
#'
#'# create a new deep neural network for classification
#'dnn_classification <- new_dnn(
#'  c(2, 50, 50, 20, 1),  # The layer structure of the deep neural network.
#'  # The first element is the number of input variables.
#'  # The last element is the number of output variables.
#'  hidden_layer_default = rectified_linear_unit_function,
#'  # for hidden layers, use rectified_linear_unit_function
#'  output_layer_default = sigmoidUnitDerivative
#'  # for classification, use sigmoidUnitDerivative function
#')
#'
#'dnn_classification <- train_dnn(
#'  dnn_classification,
#'
#'  # training data
#'  input, # input variable for training
#'  target, # target variable for training
#'  input_valid, # input variable for validation
#'  target_valid, # target variable for validation
#'
#'  # training parameters
#'  learn_rate_weight = exp(-8) * 10,
#'  # learning rate for weights, higher if use dropout
#'  learn_rate_bias = exp(-8) * 10,
#'  # learning rate for biases, higher if using dropout
#'  learn_rate_gamma = exp(-8) * 10,
#'  # learning rate for the gamma factor used
#'  batch_size = 10,
#'  # number of observations in a batch during training.
#'  # Higher for faster training. Lower for faster convergence
#'  batch_normalization = TRUE,
#'  # logical value, T to use batch normalization
#'  dropout_input = 0.2,
#'  # dropout ratio in input.
#'  dropout_hidden = 0.5,
#'  # dropout ratio in hidden layers
#'  momentum_initial = 0.6,
#'  # initial momentum in Stochastic Gradient Descent training
#'  momentum_final = 0.9,
#'  # final momentum in Stochastic Gradient Descent training
#'  momentum_switch = 100,
#'  # after which the momentum is switched from initial to final momentum
#'  num_epochs = 5,
#'  # number of iterations in training
#'  # increase num_epochs to 100 for better model fit
#'
#'  # Error function
#'  error_function = crossEntropyErr,
#'  # error function to minimize during training. For classification, use crossEntropyErr
#'  report_classification_error = TRUE
#'  # whether to print classification error during training
#')
#'
#'# the prediction by dnn_classification
#'pred <- predict(dnn_classification)
#'
#'hist(pred)
#'
#'# calculate the AR metric of the prediction
#'AR(dnn_classification)
#'
#'# calculate the AR metric of the prediction in validation
#'AR(dnn_classification, input = input_valid, target = target_valid)
#'
#'
#' @return a trained deep neural network (darch instance)
#' @export
#'

train_dnn <- function(darch, # darch instance to train
                      input, # input data matrix
                      target, # target data matrix
                      input_valid = NULL, # validation data input
                      target_valid = NULL, # validation data target
                      ...,
                      # training parameters
                      learn_rate_weight = exp(-10),
                      learn_rate_bias = exp(-10),
                      learn_rate_gamma = 1,
                      batch_size = 10,
                      batch_normalization = TRUE,
                      dropout_input = 0,
                      dropout_hidden = 0,
                      momentum_initial = .6,
                      momentum_final = .9,
                      momentum_switch = 100,
                      num_epochs = 0,

                      # target types
                      error_function = meanSquareErr,
                      report_classification_error = FALSE
) {
  # Overview: for each of `num_epochs` epochs the training rows are split into
  # random mini-batches (make_batches), a fresh dropout mask is generated and
  # finetune_SGD_bn is called once per batch. After every epoch the training
  # (and, if supplied, validation) error is logged and appended to
  # darch@stats, and darch@epochs is incremented. The elapsed wall-clock time
  # in seconds is accumulated in darch@stats[["times"]].
  #
  # NOTE(review): `...`, momentum_initial, momentum_final and momentum_switch
  # are accepted but never read in this function body.

  # 1. set up the inputs
  timeStart <- Sys.time()
  dataSet <- createDataSet(input, target)
  darch@dataSet <- dataSet # add the training dataset to the darch instance

  # Create the statistics container if the darch instance has none yet.
  if (is.null(darch@stats) || length(darch@stats) < 1) {
    darch@stats <-
      list("dataErrors" = list("raw" = c(), "class" = c()),
           "validErrors" = list("raw" = c(), "class" = c()),
           "times" = 0)
  }

  trainData <- as.matrix(input)
  trainTarget <- as.matrix(target)

  if (!is.null(input_valid)) {
    # Fail with a clear message instead of an obscure coercion error when
    # validation inputs are supplied without matching targets.
    if (is.null(target_valid)) {
      stop("Invalid validation dataset: target_valid is missing.")
    }
    validData <- as.matrix(input_valid)
    validTarget <- as.matrix(target_valid)
  } else {
    validData <- NULL
    validTarget <- NULL
  }

  if (!validateDataSet(dataSet, darch)) {
    stop("Invalid dataset provided.")
  }

  # Validation data must have the same number of input and target columns as
  # the training data. `||` is used because this is a scalar condition.
  if (!is.null(validData)) {
    if (ncol(trainData) != ncol(validData) ||
        ncol(trainTarget) != ncol(validTarget)) {
      stop("Invalid validation dataset.")
    }
  }

  # 2. train the neural net
  flog.info("Start training the neural net.")
  start_epoch <- getEpochs(darch)
  flog.info(paste("The neural net has been trained ", start_epoch, " times."))

  # seq_len() yields an empty sequence for num_epochs = 0 (the default), so no
  # epoch is run; `a:b` would count backwards and run two epochs instead.
  for (epoch in start_epoch + seq_len(max(num_epochs, 0))) {
    flog.info(paste("Epoch numebr: ", epoch))

    # make the batches: column 2 holds the batch id of each training row
    batch <- make_batches(nrow(trainData), batch_size)
    num_batches <- max(batch[, 2])

    for (i in seq_len(num_batches)) {
      in_batch <- batch[, 2] == i
      # Generate a new dropout mask for each batch
      darch <- generateDropoutMasksForDarch(darch, dropout_input, dropout_hidden)
      # Train the neural net
      # NOTE(review): `[in_batch, ]` drops to a plain vector when the batch has
      # a single row or the matrix a single column; confirm finetune_SGD_bn
      # accepts that before adding `drop = FALSE` here.
      darch <- finetune_SGD_bn(darch,
                               trainData[in_batch, ],
                               trainTarget[in_batch, ],
                               learn_rate_weight = learn_rate_weight,
                               learn_rate_bias = learn_rate_bias,
                               learn_rate_gamma = learn_rate_gamma,
                               errorFunc = error_function,
                               with_BN = batch_normalization
                               )
    }

    # calculates the new mu and sigma of darch
    if (batch_normalization) {
      darch <- calcualte_population_mu_sigma(darch, trainData)
    } else {
      darch <- reset_population_mu_sigma(darch)
    }

    # calculates the errors; element 1 of the error function's result is used
    # as the error value and element 3 as its label in the log line

    # training errors
    pred_train <- predict(darch, newdata = trainData)
    error_train <- error_function(pred_train, trainTarget)
    flog.info(paste(error_train[[3]], "in training:  ", error_train[[1]]))
    darch@stats$dataErrors$raw <- c(darch@stats$dataErrors$raw, error_train[[1]])

    if (report_classification_error) {
      ce_train <- classification_error(pred_train, trainTarget)
      flog.info(paste(ce_train[[2]], "in training:  ", ce_train[[1]]))
      darch@stats$dataErrors$class <- c(darch@stats$dataErrors$class, ce_train[[1]])
    }

    # validation errors
    if (!is.null(validData)) {
      pred_valid <- predict(darch, newdata = validData)
      error_valid <- error_function(pred_valid, validTarget)
      flog.info(paste(error_valid[[3]],  "in validation:", error_valid[[1]]))
      darch@stats$validErrors$raw <- c(darch@stats$validErrors$raw, error_valid[[1]])

      if (report_classification_error) {
        ce_valid <- classification_error(pred_valid, validTarget)
        flog.info(paste(ce_valid[[2]], "in validation:", ce_valid[[1]]))
        darch@stats$validErrors$class <- c(darch@stats$validErrors$class, ce_valid[[1]])
      }
    }
    # increase the epoch by 1
    darch@epochs <- darch@epochs + 1
  }
  flog.info("End of the training")

  # 3. Save the training statistics
  # A pre-existing stats list may lack the "times" entry, so default it to 0
  # before accumulating.
  if (is.null(darch@stats[["times"]])) {
    darch@stats[["times"]] <- 0
  }
  elapsed_secs <- as.double(Sys.time() - timeStart, units = "secs")
  darch@stats[["times"]] <- darch@stats[["times"]] + elapsed_secs

  darch
}

# Helper function for train_dnn
#
# Randomly assigns each of `numObs` observations to one of
# ceiling(numObs / batchsize) mini-batches of near-equal size.
#
# Arguments:
#   numObs    number of observations to distribute
#   batchsize requested number of observations per batch
#
# Returns a numeric matrix with one row per observation, sorted by
# observation index, and two columns:
#   "order"  the observation index (1..numObs)
#   "group"  the batch id (1..num_batches) assigned to that observation
# The result is always a matrix, including for numObs == 1 (one row) and
# numObs == 0 (zero rows).
make_batches <- function(numObs, batchsize) {
  num_batches <- ceiling(numObs / batchsize)

  # Random permutation of the observation indices; position k of the
  # permutation receives the k-th cyclic batch label below.
  shuffled <- sample.int(numObs)

  # Cyclic labels 2, 3, ..., num_batches, 1, 2, ... computed in one vectorized
  # step instead of growing a vector inside a loop.
  group <- seq_len(numObs) %% num_batches + 1

  batch <- cbind(order = shuffled, group = group)

  # Sort rows by observation index. drop = FALSE keeps the matrix shape when
  # there is a single observation, so callers can still index `batch[, 2]`.
  batch[order(shuffled), , drop = FALSE]
}
# Any scripts or data that you put into this service are public.
# deeplearning documentation built on Jan. 15, 2017, 9:52 a.m.
# rdrr.io home R language documentation Run R code online
# CRAN packages Bioconductor packages R-Forge packages GitHub packages
# Note that we can't provide technical support on individual packages. You should contact the package authors for that.
# deeplearning
# An Implementation of Deep Neural Network for Regression and Classification

# R/train_dnn.R
# In deeplearning: An Implementation of Deep Neural Network for Regression and Classification

# Try the deeplearning package in your browser

# R Package Documentation

# Browse R Packages

# We want your feedback!

# deeplearning An Implementation of Deep Neural Network for Regression and Classification

# R/train_dnn.R In deeplearning: An Implementation of Deep Neural Network for Regression and Classification

# Try the deeplearning package in your browser

# R Package Documentation

# Browse R Packages

# We want your feedback!

# deeplearning
# An Implementation of Deep Neural Network for Regression and Classification

# R/train_dnn.R
# In deeplearning: An Implementation of Deep Neural Network for Regression and Classification