# Copyright (C) 2016 Johannes Rueckert
#
# This file is part of darch.
#
# darch is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# darch is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with darch. If not, see <http://www.gnu.org/licenses/>.
#' Split a data set into bootstrap training and validation parts
#'
#' Draws row indices from \code{dataSet@data} to form the training part and
#' uses every row that was not drawn as the validation part. The same row
#' indices are applied to \code{dataSet@targets}.
#'
#' @param dataSet S4 object with \code{data} and \code{targets} slots, both
#'   indexable by row with two-dimensional \code{[} indexing.
#' @param unique Logical scalar. If \code{TRUE} and \code{num} is 0, rows drawn
#'   more than once are kept only once in the training part.
#' @param num Number of training rows to draw. If greater than 0, exactly
#'   \code{num} rows are drawn without replacement (so \code{unique} has no
#'   effect). If 0 (the default), as many rows as the data set contains are
#'   drawn with replacement.
#' @return Unnamed list of length two: the training data set followed by the
#'   validation data set, both of the same class as \code{dataSet}.
bootstrapDataSet <- function(dataSet, unique, num = 0)
{
  numRows <- nrow(dataSet@data)
  fixedSize <- num > 0

  # Sampling without replacement cannot yield more rows than exist; fail early
  # with a message that names the sizes involved.
  if (fixedSize && num > numRows)
  {
    stop("Cannot draw ", num, " bootstrap samples without replacement from ",
      numRows, " rows.", call. = FALSE)
  }

  # sample.int() is well-defined for zero rows, unlike sampling from 1:numRows,
  # which would be c(1, 0) for an empty data set.
  bootstrapTrainingSamples <- sample.int(numRows,
    size = if (fixedSize) num else numRows,
    replace = !fixedSize)

  if (unique && num == 0)
  {
    # Keep the first occurrence of every drawn row, preserving draw order.
    bootstrapTrainingSamples <-
      bootstrapTrainingSamples[!duplicated(bootstrapTrainingSamples)]
  }

  numTrain <- length(bootstrapTrainingSamples)

  # Every row that was never drawn goes to the validation part.
  bootstrapValidationSamples <-
    setdiff(seq_len(numRows), bootstrapTrainingSamples)
  numValid <- length(bootstrapValidationSamples)

  # TODO validate sizes (e.g. an empty validation part)?
  dataSetValid <- dataSet

  dataSet@data <- dataSet@data[bootstrapTrainingSamples, , drop = FALSE]
  dataSet@targets <- dataSet@targets[bootstrapTrainingSamples, , drop = FALSE]

  dataSetValid@data <-
    dataSetValid@data[bootstrapValidationSamples, , drop = FALSE]
  dataSetValid@targets <-
    dataSetValid@targets[bootstrapValidationSamples, , drop = FALSE]

  # The number of distinct training rows equals all rows minus the rows that
  # ended up in the validation part.
  futile.logger::flog.info(paste(
    "Bootstrapping is started with %s samples, bootstrapping results in",
    "%s training (%s unique) and %s validation samples for this run."),
    numRows, numTrain, numRows - numValid, numValid)

  list(dataSet, dataSetValid)
}
# Add the following code to your website.
# For more information on customizing the embed code, read Embedding Snippets.