R/runRandomForest.R

Defines functions runRandomForest

Documented in runRandomForest

#' runRandomForest
#' 
#' This function takes the output of iterVarSelRF and runs a random forest. 
#' 
#' @param indVar independent variables
#' @param depVar dependent variable
#' @param ntree to be passed to randomForest.  Had trouble getting ... to work with the snowfall wrapper 
#'              function.  This was a quick hack.
#' @param importance  to be passed to randomForest.  Had trouble getting ... to work with the snowfall wrapper 
#'                    function.  This was a quick hack.
#' @param proximity to be passed to randomForest.  Had trouble getting ... to work with the snowfall wrapper 
#'                  function.  This was a quick hack.
#' 
#' @examples
#' data(LakeTrophicModelling)
#' x2<-iterVarSelRF(ltmData[predictors_gis],ltmData$TS_CHLA_4,10,4,ntree=10,ntreeIterat=5,
#' vars.drop.frac=NULL,vars.drop.num=1,time=FALSE)
#' x2_vars<-unique(unlist(x2))
#' gis_ts4_rf<-runRandomForest(ltmData[x2_vars],ltmData$TS_CHLA_4, ntree=10,importance=TRUE,proximity=TRUE)
#' @export
#' @import randomForest
runRandomForest <- function(indVar, depVar, ntree = 100, 
    importance = TRUE, proximity = TRUE) {
    
    # Only Pass Complete Cases
    comp_case <- complete.cases(indVar, depVar)
    if (length(indVar) > 1) {
        indVar <- indVar[comp_case, ]
    } else {
        indVar <- indVar[comp_case]
    }
    depVar <- depVar[comp_case]
    
    
    return(randomForest(indVar, depVar, ntree = ntree, 
        importance = importance, proximity = proximity))
    
} 
USEPA/LakeTrophicModelling documentation built on Oct. 15, 2020, 4:13 p.m.