R/rxHexBin.R

#
# RevoEnhancements/R/rxHexBin.R by Derek Norton and Andrie de Vries
#
# Copyright 2013 Revolution Analytics
#    
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
# 
#      http://www.apache.org/licenses/LICENSE-2.0
# 
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, 
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.


#' Creates hexbin summaries.
#' 
#' @param formula formula
#' @param data xdf file
#' @param shape shape parameter, passed to \code{\link[hexbin]{hexbin}}
#' @param xbins Number of xbins, passed to \code{\link[hexbin]{hexbin}}
#' @param ... Other arguments, passed to \code{\link[RevoScaleR]{rxDataStep}}
#' @importFrom hexbin hexbin
#' @export
#' @family Plotting functions
#' @examples
#' # Load the Airlines Data
#' library(RevoScaleR)
#' working.file <- file.path(rxGetOption("sampleDataDir"), "AirlineDemoSmall.xdf")
#' 
#' library(RevoScaleR)
#' library(hexbin)
#' bin1 <- rxHexBin(ArrDelay ~ CRSDepTime, working.file, xbins = 50)
#' plot(bin1, lcex=.5, border = TRUE, colramp = BTC)
#' plot(bin1, style="colorscale")
#' plot(bin1, style="centroids")
#' plot(bin1, style="lattice")
#' 
#' library(ggplot2)
#' ggbin <- data.frame(
#'   hcell2xy(bin1), 
#'   count = bin1@@count, 
#'   density = bin1@@count / sum(bin1@@count, na.rm=TRUE)
#' )
#' p2 <- ggplot(data = ggbin, aes(x, y, fill = count))
#' p2 + geom_hex(stat="identity", nbins = 100) + 
#'   guides(fill = guide_colorbar(ticks = FALSE, label.theme = element_text(size = 8, angle = 0))) + 
#'   labs(x = "CRSDepTime", y = "ArrDelay")
rxHexBin <- function (formula, data, shape = 1, xbins = 30, ...) {
  
  if (length(formula) != 3) stop("Two Variables Are Required in the Formula")
  call <- match.call()
	## Function for creating/updating hexbin objects.
  hexBinTransform <- function(dataList) {
    # Trick to pass R CMD check: create and remove variables without binding
    .rxGet <- .rxSet <- function() {}
    rm(.rxGet, .rxSet)
    myXbnds <- myYbnds <- xvar <- yvar <- numeric()
    rm(myXbnds, myYbnds, xvar, yvar)
    
    hex1 <- .rxGet("hex1")
    hex2 <- hexbin(dataList[[xvar]], dataList[[yvar]], 
                    xbnds=myXbnds, ybnds=myYbnds,
                    xbins = hex1@xbins, shape = hex1@shape,)
    myDf <- data.frame(xcm = c(hex1@xcm, hex2@xcm) * c(hex1@count, hex2@count), 
                        ycm = c(hex1@ycm, hex2@ycm) * c(hex1@count, hex2@count),
                        count = c(hex1@count, hex2@count))
    res <- aggregate(myDf, 
                    list(cell = c(hex1@cell, hex2@cell)), 
                    sum, na.rm = TRUE)
	  hex1@count <- res[, "count"]
	  hex1@cell <- res[, "cell"]
    hex1@xcm <- res[, "xcm"] / res[, "count"]
    hex1@ycm <- res[, "ycm"] / res[, "count"]
    .rxSet("hex1", hex1)
    return(NULL)
	}
	## Create metadata
	dataInfo <- rxGetInfoXdf(data, getVarInfo = TRUE)
	plotVars <- all.vars(formula)
	x <- plotVars[-1][1] # what if longer than 1
	y <- plotVars[1]
	xbnds <- c(dataInfo$varInfo[[x]][["low"]], dataInfo$varInfo[[x]][["high"]])
  ybnds <- c(dataInfo$varInfo[[y]][["low"]], dataInfo$varInfo[[y]][["high"]])
  startHex <- hexbin(x = xbnds[1], y = ybnds[1], xbins = xbins, shape = shape,
                      xbnds = xbnds, ybnds = ybnds, xlab = x, ylab = y)
  startHex@count <- NA_integer_
  startHex@cell <- NA_integer_
  startHex@xcm <- NA_real_
  startHex@ycm <- NA_real_
	resHexBin <- rxDataStep(inData = data, varsToKeep = plotVars, 
                          transformFunc = hexBinTransform, 
                          transformObjects = list(hex1 = startHex, 
                            xvar = x, yvar = y, 
                            myXbnds = xbnds, myYbnds = ybnds), 
                          transformPackages = c("hexbin"),
                          returnTransformObjects = TRUE, ...)$hex1
  resHexBin@ncells <- length(resHexBin@count)
  resHexBin@n <- sum(resHexBin@count, na.rm = TRUE)
  resHexBin@call <- call
	return(resHexBin)
}
RevoEnhancements/RevoEnhancements documentation built on May 9, 2019, 9:46 a.m.