#' Get the last month and day of the year
#'
#' Get the last month and day of the year as a character sting, separated by
#' the specified separator.
#'
#' This is a utility function necessitated by 360-day calendars. Works on PCICt objects.
#'
#' @param d An exemplar date.
#' @param sep Separator to use.
#' @return A string (like "12-30", or "12-31")
#'
#' @examples
#' library(PCICt)
#' last.mday <- get.last.monthday.of.year(as.PCICt("2011-01-01", cal="360"))
#'
#' @export
get.last.monthday.of.year <- function(d, sep="-") {
if(!is.null(attr(d, "months"))) paste("12", attr(d, "months")[12], sep=sep) else paste("12", "31", sep=sep)
}
## Lower overhead version of tapply
tapply.fast <- function (X, INDEX, FUN = NULL, ..., simplify = TRUE) {
FUN <- if (!is.null(FUN))
match.fun(FUN)
if(!is.factor(INDEX))
stop("INDEX must be a factor.")
if (length(INDEX) != length(X))
stop("arguments must have same length")
if (is.null(FUN))
return(INDEX)
namelist <- levels(INDEX)
ans <- lapply(split(X, INDEX), FUN, ...)
ans <- unlist(ans, recursive = FALSE)
names(ans) <- levels(INDEX)
return(ans)
}
## Returns PCICt field or dies
get.date.field <- function(input.data, cal, date.types) {
valid.date.types <- sapply(date.types, function(x) { return(!inherits(try(input.data[,x$fields], silent=TRUE), "try-error")) })
if(sum(valid.date.types) == 0) {
stop("Could not find a workable set of date fields")
}
date.type <- date.types[[which(valid.date.types)[1]]]
date.strings <- do.call(paste, input.data[,date.type$fields])
return(as.PCICt(date.strings, format=date.type$format, cal=cal))
}
## Creates a filled series given the data, dates, and new date sequence to be used.
create.filled.series <- function(data, data.dates, new.date.sequence) {
new.data <- rep(NA, length(new.date.sequence))
data.in.new.data <- (data.dates >= new.date.sequence[1]) & (data.dates <= new.date.sequence[length(new.date.sequence)])
indices <- floor(as.numeric(data.dates[data.in.new.data] - new.date.sequence[1], units="days")) + 1
new.data[indices] <- data[data.in.new.data]
return(new.data)
}
## Get julian day of year
get.jdays <- function(dates) {
return(as.POSIXlt(dates)$yday + 1)
}
## Get year
get.years <- function(dates) {
return(as.POSIXlt(dates)$year + 1900)
}
## Get month number
get.months <- function(dates) {
return(as.POSIXlt(dates)$mon + 1)
}
## Juggle the list so that day 366 == day 365
get.jdays.replaced.feb29 <- function(jdays) {
indices <- which(jdays == 366)
if(length(indices) > 0)
jdays[rep(indices, each=366) + -365:0] <- c(1:59, 59, 60:365)
jdays
}
## Get NA mask given threshold and split factor
get.na.mask <- function(x, f, threshold) {
return(c(1, NA)[1 + as.numeric(tapply.fast(is.na(x), f, function(y) { return(sum(y) > threshold) } ))])
}
## Get number of days within range
get.num.days.in.range <- function(x, date.range) {
return(sum(x >= date.range[1] & x <= date.range[2]))
}
#' Get series length at ends
#'
#' This function takes a series of boolean values and returns a list of
#' integers of the same length corresponding to the lengths at the ends of
#' sequences of TRUE values.
#'
#' It can often be useful to know how long a series of boolean values is. This
#' function provides a method of knowing where and how long such sequences are.
#'
#' @param x Sequence of booleans.
#' @param na.value Value to replace NAs with.
#' @return A vector consisting of the lengths of sequences of TRUE values at
#' the location of the last TRUE value in the sequence, and zeroes elsewhere.
#' @keywords ts climate
#' @examples
#'
#' ## Get lengths of sequences of TRUE values in a sequence
#' series.lengths <- get.series.lengths.at.ends(c(TRUE, TRUE, TRUE, FALSE,
#' TRUE, FALSE, TRUE, TRUE, TRUE, TRUE, FALSE))
#'
#'
#' @export
get.series.lengths.at.ends <- function(x, na.value=FALSE) {
stopifnot(is.logical(x) && is.logical(na.value))
n <- length(x)
if(n == 1)
return(as.numeric(x))
res <- rep(0, n)
x[is.na(x)] <- na.value
## Compare series to lag-1 and lag+1 series; false added to trigger state transition from TRUE at ends of series
start <- which(x & !(c(FALSE, x[1:(n - 1)])))
end <- which(x & !(c(x[2:n], FALSE)))
res[end] <- end - start + 1
return(res)
}
#' Number of days (less than, greater than, etc) a threshold
#'
#' Produces sums of values that exceed (or are below) the specified threshold.
#'
#' This function takes a data series, a threshold, an operator, and a factor to
#' aggregate by. It uses the operator to compare the threshold to the data
#' series, creating a series of booleans, then sums the booleans according to
#' the factor.
#'
#' @param temp Sequence temperature values.
#' @param date.factor Factor to aggregate by.
#' @param threshold Threshold to use.
#' @param op Operator to use for comparison.
#' @return A vector consisting of the number of values that meet the criteria
#' in the given time period (as specified by \code{date.factor}).
#' @keywords ts climate
#' @examples
#' library(PCICt)
#'
#' ## Parse the dates into PCICt.
#' tmax.dates <- as.PCICt(do.call(paste, ec.1018935.tmax[,c("year",
#' "jday")]), format="%Y %j", cal="gregorian")
#' tmin.dates <- as.PCICt(do.call(paste, ec.1018935.tmin[,c("year",
#' "jday")]), format="%Y %j", cal="gregorian")
#' prec.dates <- as.PCICt(do.call(paste, ec.1018935.prec[,c("year",
#' "jday")]), format="%Y %j", cal="gregorian")
#'
#' ## Load the data in.
#' ci <- climdexInput.raw(ec.1018935.tmax$MAX_TEMP,
#' ec.1018935.tmin$MIN_TEMP, ec.1018935.prec$ONE_DAY_PRECIPITATION,
#' tmax.dates, tmin.dates, prec.dates, base.range=c(1971, 2000))
#'
#' ## Calculate frost days.
#' fd <- number.days.op.threshold(ci@@data$tmin,
#' ci@@date.factors$annual, 0, "<")
#'
#' @export
number.days.op.threshold <- function(temp, date.factor, threshold, op="<") {
stopifnot(is.numeric(temp) && is.numeric(threshold) && is.factor(date.factor))
return(tapply.fast(match.fun(op)(temp, threshold), date.factor, sum, na.rm=TRUE))
}
#' Lengths of strings of TRUE values
#'
#' Computes fraction of days above or below the baseline threshold for each
#' day, and averages them using the date factor passed in.
#'
#' This function computes fractions of days above or below baseline thresholds
#' for each day, then aggregates them using \code{date.factor}. It is used to
#' implement TN/TX 10/90p.
#'
#' @param temp Sequence of temperature values.
#' @param dates Sequence of associated dates.
#' @param jdays Sequence of associated days of year.
#' @param date.factor Factor to aggregate data using.
#' @param threshold.outside.base Sequence of thresholds to be used for data
#' outside the base period.
#' @param base.thresholds Data structure containing sets of thresholds to be
#' used inside the base period; see \link{climdexInput-class}.
#' @param base.range Date range (type PCICt) of the baseline period.
#' @param op Comparison operator to use.
#' @param max.missing.days Maximum number of NA values per time period.
#' @return A vector consisting of the mean fraction of days above or below the
#' supplied set of thresholds.
#' @note If date.factor is omitted, daily series will be returned.
#' @seealso \link{climdexInput-class}.
#' @keywords ts climate
#' @examples
#' library(PCICt)
#'
#' ## Parse the dates into PCICt.
#' tmax.dates <- as.PCICt(do.call(paste, ec.1018935.tmax[,c("year",
#' "jday")]), format="%Y %j", cal="gregorian")
#' tmin.dates <- as.PCICt(do.call(paste, ec.1018935.tmin[,c("year",
#' "jday")]), format="%Y %j", cal="gregorian")
#' prec.dates <- as.PCICt(do.call(paste, ec.1018935.prec[,c("year",
#' "jday")]), format="%Y %j", cal="gregorian")
#'
#' ## Load the data in.
#' ci <- climdexInput.raw(ec.1018935.tmax$MAX_TEMP,
#' ec.1018935.tmin$MIN_TEMP, ec.1018935.prec$ONE_DAY_PRECIPITATION,
#' tmax.dates, tmin.dates, prec.dates, base.range=c(1971, 2000))
#'
#' ## Compute monthly tx90p.
#' tx90p <- percent.days.op.threshold(ci@@data$tmax, ci@@dates, ci@@jdays,
#' ci@@date.factors$monthly,
#' ci@@quantiles$tmax$outbase$q90,
#' ci@@quantiles$tmax$inbase$q90,
#' ci@@base.range, ">",
#' ci@@max.missing.days['monthly']) *
#' ci@@namasks$monthly$tmax
#'
#' @export
percent.days.op.threshold <- function(temp, dates, jdays, date.factor,
threshold.outside.base, base.thresholds,
base.range, op='<', max.missing.days) {
f <- match.fun(op)
dat <- f(temp, threshold.outside.base[jdays])
inset <- dates >= base.range[1] & dates <= base.range[2]
## Don't use in-base thresholds with data shorter than two years; no years to replace with.
if(sum(inset) > 0 && length(dates) >= 360 * 2) {
jdays.base <- jdays[inset]
years.base <- get.years(dates[inset])
## Get number of base years, subset temp data to base period only.
temp.base <- temp[inset]
years.base.range <- range(years.base)
byrs <- (years.base.range[2] - years.base.range[1] + 1)
## Linearize thresholds, then compare them to the temperatures
bdim <- dim(base.thresholds)
dim(base.thresholds) <- c(bdim[1] * bdim[2], bdim[3])
yday.byr.indices <- jdays.base + (years.base - get.years(base.range)[1]) * bdim[1]
f.result <- f(rep(temp.base, byrs - 1), base.thresholds[yday.byr.indices,])
dim(f.result) <- c(length(yday.byr.indices), bdim[3])
## Chop up data along the 2nd dim into a list; sum elements of the list
dat[inset] <- rowSums(f.result, na.rm=TRUE) / (byrs - 1)
}
dat[is.nan(dat)] <- NA
if(missing(date.factor))
return(dat)
na.mask <- get.na.mask(dat, date.factor, max.missing.days)
## FIXME: Need to monthly-ize the NA mask calculation, which will be ugly.
ret <- tapply.fast(dat, date.factor, mean, na.rm=TRUE) * 100 * na.mask
ret[is.nan(ret)] <- NA
return(ret)
}
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.