#' @title Two population Global Testing procedure
#'
#' @description The function implements the Global Testing procedure for testing mean differences between two
#' functional populations. Functional data are tested locally and unadjusted and adjusted p-value
#' functions are provided. The unadjusted p-value function controls the point-wise error rate. The adjusted p-value function controls the
#' interval-wise error rate.
#'
#' @param data1 First population's data. Either pointwise evaluations of the functional data set on a uniform grid, or a \code{fd} object from the package \code{fda}.
#' If pointwise evaluations are provided, \code{data2} is a matrix of dimensions \code{c(n1,J)}, with \code{J} evaluations on columns and \code{n1} units on rows.
#'
#' @param data2 Second population's data. Either pointwise evaluations of the functional data set on a uniform grid, or a \code{fd} object from the package \code{fda}.
#' If pointwise evaluations are provided, \code{data2} is a matrix of dimensions \code{c(n1,J)}, with \code{J} evaluations on columns and \code{n2} units on rows.
#'
#' @param mu Functional mean difference under the null hypothesis. Three possibilities are available for \code{mu}:
#' a constant (in this case, a constant function is used);
#' a \code{J}-dimensional vector containing the evaluations on the same grid which \code{data} are evaluated;
#' a \code{fd} object from the package \code{fda} containing one function.
#' The default is \code{mu=0}.
#'
#' @param B The number of iterations of the MC algorithm to evaluate the p-values of the permutation tests. The defualt is \code{B=1000}.
#'
#' @param paired Flag indicating whether a paired test has to be performed. Default is \code{FALSE}.
#'
#' @param dx Used only if a \code{fd} object is provided. In this case, \code{dx} is the size of the discretization step of the grid used to evaluate functional data.
#' If set to \code{NULL}, a grid of size 100 is used. Default is \code{NULL}.
#'
#' @param recycle Flag used to decide whether the recycled version of the Global should be used (see Pini and Vantini, 2017 for details). Default is \code{TRUE}.
#'
#' @param alternative A character string specifying the alternative hypothesis, must be one of "\code{two.sided}" (default), "\code{greater}" or "\code{less}".
#'
#' @return \code{Global2} returns an object of \code{\link{class}} "\code{fdatest2}", containing the following components:
#' \item{test}{String vector indicating the type of test performed. In this case equal to \code{"2pop"}.}
#' \item{mu}{Evaluation on a grid of the functional mean difference under the null hypothesis (as entered by the user).}
#' \item{unadjusted_pval}{Evaluation on a grid of the unadjusted p-value function (it is a constant function according to the global testing procedure).}
#' \item{adjusted_pval}{Evaluation on a grid of the adjusted p-value function.}
#' \item{data.eval}{Evaluation on a grid of the functional data.}
#' \item{ord_labels}{Vector of labels indicating the group membership of data.eval}
#'
#' @seealso See also \code{\link{IWT2}} for local inference. See \code{\link{plot.fdatest2}} for plotting the results.
#'
#' @examples
#' # Importing the NASA temperatures data set
#' data(NASAtemp)
#'
#' # Performing the Global for two populations
#' Global.result <- Global2(NASAtemp$paris,NASAtemp$milan)
#'
#' # Plotting the results of the Global
#' plot(Global.result,xrange=c(0,12),main='Global results for testing mean differences')
#'
#'
#' # Selecting the significant components at 5% level
#' which(Global.result$adjusted_pval < 0.05)
#'
#' @references
#' A. Pini and S. Vantini (2017).
#' The Interval Testing Procedure: Inference for Functional Data Controlling the Family Wise Error Rate on Intervals. Biometrics 73(3): 835–845.
#'
#' Pini, A., & Vantini, S. (2017). Interval-wise testing for functional data. \emph{Journal of Nonparametric Statistics}, 29(2), 407-424
#'
#' @export
Global2 <- function(data1,data2,mu=0,B=1000,paired=FALSE,dx=NULL,stat='Integral'){
if(is.fd(data1)){ # data1 is a functional data object
rangeval1 <- data1$basis$rangeval
rangeval2 <- data2$basis$rangeval
if(is.null(dx)){
dx <- (rangeval1[2]-rangeval1[1])*0.01
}
if(sum(rangeval1 == rangeval2)!=2){
stop("rangeval of data1 and data2 must coincide.")
}
abscissa <- seq(rangeval1[1],rangeval1[2],by=dx)
coeff1 <- t(eval.fd(fdobj=data1,evalarg=abscissa))
coeff2 <- t(eval.fd(fdobj=data2,evalarg=abscissa))
}else if(is.matrix(data1)){
coeff1 <- data1
coeff2 <- data2
}else{
stop("First argument must be either a functional data object or a matrix.")
}
if (is.fd(mu)){ # mu is a functional data
rangeval.mu <- mu$basis$rangeval
if(sum(rangeval.mu == rangeval1)!=2){
stop("rangeval of mu must be the same as rangeval of data.")
}
if(is.null(dx)){
dx <- (rangeval.mu[2]-rangeval.mu[1])*0.01
}
abscissa <- seq(rangeval.mu[1],rangeval.mu[2],by=dx)
mu.eval <- t(eval.fd(fdobj=mu,evalarg=abscissa))
}else if(is.vector(mu)){
mu.eval <- mu
}else{
stop("Second argument must be either a functional data object or a numeric vector.")
}
n1 <- dim(coeff1)[1]
n2 <- dim(coeff2)[1]
J <- dim(coeff1)[2]
n <- n1+n2
etichetta_ord <- c(rep(1,n1),rep(2,n2))
#coeff1 <- coeff1 - matrix(data=mu,nrow=n1,ncol=J)
#print('First step: basis expansion')
#splines coefficients:
eval <- coeff <- rbind(coeff1,coeff2)
p <- dim(coeff)[2]
data.eval <- eval
#data.eval[1:n1,] <- data.eval[1:n1,] + matrix(data=mu,nrow=n1,ncol=J)
#print('Point-wise tests')
#univariate permutations
meandiff2 = (colMeans(coeff[1:n1,]) - colMeans(coeff[(n1+1):n,]))^2
S1 = cov(coeff[1:n1,])
S2 = cov(coeff[(n1+1):n,])
Sp = ((n1-1)*S1 + (n2-1)*S2) / (n1+n2-2)
T0 <- switch(stat,
Integral=meandiff2,
Max=meandiff2,
Integral_std= meandiff2/diag(Sp),
Max_std= meandiff2/diag(Sp))
T_coeff <- matrix(ncol=p,nrow=B)
for (perm in 1:B){
if(paired==TRUE){
if.perm <- rbinom(n1,1,0.5)
coeff_perm <- coeff
for(couple in 1:n1){
if(if.perm[couple]==1){
coeff_perm[c(couple,n1+couple),] <- coeff[c(n1+couple,couple),]
}
}
}else if(paired==FALSE){
permutazioni <- sample(n)
coeff_perm <- coeff[permutazioni,]
}
meandiff2_perm <- (colMeans(coeff_perm[1:n1,]) - colMeans(coeff_perm[(n1+1):n,]))^2
S1_perm = cov(coeff_perm[1:n1,])
S2_perm = cov(coeff_perm[(n1+1):n,])
Sp_perm = ((n1-1)*S1_perm + (n2-1)*S2_perm) / (n1+n2-2)
T_coeff[perm,] <- switch(stat,
Integral=meandiff2_perm,
Max=meandiff2_perm,
Integral_std= meandiff2_perm/diag(Sp_perm),
Max_std= meandiff2_perm/diag(Sp_perm))
}
pval <- numeric(p)
for(i in 1:p){
pval[i] <- sum(T_coeff[,i]>=T0[i])/B
}
#combination
#print('Partition tests')
all_combs <- rbind(rep(1,p))
ntests = 1
adjusted.pval <- numeric(p)
if(stat=='Integral'){
T0_comb <- sum(T0[which(all_combs[1,]==1)])
T_comb <- (rowSums(T_coeff[,which(all_combs[1,]==1),drop=FALSE]))
pval.temp <- mean(T_comb>=T0_comb)
indexes <- which(all_combs[1,]==1)
adjusted.pval[indexes] <- pval.temp
}else if (stat=='Max'){
T0_comb <- max(T0[which(all_combs[1,]==1)])
T_comb <- (apply(T_coeff[,which(all_combs[1,]==1)],1,max))
pval.temp <- mean(T_comb>=T0_comb)
indexes <- which(all_combs[1,]==1)
adjusted.pval[indexes] <- pval.temp
}
result = list(
test = '2pop', mu = mu.eval,
adjusted_pval = adjusted.pval,
unadjusted_pval = pval,
data.eval=data.eval,
ord_labels = etichetta_ord,
global_pval = adjusted.pval[1]
)
class(result) = 'fdatest2'
return(result)
}
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.