R/normDataWithin.R

#' Summarizes data.
#' Norms the data within specified groups in a data frame;
#' @description it normalizes each subject (identified by idvar) so that they have the same mean, within each groups pecified by betweenvars.
#' @param   data: a data frame.
#' @param    idvar: the name of a column that identifies each subject (or matched subjects)
#' @param    measurevar: the name of a column that contains the variable to be summariezed
#' @param    betweenvars: a vector containing names of columns that are between-subjects variables
#' @param    na.rm: a boolean that indicates whether to ignore NA's
normDataWithin <- function(data=NULL, idvar, measurevar, betweenvars=NULL,
                           na.rm=FALSE, .drop=TRUE) {
  require(plyr)
  
  # Measure var on left, idvar + between vars on right of formula.
  data.subjMean <- ddply(data, c(idvar, betweenvars), .drop=.drop,
                         .fun = function(xx, col, na.rm) {
                           c(subjMean = mean(xx[,col], na.rm=na.rm))
                         },
                         measurevar,
                         na.rm
  )
  
  # Put the subject means with original data
  data <- merge(data, data.subjMean)
  
  # Get the normalized data in a new column
  measureNormedVar <- paste(measurevar, "Normed", sep="")
  data[,measureNormedVar] <- data[,measurevar] - data[,"subjMean"] +
    mean(data[,measurevar], na.rm=na.rm)
  
  # Remove this subject mean column
  data$subjMean <- NULL
  
  return(data)
}
mssm-msf-2019/BiostatsALL documentation built on May 22, 2019, 12:16 p.m.