R/epi.descriptives.R

Defines functions epi.descriptives

Documented in epi.descriptives

epi.descriptives <- function(dat, conf.level = 0.95){

    conf.low <- (1 - conf.level) / 2
    conf.upp <- conf.level + (1 - conf.level) / 2
    
    if(inherits(x = dat, what = "numeric") == FALSE & inherits(x = dat, what = "factor") == FALSE)
      stop("Error: dat must be either numeric or a factor")

    if(inherits(x = dat, what = "numeric")){    
        an <- length(dat)
        amean <- mean(dat, na.rm = TRUE)
        asd <- sd(dat, na.rm = TRUE)
        ase <- asd / sqrt(an)
        
        ana <- is.na(dat); ana <- sum(as.numeric(ana))
        
        aq25 <- as.vector(quantile(dat, probs = 0.25, na.rm = TRUE))
        aq50 <- as.vector(quantile(dat, probs = 0.50, na.rm = TRUE))
        aq75 <- as.vector(quantile(dat, probs = 0.75, na.rm = TRUE))
        
        alcl <- as.vector(quantile(dat, probs = conf.low, na.rm = TRUE))
        aucl <- as.vector(quantile(dat, probs = conf.upp, na.rm = TRUE))
        
        amin <- min(dat, na.rm = TRUE)
        amax <- max(dat, na.rm = TRUE)
        
        # Geometric mean. Make sure all values positive:
        tdat <- dat[dat > 0]
        
        gn <- length(tdat)
        gmean <- exp(mean(log(tdat), na.rm = TRUE)) 
        gsd <- sd(log(tdat), na.rm = TRUE)
        gse <- gsd / sqrt(gn)
        
        gna <- is.na(tdat); gna <- sum(as.numeric(gna))
        
        gq25 <- as.vector(exp(quantile(log(tdat), probs = 0.25, na.rm = TRUE)))
        gq50 <- as.vector(exp(quantile(log(tdat), probs = 0.50, na.rm = TRUE)))
        gq75 <- as.vector(exp(quantile(log(tdat), probs = 0.75, na.rm = TRUE)))
        
        glcl <- as.vector(quantile(log(tdat), probs = conf.low, na.rm = TRUE))
        gucl <- as.vector(quantile(log(tdat), probs = conf.upp, na.rm = TRUE))
        
        gmin <- as.vector(exp(min(log(tdat), na.rm = TRUE)))
        gmax <- as.vector(exp(max(log(tdat), na.rm = TRUE)))
        
        # Skewness:
        x <- dat - mean(dat, na.rm = TRUE)
        skew <- sqrt(an) * sum(x^3, na.rm = TRUE) / (sum(x^2, na.rm = TRUE)^(3/2))
        
        # Kurtosis:
        x <- dat - mean(dat, na.rm = TRUE)
        r <- an * sum(x^4, na.rm = TRUE) / (sum(x^2, na.rm = TRUE)^2)
        kurt <- ((an + 1) * (r - 3) + 6) * (an - 1)/((an - 2) * (an - 3))
        
        rval <- list(
            arithmetic = data.frame(n = an, mean = amean, sd = asd, q25 = aq25, q50 = aq50, q75 = aq75, lower = alcl, upper = aucl, min = amin, max = amax, na = ana),
            geometric = data.frame(n = gn, mean = gmean, sd = gsd,  q25 = gq25, q50 = gq50, q75 = gq75, lower = glcl, upper = gucl, min = gmin, max = gmax, na = gna),
            symmetry = data.frame(skewness = skew, kurtosis = kurt)
        )
    }
    
    if(inherits(x = dat, what = "factor")){
        tmp <- table(dat, useNA = "always")
        total <- data.frame(level = "sum", n = margin.table(tmp))
        tmp <- data.frame(level = row.names(tmp), n = as.numeric(tmp))
        rval <- rbind(tmp, total)
    }
    
    return(rval)
 }
 
 

Try the epiR package in your browser

Any scripts or data that you put into this service are public.

epiR documentation built on Nov. 20, 2023, 9:06 a.m.