R/krippendorff.R
In krippendorffsalpha: Measuring Agreement Using Krippendorff's Alpha Coefficient

Documented in confint.krippendorffsalpha influence.krippendorffsalpha interval.dist krippendorffs.alpha nominal.dist plot.krippendorffsalpha ratio.dist summary.krippendorffsalpha

# Within-unit mean squared error (the observed disagreement inside units).
#
# data: matrix of scores; each row is a unit, each column a coder, and NA marks
#       a missing score.
# dist: function(x, y) returning the distance between two scalar scores. It is
#       called for every pair of columns within a unit, including pairs that
#       contain NA, so it is expected to return 0 for such pairs (as the
#       built-in distance functions do).
#
# Returns the sum, over units having at least two scores, of the unit's
# pairwise distances divided by (number of scores in the unit - 1), all divided
# by the total number of scores in those units. The result is NaN when no unit
# has more than one score.
krippendorff.MSE <- function(data, dist) {
    m <- rowSums(!is.na(data))
    n.c <- ncol(data)
    total <- 0
    # which()/seq_len() give empty loops for degenerate input, whereas 1:n
    # would count down (1, 0) and index out of range.
    for (i in which(m > 1)) {
        s <- 0
        for (j in seq_len(n.c - 1)) {
            for (k in (j + 1):n.c) {
                s <- s + dist(data[i, j], data[i, k])
            }
        }
        total <- total + s / (m[i] - 1)
    }
    N <- sum(m[m > 1])
    # Return the value visibly rather than as the result of an assignment.
    total / N
}

# Total mean squared distance over all scores, ignoring the unit structure.
#
# data: matrix of scores; each row is a unit, each column a coder, and NA marks
#       a missing score.
# dist: function(x, y) returning the distance between two scalar scores. It is
#       called for every ordered pair of cells of the matrix (each cell is also
#       paired with itself), including cells that are NA, so it is expected to
#       return 0 for NA inputs and for identical scores.
#
# Returns the sum of all those distances divided by 2 * N * (N - 1), where N is
# the number of non-missing scores. The result is NaN for an empty matrix.
krippendorff.MST <- function(data, dist) {
    m <- rowSums(!is.na(data))
    n.u <- nrow(data)
    n.c <- ncol(data)
    total <- 0
    # seq_len() keeps every loop empty when a dimension is 0; 1:n would count
    # down and index out of range.
    for (i in seq_len(n.u)) {
        for (j in seq_len(n.c)) {
            for (k in seq_len(n.u)) {
                for (l in seq_len(n.c)) {
                    total <- total + dist(data[i, j], data[k, l])
                }
            }
        }
    }
    N <- sum(m)
    # Return the value visibly rather than as the result of an assignment.
    total / (2 * N * (N - 1))
}

# Total sum of squares together with the pairwise distance table it was
# computed from.
#
# data: matrix of scores (rows are units, columns are coders, NA is missing).
# dist: function(x, y) returning the distance between two scalar scores.
#
# The scores are flattened row by row, so positions (u - 1) * ncol(data) + 1
# through u * ncol(data) of the table belong to unit u. Only the upper triangle
# of the table is filled; the rest stays 0. When package spam is available the
# table is converted with spam::as.spam.
#
# Returns list(SST = sum of the table / number of non-missing scores,
#              lookup = the table).
krippendorff.SST <- function(data, dist) {
    observed <- rowSums(!is.na(data))
    scores <- as.vector(t(data))
    n.scores <- length(scores)
    pairwise <- matrix(0, n.scores, n.scores)
    for (p in 1:(n.scores - 1)) {
        for (q in (p + 1):n.scores) {
            pairwise[p, q] <- dist(scores[p], scores[q])
        }
    }
    if (requireNamespace("spam", quietly = TRUE)) {
        pairwise <- spam::as.spam(pairwise)
    }
    total <- sum(pairwise) / sum(observed)
    list(SST = total, lookup = pairwise)
}

# Validate the user's control list and fill in defaults.
#
# method:  "analytical" or "customary".
# confint: logical; when FALSE every control parameter is dropped.
# verbose: logical; when TRUE a message is emitted for each parameter that is
#          replaced by its default.
# control: list that may contain 'bootit', 'parallel', 'type' and 'nodes'.
#          Names are matched against those four via match.arg.
#
# Returns the cleaned list:
#   * bootit   - kept only for method "customary"; must be a single whole
#                number >= 100, otherwise 1000 is used.
#   * parallel - must be a single non-missing logical, otherwise TRUE is used.
#   * type     - must be one of "SOCK", "PVM", "MPI", "NWS", otherwise "SOCK".
#   * nodes    - required when parallel is TRUE; must be a single whole number
#                greater than 1, otherwise an error is raised.
#   type and nodes are removed when parallel is FALSE.
#
# Invalid values that are NA, zero-length, or non-finite are treated like any
# other invalid value instead of failing inside the `if` conditions.
krippendorff.control <- function(method, confint, verbose, control) {
    if (length(control) > 0) {
        nms <- match.arg(names(control), c("bootit", "parallel", "type", "nodes"), several.ok = TRUE)
        control <- control[nms]
    }
    if (!confint) {
        control$bootit <- control$parallel <- control$type <- control$nodes <- NULL
        return(control)
    }

    # TRUE only for a single, finite, whole-valued number. NULL, NA, Inf,
    # vectors and non-numeric values all yield FALSE.
    is.whole <- function(x) {
        is.numeric(x) && length(x) == 1 && is.finite(x) && x %% 1 == 0
    }

    if (method == "analytical") {
        control$bootit <- NULL
    } else { # method == "customary"
        bootit <- control$bootit
        if (!is.whole(bootit) || bootit < 100) {
            if (verbose)
                message("\nControl parameter 'bootit' must be a positive integer >= 100. Setting it to the default value of 1,000.")
            control$bootit <- 1000
        }
    }

    parallel <- control$parallel
    if (!is.logical(parallel) || length(parallel) != 1 || is.na(parallel)) {
        if (verbose)
            message("\nControl parameter 'parallel' must be a logical value. Setting it to the default value of TRUE.")
        control$parallel <- TRUE
    }

    if (!control$parallel) {
        control$type <- control$nodes <- NULL
        return(control)
    }

    if (!requireNamespace("parallel", quietly = TRUE)) {
        if (verbose)
            message("\nParallel computation requires package parallel. Setting control parameter 'parallel' to FALSE.")
        control$parallel <- FALSE
        control$type <- control$nodes <- NULL
        return(control)
    }

    type <- control$type
    if (is.null(type) || length(type) != 1 || !type %in% c("SOCK", "PVM", "MPI", "NWS")) {
        if (verbose)
            message("\nControl parameter 'type' must be \"SOCK\", \"PVM\", \"MPI\", or \"NWS\". Setting it to \"SOCK\".")
        control$type <- "SOCK"
    }
    nodes <- control$nodes
    if (!is.whole(nodes) || nodes < 2)
        stop("Control parameter 'nodes' must be a whole number greater than 1.")
    control
}

# Pseudo-value of eta = log(MSA / MSE) obtained by leaving out unit x.
#
# x:       index of the row (unit) of 'data' to leave out.
# data:    full matrix of scores.
# dist:    distance function, passed on to krippendorff.MSE.
# a:       number of units in the full data.
# eta.hat: log(MSA / MSE) computed from the full data.
# lookup:  pairwise distance table indexed by score position; the positions
#          (x - 1) * ncol(data) + 1, ..., x * ncol(data) are removed from it
#          (presumably the table built by krippendorff.SST).
#
# Returns a * eta.hat - (a - 1) * eta_, where eta_ is log(MSA / MSE) for the
# data without unit x.
krippendorff.analytical.helper <- function(x, data, dist, a, eta.hat, lookup) {
    width <- ncol(data)
    first <- (x - 1) * width + 1
    dropped <- first:(first + width - 1)
    kept <- data[-x, ]
    counts <- rowSums(!is.na(kept))
    n.scores <- sum(counts)
    n.units <- length(counts)
    within <- krippendorff.MSE(kept, dist)
    total <- sum(lookup[-dropped, -dropped]) / n.scores
    between.ss <- total - (n.scores - n.units) * within
    between <- between.ss / (n.units - 1)
    eta.loo <- log(between / within)
    a * eta.hat - (a - 1) * eta.loo
}

# Point estimate of alpha by the analytical method and, optionally, a jackknife
# standard error for eta = log(MSA / MSE).
#
# data:    matrix of scores (rows are units, columns are coders, NA is missing).
# dist:    distance function for two scalar scores.
# confint: logical; when TRUE the leave-one-unit-out pseudo-values are computed
#          and their standard error is returned as element 'se'.
# verbose: logical; when TRUE (and package pbapply is available) a progress bar
#          is shown during the jackknife.
# control: validated control list; 'parallel', 'nodes' and 'type' are read.
#
# Returns a list with alpha.hat, MSA, MSE, eta.hat, a (number of units) and n_,
# plus se when confint is TRUE.
krippendorff.analytical <- function(data, dist, confint, verbose, control) {
    m <- rowSums(!is.na(data))
    N <- sum(m)
    a <- length(m)
    n_ <- (N - sum(m^2) / N) / (a - 1)
    MSE <- krippendorff.MSE(data, dist)
    temp <- krippendorff.SST(data, dist)
    lookup <- temp$lookup
    SSA <- temp$SST - (N - a) * MSE
    rm(temp)
    MSA <- SSA / (a - 1)
    theta.hat <- MSA / MSE
    eta.hat <- log(theta.hat)
    alpha.hat <- (theta.hat - 1) / (theta.hat + n_ - 1)
    results <- list(alpha.hat = alpha.hat, MSA = MSA, MSE = MSE, eta.hat = eta.hat, a = a, n_ = n_)
    if (!confint)
        return(results)

    if (verbose) {
        cat("\n")
        flush.console()
    }
    show.progress <- verbose && requireNamespace("pbapply", quietly = TRUE)
    units <- seq_len(a)
    if (!control$parallel) {
        if (show.progress) {
            gathered <- pbapply::pblapply(units, krippendorff.analytical.helper, data = data, dist = dist,
                                          a = a, eta.hat = eta.hat, lookup = lookup)
        } else {
            gathered <- lapply(units, krippendorff.analytical.helper, data = data, dist = dist,
                               a = a, eta.hat = eta.hat, lookup = lookup)
        }
    } else {
        cl <- parallel::makeCluster(control$nodes, control$type)
        # Shut the workers down even if a worker raises an error; otherwise the
        # cluster processes would be left running.
        on.exit(parallel::stopCluster(cl), add = TRUE)
        if (requireNamespace("spam", quietly = TRUE))
            parallel::clusterEvalQ(cl, library(spam))
        if (show.progress) {
            gathered <- pbapply::pblapply(units, krippendorff.analytical.helper, data = data, dist = dist,
                                          a = a, eta.hat = eta.hat, lookup = lookup, cl = cl)
        } else {
            gathered <- parallel::clusterApplyLB(cl, units, krippendorff.analytical.helper, data = data, dist = dist,
                                                 a = a, eta.hat = eta.hat, lookup = lookup)
        }
    }
    eta <- unlist(gathered, use.names = FALSE)
    results$se <- sqrt(var(eta) / a)
    results
}

# Alpha statistic for one bootstrap resample.
#
# rows:   row indices of object$data that make up the resample.
# object: list carrying 'data', 'dist' and 'MST'.
#
# Only the within-unit term is recomputed for the resample; object$MST is used
# as stored. NOTE(review): presumably the full-data MST is reused on purpose --
# confirm.
krippendorff.bootstrap.helper <- function(rows, object) {
    resample <- object$data[rows, ]
    within <- krippendorff.MSE(resample, object$dist)
    ratio <- within / object$MST
    1 - ratio
}

# Bootstrap sample of the alpha statistic.
#
# object: list carrying 'data', 'verbose' and 'control' (with 'bootit',
#         'parallel' and, for parallel runs, 'nodes' and 'type'), plus whatever
#         krippendorff.bootstrap.helper reads.
#
# All resamples of the rows of object$data (with replacement) are drawn first,
# in the calling process; the statistic is then evaluated for each resample
# either serially or on a cluster.
#
# Returns a numeric vector of length bootit.
krippendorff.bootstrap <- function(object) {
    bootit <- object$control$bootit
    n.units <- nrow(object$data)
    rows <- vector("list", bootit)
    for (j in seq_len(bootit))
        rows[[j]] <- sample(n.units, replace = TRUE)
    show.progress <- object$verbose && requireNamespace("pbapply", quietly = TRUE)
    if (!object$control$parallel) {
        if (show.progress) {
            gathered <- pbapply::pblapply(rows, krippendorff.bootstrap.helper, object = object)
        } else {
            gathered <- lapply(rows, krippendorff.bootstrap.helper, object = object)
        }
    } else {
        cl <- parallel::makeCluster(object$control$nodes, object$control$type)
        # Shut the workers down even if a worker raises an error; otherwise the
        # cluster processes would be left running.
        on.exit(parallel::stopCluster(cl), add = TRUE)
        if (show.progress) {
            gathered <- pbapply::pblapply(rows, krippendorff.bootstrap.helper, object = object, cl = cl)
        } else {
            gathered <- parallel::clusterApplyLB(cl, rows, krippendorff.bootstrap.helper, object = object)
        }
    }
    unlist(gathered, use.names = FALSE)
}

#' Apply Krippendorff's Alpha.
#'
#' @details This is the package's flagship function. It applies the Krippendorff's Alpha methodology for nominal, ordinal, interval, or ratio levels of measurement, and, if desired, produces confidence intervals. Parallel computing is supported, when applicable.
#'
#' If the level of measurement is nominal, the discrete metric (\code{\link{nominal.dist}}) is employed by default. If the level of measurement is interval or ordinal, the squared-difference distance function (\code{\link{interval.dist}}) is employed by default. (For the ordinal level of measurement, using the squared-difference distance function may be inappropriate, in which case the user should supply his/her own distance function.) If the level of measurement is ratio, a ratio distance function (\code{\link{ratio.dist}}) is applied. Alternatively, the user may supply his/her own distance function. Said function must handle \code{NA}'s gracefully; see the above mentioned built-in distance functions for examples.
#'
#' Argument \code{method} is used to choose between the customary Alpha methodology and the analytical methodology developed by Hughes: \code{method = "analytical"} or \code{method = "customary"}. For smaller samples Hughes' methodology should be strongly preferred because that approach reduces bias for point estimation and provides much better performing confidence intervals---jackknife intervals, to be precise. For large samples Krippendorff's customary methodology can safely be used for inference, and speeds computation considerably relative to Hughes' jackknife method.
#'
#' If argument \code{confint} is set to \code{TRUE}, a confidence interval is computed. For Hughes' methodology a jackknife interval is produced. For the customary methodology a bootstrap interval is produced. The bootstrap is done by resampling, with replacement, the rows of \code{data} and then computing the alpha statistic for the resulting matrix. The elements of argument \code{control} are used to control the interval computation.
#'
#' @param data a matrix of scores. Each row corresponds to a unit, each column to a coder.
#' @param level the level of measurement, one of \code{"nominal"}, \code{"ordinal"}, \code{"interval"}, or \code{"ratio"}; or a user-defined distance function.
#' @param method the methodology to apply, either \code{"analytical"} or \code{"customary"}.
#' @param confint logical; if \code{TRUE}, a confidence interval is computed. For \code{method = "analytical"} the interval is a jackknife interval. For \code{method = "customary"} the interval is a bootstrap interval.
#' @param verbose logical; if \code{TRUE}, various messages are printed to the console. Note that if \code{confint = TRUE} a progress bar (\code{\link[pbapply]{pblapply}}) is displayed (if possible) during the bootstrap or jackknife computation.
#' @param control a list of control parameters.
#'    \describe{
#'        \item{\code{bootit}}{the size of the bootstrap sample. This applies when \code{confint = TRUE} and \code{method = "customary"}. Defaults to 1,000.}
#'        \item{\code{nodes}}{the desired number of nodes in the cluster.}
#'        \item{\code{parallel}}{logical; if \code{TRUE} (the default), bootstrapping or jackknife estimation is done in parallel (for \code{confint = TRUE}).}
#'        \item{\code{type}}{one of the supported cluster types for \code{\link[parallel]{makeCluster}}. Defaults to \code{"SOCK"}.}
#' }
#'
#' @return Function \code{krippendorffs.alpha} returns an object of class \code{"krippendorffsalpha"}, which is a list comprising the following elements.
#'         \item{alpha.hat}{the estimate of alpha.}
#'         \item{boot.sample}{when applicable, the bootstrap sample.}
#'         \item{call}{the matched call.}
#'         \item{coders}{the number of coders.}
#'         \item{confint}{the value of argument \code{confint}.}
#'         \item{control}{the list of control parameters.}
#'         \item{data}{the matrix of scores, where rows represent units and columns represent coders.}
#'         \item{eta.hat}{when \code{method = "analytical"}, \eqn{log(MSA / MSE)}.}
#'         \item{L}{when \code{method = "analytical"}, the lower 95\% confidence limit for alpha.}
#'         \item{level}{the level of measurement, or a user-defined distance function.}
#'         \item{MSA}{when \code{method = "analytical"}, the estimate of between-unit variation.}
#'         \item{MSE}{the estimate of within-unit variation.}
#'         \item{MST}{when \code{method = "customary"}, the estimate of total variation.}
#'         \item{method}{the value of argument \code{method}.}
#'         \item{n_}{when \code{method = "analytical"}, the average number of scores per row of the data matrix.}
#'         \item{se}{when \code{method = "analytical"}, the jackknife standard error.}
#'         \item{U}{when \code{method = "analytical"}, the upper 95\% confidence limit for alpha.}
#'         \item{units}{the number of units.}
#'         \item{verbose}{the value of argument \code{verbose}.}
#'
#' @references
#' Krippendorff, K. (2013). Computing Krippendorff's alpha-reliability. Technical report, University of Pennsylvania.
#' @references
#' Hughes, J. (2022). Toward improved inference for Krippendorff's Alpha agreement coefficient. arXiv.
#'
#' @export
#'
#' @examples
#' # The following data were presented in Krippendorff (2013). This example
#' # applies Hughes' methodology (the default) to these data. A jackknife
#' # confidence interval is produced (confint = TRUE). The fit is then
#' # summarized, and a 99% interval is given.
#'
#' nominal = matrix(c(1,2,3,3,2,1,4,1,2,NA,NA,NA,
#'                    1,2,3,3,2,2,4,1,2,5,NA,3,
#'                    NA,3,3,3,2,3,4,2,2,5,1,NA,
#'                    1,2,3,3,2,4,4,1,2,5,1,NA), 12, 4)
#' nominal
#' fit.nom = krippendorffs.alpha(nominal, level = "nominal", confint = TRUE, verbose = TRUE,
#'                               control = list(parallel = FALSE))
#' summary(fit.nom)
#' confint(fit.nom, level = 0.99)

krippendorffs.alpha <- function(data, level = c("interval", "nominal", "ordinal", "ratio"), method = c("analytical", "customary"),
                                confint = TRUE, verbose = FALSE, control = list()) {
    call <- match.call()

    # ---- argument validation ------------------------------------------------
    if (missing(data) || !is.matrix(data) || !is.numeric(data))
        stop("You must supply a numeric data matrix.")
    if (is.function(level)) {
        dist <- level
        level <- "user specified distance function"
    } else if (is.character(level)) {
        level <- match.arg(level)
        # "ordinal" shares the squared-difference distance with "interval".
        dist <- switch(level,
                       interval = ,
                       ordinal = interval.dist,
                       nominal = nominal.dist,
                       ratio = ratio.dist)
    } else {
        stop("'level' must be a distance function or one of \"interval\", \"nominal\", \"ordinal\", or \"ratio\".")
    }
    method <- match.arg(method)
    # NA and zero-length values are rejected here; they would otherwise fail
    # later inside `if` with an unrelated message.
    if (!is.logical(confint) || length(confint) != 1 || is.na(confint))
        stop("'confint' must be a logical value.")
    if (!is.logical(verbose) || length(verbose) != 1 || is.na(verbose))
        stop("'verbose' must be a logical value.")
    if (!is.list(control))
        stop("'control' must be a list.")
    control <- krippendorff.control(method, confint, verbose, control)

    # ---- point estimate -----------------------------------------------------
    if (method == "analytical") {
        analytical <- krippendorff.analytical(data, dist, confint, verbose, control)
        alpha.hat <- analytical$alpha.hat
        MSE <- analytical$MSE
    } else {
        MSE <- krippendorff.MSE(data, dist)
        MST <- krippendorff.MST(data, dist)
        alpha.hat <- 1 - MSE / MST
    }
    names(alpha.hat) <- "alpha"
    object <- list(units = nrow(data), coders = ncol(data), data = data, level = level, method = method,
                   confint = confint, verbose = verbose, alpha.hat = alpha.hat, control = control, call = call,
                   MSE = MSE, dist = dist)
    if (method == "analytical") {
        object$MSA <- analytical$MSA
    } else {
        object$MST <- MST
    }

    # ---- interval estimate --------------------------------------------------
    if (confint) {
        if (verbose) {
            cat("\n")
            flush.console()
        }
        if (method == "customary") {
            object$boot.sample <- krippendorff.bootstrap(object)
            if (verbose) {
                cat("\n")
                flush.console()
            }
        } else {
            # 95% t interval for eta on the log scale, mapped back to alpha.
            t.crit <- qt(0.975, df = analytical$a - 1)
            se <- analytical$se
            lo <- analytical$eta.hat - t.crit * se
            hi <- analytical$eta.hat + t.crit * se
            object$L <- (exp(lo) - 1) / (exp(lo) - 1 + analytical$n_)
            object$U <- (exp(hi) - 1) / (exp(hi) - 1 + analytical$n_)
            object$se <- se
        }
    }
    if (method == "analytical") {
        # eta.hat and n_ are documented as part of every analytical fit, so
        # they (and the unit count a) are stored whether or not an interval
        # was requested.
        object$a <- analytical$a
        object$n_ <- analytical$n_
        object$eta.hat <- analytical$eta.hat
    }
    class(object) <- "krippendorffsalpha"
    object
}

#' Compute the squared difference between two scores.
#'
#' @details This function computes the squared difference between two scores. This may be an appropriate distance function for the interval level of measurement. \code{NA}'s are handled gracefully.
#' @param x a score.
#' @param y a score.
#' @return \eqn{(x-y)^2}, or 0 if \code{x} or \code{y} is \code{NA}.
#' @seealso \code{\link{nominal.dist}}, \code{\link{ratio.dist}}
#' @export
    
interval.dist <- function(x, y) {
    # The squared difference is NA whenever either score is NA (and NaN for
    # Inf - Inf); every such case counts as distance 0.
    sq.diff <- (x - y)^2
    if (is.na(sq.diff)) 0 else sq.diff
}

#' Apply the discrete metric to two scores.
#'
#' @details This function applies the discrete metric to two scores. This may be an appropriate distance function for the nominal level of measurement. \code{NA}'s are handled gracefully.
#' @param x a score.
#' @param y a score.
#' @return 0 if \code{x} is equal to \code{y} or if either is \code{NA}, 1 otherwise.
#' @seealso \code{\link{interval.dist}}, \code{\link{ratio.dist}}
#' @export

nominal.dist <- function(x, y) {
    # The comparison is NA when either score is NA; that case is treated like
    # agreement, so only a definite mismatch gives distance 1.
    same <- (x == y)
    if (!is.na(same) && !same) 1 else 0
}

#' Apply a ratio distance function to two scores.
#'
#' @details This function applies a ratio distance function to two scores. This may be an appropriate distance function for the ratio level of measurement. \code{NA}'s are handled gracefully.
#' @param x a score.
#' @param y a score.
#' @return \eqn{(x-y)^2/(x+y)^2}, or 0 if \code{x} or \code{y} is \code{NA}.
#' @seealso \code{\link{interval.dist}}, \code{\link{nominal.dist}}
#' @export

ratio.dist <- function(x, y) {
    # NA scores, and the 0/0 case x = y = 0, give an NA/NaN ratio, which is
    # reported as distance 0.
    ratio <- (x - y)^2 / (x + y)^2
    if (is.na(ratio)) 0 else ratio
}

#' Compute DFBETAs for units and/or coders.
#'
#' @details This function computes DFBETAs for one or more units and/or one or more coders.
#'
#' @param model a fitted model object, the result of a call to \code{\link{krippendorffs.alpha}}.
#' @param units a vector of integers. A DFBETA will be computed for each of the corresponding units.
#' @param coders a vector of integers. A DFBETA will be computed for each of the corresponding coders.
#' @param ... additional arguments. These are ignored.
#'
#' @return A list comprising at most two elements.
#'         \item{dfbeta.units}{a vector containing DFBETAs for the units specified via argument \code{units}.}
#'         \item{dfbeta.coders}{a vector containing DFBETAs for the coders specified via argument \code{coders}.}
#'
#' @method influence krippendorffsalpha
#'
#' @references
#' Young, D. S. (2017). \emph{Handbook of Regression Methods}. CRC Press.
#' @references
#' Krippendorff, K. (2013). Computing Krippendorff's alpha-reliability. Technical report, University of Pennsylvania.
#'
#' @export
#'
#' @examples
#' # The following data were presented in Krippendorff (2013). This example
#' # applies Hughes' methodology to the data (method = "analytical", the default).
#' # DFBETAS are computed by leaving out unit 6, unit 11, coder 2, and coder 3.
#'
#' nominal = matrix(c(1,2,3,3,2,1,4,1,2,NA,NA,NA,
#'                    1,2,3,3,2,2,4,1,2,5,NA,3,
#'                    NA,3,3,3,2,3,4,2,2,5,1,NA,
#'                    1,2,3,3,2,4,4,1,2,5,1,NA), 12, 4)
#' fit.nom = krippendorffs.alpha(nominal, level = "nominal", confint = FALSE)
#' summary(fit.nom)
#' (inf = influence(fit.nom, units = c(6, 11), coders = c(2, 3)))

influence.krippendorffsalpha <- function(model, units, coders, ...) {
    # Refit with the distance function stored in the model. For a fit made with
    # a user-supplied distance function model$level holds only a descriptive
    # label, which krippendorffs.alpha would reject as a level.
    level <- if (is.function(model$dist)) model$dist else model$level

    # DFBETA for one reduced data matrix: full-data estimate minus the
    # estimate obtained without the deleted unit or coder.
    dfbeta <- function(reduced) {
        fit <- krippendorffs.alpha(reduced, level = level, method = model$method, confint = FALSE,
                                   control = model$control)
        model$alpha.hat - fit$alpha.hat
    }

    result <- list()
    if (!missing(units)) {
        # drop = FALSE keeps the reduced data a matrix even when a single row
        # remains.
        dfbeta.units <- vapply(units, function(j) dfbeta(model$data[-j, , drop = FALSE]),
                               numeric(1), USE.NAMES = FALSE)
        names(dfbeta.units) <- units
        result$dfbeta.units <- dfbeta.units
    }
    if (!missing(coders)) {
        # drop = FALSE keeps the reduced data a matrix even when a single
        # column remains.
        dfbeta.coders <- vapply(coders, function(j) dfbeta(model$data[, -j, drop = FALSE]),
                                numeric(1), USE.NAMES = FALSE)
        names(dfbeta.coders) <- coders
        result$dfbeta.coders <- dfbeta.coders
    }
    result
}

#' Print a summary of a Krippendorff's Alpha fit.
#'
#' @details This function prints a summary of the fit. First the data geometry is described, then the call signature is printed, then the values of the control parameters (defaults and/or values supplied in the call) are printed. Finally, a table of estimates is shown. If applicable, the table includes confidence limits.
#'
#' @param object an object of class \code{"krippendorffsalpha"}, the result of a call to \code{\link{krippendorffs.alpha}}.
#' @param conf.level the confidence level for the confidence intervals. The default is 0.95.
#' @param digits the number of significant digits to display. The default is 4.
#' @param \dots additional arguments. These are passed to \code{\link{quantile}}.
#'
#' @seealso \code{\link{krippendorffs.alpha}}
#'
#' @method summary krippendorffsalpha
#'
#' @references
#' Nissi, M. J., Mortazavi, S., Hughes, J., Morgan, P., and Ellermann, J. (2015). T2* relaxation time of acetabular and femoral cartilage with and without intra-articular Gd-DTPA2 in patients with femoroacetabular impingement. \emph{American Journal of Roentgenology}, \bold{204}(6), W695.
#'
#' @export
#'
#' @examples
#' # Fit a subset of the cartilage data, using the customary methodology.
#' # Compute bootstrap confidence intervals using a bootstrap sample size
#' # of 1,000. Display a summary of the results, including a 99% confidence
#' # interval. Also plot the results.
#'
#' data(cartilage)
#' cartilage = as.matrix(cartilage[1:100, ])
#' fit.cart = krippendorffs.alpha(cartilage, level = "ratio", method = "customary", confint = TRUE,
#'                                control = list(bootit = 1000, parallel = FALSE))
#' summary(fit.cart, conf.level = 0.99)
#' dev.new()
#' plot(fit.cart, xlim = c(0.7, 0.9), xlab = "Bootstrap Estimates",
#'      main = "Results for Cartilage Data")

summary.krippendorffsalpha <- function(object, conf.level = 0.95, digits = 4, ...) {
    # Everything that is printed is also collected in 'ans', which is returned
    # invisibly.
    ans <- list()

    # Header: data geometry and the call.
    cat("\nKrippendorff's Alpha\n\n")
    cat("Data:", object$units, "units x", object$coders, "coders\n")
    ans$units <- object$units
    ans$coders <- object$coders
    ans$method <- object$method
    cat("\nCall:\n\n")
    print(object$call)
    ans$call <- object$call

    # Control parameters, one per row, followed by an empty row.
    cat("\nControl parameters:\n")
    if (length(object$control) == 0) {
        cat("\nNA\n\n")
    } else {
        control.table <- cbind(unlist(c(object$control, "")))
        colnames(control.table) <- ""
        ans$control.table <- control.table
        print(control.table, quote = FALSE)
    }

    # Estimate with lower and upper limits (NA when no interval was computed).
    if (!object$confint) {
        coef.table <- cbind(object$alpha.hat, matrix(NA, nrow = 1, ncol = 2))
    } else if (object$method == "analytical") {
        # The stored limits are the 95% limits; any other level is recomputed.
        if (conf.level == 0.95) {
            coef.table <- cbind(object$alpha.hat, object$L, object$U)
        } else {
            coef.table <- cbind(object$alpha.hat, t(confint(object, level = conf.level)))
        }
    } else {
        boot.sample <- object$boot.sample
        if (!is.null(boot.sample)) {
            lower.p <- (1 - conf.level) / 2
            confint <- quantile(boot.sample, c(lower.p, 1 - lower.p), ...)
        }
        coef.table <- cbind(object$alpha.hat, t(confint))
    }
    dimnames(coef.table) <- NULL
    colnames(coef.table) <- c("Estimate", "Lower", "Upper")
    rownames(coef.table) <- names(object$alpha.hat)
    ans$coef.table <- coef.table
    cat("Results:\n\n")
    print(signif(coef.table, digits = digits))
    cat("\n")
    invisible(ans)
}

#' Compute a confidence interval for Krippendorff's Alpha.
#'
#' @details This function computes a confidence interval for alpha, assuming that \code{\link{krippendorffs.alpha}} was called with \code{confint = TRUE}.
#'
#' For \code{method = "analytical"}, a jackknife-based interval is computed. For smaller samples the jackknife interval offers a very substantial improvement over the bootstrap interval, the latter of which offers quite poor coverage. For larger samples \code{method = "customary"} can safely be used, in which case a bootstrap interval is provided. For sufficiently large datasets the two intervals will be nearly equal, but the bootstrap approach is preferred owing to its much faster execution speed.
#'
#' @param object an object of class \code{"krippendorffsalpha"}, the result of a call to \code{\link{krippendorffs.alpha}}.
#' @param parm always ignored since there is only one parameter.
#' @param level the desired confidence level for the interval. The default is 0.95.
#' @param \dots additional arguments. These are passed to \code{\link{quantile}}.
#' @return A vector with entries giving lower and upper confidence limits. These will be labelled as (1 - level) / 2 and 1 - (1 - level) / 2.
#' @seealso \code{\link{krippendorffs.alpha}}
#'
#' @method confint krippendorffsalpha
#'
#' @references
#' Nissi, M. J., Mortazavi, S., Hughes, J., Morgan, P., and Ellermann, J. (2015). T2* relaxation time of acetabular and femoral cartilage with and without intra-articular Gd-DTPA2 in patients with femoroacetabular impingement. \emph{American Journal of Roentgenology}, \bold{204}(6), W695.
#'
#' @export
#'
#' @examples
#' # Fit a subset of the cartilage data, using the customary methodology.
#' # Compute bootstrap confidence intervals using a bootstrap sample size
#' # of 1,000. Report the estimate of alpha, and produce a 99% interval.
#'
#' data(cartilage)
#' cartilage = as.matrix(cartilage[1:100, ])
#' fit.cart = krippendorffs.alpha(cartilage, level = "ratio", method = "customary", confint = TRUE,
#'                                control = list(bootit = 1000, parallel = FALSE))
#' fit.cart$alpha.hat
#' confint(fit.cart, level = 0.99)

confint.krippendorffsalpha <- function(object, parm = "alpha", level = 0.95, ...) {
    # No interval was requested when the model was fitted.
    if (!object$confint)
        return(rep(NA, 2))

    lo <- (1 - level) / 2
    hi <- 1 - lo
    probs <- c(lo, hi)
    if (object$method == "analytical") {
        if (level == 0.95) {
            # The 95% limits were computed and stored at fit time.
            limits <- c(object$L, object$U)
        } else {
            # t interval for eta on the log scale, mapped back to alpha.
            t.crit <- qt(hi, df = object$a - 1)
            eta.lo <- object$eta.hat - t.crit * object$se
            eta.hi <- object$eta.hat + t.crit * object$se
            n_ <- object$n_
            limits <- c((exp(eta.lo) - 1) / (exp(eta.lo) - 1 + n_),
                        (exp(eta.hi) - 1) / (exp(eta.hi) - 1 + n_))
        }
    } else {
        boot.sample <- object$boot.sample
        if (is.null(boot.sample)) {
            # Without a bootstrap sample (e.g. it was removed from the object)
            # there is nothing to take quantiles of; report missing limits
            # instead of failing on an undefined variable.
            limits <- c(NA_real_, NA_real_)
        } else {
            limits <- quantile(boot.sample, probs, ...)
        }
    }
    names(limits) <- probs
    limits
}

#' Plot the results of a Krippendorff's Alpha analysis.
#'
#' @details This function plots the results of a Krippendorff's Alpha analysis, assuming that \code{\link{krippendorffs.alpha}} was called with \code{method = "customary"} and \code{confint = TRUE}. Otherwise there is no bootstrap sample to work with. The plot is highly customizable.
#'
#' This function plots a histogram of the bootstrap sample, (optionally) a kernel density estimate, and vertical lines marking the lower and upper confidence limits.
#'
#' @param x an object of class \code{"krippendorffsalpha"}, the result of a call to \code{\link{krippendorffs.alpha}}.
#' @param y always ignored.
#' @param level the desired confidence level for the interval. The default is 0.95.
#' @param type the method used to compute sample quantiles. This argument is passed to \code{\link{quantile}}. The default is 7.
#' @param density logical; if \code{TRUE}, a kernel density estimate is plotted.
#' @param lty.density the line type for the kernel density estimate. The default is 1.
#' @param lty.estimate the line type for the estimate of alpha. The default is 1.
#' @param lty.interval the line type for the confidence limits. The default is 2.
#' @param col.density the color for the kernel density estimate. The default is black.
#' @param col.estimate the color for the estimate of alpha. The default is orange.
#' @param col.interval the color for the confidence limits. The default is blue.
#' @param lwd.density the line width for the kernel density estimate. The default is 3.
#' @param lwd.estimate the line width for the estimate of alpha. The default is 3.
#' @param lwd.interval the line width for the confidence limits. The default is 3.
#' @param \dots additional arguments. These are passed to \code{\link{hist}}.
#'
#' @seealso \code{\link{krippendorffs.alpha}}
#'
#' @method plot krippendorffsalpha
#'
#' @references
#' Krippendorff, K. (2013). Computing Krippendorff's alpha-reliability. Technical report, University of Pennsylvania.
#'
#' @export
#'
#' @examples
#' # The following data were presented in Krippendorff (2013).
#'
#' nominal = matrix(c(1,2,3,3,2,1,4,1,2,NA,NA,NA,
#'                    1,2,3,3,2,2,4,1,2,5,NA,3,
#'                    NA,3,3,3,2,3,4,2,2,5,1,NA,
#'                    1,2,3,3,2,4,4,1,2,5,1,NA), 12, 4)
#' fit.nom = krippendorffs.alpha(nominal, level = "nominal", method = "customary", confint = TRUE,
#'                               verbose = TRUE, control = list(bootit = 1000, parallel = FALSE))
#' dev.new()
#' plot(fit.nom, main = "Results for Nominal Data", xlab = "Bootstrap Estimates", density = FALSE)

plot.krippendorffsalpha <- function(x, y = NULL, level = 0.95, type = 7, density = TRUE,
                                    lty.density = 1, lty.estimate = 1, lty.interval = 2,
                                    col.density = "black", col.estimate = "orange", col.interval = "blue",
                                    lwd.density = 3, lwd.estimate = 3, lwd.interval = 3, ...) {
    # Only a customary fit with confint = TRUE carries a bootstrap sample.
    if (!x$confint || x$method == "analytical")
        stop("There is nothing to plot. Call function krippendorffs.alpha with method = \"customary\" and confint = TRUE.")

    # The variable is deliberately called boot.sample: hist() builds its
    # default title and axis label from the name of the object it is given.
    boot.sample <- x$boot.sample
    if (!is.null(boot.sample)) {
        lower.p <- (1 - level) / 2
        limits <- quantile(boot.sample, c(lower.p, 1 - lower.p), type = type)
    }

    # Histogram on the density scale, then the optional kernel density
    # estimate, the point estimate and the two confidence limits.
    hist(boot.sample, prob = TRUE, ...)
    if (density) {
        kde <- density(boot.sample)
        lines(kde, lty = lty.density, col = col.density, lwd = lwd.density)
    }
    abline(v = x$alpha.hat, lty = lty.estimate, col = col.estimate, lwd = lwd.estimate)
    abline(v = limits, lty = lty.interval, col = col.interval, lwd = lwd.interval)
}
Any scripts or data that you put into this service are public.
krippendorffsalpha documentation built on Oct. 25, 2022, 5:06 p.m.
rdrr.io home R language documentation Run R code online
CRAN packages Bioconductor packages R-Forge packages GitHub packages
Note that we can't provide technical support on individual packages. You should contact the package authors for that.
krippendorffsalpha
Measuring Agreement Using Krippendorff's Alpha Coefficient

R/krippendorff.R
In krippendorffsalpha: Measuring Agreement Using Krippendorff's Alpha Coefficient

Documented in confint.krippendorffsalpha influence.krippendorffsalpha interval.dist krippendorffs.alpha nominal.dist plot.krippendorffsalpha ratio.dist summary.krippendorffsalpha

Try the krippendorffsalpha package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

krippendorffsalpha Measuring Agreement Using Krippendorff's Alpha Coefficient

R/krippendorff.R In krippendorffsalpha: Measuring Agreement Using Krippendorff's Alpha Coefficient

Documented in confint.krippendorffsalpha influence.krippendorffsalpha interval.dist krippendorffs.alpha nominal.dist plot.krippendorffsalpha ratio.dist summary.krippendorffsalpha

Try the krippendorffsalpha package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

krippendorffsalpha
Measuring Agreement Using Krippendorff's Alpha Coefficient

R/krippendorff.R
In krippendorffsalpha: Measuring Agreement Using Krippendorff's Alpha Coefficient