#' DIF statistics for non-linear regression models.
#'
#' @description
#' Calculates likelihood ratio test statistics, F-test statistics, or Wald's
#' test statistics for DIF detection among dichotomous items using non-linear
#' regression models (generalized logistic regression models).
#'
#' @usage
#' NLR(Data, group, model, constraints = NULL, type = "all", method = "nls",
#'     match = "zscore", anchor = 1:ncol(Data), start, p.adjust.method = "none",
#'     test = "LR", alpha = 0.05, initboot = TRUE, nrBo = 20, sandwich = FALSE)
#'
#' @param Data data.frame or matrix: dataset in which rows represent scored
#'   examinee answers (\code{"1"} correct, \code{"0"} incorrect) and columns
#'   correspond to the items.
#' @param group numeric: a binary vector of group membership (\code{"0"}
#'   for the reference group, \code{"1"} for the focal group).
#' @param model character: generalized logistic regression model to be fitted. See
#'   \strong{Details}.
#' @param constraints character: which parameters should be the same for both
#'   groups. Possible values are any combinations of parameters \code{"a"},
#'   \code{"b"}, \code{"c"}, and \code{"d"}. Default value is \code{NULL}.
#'   See \strong{Details}.
#' @param method character: an estimation method to be applied. The options are
#'   \code{"nls"} for non-linear least squares (default), \code{"mle"} for the
#'   maximum likelihood method using the \code{"L-BFGS-B"} algorithm with
#'   constraints, \code{"em"} for the maximum likelihood estimation with the EM
#'   algorithm, \code{"plf"} for the maximum likelihood estimation with the
#'   algorithm based on parametric link function, and \code{"irls"} for the maximum
#'   likelihood estimation with the iteratively reweighted least squares algorithm
#'   (available for the \code{"2PL"} model only). See \strong{Details}.
#' @param match character or numeric: matching criterion to be used as
#'   an estimate of the trait. It can be either \code{"zscore"} (default,
#'   standardized total score), \code{"score"} (total test score), or
#'   a numeric vector of the same length as the number of observations in
#'   \code{Data}.
#' @param anchor character or numeric: specification of DIF-free items. A vector
#'   of item identifiers (integers specifying the column number) specifying
#'   which items are currently considered as anchor (DIF-free) items. The
#'   argument is ignored if \code{match} is not \code{"zscore"} or \code{"score"}.
#' @param type character: type of DIF to be tested. Possible values are
#'   \code{"all"} for detecting difference in any parameter (default),
#'   \code{"udif"} for uniform DIF only (i.e., difference in difficulty
#'   parameter \code{"b"}),
#'   \code{"nudif"} for non-uniform DIF only (i.e., difference in discrimination
#'   parameter \code{"a"}),
#'   \code{"both"} for uniform and non-uniform DIF (i.e., difference in
#'   parameters \code{"a"} and \code{"b"}),
#'   or any combination of parameters \code{"a"}, \code{"b"}, \code{"c"}, and
#'   \code{"d"}. Can be specified as a single value (for all items) or as an
#'   item-specific vector.
#' @param p.adjust.method character: a method for a multiple comparison
#'   correction. Possible values are \code{"holm"}, \code{"hochberg"},
#'   \code{"hommel"}, \code{"bonferroni"}, \code{"BH"}, \code{"BY"},
#'   \code{"fdr"}, and \code{"none"} (default). For more details see
#'   \code{\link[stats]{p.adjust}}.
#' @param start numeric: initial values for the estimation of item parameters. If
#'   not specified, starting values are calculated with the
#'   \code{\link[difNLR]{startNLR}} function. Otherwise, a list with as many
#'   elements as the number of items. Each element is a named numeric vector
#'   representing initial values for estimation of item parameters. Specifically,
#'   parameters \code{"a"}, \code{"b"}, \code{"c"}, and \code{"d"} are initial
#'   values for discrimination, difficulty, guessing, and inattention for the
#'   reference group. Parameters \code{"aDif"}, \code{"bDif"}, \code{"cDif"}, and
#'   \code{"dDif"} are then differences in these parameters between the reference
#'   and focal groups. For the \code{method = "irls"}, default initial values from
#'   the \code{\link[stats]{glm}} function are used.
#' @param test character: a statistical test to be performed for DIF detection.
#'   Can be either \code{"LR"} for the likelihood ratio test of a submodel
#'   (default), \code{"W"} for the Wald's test, or \code{"F"} for the F-test of
#'   a submodel.
#' @param alpha numeric: a significance level (the default is 0.05).
#' @param initboot logical: in the case of convergence issues, should starting
#'   values be re-calculated based on bootstrapped samples? (the default is
#'   \code{TRUE}; newly calculated initial values are applied only to
#'   items/models with convergence issues).
#' @param nrBo numeric: the maximal number of iterations for the calculation of
#'   starting values using bootstrapped samples (the default is 20).
#' @param sandwich logical: should the sandwich estimator be applied for
#'   computation of the covariance matrix of item parameters when using
#'   \code{method = "nls"}? (the default is \code{FALSE}).
#'
#' @details
#' The function calculates test statistics using a DIF detection procedure based
#' on non-linear regression models (i.e., extensions of the logistic regression
#' procedure; Swaminathan & Rogers, 1990; Drabinova & Martinkova, 2017).
#'
#' The unconstrained form of the 4PL generalized logistic regression model for
#' probability of correct answer (i.e., \eqn{Y_{pi} = 1}) using IRT
#' parameterization is
#' \deqn{P(Y_{pi} = 1|X_p, G_p) = (c_{iR} \cdot (1 - G_p) + c_{iF} \cdot G_p) +
#' (d_{iR} \cdot (1 - G_p) + d_{iF} \cdot G_p - c_{iR} \cdot (1 - G_p) - c_{iF} \cdot
#' G_p) / (1 + \exp(-(a_i + a_{i\text{DIF}} \cdot G_p) \cdot
#' (X_p - b_i - b_{i\text{DIF}} \cdot G_p))), }
#' where \eqn{X_p} is the matching criterion (e.g., standardized total score)
#' and \eqn{G_p} is a group membership variable for respondent \eqn{p}.
#' Parameters \eqn{a_i}, \eqn{b_i}, \eqn{c_{iR}}, and \eqn{d_{iR}} are
#' discrimination, difficulty, guessing, and inattention for the reference group
#' for item \eqn{i}. Terms \eqn{a_{i\text{DIF}}} and \eqn{b_{i\text{DIF}}} then
#' represent differences between the focal and reference groups in
#' discrimination and difficulty for item \eqn{i}. Terms \eqn{c_{iF}} and
#' \eqn{d_{iF}} are guessing and inattention parameters for the focal group for
#' item \eqn{i}. In the case that there is no assumed difference between the
#' reference and focal group in the guessing or inattention parameters, the
#' terms \eqn{c_i} and \eqn{d_i} are used.
#'
#' Alternatively, intercept-slope parameterization may be applied:
#' \deqn{P(Y_{pi} = 1|X_p, G_p) = (c_{iR} \cdot (1 - G_p) + c_{iF} \cdot G_p) +
#' (d_{iR} \cdot (1 - G_p) + d_{iF} \cdot G_p - c_{iR} \cdot (1 - G_p) - c_{iF} \cdot
#' G_p) / (1 + \exp(-(\beta_{i0} + \beta_{i1} \cdot X_p +
#' \beta_{i2} \cdot G_p + \beta_{i3} \cdot X_p \cdot G_p))), }
#' where parameters \eqn{\beta_{i0}, \beta_{i1}, \beta_{i2}, \beta_{i3}} are
#' intercept, effect of the matching criterion, effect of the group membership,
#' and their mutual interaction, respectively.
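#'
#' As a minimal illustration (not part of the package API; the function
#' \code{p4PL} and all values below are hypothetical), the probability of
#' a correct answer under the intercept-slope parameterization with guessing
#' and inattention common to both groups can be computed as
#' \preformatted{
#' p4PL <- function(x, g, b0, b1, b2, b3, c = 0, d = 1) {
#'   # c is the lower and d the upper asymptote; g = 0 reference, g = 1 focal
#'   c + (d - c) / (1 + exp(-(b0 + b1 * x + b2 * g + b3 * x * g)))
#' }
#' p4PL(x = 0.5, g = 1, b0 = 0, b1 = 1.2, b2 = -0.3, b3 = 0.1)
#' }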
#'
#' The \code{model} and \code{constraints} arguments can further constrain the
#' 4PL model. The arguments \code{model} and \code{constraints} can also be
#' combined. Both arguments can be specified as a single value (for all items)
#' or as an item-specific vector (where each element corresponds to one item).
#'
#' The \code{model} argument offers several predefined models:
#' \itemize{
#'   \item \code{Rasch} for the 1PL model with discrimination fixed to 1 for both groups,
#'   \item \code{1PL} for the 1PL model with discrimination set the same for both groups,
#'   \item \code{2PL} for the logistic regression model,
#'   \item \code{3PLcg} for the 3PL model with fixed guessing for both groups,
#'   \item \code{3PLdg} for the 3PL model with fixed inattention for both groups,
#'   \item \code{3PLc} (alternatively \code{3PL}) for the 3PL model with a guessing parameter,
#'   \item \code{3PLd} for the 3PL model with an inattention parameter,
#'   \item \code{4PLcgdg} for the 4PL model with fixed guessing and inattention for both groups,
#'   \item \code{4PLcgd} (alternatively \code{4PLd}) for the 4PL model with fixed guessing for both groups,
#'   \item \code{4PLcdg} (alternatively \code{4PLc}) for the 4PL model with fixed inattention for both groups,
#'   \item \code{4PL} for the 4PL model.
#' }
#'
#' The function uses intercept-slope parameterization for the estimation via the
#' \code{\link[difNLR]{estimNLR}} function. Item parameters are then
#' re-calculated into the IRT parameterization using the delta method.
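#'
#' For the logistic core, the two parameterizations are related by
#' \deqn{a_i = \beta_{i1}, \qquad b_i = -\beta_{i0} / \beta_{i1}, \qquad
#' a_{i\text{DIF}} = \beta_{i3}, \qquad b_{i\text{DIF}} =
#' \frac{\beta_{i0} \beta_{i3} - \beta_{i1} \beta_{i2}}{\beta_{i1} (\beta_{i1} +
#' \beta_{i3})},}
#' and standard errors in the IRT parameterization are obtained by applying
#' the delta method to these transformations.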
#'
#' The function offers either the non-linear least squares estimation via the
#' \code{\link[stats]{nls}} function (Drabinova & Martinkova, 2017; Hladka &
#' Martinkova, 2020), the maximum likelihood method with the \code{"L-BFGS-B"}
#' algorithm with constraints via the \code{\link[stats]{optim}} function
#' (Hladka & Martinkova, 2020), the maximum likelihood method with the EM
#' algorithm (Hladka, Martinkova, & Brabec, 2025), the maximum likelihood method
#' with the algorithm based on parametric link function (Hladka, Martinkova, &
#' Brabec, 2025), or the maximum likelihood method with the iteratively
#' reweighted least squares algorithm via the \code{\link[stats]{glm}} function.
#'
#' @return A list with the following elements:
#' \describe{
#'   \item{\code{Sval}}{the values of the \code{test} statistics.}
#'   \item{\code{pval}}{the p-values by the \code{test}.}
#'   \item{\code{adjusted.pval}}{adjusted p-values by the \code{p.adjust.method}.}
#'   \item{\code{df}}{the degrees of freedom of the \code{test}.}
#'   \item{\code{test}}{the test used.}
#'   \item{\code{par.m0}}{the matrix of estimated item parameters for the null model.}
#'   \item{\code{se.m0}}{the matrix of standard errors of item parameters for the null model.}
#'   \item{\code{cov.m0}}{list of covariance matrices of item parameters for the null model.}
#'   \item{\code{par.m1}}{the matrix of estimated item parameters for the alternative model.}
#'   \item{\code{se.m1}}{the matrix of standard errors of item parameters for the alternative model.}
#'   \item{\code{cov.m1}}{list of covariance matrices of item parameters for the alternative model.}
#'   \item{\code{cf}}{numeric: the number of convergence issues.}
#'   \item{\code{cf.which}}{the indicators of the items that did not converge.}
#'   \item{\code{ll.m0}}{log-likelihood of null model.}
#'   \item{\code{ll.m1}}{log-likelihood of alternative model.}
#'   \item{\code{startBo0}}{a binary matrix. Columns represent iterations of initial value
#'   re-calculations, rows represent items. A value of 0 means no convergence issue in the null
#'   model, 1 means a convergence issue in the null model.}
#'   \item{\code{startBo1}}{a binary matrix. Columns represent iterations of initial value
#'   re-calculations, rows represent items. A value of 0 means no convergence issue in the
#'   alternative model, 1 means a convergence issue in the alternative model.}
#' }
#'
#' @author
#' Adela Hladka (nee Drabinova) \cr
#' Institute of Computer Science of the Czech Academy of Sciences \cr
#' \email{hladka@@cs.cas.cz} \cr
#'
#' Patricia Martinkova \cr
#' Institute of Computer Science of the Czech Academy of Sciences \cr
#' \email{martinkova@@cs.cas.cz} \cr
#'
#' Karel Zvara \cr
#' Faculty of Mathematics and Physics, Charles University \cr
#'
#' @references
#' Drabinova, A. & Martinkova, P. (2017). Detection of differential item
#' functioning with nonlinear regression: A non-IRT approach accounting for
#' guessing. Journal of Educational Measurement, 54(4), 498--517,
#' \doi{10.1111/jedm.12158}.
#'
#' Hladka, A. (2021). Statistical models for detection of differential item
#' functioning. Dissertation thesis. Faculty of Mathematics and Physics, Charles
#' University.
#'
#' Hladka, A. & Martinkova, P. (2020). difNLR: Generalized logistic regression
#' models for DIF and DDF detection. The R Journal, 12(1), 300--323,
#' \doi{10.32614/RJ-2020-014}.
#'
#' Hladka, A., Martinkova, P., & Brabec, M. (2025). New iterative algorithms
#' for estimation of item functioning. Journal of Educational and Behavioral
#' Statistics. Online first, \doi{10.3102/10769986241312354}.
#'
#' Swaminathan, H. & Rogers, H. J. (1990). Detecting differential item
#' functioning using logistic regression procedures. Journal of Educational
#' Measurement, 27(4), 361--370, \doi{10.1111/j.1745-3984.1990.tb00754.x}.
#'
#' @seealso \code{\link[stats]{p.adjust}}
#'
#' @examples
#' \dontrun{
#' # loading data
#' data(GMAT)
#' Data <- GMAT[, 1:20] # items
#' group <- GMAT[, "group"] # group membership variable
#'
#' # testing both DIF effects using the LR test (default)
#' # and the model with fixed guessing for both groups
#' NLR(Data, group, model = "3PLcg")
#'
#' # using the F test and Wald's test
#' NLR(Data, group, model = "3PLcg", test = "F")
#' NLR(Data, group, model = "3PLcg", test = "W")
#'
#' # using the Benjamini-Hochberg correction
#' NLR(Data, group, model = "3PLcg", p.adjust.method = "BH")
#'
#' # 4PL model with the same guessing and inattention
#' # to test uniform DIF
#' NLR(Data, group, model = "4PLcgdg", type = "udif")
#'
#' # 2PL model to test non-uniform DIF
#' NLR(Data, group, model = "2PL", type = "nudif")
#'
#' # 4PL model with fixed a and c parameters
#' # to test difference in parameter b
#' NLR(Data, group, model = "4PL", constraints = "ac", type = "b")
#'
#' # using various estimation algorithms
#' NLR(Data, group, model = "3PLcg", method = "nls")
#' NLR(Data, group, model = "3PLcg", method = "mle")
#' NLR(Data, group, model = "3PLcg", method = "em")
#' NLR(Data, group, model = "3PLcg", method = "plf")
#' NLR(Data, group, model = "2PL", method = "irls")
#' }
#'
#' @keywords DIF
#' @export
NLR <- function(Data, group, model, constraints = NULL, type = "all", method = "nls",
                match = "zscore", anchor = 1:ncol(Data), start, p.adjust.method = "none",
                test = "LR", alpha = 0.05, initboot = TRUE, nrBo = 20, sandwich = FALSE) {
  # if (method == "plf") {
  #   message("Note that the default option for `method` is now 'plf' instead of 'nls'.")
  # }

  if (match[1] == "zscore") {
    x <- as.vector(scale(apply(as.data.frame(Data[, anchor]), 1, sum)))
  } else {
    if (match[1] == "score") {
      x <- apply(as.data.frame(Data[, anchor]), 1, sum)
    } else {
      if (length(match) == dim(Data)[1]) {
        x <- match
      } else {
        stop("Invalid value for 'match'. Possible values are 'score', 'zscore', or a vector of the same length as a number
             of observations in 'Data'!", call. = FALSE)
      }
    }
  }

  m <- dim(Data)[2]
  n <- dim(Data)[1]

  if (length(model) == 1) {
    model <- rep(model, m)
  }
  if (is.null(constraints)) {
    constraints <- as.list(rep(NA, m))
  }
  if (length(constraints) == 1) {
    constraints <- rep(constraints, m)
  }
  if (length(type) == 1) {
    type <- rep(type, m)
  }

  if (method == "irls") {
    parameterization <- rep("logistic", m)
  } else {
    parameterization <- rep("is", m)
  }
  # formulas for models
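  # M[[i]]$M0 is the null (more constrained) model and M[[i]]$M1 the
  # alternative model for item i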
  M <- lapply(
    1:m,
    function(i) {
      formulaNLR(
        model = model[i],
        type = type[i],
        constraints = constraints[[i]],
        parameterization = parameterization[i]
      )
    }
  )
  # starting values
  if (method == "irls") {
    start <- NULL
  } else if (missing(start) || is.null(start)) {
    start <- startNLR(Data, group, model, match = x, parameterization = parameterization)
  } else {
    if (all(sapply(1:m, function(i) all(M[[i]]$M1$parameters %in% names(start[[i]]))))) {
      start <- lapply(1:m, function(i) start[[i]][M[[i]]$M1$parameters])
    }
    if (!all(sapply(1:m, function(i) length(start[[i]]) == length(M[[i]]$M1$parameters))) ||
      !all(sapply(1:m, function(i) all(sort(names(start[[i]])) == sort(M[[i]]$M1$parameters))))) {
      warning("Invalid names of item parameters in 'start'. Initial values are calculated with the 'startNLR' function.", call. = FALSE)
      start <- startNLR(Data, group, model, match = x, parameterization = parameterization)
    }
  }
  # model fitting
  m0 <- lapply(1:m, function(i) {
    start_tmp <- start[[i]]
    names_start_tmp <- names(start_tmp)
    if (!("cR" %in% M[[i]]$M0$parameters) & "cR" %in% names_start_tmp) {
      names(start_tmp)[names_start_tmp == "cR"] <- "c"
    }
    if (!("dR" %in% M[[i]]$M0$parameters) & "dR" %in% names_start_tmp) {
      names(start_tmp)[names_start_tmp == "dR"] <- "d"
    }

    estimNLR(
      y = Data[, i], match = x, group = group,
      formula = M[[i]]$M0$formula,
      method = method,
      start = structure(start_tmp[M[[i]]$M0$parameters],
        names = M[[i]]$M0$parameters
      ),
      lower = M[[i]]$M0$lower,
      upper = M[[i]]$M0$upper
    )
  })
  m1 <- lapply(1:m, function(i) {
    start_tmp <- start[[i]]
    names_start_tmp <- names(start_tmp)
    if (!("cR" %in% M[[i]]$M1$parameters) & "cR" %in% names_start_tmp) {
      names(start_tmp)[names_start_tmp == "cR"] <- "c"
    }
    if (!("dR" %in% M[[i]]$M1$parameters) & "dR" %in% names_start_tmp) {
      names(start_tmp)[names_start_tmp == "dR"] <- "d"
    }

    estimNLR(
      y = Data[, i], match = x, group = group,
      formula = M[[i]]$M1$formula,
      method = method,
      start = structure(start_tmp[M[[i]]$M1$parameters],
        names = M[[i]]$M1$parameters
      ),
      lower = M[[i]]$M1$lower,
      upper = M[[i]]$M1$upper
    )
  })

  # convergence failures
  cf0 <- sapply(m0, is.null)
  cf1 <- sapply(m1, is.null)
  cf <- sum(cf0, cf1)

  items.cf0 <- which(cf0)
  items.cf1 <- which(cf1)
  items.cf <- sort(which(cf0 | cf1))
  # converged items
  items.conv0 <- setdiff(1:m, items.cf0)
  items.conv1 <- setdiff(1:m, items.cf1)

  # covariance structure
  cov.m0 <- cov.m1 <- as.list(rep(NA, m))
  if (method == "irls") {
    cov.m0[items.conv0] <- suppressWarnings(lapply(lapply(m0[items.conv0], summary), vcov))
    cov.m1[items.conv1] <- suppressWarnings(lapply(lapply(m1[items.conv1], summary), vcov))
  } else {
    cov.m0[items.conv0] <- suppressWarnings(lapply(m0[items.conv0], vcov, sandwich))
    cov.m1[items.conv1] <- suppressWarnings(lapply(m1[items.conv1], vcov, sandwich))
  }
  items.cov.fail0 <- which(sapply(cov.m0, is.null))
  items.cov.fail1 <- which(sapply(cov.m1, is.null))
  items.cov.fail <- sort(union(items.cov.fail0, items.cov.fail1))
  # converged items with covariances
  items.conv0 <- setdiff(items.conv0, items.cov.fail0)
  items.conv1 <- setdiff(items.conv1, items.cov.fail1)

  # standard errors
  se.m0 <- se.m1 <- as.list(rep(NA, m))
  se.m0[items.conv0] <- suppressWarnings(lapply(cov.m0[items.conv0], function(x) sqrt(diag(x))))
  se.m1[items.conv1] <- suppressWarnings(lapply(cov.m1[items.conv1], function(x) sqrt(diag(x))))

  if (length(items.conv0) > 0) {
    # map positions within the subset back to the original item indices
    items.se.fail0 <- items.conv0[sapply(se.m0[items.conv0], function(x) any(is.na(x)))]
  } else {
    items.se.fail0 <- 1:m
  }
  if (length(items.conv1) > 0) {
    items.se.fail1 <- items.conv1[sapply(se.m1[items.conv1], function(x) any(is.na(x)))]
  } else {
    items.se.fail1 <- 1:m
  }
  items.se.fail <- sort(union(items.se.fail0, items.se.fail1))
  # converged items with covariances and SEs
  items.conv0 <- setdiff(items.conv0, items.se.fail0)
  items.conv1 <- setdiff(items.conv1, items.se.fail1)

  # using starting values for bootstrapped samples
  if (initboot & (cf > 0 || length(items.cov.fail) > 0 || length(items.se.fail) > 0)) {
    items.failed0 <- setdiff(1:m, items.conv0)
    items.failed1 <- setdiff(1:m, items.conv1)

    start0 <- start1 <- start
    startBo0 <- startBo1 <- rep(0, m)
    startBo0[items.cf0] <- 1
    startBo1[items.cf1] <- 1

    i <- k <- 1 # i counts re-calculation rounds, k is the seed for bootstrap sampling
    message("Trying to recalculate starting values based on bootstrapped samples... ")

    while (length(items.failed0) > 0 || length(items.failed1) > 0) {
      # re-calculating initial values
      set.seed(k)
      samp <- sample(1:n, size = n, replace = TRUE)
      startalt <- tryCatch(
        startNLR(Data[samp, ], group[samp], model,
          match = x[samp],
          parameterization = parameterization
        ),
        error = function(e) NULL
      )
      if (is.null(startalt)) {
        k <- k + 1
        next
      }

      if (length(items.failed0) > 0) {
        start0[items.cf0] <- startalt[items.cf0]
        m0[items.cf0] <- lapply(items.cf0, function(j) {
          start_tmp <- start0[[j]]
          names_start_tmp <- names(start_tmp)
          if (!("cR" %in% M[[j]]$M0$parameters) & "cR" %in% names_start_tmp) {
            names(start_tmp)[names_start_tmp == "cR"] <- "c"
          }
          if (!("dR" %in% M[[j]]$M0$parameters) & "dR" %in% names_start_tmp) {
            names(start_tmp)[names_start_tmp == "dR"] <- "d"
          }

          estimNLR(
            y = Data[, j], match = x, group = group,
            formula = M[[j]]$M0$formula,
            method = method,
            start = structure(start_tmp[M[[j]]$M0$parameters],
              names = M[[j]]$M0$parameters
            ),
            lower = M[[j]]$M0$lower,
            upper = M[[j]]$M0$upper
          )
        })
        items.cf0 <- which(sapply(m0, is.null))
        items.conv0.new <- setdiff(items.failed0, items.cf0)

        # checking covariance for newly converged
        if (method == "irls") {
          cov.m0[items.conv0.new] <- suppressWarnings(lapply(lapply(m0[items.conv0.new], summary), vcov))
        } else {
          cov.m0[items.conv0.new] <- suppressWarnings(lapply(m0[items.conv0.new], vcov, sandwich))
        }
        items.cov.fail0 <- which(sapply(cov.m0, is.null))
        # newly converged items with covariances
        items.conv0.new <- setdiff(items.conv0.new, items.cov.fail0)

        # checking standard errors for newly converged
        se.m0[items.conv0.new] <- suppressWarnings(lapply(cov.m0[items.conv0.new], function(x) sqrt(diag(x))))
        items.se.fail0 <- which(sapply(se.m0, function(x) any(is.na(x))))
        # newly converged items with covariances and SEs
        items.conv0.new <- setdiff(items.conv0.new, items.se.fail0)

        # not successfully converged items
        items.cf0 <- sort(union(items.cf0, union(items.cov.fail0, items.se.fail0)))

        startBo0 <- cbind(startBo0, rep(0, m))
        startBo0[items.cf0, i + 1] <- 1
      }
      if (length(items.failed1) > 0) {
        start1[items.cf1] <- startalt[items.cf1]
        m1[items.cf1] <- lapply(items.cf1, function(j) {
          start_tmp <- start1[[j]]
          names_start_tmp <- names(start_tmp)
          if (!("cR" %in% M[[j]]$M1$parameters) & "cR" %in% names_start_tmp) {
            names(start_tmp)[names_start_tmp == "cR"] <- "c"
          }
          if (!("dR" %in% M[[j]]$M1$parameters) & "dR" %in% names_start_tmp) {
            names(start_tmp)[names_start_tmp == "dR"] <- "d"
          }

          estimNLR(
            y = Data[, j], match = x, group = group,
            formula = M[[j]]$M1$formula,
            method = method,
            start = structure(start_tmp[M[[j]]$M1$parameters],
              names = M[[j]]$M1$parameters
            ),
            lower = M[[j]]$M1$lower,
            upper = M[[j]]$M1$upper
          )
        })
        items.cf1 <- which(sapply(m1, is.null))
        items.conv1.new <- setdiff(items.failed1, items.cf1)

        # checking covariance for newly converged
        if (method == "irls") {
          cov.m1[items.conv1.new] <- suppressWarnings(lapply(lapply(m1[items.conv1.new], summary), vcov))
        } else {
          cov.m1[items.conv1.new] <- suppressWarnings(lapply(m1[items.conv1.new], vcov, sandwich))
        }
        items.cov.fail1 <- which(sapply(cov.m1, is.null))
        # newly converged items with covariances
        items.conv1.new <- setdiff(items.conv1.new, items.cov.fail1)

        # checking standard errors for newly converged
        se.m1[items.conv1.new] <- suppressWarnings(lapply(cov.m1[items.conv1.new], function(x) sqrt(diag(x))))
        items.se.fail1 <- which(sapply(se.m1, function(x) any(is.na(x))))
        # newly converged items with covariances and SEs
        items.conv1.new <- setdiff(items.conv1.new, items.se.fail1)

        # not successfully converged items
        items.cf1 <- sort(union(items.cf1, union(items.cov.fail1, items.se.fail1)))

        startBo1 <- cbind(startBo1, rep(0, m))
        startBo1[items.cf1, i + 1] <- 1
      }

      items.cf <- sort(union(items.cf0, items.cf1))
      items.cov.fail <- sort(union(items.cov.fail0, items.cov.fail1))
      items.se.fail <- sort(union(items.se.fail0, items.se.fail1))

      items.failed0 <- union(items.cf0, union(items.cov.fail0, items.se.fail0))
      items.failed1 <- union(items.cf1, union(items.cov.fail1, items.se.fail1))
      cf0 <- 1:m %in% items.cf0
      cf1 <- 1:m %in% items.cf1

      if (i == nrBo) {
        break
      } else {
        i <- i + 1
        k <- k + 1
      }
    }
  } else {
    startBo0 <- startBo1 <- NULL
    i <- 1
  }

  if (i > 1) {
    if (i < nrBo) {
      message("The recalculation of starting values was successful. ")
    } else if (length(items.cf) > 0) {
      message("Unfortunately, the recalculation of starting values was unsuccessful.
There are still some convergence issues.
You may try increasing the number of recalculations using the `nrBo` argument. ")
    }
  }

  if (length(items.cf) > 0) {
    msg <- ifelse(initboot, "", "\n You may try recalculating the starting values based on bootstrapped samples by using the argument `initboot = TRUE`. ")
    warning(
      paste0(
        "Convergence issues in ", ifelse(length(items.cf) > 1, "items ", "item "),
        paste0(items.cf, collapse = ", "), msg
      ),
      call. = FALSE
    )
  }
  if (length(items.cov.fail) > 0) {
    warning(paste0(
      "Covariance matrix cannot be computed for ",
      ifelse(length(items.cov.fail) > 1, "items ", "item "),
      paste(items.cov.fail, collapse = ", "), "."
    ), call. = FALSE)
  }
  if (length(items.se.fail) > 0) {
    warning(paste0(
      "Standard errors of item parameter estimates cannot be computed for ",
      ifelse(length(items.se.fail) > 1, "items ", "item "),
      paste(items.se.fail, collapse = ", "), ". \n",
      "Computed covariance", ifelse(length(items.se.fail) > 1, " matrices are", " matrix is"), " probably not positive semi-definite."
    ), call. = FALSE)
  }

  conv0 <- which(!cf0)
  conv1 <- which(!cf1)
  conv <- which(!(cf1 | cf0))

  # log-likelihood
  ll.m0 <- ll.m1 <- rep(NA, m)
  ll.m0[conv0] <- sapply(m0[conv0], logLik)
  ll.m1[conv1] <- sapply(m1[conv1], logLik)

  # parameters
  par.m0 <- lapply(1:m, function(i) {
    structure(rep(NA, length(M[[i]]$M0$parameters)),
      names = M[[i]]$M0$parameters
    )
  })
  par.m1 <- lapply(1:m, function(i) {
    structure(rep(NA, length(M[[i]]$M1$parameters)),
      names = M[[i]]$M1$parameters
    )
  })
  par.m0[conv0] <- lapply(m0[conv0], coef)
  par.m1[conv1] <- lapply(m1[conv1], coef)

  names(par.m1) <- names(par.m0) <- names(se.m1) <- names(se.m0) <- names(cov.m0) <- names(cov.m1) <- colnames(Data)

  if (method == "irls") {
    par.m0 <- lapply(par.m0, function(x) {
      names(x) <- gsub("g", "b2", gsub("x", "b1", gsub("x:g", "b3", gsub("\\(Intercept\\)", "b0", names(x)))))
      x
    })
    par.m1 <- lapply(par.m1, function(x) {
      names(x) <- gsub("g", "b2", gsub("x", "b1", gsub("x:g", "b3", gsub("\\(Intercept\\)", "b0", names(x)))))
      x
    })
    se.m0 <- lapply(se.m0, function(x) {
      names(x) <- gsub("g", "b2", gsub("x", "b1", gsub("x:g", "b3", gsub("\\(Intercept\\)", "b0", names(x)))))
      x
    })
    se.m1 <- lapply(se.m1, function(x) {
      names(x) <- gsub("g", "b2", gsub("x", "b1", gsub("x:g", "b3", gsub("\\(Intercept\\)", "b0", names(x)))))
      x
    })
    cov.m0 <- lapply(cov.m0, function(x) {
      tmp <- gsub("g", "b2", gsub("x", "b1", gsub("x:g", "b3", gsub("\\(Intercept\\)", "b0", rownames(x)))))
      rownames(x) <- colnames(x) <- tmp
      x
    })
    cov.m1 <- lapply(cov.m1, function(x) {
      tmp <- gsub("g", "b2", gsub("x", "b1", gsub("x:g", "b3", gsub("\\(Intercept\\)", "b0", rownames(x)))))
      rownames(x) <- colnames(x) <- tmp
      x
    })
  }

  # test
  n0 <- sapply(1:m, function(i) length(M[[i]]$M0$parameters))
  n1 <- sapply(1:m, function(i) length(M[[i]]$M1$parameters))
  df <- cbind(n1 - n0, n - n1)

  if (test == "F") {
    pval <- Fval <- rep(NA, m)

    RSS0 <- rep(NA, m)
    RSS1 <- rep(NA, m)
    RSS0[conv] <- sapply(conv, function(l) sum(residuals(m0[[l]])^2))
    RSS1[conv] <- sapply(conv, function(l) sum(residuals(m1[[l]])^2))

    Fval[conv] <- sapply(
      conv,
      function(l) ((RSS0[l] - RSS1[l]) / df[l, 1]) / (RSS1[l] / df[l, 2])
    )
    pval[conv] <- sapply(
      conv,
      function(l) (1 - pf(Fval[l], df[l, 1], df[l, 2]))
    )
  } else if (test == "LR") {
    df <- df[, 1]
    pval <- LRval <- rep(NA, m)

    LRval[conv] <- sapply(
      conv,
      function(l) -2 * c(logLik(m0[[l]]) - logLik(m1[[l]]))
    )
    pval[conv] <- sapply(
      conv,
      function(l) (1 - pchisq(LRval[l], df[l]))
    )
  } else if (test == "W") {
    df <- df[, 1]
    pval <- Wval <- rep(NA, m)

    Wval[conv] <- sapply(
      conv,
      function(l) {
        nams <- which(M[[l]]$M1$parameters %in% setdiff(M[[l]]$M1$parameters, M[[l]]$M0$parameters))
        V <- cov.m1[[l]][nams, nams]
        par <- par.m1[[l]][nams]
        par %*% solve(V) %*% par
      }
    )
    pval[conv] <- sapply(
      conv,
      function(l) (1 - pchisq(Wval[l], df[l]))
    )
  }
  # adjusted p-values
  adjusted.pval <- p.adjust(pval, method = p.adjust.method)

  # adjusting asymptote parameters
  for (i in 1:m) {
    if ("cF" %in% names(par.m0[[i]]) | "dF" %in% names(par.m0[[i]])) {
      adj.par.m0 <- .deltamethod.NLR.asymptotes(
        par = par.m0[[i]], cov = cov.m0[[i]],
        conv = (i %in% conv0),
        cov_fail = (i %in% items.cov.fail0)
      )
      par.m0[[i]] <- adj.par.m0[["par"]]
      cov.m0[[i]] <- adj.par.m0[["cov"]]
      se.m0[[i]] <- adj.par.m0[["se"]]
    }

    if ("cF" %in% names(par.m1[[i]]) | "dF" %in% names(par.m1[[i]])) {
      adj.par.m1 <- .deltamethod.NLR.asymptotes(
        par = par.m1[[i]], cov = cov.m1[[i]],
        conv = (i %in% conv1),
        cov_fail = (i %in% items.cov.fail1)
      )
      par.m1[[i]] <- adj.par.m1[["par"]]
      cov.m1[[i]] <- adj.par.m1[["cov"]]
      se.m1[[i]] <- adj.par.m1[["se"]]
    }
  }

  results <- list(
    Sval = switch(test,
      "F" = Fval,
      "LR" = LRval,
      "W" = Wval
    ),
    pval = pval, adjusted.pval = adjusted.pval,
    df = df, test = test,
    par.m0 = par.m0, se.m0 = se.m0, cov.m0 = cov.m0,
    par.m1 = par.m1, se.m1 = se.m1, cov.m1 = cov.m1,
    cf = sum(cf0, cf1), cf.which = items.cf,
    ll.m0 = ll.m0, ll.m1 = ll.m1,
    startBo0 = startBo0, startBo1 = startBo1
  )
  return(results)
}

#' @noRd
.deltamethod.NLR.is2irt <- function(par, cov, conv, cov_fail) {
  # for Rasch model, IS and IRT is the same
  if (length(par) == 1L && names(par) == "b0") {
    names(par) <- "b"
    cov <- as.matrix(cov) # to be able to set dimnames
    dimnames(cov) <- list("b", "b")
    return(list(par = par, cov = cov, se = sqrt(cov)))
  }

  par_names <- which(c("b0", "b1", "b2", "b3", "c", "cDif", "d", "dDif") %in% names(par))

  new_order <- sapply(c("a", "b", "aDif", "bDif", "c", "cDif", "d", "dDif"), function(x) {
    which(x == c("b", "a", "bDif", "aDif", "c", "cDif", "d", "dDif")[par_names])
  })
  new_order <- unlist(new_order[sapply(new_order, function(x) length(x) > 0)])
  # TODO: check whether this works for all models with b1 = 1
  par_tmp <- setNames(
    c(c(0, 1), rep(0, 4), rep(1, 2)),
    c("b0", "b1", "b2", "b3", "c", "cDif", "d", "dDif")
  )
  par_tmp[par_names] <- par
  par_new <- setNames(
    c(
      -par_tmp[1] / par_tmp[2],
      par_tmp[2],
      (par_tmp[1] * par_tmp[4] - par_tmp[2] * par_tmp[3]) / (par_tmp[2] * (par_tmp[2] + par_tmp[4])),
      par_tmp[4],
      par_tmp[5],
      par_tmp[6],
      par_tmp[7],
      par_tmp[8]
    ),
    c("b", "a", "bDif", "aDif", "c", "cDif", "d", "dDif")
  )[par_names]

  if (cov_fail | !conv) {
    npar <- length(par_new)
    se_new <- setNames(rep(NA, npar), names(par_new)[new_order])
    cov_new <- matrix(
      NA,
      ncol = npar, nrow = npar,
      dimnames = list(
        names(par_new)[new_order],
        names(par_new)[new_order]
      )
    )
  } else {
    cov_tmp <- matrix(
      0,
      ncol = 8, nrow = 8,
      dimnames = list(
        c("b0", "b1", "b2", "b3", "c", "cDif", "d", "dDif"),
        c("b0", "b1", "b2", "b3", "c", "cDif", "d", "dDif")
      )
    )
    cov_tmp[par_names, par_names] <- cov
    cov_new <- msm::deltamethod(
      list(
        ~ -x1 / x2, ~x2, ~ (x1 * x4 - x2 * x3) / (x2 * (x2 + x4)), ~x4,
        ~x5, ~x6, ~x7, ~x8
      ),
      par_tmp,
      cov_tmp,
      ses = FALSE
    )[par_names, par_names]
    cov_new <- matrix(cov_new, nrow = length(par_names), ncol = length(par_names))
    colnames(cov_new) <- rownames(cov_new) <- c("b", "a", "bDif", "aDif", "c", "cDif", "d", "dDif")[par_names]
    cov_new <- matrix(cov_new[new_order, new_order],
      nrow = length(par_names), ncol = length(par_names),
      dimnames = list(rownames(cov_new)[new_order], colnames(cov_new)[new_order])
    )
    se_new <- sqrt(diag(cov_new))
  }

  return(list(par = par_new[new_order], cov = cov_new, se = se_new))
}
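
# A standalone sketch of the same delta-method step (kept as comments so it
# is not executed; the parameter values are hypothetical), assuming a
# converged 2PL fit with intercept-slope estimates b0, b1, b2, b3:
#   par <- c(b0 = -0.5, b1 = 1.2, b2 = 0.3, b3 = -0.2)
#   cov <- diag(0.01, 4)
#   msm::deltamethod(
#     list(~ -x1 / x2, ~x2, ~ (x1 * x4 - x2 * x3) / (x2 * (x2 + x4)), ~x4),
#     par, cov,
#     ses = FALSE
#   ) # covariance matrix of (b, a, bDif, aDif)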


#' @noRd
.deltamethod.NLR.asymptotes <- function(par, cov, conv, cov_fail) {
  # this function is executed only when cF or dF is present in parameters
  if ("c" %in% names(par)) {
    names(par)[names(par) == "c"] <- "cR"
    colnames(cov)[colnames(cov) == "c"] <- "cR"
    rownames(cov)[rownames(cov) == "c"] <- "cR"
  }
  if ("d" %in% names(par)) {
    names(par)[names(par) == "d"] <- "dR"
    colnames(cov)[colnames(cov) == "d"] <- "dR"
    rownames(cov)[rownames(cov) == "d"] <- "dR"
  }
  par_names <- which(c("b0", "b1", "b2", "b3", "cR", "cF", "dR", "dF") %in% names(par))
  par_tmp <- setNames(
    c(c(0, 1), rep(0, 4), rep(1, 2)),
    c("b0", "b1", "b2", "b3", "cR", "cF", "dR", "dF")
  )
  par_tmp[par_names] <- par
  par_new <- setNames(
    c(
      par_tmp[1], # b0
      par_tmp[2], # b1
      par_tmp[3], # b2
      par_tmp[4], # b3
      par_tmp[5], # c = cR
      par_tmp[6] - par_tmp[5], # cDif = cF - cR
      par_tmp[7], # d = dR
      par_tmp[8] - par_tmp[7] # dDif = dF - dR
    ),
    c("b0", "b1", "b2", "b3", "c", "cDif", "d", "dDif")
  )[par_names]

  if (cov_fail | !conv) {
    npar <- length(par_new)
    se_new <- setNames(rep(NA, npar), names(par_new))
    cov_new <- matrix(
      NA,
      ncol = npar, nrow = npar,
      dimnames = list(
        names(par_new),
        names(par_new)
      )
    )
  } else {
    cov_tmp <- matrix(
      0,
      ncol = 8, nrow = 8,
      dimnames = list(
        c("b0", "b1", "b2", "b3", "c", "cDif", "d", "dDif"),
        c("b0", "b1", "b2", "b3", "c", "cDif", "d", "dDif")
      )
    )
    cov_tmp[par_names, par_names] <- cov
    cov_new <- msm::deltamethod(
      list(
        ~x1, ~x2, ~x3, ~x4,
        ~x5, ~ x6 - x5, ~x7, ~ x8 - x7
      ),
      par_tmp,
      cov_tmp,
      ses = FALSE
    )[par_names, par_names]
    cov_new <- matrix(cov_new, nrow = length(par_names), ncol = length(par_names))
    colnames(cov_new) <- rownames(cov_new) <- c("b0", "b1", "b2", "b3", "c", "cDif", "d", "dDif")[par_names]
    se_new <- sqrt(diag(cov_new))
  }

  return(list(par = par_new, cov = cov_new, se = se_new))
}
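
# Illustrative note (hypothetical values): for asymptote parameters cR and cF,
# the re-parameterization above gives c = cR and cDif = cF - cR, so by the
# delta method var(cDif) = var(cR) + var(cF) - 2 * cov(cR, cF).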