rjafroc: Artificial Intelligence Systems and Observer Performance

Documented in DfExtractDataset

#' Extract a subset of treatments and readers from a dataset
#' 
#' @description Extract a dataset consisting of a subset of treatments/readers from a larger dataset 
#' 
#' 
#' @param dataset The original dataset from which the subset is to be extracted
#' @param trts A vector contains the indices of the treatments to be extracted. 
#'    \strong{If this parameter is not supplied, all treatments are extracted.}
#' @param rdrs A vector contains the indices of the readers to be extracted. 
#'    \strong{If this parameter is not supplied, all readers are extracted.}
#' 
#' @return A dataset containing only the specified treatments and readers that were
#' extracted from the original dataset
#' 
#' @details \strong{Note} that \code{trts} and \code{rdrs} are the vectors of \strong{indices} 
#'    not \strong{IDs}. For example, if the ID of the first reader is "0", the 
#'    corresponding value in \code{trts} should be \strong{1}  not \strong{0}.
#' 
#' @examples 
#' ## Extract the data corresponding to the second reader in the 
#' ## first modality from an included ROC dataset
#' ds1 <- DfExtractDataset(dataset05, trts = 1, rdrs = 2)
#' 
#' ## Extract the data of the first and third reader in all 
#' ## modality from the included ROC dataset
#' ds2 <- DfExtractDataset(dataset05, rdrs = c(1, 3))
#' 
#' @export

DfExtractDataset <- function(dataset, trts, rdrs) {
  
  
  I <- length(dataset$descriptions$modalityID)
  if (!missing(trts)){
    if (all(trts <= I)){
      I <- length(trts)
    }else{
      stop("Modality index/indices cannot exceed the total number of treatments in the original dataset.")
    }
  }else{
    trts <- 1:I
  }
  
  J <- length(dataset$ratings$NL[1,,1,1])
  if (!missing(rdrs)){
    if (all(rdrs <= J)){
      J <- length(rdrs)
    }else{
      stop("Reader index/indices cannot exceed the total number of readers in the original dataset.")
    }
  }else{
    rdrs <- 1:J
  }
  
  K <- dim(dataset$ratings$NL)[3]
  K2 <- dim(dataset$ratings$LL)[3]
  
  NL <- dataset$ratings$NL[trts, rdrs, , , drop = FALSE]
  maxNL <- length(NL[1,1,1,]) # determine this from the extracted values
  dim(NL) <- c(I, J, K, maxNL)
  
  LL <- dataset$ratings$LL[trts, rdrs, , , drop = FALSE]
  maxLL <- length(LL[1,1,1,]) # determine this from the extracted values
  dim(LL) <- c(I, J, K2, maxLL)
  
  if (is.numeric(dataset$ratings$LL_IL)) {
    LL_IL <- dataset$ratings$LL_IL[trts, rdrs, , 1]
    dim(LL_IL) <- c(I, J, K2, 1)
  } else LL_IL <- NA
  
  modalityID <- dataset$descriptions$modalityID[trts]
  readerID <- dataset$descriptions$readerID[rdrs]
  
  # start code fix issue T1-RRRC for ROC data #73 
  # if (is.numeric(dataset$descriptions$truthTableStr)) {
  #   truthTableStr <- dataset$descriptions$truthTableStr[trts,rdrs,,,drop=FALSE]
  # } else truthTableStr <- NA
  if (!all(is.na(dataset$descriptions$truthTableStr))) {
    truthTableStr <- dataset$descriptions$truthTableStr[trts,rdrs,,,drop=FALSE]
  } else truthTableStr <- NA
  # end code fix issue T1-RRRC for ROC data #73 
  
  fileName <- paste0("DfExtractDataset(", dataset$descriptions$fileName,")")
  name <- dataset$descriptions$name
  design <- dataset$descriptions$design
  type <- dataset$descriptions$type
  perCase <- dataset$lesions$perCase
  IDs <- dataset$lesions$IDs
  weights <- dataset$lesions$weights
  
  return(convert2dataset(NL, LL, LL_IL, 
                         perCase, IDs, weights,
                         fileName, type, name, truthTableStr, design,
                         modalityID, readerID))
}