R/corpusSetup.R

Defines functions basicCorpus processCorpus process_addNwords process_addID

Documented in basicCorpus

process_addID <- function(corpus) {
  if ("ShinyConc.ID" %in% colnames(corpus))
    return(corpus)
  corpus$ShinyConc.ID <- 1:nrow(corpus)
  corpus
}

process_addNwords <- function(corpus, type){
  if (identical(type, "pair")) {
    if (all(c("ShinyConc.nWordsQ", "ShinyConc.nWordsA")  %in% colnames(corpus)))
      return(corpus)
    corpus$ShinyConc.nWordsQ <- stringr::str_count(corpus$Q, "\\w+")
    corpus$ShinyConc.nWordsA <- stringr::str_count(corpus$A, "\\w+")
  } else {
      if ("ShinyConc.nWords" %in% colnames(corpus))
        return(corpus)
      corpus$ShinyConc.nWords <- stringr::str_count(corpus$text, "\\w+")
  }
  corpus
}

processCorpus <- function(corpus, type="line") {
  corpus <- process_addNwords(corpus, type)
  corpus <- process_addID(corpus)
}




#' Basic corpus intialization
#'
#' @param corpusdf
#' @param KWICcolselect
#'
#' @return
#' @export
#'
#' @examples
basicCorpus <- function(corpusdf, KWICcolselect = "ID", type="line") {
  corp <- structure(list(), class="basicCorpus")
  corp$corpus <- processCorpus(corpusdf, type)
  corp$KWICcolselect <- KWICcolselect
  corp
}
cwolk/ShinyConc documentation built on April 9, 2021, 1:43 p.m.