# R/df2token.R
#
# Defines functions: df2token
#
# Documented in: df2token

#' Convert a data frame column to a list of tokens, grouped by column(s).
#'
#' Splits the values of the `token` column into a named list with one element
#' per unique combination of the `by` columns. The group key is built by
#' pasting the `by` values of each row together with `":"`; these keys become
#' the names of the returned list.
#'
#' @name df2token
#' @param df A data frame.
#' @param token Name of the column to be tokenized, as a single string.
#' @param by Name(s) of the column(s) used to group the tokens, as a
#'   character vector. Defaults to `"doc_id"`.
#' @return A named list with one element per group. Each element holds the
#'   `token` values of that group in their original row order. Elements are
#'   ordered as `split()` orders them (by sorted group key).
#'
#' @examples
#' df <- data.frame(
#'   doc_id = c("d1", "d1", "d2"),
#'   token = c("a", "b", "c")
#' )
#' df2token(df, token = "token")
#'
#' @export
#' @rdname df2token
#'
df2token <- function(df,
                     token,
                     by = c("doc_id")) {

  if (length(token) != 1L) {
    stop("`token` must name exactly one column.", call. = FALSE)
  }
  if (length(by) == 0L) {
    stop("`by` must name at least one grouping column.", call. = FALSE)
  }

  values <- df[[token]]
  if (is.null(values)) {
    stop("Column `", token, "` not found in `df`.", call. = FALSE)
  }

  # Extract each grouping column; `unname()` keeps names on `by` from being
  # forwarded to `paste()` as argument names.
  group_cols <- lapply(unname(by), function(col) df[[col]])

  # A missing column comes back as NULL, which `paste()` would silently treat
  # as "" and yield malformed keys -- fail loudly instead.
  not_found <- vapply(group_cols, is.null, logical(1))
  if (any(not_found)) {
    stop(
      "Grouping column(s) not found in `df`: ",
      paste(by[not_found], collapse = ", "),
      call. = FALSE
    )
  }

  # Keep the key in a local vector rather than writing it into `df`, so it can
  # never overwrite an existing column (including the token column itself).
  group_id <- do.call(paste, c(group_cols, sep = ":"))

  split(values, group_id)
}
# jaytimm/text2df documentation built on July 21, 2023, 1:58 a.m.