# tests/testthat/test_terms.R

# Attach polmineR so that its functions are on the search path.
library(polmineR)
# NOTE(review): presumably makes the REUTERS corpus shipped with the RcppCWB
# package available for the tests below -- confirm against the use() docs.
use(pkg = "RcppCWB", corpus = "REUTERS")

# Label the expectations in this file as belonging to the "terms-method"
# context.
# NOTE(review): context() is deprecated in the testthat 3rd edition -- confirm
# which edition this package targets before touching this call.
testthat::context("terms-method")

test_that("terms-method for partition, without/with regex", {
  # Partition of REUTERS restricted to places = "kuwait"; every expectation
  # in this test is evaluated against this one object.
  kuwait <- partition("REUTERS", places = "kuwait")

  # No regex supplied: check the total number of characters across all
  # returned terms instead of spelling out the full vector.
  all_terms <- terms(kuwait, p_attribute = "word")
  n_chars <- nchar(paste(all_terms, collapse = ""))
  expect_equal(n_chars, 377)

  # A single regular expression.
  o_terms <- terms(kuwait, p_attribute = "word", regex = "^o.*$")
  expect_equal(o_terms, c("oil", "of", "one", "over"))

  # Two regular expressions passed together as one character vector.
  patterns <- c("^o.*$", "^p.*")
  op_terms <- terms(kuwait, p_attribute = "word", regex = patterns)
  expect_equal(
    op_terms,
    c("oil", "of", "one", "over", "plans", "prices", "pumping")
  )
})

test_that("terms-method for subcorpus", {
  # Build the object under test by piping the REUTERS corpus into subset()
  # with places = "kuwait".
  reuters <- corpus("REUTERS")
  kuwait_sc <- reuters %>% subset(places = "kuwait")

  # Two regular expressions passed together as one character vector.
  patterns <- c("^o.*$", "^p.*")
  matched <- terms(kuwait_sc, p_attribute = "word", regex = patterns)

  expect_equal(
    matched,
    c("oil", "of", "one", "over", "plans", "prices", "pumping")
  )
})


test_that("terms-method for character/corpus, with regex", {
  # The corpus is addressed by its ID (a length-one character vector).
  corpus_id <- "REUTERS"

  # No regex supplied: check the total number of characters across all
  # returned terms instead of spelling out the full vector.
  all_terms <- terms(corpus_id, p_attribute = "word")
  n_chars <- nchar(paste(all_terms, collapse = ""))
  expect_equal(n_chars, 7451)

  # A single regular expression.
  y_terms <- terms(corpus_id, p_attribute = "word", regex = "^y.*$")
  y_expected <- c(
    "you", "year", "yesterday's", "yesterday", "year's", "years"
  )
  expect_equal(y_terms, y_expected)

  # Two regular expressions passed together as one character vector.
  patterns <- c("^oi.*$", "^barrel.*")
  oil_terms <- terms(corpus_id, p_attribute = "word", regex = patterns)
  expect_equal(oil_terms, c("oil", "barrel", "barrels"))
})
# PolMine/polmineR documentation built on Nov. 9, 2023, 8:07 a.m.