test_1_1_topicsGrams.R
In topics: Creating and Significance Testing Language Features for Visualisation

library(testthat)
library(topics)
library(tibble)

#test_that("topicsGrams with default parameters", {
#
#  testthat::skip_on_cran()
#  
#  ngrams <- topics::topicsGrams(
#    data = dep_wor_data$Worphrase, 
#    ngram_window = c(1,3),
#    stopwords = stopwords::stopwords("en", source = "snowball"),
#    pmi_threshold = 0, 
#    top_frequent = NULL)
#  
#  testthat::expect_true(is.list(ngrams))
#  testthat::expect_true(is_tibble(ngrams$ngrams))
#  testthat::expect_true(is_tibble(ngrams$freq_per_user))
#  
#  testthat::expect_equal(unname(ngrams$ngrams$ngrams[1:5]),
#    unname(c("anxious", "worried", "scared", "nervous", "concerned")))
#  
#  testthat::expect_equal(ngrams$ngrams$freq[1:5], c(174, 125, 63, 57, 50))
#  testthat::expect_equal(ngrams$ngrams$prop[1:5], c(0.04763208, 0.03421845, 0.01724610, 0.01560361, 0.01368738), tolerance = 0.0001)
#  testthat::expect_equal(ngrams$ngrams$prevalence[1:5], c(0.027588394, 0.019819248, 0.009988901, 0.009037577, 0.007927699), tolerance = 0.0001)
#  testthat::expect_equal(ngrams$ngrams$pmi[3000:3005], c(12.916076, 17.390007, 10.709120, 20.596543,  7.938796, 17.048970), tolerance = 0.0001)
#  testthat::expect_equal(ngrams$freq_per_user$worried[1:5], c(0.000, 0.000, 0.000, 0.000, 0.008), tolerance = 0.0001)
#  testthat::expect_equal(ngrams$freq_per_user$concerned[1:5], c(0.00, 0.00, 0.00, 0.02, 0.00), tolerance = 0.0001)
#  
#  testthat::expect_equal(ngrams$stats$initial_count[[1]], 1225)
#  testthat::expect_equal(ngrams$stats$initial_count[[2]], 2636)
#  testthat::expect_equal(ngrams$stats$pmi_removed[[1]], 0)
#  testthat::expect_equal(ngrams$stats$final_count[[1]], 1225)
#  
#})

test_that("topicsGrams with default parameters", {
  
  testthat::skip_on_cran()
  
  ngrams <- topics::topicsGrams(
    data = dep_wor_data$Worphrase, 
    ngram_window = c(1,3),
    stopwords = NULL,
    pmi_threshold = NULL)
  
  testthat::expect_true(is.list(ngrams))
  testthat::expect_true(is_tibble(ngrams$ngrams))
  testthat::expect_true(is_tibble(ngrams$freq_per_user))
})



test_that("topicsGrams with selection parameters", {
  
  testthat::skip_on_cran()
  
  ngrams <- topics::topicsGrams(
    data = dep_wor_data$Worphrase[1:100], 
    ngram_window = c(1,2),
    stopwords::stopwords("en", source = "snowball"),
    pmi_threshold = 1, 
    top_frequent = 100
    )
  
  testthat::expect_true(is.list(ngrams))
  testthat::expect_true(is_tibble(ngrams$ngrams))
  testthat::expect_true(is_tibble(ngrams$freq_per_user))
})

test_that("topicsGrams with occurance rate", {
  
  testthat::skip_on_cran()
  
  ngrams <- topics::topicsGrams(
    data = dep_wor_data$Worphrase[1:100], 
    ngram_window = c(1,3),
    stopwords = NULL,
    pmi_threshold = NULL,
    occurance_rate = 0.05)
  
  testthat::expect_true(is.list(ngrams))
  testthat::expect_true(is_tibble(ngrams$ngrams))
  testthat::expect_true(is_tibble(ngrams$freq_per_user))
})

test_that("topicsGrams with removal mode: term", {
  
  testthat::skip_on_cran()
  
  ngrams <- topics::topicsGrams(
    data = dep_wor_data$Worphrase[1:100], 
    ngram_window = c(1,3),
    stopwords = NULL,
    pmi_threshold = NULL,
    removal_mode = "term",
    removal_rate_most = 1,
    removal_rate_least = 1)
  
  testthat::expect_true(is.list(ngrams))
  testthat::expect_true(is_tibble(ngrams$ngrams))
  testthat::expect_true(is_tibble(ngrams$freq_per_user))
})

test_that("topicsGrams with removal mode: frequency", {
  
  testthat::skip_on_cran()
  
  ngrams <- topics::topicsGrams(
    data = dep_wor_data$Worphrase[1:100], 
    ngram_window = c(1,3),
    stopwords = NULL,
    pmi_threshold = NULL,
    removal_mode = "frequency",
    removal_rate_most = 30,
    removal_rate_least = 1)
  
  testthat::expect_true(is.list(ngrams))
  testthat::expect_true(is_tibble(ngrams$ngrams))
  testthat::expect_true(is_tibble(ngrams$freq_per_user))
})

test_that("topicsGrams with removal mode: percentage", {
  
  testthat::skip_on_cran()
  
  ngrams <- topics::topicsGrams(
    data = dep_wor_data$Worphrase[1:100], 
    ngram_window = c(1,3),
    stopwords = NULL,
    pmi_threshold = NULL,
    removal_mode = "percentage",
    removal_rate_most = 0.01,
    removal_rate_least = 0.01)
  
  testthat::expect_true(is.list(ngrams))
  testthat::expect_true(is_tibble(ngrams$ngrams))
  testthat::expect_true(is_tibble(ngrams$freq_per_user))
})

Any scripts or data that you put into this service are public.

topics documentation built on Aug. 29, 2025, 5:15 p.m.

rdrr.io home R language documentation Run R code online

CRAN packages Bioconductor packages R-Forge packages GitHub packages

Note that we can't provide technical support on individual packages. You should contact the package authors for that.

topics
Creating and Significance Testing Language Features for Visualisation

tests/testthat/test_1_1_topicsGrams.R
In topics: Creating and Significance Testing Language Features for Visualisation

Try the topics package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

topics Creating and Significance Testing Language Features for Visualisation

tests/testthat/test_1_1_topicsGrams.R In topics: Creating and Significance Testing Language Features for Visualisation

Try the topics package in your browser

R Package Documentation

Browse R Packages

We want your feedback!

topics
Creating and Significance Testing Language Features for Visualisation

tests/testthat/test_1_1_topicsGrams.R
In topics: Creating and Significance Testing Language Features for Visualisation