# Nothing
# Basic behaviour of tokens_subset(): selection by a docvar expression or by a
# logical vector, the effect of drop_docid on docid levels, the verbose
# message, and the warning raised for an unused argument.
test_that("tokens_subset works in a basic way", {
  inaug <- corpus_subset(data_corpus_inaugural, Year > 1980 & Year < 2018)
  toks <- tokens(inaug)

  # Subsetting on a docvar condition.
  recent <- tokens_subset(toks, Year > 2000)
  expect_equal(ndoc(recent), 5)

  # drop_docid = TRUE: only the levels of the retained documents remain.
  dropped <- tokens_subset(toks, Year > 2000, drop_docid = TRUE)
  expect_equal(length(levels(docid(dropped))), 5)

  # drop_docid = FALSE: all levels of the original object are kept.
  kept <- tokens_subset(toks, Year > 2000, drop_docid = FALSE)
  expect_equal(length(levels(docid(kept))), 10)

  # Subsetting on a character docvar.
  clinton <- tokens_subset(toks, President == "Clinton")
  expect_equal(docnames(clinton), c("1993-Clinton", "1997-Clinton"))

  # Subsetting with an explicit logical vector (first two documents only).
  reagan <- tokens_subset(toks, rep(c(TRUE, FALSE), times = c(2, 8)))
  expect_equal(docnames(reagan), c("1981-Reagan", "1985-Reagan"))

  # verbose = TRUE emits a progress message.
  expect_message(
    tokens_subset(toks, Year > 2000, verbose = TRUE),
    "Apply tokens_subset()"
  )

  # Arguments that are not recognised trigger a warning.
  expect_warning(
    tokens_subset(toks, Year > 2000, something = 10),
    "something argument is not used.",
    fixed = TRUE
  )
})
# Document variables must stay aligned with the documents when a tokens object
# is reduced to its first five documents.
test_that("tokens_subset works with docvars", {
  post_1900 <- corpus_subset(data_corpus_inaugural, Year > 1900)
  toks <- tokens(post_1900)

  first_five <- head(toks, 5)
  presidents <- docvars(first_five)[["President"]]

  expect_equal(
    presidents,
    c("McKinley", "Roosevelt", "Taft", "Wilson", "Wilson")
  )
})
# min_ntoken / max_ntoken must select the same documents as the equivalent
# explicit conditions on ntoken(), and invalid values must be rejected.
test_that("tokens_subset works with min_ntoken and max_ntoken", {
  toks <- tokens(corpus_subset(data_corpus_inaugural, Year > 1900))

  # Lower bound only (inclusive).
  expect_equal(
    tokens_subset(toks, 1000 <= ntoken(toks)),
    tokens_subset(toks, min_ntoken = 1000)
  )

  # Upper bound only (inclusive).
  expect_equal(
    tokens_subset(toks, ntoken(toks) <= 3000),
    tokens_subset(toks, max_ntoken = 3000)
  )

  # Both bounds combined with a docvar condition. The reference expression
  # must apply the upper bound as well; previously the lower bound was written
  # twice, so max_ntoken was never actually checked here.
  expect_equal(
    tokens_subset(toks, Year > 2000 & 1000 <= ntoken(toks) & ntoken(toks) <= 3000),
    tokens_subset(toks, Year > 2000, min_ntoken = 1000, max_ntoken = 3000)
  )

  # Argument validation: values must be non-negative scalars.
  expect_error(
    tokens_subset(toks, min_ntoken = -1),
    "The value of min_ntoken must be between 0 and Inf"
  )
  expect_error(
    tokens_subset(toks, min_ntoken = c(10, 20)),
    "The length of min_ntoken must be 1"
  )
  expect_error(
    tokens_subset(toks, max_ntoken = -1),
    "The value of max_ntoken must be between 0 and Inf"
  )
  expect_error(
    tokens_subset(toks, max_ntoken = c(10, 20)),
    "The length of max_ntoken must be 1"
  )
})
# Any scripts or data that you put into this service are public.
# Add the following code to your website.
# For more information on customizing the embed code, read Embedding Snippets.