# Nothing
library(quanteda)
# Shared fixtures for the split_segments tests ----
context("split_segments")

# Load `data_corpus_inaugural` and keep its first six documents
# (six is the default for head()).
data(data_corpus_inaugural)
corpus <- head(data_corpus_inaugural, n = 6L)

# Plain character version of the first document of that subset.
corpus_texts <- as.character(corpus)
text <- corpus_texts[[1]]

# Segment the single text and the corpus once; the tests below reuse
# both results.
split_char <- split_segments(text)
split_quanteda <- split_segments(corpus)
test_that("split_segments.character is ok", {
  # Segmentation of the first corpus document with the default arguments.
  expect_length(split_char, 37)
  expect_equal(
    split_char[1],
    "Fellow-Citizens of the Senate and of the House of Representatives:\n\nAmong the vicissitudes incident to life no event could have filled me with greater anxieties than that of which the notification was transmitted by your order, and received on the 14th day of the present month."
  )

  # With the default arguments these inputs come back as one unchanged segment.
  short_text <- "One more test."
  expect_equal(split_segments(short_text), short_text)

  french_text <- "J'apprends des techniques d'écriture. Cela me permet d'écrire autre choses que des lettres ou un récit de ma vie/journal_intime. Cela donne des idées pour écrire des fictions, sortir de son quotidien. J'aime bien l'effort intellectuel que cela demande. C'est un rendez-vous apaisant."
  expect_equal(split_segments(french_text), french_text)

  # The same sentence segmented with different second and third arguments.
  cool <- "Cool ! Cool cool cool."
  expect_equal(split_segments(cool), cool)

  expect_equal(
    split_segments(cool, 1),
    c("Cool", "!", "Cool", "cool", "cool.")
  )
  expect_equal(
    split_segments(cool, 1, 1),
    c("Cool !", "Cool", "cool cool.")
  )
  expect_equal(
    split_segments(cool, 1, 2),
    c("Cool !", "Cool cool cool.")
  )

  expect_equal(
    split_segments(cool, 2),
    c("Cool !", "Cool cool", "cool.")
  )
  expect_equal(
    split_segments(cool, 2, 2),
    c("Cool !", "Cool cool cool.")
  )

  expect_equal(
    split_segments(cool, 3),
    c("Cool !", "Cool cool cool.")
  )
  expect_equal(split_segments(cool, 3, 2), c("Cool ! Cool cool cool."))
  expect_equal(split_segments(cool, 3, 3), cool)
})
test_that("split_segments.Corpus is ok", {
  # tm is an optional dependency: skip the whole test when it is missing.
  # No further requireNamespace() guard is needed after this skip; such a
  # guard could only turn the test into a silently empty one.
  skip_if_not_installed("tm")

  # Segment the `acq` dataset shipped with tm.
  data(acq, package = "tm")
  split_tm <- split_segments(acq)
  expect_equal(ndoc(split_tm), 188)

  # The remaining expectations are only run with quanteda >= 2.0.0.
  skip_if(utils::packageVersion("quanteda") < "2.0.0")
  expect_equal(docvars(split_tm, "segment_source")[1], "reut-00001.xml")
  expect_equal(docnames(split_tm)[1], "reut-00001.xml_1")
})
test_that("split_segments.corpus is ok", {
  # Number of segments produced for the six-document corpus fixture.
  expect_equal(ndoc(split_quanteda), 229)

  # The first segment records its source document in `segment_source`.
  first_source <- docvars(split_quanteda, "segment_source")[1]
  expect_equal(first_source, "1789-Washington")

  # Name of the first segment.
  first_name <- docnames(split_quanteda)[1]
  expect_equal(first_name, "1789-Washington_1")
})
test_that("split_segments input checking is ok", {
  # Each method is called directly with an integer vector and must error.
  bad_input <- 1:10

  expect_error(rainette:::split_segments.character(bad_input))
  expect_error(rainette:::split_segments.corpus(bad_input))
  expect_error(rainette:::split_segments.Corpus(bad_input))
})
# Any scripts or data that you put into this service are public.
# Add the following code to your website.
# For more information on customizing the embed code, read Embedding Snippets.