# Benchmark setup: attach quanteda, set its thread option, and build the
# tokens object `toks` that the benchmarks below operate on.
# library() stops with an error when the package is missing; require() would
# only return FALSE and let the script fail later at the first quanteda call.
library(quanteda)
quanteda_options(threads = 8)

# Benchmark input: tokens built from the corpus stored in the RDS file.
# NOTE(review): absolute, machine-specific path -- adjust before running
# on another machine.
corp <- readRDS("/home/kohei/Documents/Brexit/Data/data_corpus_guardian_2016-2017.RDS")
toks_guard <- tokens(corp)
toks <- toks_guard

# Alternative input. It used to be tokenized and then immediately overwritten
# by `toks_guard`, so the work was discarded; it is left disabled here.
# `data_corpus_irishbudget2010` is not defined in this script -- presumably a
# dataset provided by an attached package; confirm before enabling.
# toks <- tokens(data_corpus_irishbudget2010)
# Profile splitting the tokens in `toks` on the "-" separator.
profvis::profvis({
  tokens_split(toks, separator = "-")
})
# Time replacing multi-word (phrase) patterns with multi-word replacements,
# using case-sensitive matching; the expression is evaluated 10 times.
microbenchmark::microbenchmark(
  tokens_replace(
    toks,
    pattern = phrase(c("this is", "that is", "it is")),
    replacement = phrase(c("this was", "that was", "it was")),
    case_insensitive = FALSE
  ),
  times = 10
)
# Benchmark and profile stemming done through tokens_replace(): each type in
# `toks` is used as a pattern and its stem as the replacement.
#
# `type` and `stem` were used below without being defined anywhere in this
# script (`type` would raise "object not found"; `stem` would resolve to the
# graphics::stem function), so the pattern/replacement vectors are built here.
type <- types(toks)
stem <- char_wordstem(type, "porter")

# Compare the matching modes; each expression is evaluated once (times = 1).
# The expressions are labelled so the result table is readable.
microbenchmark::microbenchmark(
  fixed_insensitive = tokens_replace(toks, type, stem, "fixed",
                                     case_insensitive = TRUE),
  fixed_sensitive = tokens_replace(toks, type, stem, "fixed",
                                   case_insensitive = FALSE),
  glob_sensitive = tokens_replace(toks, type, stem, "glob",
                                  case_insensitive = FALSE),
  times = 1
)

# Profile the case-sensitive "glob" replacement.
profvis::profvis(
  tokens_replace(toks, type, stem, "glob", case_insensitive = FALSE)
)

# Profile the case-sensitive "fixed" replacement for comparison.
profvis::profvis(
  tokens_replace(toks, type, stem, "fixed", case_insensitive = FALSE)
)
# Add the following code to your website.
# For more information on customizing the embed code, read Embedding Snippets.